lihongjie
committed on
Commit
·
dcf454d
1
Parent(s):
2dc6cb1
first commit
Browse files- .gitattributes +30 -0
- README.md +90 -3
- examples/demo01.jpg +3 -0
- examples/demo02.jpg +3 -0
- examples/demo03.jpg +3 -0
- examples/demo04.jpg +3 -0
- examples/demo05.jpg +3 -0
- examples/demo06.jpg +3 -0
- examples/demo07.jpg +3 -0
- examples/demo08.jpg +3 -0
- examples/demo09.jpg +3 -0
- examples/demo10.jpg +3 -0
- examples/demo11.jpg +3 -0
- examples/demo12.jpg +3 -0
- examples/demo13.jpg +3 -0
- examples/demo14.jpg +3 -0
- examples/demo15.jpg +3 -0
- examples/demo16.jpg +3 -0
- examples/demo17.jpg +3 -0
- examples/demo18.jpg +3 -0
- examples/demo19.jpg +3 -0
- examples/demo20.jpg +3 -0
- models/da3-base.axmodel +3 -0
- models/da3-base.onnx +3 -0
- models/da3-small.axmodel +3 -0
- models/da3-small.onnx +3 -0
- models/da3metric-large.axmodel +3 -0
- models/da3metric-large.onnx +3 -0
- models/da3mono-large.axmodel +3 -0
- models/da3mono-large.onnx +3 -0
- output-ax.png +3 -0
- output-onnx.png +3 -0
- python/infer.py +50 -0
- python/infer_onnx.py +56 -0
- python/requirements.txt +3 -0
.gitattributes
CHANGED
|
@@ -33,3 +33,33 @@ saved_model/**/* filter=lfs diff=lfs merge=lfs -text
|
|
| 33 |
*.zip filter=lfs diff=lfs merge=lfs -text
|
| 34 |
*.zst filter=lfs diff=lfs merge=lfs -text
|
| 35 |
*tfevents* filter=lfs diff=lfs merge=lfs -text
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 33 |
*.zip filter=lfs diff=lfs merge=lfs -text
|
| 34 |
*.zst filter=lfs diff=lfs merge=lfs -text
|
| 35 |
*tfevents* filter=lfs diff=lfs merge=lfs -text
|
| 36 |
+
examples/demo16.jpg filter=lfs diff=lfs merge=lfs -text
|
| 37 |
+
models/da3-base.axmodel filter=lfs diff=lfs merge=lfs -text
|
| 38 |
+
models/da3-base.onnx filter=lfs diff=lfs merge=lfs -text
|
| 39 |
+
examples/demo04.jpg filter=lfs diff=lfs merge=lfs -text
|
| 40 |
+
examples/demo08.jpg filter=lfs diff=lfs merge=lfs -text
|
| 41 |
+
models/da3mono-large.axmodel filter=lfs diff=lfs merge=lfs -text
|
| 42 |
+
output-ax.png filter=lfs diff=lfs merge=lfs -text
|
| 43 |
+
examples/demo19.jpg filter=lfs diff=lfs merge=lfs -text
|
| 44 |
+
examples/demo02.jpg filter=lfs diff=lfs merge=lfs -text
|
| 45 |
+
examples/demo10.jpg filter=lfs diff=lfs merge=lfs -text
|
| 46 |
+
examples/demo11.jpg filter=lfs diff=lfs merge=lfs -text
|
| 47 |
+
examples/demo15.jpg filter=lfs diff=lfs merge=lfs -text
|
| 48 |
+
examples/demo12.jpg filter=lfs diff=lfs merge=lfs -text
|
| 49 |
+
examples/demo20.jpg filter=lfs diff=lfs merge=lfs -text
|
| 50 |
+
models/da3-small.axmodel filter=lfs diff=lfs merge=lfs -text
|
| 51 |
+
output-onnx.png filter=lfs diff=lfs merge=lfs -text
|
| 52 |
+
examples/demo05.jpg filter=lfs diff=lfs merge=lfs -text
|
| 53 |
+
examples/demo06.jpg filter=lfs diff=lfs merge=lfs -text
|
| 54 |
+
examples/demo14.jpg filter=lfs diff=lfs merge=lfs -text
|
| 55 |
+
models/da3metric-large.onnx filter=lfs diff=lfs merge=lfs -text
|
| 56 |
+
examples/demo13.jpg filter=lfs diff=lfs merge=lfs -text
|
| 57 |
+
examples/demo17.jpg filter=lfs diff=lfs merge=lfs -text
|
| 58 |
+
examples/demo09.jpg filter=lfs diff=lfs merge=lfs -text
|
| 59 |
+
examples/demo18.jpg filter=lfs diff=lfs merge=lfs -text
|
| 60 |
+
models/da3mono-large.onnx filter=lfs diff=lfs merge=lfs -text
|
| 61 |
+
models/da3-small.onnx filter=lfs diff=lfs merge=lfs -text
|
| 62 |
+
examples/demo01.jpg filter=lfs diff=lfs merge=lfs -text
|
| 63 |
+
examples/demo03.jpg filter=lfs diff=lfs merge=lfs -text
|
| 64 |
+
examples/demo07.jpg filter=lfs diff=lfs merge=lfs -text
|
| 65 |
+
models/da3metric-large.axmodel filter=lfs diff=lfs merge=lfs -text
|
README.md
CHANGED
|
@@ -1,3 +1,90 @@
|
|
| 1 |
-
---
|
| 2 |
-
license:
|
| 3 |
-
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
---
|
| 2 |
+
license: bsd-3-clause
|
| 3 |
+
language:
|
| 4 |
+
- en
|
| 5 |
+
base_model:
|
| 6 |
+
- depth-anything/DA3-SMALL
|
| 7 |
+
- depth-anything/DA3-BASE
|
| 8 |
+
- depth-anything/DA3MONO-LARGE
|
| 9 |
+
- depth-anything/DA3METRIC-LARGE
|
| 10 |
+
pipeline_tag: depth-estimation
|
| 11 |
+
tags:
|
| 12 |
+
- Depth-Anything-3
|
| 13 |
+
---
|
| 14 |
+
|
| 15 |
+
# Depth-Anything-3
|
| 16 |
+
|
| 17 |
+
This version of Depth-Anything-3 has been converted to run on the Axera NPU using **w8a16** quantization.
|
| 18 |
+
|
| 19 |
+
This model has been optimized with the following LoRA:
|
| 20 |
+
|
| 21 |
+
Compatible with Pulsar2 version: 3.4
|
| 22 |
+
|
| 23 |
+
## Convert tools links:
|
| 24 |
+
|
| 25 |
+
For those who are interested in model conversion, you can try to export axmodel through
|
| 26 |
+
|
| 27 |
+
- [The repo of original](https://github.com/ByteDance-Seed/Depth-Anything-3)
|
| 28 |
+
|
| 29 |
+
- [The repo of AXera Platform](https://github.com/AXERA-TECH/Depth-Anything-3.AXERA.git), which you can get the detial of guide
|
| 30 |
+
|
| 31 |
+
- [Pulsar2 Link, How to Convert ONNX to axmodel](https://pulsar2-docs.readthedocs.io/en/latest/pulsar2/introduction.html)
|
| 32 |
+
|
| 33 |
+
|
| 34 |
+
## Support Platform
|
| 35 |
+
|
| 36 |
+
- AX650
|
| 37 |
+
- [M4N-Dock(爱芯派Pro)](https://wiki.sipeed.com/hardware/zh/maixIV/m4ndock/m4ndock.html)
|
| 38 |
+
- [M.2 Accelerator card](https://axcl-docs.readthedocs.io/zh-cn/latest/doc_guide_hardware.html)
|
| 39 |
+
- AX630C
|
| 40 |
+
- [爱芯派2](https://axera-pi-2-docs-cn.readthedocs.io/zh-cn/latest/index.html)
|
| 41 |
+
- [Module-LLM](https://docs.m5stack.com/zh_CN/module/Module-LLM)
|
| 42 |
+
- [LLM630 Compute Kit](https://docs.m5stack.com/zh_CN/core/LLM630%20Compute%20Kit)
|
| 43 |
+
|
| 44 |
+
|Chips|Time|
|
| 45 |
+
|--|--|
|
| 46 |
+
|AX650| ms |
|
| 47 |
+
|AX630C| ms |
|
| 48 |
+
|
| 49 |
+
## How to use
|
| 50 |
+
|
| 51 |
+
Download all files from this repository to the device
|
| 52 |
+
|
| 53 |
+
|
| 54 |
+
### python env requirement
|
| 55 |
+
|
| 56 |
+
#### pyaxengine
|
| 57 |
+
|
| 58 |
+
https://github.com/AXERA-TECH/pyaxengine
|
| 59 |
+
|
| 60 |
+
```
|
| 61 |
+
wget https://github.com/AXERA-TECH/pyaxengine/releases/download/0.1.3.rc2/axengine-0.1.3-py3-none-any.whl
|
| 62 |
+
pip install axengine-0.1.3-py3-none-any.whl
|
| 63 |
+
```
|
| 64 |
+
|
| 65 |
+
#### others
|
| 66 |
+
|
| 67 |
+
Maybe None.
|
| 68 |
+
|
| 69 |
+
#### Inference with AX650 Host, such as M4N-Dock(爱芯派Pro)
|
| 70 |
+
|
| 71 |
+
Input image:
|
| 72 |
+
|
| 73 |
+

|
| 74 |
+
|
| 75 |
+
```
|
| 76 |
+
root@ax650:~/AXERA-TECH/Depth-Anything-3# python3 python/infer.py --model models/da3metric-large.axmodel --img examples/demo01.jpg
|
| 77 |
+
[INFO] Available providers: ['AxEngineExecutionProvider']
|
| 78 |
+
[INFO] Using provider: AxEngineExecutionProvider
|
| 79 |
+
[INFO] Chip type: ChipType.MC50
|
| 80 |
+
[INFO] VNPU type: VNPUType.DISABLED
|
| 81 |
+
[INFO] Engine version: 2.12.0s
|
| 82 |
+
[INFO] Model type: 2 (triple core)
|
| 83 |
+
[INFO] Compiler version: 3.3 ae03a08f
|
| 84 |
+
root@ax650:~/AXERA-TECH/Depth-Anything-3# ls
|
| 85 |
+
```
|
| 86 |
+
|
| 87 |
+
Output image:
|
| 88 |
+
|
| 89 |
+

|
| 90 |
+
|
examples/demo01.jpg
ADDED
|
Git LFS Details
|
examples/demo02.jpg
ADDED
|
Git LFS Details
|
examples/demo03.jpg
ADDED
|
Git LFS Details
|
examples/demo04.jpg
ADDED
|
Git LFS Details
|
examples/demo05.jpg
ADDED
|
Git LFS Details
|
examples/demo06.jpg
ADDED
|
Git LFS Details
|
examples/demo07.jpg
ADDED
|
Git LFS Details
|
examples/demo08.jpg
ADDED
|
Git LFS Details
|
examples/demo09.jpg
ADDED
|
Git LFS Details
|
examples/demo10.jpg
ADDED
|
Git LFS Details
|
examples/demo11.jpg
ADDED
|
Git LFS Details
|
examples/demo12.jpg
ADDED
|
Git LFS Details
|
examples/demo13.jpg
ADDED
|
Git LFS Details
|
examples/demo14.jpg
ADDED
|
Git LFS Details
|
examples/demo15.jpg
ADDED
|
Git LFS Details
|
examples/demo16.jpg
ADDED
|
Git LFS Details
|
examples/demo17.jpg
ADDED
|
Git LFS Details
|
examples/demo18.jpg
ADDED
|
Git LFS Details
|
examples/demo19.jpg
ADDED
|
Git LFS Details
|
examples/demo20.jpg
ADDED
|
Git LFS Details
|
models/da3-base.axmodel
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:02f0291bb629de91860a17174351c82825a975f4979100882399219f39764ea6
|
| 3 |
+
size 139250301
|
models/da3-base.onnx
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:5a9193dca2e27df2fa5cd3bac074afcf3d662a9939869f4177aeacf4eba73061
|
| 3 |
+
size 451237395
|
models/da3-small.axmodel
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:f9563bff5bde0aff1ce69ae026691035207d4c813fc5190ab118adff8da77366
|
| 3 |
+
size 40927267
|
models/da3-small.onnx
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:82b0da30b20e48b968b718588a3a0cb296d0df5cc09327e0bd3301343edf9e9f
|
| 3 |
+
size 124726109
|
models/da3metric-large.axmodel
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:7f65d9248e36663e989c926653a6f411aecbd822504c4c1364be05f22174e0c9
|
| 3 |
+
size 382403608
|
models/da3metric-large.onnx
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:500faa78858c1b646b0e39974128479bf313a0b10c6071b47161c34fc308c17f
|
| 3 |
+
size 1334346787
|
models/da3mono-large.axmodel
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:3d70bb9242c90ad9425733d8aacd27d18d520f2e5f6f15f86efd08d9035a8745
|
| 3 |
+
size 382396604
|
models/da3mono-large.onnx
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:166946c445e7be229fa20a87ea445d9b2f11b484d171915a273a9757b60e1f01
|
| 3 |
+
size 1334346787
|
output-ax.png
ADDED
|
Git LFS Details
|
output-onnx.png
ADDED
|
Git LFS Details
|
python/infer.py
ADDED
|
@@ -0,0 +1,50 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
import argparse
|
| 2 |
+
import cv2
|
| 3 |
+
import numpy as np
|
| 4 |
+
import axengine as axe
|
| 5 |
+
|
| 6 |
+
def parse_args() -> argparse.Namespace:
    """Parse command-line options for the AX-model depth inference script.

    Returns:
        argparse.Namespace with two string attributes:
        ``img`` (input image path) and ``model`` (axmodel path).
    """
    ap = argparse.ArgumentParser()
    ap.add_argument("--img", type=str, required=True, help="Path to input image.")
    ap.add_argument("--model", type=str, required=True, help="Path to axmodel model.")
    return ap.parse_args()
|
| 22 |
+
|
| 23 |
+
|
| 24 |
+
def infer(img: str, model: str, viz: bool = False):
    """Run depth estimation on one image with an Axera axmodel.

    Reads ``img``, resizes it to the model's fixed 504x280 RGB input,
    runs the axmodel, and writes a side-by-side visualization
    (original | colorized depth) to ``output-ax.png``.

    Args:
        img: Path to the input image.
        model: Path to the compiled ``.axmodel`` file.
        viz: Unused; kept for interface compatibility.

    Returns:
        np.ndarray: uint8 depth map, min-max scaled to 0..255, at the
        original image resolution.

    Raises:
        FileNotFoundError: If ``img`` cannot be read.
    """
    img_raw = cv2.imread(img)
    if img_raw is None:
        # cv2.imread signals failure by returning None, not raising.
        raise FileNotFoundError(f"Could not read image: {img}")
    image = cv2.cvtColor(img_raw, cv2.COLOR_BGR2RGB)
    orig_h, orig_w = image.shape[:2]
    # Fixed network input size; note the uint8 HWC image is fed directly —
    # presumably mean/std normalization is baked into the axmodel (the ONNX
    # path normalizes explicitly). TODO confirm against the conversion config.
    image = cv2.resize(image, (504, 280))
    image = image[None]  # add batch dimension

    session = axe.InferenceSession(model)
    depth = session.run(None, {"img": image})[0]

    depth = cv2.resize(depth[0, 0], (orig_w, orig_h))
    # Min-max scale to 0..255; guard against a constant depth map, which
    # would otherwise divide by zero and yield NaN/inf.
    d_min, d_max = depth.min(), depth.max()
    d_range = d_max - d_min
    if d_range == 0:
        d_range = 1.0
    depth = (depth - d_min) / d_range * 255.0
    depth = depth.astype(np.uint8)

    depth_color = cv2.applyColorMap(depth, cv2.COLORMAP_INFERNO)

    combined_result = cv2.hconcat([img_raw, depth_color])

    cv2.imwrite("output-ax.png", combined_result)

    return depth
|
| 46 |
+
|
| 47 |
+
|
| 48 |
+
if __name__ == "__main__":
    # Forward the parsed --img / --model options to the inference routine.
    cli = parse_args()
    infer(img=cli.img, model=cli.model)
|
python/infer_onnx.py
ADDED
|
@@ -0,0 +1,56 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
import argparse
|
| 2 |
+
import cv2
|
| 3 |
+
import numpy as np
|
| 4 |
+
import onnxruntime as ort
|
| 5 |
+
|
| 6 |
+
def parse_args() -> argparse.Namespace:
    """Parse command-line options for the ONNX depth inference script.

    Returns:
        argparse.Namespace with two string attributes:
        ``img`` (input image path) and ``model`` (ONNX model path).
    """
    ap = argparse.ArgumentParser()
    ap.add_argument("--img", type=str, required=True, help="Path to input image.")
    ap.add_argument("--model", type=str, required=True, help="Path to ONNX model.")
    return ap.parse_args()
|
| 22 |
+
|
| 23 |
+
|
| 24 |
+
def infer(img: str, model: str, viz: bool = False):
    """Run depth estimation on one image with an ONNX model.

    Reads ``img``, resizes it to the model's fixed 504x280 input,
    normalizes with ImageNet mean/std (0..255 scale), runs the network
    via ONNX Runtime, and writes a side-by-side visualization
    (original | colorized depth) to ``output-onnx.png``.

    Args:
        img: Path to the input image.
        model: Path to the ``.onnx`` model file.
        viz: Unused; kept for interface compatibility.

    Returns:
        np.ndarray: uint8 depth map, min-max scaled to 0..255, at the
        original image resolution.

    Raises:
        FileNotFoundError: If ``img`` cannot be read.
    """
    img_raw = cv2.imread(img)
    if img_raw is None:
        # cv2.imread signals failure by returning None, not raising.
        raise FileNotFoundError(f"Could not read image: {img}")
    image = cv2.cvtColor(img_raw, cv2.COLOR_BGR2RGB)
    orig_h, orig_w = image.shape[:2]
    image = cv2.resize(image, (504, 280))
    # ImageNet mean/std expressed in the 0..255 pixel range, shaped for
    # broadcasting over the HWC image.
    mean = np.array([123.675, 116.28, 103.53], dtype=np.float32).reshape(1, 1, 3)
    std = np.array([58.395, 57.12, 57.375], dtype=np.float32).reshape(1, 1, 3)

    # Cast explicitly: ONNX Runtime requires exact float32 input, and
    # relying on NumPy promotion rules here is fragile.
    image = ((image - mean) / std).astype(np.float32)
    image = image.transpose(2, 0, 1)  # HWC -> CHW
    image = image[None]  # add batch dimension -> NCHW

    session = ort.InferenceSession(
        model, providers=["CUDAExecutionProvider", "CPUExecutionProvider"]
    )
    depth = session.run(None, {"img": image})[0]

    depth = cv2.resize(depth[0, 0], (orig_w, orig_h))
    # Min-max scale to 0..255; guard against a constant depth map, which
    # would otherwise divide by zero and yield NaN/inf.
    d_min, d_max = depth.min(), depth.max()
    d_range = d_max - d_min
    if d_range == 0:
        d_range = 1.0
    depth = (depth - d_min) / d_range * 255.0
    depth = depth.astype(np.uint8)

    depth_color = cv2.applyColorMap(depth, cv2.COLORMAP_INFERNO)

    combined_result = cv2.hconcat([img_raw, depth_color])

    cv2.imwrite("output-onnx.png", combined_result)

    return depth
|
| 52 |
+
|
| 53 |
+
|
| 54 |
+
if __name__ == "__main__":
    # Forward the parsed --img / --model options to the inference routine.
    cli = parse_args()
    infer(img=cli.img, model=cli.model)
|
python/requirements.txt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
onnx
|
| 2 |
+
onnxruntime
|
| 3 |
+
opencv-python
|