diff --git a/README.md b/README.md
index 0f0ff38ea3d839e2b20f41793b88af245a61dc8c..69a74671eb173e1fc48e7a8714a0c2d7dec13952 100644
--- a/README.md
+++ b/README.md
@@ -36,7 +36,7 @@ DeepSparkInference将按季度进行版本更新,后续会逐步丰富模型
CLIP |
FP16 |
Supported |
- - |
+ ixFormer |
INT8 |
@@ -54,11 +54,22 @@ DeepSparkInference将按季度进行版本更新,后续会逐步丰富模型
- |
- |
+
+ ConvNeXt-Base |
+ FP16 |
+ Supported |
+ - |
+
+
+ INT8 |
+ - |
+ - |
+
ConvNeXt-Small |
FP16 |
Supported |
- - |
+ Supported |
INT8 |
@@ -66,15 +77,15 @@ DeepSparkInference将按季度进行版本更新,后续会逐步丰富模型
- |
- CSPDarkNet5 |
+ CSPDarkNet53 |
FP16 |
Supported |
- - |
+ Supported |
INT8 |
- |
- - |
+ Supported |
CSPResNet50 |
@@ -113,7 +124,7 @@ DeepSparkInference将按季度进行版本更新,后续会逐步丰富模型
DenseNet161 |
FP16 |
Supported |
- - |
+ Supported |
INT8 |
@@ -124,6 +135,17 @@ DeepSparkInference将按季度进行版本更新,后续会逐步丰富模型
DenseNet169 |
FP16 |
Supported |
+ Supported |
+
+
+ INT8 |
+ - |
+ - |
+
+
+ DenseNet201 |
+ FP16 |
+ Supported |
- |
@@ -157,6 +179,17 @@ DeepSparkInference将按季度进行版本更新,后续会逐步丰富模型
EfficientNet-B2 |
FP16 |
Supported |
+ Supported |
+
+
+ INT8 |
+ - |
+ - |
+
+
+ EfficientNet-B3 |
+ FP16 |
+ Supported |
- |
@@ -186,6 +219,17 @@ DeepSparkInference将按季度进行版本更新,后续会逐步丰富模型
- |
- |
+
+ EfficientNetv2_s |
+ FP16 |
+ Supported |
+ - |
+
+
+ INT8 |
+ - |
+ - |
+
GoogLeNet |
FP16 |
@@ -230,6 +274,17 @@ DeepSparkInference将按季度进行版本更新,后续会逐步丰富模型
- |
Supported |
+
+ MNASNet0_5 |
+ FP16 |
+ Supported |
+ - |
+
+
+ INT8 |
+ - |
+ - |
+
MobileNetV2 |
FP16 |
@@ -263,6 +318,17 @@ DeepSparkInference将按季度进行版本更新,后续会逐步丰富模型
- |
- |
+
+ MViTv2_base |
+ FP16 |
+ Supported |
+ - |
+
+
+ INT8 |
+ - |
+ - |
+
RegNet_x_1_6gf |
FP16 |
@@ -274,6 +340,17 @@ DeepSparkInference将按季度进行版本更新,后续会逐步丰富模型
- |
- |
+
+ RegNet_y_1_6gf |
+ FP16 |
+ Supported |
+ - |
+
+
+ INT8 |
+ - |
+ - |
+
RepVGG |
FP16 |
@@ -365,7 +442,7 @@ DeepSparkInference将按季度进行版本更新,后续会逐步丰富模型
ResNet_V1_D50 |
FP16 |
- - |
+ Supported |
Supported |
@@ -377,6 +454,17 @@ DeepSparkInference将按季度进行版本更新,后续会逐步丰富模型
ResNeXt50_32x4d |
FP16 |
Supported |
+ Supported |
+
+
+ INT8 |
+ - |
+ - |
+
+
+ ResNeXt101_64x4d |
+ FP16 |
+ Supported |
- |
@@ -428,6 +516,17 @@ DeepSparkInference将按季度进行版本更新,后续会逐步丰富模型
- |
- |
+
+ ShuffleNetV2_x1_5 |
+ FP16 |
+ Supported |
+ - |
+
+
+ INT8 |
+ - |
+ - |
+
SqueezeNet 1.0 |
FP16 |
@@ -520,7 +619,7 @@ DeepSparkInference将按季度进行版本更新,后续会逐步丰富模型
CenterNet |
FP16 |
Supported |
- - |
+ Supported |
INT8 |
@@ -582,6 +681,17 @@ DeepSparkInference将按季度进行版本更新,后续会逐步丰富模型
- |
- |
+
+ PAA |
+ FP16 |
+ Supported |
+ - |
+
+
+ INT8 |
+ - |
+ - |
+
RetinaFace |
FP16 |
@@ -692,6 +802,28 @@ DeepSparkInference将按季度进行版本更新,后续会逐步丰富模型
Supported |
Supported |
+
+ YOLOv9 |
+ FP16 |
+ Supported |
+ - |
+
+
+ INT8 |
+ - |
+ - |
+
+
+ YOLOv10 |
+ FP16 |
+ Supported |
+ - |
+
+
+ INT8 |
+ - |
+ - |
+
YOLOX |
FP16 |
@@ -728,6 +860,39 @@ DeepSparkInference将按季度进行版本更新,后续会逐步丰富模型
+### OCR
+
+
+
+ Models |
+ Precision |
+ IGIE |
+ IxRT |
+
+
+ Kie_layoutXLM |
+ FP16 |
+ Supported |
+ - |
+
+
+ INT8 |
+ - |
+ - |
+
+
+ Rec_SVTR |
+ FP16 |
+ Supported |
+ - |
+
+
+ INT8 |
+ - |
+ - |
+
+
+
### Pose Estimation
@@ -737,11 +902,22 @@ DeepSparkInference将按季度进行版本更新,后续会逐步丰富模型
IGIE |
IxRT |
+
+ Lightweight OpenPose |
+ FP16 |
+ - |
+ Supported |
+
+
+ INT8 |
+ - |
+ - |
+
RTMPose |
FP16 |
Supported |
- - |
+ Supported |
INT8 |
@@ -945,13 +1121,19 @@ DeepSparkInference将按季度进行版本更新,后续会逐步丰富模型
ChatGLM-3-6B |
- Supported |
+ Supported |
- |
- |
- Llama2-7B |
+ ChatGLM-3-6B-32K |
+ Supported |
- |
+ - |
+
+
+ Llama2-7B |
+ Supported |
Supported |
- |
@@ -962,9 +1144,15 @@ DeepSparkInference将按季度进行版本更新,后续会逐步丰富模型
- |
- Qwen-7B |
+ MiniCPM-V-2 |
+ Supported |
- |
- |
+
+
+ Qwen-7B |
+ Supported |
+ - |
Supported |
@@ -979,12 +1167,36 @@ DeepSparkInference将按季度进行版本更新,后续会逐步丰富模型
- |
- |
+
+ Qwen1.5-32B Chat |
+ Supported |
+ - |
+ - |
+
Qwen1.5-72B |
Supported |
- |
- |
+
+ Qwen2-7B Instruct |
+ Supported |
+ - |
+ - |
+
+
+ Qwen2-72B Instruct |
+ Supported |
+ - |
+ - |
+
+
+ StableLM2-1.6B |
+ Supported |
+ - |
+ - |
+
## Speech
diff --git a/models/cv/classification/resnetv1d50/igie/README.md b/models/cv/classification/resnet_v1_d50/igie/README.md
similarity index 100%
rename from models/cv/classification/resnetv1d50/igie/README.md
rename to models/cv/classification/resnet_v1_d50/igie/README.md
diff --git a/models/cv/classification/resnetv1d50/igie/build_engine.py b/models/cv/classification/resnet_v1_d50/igie/build_engine.py
similarity index 100%
rename from models/cv/classification/resnetv1d50/igie/build_engine.py
rename to models/cv/classification/resnet_v1_d50/igie/build_engine.py
diff --git a/models/cv/classification/resnetv1d50/igie/export.py b/models/cv/classification/resnet_v1_d50/igie/export.py
similarity index 100%
rename from models/cv/classification/resnetv1d50/igie/export.py
rename to models/cv/classification/resnet_v1_d50/igie/export.py
diff --git a/models/cv/classification/resnetv1d50/igie/inference.py b/models/cv/classification/resnet_v1_d50/igie/inference.py
similarity index 100%
rename from models/cv/classification/resnetv1d50/igie/inference.py
rename to models/cv/classification/resnet_v1_d50/igie/inference.py
diff --git a/models/cv/classification/resnetv1d50/igie/requirements.txt b/models/cv/classification/resnet_v1_d50/igie/requirements.txt
similarity index 100%
rename from models/cv/classification/resnetv1d50/igie/requirements.txt
rename to models/cv/classification/resnet_v1_d50/igie/requirements.txt
diff --git a/models/cv/classification/resnetv1d50/igie/scripts/infer_resnetv1d50_fp16_accuracy.sh b/models/cv/classification/resnet_v1_d50/igie/scripts/infer_resnetv1d50_fp16_accuracy.sh
similarity index 100%
rename from models/cv/classification/resnetv1d50/igie/scripts/infer_resnetv1d50_fp16_accuracy.sh
rename to models/cv/classification/resnet_v1_d50/igie/scripts/infer_resnetv1d50_fp16_accuracy.sh
diff --git a/models/cv/classification/resnetv1d50/igie/scripts/infer_resnetv1d50_fp16_performance.sh b/models/cv/classification/resnet_v1_d50/igie/scripts/infer_resnetv1d50_fp16_performance.sh
similarity index 100%
rename from models/cv/classification/resnetv1d50/igie/scripts/infer_resnetv1d50_fp16_performance.sh
rename to models/cv/classification/resnet_v1_d50/igie/scripts/infer_resnetv1d50_fp16_performance.sh
diff --git a/models/cv/ocr/kie_layoutxlm/README.md b/models/cv/ocr/kie_layoutxlm/igie/README.md
similarity index 100%
rename from models/cv/ocr/kie_layoutxlm/README.md
rename to models/cv/ocr/kie_layoutxlm/igie/README.md
diff --git a/models/cv/ocr/kie_layoutxlm/build_engine.py b/models/cv/ocr/kie_layoutxlm/igie/build_engine.py
similarity index 100%
rename from models/cv/ocr/kie_layoutxlm/build_engine.py
rename to models/cv/ocr/kie_layoutxlm/igie/build_engine.py
diff --git a/models/cv/ocr/kie_layoutxlm/inference.py b/models/cv/ocr/kie_layoutxlm/igie/inference.py
similarity index 100%
rename from models/cv/ocr/kie_layoutxlm/inference.py
rename to models/cv/ocr/kie_layoutxlm/igie/inference.py
diff --git a/models/cv/ocr/kie_layoutxlm/scripts/infer_kie_ser_fp16_accuracy.sh b/models/cv/ocr/kie_layoutxlm/igie/scripts/infer_kie_ser_fp16_accuracy.sh
similarity index 100%
rename from models/cv/ocr/kie_layoutxlm/scripts/infer_kie_ser_fp16_accuracy.sh
rename to models/cv/ocr/kie_layoutxlm/igie/scripts/infer_kie_ser_fp16_accuracy.sh
diff --git a/models/cv/ocr/kie_layoutxlm/scripts/infer_kie_ser_fp16_performance.sh b/models/cv/ocr/kie_layoutxlm/igie/scripts/infer_kie_ser_fp16_performance.sh
similarity index 100%
rename from models/cv/ocr/kie_layoutxlm/scripts/infer_kie_ser_fp16_performance.sh
rename to models/cv/ocr/kie_layoutxlm/igie/scripts/infer_kie_ser_fp16_performance.sh
diff --git a/models/cv/ocr/kie_layoutxlm/ser_vi_layoutxlm_xfund_zh.yml b/models/cv/ocr/kie_layoutxlm/igie/ser_vi_layoutxlm_xfund_zh.yml
similarity index 100%
rename from models/cv/ocr/kie_layoutxlm/ser_vi_layoutxlm_xfund_zh.yml
rename to models/cv/ocr/kie_layoutxlm/igie/ser_vi_layoutxlm_xfund_zh.yml
diff --git a/models/cv/ocr/rec_svtr/README.md b/models/cv/ocr/rec_svtr/igie/README.md
similarity index 100%
rename from models/cv/ocr/rec_svtr/README.md
rename to models/cv/ocr/rec_svtr/igie/README.md
diff --git a/models/cv/ocr/rec_svtr/build_engine.py b/models/cv/ocr/rec_svtr/igie/build_engine.py
similarity index 100%
rename from models/cv/ocr/rec_svtr/build_engine.py
rename to models/cv/ocr/rec_svtr/igie/build_engine.py
diff --git a/models/cv/ocr/rec_svtr/inference.py b/models/cv/ocr/rec_svtr/igie/inference.py
similarity index 100%
rename from models/cv/ocr/rec_svtr/inference.py
rename to models/cv/ocr/rec_svtr/igie/inference.py
diff --git a/models/cv/ocr/rec_svtr/rec_svtr_tiny_6local_6global_stn_en.yml b/models/cv/ocr/rec_svtr/igie/rec_svtr_tiny_6local_6global_stn_en.yml
similarity index 100%
rename from models/cv/ocr/rec_svtr/rec_svtr_tiny_6local_6global_stn_en.yml
rename to models/cv/ocr/rec_svtr/igie/rec_svtr_tiny_6local_6global_stn_en.yml
diff --git a/models/cv/ocr/rec_svtr/scripts/infer_svtr_fp16_accuracy.sh b/models/cv/ocr/rec_svtr/igie/scripts/infer_svtr_fp16_accuracy.sh
similarity index 100%
rename from models/cv/ocr/rec_svtr/scripts/infer_svtr_fp16_accuracy.sh
rename to models/cv/ocr/rec_svtr/igie/scripts/infer_svtr_fp16_accuracy.sh
diff --git a/models/cv/ocr/rec_svtr/scripts/infer_svtr_fp16_performance.sh b/models/cv/ocr/rec_svtr/igie/scripts/infer_svtr_fp16_performance.sh
similarity index 100%
rename from models/cv/ocr/rec_svtr/scripts/infer_svtr_fp16_performance.sh
rename to models/cv/ocr/rec_svtr/igie/scripts/infer_svtr_fp16_performance.sh
diff --git a/models/cv/pose_estimation/rtmpose/ixrt/README.md b/models/cv/pose_estimation/rtmpose/ixrt/README.md
index e278c8e3c2f673194428fda2c1168e80d0aea724..3e6b68a47647044b2b9116ec57303bef9206f899 100644
--- a/models/cv/pose_estimation/rtmpose/ixrt/README.md
+++ b/models/cv/pose_estimation/rtmpose/ixrt/README.md
@@ -45,7 +45,9 @@ python3 export.py --weight data/rtmpose/rtmpose-m_simcc-aic-coco_pt-aic-coco_420
onnxsim data/rtmpose/rtmpose.onnx data/rtmpose/rtmpose_opt.onnx
```
-## TestSample
+## Inference
+
+### FP16
```bash
python3 predict.py --model data/rtmpose/rtmpose_opt.onnx --precision fp16 --img_path demo/demo.jpg
diff --git a/models/nlp/large_language_model/qwen2-7b/vllm/README.md b/models/nlp/large_language_model/qwen2-7b/vllm/README.md
index ebf5c00c98e717dd41137e186fe53c3b68ce7144..6cfc785858a7cc6f96699f267f9b3b357ed43840 100755
--- a/models/nlp/large_language_model/qwen2-7b/vllm/README.md
+++ b/models/nlp/large_language_model/qwen2-7b/vllm/README.md
@@ -1,4 +1,4 @@
-# Qwen2-7B-Instruct
+# Qwen2-7B Instruct
## Description
diff --git a/models/nlp/large_language_model/stablelm/vllm/README.md b/models/nlp/large_language_model/stablelm/vllm/README.md
index 603f6732f52636e2e9fe55155bc6f5fe5461214e..e9d1b7e4fb0b7c65c7b793bf6f80cf36b667bf7e 100644
--- a/models/nlp/large_language_model/stablelm/vllm/README.md
+++ b/models/nlp/large_language_model/stablelm/vllm/README.md
@@ -1,4 +1,4 @@
-# StableLm-2-1_6B
+# StableLM2-1.6B
## Description