diff --git a/README.md b/README.md index 0f0ff38ea3d839e2b20f41793b88af245a61dc8c..69a74671eb173e1fc48e7a8714a0c2d7dec13952 100644 --- a/README.md +++ b/README.md @@ -36,7 +36,7 @@ DeepSparkInference将按季度进行版本更新,后续会逐步丰富模型 CLIP FP16 Supported - - + ixFormer INT8 @@ -54,11 +54,22 @@ DeepSparkInference将按季度进行版本更新,后续会逐步丰富模型 - - + + ConvNeXt-Base + FP16 + Supported + - + + + INT8 + - + - + ConvNeXt-Small FP16 Supported - - + Supported INT8 @@ -66,15 +77,15 @@ DeepSparkInference将按季度进行版本更新,后续会逐步丰富模型 - - CSPDarkNet5 + CSPDarkNet53 FP16 Supported - - + Supported INT8 - - - + Supported CSPResNet50 @@ -113,7 +124,7 @@ DeepSparkInference将按季度进行版本更新,后续会逐步丰富模型 DenseNet161 FP16 Supported - - + Supported INT8 @@ -124,6 +135,17 @@ DeepSparkInference将按季度进行版本更新,后续会逐步丰富模型 DenseNet169 FP16 Supported + Supported + + + INT8 + - + - + + + DenseNet201 + FP16 + Supported - @@ -157,6 +179,17 @@ DeepSparkInference将按季度进行版本更新,后续会逐步丰富模型 EfficientNet-B2 FP16 Supported + Supported + + + INT8 + - + - + + + EfficientNet-B3 + FP16 + Supported - @@ -186,6 +219,17 @@ DeepSparkInference将按季度进行版本更新,后续会逐步丰富模型 - - + + EfficientNetv2_s + FP16 + Supported + - + + + INT8 + - + - + GoogLeNet FP16 @@ -230,6 +274,17 @@ DeepSparkInference将按季度进行版本更新,后续会逐步丰富模型 - Supported + + MNASNet0_5 + FP16 + Supported + - + + + INT8 + - + - + MobileNetV2 FP16 @@ -263,6 +318,17 @@ DeepSparkInference将按季度进行版本更新,后续会逐步丰富模型 - - + + MViTv2_base + FP16 + Supported + - + + + INT8 + - + - + RegNet_x_1_6gf FP16 @@ -274,6 +340,17 @@ DeepSparkInference将按季度进行版本更新,后续会逐步丰富模型 - - + + RegNet_y_1_6gf + FP16 + Supported + - + + + INT8 + - + - + RepVGG FP16 @@ -365,7 +442,7 @@ DeepSparkInference将按季度进行版本更新,后续会逐步丰富模型 ResNet_V1_D50 FP16 - - + Supported Supported @@ -377,6 +454,17 @@ DeepSparkInference将按季度进行版本更新,后续会逐步丰富模型 ResNeXt50_32x4d FP16 Supported + Supported + + + INT8 + - + - + + + ResNeXt101_64x4d + FP16 + Supported - @@ -428,6 +516,17 @@ DeepSparkInference将按季度进行版本更新,后续会逐步丰富模型 - - + + ShuffleNetV2_x1_5 + FP16 + Supported + - + + + INT8 + - + - + 
SqueezeNet 1.0 FP16 @@ -520,7 +619,7 @@ DeepSparkInference将按季度进行版本更新,后续会逐步丰富模型 CenterNet FP16 Supported - - + Supported INT8 @@ -582,6 +681,17 @@ DeepSparkInference将按季度进行版本更新,后续会逐步丰富模型 - - + + PAA + FP16 + Supported + + + + INT8 + + + RetinaFace FP16 @@ -692,6 +802,28 @@ DeepSparkInference将按季度进行版本更新,后续会逐步丰富模型 Supported Supported + + YOLOv9 + FP16 + Supported + + + + INT8 + + + + + YOLOv10 + FP16 + Supported + + + + INT8 + + + YOLOX FP16 @@ -728,6 +860,39 @@ DeepSparkInference将按季度进行版本更新,后续会逐步丰富模型 +### OCR + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + +
| Models | Precision | IGIE | IxRT |
| --- | --- | --- | --- |
| Kie_layoutXLM | FP16 | Supported | - |
| | INT8 | - | - |
| Rec_SVTR | FP16 | Supported | - |
| | INT8 | - | - |
+ ### Pose Estimation @@ -737,11 +902,22 @@ DeepSparkInference将按季度进行版本更新,后续会逐步丰富模型 + + + + + + + + + + + - + @@ -945,13 +1121,19 @@ DeepSparkInference将按季度进行版本更新,后续会逐步丰富模型 - + - + + + + + + + @@ -962,9 +1144,15 @@ DeepSparkInference将按季度进行版本更新,后续会逐步丰富模型 - + + + + + + + @@ -979,12 +1167,36 @@ DeepSparkInference将按季度进行版本更新,后续会逐步丰富模型 + + + + + + + + + + + + + + + + + + + + + + + +
IGIE IxRT
Lightweight OpenPoseFP16Supported
INT8--
RTMPose FP16 Supported-Supported
INT8
ChatGLM-3-6BSupportedSupported - -
Llama2-7BChatGLM-3-6B-32KSupported --
Llama2-7BSupported Supported -
-
Qwen-7BMiniCPM-V-2Supported - -
Qwen-7BSupported- Supported
- -
Qwen1.5-32B ChatSupported--
Qwen1.5-72B Supported - -
Qwen2-7B InstructSupported--
Qwen2-72B InstructSupported--
StableLM2-1.6BSupported--
## Speech diff --git a/models/cv/classification/resnetv1d50/igie/README.md b/models/cv/classification/resnet_v1_d50/igie/README.md similarity index 100% rename from models/cv/classification/resnetv1d50/igie/README.md rename to models/cv/classification/resnet_v1_d50/igie/README.md diff --git a/models/cv/classification/resnetv1d50/igie/build_engine.py b/models/cv/classification/resnet_v1_d50/igie/build_engine.py similarity index 100% rename from models/cv/classification/resnetv1d50/igie/build_engine.py rename to models/cv/classification/resnet_v1_d50/igie/build_engine.py diff --git a/models/cv/classification/resnetv1d50/igie/export.py b/models/cv/classification/resnet_v1_d50/igie/export.py similarity index 100% rename from models/cv/classification/resnetv1d50/igie/export.py rename to models/cv/classification/resnet_v1_d50/igie/export.py diff --git a/models/cv/classification/resnetv1d50/igie/inference.py b/models/cv/classification/resnet_v1_d50/igie/inference.py similarity index 100% rename from models/cv/classification/resnetv1d50/igie/inference.py rename to models/cv/classification/resnet_v1_d50/igie/inference.py diff --git a/models/cv/classification/resnetv1d50/igie/requirements.txt b/models/cv/classification/resnet_v1_d50/igie/requirements.txt similarity index 100% rename from models/cv/classification/resnetv1d50/igie/requirements.txt rename to models/cv/classification/resnet_v1_d50/igie/requirements.txt diff --git a/models/cv/classification/resnetv1d50/igie/scripts/infer_resnetv1d50_fp16_accuracy.sh b/models/cv/classification/resnet_v1_d50/igie/scripts/infer_resnetv1d50_fp16_accuracy.sh similarity index 100% rename from models/cv/classification/resnetv1d50/igie/scripts/infer_resnetv1d50_fp16_accuracy.sh rename to models/cv/classification/resnet_v1_d50/igie/scripts/infer_resnetv1d50_fp16_accuracy.sh diff --git a/models/cv/classification/resnetv1d50/igie/scripts/infer_resnetv1d50_fp16_performance.sh 
b/models/cv/classification/resnet_v1_d50/igie/scripts/infer_resnetv1d50_fp16_performance.sh similarity index 100% rename from models/cv/classification/resnetv1d50/igie/scripts/infer_resnetv1d50_fp16_performance.sh rename to models/cv/classification/resnet_v1_d50/igie/scripts/infer_resnetv1d50_fp16_performance.sh diff --git a/models/cv/ocr/kie_layoutxlm/README.md b/models/cv/ocr/kie_layoutxlm/igie/README.md similarity index 100% rename from models/cv/ocr/kie_layoutxlm/README.md rename to models/cv/ocr/kie_layoutxlm/igie/README.md diff --git a/models/cv/ocr/kie_layoutxlm/build_engine.py b/models/cv/ocr/kie_layoutxlm/igie/build_engine.py similarity index 100% rename from models/cv/ocr/kie_layoutxlm/build_engine.py rename to models/cv/ocr/kie_layoutxlm/igie/build_engine.py diff --git a/models/cv/ocr/kie_layoutxlm/inference.py b/models/cv/ocr/kie_layoutxlm/igie/inference.py similarity index 100% rename from models/cv/ocr/kie_layoutxlm/inference.py rename to models/cv/ocr/kie_layoutxlm/igie/inference.py diff --git a/models/cv/ocr/kie_layoutxlm/scripts/infer_kie_ser_fp16_accuracy.sh b/models/cv/ocr/kie_layoutxlm/igie/scripts/infer_kie_ser_fp16_accuracy.sh similarity index 100% rename from models/cv/ocr/kie_layoutxlm/scripts/infer_kie_ser_fp16_accuracy.sh rename to models/cv/ocr/kie_layoutxlm/igie/scripts/infer_kie_ser_fp16_accuracy.sh diff --git a/models/cv/ocr/kie_layoutxlm/scripts/infer_kie_ser_fp16_performance.sh b/models/cv/ocr/kie_layoutxlm/igie/scripts/infer_kie_ser_fp16_performance.sh similarity index 100% rename from models/cv/ocr/kie_layoutxlm/scripts/infer_kie_ser_fp16_performance.sh rename to models/cv/ocr/kie_layoutxlm/igie/scripts/infer_kie_ser_fp16_performance.sh diff --git a/models/cv/ocr/kie_layoutxlm/ser_vi_layoutxlm_xfund_zh.yml b/models/cv/ocr/kie_layoutxlm/igie/ser_vi_layoutxlm_xfund_zh.yml similarity index 100% rename from models/cv/ocr/kie_layoutxlm/ser_vi_layoutxlm_xfund_zh.yml rename to models/cv/ocr/kie_layoutxlm/igie/ser_vi_layoutxlm_xfund_zh.yml 
diff --git a/models/cv/ocr/rec_svtr/README.md b/models/cv/ocr/rec_svtr/igie/README.md similarity index 100% rename from models/cv/ocr/rec_svtr/README.md rename to models/cv/ocr/rec_svtr/igie/README.md diff --git a/models/cv/ocr/rec_svtr/build_engine.py b/models/cv/ocr/rec_svtr/igie/build_engine.py similarity index 100% rename from models/cv/ocr/rec_svtr/build_engine.py rename to models/cv/ocr/rec_svtr/igie/build_engine.py diff --git a/models/cv/ocr/rec_svtr/inference.py b/models/cv/ocr/rec_svtr/igie/inference.py similarity index 100% rename from models/cv/ocr/rec_svtr/inference.py rename to models/cv/ocr/rec_svtr/igie/inference.py diff --git a/models/cv/ocr/rec_svtr/rec_svtr_tiny_6local_6global_stn_en.yml b/models/cv/ocr/rec_svtr/igie/rec_svtr_tiny_6local_6global_stn_en.yml similarity index 100% rename from models/cv/ocr/rec_svtr/rec_svtr_tiny_6local_6global_stn_en.yml rename to models/cv/ocr/rec_svtr/igie/rec_svtr_tiny_6local_6global_stn_en.yml diff --git a/models/cv/ocr/rec_svtr/scripts/infer_svtr_fp16_accuracy.sh b/models/cv/ocr/rec_svtr/igie/scripts/infer_svtr_fp16_accuracy.sh similarity index 100% rename from models/cv/ocr/rec_svtr/scripts/infer_svtr_fp16_accuracy.sh rename to models/cv/ocr/rec_svtr/igie/scripts/infer_svtr_fp16_accuracy.sh diff --git a/models/cv/ocr/rec_svtr/scripts/infer_svtr_fp16_performance.sh b/models/cv/ocr/rec_svtr/igie/scripts/infer_svtr_fp16_performance.sh similarity index 100% rename from models/cv/ocr/rec_svtr/scripts/infer_svtr_fp16_performance.sh rename to models/cv/ocr/rec_svtr/igie/scripts/infer_svtr_fp16_performance.sh diff --git a/models/cv/pose_estimation/rtmpose/ixrt/README.md b/models/cv/pose_estimation/rtmpose/ixrt/README.md index e278c8e3c2f673194428fda2c1168e80d0aea724..3e6b68a47647044b2b9116ec57303bef9206f899 100644 --- a/models/cv/pose_estimation/rtmpose/ixrt/README.md +++ b/models/cv/pose_estimation/rtmpose/ixrt/README.md @@ -45,7 +45,9 @@ python3 export.py --weight data/rtmpose/rtmpose-m_simcc-aic-coco_pt-aic-coco_420 
onnxsim data/rtmpose/rtmpose.onnx data/rtmpose/rtmpose_opt.onnx ``` -## TestSample +## Inference + +### FP16 ```bash python3 predict.py --model data/rtmpose/rtmpose_opt.onnx --precision fp16 --img_path demo/demo.jpg diff --git a/models/nlp/large_language_model/qwen2-7b/vllm/README.md b/models/nlp/large_language_model/qwen2-7b/vllm/README.md index ebf5c00c98e717dd41137e186fe53c3b68ce7144..6cfc785858a7cc6f96699f267f9b3b357ed43840 100755 --- a/models/nlp/large_language_model/qwen2-7b/vllm/README.md +++ b/models/nlp/large_language_model/qwen2-7b/vllm/README.md @@ -1,4 +1,4 @@ -# Qwen2-7B-Instruct +# Qwen2-7B Instruct ## Description diff --git a/models/nlp/large_language_model/stablelm/vllm/README.md b/models/nlp/large_language_model/stablelm/vllm/README.md index 603f6732f52636e2e9fe55155bc6f5fe5461214e..e9d1b7e4fb0b7c65c7b793bf6f80cf36b667bf7e 100644 --- a/models/nlp/large_language_model/stablelm/vllm/README.md +++ b/models/nlp/large_language_model/stablelm/vllm/README.md @@ -1,4 +1,4 @@ -# StableLm-2-1_6B +# StableLM2-1.6B ## Description