diff --git a/euler-copilot-fast-inference/1.0.0/22.03-lts-sp3/Dockerfile b/euler-copilot-fast-inference-qwen/1.5/22.03-lts-sp3/Dockerfile similarity index 42% rename from euler-copilot-fast-inference/1.0.0/22.03-lts-sp3/Dockerfile rename to euler-copilot-fast-inference-qwen/1.5/22.03-lts-sp3/Dockerfile index 5a4bcdb3598b0c54365a80e58971f9a8e7e9b991..c3122a28566ab69f12d4a4439249572a0803569d 100644 --- a/euler-copilot-fast-inference/1.0.0/22.03-lts-sp3/Dockerfile +++ b/euler-copilot-fast-inference-qwen/1.5/22.03-lts-sp3/Dockerfile @@ -2,9 +2,11 @@ ARG BASE=openeuler/openeuler:22.03-lts-sp3 FROM ${BASE} RUN yum upgrade -y && \ - yum -y install gcc make && \ + yum -y install gcc make wget && \ yum clean all -RUN mkdir -p /home/euler-copilot-fast-inference +RUN mkdir -p /home/euler-copilot-fast-inference &&\ + cd /home/euler-copilot-fast-inference &&\ + wget https://hf-mirror.com/Qwen/Qwen1.5-1.8B-Chat-GGUF/resolve/main/qwen1_5-1_8b-chat-q4_0.gguf ENV OMP_NUM_THREADS=16 COPY fast-llm /home/euler-copilot-fast-inference \ No newline at end of file diff --git a/euler-copilot-fast-inference/1.0.0/22.03-lts-sp3/fast-llm b/euler-copilot-fast-inference-qwen/1.5/22.03-lts-sp3/fast-llm similarity index 100% rename from euler-copilot-fast-inference/1.0.0/22.03-lts-sp3/fast-llm rename to euler-copilot-fast-inference-qwen/1.5/22.03-lts-sp3/fast-llm diff --git a/euler-copilot-fast-inference/README.md b/euler-copilot-fast-inference-qwen/README.md similarity index 68% rename from euler-copilot-fast-inference/README.md rename to euler-copilot-fast-inference-qwen/README.md index 8e8b3aa8822da8ce66cbf5ea24349efa001a66b2..02287077f60b4bda013b42653fbf71eea3693721 100644 --- a/euler-copilot-fast-inference/README.md +++ b/euler-copilot-fast-inference-qwen/README.md @@ -1,11 +1,14 @@ # Quick reference -# euler-copilot-fast-inference | openEuler +# euler-copilot-fast-inference-qwen | openEuler An inference framework that can be used for large-scale CPU inference, based on the Kunpeng and 
openEuler basic image, containerized package after release, can be used for one-click deployment # Supported tags and respective Dockerfile links -tags of the current container image: openeuler/euler-copilot-fast-inference:1.0.0-oe2203sp3 -Link to dockerfile is (https://gitee.com/openeuler/openeuler-docker-images/blob/master/euler-copilot-fast-inference/1.0.0/22.03-lts-sp3/Dockerfile) +The tag of each euler-copilot-fast-inference-qwen docker image consists of the version of euler-copilot-fast-inference-qwen and the version of the basic image. The details are as follows: + +| Tags | Currently | Architectures | +| ------------------------------------------------------------ | ------------------------------------------------------------ | ------------- | +| [1.5-oe2203sp3](https://gitee.com/openeuler/openeuler-docker-images/blob/master/euler-copilot-fast-inference-qwen/1.5/22.03-lts-sp3/Dockerfile) | euler-copilot-fast-inference-qwen 1.5 on openEuler 22.03-lts-sp3 | arm64 | # Usage: 1. Start the container based on the application image @@ -32,9 +35,7 @@ Link to dockerfile is (https://gitee.com/openeuler/openeuler-docker-images/blob/ # cd source code cd euler-copilot-fast-inference # start docker - docker run --name **** -it -d --net=host --privileged=true --entrypoint=bash openeuler/fast-llm:1.0.0-oe2203sp3 - # copy weight file - docker cp qwen1_5-7b-chat-q4_0.gguf :/home/euler-copilot-fast-inference + docker run --name **** -it -d --net=host --privileged=true --entrypoint=bash openeuler/euler-copilot-fast-inference-qwen:1.5-oe2203sp3 # start inference docker exec -it bash cd /home/euler-copilot-fast-inference diff --git a/euler-copilot-fast-inference/doc/image-info.yml b/euler-copilot-fast-inference-qwen/doc/image-info.yml similarity index 55% rename from euler-copilot-fast-inference/doc/image-info.yml rename to euler-copilot-fast-inference-qwen/doc/image-info.yml index deb705277c339c14c811b26e6b5ecb6fc5de9bc2..a529d20d97cefa16228a0841fd4896cb95430f68 100644 --- 
a/euler-copilot-fast-inference/doc/image-info.yml +++ b/euler-copilot-fast-inference-qwen/doc/image-info.yml @@ -1,22 +1,22 @@ -name: euler-copilot-fast-inference +name: euler-copilot-fast-inference-qwen category: ai -description: euler-copilot-fast-inference是一个用于验证鲲鹏CPU推理引擎的相关组件,可用于CPU推理测试。 +description: euler-copilot-fast-inference-qwen是一个用于验证鲲鹏CPU推理引擎的相关组件,可用于CPU推理测试。 environment: | 本应用在Docker环境中运行,安装Docker执行如下命令 ``` yum install -y docker ``` tags: | - euler-copilot-fast-inference镜像的Tag由其版本信息和基础镜像版本信息组成,详细内容如下 + euler-copilot-fast-inference-qwen镜像的Tag由其版本信息和基础镜像版本信息组成,详细内容如下 | Tag | Currently | Architectures | |----------|-------------|------------------| - |[1.0.0-oe2203sp3](https://gitee.com/openeuler/openeuler-docker-images/blob/master/euler-copilot-fast-inference/1.0.0/22.03-lts-sp3/Dockerfile)| euler-copilot-fast-inference 1.0.0 on openEuler 22.03-LTS-sp3 | arm64 | + |[1.5-oe2203sp3](https://gitee.com/openeuler/openeuler-docker-images/blob/master/euler-copilot-fast-inference-qwen/1.5/22.03-lts-sp3/Dockerfile)| euler-copilot-fast-inference-qwen 1.5 on openEuler 22.03-LTS-sp3 | arm64 | download: | - 由于euler-copilot-fast-inference镜像体积较大,建议单独pull到本地后再启动容器: + 由于euler-copilot-fast-inference-qwen镜像体积较大,建议单独pull到本地后再启动容器: ``` - docker pull openeuler/euler-copilot-fast-inference:{Tag} + docker pull openeuler/euler-copilot-fast-inference-qwen:{Tag} ``` usage: | @@ -30,9 +30,7 @@ usage: | # 进入源码目录 cd mptcp_net-next # 启动容器 - docker run --name **** -it -d --net=host --privileged=true --entrypoint=bash openeuler/fast-llm:1.0.0-oe2203sp3 - # copy权重文件 - docker cp qwen1_5-7b-chat-q4_0.gguf :/home/euler-copilot-fast-inference + docker run --name **** -it -d --net=host --privileged=true --entrypoint=bash openeuler/euler-copilot-fast-inference-qwen:1.5-oe2203sp3 # 进入docker执行推理 docker exec -it bash cd /home/euler-copilot-fast-inference diff --git a/euler-copilot-fast-inference-qwen/doc/picture/logo.jpg b/euler-copilot-fast-inference-qwen/doc/picture/logo.jpg new file mode 100644 
index 0000000000000000000000000000000000000000..3ae1e255268d7e02e19ca1c6eca697deea09fbd5 Binary files /dev/null and b/euler-copilot-fast-inference-qwen/doc/picture/logo.jpg differ diff --git a/euler-copilot-fast-inference-qwen/meta.yml b/euler-copilot-fast-inference-qwen/meta.yml new file mode 100644 index 0000000000000000000000000000000000000000..dcddfd056d0842307a5ca6780edfe054eb23eabe --- /dev/null +++ b/euler-copilot-fast-inference-qwen/meta.yml @@ -0,0 +1,3 @@ +1.5-oe2203sp3: + path: euler-copilot-fast-inference-qwen/1.5/22.03-lts-sp3/Dockerfile + arch: aarch64 \ No newline at end of file diff --git a/euler-copilot-fast-inference/meta.yml b/euler-copilot-fast-inference/meta.yml deleted file mode 100644 index 749bac73dd9c3862330351518e458eb52ef3c818..0000000000000000000000000000000000000000 --- a/euler-copilot-fast-inference/meta.yml +++ /dev/null @@ -1,2 +0,0 @@ -1.0.0-oe2203sp3: - path: euler-copilot-fast-inference/1.0.0/22.03-lts-sp3/Dockerfile \ No newline at end of file