From 2028adcd5b4321eac559f2b498207b7b635cc0a7 Mon Sep 17 00:00:00 2001 From: liyu319 Date: Thu, 29 May 2025 08:58:47 +0000 Subject: [PATCH] =?UTF-8?q?readme=E6=9B=B4=E6=96=B0?= MIME-Version: 1.0 Content-Type: text/plain; charset=UTF-8 Content-Transfer-Encoding: 8bit Signed-off-by: liyu319 --- MindIE/LLM/QwQ/QwQ-32B/README.md | 2 +- MindIE/LLM/Qwen3/Qwen3-0.6B-Base/README.md | 2 +- MindIE/LLM/Qwen3/Qwen3-0.6B/README.md | 2 +- MindIE/LLM/Qwen3/Qwen3-1.7B-Base/README.md | 2 +- MindIE/LLM/Qwen3/Qwen3-1.7B/README.md | 2 +- MindIE/LLM/Qwen3/Qwen3-14B-Base/README.md | 2 +- MindIE/LLM/Qwen3/Qwen3-14B/README.md | 2 +- MindIE/LLM/Qwen3/Qwen3-32B/README.md | 12 ++++++------ MindIE/LLM/Qwen3/Qwen3-4B-Base/README.md | 2 +- MindIE/LLM/Qwen3/Qwen3-4B/README.md | 2 +- MindIE/LLM/Qwen3/Qwen3-8B-Base/README.md | 2 +- MindIE/LLM/Qwen3/Qwen3-8B/README.md | 2 +- 12 files changed, 17 insertions(+), 17 deletions(-) diff --git a/MindIE/LLM/QwQ/QwQ-32B/README.md b/MindIE/LLM/QwQ/QwQ-32B/README.md index 90d64bc478..0ff7862baf 100644 --- a/MindIE/LLM/QwQ/QwQ-32B/README.md +++ b/MindIE/LLM/QwQ/QwQ-32B/README.md @@ -116,7 +116,7 @@ torchrun --nproc_per_node 4 \ --master_port 20037 \ -m examples.run_pa \ --model_path {权重路径} \ - --trust_remote_code + --trust_remote_code \ --max_output_length 32 ``` diff --git a/MindIE/LLM/Qwen3/Qwen3-0.6B-Base/README.md b/MindIE/LLM/Qwen3/Qwen3-0.6B-Base/README.md index 9ed0c88a02..091fe827fb 100644 --- a/MindIE/LLM/Qwen3/Qwen3-0.6B-Base/README.md +++ b/MindIE/LLM/Qwen3/Qwen3-0.6B-Base/README.md @@ -109,7 +109,7 @@ torchrun --nproc_per_node 1 \ --master_port 20037 \ -m examples.run_pa \ --model_path {权重路径} \ - --trust_remote_code + --trust_remote_code \ --max_output_length 256 ``` diff --git a/MindIE/LLM/Qwen3/Qwen3-0.6B/README.md b/MindIE/LLM/Qwen3/Qwen3-0.6B/README.md index 41f9d33b5a..0de6b81f35 100644 --- a/MindIE/LLM/Qwen3/Qwen3-0.6B/README.md +++ b/MindIE/LLM/Qwen3/Qwen3-0.6B/README.md @@ -109,7 +109,7 @@ torchrun --nproc_per_node 2 \ --master_port 20037 \ -m examples.run_pa \ --model_path {权重路径} \ - --trust_remote_code + --trust_remote_code \ --max_output_length 256 ``` diff --git a/MindIE/LLM/Qwen3/Qwen3-1.7B-Base/README.md b/MindIE/LLM/Qwen3/Qwen3-1.7B-Base/README.md index 715bed2242..a9536a0ac3 100644 --- a/MindIE/LLM/Qwen3/Qwen3-1.7B-Base/README.md +++ b/MindIE/LLM/Qwen3/Qwen3-1.7B-Base/README.md @@ -108,7 +108,7 @@ torchrun --nproc_per_node 2 \ --master_port 20037 \ -m examples.run_pa \ --model_path {权重路径} \ - --trust_remote_code + --trust_remote_code \ --max_output_length 256 ``` diff --git a/MindIE/LLM/Qwen3/Qwen3-1.7B/README.md b/MindIE/LLM/Qwen3/Qwen3-1.7B/README.md index 9df7ec9865..a0bb232d04 100644 --- a/MindIE/LLM/Qwen3/Qwen3-1.7B/README.md +++ b/MindIE/LLM/Qwen3/Qwen3-1.7B/README.md @@ -109,7 +109,7 @@ torchrun --nproc_per_node 2 \ --master_port 20037 \ -m examples.run_pa \ --model_path {权重路径} \ - --trust_remote_code + --trust_remote_code \ --max_output_length 256 ``` diff --git a/MindIE/LLM/Qwen3/Qwen3-14B-Base/README.md b/MindIE/LLM/Qwen3/Qwen3-14B-Base/README.md index a412dfbaf5..1878a2762f 100644 --- a/MindIE/LLM/Qwen3/Qwen3-14B-Base/README.md +++ b/MindIE/LLM/Qwen3/Qwen3-14B-Base/README.md @@ -109,7 +109,7 @@ torchrun --nproc_per_node 2 \ --master_port 20037 \ -m examples.run_pa \ --model_path {权重路径} \ - --trust_remote_code + --trust_remote_code \ --max_output_length 256 ``` diff --git a/MindIE/LLM/Qwen3/Qwen3-14B/README.md b/MindIE/LLM/Qwen3/Qwen3-14B/README.md index 4032fd02a1..dda0e14a75 100644 --- a/MindIE/LLM/Qwen3/Qwen3-14B/README.md +++ b/MindIE/LLM/Qwen3/Qwen3-14B/README.md @@ -132,7 +132,7 @@ torchrun --nproc_per_node 2 \ --master_port 20037 \ -m examples.run_pa \ --model_path {权重路径} \ - --trust_remote_code + --trust_remote_code \ --max_output_length 256 ``` diff --git a/MindIE/LLM/Qwen3/Qwen3-32B/README.md b/MindIE/LLM/Qwen3/Qwen3-32B/README.md index 7afa633fd2..2d2bd5f3f8 100644 --- a/MindIE/LLM/Qwen3/Qwen3-32B/README.md +++ b/MindIE/LLM/Qwen3/Qwen3-32B/README.md @@ -105,11 +105,11 @@ export MINDIE_LOG_TO_STDOUT=1 执行对话测试 ```shell -torchrun --nproc_per_node 2 \ +torchrun --nproc_per_node 4 \ --master_port 20037 \ -m examples.run_pa \ --model_path {权重路径} \ - --trust_remote_code + --trust_remote_code \ --max_output_length 256 ``` @@ -122,9 +122,9 @@ cd $ATB_SPEED_HOME_PATH/tests/modeltest/ ```shell bash run.sh pa_[data_type] performance [case_pair] [batch_size] ([prefill_batch_size]) [model_name] ([is_chat_model]) (lora [lora_data_path]) [weight_dir] ([trust_remote_code]) [chip_num] ([parallel_params]) ([max_position_embedding/max_sequence_length]) ``` -具体执行batch=1, 输入长度256, 输出长度256用例的2卡并行性能测试命令为: +具体执行batch=1, 输入长度256, 输出长度256用例的4卡并行性能测试命令为: ```shell -bash run.sh pa_bf16 performance [[256,256]] 1 qwen ${weight_path} 2 +bash run.sh pa_bf16 performance [[256,256]] 1 qwen ${weight_path} 4 ``` > 注:ModelTest为大模型的性能和精度提供测试功能。使用文档请参考`${ATB_SPEED_HOME_PATH}/tests/modeltest/README.md` @@ -157,7 +157,7 @@ vim /usr/local/Ascend/mindie/latest/mindie-service/conf/config.json "BackendConfig": { ... -"npuDeviceIds" : [[0,1]], +"npuDeviceIds" : [[0,1,2,3]], ... "ModelDeployConfig": { @@ -167,7 +167,7 @@ vim /usr/local/Ascend/mindie/latest/mindie-service/conf/config.json ... "modelName" : "qwen3", "modelWeightPath" : "/data/datasets/Qwen3-32B", -"worldSize" : 2, +"worldSize" : 4, ... } ] diff --git a/MindIE/LLM/Qwen3/Qwen3-4B-Base/README.md b/MindIE/LLM/Qwen3/Qwen3-4B-Base/README.md index a1d92b3b35..ce4d9f2d16 100644 --- a/MindIE/LLM/Qwen3/Qwen3-4B-Base/README.md +++ b/MindIE/LLM/Qwen3/Qwen3-4B-Base/README.md @@ -109,7 +109,7 @@ torchrun --nproc_per_node 2 \ --master_port 20037 \ -m examples.run_pa \ --model_path {权重路径} \ - --trust_remote_code + --trust_remote_code \ --max_output_length 256 ``` diff --git a/MindIE/LLM/Qwen3/Qwen3-4B/README.md b/MindIE/LLM/Qwen3/Qwen3-4B/README.md index 53ad29dd58..bd33772e5d 100644 --- a/MindIE/LLM/Qwen3/Qwen3-4B/README.md +++ b/MindIE/LLM/Qwen3/Qwen3-4B/README.md @@ -109,7 +109,7 @@ torchrun --nproc_per_node 2 \ --master_port 20037 \ -m examples.run_pa \ --model_path {权重路径} \ - --trust_remote_code + --trust_remote_code \ --max_output_length 256 ``` diff --git a/MindIE/LLM/Qwen3/Qwen3-8B-Base/README.md b/MindIE/LLM/Qwen3/Qwen3-8B-Base/README.md index 82414c862f..78296fd8ca 100644 --- a/MindIE/LLM/Qwen3/Qwen3-8B-Base/README.md +++ b/MindIE/LLM/Qwen3/Qwen3-8B-Base/README.md @@ -109,7 +109,7 @@ torchrun --nproc_per_node 2 \ --master_port 20037 \ -m examples.run_pa \ --model_path {权重路径} \ - --trust_remote_code + --trust_remote_code \ --max_output_length 256 ``` diff --git a/MindIE/LLM/Qwen3/Qwen3-8B/README.md b/MindIE/LLM/Qwen3/Qwen3-8B/README.md index ad4873dac0..5203461975 100644 --- a/MindIE/LLM/Qwen3/Qwen3-8B/README.md +++ b/MindIE/LLM/Qwen3/Qwen3-8B/README.md @@ -109,7 +109,7 @@ torchrun --nproc_per_node 2 \ --master_port 20037 \ -m examples.run_pa \ --model_path {权重路径} \ - --trust_remote_code + --trust_remote_code \ --max_output_length 256 ``` -- Gitee