diff --git a/scripts/run-glm4.7-30B-A3B.sh b/scripts/run-glm4.7-30B-A3B.sh index bec6bfc492..11aca66b01 100644 --- a/scripts/run-glm4.7-30B-A3B.sh +++ b/scripts/run-glm4.7-30B-A3B.sh @@ -66,7 +66,7 @@ PERF_ARGS=( --sequence-parallel --pipeline-model-parallel-size 2 --context-parallel-size 2 - --expert-model-parallel-size 8 + --expert-model-parallel-size 4 --expert-tensor-parallel-size 1 --decoder-last-pipeline-num-layers 23