mirror of
https://github.com/PaddlePaddle/FastDeploy.git
synced 2026-04-23 00:17:25 +08:00
[Iluvartar][CI] Fix the error max_tokens_per_expert referenced before assignment (#6083)
This commit is contained in:
@@ -7,7 +7,7 @@ on:
|
||||
description: "Build Images"
|
||||
required: true
|
||||
type: string
|
||||
default: "ccr-2vdh3abv-pub.cnc.bj.baidubce.com/device/paddle-ixuca:fd-ci"
|
||||
default: "ccr-2vdh3abv-pub.cnc.bj.baidubce.com/device/paddle-ixuca:3.3.0"
|
||||
FASTDEPLOY_ARCHIVE_URL:
|
||||
description: "URL of the compressed FastDeploy code archive."
|
||||
required: true
|
||||
|
||||
@@ -19,5 +19,5 @@ jobs:
|
||||
needs: [clone]
|
||||
uses: ./.github/workflows/_iluvatar_cases.yml
|
||||
with:
|
||||
DOCKER_IMAGE: ccr-2vdh3abv-pub.cnc.bj.baidubce.com/device/paddle-ixuca:fd-ci
|
||||
DOCKER_IMAGE: ccr-2vdh3abv-pub.cnc.bj.baidubce.com/device/paddle-ixuca:3.3.0
|
||||
FASTDEPLOY_ARCHIVE_URL: ${{ needs.clone.outputs.repo_archive_url }}
|
||||
|
||||
@@ -323,6 +323,7 @@ class CutlassMoEMethod(UnquantizedFusedMoEMethod):
|
||||
topk_only_mode=True,
|
||||
)
|
||||
dequant_scale = None
|
||||
max_tokens_per_expert = None
|
||||
else:
|
||||
(
|
||||
permute_input,
|
||||
@@ -365,6 +366,7 @@ class CutlassMoEMethod(UnquantizedFusedMoEMethod):
|
||||
topk_only_mode=False,
|
||||
)
|
||||
dequant_scale = None
|
||||
max_tokens_per_expert = None
|
||||
else:
|
||||
(
|
||||
permute_input,
|
||||
|
||||
@@ -2,6 +2,8 @@
|
||||
DIR="$(cd "$(dirname "${BASH_SOURCE[0]}")" && pwd)"
|
||||
echo "$DIR"
|
||||
|
||||
ixsmi
|
||||
|
||||
#先kill一遍
|
||||
ps -efww | grep -E 'run_ernie300B_4layer' | grep -v grep | awk '{print $2}' | xargs kill -9 || true
|
||||
|
||||
@@ -232,7 +234,7 @@ if [ ${exit_code} -ne 0 ]; then
|
||||
exit 1
|
||||
fi
|
||||
|
||||
expected_strings="Buddhist statue"
|
||||
expected_strings="Buddhist"
|
||||
if grep -q "$expected_strings" "$result_file"; then
|
||||
echo -e "\nPASSED"
|
||||
else
|
||||
|
||||
Reference in New Issue
Block a user