diff --git a/.github/workflows/_base_test.yml b/.github/workflows/_base_test.yml index 283db8de945..e4b10e3b3a4 100644 --- a/.github/workflows/_base_test.yml +++ b/.github/workflows/_base_test.yml @@ -206,20 +206,6 @@ jobs: check_service 90 python -m pytest -sv test_max_waiting_time.py || TEST_EXIT_CODE=1 - curl -X POST http://0.0.0.0:${FLASK_PORT}/switch \ - -H "Content-Type: application/json" \ - -d "{\"--model\": \"/MODELDATA/ernie-4_5-21b-a3b-bf16-paddle\", \"--config\": \"21b_mtp.yaml\", \"--enable-logprob\": \"False\"}" - check_service 180 - export TEMPLATE=TOKEN_NORMAL - python -m pytest -sv test_seed_usage.py -k "not test_seed_stream" || TEST_EXIT_CODE=1 - - curl -X POST http://0.0.0.0:${FLASK_PORT}/switch \ - -H "Content-Type: application/json" \ - -d "{\"--model\": \"/MODELDATA/ernie-4_5-21b-a3b-bf16-paddle\", \"--config\": \"21b_sot.yaml\", \"--enable-logprob\": \"False\"}" - check_service 360 - export TEMPLATE=TOKEN_NORMAL - python -m pytest -sv test_seed_usage.py -k "not test_seed_stream" || TEST_EXIT_CODE=1 - popd echo "TEST_EXIT_CODE=${TEST_EXIT_CODE}" >> /workspace/FastDeploy/exit_code.env ' diff --git a/.github/workflows/ce_job.yml b/.github/workflows/ce_job.yml index 19e79dbaf0f..e84e1c8a1a4 100644 --- a/.github/workflows/ce_job.yml +++ b/.github/workflows/ce_job.yml @@ -191,7 +191,7 @@ jobs: commit_id=${{ github.sha }} branch_name=${{ github.ref_name }} - target_path=paddle-qa/paddle-pipeline/FastDeploy_ActionCE/SM${COMPILE_ARCH//,/_}/${branch_name}/${commit_id} + target_path=paddle-qa/paddle-pipeline/FastDeploy_ActionCE/cu126/SM${COMPILE_ARCH//,/_}/${branch_name}/${commit_id} wget -q --no-proxy --no-check-certificate https://paddle-qa.bj.bcebos.com/CodeSync/develop/PaddlePaddle/PaddleTest/tools/bos_tools.py push_file=$(realpath bos_tools.py) @@ -201,7 +201,7 @@ jobs: target_path_stripped="${target_path#paddle-qa/}" WHEEL_PATH=https://paddle-qa.bj.bcebos.com/${target_path_stripped}/${filename} - target_path_latest=paddle-qa/paddle-pipeline/FastDeploy_ActionCE/SM${COMPILE_ARCH//,/_}/${branch_name}/latest + target_path_latest=paddle-qa/paddle-pipeline/FastDeploy_ActionCE/cu126/SM${COMPILE_ARCH//,/_}/${branch_name}/latest python ${push_file} ${filename} ${target_path_latest} target_path_stripped_latest="${target_path_latest#paddle-qa/}" WHEEL_PATH_LATEST=https://paddle-qa.bj.bcebos.com/${target_path_stripped_latest}/${filename} @@ -230,7 +230,7 @@ jobs: commit_id=${{ github.sha }} branch_name=${{ github.ref_name }} - target_path=paddle-qa/paddle-pipeline/FastDeploy_ActionCE/SM${COMPILE_ARCH//,/_}/${branch_name}/${commit_id} + target_path=paddle-qa/paddle-pipeline/FastDeploy_ActionCE/cu126/SM${COMPILE_ARCH//,/_}/${branch_name}/${commit_id} wget -q --no-proxy --no-check-certificate https://paddle-qa.bj.bcebos.com/CodeSync/develop/PaddlePaddle/PaddleTest/tools/bos_tools.py push_file=$(realpath bos_tools.py) @@ -240,7 +240,7 @@ jobs: target_path_stripped="${target_path#paddle-qa/}" WHEEL_PATH=https://paddle-qa.bj.bcebos.com/${target_path_stripped}/${filename} - target_path_latest=paddle-qa/paddle-pipeline/FastDeploy_ActionCE/SM${COMPILE_ARCH//,/_}/${branch_name}/latest + target_path_latest=paddle-qa/paddle-pipeline/FastDeploy_ActionCE/cu126/SM${COMPILE_ARCH//,/_}/${branch_name}/latest python ${push_file} ${filename} ${target_path_latest} target_path_stripped_latest="${target_path_latest#paddle-qa/}" WHEEL_PATH_LATEST=https://paddle-qa.bj.bcebos.com/${target_path_stripped_latest}/${filename} diff --git a/.github/workflows/pr_build_and_test.yml b/.github/workflows/pr_build_and_test.yml index 23eb2fefa89..620bf9fc40d 100644 --- a/.github/workflows/pr_build_and_test.yml +++ b/.github/workflows/pr_build_and_test.yml @@ -75,23 +75,3 @@ jobs: FASTDEPLOY_ARCHIVE_URL: ${{ needs.clone.outputs.repo_archive_url }} FASTDEPLOY_WHEEL_URL: ${{ needs.build.outputs.wheel_path }} MODEL_CACHE_DIR: "/ssd2/actions-runner/ModelData" - - accuracy_test: - name: Run Accuracy Tests - needs: [clone,build] - uses: ./.github/workflows/_accuracy_test.yml - with: - DOCKER_IMAGE: ccr-2vdh3abv-pub.cnc.bj.baidubce.com/paddlepaddle/paddleqa:fastdeploy-ciuse-cuda126-dailyupdate - FASTDEPLOY_ARCHIVE_URL: ${{ needs.clone.outputs.repo_archive_url }} - FASTDEPLOY_WHEEL_URL: ${{ needs.build.outputs.wheel_path }} - MODEL_CACHE_DIR: "/ssd2/actions-runner/ModelData" - - stable_test: - name: Run Stable Tests - needs: [clone,build] - uses: ./.github/workflows/_stable_test.yml - with: - DOCKER_IMAGE: ccr-2vdh3abv-pub.cnc.bj.baidubce.com/paddlepaddle/paddleqa:fastdeploy-ciuse-cuda126-dailyupdate - FASTDEPLOY_ARCHIVE_URL: ${{ needs.clone.outputs.repo_archive_url }} - FASTDEPLOY_WHEEL_URL: ${{ needs.build.outputs.wheel_path }} - MODEL_CACHE_DIR: "/ssd2/actions-runner/ModelData" diff --git a/.github/workflows/publish_job.yml b/.github/workflows/publish_job.yml index a176f929daf..fc67b5faafa 100644 --- a/.github/workflows/publish_job.yml +++ b/.github/workflows/publish_job.yml @@ -377,5 +377,5 @@ jobs: with: DOCKER_IMAGE: ccr-2vdh3abv-pub.cnc.bj.baidubce.com/paddlepaddle/paddleqa:fastdeploy-ciuse-cuda126-dailyupdate FASTDEPLOY_ARCHIVE_URL: ${{ needs.clone.outputs.repo_archive_url }} - FASTDEPLOY_WHEEL_URL: ${{ needs.build.outputs.wheel_path }} + FASTDEPLOY_WHEEL_URL: ${{ needs.build_sm8090.outputs.wheel_path }} MODEL_CACHE_DIR: "/ssd2/actions-runner/ModelData" diff --git a/tests/ce/deploy/21b_mtp.yaml b/tests/ce/deploy/21b_mtp.yaml deleted file mode 100644 index 75224062561..00000000000 --- a/tests/ce/deploy/21b_mtp.yaml +++ /dev/null @@ -1,8 +0,0 @@ -max_model_len: 32768 -max_num_seqs: 128 -tensor_parallel_size: 1 -quantization: wint4 -speculative_config: - method: mtp - num_speculative_tokens: 1 - model: /MODELDATA/ernie-4_5-21b-a3b-bf16-paddle/mtp/ diff --git a/tests/ce/deploy/21b_sot.yaml b/tests/ce/deploy/21b_sot.yaml deleted file mode 100644 index 243e5335b6b..00000000000 --- a/tests/ce/deploy/21b_sot.yaml +++ /dev/null @@ -1,9 +0,0 @@ -max_model_len: 32768 -max_num_seqs: 128 -tensor_parallel_size: 1 -quantization: wint4 -graph_optimization_config: - graph_opt_level: 1 - sot_warmup_sizes: [2,16,32,64] - use_cudagraph: True - full_cuda_graph: False