-
Notifications
You must be signed in to change notification settings - Fork 26
Commit
This commit does not belong to any branch on this repository, and may belong to a fork outside of the repository.
#9082: t3k demo with slack notifications for owners. split jobs
- Loading branch information
Showing
3 changed files
with
66 additions
and
59 deletions.
There are no files selected for viewing
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
Original file line number | Diff line number | Diff line change |
---|---|---|
@@ -0,0 +1,54 @@ | ||
#!/bin/bash | ||
|
||
#######################################
# Run the T3000 Falcon40B CI tests and log the elapsed wall-clock time.
# Globals:   none written; WH_ARCH_YAML is set only in the environment of
#            each individual pytest invocation.
# Arguments: none
# Outputs:   LOG_METAL start/finish lines on stdout, plus pytest's own output.
# Returns:   0 if every pytest invocation succeeded, 1 if any of them failed.
#######################################
run_t3000_falcon40b_tests() {
  # Keep bookkeeping variables out of the caller's scope so that sourcing
  # this file and calling several run_* functions cannot clobber each other.
  local start_time end_time duration
  local fail=0

  # Record the start time
  start_time=$(date +%s)

  echo "LOG_METAL: Running run_t3000_falcon40b_tests"

  # Each invocation records its failure instead of being silently ignored;
  # later tests still run so that one failure does not hide the others.

  # Falcon40B prefill 60 layer end to end with 10 loops; we need 8x8 grid size
  WH_ARCH_YAML=wormhole_b0_80_arch_eth_dispatch.yaml \
    pytest models/demos/t3000/falcon40b/tests/ci/test_falcon_end_to_end_60_layer_t3000_prefill_10_loops.py \
    || fail=1

  # Falcon40B end to end demo (prefill + decode)
  WH_ARCH_YAML=wormhole_b0_80_arch_eth_dispatch.yaml \
    pytest models/demos/t3000/falcon40b/tests/ci/test_falcon_end_to_end_t3000_demo_loops.py \
    || fail=1

  # Record the end time
  end_time=$(date +%s)
  duration=$((end_time - start_time))
  echo "LOG_METAL: run_t3000_falcon40b_tests $duration seconds to complete"

  # Propagate test failures to the caller (the echo above would otherwise
  # make the function always report success).
  return "$fail"
}
|
||
#######################################
# Run the T3000 Falcon7B demo and perplexity tests and log the elapsed
# wall-clock time.
# Globals:   none written; WH_ARCH_YAML is set only in the environment of
#            each individual pytest invocation.
# Arguments: none
# Outputs:   LOG_METAL start/finish lines on stdout, plus pytest's own output.
# Returns:   0 if every pytest invocation succeeded, 1 if any of them failed.
#######################################
run_t3000_falcon7b_tests() {
  # Keep bookkeeping variables out of the caller's scope.
  local start_time end_time duration
  local fail=0

  # Record the start time
  start_time=$(date +%s)

  echo "LOG_METAL: Running run_t3000_falcon7b_tests"

  # The pytest node IDs below contain "[...]", which the shell would treat as
  # a glob bracket expression if left unquoted; they are single-quoted so they
  # always reach pytest verbatim (even under nullglob/failglob).

  # Falcon7B demo (perf verification and output verification)
  WH_ARCH_YAML=wormhole_b0_80_arch_eth_dispatch.yaml \
    pytest --disable-warnings -q -s --input-method=json \
    --input-path='models/demos/t3000/falcon7b/input_data_t3000.json' \
    'models/demos/t3000/falcon7b/demo_t3000.py::test_demo_multichip[user_input0-8-True-perf_mode_stochastic_verify]' \
    || fail=1
  WH_ARCH_YAML=wormhole_b0_80_arch_eth_dispatch.yaml \
    pytest --disable-warnings -q -s --input-method=json \
    --input-path='models/demos/t3000/falcon7b/input_data_t3000.json' \
    'models/demos/t3000/falcon7b/demo_t3000.py::test_demo_multichip[user_input0-8-True-default_mode_greedy_verify]' \
    || fail=1

  # Falcon7B perplexity test (prefill and decode)
  WH_ARCH_YAML=wormhole_b0_80_arch_eth_dispatch.yaml \
    pytest 'models/demos/falcon7b/tests/test_perplexity_falcon.py::test_perplexity[True-prefill_seq1024_dram]' \
    || fail=1
  WH_ARCH_YAML=wormhole_b0_80_arch_eth_dispatch.yaml \
    pytest 'models/demos/falcon7b/tests/test_perplexity_falcon.py::test_perplexity[True-decode_1024_l1_sharded]' \
    || fail=1

  # Record the end time
  end_time=$(date +%s)
  duration=$((end_time - start_time))
  echo "LOG_METAL: run_t3000_falcon7b_tests $duration seconds to complete"

  # Propagate test failures to the caller instead of the echo's status.
  return "$fail"
}
|
||
#######################################
# Run the T3000 Mixtral8x7B demo test and log the elapsed wall-clock time.
# Globals:   none written.
# Arguments: none
# Outputs:   LOG_METAL start/finish lines on stdout, plus pytest's own output.
# Returns:   0 if the pytest invocation succeeded, 1 if it failed.
#######################################
run_t3000_mixtral_tests() {
  # Keep bookkeeping variables out of the caller's scope.
  local start_time end_time duration
  local fail=0

  # Record the start time
  start_time=$(date +%s)

  # Use the same name as the function and the completion message below so
  # that start/finish log lines can be paired up.
  echo "LOG_METAL: Running run_t3000_mixtral_tests"

  # mixtral8x7b 8 chip demo test - 100 token generation with general weights (env flags set inside the test)
  # The node ID is quoted because "[...]" is otherwise a shell glob pattern.
  pytest 'models/demos/t3000/mixtral8x7b/demo/demo.py::test_mixtral8x7b_demo[wormhole_b0-True-general_weights]' \
    || fail=1

  # Record the end time
  end_time=$(date +%s)
  duration=$((end_time - start_time))
  echo "LOG_METAL: run_t3000_mixtral_tests $duration seconds to complete"

  # Propagate the test failure to the caller instead of the echo's status.
  return "$fail"
}