Skip to content
Closed
Show file tree
Hide file tree
Changes from all commits
Commits
File filter

Filter by extension

Filter by extension


Conversations
Failed to load comments.
Loading
Jump to
Jump to file
Failed to load files.
Loading
Diff view
Diff view
6 changes: 4 additions & 2 deletions .ci/scripts/test_llama.sh
Original file line number Diff line number Diff line change
Expand Up @@ -11,7 +11,7 @@ source "$(dirname "${BASH_SOURCE[0]}")/utils.sh"

MODEL_NAME=$1 # stories110M
BUILD_TOOL=$2 # buck2 or cmake
DTYPE=$3 # fp16 or fp32
DTYPE=$3 # fp16, bf16, or fp32
MODE=${4:-"xnnpack+custom"} # portable or xnnpack+custom or xnnpack+custom+qe
UPLOAD_DIR=${5:-}
if [[ $# -lt 4 ]]; then # Assuming 4 mandatory args
Expand All @@ -29,7 +29,7 @@ if [[ -z "${BUILD_TOOL:-}" ]]; then
fi

if [[ -z "${DTYPE:-}" ]]; then
echo "Missing dtype, choose fp16 or fp32, exiting..."
echo "Missing dtype, choose fp16, bf16, or fp32, exiting..."
exit 1
fi

Expand Down Expand Up @@ -174,6 +174,8 @@ fi
EXPORTED_MODEL_NAME="llama2"
if [[ "${DTYPE}" == "fp16" ]]; then
EXPORTED_MODEL_NAME="${EXPORTED_MODEL_NAME}_h"
elif [[ "${DTYPE}" == "bf16" ]]; then
EXPORTED_MODEL_NAME="${EXPORTED_MODEL_NAME}_bf"
elif [[ "${DTYPE}" == "fp32" ]]; then
:
else
Expand Down
7 changes: 7 additions & 0 deletions .github/workflows/pull.yml
Original file line number Diff line number Diff line change
Expand Up @@ -91,6 +91,13 @@ jobs:
dtype: [fp32]
build-tool: [buck2, cmake]
mode: [portable, xnnpack+custom, xnnpack+custom+qe]
include:
- dtype: bf16
build-tool: cmake
mode: portable
- dtype: bf16
build-tool: buck2
mode: portable
fail-fast: false
with:
runner: linux.2xlarge
Expand Down
3 changes: 3 additions & 0 deletions .github/workflows/trunk.yml
Original file line number Diff line number Diff line change
Expand Up @@ -224,6 +224,9 @@ jobs:
matrix:
dtype: [fp32]
mode: [portable, xnnpack+kv+custom, mps, coreml]
include:
- dtype: bf16
mode: portable
fail-fast: false
with:
runner: macos-m1-stable
Expand Down