diff --git a/.ci/scripts/gather_test_models.py b/.ci/scripts/gather_test_models.py index b32a052026a..3f22d7699de 100755 --- a/.ci/scripts/gather_test_models.py +++ b/.ci/scripts/gather_test_models.py @@ -33,7 +33,7 @@ "dl3": "linux.4xlarge.memory", "emformer_join": "linux.4xlarge.memory", "emformer_predict": "linux.4xlarge.memory", - "phi-4-mini": "linux.4xlarge.memory", + "phi_4_mini": "linux.4xlarge.memory", } } diff --git a/.ci/scripts/test_model.sh b/.ci/scripts/test_model.sh index 51e81e62a9f..cd543ff1424 100755 --- a/.ci/scripts/test_model.sh +++ b/.ci/scripts/test_model.sh @@ -100,11 +100,11 @@ test_model() { rm "./${MODEL_NAME}.pte" return # Skip running with portable executor runnner since portable doesn't support Qwen's biased linears. fi - if [[ "${MODEL_NAME}" == "phi-4-mini" ]]; then + if [[ "${MODEL_NAME}" == "phi_4_mini" ]]; then # Install requirements for export_llama bash examples/models/llama/install_requirements.sh # Test export_llama script: python3 -m examples.models.llama.export_llama. - "${PYTHON_EXECUTABLE}" -m examples.models.llama.export_llama --model "${MODEL_NAME}" -c examples/models/llama/params/demo_rand_params.pth -p examples/models/phi-4-mini/config.json + "${PYTHON_EXECUTABLE}" -m examples.models.llama.export_llama --model "${MODEL_NAME}" -c examples/models/llama/params/demo_rand_params.pth -p examples/models/phi_4_mini/config.json run_portable_executor_runner rm "./${MODEL_NAME}.pte" return diff --git a/.github/workflows/pull.yml b/.github/workflows/pull.yml index 81948e4e827..9a2221b3aac 100644 --- a/.github/workflows/pull.yml +++ b/.github/workflows/pull.yml @@ -106,7 +106,7 @@ jobs: - model: emformer_join backend: xnnpack-quantization-delegation runner: linux.4xlarge.memory - - model: phi-4-mini + - model: phi_4_mini backend: portable runner: linux.4xlarge.memory - model: llama3_2_vision_encoder diff --git a/.github/workflows/trunk.yml b/.github/workflows/trunk.yml index ecae932b74f..829d8fd88f4 100644 --- a/.github/workflows/trunk.yml +++ b/.github/workflows/trunk.yml @@ -72,7 +72,7 @@ jobs: backend: portable - model: softmax backend: portable - - model: phi-4-mini + - model: phi_4_mini backend: portable - model: qwen2_5 backend: portable diff --git a/examples/models/__init__.py b/examples/models/__init__.py index 80ba6801a6c..41ec5c3aac6 100644 --- a/examples/models/__init__.py +++ b/examples/models/__init__.py @@ -36,7 +36,7 @@ class Model(str, Enum): Llava = "llava" EfficientSam = "efficient_sam" Qwen25 = "qwen2_5" - Phi4Mini = "phi-4-mini" + Phi4Mini = "phi_4_mini" def __str__(self) -> str: return self.value @@ -80,7 +80,7 @@ def __str__(self) -> str: str(Model.Llava): ("llava", "LlavaModel"), str(Model.EfficientSam): ("efficient_sam", "EfficientSAM"), str(Model.Qwen25): ("qwen2_5", "Qwen2_5Model"), - str(Model.Phi4Mini): ("phi-4-mini", "Phi4MiniModel"), + str(Model.Phi4Mini): ("phi_4_mini", "Phi4MiniModel"), } __all__ = [ diff --git a/examples/models/llama/export_llama_lib.py b/examples/models/llama/export_llama_lib.py index 1620924f4f6..c7603108ccf 100644 --- a/examples/models/llama/export_llama_lib.py +++ b/examples/models/llama/export_llama_lib.py @@ -95,7 +95,7 @@ "llama3_2", "static_llama", "qwen2_5", - "phi-4-mini", + "phi_4_mini", "smollm2", ] TORCHTUNE_DEFINED_MODELS = ["llama3_2_vision"] diff --git a/examples/models/phi-4-mini/README.md b/examples/models/phi_4_mini/README.md similarity index 100% rename from examples/models/phi-4-mini/README.md rename to examples/models/phi_4_mini/README.md diff --git a/examples/models/phi-4-mini/__init__.py b/examples/models/phi_4_mini/__init__.py similarity index 100% rename from examples/models/phi-4-mini/__init__.py rename to examples/models/phi_4_mini/__init__.py diff --git a/examples/models/phi-4-mini/config.json b/examples/models/phi_4_mini/config.json similarity index 100% rename from examples/models/phi-4-mini/config.json rename to examples/models/phi_4_mini/config.json diff --git a/examples/models/phi-4-mini/convert_weights.py b/examples/models/phi_4_mini/convert_weights.py similarity index 100% rename from examples/models/phi-4-mini/convert_weights.py rename to examples/models/phi_4_mini/convert_weights.py