diff --git a/clients/python/llmengine/data_types.py b/clients/python/llmengine/data_types.py index b3fcbf58..cb7ad263 100644 --- a/clients/python/llmengine/data_types.py +++ b/clients/python/llmengine/data_types.py @@ -29,7 +29,7 @@ class GpuType(str, Enum): NVIDIA_TESLA_T4 = "nvidia-tesla-t4" NVIDIA_AMPERE_A10 = "nvidia-ampere-a10" - NVIDIA_AMPERE_A100 = "nvidia-a100" + NVIDIA_AMPERE_A100 = "nvidia-ampere-a100" class ModelEndpointType(str, Enum): diff --git a/server/llm_engine_server/domain/entities/gpu_type.py b/server/llm_engine_server/domain/entities/gpu_type.py index 99cfd1b4..a8c4ade4 100644 --- a/server/llm_engine_server/domain/entities/gpu_type.py +++ b/server/llm_engine_server/domain/entities/gpu_type.py @@ -6,4 +6,4 @@ class GpuType(str, Enum): NVIDIA_TESLA_T4 = "nvidia-tesla-t4" NVIDIA_AMPERE_A10 = "nvidia-ampere-a10" - NVIDIA_AMPERE_A100 = "nvidia-a100" + NVIDIA_AMPERE_A100 = "nvidia-ampere-a100" diff --git a/server/tests/unit/common/test_batch_jobs_dtos.py b/server/tests/unit/common/test_batch_jobs_dtos.py index b5f704f0..f6eb384e 100644 --- a/server/tests/unit/common/test_batch_jobs_dtos.py +++ b/server/tests/unit/common/test_batch_jobs_dtos.py @@ -24,10 +24,10 @@ def test_create_docker_image_batch_job_resource_requests_merge_requests(): # Test merging default = CreateDockerImageBatchJobResourceRequests(cpus=0.5) override = CreateDockerImageBatchJobResourceRequests( - memory="100Mi", gpus=1, gpu_type="nvidia-a100", storage="10Gi" + memory="100Mi", gpus=1, gpu_type="nvidia-ampere-a100", storage="10Gi" ) expected = CreateDockerImageBatchJobResourceRequests( - cpus=0.5, memory="100Mi", gpus=1, gpu_type="nvidia-a100", storage="10Gi" + cpus=0.5, memory="100Mi", gpus=1, gpu_type="nvidia-ampere-a100", storage="10Gi" ) actual = CreateDockerImageBatchJobResourceRequests.merge_requests(default, override) assert expected == actual