Remove global torch import in llm_inference_utils.py (mlflow#11115)

Signed-off-by: B-Step62 <yuki.watanabe@databricks.com> Signed-off-by: Arthur Jenoudet <arthur.jenoudet@databricks.com>
artjen · Mar 26, 2024 · b1ca2e6 · b1ca2e6
1 parent e242f7b
commit b1ca2e6
Showing 1 changed file with 6 additions and 2 deletions.
diff --git a/mlflow/transformers/llm_inference_utils.py b/mlflow/transformers/llm_inference_utils.py
@@ -1,9 +1,10 @@
+from __future__ import annotations
+
 import time
 import uuid
-from typing import Any, Dict, List, Optional, Tuple, Union
+from typing import TYPE_CHECKING, Any, Dict, List, Optional, Tuple, Union
 
 import pandas as pd
-import torch
 from transformers import AutoTokenizer, StoppingCriteria
 
 from mlflow.exceptions import MlflowException
@@ -15,6 +16,9 @@
     COMPLETIONS_MODEL_OUTPUT_SCHEMA,
 )
 
+if TYPE_CHECKING:
+    import torch
+
 _LLM_INFERENCE_TASK_KEY = "inference_task"
 # The LLM inference task is saved as "task" in the metadata for forward compatibility with
 # future Databricks Provisioned Throughput support of more model architectures for inference.