diff --git a/gptqmodel/utils/looper_helpers.py b/gptqmodel/utils/looper_helpers.py index b77e4e8bd..0801707b8 100644 --- a/gptqmodel/utils/looper_helpers.py +++ b/gptqmodel/utils/looper_helpers.py @@ -24,7 +24,7 @@ from ..utils.torch import ALL_DEVICES, CPU, torch_sync -USE_TORCH_REPLICATE = env_flag("GPTQMODEL_USE_TORCH_REPLICATE", True) +USE_TORCH_REPLICATE = env_flag("GPTQMODEL_USE_TORCH_REPLICATE", False) _THREAD_SAFE_PARALLEL = ThreadSafe(torch_parallel)