diff --git a/requirements/framework.txt b/requirements/framework.txt index d59049c768..e6127654e4 100644 --- a/requirements/framework.txt +++ b/requirements/framework.txt @@ -35,6 +35,6 @@ tiktoken tqdm transformers>=4.33,<4.58 transformers_stream_generator -trl>=0.15,<0.21 +trl>=0.15,<0.24 uvicorn zstandard diff --git a/swift/llm/infer/infer_engine/sglang_engine.py b/swift/llm/infer/infer_engine/sglang_engine.py index 1033b1509a..dd78d0b651 100644 --- a/swift/llm/infer/infer_engine/sglang_engine.py +++ b/swift/llm/infer/infer_engine/sglang_engine.py @@ -73,13 +73,14 @@ def __init__( parameters = inspect.signature(ServerArgs).parameters if 'pp_size' in parameters: engine_kwargs['pp_size'] = pp_size + if 'enable_ep_moe' in parameters: + engine_kwargs['enable_ep_moe'] = enable_ep_moe self.server_args = ServerArgs( model_path=self.model_dir, dtype=self.model_info.torch_dtype, tp_size=tp_size, dp_size=dp_size, ep_size=ep_size, - enable_ep_moe=enable_ep_moe, mem_fraction_static=mem_fraction_static, context_length=context_length, disable_cuda_graph=disable_cuda_graph, diff --git a/swift/llm/train/tuner.py b/swift/llm/train/tuner.py index bfa6b2b565..9c3990e403 100644 --- a/swift/llm/train/tuner.py +++ b/swift/llm/train/tuner.py @@ -316,6 +316,8 @@ def prepare_adapter(args: TrainArguments, model, *, template=None, train_dataset ) logger.info(f'bone config: {bone_config}') model = Swift.prepare_model(model, bone_config) + else: + raise ValueError(f'Unknown train_type: {args.train_type}') return model