diff --git a/swift/llm/template/template/emu3.py b/swift/llm/template/template/emu3.py index 47cf7d421c..fb0ca1d42f 100644 --- a/swift/llm/template/template/emu3.py +++ b/swift/llm/template/template/emu3.py @@ -27,8 +27,10 @@ class Emu3GenTemplate(Template): 'lowres, bad anatomy, bad hands, text, error, missing fingers, extra digit, fewer digits, cropped, ' 'worst quality, low quality, normal quality, jpeg artifacts, signature, watermark, username, blurry.') - def __init__(self, *args, **kwargs): - super().__init__(*args, **kwargs) + def init_processor(self, processor) -> None: + if processor is None: + return + super().init_processor(processor) self.bov = self.processor.tokenizer.encode(self.processor.visual_template[0].format(token_id=0))[0] self.eov = self.processor.tokenizer.encode(self.processor.visual_template[0].format(token_id=self.COOKBOOK_SIZE - 1))[0] diff --git a/swift/llm/template/template/qwen.py b/swift/llm/template/template/qwen.py index 6dc57663a6..e84997ffe4 100644 --- a/swift/llm/template/template/qwen.py +++ b/swift/llm/template/template/qwen.py @@ -408,8 +408,10 @@ class Qwen2_5OmniTemplate(Qwen2_5VLTemplate): version = 'omni' placeholder_tokens = ['<|IMAGE|>', '<|AUDIO|>', '<|VIDEO|>'] - def __init__(self, *args, **kwargs): - super().__init__(*args, **kwargs) + def init_processor(self, processor) -> None: + if processor is None: + return + super().init_processor(processor) from transformers.models.qwen2_5_omni.processing_qwen2_5_omni import Qwen2_5OmniProcessorKwargs default = Qwen2_5OmniProcessorKwargs._defaults self.seconds_per_chunk = default['videos_kwargs']['seconds_per_chunk']