diff --git a/processing_kimi_vl.py b/processing_kimi_vl.py index 93c71ad..de279ec 100644 --- a/processing_kimi_vl.py +++ b/processing_kimi_vl.py @@ -22,7 +22,7 @@ from typing import List, Union from transformers.feature_extraction_utils import BatchFeature from transformers.image_utils import ImageInput -from transformers.processing_utils import ProcessingKwargs, ProcessorMixin, Unpack, _validate_images_text_input_order +from transformers.processing_utils import ProcessingKwargs, ProcessorMixin, Unpack from transformers.tokenization_utils_base import PreTokenizedInput, TextInput from transformers.utils import logging @@ -110,8 +110,6 @@ class KimiVLProcessor(ProcessorMixin): if images is None and text is None: raise ValueError("You have to specify at least one of `images` or `text`.") - # check if images and text inputs are reversed for BC - images, text = _validate_images_text_input_order(images, text) output_kwargs = self._merge_kwargs( KimiVLProcessorKwargs,