configuration_dots.py CHANGED
@@ -3,6 +3,7 @@ from transformers.configuration_utils import PretrainedConfig
3
  from transformers.models.qwen2 import Qwen2Config
4
  from transformers import Qwen2_5_VLProcessor, AutoProcessor
5
  from transformers.models.auto.configuration_auto import CONFIG_MAPPING
 
6
 
7
 
8
  class DotsVisionConfig(PretrainedConfig):
@@ -68,7 +69,8 @@ class DotsOCRConfig(Qwen2Config):
68
 
69
  class DotsVLProcessor(Qwen2_5_VLProcessor):
70
  def __init__(self, image_processor=None, tokenizer=None, chat_template=None, **kwargs):
71
- super().__init__(image_processor, tokenizer, chat_template=chat_template)
 
72
  self.image_token = "<|imgpad|>" if not hasattr(tokenizer, "image_token") else tokenizer.image_token
73
 
74
 
 
3
  from transformers.models.qwen2 import Qwen2Config
4
  from transformers import Qwen2_5_VLProcessor, AutoProcessor
5
  from transformers.models.auto.configuration_auto import CONFIG_MAPPING
6
+ from transformers.video_processing_utils import BaseVideoProcessor
7
 
8
 
9
  class DotsVisionConfig(PretrainedConfig):
 
69
 
70
class DotsVLProcessor(Qwen2_5_VLProcessor):
    """Image-only processor for the Dots OCR model, built on Qwen2.5-VL.

    Newer transformers releases require a ``video_processor`` argument in the
    Qwen2.5-VL processor ``__init__``; since Dots OCR handles images only, a
    placeholder ``BaseVideoProcessor`` is supplied to satisfy that contract.
    """

    def __init__(self, image_processor=None, tokenizer=None, chat_template=None, **kwargs):
        """Initialize the processor.

        Args:
            image_processor: Image preprocessor passed through to the base class.
            tokenizer: Tokenizer; if it defines ``image_token``, that token is
                used, otherwise the Dots default ``<|imgpad|>``.
            chat_template: Optional chat template forwarded to the base class.
            **kwargs: Accepted for interface compatibility; not forwarded
                (matches the original behavior — TODO confirm this is intended).
        """
        # Placeholder video processor: Dots OCR never processes video, but the
        # base __init__ signature expects one in recent transformers versions.
        placeholder_video_processor = BaseVideoProcessor()
        super().__init__(
            image_processor,
            tokenizer,
            video_processor=placeholder_video_processor,
            chat_template=chat_template,
        )
        # Prefer the tokenizer's own image token when it provides one.
        if hasattr(tokenizer, "image_token"):
            self.image_token = tokenizer.image_token
        else:
            self.image_token = "<|imgpad|>"
75
 
76
 
preprocessor_config.json CHANGED
@@ -1,4 +1,7 @@
1
  {
 
 
 
2
  "min_pixels": 3136,
3
  "max_pixels": 11289600,
4
  "patch_size": 14,
 
1
  {
2
+ "auto_map": {
3
+ "AutoProcessor": "configuration_dots.DotsVLProcessor"
4
+ },
5
  "min_pixels": 3136,
6
  "max_pixels": 11289600,
7
  "patch_size": 14,