fredaddy
/

MiniCPM-v-2_6

Image-Text-to-Text

feature-extraction

Model card · Files and versions

fredaddy committed on Sep 16, 2024

Commit

e56d8f8

·

verified ·

1 Parent(s): cd5795f

Update handler.py

Files changed (1) hide show

handler.py +3 -3

handler.py CHANGED Viewed

@@ -6,18 +6,18 @@ class ModelHandler:
     def __init__(self):
         # Load the model and tokenizer with appropriate weights
         self.model = AutoModel.from_pretrained(
-            'openbmb/MiniCPM-V-2_6',
             trust_remote_code=True,
             attn_implementation='sdpa',
             torch_dtype=torch.bfloat16
         ).eval().cuda()
-        self.tokenizer = AutoTokenizer.from_pretrained('openbmb/MiniCPM-V-2_6', trust_remote_code=True)
     def preprocess(self, inputs):
         # Preprocess image input
         image = Image.open(inputs['image'].file).convert('RGB')
-        question = inputs.get("question", "What is in the image?")
         msgs = [{'role': 'user', 'content': [image, question]}]
         return msgs

     def __init__(self):
         # Load the model and tokenizer with appropriate weights
         self.model = AutoModel.from_pretrained(
+            'fredaddy/MiniCPM-V-2_6',
             trust_remote_code=True,
             attn_implementation='sdpa',
             torch_dtype=torch.bfloat16
         ).eval().cuda()
+        self.tokenizer = AutoTokenizer.from_pretrained('fredaddy/MiniCPM-V-2_6', trust_remote_code=True)
     def preprocess(self, inputs):
         # Preprocess image input
         image = Image.open(inputs['image'].file).convert('RGB')
+        question = inputs.get("question", "Extract all data in the image. Be extremely careful to ensure that you don't miss anything. It's imperative that you extract and digitize everything on that page.")
         msgs = [{'role': 'user', 'content': [image, question]}]
         return msgs