MLLMerging
Collection
23 items
•
Updated
•
2
This is a LoRA adapter for Qwen2.5-VL-32B, fine-tuned on optical character recognition (OCR) tasks.
from transformers import AutoModelForVision2Seq, AutoProcessor
from peft import PeftModel
# Repo IDs are named once so the model and its processor always come from the
# same base checkpoint.
# NOTE(review): confirm that BASE_MODEL_ID resolves on the Hub and matches the
# base_model_name_or_path recorded in the adapter's adapter_config.json.
BASE_MODEL_ID = "Qwen/Qwen2.5-VL-32B"
ADAPTER_ID = "yongxianwei/Qwen2.5-VL-32B-OCR"

# Load base model
# torch_dtype="auto" keeps the precision stored in the checkpoint instead of
# the float32 default, and device_map="auto" lets the weights be dispatched
# across the available devices; a 32B-parameter model is impractical to load
# with the defaults.
base_model = AutoModelForVision2Seq.from_pretrained(
    BASE_MODEL_ID,
    torch_dtype="auto",
    device_map="auto",
    trust_remote_code=True,
)
# Load LoRA adapter (wraps the base model; adapter weights come from ADAPTER_ID)
model = PeftModel.from_pretrained(base_model, ADAPTER_ID)
# The processor is loaded from the base repo, not the adapter repo.
processor = AutoProcessor.from_pretrained(BASE_MODEL_ID, trust_remote_code=True)
# Inference
# ... your inference code ...
Fine-tuned using LoRA on specific Optical Character Recognition datasets.
@misc{qwen2.5-vl-ocr,
author = {Yongxian Wei},
title = {Qwen2.5-VL LoRA for Optical Character Recognition},
year = {2024},
publisher = {Hugging Face},
url = {https://huggingface.co/yongxianwei/Qwen2.5-VL-32B-OCR}
}