OpenGVLab
/

VideoChat-Flash-Qwen2_5-2B_res448

Video-Text-to-Text

videochat_flash_qwen

feature-extraction

Eval Results (legacy)

Model card · Files and versions

lixinhao committed on Mar 4, 2025

Commit

67ffd65

·

verified ·

1 Parent(s): 6e39ace

Update README.md

Files changed (1) hide show

README.md +1 -1

README.md CHANGED Viewed

@@ -114,7 +114,7 @@ from transformers import AutoModel, AutoTokenizer
 model_path = 'OpenGVLab/VideoChat-Flash-Qwen2_5-2B_res448'
 tokenizer = AutoTokenizer.from_pretrained(model_path, trust_remote_code=True)
-model = AutoModel.from_pretrained(model_path, trust_remote_code=True).half().cuda()
 image_processor = model.get_vision_tower().image_processor
 mm_llm_compress = False # use the global compress or not

 model_path = 'OpenGVLab/VideoChat-Flash-Qwen2_5-2B_res448'
 tokenizer = AutoTokenizer.from_pretrained(model_path, trust_remote_code=True)
+model = AutoModel.from_pretrained(model_path, trust_remote_code=True).to(torch.bfloat16).cuda()
 image_processor = model.get_vision_tower().image_processor
 mm_llm_compress = False # use the global compress or not