Spaces:

prithivMLmods
/

DocScope-R1

Running on Zero

prithivMLmods committed on 11 days ago

Commit

281fc09

verified ·

1 Parent(s): a2f45ed

Update app.py

Files changed (1) hide show

app.py CHANGED Viewed

@@ -103,6 +103,7 @@ MODEL_ID_M = "nvidia/Cosmos-Reason1-7B"
 processor_m = AutoProcessor.from_pretrained(MODEL_ID_M, trust_remote_code=True)
 model_m = Qwen2_5_VLForConditionalGeneration.from_pretrained(
     MODEL_ID_M,
     trust_remote_code=True,
     torch_dtype=torch.float16
 ).to(device).eval()
@@ -112,6 +113,7 @@ MODEL_ID_X = "prithivMLmods/docscopeOCR-7B-050425-exp"
 processor_x = AutoProcessor.from_pretrained(MODEL_ID_X, trust_remote_code=True)
 model_x = Qwen2_5_VLForConditionalGeneration.from_pretrained(
     MODEL_ID_X,
     trust_remote_code=True,
     torch_dtype=torch.float16
 ).to(device).eval()
@@ -121,6 +123,7 @@ MODEL_ID_Z = "Ertugrul/Qwen2.5-VL-7B-Captioner-Relaxed"
 processor_z = AutoProcessor.from_pretrained(MODEL_ID_Z, trust_remote_code=True)
 model_z = Qwen2_5_VLForConditionalGeneration.from_pretrained(
     MODEL_ID_Z,
     trust_remote_code=True,
     torch_dtype=torch.float16
 ).to(device).eval()
@@ -130,6 +133,7 @@ MODEL_ID_V = "prithivMLmods/visionOCR-3B-061125"
 processor_v = AutoProcessor.from_pretrained(MODEL_ID_V, trust_remote_code=True)
 model_v = Qwen2_5_VLForConditionalGeneration.from_pretrained(
     MODEL_ID_V,
     trust_remote_code=True,
     torch_dtype=torch.float16
 ).to(device).eval()

 processor_m = AutoProcessor.from_pretrained(MODEL_ID_M, trust_remote_code=True)
 model_m = Qwen2_5_VLForConditionalGeneration.from_pretrained(
     MODEL_ID_M,
+    attn_implementation="flash_attention_2",
     trust_remote_code=True,
     torch_dtype=torch.float16
 ).to(device).eval()
 processor_x = AutoProcessor.from_pretrained(MODEL_ID_X, trust_remote_code=True)
 model_x = Qwen2_5_VLForConditionalGeneration.from_pretrained(
     MODEL_ID_X,
+    attn_implementation="flash_attention_2",
     trust_remote_code=True,
     torch_dtype=torch.float16
 ).to(device).eval()
 processor_z = AutoProcessor.from_pretrained(MODEL_ID_Z, trust_remote_code=True)
 model_z = Qwen2_5_VLForConditionalGeneration.from_pretrained(
     MODEL_ID_Z,
+    attn_implementation="flash_attention_2",
     trust_remote_code=True,
     torch_dtype=torch.float16
 ).to(device).eval()
 processor_v = AutoProcessor.from_pretrained(MODEL_ID_V, trust_remote_code=True)
 model_v = Qwen2_5_VLForConditionalGeneration.from_pretrained(
     MODEL_ID_V,
+    attn_implementation="flash_attention_2",
     trust_remote_code=True,
     torch_dtype=torch.float16
 ).to(device).eval()