Spaces:

FractalAIResearch
/

Fathom-R1-14B

Running

App Files Community

FractalAIR committed on May 13

Commit

ae21a11

verified ·

1 Parent(s): ef5ddd1

Update app.py

Browse files

Files changed (1) hide show

app.py +4 -43

app.py CHANGED Viewed

@@ -16,26 +16,14 @@ client = OpenAI(
     api_key="hf_XXXXX"
 )
-from transformers import VisionEncoderDecoderModel, TrOCRProcessor
 from PIL import Image
-# Load the model and processor
-processor = TrOCRProcessor.from_pretrained("breezedeus/pix2text-mfr")
-model = VisionEncoderDecoderModel.from_pretrained("breezedeus/pix2text-mfr")
-model.eval()
 def image_to_latex(image_path):
     image = Image.open(image_path).convert("RGB")
-    pixel_values = processor(images=image, return_tensors="pt").pixel_values
-    with torch.no_grad():
-        generated_ids = model.generate(pixel_values)
-    generated_text = processor.batch_decode(generated_ids, skip_special_tokens=True)[0]
-    return generated_text
-def process_image(image):
-    latex_code = image_to_latex(image)
     return latex_code
 # Global dictionary to store all conversations: {id: {"title": str, "messages": list}}
 conversations = {}
@@ -109,28 +97,6 @@ def generate_response(user_message,
     yield new_history, new_history
-# OCR function using HF hosted model
-'''def extract_latex_from_image(image):
-    if image is None:
-        return gr.update(value="")
-    buffered = BytesIO()
-    image.save(buffered, format="PNG")
-    buffered.seek(0)
-    api_url = "https://api-inference.huggingface.co/models/harishkannaram/latex-ocr"
-    hf_token = os.getenv(HF_API)
-    headers = {"Authorization": f"Bearer {hf_token}"}
-    response = requests.post(api_url, headers=headers, files={"inputs": buffered})
-    if response.status_code == 200:
-        text = response.json().get("generated_text", "")
-        return gr.update(value=text)
-    else:
-        return gr.update(value="⚠️ OCR failed. Please try again.")
-'''
 example_messages = {
     "JEE Main 2025 Combinatorics": "From all the English alphabets, five letters are chosen and are arranged in alphabetical order. The total number of ways, in which the middle letter is 'M', is?",
@@ -198,17 +164,12 @@ with gr.Blocks(theme=gr.themes.Soft()) as demo:
                 with gr.Column():
                     submit_button = gr.Button("Send", variant="primary", scale=1)
                     clear_button = gr.Button("Clear", scale=1)
-            '''gr.Markdown("### Upload Image of a Math Question")
-            image_input = gr.Image(type="pil", label="Upload Image (PNG/JPG)", height=120)
-            ocr_button = gr.Button("Extract LaTeX from Image 🧠")
-            ocr_button.click(fn=extract_latex_from_image, inputs=image_input, outputs=user_input)'''
             with gr.Row():
                 image_input = gr.Image(type="filepath", label="Upload Image")
                 output_text = gr.Textbox(label="LaTeX Output")
             image_input.change(fn=process_image, inputs=image_input, outputs=output_text)
             gr.Markdown("**Try these examples:**")
             with gr.Row():

     api_key="hf_XXXXX"
 )
 from PIL import Image
+from pix2tex import cli as pix2tex
 def image_to_latex(image_path):
+    model = pix2tex.LatexOCR()
     image = Image.open(image_path).convert("RGB")
+    latex_code = model(image)
     return latex_code
 # Global dictionary to store all conversations: {id: {"title": str, "messages": list}}
 conversations = {}
     yield new_history, new_history
 example_messages = {
     "JEE Main 2025 Combinatorics": "From all the English alphabets, five letters are chosen and are arranged in alphabetical order. The total number of ways, in which the middle letter is 'M', is?",
                 with gr.Column():
                     submit_button = gr.Button("Send", variant="primary", scale=1)
                     clear_button = gr.Button("Clear", scale=1)
             with gr.Row():
                 image_input = gr.Image(type="filepath", label="Upload Image")
                 output_text = gr.Textbox(label="LaTeX Output")
             image_input.change(fn=process_image, inputs=image_input, outputs=output_text)
             gr.Markdown("**Try these examples:**")
             with gr.Row():