oberbics committed
Commit 90d7012 · verified · 1 Parent(s): d446745

Update app.py

Files changed (1): app.py +31 -36
app.py CHANGED
@@ -1,57 +1,52 @@
 import gradio as gr
-import torch
 import json
-from transformers import AutoModelForCausalLM, AutoTokenizer
+import requests
+import os
 
-# Initialize model with error handling
-try:
-    tokenizer = AutoTokenizer.from_pretrained("numind/NuExtract-1.5")
-    model = AutoModelForCausalLM.from_pretrained(
-        "numind/NuExtract-1.5",
-        device_map="auto",
-        torch_dtype=torch.float16,
-        trust_remote_code=True
-    )
-    MODEL_LOADED = True
-    print("Model loaded successfully!")
-except Exception as e:
-    MODEL_LOADED = False
-    print(f"Model loading failed: {e}")
+# Use the Hugging Face Inference API instead of loading the model
+API_URL = "https://api-inference.huggingface.co/models/numind/NuExtract-1.5"
+headers = {"Authorization": f"Bearer {os.environ.get('HF_TOKEN', '')}"}
 
 def test_function(template, text):
     print(f"Test function called with template: {template[:30]} and text: {text[:30]}")
     return "Button clicked successfully", "Function was called"
 
 def extract_info(template, text):
-    if not MODEL_LOADED:
-        return "❌ Model not loaded", "{}"
-
     try:
         # Format prompt according to NuExtract-1.5 requirements
         prompt = f"<|input|>\n### Template:\n{template}\n### Text:\n{text}\n\n<|output|>"
         print(f"Processing with prompt: {prompt[:100]}...")
 
-        # Tokenize
-        inputs = tokenizer(prompt, return_tensors="pt").to(model.device)
+        # Call API instead of using local model
+        payload = {
+            "inputs": prompt,
+            "parameters": {
+                "max_new_tokens": 1000,
+                "do_sample": False
+            }
+        }
+
+        print("Calling API...")
+        response = requests.post(API_URL, headers=headers, json=payload)
 
-        # Generate with cache disabled
-        print("Generating output...")
-        outputs = model.generate(
-            **inputs,
-            max_new_tokens=1000,
-            do_sample=False,
-            use_cache=False  # This disables the problematic cache
-        )
+        if response.status_code != 200:
+            print(f"API error: {response.status_code}, {response.text}")
+            return f"❌ API Error: {response.status_code}", response.text
 
-        # Decode and extract result
-        print("Decoding output...")
-        result = tokenizer.decode(outputs[0], skip_special_tokens=True)
+        # Process result
+        result = response.json()
+
+        # Handle different response formats
+        if isinstance(result, list) and len(result) > 0:
+            result_text = result[0].get("generated_text", "")
+        else:
+            result_text = str(result)
 
-        # Split at output marker
-        if "<|output|>" in result:
-            json_text = result.split("<|output|>")[1].strip()
+        # Split at output marker if present
+        if "<|output|>" in result_text:
+            json_text = result_text.split("<|output|>")[1].strip()
         else:
-            json_text = result
+            json_text = result_text
 
         # Try to parse as JSON
         print("Parsing JSON...")