Update app.py
Browse files
app.py
CHANGED
@@ -13,13 +13,13 @@ from pydantic import BaseModel
13      hf_login(token=os.getenv("HF_TOKEN"))
14
15      model_name = "meta-llama/Llama-3.2-1B-Instruct"
16  -   model_name = "gregorlied/Llama-3.2-1B-Instruct-Medical-Report-Summarization"
17      device = 'cuda' if torch.cuda.is_available() else 'cpu'
18
19      model = AutoModelForCausalLM.from_pretrained(
20          model_name,
21          device_map="auto",
22  -       torch_dtype=torch.bfloat16,
23          attn_implementation='eager',
24          trust_remote_code=True,
25      )
@@ -93,10 +93,10 @@ Please extract relevant clinical information from the report.
93      def summarize(text):
94          if not text.strip():
95              return "Please enter some text to summarize."
96  -
97          messages = [
98  -           {"role": "system", "content": prompt},
99  -           {"role": "user", "content": text},
100         ]
101
102         model_inputs = tokenizer([text], return_tensors="pt").to(device)
|
|
13      hf_login(token=os.getenv("HF_TOKEN"))
14
15      model_name = "meta-llama/Llama-3.2-1B-Instruct"
16  +   model_name = "gregorlied/Llama-3.2-1B-Instruct-Medical-Report-Summarization-FP32"
17      device = 'cuda' if torch.cuda.is_available() else 'cpu'
18
19      model = AutoModelForCausalLM.from_pretrained(
20          model_name,
21          device_map="auto",
22  +       # torch_dtype=torch.bfloat16,
23          attn_implementation='eager',
24          trust_remote_code=True,
25      )
|
|
93      def summarize(text):
94          if not text.strip():
95              return "Please enter some text to summarize."
96  +
97          messages = [
98  +           {"role": "system", "content": prompt.strip()},
99  +           {"role": "user", "content": text.strip()},
100         ]
101
102         model_inputs = tokenizer([text], return_tensors="pt").to(device)