Commit · fad9e5e1
Parent(s): 0fcb40c

full prec
- app.py +0 -2
- requirements.txt +1 -0
app.py
CHANGED
@@ -18,10 +18,8 @@ def load_model():
         model = AutoModelForCausalLM.from_pretrained(
             "omi-health/sum-small",
             trust_remote_code=False,
-            torch_dtype=torch.float16,  # Half precision
             device_map="auto"  # Let the library decide best device mapping
         )
-        print(f"Model loaded with float16 precision on GPU")
         print(f"GPU: {torch.cuda.get_device_name(0)}")
         print(f"Memory allocated: {torch.cuda.memory_allocated(0) / 1024**2:.2f} MB")
     else:
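Net effect of the change, as a minimal sketch of load_model() after this commit. The imports, the CUDA availability check, the CPU fallback body, and the return statement are assumptions inferred from the hunk (only the trailing "else:" is visible in the diff), not the actual file contents:

import torch
from transformers import AutoModelForCausalLM

def load_model():
    # Assumed guard: the "else:" in the hunk suggests a CUDA check like this.
    if torch.cuda.is_available():
        # With no torch_dtype argument, transformers loads the weights in its
        # default full (float32) precision instead of float16 ("full prec").
        model = AutoModelForCausalLM.from_pretrained(
            "omi-health/sum-small",
            trust_remote_code=False,
            device_map="auto",  # Let the library decide best device mapping
        )
        print(f"GPU: {torch.cuda.get_device_name(0)}")
        print(f"Memory allocated: {torch.cuda.memory_allocated(0) / 1024**2:.2f} MB")
    else:
        # CPU fallback branch; its real body lies outside the diff hunk.
        model = AutoModelForCausalLM.from_pretrained(
            "omi-health/sum-small",
            trust_remote_code=False,
        )
    return model  # assumed; the hunk does not show how the model is handed back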
requirements.txt
CHANGED
@@ -2,3 +2,4 @@
 torch
 transformers>=4.36.0
 gradio>=3.50.0
+accelerate
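The new accelerate entry pairs with the device_map="auto" argument kept in app.py: transformers dispatches weights across devices through accelerate and raises an error in from_pretrained() when it is missing. A quick, illustrative sanity check that the added dependency resolves in the Space's environment:

# Confirm accelerate is importable before the app calls from_pretrained().
import accelerate
print(accelerate.__version__)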