Spaces:

eswardivi
/

phi-4

Running on Zero

eswardivi committed on Apr 18, 2024

Commit

ac6fdaf

verified ·

1 Parent(s): ad891da

Update app.py

Files changed (1) hide show

app.py CHANGED Viewed

@@ -18,9 +18,9 @@ quantization_config = BitsAndBytesConfig(
 )
 model = AutoModelForCausalLM.from_pretrained(
-    "google/gemma-1.1-7b-it", quantization_config=quantization_config, token=token
 )
-tok = AutoTokenizer.from_pretrained("google/gemma-1.1-7b-it", token=token)
 if torch.cuda.is_available():
     device = torch.device("cuda")
@@ -104,5 +104,6 @@ demo = gr.ChatInterface(
     ],
     stop_btn="Stop Generation",
     title="Chat With LLMs",
 )
 demo.launch()

 )
 model = AutoModelForCausalLM.from_pretrained(
+    "meta-llama/Meta-Llama-3-70B-Instruct", quantization_config=quantization_config, token=token
 )
+tok = AutoTokenizer.from_pretrained("meta-llama/Meta-Llama-3-70B-Instruct", token=token)
 if torch.cuda.is_available():
     device = torch.device("cuda")
     ],
     stop_btn="Stop Generation",
     title="Chat With LLMs",
+    description="Now Running ![meta-llama/Meta-Llama-3-70B-Instruct](https://huggingface.co/meta-llama/Meta-Llama-3-70B-Instruct) in 4bit"
 )
 demo.launch()