Spaces:
Paused
Paused
Update app.py
Browse files
app.py
CHANGED
@@ -13,11 +13,11 @@ print("TORCH_CUDA", torch.cuda.is_available())
|
|
13 |
|
14 |
print("loading model")
|
15 |
# Load the tokenizer and model
|
16 |
-
repo_name = "nvidia/Hymba-1.5B-Instruct"
|
|
|
17 |
|
18 |
tokenizer = AutoTokenizer.from_pretrained(repo_name, trust_remote_code=True)
|
19 |
-
|
20 |
-
model = AutoModelForCausalLM.from_pretrained("HuggingFaceTB/SmolLM2-1.7B-Instruct", trust_remote_code=True)
|
21 |
|
22 |
model = model.cuda().to(torch.bfloat16)
|
23 |
|
|
|
13 |
|
14 |
print("loading model")
|
15 |
# Load the tokenizer and model
|
16 |
+
# repo_name = "nvidia/Hymba-1.5B-Instruct"
|
17 |
+
repo_name = "HuggingFaceTB/SmolLM2-1.7B-Instruct"
|
18 |
|
19 |
tokenizer = AutoTokenizer.from_pretrained(repo_name, trust_remote_code=True)
|
20 |
+
model = AutoModelForCausalLM.from_pretrained(repo_name, trust_remote_code=True)
|
|
|
21 |
|
22 |
model = model.cuda().to(torch.bfloat16)
|
23 |
|