Spaces: Running on Zero
Update infer.py
Browse files
infer.py
CHANGED
@@ -50,10 +50,10 @@ def load_model(model_name, audio_tokenizer_path):
|
|
50 |
use_flash_attention_2=True,
|
51 |
use_cache=True,
|
52 |
)
|
53 |
-
model = model.to("cuda")
|
54 |
tokenizer = AutoTokenizer.from_pretrained(model_name)
|
55 |
tokenizer_voila = VoilaTokenizer(model_path=audio_tokenizer_path, device="cpu")
|
56 |
-
tokenizer_voila.to("cuda")
|
57 |
return model, tokenizer, tokenizer_voila, model_type
|
58 |
|
59 |
def is_audio_output_task(task_type):
|
|
|
50 |
use_flash_attention_2=True,
|
51 |
use_cache=True,
|
52 |
)
|
53 |
+
# model = model.to("cuda")
|
54 |
tokenizer = AutoTokenizer.from_pretrained(model_name)
|
55 |
tokenizer_voila = VoilaTokenizer(model_path=audio_tokenizer_path, device="cpu")
|
56 |
+
# tokenizer_voila.to("cuda")
|
57 |
return model, tokenizer, tokenizer_voila, model_type
|
58 |
|
59 |
def is_audio_output_task(task_type):
|