guangyil committed on
Commit
13efdd4
·
verified ·
1 Parent(s): 750f337

Update infer.py

Browse files
Files changed (1) hide show
  1. infer.py +2 -2
infer.py CHANGED
@@ -50,10 +50,10 @@ def load_model(model_name, audio_tokenizer_path):
50
  use_flash_attention_2=True,
51
  use_cache=True,
52
  )
53
- model = model.to("cuda")
54
  tokenizer = AutoTokenizer.from_pretrained(model_name)
55
  tokenizer_voila = VoilaTokenizer(model_path=audio_tokenizer_path, device="cpu")
56
- tokenizer_voila.to("cuda")
57
  return model, tokenizer, tokenizer_voila, model_type
58
 
59
  def is_audio_output_task(task_type):
 
50
  use_flash_attention_2=True,
51
  use_cache=True,
52
  )
53
+ # model = model.to("cuda")
54
  tokenizer = AutoTokenizer.from_pretrained(model_name)
55
  tokenizer_voila = VoilaTokenizer(model_path=audio_tokenizer_path, device="cpu")
56
+ # tokenizer_voila.to("cuda")
57
  return model, tokenizer, tokenizer_voila, model_type
58
 
59
  def is_audio_output_task(task_type):