fffiloni committed on
Commit
ca1c374
·
1 Parent(s): 09780d3

Update app.py

Browse files
Files changed (1) hide show
  1. app.py +5 -5
app.py CHANGED
@@ -21,7 +21,7 @@ diffuser_pipeline = DiffusionPipeline.from_pretrained(
21
  speech_processor=processor,
22
  use_auth_token=MY_SECRET_TOKEN,
23
  revision="fp16",
24
- torch_dtype=torch.float16,
25
  )
26
 
27
  diffuser_pipeline.enable_attention_slicing()
@@ -34,10 +34,10 @@ audio_input = gr.Audio(source="microphone")
34
  image_output = gr.Image()
35
 
36
  def speech_to_text(audio_sample):
37
- text = audio_sample["text"].lower()
38
- print(text)
39
- speech_data = audio_sample["audio"]["array"]
40
- output = diffuser_pipeline(speech_data)
41
 
42
  return output.images[0]
43
 
 
21
  speech_processor=processor,
22
  use_auth_token=MY_SECRET_TOKEN,
23
  revision="fp16",
24
+ #torch_dtype=torch.float16,
25
  )
26
 
27
  diffuser_pipeline.enable_attention_slicing()
 
34
  image_output = gr.Image()
35
 
36
  def speech_to_text(audio_sample):
37
+ #text = audio_sample["text"].lower()
38
+ #print(text)
39
+ #speech_data = audio_sample["audio"]["array"]
40
+ output = diffuser_pipeline(audio_sample)
41
 
42
  return output.images[0]
43