Spaces:

justus-tobias
/

Moshi

Paused

justus-tobias committed on Sep 27, 2024

Commit

5b7c5f9

1 Parent(s): 8d2f8c3

tested error handling

Files changed (1) hide show

app.py CHANGED Viewed

@@ -35,17 +35,21 @@ def process_wav_new(wav):
     lm_gen = LMGen(moshi, temp=0.8, temp_text=0.7)  # this handles sampling params etc.
     out_wav_chunks = []
-    # Now we will stream over both Moshi I/O, and decode on the fly with Mimi.
-    with torch.no_grad(), lm_gen.streaming(1), mimi.streaming(1):
-        for idx, code in enumerate(all_codes):
-            # print("CODE: ", code.shape)
-            tokens_out = lm_gen.step(code.to(device))
-            # tokens_out is [B, 1 + 8, 1], with tokens_out[:, 1] representing the text token.
-            if tokens_out is not None:
-                wav_chunk = mimi.decode(tokens_out[:, 1:])
-                out_wav_chunks.append(wav_chunk)
-            print(idx, end='\r')
-    # out_wav = torch.cat(out_wav_chunks, dim=-1)
     return torch.cat(out_wav_chunks, dim=-1)

     lm_gen = LMGen(moshi, temp=0.8, temp_text=0.7)  # this handles sampling params etc.
     out_wav_chunks = []
+    try:
+        # Now we will stream over both Moshi I/O, and decode on the fly with Mimi.
+        with torch.no_grad(), lm_gen.streaming(1), mimi.streaming(1):
+            for idx, code in enumerate(all_codes):
+                # print("CODE: ", code.shape)
+                tokens_out = lm_gen.step(code.to(device))
+                # tokens_out is [B, 1 + 8, 1], with tokens_out[:, 1] representing the text token.
+                if tokens_out is not None:
+                    wav_chunk = mimi.decode(tokens_out[:, 1:])
+                    out_wav_chunks.append(wav_chunk)
+                print(idx, end='\r')
+        # out_wav = torch.cat(out_wav_chunks, dim=-1)
+    except gr.Error:
+        return torch.cat(out_wav_chunks, dim=-1)
     return torch.cat(out_wav_chunks, dim=-1)