Update app.py
Browse files
app.py
CHANGED
@@ -1492,12 +1492,19 @@ def bark_tts(text):
|
|
1492 |
|
1493 |
start = time.time()
|
1494 |
# ✅ DO NOT use **inputs here to avoid duplicate keys
|
1495 |
-
|
1496 |
-
|
1497 |
-
|
1498 |
-
|
1499 |
-
|
1500 |
-
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1501 |
print(f"✅ Bark finished in {round(time.time() - start, 2)}s")
|
1502 |
|
1503 |
speech = speech_values.cpu().numpy().squeeze()
|
|
|
1492 |
|
1493 |
start = time.time()
|
1494 |
# ✅ DO NOT use **inputs here to avoid duplicate keys
|
1495 |
+
generate_args = {
|
1496 |
+
"input_ids": input_ids,
|
1497 |
+
"attention_mask": attention_mask,
|
1498 |
+
"pad_token_id": model_bark.config.eos_token_id,
|
1499 |
+
"max_new_tokens": 100
|
1500 |
+
}
|
1501 |
+
# Remove conflicting keys if already in processor output
|
1502 |
+
for key in ["max_new_tokens", "pad_token_id"]:
|
1503 |
+
if key in inputs:
|
1504 |
+
del inputs[key]
|
1505 |
+
|
1506 |
+
speech_values = model_bark.generate(**generate_args)
|
1507 |
+
|
1508 |
print(f"✅ Bark finished in {round(time.time() - start, 2)}s")
|
1509 |
|
1510 |
speech = speech_values.cpu().numpy().squeeze()
|