Spaces:
Sleeping
Sleeping
Update app.py
Browse files
app.py
CHANGED
@@ -2,11 +2,8 @@
|
|
2 |
import streamlit as st
|
3 |
import speech_recognition as sr
|
4 |
from transformers import pipeline
|
5 |
-
import
|
6 |
-
|
7 |
-
# Initialize the text-to-speech engine
|
8 |
-
tts_engine = pyttsx3.init()
|
9 |
-
tts_engine.setProperty('rate', 150) # Set the speech rate for TTS
|
10 |
|
11 |
# Function to transcribe audio to text
|
12 |
def transcribe_audio(audio_file, input_language):
|
@@ -20,30 +17,72 @@ def transcribe_audio(audio_file, input_language):
|
|
20 |
return f"Error: {str(e)}"
|
21 |
|
22 |
# Function to translate text
|
23 |
-
def translate_text(text,
|
24 |
try:
|
25 |
-
|
26 |
-
translator = pipeline("translation", model=model_name)
|
27 |
translated = translator(text)[0]["translation_text"]
|
28 |
return translated
|
29 |
except Exception as e:
|
30 |
return f"Error: {str(e)}"
|
31 |
|
32 |
-
# Function to
|
33 |
-
def speak_text(text):
|
34 |
try:
|
35 |
-
|
36 |
-
|
|
|
37 |
except Exception as e:
|
38 |
-
|
39 |
|
40 |
-
# Streamlit app
|
41 |
st.title("Real-Time Voice-to-Voice Translator ππ€")
|
42 |
st.markdown("""
|
43 |
This app translates spoken input between multiple languages in real time.
|
44 |
1. Select input and output languages.
|
45 |
-
2. Upload
|
46 |
3. Listen to the translated speech.
|
47 |
""")
|
48 |
|
49 |
-
#
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
2 |
import streamlit as st
|
3 |
import speech_recognition as sr
|
4 |
from transformers import pipeline
|
5 |
+
from gtts import gTTS
|
6 |
+
import os
|
|
|
|
|
|
|
7 |
|
8 |
# Function to transcribe audio to text
|
9 |
def transcribe_audio(audio_file, input_language):
|
|
|
17 |
return f"Error: {str(e)}"
|
18 |
|
19 |
# Function to translate text
|
20 |
+
def translate_text(text, target_language, source_language="en"):
    """Translate ``text`` into ``target_language`` with a Helsinki-NLP OPUS-MT model.

    Args:
        text: The text to translate.
        target_language: Language code of the desired output (e.g. ``"es"``).
        source_language: Language code of ``text``. Defaults to ``"en"``.

    Returns:
        The translated string. Blank input yields ``""`` and identical
        source/target codes return ``text`` unchanged, both without loading a
        model. Any failure while loading or running the model is reported as
        a string of the form ``"Error: <message>"`` instead of being raised.
    """
    # Nothing to translate: skip the (expensive) model load entirely.
    if not text or not text.strip():
        return ""

    # Same language on both sides is the identity translation; asking for a
    # "<lang>-<lang>" model would only produce a load error.
    if source_language == target_language:
        return text

    # NOTE(review): confirm that a model is published under this name for
    # every language pair the app offers; a missing one surfaces below as an
    # "Error: ..." string.
    model_name = f"Helsinki-NLP/opus-mt-{source_language}-{target_language}"
    try:
        translator = pipeline("translation", model=model_name)
        return translator(text)[0]["translation_text"]
    except Exception as e:
        # Callers expect a string result, so failures are returned, not raised.
        return f"Error: {e}"
|
27 |
|
28 |
+
# Function to generate and play speech
|
29 |
+
def speak_text(text, language):
    """Synthesize ``text`` as speech with gTTS and save it as an MP3 file.

    Args:
        text: The text to speak.
        language: Language code passed to gTTS as ``lang``.

    Returns:
        The path of the written MP3 file (``"translated_audio.mp3"``), or
        ``None`` when ``text`` is blank or speech generation fails.
    """
    import logging

    # Blank text cannot be spoken; avoid calling the TTS service at all.
    if not text or not text.strip():
        return None

    # NOTE: the output name is fixed, so each call overwrites the previous file.
    output_path = "translated_audio.mp3"
    try:
        tts = gTTS(text=text, lang=language)
        tts.save(output_path)
    except Exception:
        # Keep the "None on failure" contract, but record why it failed
        # instead of discarding the exception silently.
        logging.getLogger(__name__).exception(
            "Text-to-speech generation failed (lang=%r)", language
        )
        return None
    return output_path
|
36 |
|
37 |
+
# Streamlit app: upload audio -> transcribe -> translate -> synthesize speech.
# NOTE(review): the trailing characters of the title look like mis-encoded
# emoji; restore them from the original file if that is the case.
st.title("Real-Time Voice-to-Voice Translator ππ€")
st.markdown("""
This app translates spoken input between multiple languages in real time.
1. Select input and output languages.
2. Upload your audio file or record audio for translation.
3. Listen to the translated speech.
""")

# Display name -> language code handed to the transcription, translation
# and text-to-speech helpers.
languages = {
    "English": "en",
    "Spanish": "es",
    "French": "fr",
    "German": "de",
    "Chinese": "zh",
    "Japanese": "ja",
    "Korean": "ko",
    "Hindi": "hi",
}

# Select input and output languages
language_names = list(languages)
input_lang = st.selectbox("Select input language", options=language_names)
output_lang = st.selectbox("Select output language", options=language_names)

# Upload audio file
uploaded_audio = st.file_uploader("Upload an audio file", type=["wav", "mp3", "ogg"])

if uploaded_audio:
    # Preview the upload using its own MIME type: mp3 and ogg files are
    # accepted as well, so declaring every upload as WAV would be wrong.
    st.audio(uploaded_audio, format=uploaded_audio.type or "audio/wav")

    st.write("Transcribing audio...")
    input_language_code = languages[input_lang]
    transcribed_text = transcribe_audio(uploaded_audio, input_language_code)
    st.write(f"Transcribed Text: {transcribed_text}")

    # The helpers report failures as "Error..." strings rather than raising.
    if transcribed_text and not transcribed_text.startswith("Error"):
        st.write("Translating text...")
        output_language_code = languages[output_lang]
        if output_language_code == input_language_code:
            # Same language on both sides: nothing to translate.
            translated_text = transcribed_text
        else:
            # NOTE(review): only the target language is passed here; confirm
            # that translate_text handles non-English input correctly.
            translated_text = translate_text(transcribed_text, output_language_code)

        if translated_text.startswith("Error:"):
            # Do not read a translation failure message aloud.
            st.error("Error in translation.")
        else:
            st.write(f"Translated Text: {translated_text}")

            # Generate speech for the translated text
            st.write("Generating translated audio...")
            audio_file = speak_text(translated_text, output_language_code)
            if audio_file:
                st.audio(audio_file, format="audio/mp3")
            else:
                st.error("Error in generating translated speech.")
    else:
        st.error("Error in transcription.")
|