Spaces:
Sleeping
Sleeping
Update app.py
Browse files
app.py
CHANGED
@@ -16,7 +16,7 @@ from pydub import AudioSegment
|
|
16 |
default_voice_short= ""
|
17 |
check1 = False # set global variable to check to see if process_text is begin of transcript line or not.
|
18 |
|
19 |
-
def strip_silence(audio: AudioSegment, silence_thresh=-40, min_silence_len=100, silence_padding_ms=
|
20 |
from pydub.silence import detect_nonsilent
|
21 |
# Detect non-silent regions
|
22 |
nonsilent = detect_nonsilent(audio, min_silence_len=min_silence_len, silence_thresh=silence_thresh)
|
@@ -29,6 +29,8 @@ def strip_silence(audio: AudioSegment, silence_thresh=-40, min_silence_len=100,
|
|
29 |
# Add padding before and after the trimmed audio
|
30 |
# Clamp the padded range so it stays within the bounds of the original audio
|
31 |
start_trim = max(0, start_trim - silence_padding_ms) # Ensure no negative start
|
|
|
|
|
32 |
end_trim = min(len(audio), end_trim + silence_padding_ms) # Ensure end doesn't go past audio length
|
33 |
# Return the trimmed and padded audio
|
34 |
return audio[start_trim:end_trim]
|
@@ -136,9 +138,9 @@ async def generate_audio_with_voice_prefix(text_segment, default_voice, rate, pi
|
|
136 |
audio = AudioSegment.from_mp3(audio_path)
|
137 |
if check1:
|
138 |
print(f"First part of sentence - long silence")
|
139 |
-
audio = strip_silence(audio, silence_thresh=-40, min_silence_len=
|
140 |
else:
|
141 |
-
audio = strip_silence(audio, silence_thresh=-40, min_silence_len=
|
142 |
print(f"2nd part of sentence - long silence")
|
143 |
stripped_path = tempfile.mktemp(suffix=".mp3")
|
144 |
audio.export(stripped_path, format="mp3")
|
|
|
16 |
default_voice_short= ""
|
17 |
check1 = False # set global variable to check to see if process_text is begin of transcript line or not.
|
18 |
|
19 |
+
def strip_silence(audio: AudioSegment, silence_thresh=-40, min_silence_len=100, silence_padding_ms=100):
|
20 |
from pydub.silence import detect_nonsilent
|
21 |
# Detect non-silent regions
|
22 |
nonsilent = detect_nonsilent(audio, min_silence_len=min_silence_len, silence_thresh=silence_thresh)
|
|
|
29 |
# Add padding before and after the trimmed audio
|
30 |
# Clamp the padded range so it stays within the bounds of the original audio
|
31 |
start_trim = max(0, start_trim - silence_padding_ms) # Ensure no negative start
|
32 |
+
#if not check1:
|
33 |
+
# silence_padding_ms=30
|
34 |
end_trim = min(len(audio), end_trim + silence_padding_ms) # Ensure end doesn't go past audio length
|
35 |
# Return the trimmed and padded audio
|
36 |
return audio[start_trim:end_trim]
|
|
|
138 |
audio = AudioSegment.from_mp3(audio_path)
|
139 |
if check1:
|
140 |
print(f"First part of sentence - long silence")
|
141 |
+
audio = strip_silence(audio, silence_thresh=-40, min_silence_len=50, silence_padding_ms=50) ##silence between sentences
|
142 |
else:
|
143 |
+
audio = strip_silence(audio, silence_thresh=-40, min_silence_len=50, silence_padding_ms=20) ##less silence for mid-sentence segments
|
144 |
print(f"2nd part of sentence - long silence")
|
145 |
stripped_path = tempfile.mktemp(suffix=".mp3")
|
146 |
audio.export(stripped_path, format="mp3")
|