cnph001 committed on
Commit
08f8e97
·
verified ·
1 Parent(s): 7941061

Update app.py

Browse files
Files changed (1) hide show
  1. app.py +5 -3
app.py CHANGED
@@ -16,7 +16,7 @@ from pydub import AudioSegment
16
  default_voice_short= ""
17
  check1 = False # set global variable to check to see if process_text is begin of transcript line or not.
18
 
19
- def strip_silence(audio: AudioSegment, silence_thresh=-40, min_silence_len=100, silence_padding_ms=50):
20
  from pydub.silence import detect_nonsilent
21
  # Detect non-silent regions
22
  nonsilent = detect_nonsilent(audio, min_silence_len=min_silence_len, silence_thresh=silence_thresh)
@@ -29,6 +29,8 @@ def strip_silence(audio: AudioSegment, silence_thresh=-40, min_silence_len=100,
29
  # Add padding before and after the trimmed audio
30
  # Ensure the padding doesn't exceed the trimmed boundaries
31
  start_trim = max(0, start_trim - silence_padding_ms) # Ensure no negative start
 
 
32
  end_trim = min(len(audio), end_trim + silence_padding_ms) # Ensure end doesn't go past audio length
33
  # Return the trimmed and padded audio
34
  return audio[start_trim:end_trim]
@@ -136,9 +138,9 @@ async def generate_audio_with_voice_prefix(text_segment, default_voice, rate, pi
136
  audio = AudioSegment.from_mp3(audio_path)
137
  if check1:
138
  print(f"First part of sentence - long silence")
139
- audio = strip_silence(audio, silence_thresh=-40, min_silence_len=100) ##silence between sentences
140
  else:
141
- audio = strip_silence(audio, silence_thresh=-40, min_silence_len=100) ##less silence for mid-sentence segments
142
  print(f"2nd part of sentence - long silence")
143
  stripped_path = tempfile.mktemp(suffix=".mp3")
144
  audio.export(stripped_path, format="mp3")
 
16
  default_voice_short= ""
17
  check1 = False # set global variable to check to see if process_text is begin of transcript line or not.
18
 
19
+ def strip_silence(audio: AudioSegment, silence_thresh=-40, min_silence_len=100, silence_padding_ms=100):
20
  from pydub.silence import detect_nonsilent
21
  # Detect non-silent regions
22
  nonsilent = detect_nonsilent(audio, min_silence_len=min_silence_len, silence_thresh=silence_thresh)
 
29
  # Add padding before and after the trimmed audio
30
  # Ensure the padding doesn't exceed the trimmed boundaries
31
  start_trim = max(0, start_trim - silence_padding_ms) # Ensure no negative start
32
+ #if not check1:
33
+ # silence_padding_ms=30
34
  end_trim = min(len(audio), end_trim + silence_padding_ms) # Ensure end doesn't go past audio length
35
  # Return the trimmed and padded audio
36
  return audio[start_trim:end_trim]
 
138
  audio = AudioSegment.from_mp3(audio_path)
139
  if check1:
140
  print(f"First part of sentence - long silence")
141
+ audio = strip_silence(audio, silence_thresh=-40, min_silence_len=50, silence_padding_ms=50) ##silence between sentences
142
  else:
143
+ audio = strip_silence(audio, silence_thresh=-40, min_silence_len=50, silence_padding_ms=20) ##less silence for mid-sentence segments
144
  print(f"2nd part of sentence - long silence")
145
  stripped_path = tempfile.mktemp(suffix=".mp3")
146
  audio.export(stripped_path, format="mp3")