Spaces:

Detomo
/

naomi-app-api

Runtime error

App Files Files Community

vumichien committed on Feb 16, 2023

Commit

24c223a

1 Parent(s): afee0d3

Update main.py

Browse files

Files changed (1) hide show

main.py +15 -16

main.py CHANGED Viewed

@@ -102,18 +102,18 @@ async def predict(
             Levenshtein Distance Score from pitch and word
     """
-    upload_audio = ffmpeg_read(file, sampling_rate=16000)
     audio_duration = len(upload_audio) / 16000
     current_time = datetime.datetime.now().strftime("%Y-%h-%d-%H:%M:%S")
     start_time = time.time()
-    error_message, score = None, None
-    if len(word) != len(pitch) and pitch != "None":
         error_message = "Length of word and pitch input is not equal"
     word_preds = query_raw(upload_audio, word, processor, processor_with_lm, quantized_model, temperature=temperature)
-    if pitch != "None":
         pitch_preds = query_dummy(upload_audio, processor_pitch, quantized_pitch_model)
     # find best word
     word_score_list = []
     for word_predict in word_preds:
@@ -123,16 +123,15 @@ async def predict(
     wrong_word = find_different(word, best_word_predict)  # get wrong word
     # find best pitch
-    if pitch != "None":
-        if pitch_preds is not None:
-            best_pitch_predict = pitch_preds.replace(" ", "")
-            if len(best_pitch_predict) < len(best_word_predict):
-                best_pitch_predict = best_pitch_predict + "1" * (len(best_word_predict) - len(best_pitch_predict))
-            else:
-                best_pitch_predict = best_pitch_predict[:len(best_word_predict)]  # truncate to max len
-            pitch_score = fuzz.ratio(pitch, best_pitch_predict)
-            score = int((word_score * 2 + pitch_score) / 3)
-            wrong_pitch = find_different(pitch, best_pitch_predict)  # get wrong pitch
     else:
         score = int(word_score)
         best_pitch_predict = None

             Levenshtein Distance Score from pitch and word
     """
+    upload_audio = ffmpeg_read(file, sampling_rate=16000)
     audio_duration = len(upload_audio) / 16000
     current_time = datetime.datetime.now().strftime("%Y-%h-%d-%H:%M:%S")
     start_time = time.time()
+    error_message, score , pitch_preds = None, None, None
+    if len(word) != len(pitch) and pitch is not None:
         error_message = "Length of word and pitch input is not equal"
     word_preds = query_raw(upload_audio, word, processor, processor_with_lm, quantized_model, temperature=temperature)
+    if pitch is not None:
         pitch_preds = query_dummy(upload_audio, processor_pitch, quantized_pitch_model)
     # find best word
     word_score_list = []
     for word_predict in word_preds:
     wrong_word = find_different(word, best_word_predict)  # get wrong word
     # find best pitch
+    if pitch_preds is not None:
+        best_pitch_predict = pitch_preds.replace(" ", "")
+        if len(best_pitch_predict) < len(best_word_predict):
+            best_pitch_predict = best_pitch_predict + "1" * (len(best_word_predict) - len(best_pitch_predict))
+        else:
+            best_pitch_predict = best_pitch_predict[:len(best_word_predict)]  # truncate to max len
+        pitch_score = fuzz.ratio(pitch, best_pitch_predict)
+        score = int((word_score * 2 + pitch_score) / 3)
+        wrong_pitch = find_different(pitch, best_pitch_predict)  # get wrong pitch
     else:
         score = int(word_score)
         best_pitch_predict = None