Moore-Language-Space-ZeroGPU

Sleeping

ArissBandoss committed on May 19

Commit

f0846b1

verified ·

1 Parent(s): 4a24c4f

Update goai_helpers/goai_traduction.py

Files changed (1) hide show

goai_helpers/goai_traduction.py CHANGED Viewed

@@ -30,9 +30,6 @@ def goai_traduction(text, src_lang, tgt_lang):
     inputs = tokenizer(text, return_tensors="pt", truncation=False).to(device)
     input_length = inputs["input_ids"].shape[1]
-    # Estimation intelligente de la longueur de sortie attendue
-    # Pour le mooré vers français, un facteur de 1.2-1.5 est généralement bon
-    expected_output_length = int(input_length * 1.3)
     # ID du token de langue cible
     tgt_lang_id = tokenizer.convert_tokens_to_ids(tgt_lang)
@@ -45,13 +42,10 @@ def goai_traduction(text, src_lang, tgt_lang):
         **inputs,
         forced_bos_token_id=tgt_lang_id,
         max_new_tokens=1024,
-        min_length=expected_output_length,
         num_beams=5,
         no_repeat_ngram_size=4,
         repetition_penalty=2.0,
-        length_penalty=1.5,
-        diversity_penalty=0.5,
-        num_beam_groups=5
     )
     # Décodage

     inputs = tokenizer(text, return_tensors="pt", truncation=False).to(device)
     input_length = inputs["input_ids"].shape[1]
     # ID du token de langue cible
     tgt_lang_id = tokenizer.convert_tokens_to_ids(tgt_lang)
         **inputs,
         forced_bos_token_id=tgt_lang_id,
         max_new_tokens=1024,
         num_beams=5,
         no_repeat_ngram_size=4,
         repetition_penalty=2.0,
+        length_penalty=1.5,
     )
     # Décodage