ArissBandoss committed (verified)
Commit 7f3d8a9 · 1 parent: dfb286c

Update goai_helpers/goai_traduction.py

Files changed (1)
  1. goai_helpers/goai_traduction.py +18 -14
goai_helpers/goai_traduction.py CHANGED
@@ -18,32 +18,36 @@ def goai_traduction(text, src_lang, tgt_lang):
     if src_lang == "fra_Latn" and tgt_lang == "mos_Latn":
         model_id = "ArissBandoss/nllb-200-distilled-600M-finetuned-fr-to-mos-V4"
     elif src_lang == "mos_Latn" and tgt_lang == "fra_Latn":
-        model_id = "ArissBandoss/mos2fr-3B-1200"
+        model_id = "ArissBandoss/mos2fr-5B-800-fixed"  # Repaired model
     else:
         model_id = "ArissBandoss/nllb-200-distilled-600M-finetuned-fr-to-mos-V4"
-
+
     tokenizer = AutoTokenizer.from_pretrained(model_id, token=auth_token)
     model = AutoModelForSeq2SeqLM.from_pretrained(model_id, token=auth_token).to(device)
-
+
+    # Tokenizer configuration
     tokenizer.src_lang = src_lang
+
+    # Tokenization
     inputs = tokenizer(text, return_tensors="pt").to(device)
-
-    # Add the target-language code
+
+    # Target-language token ID
     tgt_lang_id = tokenizer.convert_tokens_to_ids(tgt_lang)
-
-    # Controlled generation
+
+    # Generation with the tuned parameters
     outputs = model.generate(
         **inputs,
         forced_bos_token_id=tgt_lang_id,
-        eos_token_id=tokenizer.eos_token_id,  # Make sure the model can stop
-        max_length=512,  # Test with 256, then increase gradually
-        do_sample=False,
-        early_stopping=True
+        max_new_tokens=1024,
+        num_beams=5,
+        early_stopping=False,
+        no_repeat_ngram_size=0,
+        length_penalty=1.0
     )
-
+
+    # Decoding
     translation = tokenizer.batch_decode(outputs, skip_special_tokens=True)[0]
-    print("ici translation")
-    print(translation)
+
     return translation
 
 def real_time_traduction(input_text, src_lang, tgt_lang):
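
For readers landing on this commit, a minimal standalone sketch of the translation path as it now stands. It mirrors the function body above but inlines the surrounding setup the diff does not show: device and auth_token are module-level names in the original file, so their definitions here are assumptions, and the example sentence and hard-coded language pair are illustrative only. A Hugging Face access token may be needed if the checkpoints are gated.

import torch
from transformers import AutoModelForSeq2SeqLM, AutoTokenizer

device = "cuda" if torch.cuda.is_available() else "cpu"
auth_token = None  # assumption: set an HF access token here if the repo is gated

model_id = "ArissBandoss/nllb-200-distilled-600M-finetuned-fr-to-mos-V4"
tokenizer = AutoTokenizer.from_pretrained(model_id, token=auth_token)
model = AutoModelForSeq2SeqLM.from_pretrained(model_id, token=auth_token).to(device)

# NLLB models take the source language on the tokenizer and the target
# language as a forced first decoder token (language codes are special tokens).
tokenizer.src_lang = "fra_Latn"
inputs = tokenizer("Bonjour, comment allez-vous ?", return_tensors="pt").to(device)
tgt_lang_id = tokenizer.convert_tokens_to_ids("mos_Latn")

outputs = model.generate(
    **inputs,
    forced_bos_token_id=tgt_lang_id,
    max_new_tokens=1024,
    num_beams=5,
    early_stopping=False,
    no_repeat_ngram_size=0,
    length_penalty=1.0,
)
print(tokenizer.batch_decode(outputs, skip_special_tokens=True)[0])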
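
As a side note on the parameter swap itself, a sketch using the transformers GenerationConfig API; the before/after values are copied from the diff, while the comments are one reading of the generation docs rather than the author's stated rationale.

from transformers import GenerationConfig

# Before this commit: greedy decoding (num_beams defaults to 1, so
# early_stopping=True had no effect) with the decoder output capped
# at 512 tokens by max_length.
old_cfg = GenerationConfig(
    max_length=512,
    do_sample=False,
    early_stopping=True,
)

# After this commit: 5-beam search with roughly double the output budget;
# for an encoder-decoder model, max_new_tokens and max_length differ only
# by the decoder start tokens. no_repeat_ngram_size=0 and length_penalty=1.0
# are the library defaults (no n-gram blocking, standard length normalization).
new_cfg = GenerationConfig(
    max_new_tokens=1024,
    num_beams=5,
    early_stopping=False,
    no_repeat_ngram_size=0,
    length_penalty=1.0,
)

# Usage with the sketch above:
# outputs = model.generate(**inputs, forced_bos_token_id=tgt_lang_id,
#                          generation_config=new_cfg)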