Moore-Language-Space-ZeroGPU

Sleeping

App Files Files Community

Moore-Language-Space-ZeroGPU / goai_helpers /goai_traduction.py

ArissBandoss

Update goai_helpers/goai_traduction.py

b8808c9 verified 3 months ago

raw

history blame

2.53 kB

	import torch
	import spaces
	from transformers import pipeline, AutoModelForSeq2SeqLM, AutoTokenizer
	from peft import PeftModel, PeftConfig
	import os
	from huggingface_hub import login

	# Maximum length (in tokens) passed to the translation calls in this module.
	max_length = 512
	# Hugging Face access token taken from the environment; None when unset.
	auth_token = os.getenv('HF_SPACE_TOKEN')
	# Only authenticate when a token is actually configured: login(token=None)
	# falls back to an interactive prompt, which cannot be answered when this
	# module is imported in a headless process.
	if auth_token:
	    login(token=auth_token)


	# Checkpoint used for fra_Latn -> mos_Latn (and as the fallback for any other pair).
	_FR_TO_MOS_MODEL_ID = "ArissBandoss/nllb-200-distilled-600M-finetuned-fr-to-mos-V4"
	# PEFT adapter used for mos_Latn -> fra_Latn; its base model is read from the adapter config.
	_MOS_TO_FR_ADAPTER_ID = "ArissBandoss/mos2fr-5B-800"


	def _generate_translation(model, tokenizer, text, src_lang, tgt_lang, device, limit):
	    """Translate ``text`` by calling ``model.generate`` directly.

	    Args:
	        model: Seq2seq model (here a PEFT-wrapped model) exposing ``generate``.
	        tokenizer: Tokenizer matching the model's base checkpoint.
	        text: Source text to translate.
	        src_lang: Source language code, e.g. ``"mos_Latn"``.
	        tgt_lang: Target language code, e.g. ``"fra_Latn"``.
	        device: ``torch.device`` on which generation runs.
	        limit: Maximum token length for both the encoded input and the output.

	    Returns:
	        The decoded translation of ``text`` as a string.
	    """
	    # Model and inputs must live on the same device, otherwise generate() fails.
	    model.to(device)
	    model.eval()

	    if src_lang:
	        # NOTE(review): assumes an NLLB-style tokenizer that reads ``src_lang``
	        # to pick the source-language tag -- confirm for the adapter's base model.
	        tokenizer.src_lang = src_lang

	    # truncation=True is required for max_length to actually cap the input.
	    encoded = tokenizer(text, return_tensors="pt", truncation=True, max_length=limit)
	    encoded = {name: tensor.to(device) for name, tensor in encoded.items()}

	    generation_kwargs = {}
	    if src_lang and tgt_lang:
	        # Force the decoder to start with the target-language token.
	        generation_kwargs["forced_bos_token_id"] = tokenizer.convert_tokens_to_ids(tgt_lang)

	    with torch.no_grad():
	        outputs = model.generate(**encoded, max_length=limit, **generation_kwargs)
	    return tokenizer.batch_decode(outputs, skip_special_tokens=True)[0]


	@spaces.GPU
	def goai_traduction(text, src_lang, tgt_lang):
	    """Translate ``text`` from ``src_lang`` to ``tgt_lang``.

	    ``mos_Latn`` -> ``fra_Latn`` uses the PEFT adapter on top of its base
	    model and generates directly. ``fra_Latn`` -> ``mos_Latn`` uses the
	    fine-tuned checkpoint through a translation pipeline; any other language
	    pair falls back to that same checkpoint.

	    Args:
	        text: Source text to translate.
	        src_lang: Source language code (e.g. ``"fra_Latn"``).
	        tgt_lang: Target language code (e.g. ``"mos_Latn"``).

	    Returns:
	        The translated text as a string.
	    """
	    device = torch.device("cuda" if torch.cuda.is_available() else "cpu")

	    if src_lang == "mos_Latn" and tgt_lang == "fra_Latn":
	        # Load the base model once and wrap it with the adapter; the tokenizer
	        # comes from the base checkpoint named in the adapter config.
	        peft_config = PeftConfig.from_pretrained(_MOS_TO_FR_ADAPTER_ID)
	        base_model_id = peft_config.base_model_name_or_path
	        base_model = AutoModelForSeq2SeqLM.from_pretrained(base_model_id, token=auth_token)
	        model = PeftModel.from_pretrained(base_model, _MOS_TO_FR_ADAPTER_ID)
	        tokenizer = AutoTokenizer.from_pretrained(base_model_id, token=auth_token)
	        return _generate_translation(
	            model, tokenizer, text, src_lang, tgt_lang, device, max_length
	        )

	    # fra_Latn -> mos_Latn, and the fallback for every other pair.
	    tokenizer = AutoTokenizer.from_pretrained(_FR_TO_MOS_MODEL_ID, token=auth_token)
	    model = AutoModelForSeq2SeqLM.from_pretrained(_FR_TO_MOS_MODEL_ID, token=auth_token)

	    trans_pipe = pipeline(
	        "translation",
	        model=model,
	        tokenizer=tokenizer,
	        src_lang=src_lang,
	        tgt_lang=tgt_lang,
	        max_length=max_length,
	        device=device,
	    )

	    return trans_pipe(text)[0]["translation_text"]


	def real_time_traduction(input_text, src_lang, tgt_lang):
	    """Return the translation of ``input_text`` by delegating to ``goai_traduction``.

	    Args:
	        input_text: Text to translate.
	        src_lang: Source language code, forwarded unchanged.
	        tgt_lang: Target language code, forwarded unchanged.

	    Returns:
	        Whatever ``goai_traduction`` returns for the same arguments.
	    """
	    translated = goai_traduction(input_text, src_lang, tgt_lang)
	    return translated