import os
import json

import torch
import openai
from peft import PeftModel
from transformers import AutoModelForCausalLM, AutoModelForSeq2SeqLM, AutoTokenizer
SYSTEM_PROMPT = (
    "You are an advanced AI model specialized in extracting aspects and determining their sentiment polarity from customer reviews.\n\n"
    "Instructions:\n"
    "1. Extract only the aspects (nouns) mentioned in the review.\n"
    "2. Assign a sentiment to each aspect: \"positive\", \"negative\", or \"neutral\".\n"
    "3. Return aspects in the same language as they appear.\n"
    "4. An aspect must be a noun that refers to a specific item or service the user described.\n"
    "5. Ignore adjectives, general ideas, and vague topics.\n"
    "6. Do NOT translate, explain, or add extra text.\n"
    "7. The output must be just a valid JSON list with 'aspect' and 'sentiment'. Start with `[` and stop at `]`.\n"
    "8. Do NOT output the instructions, review, or any other text; output only one JSON list.\n"
    "9. Just one output and one review."
)
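
# Illustrative expected output (made-up review) for the format the prompt demands:
#   review: "The battery lasts long but the screen is dim."
#   output: [{"aspect": "battery", "sentiment": "positive"},
#            {"aspect": "screen", "sentiment": "negative"}]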
MODEL_OPTIONS = {
    "Araberta": {
        "base": "asmashayea/absa-araberta",
        "adapter": "asmashayea/absa-araberta"
    },
    "mT5": {
        "base": "google/mt5-base",
        "adapter": "asmashayea/mt4-absa"
    },
    "mBART": {
        "base": "facebook/mbart-large-50-many-to-many-mmt",
        "adapter": "asmashayea/mbart-absa"
    },
    "GPT3.5": {
        "base": "openai/gpt-3.5-turbo",
        "model_id": "ft:gpt-3.5-turbo-0125:asma:gpt-3-5-turbo-absa:Bb6gmwkE"
    },
    "GPT4o": {
        "base": "openai/gpt-4o",
        "model_id": "ft:gpt-4o-mini-2024-07-18:asma:gpt4-finetune-absa:BazoEjnp"
    },
    "ALLaM": {
        "base": "ALLaM-AI/ALLaM-7B-Instruct-preview",
        "adapter": "asmashayea/allam-absa"
    },
    "DeepSeek": {
        "base": "deepseek-ai/deepseek-llm-7b-chat",
        "adapter": "asmashayea/deepseek-absa"
    }
}
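
# Note: the "GPT4o" entry's fine-tuned model_id is built on gpt-4o-mini
# (see the ft: identifier above), not on the full gpt-4o base.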
cached_models = {}

# Reusable loader for both mT5 and mBART (seq2seq base + LoRA adapter).
def load_mt5_bart(model_key):
    if model_key in cached_models:  # reuse an already-loaded model instead of reloading
        return cached_models[model_key]
    base_id = MODEL_OPTIONS[model_key]["base"]
    adapter_id = MODEL_OPTIONS[model_key]["adapter"]
    tokenizer = AutoTokenizer.from_pretrained(adapter_id)
    base_model = AutoModelForSeq2SeqLM.from_pretrained(base_id)
    peft_model = PeftModel.from_pretrained(base_model, adapter_id)
    peft_model.eval()
    cached_models[model_key] = (tokenizer, peft_model)
    return tokenizer, peft_model
def infer_t5_bart(text, model_choice):
    tokenizer, peft_model = load_mt5_bart(model_choice)
    prompt = SYSTEM_PROMPT + f"\n\nReview: {text}"
    inputs = tokenizer(prompt, return_tensors="pt", padding=True, truncation=True).to(peft_model.device)
    with torch.no_grad():
        # Deterministic beam-search decoding (no sampling, so temperature is omitted).
        outputs = peft_model.generate(
            **inputs,
            max_new_tokens=256,
            num_beams=4,
            do_sample=False,
            early_stopping=True,
            pad_token_id=tokenizer.pad_token_id,
            eos_token_id=tokenizer.eos_token_id,
        )
    decoded = tokenizer.decode(outputs[0], skip_special_tokens=True).strip()
    decoded = decoded.replace('<extra_id_0>', '').replace('</s>', '').strip()
    try:
        return json.loads(decoded)
    except json.JSONDecodeError:
        return {"raw_output": decoded, "error": "Invalid JSON"}
# Read the key from the environment instead of hardcoding a secret in the source.
OPENAI_API_KEY = os.environ.get("OPENAI_API_KEY")
openai.api_key = OPENAI_API_KEY
def infer_gpt_absa(text, model_key):
    MODEL_ID = MODEL_OPTIONS[model_key]["model_id"]
    try:
        response = openai.chat.completions.create(
            model=MODEL_ID,
            messages=[
                {"role": "system", "content": SYSTEM_PROMPT},
                {"role": "user", "content": text}
            ],
            temperature=0
        )
        decoded = response.choices[0].message.content.strip()
        return json.loads(decoded)
    except Exception as e:
        return {"error": str(e)}
def infer_allam(review_text):
    tokenizer, model = cached_models.get("ALLaM") or load_allam()
    # Build the chat-formatted prompt and open the assistant turn for generation.
    prompt = tokenizer.apply_chat_template(
        [
            {"role": "system", "content": SYSTEM_PROMPT},
            {"role": "user", "content": review_text}
        ],
        tokenize=False,
        add_generation_prompt=True
    )
    inputs = tokenizer(prompt, return_tensors="pt", truncation=True, max_length=512).to(model.device)
    with torch.no_grad():
        outputs = model.generate(
            **inputs,
            max_new_tokens=128,
            do_sample=False,
            pad_token_id=tokenizer.eos_token_id
        )
    # Decode only the newly generated tokens, skipping the prompt.
    decoded = tokenizer.decode(outputs[0][inputs["input_ids"].shape[1]:], skip_special_tokens=True).strip()
    try:
        return json.loads(decoded)
    except Exception as e:
        return {"error": str(e), "raw": decoded}
def load_allam():
    base_model = AutoModelForCausalLM.from_pretrained(
        MODEL_OPTIONS["ALLaM"]["base"],
        device_map="auto",
        torch_dtype=torch.float16,
        trust_remote_code=True
    )
    tokenizer = AutoTokenizer.from_pretrained(
        MODEL_OPTIONS["ALLaM"]["adapter"],
        trust_remote_code=True
    )
    model = PeftModel.from_pretrained(base_model, MODEL_OPTIONS["ALLaM"]["adapter"])
    cached_models["ALLaM"] = (tokenizer, model)
    return tokenizer, model
def build_deepseek_prompt(review_text, output=""):
    # Reuse SYSTEM_PROMPT rather than duplicating the instructions inline.
    # `output` stays empty at inference time and carries the target JSON when
    # building training-style examples.
    return f"""<|system|>
{SYSTEM_PROMPT}
<|user|>
{review_text}
<|assistant|>
{output}"""
def load_deepseek():
    base = AutoModelForCausalLM.from_pretrained(
        MODEL_OPTIONS["DeepSeek"]["base"],
        torch_dtype=torch.float16,
        trust_remote_code=True
    )
    tokenizer = AutoTokenizer.from_pretrained(
        MODEL_OPTIONS["DeepSeek"]["adapter"], trust_remote_code=True
    )
    model = PeftModel.from_pretrained(base, MODEL_OPTIONS["DeepSeek"]["adapter"])
    cached_models["DeepSeek"] = (tokenizer, model)
    return tokenizer, model
def infer_deepseek(review):
    if "DeepSeek" not in cached_models:
        tokenizer, model = load_deepseek()
    else:
        tokenizer, model = cached_models["DeepSeek"]
    prompt = build_deepseek_prompt(review)
    inputs = tokenizer(prompt, return_tensors="pt", truncation=True, max_length=512).to(model.device)
    with torch.no_grad():
        # Greedy decoding; temperature is irrelevant when do_sample=False.
        output = model.generate(
            **inputs,
            max_new_tokens=128,
            do_sample=False,
            pad_token_id=tokenizer.eos_token_id
        )
    decoded = tokenizer.decode(
        output[0][inputs["input_ids"].shape[1]:],
        skip_special_tokens=True
    ).strip()
    try:
        return json.loads(decoded)
    except Exception as e:
        print(f"DeepSeek JSON parse error: {e}")
        return decoded
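
# A minimal dispatch sketch (an addition, not part of the original app): route a
# review to the matching inference helper by model key. "Araberta" appears in
# MODEL_OPTIONS but has no inference function in this file, so it is not routed.
def infer(text, model_key):
    if model_key in ("mT5", "mBART"):
        return infer_t5_bart(text, model_key)
    if model_key in ("GPT3.5", "GPT4o"):
        return infer_gpt_absa(text, model_key)
    if model_key == "ALLaM":
        return infer_allam(text)
    if model_key == "DeepSeek":
        return infer_deepseek(text)
    raise ValueError(f"No inference helper for model key: {model_key}")


if __name__ == "__main__":
    # Illustrative smoke test; the review text is made up.
    print(infer("The battery lasts long but the screen is dim.", "mT5"))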