import json

from transformers import pipeline


class StyleSavvy:
    def __init__(
        self,
        model_name: str = "google/flan-t5-large",
        device: int = -1,  # -1 = CPU, or a GPU index
        max_length: int = 150,
    ):
        self.pipe = pipeline(
            "text2text-generation",
            model=model_name,
            tokenizer=model_name,
            device=device,
        )
        self.max_length = max_length
    def advise(self, items, body_type, face_shape, occasion):
        # If items arrives as a JSON string, parse it back into a Python list first.
        items = json.loads(items) if isinstance(items, str) else items
        prompt = (
            f"The user is {body_type}-shaped with a {face_shape} face, "
            f"attending a {occasion}. They are wearing: "
            + ", ".join(i["label"] for i in items)
            + ".\n\nPlease list 5 concise style tips as bullet points:"
        )
        result = self.pipe(
            prompt,
            max_length=self.max_length,
            num_beams=4,
            early_stopping=True,
            do_sample=False,
        )[0]["generated_text"].strip()
        return result
# Previous implementation (kept for reference):
#
# # models/llm.py
# import os
# from typing import List
#
# from transformers import pipeline, Pipeline
#
# # Force CPU mode (avoid any MPS/CUDA issues on macOS).
# os.environ["CUDA_VISIBLE_DEVICES"] = ""
# os.environ["PYTORCH_ENABLE_MPS_FALLBACK"] = "0"
#
#
# class StyleSavvy:
#     def __init__(
#         self,
#         model_name: str = "openlm-research/open_llama_3b_v2",
#         device: int = -1,  # -1 = CPU
#         max_new_tokens: int = 100,
#         temperature: float = 0.7,
#         top_p: float = 0.9,
#     ):
#         """
#         Uses OpenLLaMA-3B-v2 (≈3B params) for fast, local inference.
#         """
#         # Set up a causal text-generation pipeline.
#         self.pipe: Pipeline = pipeline(
#             "text-generation",
#             model=model_name,
#             tokenizer=model_name,
#             device=device,
#         )
#         # GPT-style models need a pad token to avoid warnings.
#         if self.pipe.tokenizer.pad_token_id is None:
#             self.pipe.tokenizer.pad_token = self.pipe.tokenizer.eos_token
#         self.max_new_tokens = max_new_tokens
#         self.temperature = temperature
#         self.top_p = top_p
#
#     def advise(
#         self,
#         items: List[str],
#         body_type: str,
#         face_shape: str,
#         occasion: str,
#     ) -> List[str]:
#         """
#         Builds a strict instruction prompt and returns exactly five "- " bullets.
#         """
#         labels = ", ".join(items) if items else "an outfit"
#         prompt = (
#             "You are a professional fashion consultant.\n"
#             f"The user is {body_type}-shaped with a {face_shape} face, attending {occasion}.\n"
#             f"They are wearing: {labels}.\n\n"
#             "Please provide exactly five concise style tips, each on its own line, "
#             "starting with \"- \". No extra text."
#         )
#         # Generate.
#         output = self.pipe(
#             prompt,
#             max_new_tokens=self.max_new_tokens,
#             do_sample=True,
#             temperature=self.temperature,
#             top_p=self.top_p,
#             return_full_text=False,
#         )[0]["generated_text"]
#         # Extract bullet lines.
#         tips = [ln.strip() for ln in output.splitlines() if ln.strip().startswith("- ")]
#         # Fallback: split on sentences if fewer than 5 bullets came back.
#         if len(tips) < 5:
#             candidates = [s.strip() for s in output.replace("\n", " ").split(".") if s.strip()]
#             tips = [f"- {candidates[i]}" for i in range(min(5, len(candidates)))]
#         return tips[:5]
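

# A minimal usage sketch (assumptions: the google/flan-t5-large weights are
# fetched on first run, and the item labels below are made-up examples, not
# fixtures from this repo):
if __name__ == "__main__":
    advisor = StyleSavvy()
    tips = advisor.advise(
        items=[{"label": "navy blazer"}, {"label": "white sneakers"}],
        body_type="pear",
        face_shape="oval",
        occasion="casual brunch",
    )
    print(tips)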