iamspruce committed · Commit 6eff95d · Parent: 869988f

updated models

Files changed:
- app/models.py (+22 -5)
- app/routers/analyze.py (+9 -7)
app/models.py
CHANGED
@@ -2,11 +2,14 @@ from transformers import AutoModelForSeq2SeqLM, AutoTokenizer, pipeline
 import torch
 
 # Set the device for model inference (CPU is used by default)
+# You can change to "cuda" if a compatible GPU is available for faster processing.
 device = torch.device("cpu")
 
 # --- Grammar model ---
 # Uses vennify/t5-base-grammar-correction for grammar correction tasks.
-# This model
+# Note: This model might not catch all subtle spelling or advanced grammar errors
+# as robustly as larger models or rule-based systems. Its performance depends on
+# its training data.
 grammar_tokenizer = AutoTokenizer.from_pretrained("vennify/t5-base-grammar-correction")
 grammar_model = AutoModelForSeq2SeqLM.from_pretrained("vennify/t5-base-grammar-correction").to(device)
 
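The added comments hedge both the device choice and the grammar model's limits. As an illustration only (none of this is in the commit), the device pick can be automated with torch.cuda.is_available(), and the vennify checkpoint is conventionally prompted with a "grammar: " task prefix; the prefix and the generation settings below are assumptions about how run_grammar_correction might drive these objects:

    import torch
    from transformers import AutoModelForSeq2SeqLM, AutoTokenizer

    # Use the GPU automatically when present; falls back to the commit's CPU default.
    device = torch.device("cuda" if torch.cuda.is_available() else "cpu")

    tokenizer = AutoTokenizer.from_pretrained("vennify/t5-base-grammar-correction")
    model = AutoModelForSeq2SeqLM.from_pretrained("vennify/t5-base-grammar-correction").to(device)

    def correct(text: str) -> str:
        # "grammar: " follows the model card's usage example (an assumption here).
        inputs = tokenizer("grammar: " + text, return_tensors="pt").to(device)
        outputs = model.generate(**inputs, max_new_tokens=128)
        return tokenizer.decode(outputs[0], skip_special_tokens=True)

    print(correct("He go to school yesterday"))  # e.g. "He went to school yesterday."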
@@ -47,6 +50,7 @@ def run_grammar_correction(text: str) -> str:
 def run_flan_prompt(prompt: str) -> str:
     """
     Runs a given prompt through the FLAN-T5 model to generate a response.
+    Includes advanced generation parameters for better output quality.
 
     Args:
         prompt (str): The prompt string to be processed by FLAN-T5.
@@ -56,8 +60,21 @@ def run_flan_prompt(prompt: str) -> str:
     """
     # Prepare the input for the FLAN-T5 model
    inputs = flan_tokenizer(prompt, return_tensors="pt").to(device)
-
-
+
+    # Generate the output with improved parameters:
+    # max_new_tokens: Limits the maximum length of the generated response.
+    # num_beams: Uses beam search for higher quality, less repetitive outputs.
+    # do_sample: Enables sampling, allowing for more diverse outputs.
+    # top_k, top_p: Control the sampling process, making it more focused and coherent.
+    outputs = flan_model.generate(
+        **inputs,
+        max_new_tokens=100,  # Limit output length to prevent rambling
+        num_beams=5,         # Use beam search for better quality
+        do_sample=True,      # Enable sampling for diversity
+        top_k=50,            # Sample from top 50 most probable tokens
+        top_p=0.95,          # Sample from tokens that cumulatively exceed 95% probability
+        temperature=0.7      # Controls randomness; lower means more deterministic
+    )
     # Decode the generated tokens back into a readable string
     return flan_tokenizer.decode(outputs[0], skip_special_tokens=True)
 
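Worth noting: in transformers, combining num_beams=5 with do_sample=True selects beam-search multinomial sampling rather than plain beam search, so temperature, top_k and top_p all shape what each beam draws. A hypothetical call to the patched helper (the instruction text is illustrative, not from this repo's prompts module):

    # Hypothetical usage of run_flan_prompt as patched above.
    response = run_flan_prompt("Rewrite this sentence in a formal tone: i cant come to the meeting")
    print(response)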
@@ -67,7 +84,7 @@ def run_translation(text: str, target_lang: str) -> str:
 
     Args:
         text (str): The input text to be translated.
-        target_lang (str): The target language code (e.g., "fr" for French).
+        target_lang (str): The target language code (e.g., "fr" for French, "es" for Spanish).
 
     Returns:
         str: The translated text.
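Only the docstring changes here; the translation model itself is outside this hunk. A minimal sketch of one common approach, assuming MarianMT opus-mt checkpoints keyed by the same two-letter codes (the model names are assumptions, not taken from this repo):

    from transformers import pipeline

    # Cache one translation pipeline per target language.
    _translators = {}

    def translate(text: str, target_lang: str) -> str:
        if target_lang not in _translators:
            # Checkpoint naming is an assumption (Helsinki-NLP opus-mt family).
            _translators[target_lang] = pipeline(
                "translation", model=f"Helsinki-NLP/opus-mt-en-{target_lang}"
            )
        return _translators[target_lang](text)[0]["translation_text"]

    print(translate("Good morning", "fr"))  # e.g. "Bonjour"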
@@ -87,7 +104,7 @@ def classify_tone(text: str) -> str:
         text (str): The input text for tone classification.
 
     Returns:
-        str: The detected emotional label (e.g., 'neutral', 'joy', 'sadness').
+        str: The detected emotional label (e.g., 'neutral', 'joy', 'sadness', 'anger', 'fear', 'disgust', 'surprise').
     """
     # The tone_classifier returns a list of dictionaries, where each dictionary
     # contains 'label' and 'score'. We extract the 'label' from the first (and only) result.
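The expanded label list matches common seven-class emotion models; the repo's actual checkpoint isn't visible in this hunk. A minimal sketch assuming j-hartmann/emotion-english-distilroberta-base, whose labels are exactly the seven named in the docstring:

    from transformers import pipeline

    # Checkpoint is an assumption; its labels match the docstring's list.
    tone_classifier = pipeline(
        "text-classification",
        model="j-hartmann/emotion-english-distilroberta-base",
    )

    def classify_tone(text: str) -> str:
        # The pipeline returns [{'label': ..., 'score': ...}]; keep the top label.
        return tone_classifier(text)[0]["label"]

    print(classify_tone("I can't believe you did that!"))  # e.g. 'surprise'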
app/routers/analyze.py
CHANGED
@@ -51,6 +51,9 @@ def analyze_text(payload: AnalyzeInput):
 
     # --- 1. Grammar Suggestions with Diffs ---
     # Get the grammatically corrected version of the original text.
+    # Note: The 'vennify/t5-base-grammar-correction' model's performance
+    # can vary. For more robust corrections, especially for subtle spelling
+    # and grammar errors, consider a larger or fine-tuned model if needed.
     corrected_grammar = models.run_grammar_correction(text)
 
     grammar_changes = []
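The word-level diffing that fills grammar_changes is outside this hunk; a minimal sketch of how such changes could be computed with Python's standard difflib (the dict shape is an assumption, not the repo's schema):

    import difflib

    def word_diff(original: str, corrected: str) -> list:
        """Collect word-level edits between the original and corrected text."""
        orig_words, corr_words = original.split(), corrected.split()
        matcher = difflib.SequenceMatcher(None, orig_words, corr_words)
        changes = []
        for op, i1, i2, j1, j2 in matcher.get_opcodes():
            if op != "equal":  # op is "replace", "insert", or "delete"
                changes.append({
                    "type": op,
                    "original": " ".join(orig_words[i1:i2]),
                    "suggestion": " ".join(corr_words[j1:j2]),
                })
        return changes

    print(word_diff("She go to school", "She goes to school"))
    # [{'type': 'replace', 'original': 'go', 'suggestion': 'goes'}]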
@@ -97,13 +100,12 @@ def analyze_text(payload: AnalyzeInput):
     tone_suggestion_text = ""
     # Provide a simple tone suggestion based on the detected tone.
     # This logic can be expanded for more sophisticated suggestions based on context or user goals.
-    if detected_tone in ["neutral", "joy"]:
-        #
-
-
-
-
-        tone_suggestion_text = models.run_flan_prompt(prompts.tone_prompt(text, "more uplifting"))
+    if detected_tone in ["neutral", "joy", "sadness", "anger", "fear", "disgust", "surprise"]:
+        # For simplicity, we'll try to make neutral/joy more formal, and other strong emotions more neutral/calm.
+        if detected_tone in ["neutral", "joy"]:
+            tone_suggestion_text = models.run_flan_prompt(prompts.tone_prompt(text, "formal"))
+        else:  # For emotions like anger, sadness, fear, etc., suggest a more neutral/calm tone
+            tone_suggestion_text = models.run_flan_prompt(prompts.tone_prompt(text, "neutral and calm"))
     else:
         # If no specific suggestion, indicate that the detected tone is generally fine.
         tone_suggestion_text = f"The detected tone '{detected_tone}' seems appropriate for general communication."
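prompts.tone_prompt is referenced but not changed in this commit; a plausible minimal sketch, assuming it simply templates a plain-language instruction for FLAN-T5:

    def tone_prompt(text: str, target_tone: str) -> str:
        # Assumed shape; FLAN-T5 handles direct natural-language instructions well.
        return f"Rewrite the following text in a {target_tone} tone: {text}"

With that assumption, the branch above asks for a "formal" rewrite when the tone is already positive or neutral, and a "neutral and calm" rewrite for strong negative emotions.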