t5-paraphrase-generation

Sleeping

App Files Community

vikigitonga11 committed on Mar 18

Commit

ddc7bfd

verified ·

1 Parent(s): 3f7d7a9

Update app.py

Browse files

Files changed (1) hide show

app.py +8 -15

app.py CHANGED Viewed

@@ -3,20 +3,21 @@ import re
 import torch
 from transformers import AutoTokenizer, AutoModelForSeq2SeqLM, pipeline
-# Load T5 paraphrase model
 model_name = "Vamsi/T5_Paraphrase_Paws"
 tokenizer = AutoTokenizer.from_pretrained(model_name)
 model = AutoModelForSeq2SeqLM.from_pretrained(model_name, torch_dtype=torch.float16)  # Use fp16 for speed
-# Move model to CPU
 model.to("cpu")
-# Initialize paraphrase pipeline
 paraphrase_pipeline = pipeline(
     "text2text-generation",
     model=model,
     tokenizer=tokenizer,
     truncation=True
 )
 def split_sentences(text):
@@ -30,20 +31,12 @@ def paraphrase_text(text):
     sentences = split_sentences(text)
-    # Apply T5 paraphrasing with controlled creativity
     paraphrased_results = paraphrase_pipeline(
         [f"paraphrase: {sentence} </s>" for sentence in sentences if sentence],
-        max_length=80,
-        do_sample=True,
-        temperature=0.7,  # More controlled creativity
-        top_p=0.85,  # Reduce randomness
-        top_k=50,
-        repetition_penalty=1.2,  # Avoid excessive repetition
-        num_return_sequences=1,  # Only one paraphrase per sentence
-        batch_size=8
     )
-    # Extract and join paraphrased sentences
     paraphrased_sentences = [result['generated_text'] for result in paraphrased_results]
     return " ".join(paraphrased_sentences)
@@ -52,8 +45,8 @@ demo = gr.Interface(
     fn=paraphrase_text,
     inputs=gr.Textbox(label="Enter text", placeholder="Type your text to paraphrase...", lines=10),
     outputs=gr.Textbox(label="Paraphrased Text", lines=10),
-    title="🎨 Controlled T5 Paraphraser",
-    description="Enter text and get a well-structured paraphrased version without randomness!",
     theme="huggingface"
 )

 import torch
 from transformers import AutoTokenizer, AutoModelForSeq2SeqLM, pipeline
+# Load T5 paraphrase model (faster than PEGASUS)
 model_name = "Vamsi/T5_Paraphrase_Paws"
 tokenizer = AutoTokenizer.from_pretrained(model_name)
 model = AutoModelForSeq2SeqLM.from_pretrained(model_name, torch_dtype=torch.float16)  # Use fp16 for speed
+# Move model to CPU (remove if using GPU)
 model.to("cpu")
+# Initialize paraphrase pipeline with optimized settings
 paraphrase_pipeline = pipeline(
     "text2text-generation",
     model=model,
     tokenizer=tokenizer,
     truncation=True
+    temperature=0.5,
 )
 def split_sentences(text):
     sentences = split_sentences(text)
+    # Apply T5 paraphrasing to each sentence
     paraphrased_results = paraphrase_pipeline(
         [f"paraphrase: {sentence} </s>" for sentence in sentences if sentence],
+        max_length=50, do_sample=True, batch_size=8, num_return_sequences=1  # Faster settings
     )
     paraphrased_sentences = [result['generated_text'] for result in paraphrased_results]
     return " ".join(paraphrased_sentences)
     fn=paraphrase_text,
     inputs=gr.Textbox(label="Enter text", placeholder="Type your text to paraphrase...", lines=10),
     outputs=gr.Textbox(label="Paraphrased Text", lines=10),
+    title="🚀 Fast & Clean T5 Paraphraser",
+    description="Enter text and let AI generate a paraphrased version using an optimized T5 model!",
     theme="huggingface"
 )