Scaper_search / summarizer.py
gaur3009's picture
Update summarizer.py
32855ec verified
raw
history blame
438 Bytes
from transformers import pipeline
# Build the summarization pipeline once at import time so every call to
# summarize_text() reuses the same loaded model.
summarizer = pipeline(
    task="summarization",
    model="facebook/bart-large-cnn",
)
def summarize_text(text, max_length=100):
    """Summarize long text into a shorter summary.

    Args:
        text: The text to summarize. Only the first 1500 characters are
            passed to the model.
        max_length: Upper bound on the generated summary length, forwarded
            to the summarization pipeline.

    Returns:
        The ``summary_text`` string of the first pipeline result, or an
        empty string when ``text`` is ``None``, empty, or whitespace-only.
    """
    # Nothing to summarize: skip the model call entirely.
    if not text or not text.strip():
        return ""

    # BART supports about 1024 tokens, so cap the input at ~1500 characters.
    truncated = text[:1500]

    # The default floor is 30, but it must never exceed the requested
    # maximum when a caller asks for a very short summary.
    min_length = min(30, max_length)

    results = summarizer(
        truncated,
        max_length=max_length,
        min_length=min_length,
        do_sample=False,
        # The character cap is only a heuristic; let the tokenizer enforce
        # the model's real token limit for token-dense input.
        truncation=True,
    )
    return results[0]["summary_text"]