Spaces:
Running
Running
Commit
·
dad8a09
1
Parent(s):
180b13e
Create summarizer.py
Browse files- summarizer.py +14 -0
summarizer.py
ADDED
|
@@ -0,0 +1,14 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
# Import necessary libraries
|
| 2 |
+
from transformers import pipeline
|
| 3 |
+
|
| 4 |
+
class ContentSummarizer:
    """Produce a short summary for every row of a table of pages.

    ``data`` is iterated with ``iterrows()`` and each row is indexed by the
    keys ``'url'`` and ``'content'`` (i.e. it is expected to behave like a
    pandas DataFrame with those two columns).
    """

    def __init__(self, data):
        """Store *data* and build the summarization pipeline.

        Args:
            data: Table whose rows expose ``'url'`` and ``'content'``.
        """
        self.data = data
        # Built once here so the model is not reloaded for every row.
        self.summarizer = pipeline('summarization')

    def summarize(self, *, max_length=150, min_length=30):
        """Summarize the ``'content'`` of each row.

        Args:
            max_length: Upper bound passed to the summarizer for the
                generated summary length.
            min_length: Lower bound passed to the summarizer for the
                generated summary length.

        Returns:
            A list with one ``{'url': ..., 'summary': ...}`` dict per row, in
            row order. Rows whose content is missing, not a string, or blank
            get an empty-string summary instead of being sent to the model.
        """
        summaries = []
        for _, row in self.data.iterrows():
            content = row['content']

            # Missing cells arrive as None/NaN; the pipeline only accepts
            # text, so skip the model call rather than crash the whole run.
            if not isinstance(content, str) or not content.strip():
                summaries.append({'url': row['url'], 'summary': ''})
                continue

            result = self.summarizer(
                content,
                max_length=max_length,
                min_length=min_length,
                do_sample=False,
                # Without truncation, content longer than the model's input
                # limit makes the pipeline fail.
                truncation=True,
            )
            summaries.append(
                {'url': row['url'], 'summary': result[0]['summary_text']}
            )
        return summaries
|