Spaces:
Sleeping
Sleeping
dunkindonuts123 committed on
Commit ·
537a1be
1
Parent(s): 4465cb6
updated models.py
Browse files
- engine/models.py +1 -7
engine/models.py
CHANGED
|
@@ -1,4 +1,4 @@
|
|
| 1 |
-
|
| 2 |
|
| 3 |
from __future__ import annotations
|
| 4 |
|
|
@@ -17,7 +17,6 @@ from engine.preprocessing import tokenize
|
|
| 17 |
|
| 18 |
|
| 19 |
class TFIDFModel:
|
| 20 |
-
"""Extractive summarizer using TF-IDF sentence scoring."""
|
| 21 |
|
| 22 |
def __init__(self) -> None:
|
| 23 |
self.idf: dict[str, float] = {}
|
|
@@ -56,7 +55,6 @@ class TFIDFModel:
|
|
| 56 |
|
| 57 |
|
| 58 |
class LexRankModel:
|
| 59 |
-
"""Graph-based extractive summarizer (LexRank)."""
|
| 60 |
|
| 61 |
THRESHOLD = 0.1
|
| 62 |
DAMPING = 0.85
|
|
@@ -134,8 +132,6 @@ class LexRankModel:
|
|
| 134 |
|
| 135 |
|
| 136 |
class SentenceTransformerModel:
|
| 137 |
-
"""Extractive summarizer using frozen sentence embeddings."""
|
| 138 |
-
|
| 139 |
def __init__(self, model_name: str = "all-MiniLM-L6-v2") -> None:
|
| 140 |
self.model = SentenceTransformer(model_name)
|
| 141 |
|
|
@@ -152,8 +148,6 @@ class SentenceTransformerModel:
|
|
| 152 |
|
| 153 |
|
| 154 |
class CodeT5Model:
|
| 155 |
-
"""Abstractive summarizer using CodeT5 fine-tuned on Java."""
|
| 156 |
-
|
| 157 |
MODEL_NAME = "Salesforce/codet5-base-codexglue-sum-java"
|
| 158 |
VOCAB_REPO = "Salesforce/codet5-base"
|
| 159 |
_SPECIAL_TOKENS = ("<pad>", "<s>", "</s>", "<unk>", "<mask>")
|
|
|
|
| 1 |
+
|
| 2 |
|
| 3 |
from __future__ import annotations
|
| 4 |
|
|
|
|
| 17 |
|
| 18 |
|
| 19 |
class TFIDFModel:
|
|
|
|
| 20 |
|
| 21 |
def __init__(self) -> None:
|
| 22 |
self.idf: dict[str, float] = {}
|
|
|
|
| 55 |
|
| 56 |
|
| 57 |
class LexRankModel:
|
|
|
|
| 58 |
|
| 59 |
THRESHOLD = 0.1
|
| 60 |
DAMPING = 0.85
|
|
|
|
| 132 |
|
| 133 |
|
| 134 |
class SentenceTransformerModel:
|
|
|
|
|
|
|
| 135 |
def __init__(self, model_name: str = "all-MiniLM-L6-v2") -> None:
|
| 136 |
self.model = SentenceTransformer(model_name)
|
| 137 |
|
|
|
|
| 148 |
|
| 149 |
|
| 150 |
class CodeT5Model:
|
|
|
|
|
|
|
| 151 |
MODEL_NAME = "Salesforce/codet5-base-codexglue-sum-java"
|
| 152 |
VOCAB_REPO = "Salesforce/codet5-base"
|
| 153 |
_SPECIAL_TOKENS = ("<pad>", "<s>", "</s>", "<unk>", "<mask>")
|