dunkindonuts123 committed on
Commit
537a1be
·
1 Parent(s): 4465cb6

updated models.py

Browse files
Files changed (1) hide show
  1. engine/models.py +1 -7
engine/models.py CHANGED
@@ -1,4 +1,4 @@
1
- """Summarization models — ported from readme_summarization_experiment.ipynb."""
2
 
3
  from __future__ import annotations
4
 
@@ -17,7 +17,6 @@ from engine.preprocessing import tokenize
17
 
18
 
19
  class TFIDFModel:
20
- """Extractive summarizer using TF-IDF sentence scoring."""
21
 
22
  def __init__(self) -> None:
23
  self.idf: dict[str, float] = {}
@@ -56,7 +55,6 @@ class TFIDFModel:
56
 
57
 
58
  class LexRankModel:
59
- """Graph-based extractive summarizer (LexRank)."""
60
 
61
  THRESHOLD = 0.1
62
  DAMPING = 0.85
@@ -134,8 +132,6 @@ class LexRankModel:
134
 
135
 
136
  class SentenceTransformerModel:
137
- """Extractive summarizer using frozen sentence embeddings."""
138
-
139
  def __init__(self, model_name: str = "all-MiniLM-L6-v2") -> None:
140
  self.model = SentenceTransformer(model_name)
141
 
@@ -152,8 +148,6 @@ class SentenceTransformerModel:
152
 
153
 
154
  class CodeT5Model:
155
- """Abstractive summarizer using CodeT5 fine-tuned on Java."""
156
-
157
  MODEL_NAME = "Salesforce/codet5-base-codexglue-sum-java"
158
  VOCAB_REPO = "Salesforce/codet5-base"
159
  _SPECIAL_TOKENS = ("<pad>", "<s>", "</s>", "<unk>", "<mask>")
 
1
+
2
 
3
  from __future__ import annotations
4
 
 
17
 
18
 
19
  class TFIDFModel:
 
20
 
21
  def __init__(self) -> None:
22
  self.idf: dict[str, float] = {}
 
55
 
56
 
57
  class LexRankModel:
 
58
 
59
  THRESHOLD = 0.1
60
  DAMPING = 0.85
 
132
 
133
 
134
  class SentenceTransformerModel:
 
 
135
  def __init__(self, model_name: str = "all-MiniLM-L6-v2") -> None:
136
  self.model = SentenceTransformer(model_name)
137
 
 
148
 
149
 
150
  class CodeT5Model:
 
 
151
  MODEL_NAME = "Salesforce/codet5-base-codexglue-sum-java"
152
  VOCAB_REPO = "Salesforce/codet5-base"
153
  _SPECIAL_TOKENS = ("<pad>", "<s>", "</s>", "<unk>", "<mask>")