Asanaly committed on
Commit
0717bdc
·
verified ·
1 Parent(s): 82d626e

Update summarizer.py

Browse files
Files changed (1) hide show
  1. summarizer.py +3 -8
summarizer.py CHANGED
@@ -4,16 +4,11 @@ from transformers import AutoTokenizer, AutoModelForSeq2SeqLM, BartTokenizer, Ba
4
  eng_tokenizer = BartTokenizer.from_pretrained("facebook/bart-large-cnn")
5
  eng_model = BartForConditionalGeneration.from_pretrained("facebook/bart-large-cnn")
6
 
7
- # Русская модель
8
- rus_tokenizer = AutoTokenizer.from_pretrained("cointegrated/rut5-base-extsum")
9
- rus_model = AutoModelForSeq2SeqLM.from_pretrained("cointegrated/rut5-base-extsum")
10
-
11
 
12
  def generate_summary(text: str, lang="en", max_length=200, min_length=50) -> str:
13
- """
14
- lang="en" — английский текст
15
- lang="ru" — русский текст
16
- """
17
  if lang == "ru":
18
  tokenizer = rus_tokenizer
19
  model = rus_model
 
4
  eng_tokenizer = BartTokenizer.from_pretrained("facebook/bart-large-cnn")
5
  eng_model = BartForConditionalGeneration.from_pretrained("facebook/bart-large-cnn")
6
 
7
+ # Русская модель (публичная)
8
+ rus_tokenizer = AutoTokenizer.from_pretrained("IlyaGusev/mbart_ru_sum_gazeta")
9
+ rus_model = AutoModelForSeq2SeqLM.from_pretrained("IlyaGusev/mbart_ru_sum_gazeta")
 
10
 
11
  def generate_summary(text: str, lang="en", max_length=200, min_length=50) -> str:
 
 
 
 
12
  if lang == "ru":
13
  tokenizer = rus_tokenizer
14
  model = rus_model