Update models/watermark_faster.py
Browse files
models/watermark_faster.py
CHANGED
|
@@ -21,6 +21,8 @@ import paddle
|
|
| 21 |
from jieba import posseg
|
| 22 |
paddle.enable_static()
|
| 23 |
import re
|
|
|
|
|
|
|
| 24 |
def cut_sent(para):
|
| 25 |
para = re.sub('([。!?\?])([^”’])', r'\1\n\2', para)
|
| 26 |
para = re.sub('([。!?\?][”’])([^,。!?\?\n ])', r'\1\n\2', para)
|
|
|
|
| 21 |
from jieba import posseg
|
| 22 |
paddle.enable_static()
|
| 23 |
import re
|
| 24 |
+
nltk.download('punkt')
|
| 25 |
+
nltk.download('stopwords')
|
| 26 |
def cut_sent(para):
|
| 27 |
para = re.sub('([。!?\?])([^”’])', r'\1\n\2', para)
|
| 28 |
para = re.sub('([。!?\?][”’])([^,。!?\?\n ])', r'\1\n\2', para)
|