Spaces:
Paused
Paused
File size: 1,294 Bytes
845e414 |
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24 25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48 49 50 51 52 53 54 55 56 57 58 59 |
#!/usr/bin/python3
# -*- coding: utf-8 -*-
"""
https://huggingface.co/LTP
"""
import argparse
import os
from pyltp import Postagger, Segmentor, NamedEntityRecognizer
from project_settings import project_path
def get_args():
    """Parse the command-line options of the pyltp demo.

    Options:
        --text: sentence to analyse; defaults to a Chinese sample sentence.
        --ltp_data_dir: directory holding the LTP model files; defaults to
            ``data/pyltp_models/ltp_data_v3.4.0`` under ``project_path``.

    Returns:
        The ``argparse.Namespace`` produced by ``parse_args()``.
    """
    # Resolve the default model directory once, relative to the project root.
    default_model_dir = project_path / "data/pyltp_models/ltp_data_v3.4.0"

    cli = argparse.ArgumentParser()
    cli.add_argument("--text", type=str, default="元芳你怎么看?我就趴窗口上看呗!")
    cli.add_argument("--ltp_data_dir", type=str, default=default_model_dir.as_posix())
    return cli.parse_args()
def main():
    """Segment, POS-tag and NER-tag ``--text`` with pyltp and print the results.

    The model files ``cws.model``, ``pos.model`` and ``ner.model`` are looked
    up inside ``--ltp_data_dir``.  The word list, the POS tags and the NER
    tags are printed in that order.

    Every model that was successfully loaded is released before returning,
    including when a later model fails to load or an inference call raises.
    """
    # Function-scope import so the cleanup helper is in scope without
    # touching the file-level import block.
    from contextlib import ExitStack

    args = get_args()

    cws_model_path = os.path.join(args.ltp_data_dir, "cws.model")
    pos_model_path = os.path.join(args.ltp_data_dir, "pos.model")
    ner_model_path = os.path.join(args.ltp_data_dir, "ner.model")

    with ExitStack() as stack:
        # Register each release() right after the model is constructed so it
        # runs even if a subsequent step raises; callbacks run in LIFO order.
        segmentor = Segmentor(cws_model_path)
        stack.callback(segmentor.release)

        postagger = Postagger(pos_model_path)
        stack.callback(postagger.release)

        recognizer = NamedEntityRecognizer(ner_model_path)
        stack.callback(recognizer.release)

        # Pipeline: words -> POS tags -> NER tags (NER consumes both).
        words = segmentor.segment(args.text)
        postags = postagger.postag(words)
        ner_tags = recognizer.recognize(words, postags)

        print(words)
        print(postags)
        print(ner_tags)
# Run the demo only when executed as a script, not when imported.
if __name__ == "__main__":
    main()
|