raptorkwok committed on
Commit
f91e01a
·
1 Parent(s): f7c53ae

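Fix logic bug: segment with pycantonese instead of jieba, and pass the pre-segmented ref/hyp to single_meteor_score instead of re-tokenizing them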

Browse files
Files changed (1) hide show
  1. chinesemeteor.py +6 -4
chinesemeteor.py CHANGED
@@ -149,8 +149,8 @@ class ChineseMETEOR(evaluate.Metric):
149
  sys.stdout = open(os.devnull, 'w')
150
 
151
  try:
152
- pred_seg = [" ".join(jieba.cut(p.strip())) for p in predictions]
153
- ref_seg = [" ".join(jieba.cut(r.strip())) for r in references]
154
 
155
  # --- Apply Real Chinese WordNet into METEOR algorithm ---
156
  def _cwn_synsets(self, word, pos=None): # Matches NLTK method call
@@ -216,9 +216,11 @@ class ChineseMETEOR(evaluate.Metric):
216
  scores = [
217
  meteor_score.single_meteor_score(
218
  #word_tokenize(ref),
219
- self._tokenize_chinese(ref),
220
  #word_tokenize(hyp),
221
- self._tokenize_chinese(hyp),
 
 
222
  wordnet=chinese_wn
223
  )
224
  for ref, hyp in zip(ref_seg, pred_seg)
 
149
  sys.stdout = open(os.devnull, 'w')
150
 
151
  try:
152
+ pred_seg = [" ".join(pycantonese.segment(p.strip())) for p in predictions]
153
+ ref_seg = [" ".join(pycantonese.segment(r.strip())) for r in references]
154
 
155
  # --- Apply Real Chinese WordNet into METEOR algorithm ---
156
  def _cwn_synsets(self, word, pos=None): # Matches NLTK method call
 
216
  scores = [
217
  meteor_score.single_meteor_score(
218
  #word_tokenize(ref),
219
+ #self._tokenize_chinese(ref),
220
  #word_tokenize(hyp),
221
+ #self._tokenize_chinese(hyp),
222
+ ref,
223
+ hyp,
224
  wordnet=chinese_wn
225
  )
226
  for ref, hyp in zip(ref_seg, pred_seg)