T.Masuda committed on
Commit
adf06aa
·
1 Parent(s): 6f7ea15

similar-text

Browse files
Files changed (4) hide show
  1. .gitattributes +1 -0
  2. app.py +35 -0
  3. jwiki_w2v.kv +3 -0
  4. requirements.txt +2 -0
.gitattributes CHANGED
@@ -33,3 +33,4 @@ saved_model/**/* filter=lfs diff=lfs merge=lfs -text
33
  *.zip filter=lfs diff=lfs merge=lfs -text
34
  *.zst filter=lfs diff=lfs merge=lfs -text
35
  *tfevents* filter=lfs diff=lfs merge=lfs -text
 
 
33
  *.zip filter=lfs diff=lfs merge=lfs -text
34
  *.zst filter=lfs diff=lfs merge=lfs -text
35
  *tfevents* filter=lfs diff=lfs merge=lfs -text
36
+ jwiki_w2v.kv filter=lfs diff=lfs merge=lfs -text
app.py ADDED
@@ -0,0 +1,35 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ import gradio as gr
2
+ import gensim
3
+
4
_MODEL_PATH = 'jwiki_w2v.kv'
_model = None


def _get_model():
    """Return the word2vec vectors, loading them from disk on first use only."""
    global _model
    if _model is None:
        # The vectors file is large, so it is loaded once and kept for the
        # lifetime of the process instead of being re-read on every request.
        # KeyedVectors.load_word2vec_format is the documented loader.
        _model = gensim.models.KeyedVectors.load_word2vec_format(
            _MODEL_PATH, binary=True)
    return _model


def process_text(input_text):
    """Yield the words most similar to *input_text* together with their scores.

    This is a generator so it can be used directly as a Gradio event handler.
    It yields exactly one two-element list:

    * ``[None, None]`` when *input_text* is ``None`` or empty, or when the
      word is not present in the model's vocabulary;
    * otherwise ``[joined_words, scores]`` where ``joined_words`` is the
      similar words joined with ``','`` and ``scores`` maps each word to its
      similarity score.

    At most ``max_count`` (20) neighbours are returned.
    """
    if not input_text:
        yield [None, None]
        return

    max_count = 20
    try:
        # Ask for max_count neighbours explicitly; the library default is 10,
        # which would make the cap above unreachable.
        results = _get_model().most_similar(
            positive=[input_text], topn=max_count)
    except KeyError:
        # The word is not in the vocabulary: report "no result" the same way
        # as for empty input instead of surfacing a traceback.
        yield [None, None]
        return

    text = []
    label = {}
    for result in results:
        print(result)
        word, score = result
        text.append(word)
        label[word] = score
    yield [','.join(text), label]
22
+
23
# Widgets are created up front: one free-text input, then the two outputs
# that receive the values yielded by process_text (joined words, score map).
query_box = gr.Textbox(label='text')
result_widgets = [
    gr.Textbox(label='text'),
    gr.Label(label='scores'),
]

# Single-function Gradio interface around process_text, with flagging disabled.
app = gr.Interface(
    fn=process_text,
    inputs=query_box,
    outputs=result_widgets,
    title='similar-text',
    description='similar-text',
    allow_flagging='never',
)

# Turn on the request queue with concurrency_count=5, then start serving.
app.queue(concurrency_count=5)
app.launch()
jwiki_w2v.kv ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a6147a4b9e96346f3829d0384965a26f3108581eadabc8f598c51a545fcd638a
3
+ size 401236292
requirements.txt ADDED
@@ -0,0 +1,2 @@
 
 
 
1
+ gradio
2
+ gensim