PRASHANTH REDDY committed on
Commit
0259ef3
·
1 Parent(s): 715cf18
Files changed (4) hide show
  1. Resume_Screening.joblib +3 -0
  2. Word_Vec_Resume.joblib +3 -0
  3. app.py +41 -3
  4. reuirements.txt +5 -0
Resume_Screening.joblib ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:708b72cc94a0f506e7caccabf87d57e389f002518539ee5d47815d8d9b9767b3
3
+ size 27504290
Word_Vec_Resume.joblib ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ac33f24793786403e4bce07b891d5bf48b5eb61b6e1c9ef08f2f18e9d23617a7
3
+ size 135853
app.py CHANGED
@@ -1,7 +1,45 @@
1
  import gradio as gr
 
 
 
 
 
2
 
3
- def greet(name):
4
- return "Hello " + name + "!!"
5
 
6
- iface = gr.Interface(fn=greet, inputs="text", outputs="text")
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
7
  iface.launch()
 
1
  import gradio as gr
2
+ import fitz
3
+ import os
4
+ import re
5
+ from joblib import load
6
+ from sklearn.feature_extraction.text import TfidfVectorizer
7
 
 
 
8
 
9
def extract_text_from_pdf(file_path):
    """Return the concatenated text of every page of a PDF.

    Args:
        file_path: Location of the PDF; passed unchanged to ``fitz.open``.

    Returns:
        One string holding each page's ``get_text()`` output in page order
        (an empty string when the document has no pages).
    """
    # The context manager closes the document even when extraction raises;
    # previously the handle was left open after every call.
    with fitz.open(file_path) as doc:
        # join() builds the result in one pass instead of repeated `+=`.
        return "".join(page.get_text() for page in doc)
15
+
16
def preprocess_text(text):
    """Clean raw resume text before it is vectorized.

    Steps, in order:
      1. drop URLs (``http...``/``https...``) together with trailing whitespace,
      2. drop the literal tokens ``RT`` and ``cc``,
      3. drop ``#hashtags``,
      4. drop ``@mentions``,
      5. replace ASCII punctuation with a space,
      6. replace non-ASCII characters with a space,
      7. collapse every whitespace run into a single space.

    Leading/trailing single spaces are NOT stripped.

    Args:
        text: Raw text to clean.

    Returns:
        The cleaned string.
    """
    # Fixed: the pattern used to be 'https\+S\s*', which only matched the
    # literal text "https+S" and therefore never removed any URL.
    cleaned = re.sub(r'http\S+\s*', '', text)
    # NOTE(review): this also strips "cc" inside ordinary words
    # ("success" -> "suess"). Kept as-is because it presumably mirrors the
    # cleaning used when the vectorizer was fitted - confirm before changing.
    cleaned = re.sub(r'RT|cc', '', cleaned)
    cleaned = re.sub(r'#\S+', '', cleaned)
    # Fixed: the pattern used to be '@\+S', which only matched the literal
    # text "@+S" and therefore never removed any mention.
    cleaned = re.sub(r'@\S+', '', cleaned)
    # Raw string keeps the same characters while avoiding the invalid '\]'
    # escape sequence of the non-raw literal.
    cleaned = re.sub(
        '[%s]' % re.escape(r"""!"#$%&'()*+,-./:;<=>?@[\]^_`{|}~"""),
        ' ',
        cleaned,
    )
    cleaned = re.sub(r'[^\x00-\x7f]', r' ', cleaned)
    cleaned = re.sub(r'\s+', ' ', cleaned)
    return cleaned
25
+
26
# Holds the deserialized model after the first load_model() call.
_MODEL = None


def load_model():
    """Return the model stored in ``Resume_Screening.joblib``.

    The file is deserialized on the first call only; later calls return the
    same in-memory object, so callers that invoke this once per request no
    longer re-read the file from disk each time.

    Returns:
        The object produced by ``joblib.load('Resume_Screening.joblib')``.
    """
    global _MODEL
    if _MODEL is None:
        _MODEL = load('Resume_Screening.joblib')
    return _MODEL
29
+
30
# Loaded once at import time and reused by every predict() call.
# Presumably a fitted TfidfVectorizer (that class is imported above) - confirm.
vectorizer = load('Word_Vec_Resume.joblib')


def predict(file_path):
    """Run the full pipeline on one uploaded PDF and return its prediction.

    Args:
        file_path: The uploaded file reference, handed to
            ``extract_text_from_pdf``.

    Returns:
        The first element of the model's ``predict`` output for the document.
    """
    cleaned = preprocess_text(extract_text_from_pdf(file_path))
    # transform() is given a one-element list: a batch of one document.
    features = vectorizer.transform([cleaned])
    predictions = load_model().predict(features)
    return predictions[0]
38
+
39
# Gradio UI: one file input routed through predict(), result shown as text.
iface = gr.Interface(fn=predict, inputs="file", outputs="text")

iface.launch()
reuirements.txt ADDED
@@ -0,0 +1,5 @@
 
 
 
 
 
 
1
+ joblib
2
+ gradio
3
+ os
4
+ re
5
+ scikit-learn