Spaces:
Runtime error
Runtime error
PRASHANTH REDDY
committed on
Commit
·
0259ef3
1
Parent(s):
715cf18
Changes
Browse files- Resume_Screening.joblib +3 -0
- Word_Vec_Resume.joblib +3 -0
- app.py +41 -3
- requirements.txt +5 -0
Resume_Screening.joblib
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:708b72cc94a0f506e7caccabf87d57e389f002518539ee5d47815d8d9b9767b3
|
| 3 |
+
size 27504290
|
Word_Vec_Resume.joblib
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:ac33f24793786403e4bce07b891d5bf48b5eb61b6e1c9ef08f2f18e9d23617a7
|
| 3 |
+
size 135853
|
app.py
CHANGED
|
@@ -1,7 +1,45 @@
|
|
| 1 |
import gradio as gr
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 2 |
|
| 3 |
-
def greet(name):
    """Build the greeting shown for *name* (``"Hello <name>!!"``)."""
    greeting = "Hello " + name
    greeting = greeting + "!!"
    return greeting
|
| 5 |
|
| 6 |
-
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 7 |
iface.launch()
|
|
|
|
| 1 |
import gradio as gr
|
| 2 |
+
import fitz
|
| 3 |
+
import os
|
| 4 |
+
import re
|
| 5 |
+
from joblib import load
|
| 6 |
+
from sklearn.feature_extraction.text import TfidfVectorizer
|
| 7 |
|
|
|
|
|
|
|
| 8 |
|
| 9 |
+
def extract_text_from_pdf(file_path):
    """Return the concatenated plain text of every page in a PDF.

    Args:
        file_path: Path to the PDF (``str`` or ``os.PathLike``), or a
            file-like wrapper that exposes its on-disk path through a
            ``name`` attribute (some upload widgets pass temp-file
            objects rather than paths -- TODO confirm for the Gradio
            version in use).

    Returns:
        str: Text of all pages joined in document order; ``""`` when the
        document has no pages.
    """
    # Unwrap temp-file style objects, but leave real paths untouched
    # (pathlib.Path also has a ``.name``, which is only the last component).
    if not isinstance(file_path, (str, os.PathLike)):
        file_path = getattr(file_path, "name", file_path)

    # The context manager closes the document even if extraction raises,
    # so the underlying file handle is not leaked per request.
    with fitz.open(file_path) as doc:
        return "".join(page.get_text() for page in doc)
|
| 15 |
+
|
| 16 |
+
def preprocess_text(text):
    """Normalize raw resume text before it is vectorized.

    Steps, in order: strip URLs, strip the literal tokens ``RT``/``cc``,
    strip ``#hashtags`` and ``@mentions``, replace ASCII punctuation and
    non-ASCII characters with spaces, then collapse whitespace runs into a
    single space. Leading/trailing spaces are NOT trimmed.

    Args:
        text: Raw text (e.g. extracted from a PDF).

    Returns:
        str: The cleaned text.
    """
    # URLs: the previous pattern 'https\+S\s*' matched a literal "+S" and so
    # never removed anything; 'http\S+' covers both http and https links.
    cleaned = re.sub(r'http\S+\s*', '', text)
    # NOTE(review): this also removes "cc"/"RT" inside longer words; kept
    # as-is because the fitted vectorizer presumably saw the same cleaning.
    cleaned = re.sub(r'RT|cc', '', cleaned)
    cleaned = re.sub(r'#\S+', '', cleaned)
    # Mentions: previously '@\+S', which likewise only matched a literal "@+S".
    cleaned = re.sub(r'@\S+', '', cleaned)
    # Raw string keeps the backslash in the punctuation set without relying
    # on an invalid "\]" escape sequence.
    cleaned = re.sub(
        '[%s]' % re.escape(r"""!"#$%&'()*+,-./:;<=>?@[\]^_`{|}~"""),
        ' ',
        cleaned,
    )
    cleaned = re.sub(r'[^\x00-\x7f]', ' ', cleaned)
    return re.sub(r'\s+', ' ', cleaned)
|
| 25 |
+
|
| 26 |
+
# Classifier cached after the first load so it is not re-read from disk
# on every call.
_cached_model = None


def load_model():
    """Return the classifier stored in ``Resume_Screening.joblib``.

    The file is deserialized on the first call only; later calls return the
    same in-memory object.

    Returns:
        The object stored in the joblib file (presumably a fitted
        scikit-learn estimator -- it is used via ``.predict``).
    """
    global _cached_model
    if _cached_model is None:
        _cached_model = load('Resume_Screening.joblib')
    return _cached_model


# Fitted text vectorizer, loaded once at import time and shared by requests.
vectorizer = load('Word_Vec_Resume.joblib')
|
| 31 |
+
def predict(file_path):
    """Classify an uploaded resume PDF.

    Args:
        file_path: The uploaded PDF as supplied by the "file" input, or
            ``None`` when the form is submitted without an upload.

    Returns:
        str: The model's prediction for the document rendered as text, or
        a short prompt when no file was supplied.
    """
    # Submitting the form with no upload yields None; answer with a prompt
    # instead of failing inside the PDF reader.
    if file_path is None:
        return "Please upload a PDF resume."

    text = preprocess_text(extract_text_from_pdf(file_path))
    features = vectorizer.transform([text])
    prediction = load_model().predict(features)
    # A single document was passed, so take the first prediction; str()
    # gives the "text" output a plain string whatever the label type is.
    return str(prediction[0])
|
| 38 |
+
|
| 39 |
+
# Web UI: one file upload in, the text returned by predict() out.
iface = gr.Interface(fn=predict, inputs="file", outputs="text")
iface.launch()
|
requirements.txt
ADDED
|
@@ -0,0 +1,5 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
joblib
|
| 2 |
+
gradio
|
| 3 |
+
PyMuPDF
|
| 4 |
+
# re is part of the Python standard library; no pip requirement is needed
|
| 5 |
+
scikit-learn
|