Update README.md
Browse files
README.md
CHANGED
|
@@ -57,15 +57,14 @@ cleaned_resume_skills = clean_text(" ".join(resume_skills) if isinstance(resume_
|
|
| 57 |
|
| 58 |
def clean_text(text):
|
| 59 |
if isinstance(text, list):
|
| 60 |
-
text = " ".join(text)
|
| 61 |
elif text is None:
|
| 62 |
-
text = ""
|
| 63 |
-
|
| 64 |
-
text =
|
| 65 |
-
text = text.lower() # Convert to lowercase
|
| 66 |
return text
|
| 67 |
|
| 68 |
-
cleaned_resume_skills = clean_text(resume_skills)
|
| 69 |
|
| 70 |
vectorizer = CountVectorizer(stop_words='english')
|
| 71 |
job_desc_matrix = vectorizer.fit_transform(df['cleaned_job_info'])
|
|
|
|
| 57 |
|
| 58 |
def clean_text(text):
|
| 59 |
if isinstance(text, list):
|
| 60 |
+
text = " ".join(text)
|
| 61 |
elif text is None:
|
| 62 |
+
text = ""
|
| 63 |
+
text = re.sub(r'[^\w\s]', '', str(text))
|
| 64 |
+
text = text.lower()
|
|
|
|
| 65 |
return text
|
| 66 |
|
| 67 |
+
cleaned_resume_skills = clean_text(resume_skills)
|
| 68 |
|
| 69 |
vectorizer = CountVectorizer(stop_words='english')
|
| 70 |
job_desc_matrix = vectorizer.fit_transform(df['cleaned_job_info'])
|