Spaces: Paused
Commit
·
722e882
1
Parent(s):
2e9d967
updated
Browse files
- backend/services/resume_parser.py +12 -6
- requirements.txt +1 -0
backend/services/resume_parser.py
CHANGED
|
@@ -6,7 +6,6 @@ import zipfile
|
|
| 6 |
import json
|
| 7 |
import torch
|
| 8 |
from typing import List
|
| 9 |
-
from transformers import AutoModelForCausalLM, AutoTokenizer
|
| 10 |
|
| 11 |
os.environ["OMP_NUM_THREADS"] = "1"
|
| 12 |
os.environ["OPENBLAS_NUM_THREADS"] = "1"
|
|
@@ -14,18 +13,25 @@ os.environ["MKL_NUM_THREADS"] = "1"
|
|
| 14 |
os.environ["NUMEXPR_NUM_THREADS"] = "1"
|
| 15 |
os.environ["VECLIB_MAXIMUM_THREADS"] = "1"
|
| 16 |
|
| 17 |
-
|
|
|
|
| 18 |
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 19 |
|
| 20 |
-
|
| 21 |
-
tokenizer = AutoTokenizer.from_pretrained(MODEL_ID)
|
| 22 |
model = AutoModelForCausalLM.from_pretrained(
|
| 23 |
-
|
| 24 |
-
|
| 25 |
device_map="auto"
|
| 26 |
)
|
| 27 |
|
| 28 |
|
|
|
|
| 29 |
# ===============================
|
| 30 |
# Text Extraction (PDF/DOCX)
|
| 31 |
# ===============================
|
|
|
|
| 6 |
import json
|
| 7 |
import torch
|
| 8 |
from typing import List
|
|
|
|
| 9 |
|
| 10 |
os.environ["OMP_NUM_THREADS"] = "1"
|
| 11 |
os.environ["OPENBLAS_NUM_THREADS"] = "1"
|
|
|
|
| 13 |
os.environ["NUMEXPR_NUM_THREADS"] = "1"
|
| 14 |
os.environ["VECLIB_MAXIMUM_THREADS"] = "1"
|
| 15 |
|
| 16 |
+
from transformers import AutoModelForCausalLM, AutoTokenizer, BitsAndBytesConfig
|
| 17 |
+
import torch
|
| 18 |
|
| 19 |
+
bnb_config = BitsAndBytesConfig(
|
| 20 |
+
load_in_4bit=True,
|
| 21 |
+
bnb_4bit_compute_dtype=torch.float16,
|
| 22 |
+
bnb_4bit_use_double_quant=True,
|
| 23 |
+
bnb_4bit_quant_type="nf4"
|
| 24 |
+
)
|
| 25 |
|
| 26 |
+
tokenizer = AutoTokenizer.from_pretrained("tiiuae/falcon-7b-instruct")
|
|
|
|
| 27 |
model = AutoModelForCausalLM.from_pretrained(
|
| 28 |
+
"tiiuae/falcon-7b-instruct",
|
| 29 |
+
quantization_config=bnb_config,
|
| 30 |
device_map="auto"
|
| 31 |
)
|
| 32 |
|
| 33 |
|
| 34 |
+
|
| 35 |
# ===============================
|
| 36 |
# Text Extraction (PDF/DOCX)
|
| 37 |
# ===============================
|
requirements.txt
CHANGED
|
@@ -61,4 +61,5 @@ requests>=2.31.0
|
|
| 61 |
# Spaces. The version is pinned for reproducibility and compatibility.
|
| 62 |
psycopg2-binary
|
| 63 |
matplotlib
|
|
|
|
| 64 |
|
|
|
|
| 61 |
# Spaces. The version is pinned for reproducibility and compatibility.
|
| 62 |
psycopg2-binary
|
| 63 |
matplotlib
|
| 64 |
+
bitsandbytes>=0.41.0
|
| 65 |
|