Spaces:
Runtime error
Runtime error
Update utility/utils.py
Browse files
- utility/utils.py +4 -5
utility/utils.py
CHANGED
|
@@ -186,8 +186,7 @@ def extract_text_from_images(image_paths):
|
|
| 186 |
# Function to call the Gemma model and process the output as Json
|
| 187 |
def Data_Extractor(data, client=client):
|
| 188 |
text = f'''<s>[INST] Act as a Text extractor for the following text given in text: {data}.
|
| 189 |
-
Your task is to extract specific information and return it in a JSON format as outlined below:
|
| 190 |
-
|
| 191 |
Please extract the following details:
|
| 192 |
{{
|
| 193 |
"Name": ["Identify and extract all the person's names from the text."],
|
|
@@ -197,12 +196,12 @@ def Data_Extractor(data, client=client):
|
|
| 197 |
"Address": ["Extract all full postal addresses or locations mentioned in the text."],
|
| 198 |
"Email": ["Identify and extract all valid email addresses mentioned in the text; if none are found, return 'Not found'."],
|
| 199 |
"Link": ["Identify and extract any website URLs or social media links present in the text."]
|
| 200 |
-
}}
|
| 201 |
-
|
| 202 |
Output:
|
| 203 |
[/INST]</s> [INST]
|
| 204 |
Return the extracted information in JSON format as follows:
|
| 205 |
-
[/INST]
|
|
|
|
| 206 |
|
| 207 |
# Call the API for inference
|
| 208 |
response = client.text_generation(text, max_new_tokens=1000)#, temperature=0.4, top_k=50, top_p=0.9, repetition_penalty=1.2)
|
|
|
|
| 186 |
# Function to call the Gemma model and process the output as Json
|
| 187 |
def Data_Extractor(data, client=client):
|
| 188 |
text = f'''<s>[INST] Act as a Text extractor for the following text given in text: {data}.
|
| 189 |
+
Your task is to extract specific information and return it in a JSON format as outlined below:
|
|
|
|
| 190 |
Please extract the following details:
|
| 191 |
{{
|
| 192 |
"Name": ["Identify and extract all the person's names from the text."],
|
|
|
|
| 196 |
"Address": ["Extract all full postal addresses or locations mentioned in the text."],
|
| 197 |
"Email": ["Identify and extract all valid email addresses mentioned in the text; if none are found, return 'Not found'."],
|
| 198 |
"Link": ["Identify and extract any website URLs or social media links present in the text."]
|
| 199 |
+
}}
|
|
|
|
| 200 |
Output:
|
| 201 |
[/INST]</s> [INST]
|
| 202 |
Return the extracted information in JSON format as follows:
|
| 203 |
+
[/INST]
|
| 204 |
+
'''
|
| 205 |
|
| 206 |
# Call the API for inference
|
| 207 |
response = client.text_generation(text, max_new_tokens=1000)#, temperature=0.4, top_k=50, top_p=0.9, repetition_penalty=1.2)
|