ImageDataExtractor3

Runtime error

WebashalarForML committed on Oct 7, 2024

Commit

5c3e86a

verified ·

1 Parent(s): 08f219c

Update utility/utils.py

Files changed (1) hide show

utility/utils.py CHANGED Viewed

@@ -173,7 +173,7 @@ def extract_text_from_images(image_paths):
 # Function to call the Gemma model and process the output as Json
 def Data_Extractor(data, client=client):
     text = f'''Act as a  Text extractor for the following text given in text: {data}
-    extract text in the following output JSON string:
     {{
     "Name": ["Identify and Extract All the person's name from the text."],
     "Designation": ["Extract All the designation or job title mentioned in the text."],
@@ -182,8 +182,9 @@ def Data_Extractor(data, client=client):
     "Address": ["Extract All the full postal address or location mentioned in the text."],
     "Email": ["Identify and Extract All valid email addresses mentioned in the text else 'Not found'."],
     "Link": ["Identify and Extract any website URLs or social media links present in the text."]
-    }}
-    Output:
     '''
     # Call the API for inference
     response = client.text_generation(text, max_new_tokens=1000, temperature=0.4, top_k=50, top_p=0.9, repetition_penalty=1.2)

 # Function to call the Gemma model and process the output as Json
 def Data_Extractor(data, client=client):
     text = f'''Act as a  Text extractor for the following text given in text: {data}
+    Extract text in the following output JSON string:
     {{
     "Name": ["Identify and Extract All the person's name from the text."],
     "Designation": ["Extract All the designation or job title mentioned in the text."],
     "Address": ["Extract All the full postal address or location mentioned in the text."],
     "Email": ["Identify and Extract All valid email addresses mentioned in the text else 'Not found'."],
     "Link": ["Identify and Extract any website URLs or social media links present in the text."]
+    }}
+    Output:
     '''
     # Call the API for inference
     response = client.text_generation(text, max_new_tokens=1000, temperature=0.4, top_k=50, top_p=0.9, repetition_penalty=1.2)