Update app.py
Browse files
app.py
CHANGED
@@ -1,11 +1,19 @@
|
|
1 |
import gradio as gr
|
2 |
from transformers import pipeline
|
3 |
import re
|
|
|
4 |
|
5 |
# Load the OCR pipeline from Hugging Face
|
6 |
-
ocr_pipeline = pipeline("image-to-text", model="microsoft/trocr-
|
|
|
|
|
|
|
|
|
|
|
7 |
|
8 |
def perform_ocr(image):
|
|
|
|
|
9 |
text = ocr_pipeline(image)[0]['generated_text']
|
10 |
return text
|
11 |
|
@@ -45,4 +53,4 @@ def web_app():
|
|
45 |
interface.launch()
|
46 |
|
47 |
if __name__ == "__main__":
|
48 |
-
web_app()
|
|
|
1 |
import gradio as gr
|
2 |
from transformers import pipeline
|
3 |
import re
|
4 |
+
from PIL import ImageFilter
|
5 |
|
6 |
# Load the OCR pipeline from Hugging Face
|
7 |
+
ocr_pipeline = pipeline("image-to-text", model="microsoft/trocr-large-stage1") # Use a different model
|
8 |
+
|
9 |
+
def preprocess_image(image):
|
10 |
+
image = image.convert('L') # Convert to grayscale
|
11 |
+
image = image.filter(ImageFilter.SHARPEN) # Apply some filtering
|
12 |
+
return image
|
13 |
|
14 |
def perform_ocr(image):
|
15 |
+
# Preprocess the image before OCR
|
16 |
+
image = preprocess_image(image)
|
17 |
text = ocr_pipeline(image)[0]['generated_text']
|
18 |
return text
|
19 |
|
|
|
53 |
interface.launch()
|
54 |
|
55 |
if __name__ == "__main__":
|
56 |
+
web_app()
|