Skip to content

Commit aaa733b

Browse files
committed
ocr with gemini over
1 parent e67f894 commit aaa733b

File tree

2 files changed

+12
-40
lines changed

2 files changed

+12
-40
lines changed

.gitignore

+1
Original file line number | Diff line number | Diff line change
@@ -1,2 +1,3 @@
11
__pycache__/
22
django
3+
.env

backend/ehr/ocr.py

+11-40
Original file line number | Diff line number | Diff line change
@@ -1,51 +1,22 @@
1-
# import pytesseract
2-
# from PIL import Image
3-
# import io
4-
5-
# def ocr_from_image(img):
6-
# img = Image.open(io.BytesIO(img))
7-
# text = pytesseract.image_to_string(img)
8-
# return text
9-
10-
# -*- coding: utf-8 -*-
11-
"""unisnipp_gemini.py
12-
13-
Automatically generated by Colaboratory.
14-
15-
Original file is located at
16-
https://colab.research.google.com/drive/1JqguW6zZXGR67GygUfDqXGR9d-gLowuV
17-
"""
18-
19-
import pathlib
1+
from dotenv import dotenv_values
202
import textwrap
21-
3+
from PIL import Image
4+
import io
225
import google.generativeai as genai
23-
24-
from IPython.display import display
25-
from IPython.display import Markdown
26-
from google.colab import userdata
27-
6+
from IPython.display import Markdown
287

298
def to_markdown(text):
309
text = text.replace('•', ' *')
3110
return Markdown(textwrap.indent(text, '> ', predicate=lambda _: True))
3211

3312

34-
GOOGLE_API_KEY=userdata.get('GOOGLE_API_KEY')
13+
GOOGLE_API_KEY=dotenv_values('.env')['GOOGLE_API_KEY']
3514
genai.configure(api_key=GOOGLE_API_KEY)
3615

37-
import PIL.Image
38-
39-
img = PIL.Image.open('jk.jpg')
40-
img
41-
42-
model = genai.GenerativeModel('gemini-pro-vision')
43-
44-
response = model.generate_content(["extract the text in proper way from this image", img], stream=True)
45-
response.resolve()
46-
to_markdown(response.text)
47-
48-
response1 = model.generate_content(["Understand what the extracted text is completely and format it in key-value pair with proper indentation", img], stream=True)
49-
response1.resolve()
16+
def ocr_to_text(img):
17+
img = Image.open(io.BytesIO(img))
18+
model = genai.GenerativeModel('gemini-pro-vision')
5019

51-
print(response1.text)
20+
response = model.generate_content(["extract the text in proper way from this image", img], stream=True)
21+
response.resolve()
22+
return response.text

0 commit comments

Comments
 (0)