This repository has been archived on 2023-03-25. You can view files and clone it, but cannot push or open issues or pull requests.
mightyscape-1.1-deprecated/extensions/fablabchemnitz/ocr/ocr.py
2021-07-23 02:36:56 +02:00

47 lines
1.4 KiB
Python
Executable File

#!/usr/bin/env python3
# Copyright (C) 2021 Amal Santhosh , amalsanp@gmail.com
# This program is free software; you can redistribute it and/or modify
# it under the terms of the GNU General Public License as published by
# the Free Software Foundation; either version 2 of the License, or
# (at your option) any later version.
#
# This program is distributed in the hope that it will be useful,
# but WITHOUT ANY WARRANTY; without even the implied warranty of
# MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
# GNU General Public License for more details.
#
# You should have received a copy of the GNU General Public License
# along with this program; if not, write to the Free Software
# Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301, USA.
#
import inkex
import pytesseract
from PIL import Image
import cairosvg
import os
class OcrOutputExtension(inkex.OutputExtension):
def effect(self):
try:
cairosvg.svg2png(url=self.file_io.name, write_to='read.png')
im = Image.open('read.png')
text = pytesseract.image_to_string(im,lang ='eng')
self.msg(text.rstrip())
os.remove('read.png')
except Exception as e:
self.msg(e)
self.msg("Image reading failed!")
return
def save(self, stream):
pass
if __name__ == '__main__':
OcrOutputExtension().run()