0% found this document useful (0 votes)

402 views

Easyocr

The document defines a Reader class that initializes optical character recognition models for various languages. It checks if required detection and recognition models are downloaded, downloading them if needed. It selects the appropriate recognition model based on the provided languages, handling a variety of script systems including Latin, Cyrillic, Devanagari, Arabic, Chinese and others.

Uploaded by

houssam ziouany

We take content rights seriously. If you suspect this is your content, claim it here.

Available Formats

Download as TXT, PDF, TXT or read online on Scribd

0% found this document useful (0 votes)

402 views

Easyocr

Uploaded by

houssam ziouany

We take content rights seriously. If you suspect this is your content, claim it here.

Available Formats

Download as TXT, PDF, TXT or read online on Scribd

You are on page 1/ 8

# -*- coding: utf-8 -*-

from .detection import get_detector, get_textbox

from .recognition import get_recognizer, get_text
from .utils import group_text_box, get_image_list, calculate_md5, get_paragraph,\
download_and_unzip, printProgressBar, diff, reformat_input,\
make_rotated_img_list, set_result_with_confidence
from .config import *
from bidi.algorithm import get_display
import numpy as np
import cv2
import torch
import os
import sys
from PIL import Image
from logging import getLogger
import yaml

# Compatibility shims: on Python 2 the names below come from `io`, `six` and
# the `pathlib2` backport; on Python 3 they are taken from the standard library.
if sys.version_info[0] == 2:
    from io import open
    from six.moves.urllib.request import urlretrieve
    from pathlib2 import Path
else:
    from urllib.request import urlretrieve
    from pathlib import Path

# Module-level logger, named after this module.
LOGGER = getLogger(__name__)

class Reader(object):
    """OCR reader combining a text detector with a text recognizer.

    The constructor locates (and, when allowed, downloads) the model files,
    chooses a recognition model for the requested languages and builds the
    detector/recognizer objects. `readtext` then runs `detect` followed by
    `recognize` on an image.
    """

    def __init__(self, lang_list, gpu=True, model_storage_directory=None,
                 user_network_directory=None, recog_network='standard',
                 download_enabled=True, detector=True, recognizer=True,
                 verbose=True, quantize=True):
        """Create an EasyOCR Reader.

        Parameters:
            lang_list (list): Language codes (ISO 639) for languages to be
                recognized during analysis.

            gpu (bool): Enable GPU support (default). `False` forces the CPU;
                any value other than `True`/`False` is used as the device
                itself when CUDA is available.

            model_storage_directory (string): Path to directory for model
                data. If not specified, models will be read from a directory
                as defined by the environment variable EASYOCR_MODULE_PATH
                (preferred), MODULE_PATH (if defined), or ~/.EasyOCR/.

            user_network_directory (string): Path to directory for custom
                network architecture. If not specified, it is as defined by
                the environment variable EASYOCR_MODULE_PATH (preferred),
                MODULE_PATH (if defined), or ~/.EasyOCR/.

            recog_network (string): 'standard' to auto-select a bundled
                recognition model from `lang_list`, the name of a bundled
                model, or the base name of a user-defined network whose
                `<name>.yaml` lives in `user_network_directory`.

            download_enabled (bool): Enabled downloading of model data via
                HTTP (default).

            detector (bool): Check/download and load the detection model.

            recognizer (bool): Check/download and load the recognition model.

            verbose (bool): Forwarded to `download_and_unzip`.

            quantize (bool): Forwarded to `get_detector`/`get_recognizer`.

        Raises:
            FileNotFoundError: A model file is missing or has a wrong MD5 and
                `download_enabled` is false.
            AssertionError: A freshly downloaded model file fails the MD5
                check.
            ValueError: `lang_list` holds an unsupported language or an
                incompatible language combination.
        """
        self.download_enabled = download_enabled

        self.model_storage_directory = MODULE_PATH + '/model'
        if model_storage_directory:
            self.model_storage_directory = model_storage_directory
        Path(self.model_storage_directory).mkdir(parents=True, exist_ok=True)

        self.user_network_directory = MODULE_PATH + '/user_network'
        if user_network_directory:
            self.user_network_directory = user_network_directory
        Path(self.user_network_directory).mkdir(parents=True, exist_ok=True)
        # Make user-defined network modules importable.
        sys.path.append(self.user_network_directory)

        if gpu is False:
            self.device = 'cpu'
            LOGGER.warning('Using CPU. Note: This module is much faster with a GPU.')
        elif not torch.cuda.is_available():
            self.device = 'cpu'
            LOGGER.warning('CUDA not available - defaulting to CPU. '
                           'Note: This module is much faster with a GPU.')
        elif gpu is True:
            self.device = 'cuda'
        else:
            self.device = gpu

        # Model input height used by `recognize`. `imgH` is not defined in
        # this module; presumably it arrives via `from .config import *`
        # (TODO confirm). A user-defined model overrides it below.
        self.imgH = imgH

        # check and download detection model
        detector_model = 'craft'
        corrupt_msg = 'MD5 hash mismatch, possible file corruption'
        detector_info = detection_models[detector_model]
        detector_path = os.path.join(self.model_storage_directory,
                                     detector_info['filename'])
        if detector:
            # NOTE: the config key is called 'filesize' but it is compared
            # against the file's MD5 digest.
            if not os.path.isfile(detector_path):
                if not self.download_enabled:
                    raise FileNotFoundError("Missing %s and downloads disabled" % detector_path)
                LOGGER.warning('Downloading detection model, please wait. '
                               'This may take several minutes depending upon your network connection.')
                download_and_unzip(detector_info['url'], detector_info['filename'],
                                   self.model_storage_directory, verbose)
                self._verify_md5(detector_path, detector_info['filesize'], corrupt_msg)
                LOGGER.info('Download complete')
            elif calculate_md5(detector_path) != detector_info['filesize']:
                if not self.download_enabled:
                    raise FileNotFoundError("MD5 mismatch for %s and downloads disabled" % detector_path)
                LOGGER.warning(corrupt_msg)
                os.remove(detector_path)
                LOGGER.warning('Re-downloading the detection model, please wait. '
                               'This may take several minutes depending upon your network connection.')
                download_and_unzip(detector_info['url'], detector_info['filename'],
                                   self.model_storage_directory, verbose)
                self._verify_md5(detector_path, detector_info['filesize'], corrupt_msg)

        # recognition model
        separator_list = {}

        gen1_models = recognition_models['gen1']
        gen2_models = recognition_models['gen2']
        if (recog_network == 'standard' or recog_network in gen1_models
                or recog_network in gen2_models):
            if recog_network in gen1_models:
                model = gen1_models[recog_network]
                recog_network = 'generation1'
                self.model_lang = model['model_script']
            elif recog_network in gen2_models:
                model = gen2_models[recog_network]
                recog_network = 'generation2'
                self.model_lang = model['model_script']
            else:  # auto-detect
                model, recog_network = self._select_standard_model(lang_list)
            self.character = model['characters']

            model_path = os.path.join(self.model_storage_directory, model['filename'])
            # check recognition model file
            if recognizer:
                if not os.path.isfile(model_path):
                    if not self.download_enabled:
                        raise FileNotFoundError("Missing %s and downloads disabled" % model_path)
                    LOGGER.warning('Downloading recognition model, please wait. '
                                   'This may take several minutes depending upon your network connection.')
                    download_and_unzip(model['url'], model['filename'],
                                       self.model_storage_directory, verbose)
                    self._verify_md5(model_path, model['filesize'], corrupt_msg)
                    LOGGER.info('Download complete.')
                elif calculate_md5(model_path) != model['filesize']:
                    if not self.download_enabled:
                        raise FileNotFoundError("MD5 mismatch for %s and downloads disabled" % model_path)
                    LOGGER.warning(corrupt_msg)
                    os.remove(model_path)
                    LOGGER.warning('Re-downloading the recognition model, please wait. '
                                   'This may take several minutes depending upon your network connection.')
                    download_and_unzip(model['url'], model['filename'],
                                       self.model_storage_directory, verbose)
                    self._verify_md5(model_path, model['filesize'], corrupt_msg)
                    LOGGER.info('Download complete')
            self.setLanguageList(lang_list, model)

        else:  # user-defined model
            config_path = os.path.join(self.user_network_directory, recog_network + '.yaml')
            # Read as UTF-8 so a non-ASCII character list does not depend on
            # the platform's default encoding.
            with open(config_path, encoding='utf-8') as file:
                # NOTE(review): FullLoader can construct Python objects; only
                # point this at config files you trust (or switch to
                # yaml.safe_load if the configs are plain data).
                recog_config = yaml.load(file, Loader=yaml.FullLoader)
            # Keep the custom input height on the instance so `recognize`
            # actually uses it.
            self.imgH = recog_config['imgH']
            available_lang = recog_config['lang_list']
            self.setModelLanguage(recog_network, lang_list, available_lang, available_lang)
            self.character = recog_config['character_list']
            model_file = recog_network + '.pth'
            model_path = os.path.join(self.model_storage_directory, model_file)
            self.setLanguageList(lang_list, None)

        dict_list = {}
        for lang in lang_list:
            dict_list[lang] = os.path.join(BASE_PATH, 'dict', lang + ".txt")

        if detector:
            self.detector = get_detector(detector_path, self.device, quantize)
        if recognizer:
            if recog_network == 'generation1':
                network_params = {
                    'input_channel': 1,
                    'output_channel': 512,
                    'hidden_size': 512
                }
            elif recog_network == 'generation2':
                network_params = {
                    'input_channel': 1,
                    'output_channel': 256,
                    'hidden_size': 256
                }
            else:
                network_params = recog_config['network_params']
            self.recognizer, self.converter = get_recognizer(
                recog_network, network_params, self.character, separator_list,
                dict_list, model_path, device=self.device, quantize=quantize)

    @staticmethod
    def _verify_md5(path, expected_md5, message):
        """Raise AssertionError(message) unless the file's MD5 equals expected_md5.

        An explicit raise is used instead of an `assert` statement so the
        check still runs when Python is started with -O.
        """
        if calculate_md5(path) != expected_md5:
            raise AssertionError(message)

    def _select_standard_model(self, lang_list):
        """Choose the bundled recognition model for `lang_list`.

        Sets `self.model_lang` (directly or through `setModelLanguage`) and
        returns `(model, recog_network)` where `recog_network` is
        'generation1' or 'generation2'.

        Raises:
            ValueError: a language is unsupported or the combination is not
                covered by a single model.
        """
        unknown_lang = set(lang_list) - set(all_lang_list)
        if unknown_lang != set():
            raise ValueError(unknown_lang, 'is not supported')

        if lang_list == ['en']:
            self.setModelLanguage('english', lang_list, ['en'], '["en"]')
            return recognition_models['gen2']['english_g2'], 'generation2'

        generation_name = {'gen1': 'generation1', 'gen2': 'generation2'}

        # (language code, model_lang, generation, model key); first match wins.
        single_language_models = (
            ('th', 'thai', 'gen1', 'thai_g1'),
            ('ch_tra', 'chinese_tra', 'gen1', 'zh_tra_g1'),
            ('ch_sim', 'chinese_sim', 'gen2', 'zh_sim_g2'),
            ('ja', 'japanese', 'gen2', 'japanese_g2'),
            ('ko', 'korean', 'gen2', 'korean_g2'),
            ('ta', 'tamil', 'gen1', 'tamil_g1'),
            ('te', 'telugu', 'gen2', 'telugu_g2'),
            ('kn', 'kannada', 'gen2', 'kannada_g2'),
        )
        for code, script, generation, model_key in single_language_models:
            if code in lang_list:
                self.setModelLanguage(script, lang_list, [code, 'en'],
                                      '["%s","en"]' % code)
                return recognition_models[generation][model_key], generation_name[generation]

        # (model_lang, languages sharing the script, hint for the error, model key)
        script_family_models = (
            ('bengali', bengali_lang_list, '["bn","as","en"]', 'bengali_g1'),
            ('arabic', arabic_lang_list, '["ar","fa","ur","ug","en"]', 'arabic_g1'),
            ('devanagari', devanagari_lang_list, '["hi","mr","ne","en"]', 'devanagari_g1'),
            ('cyrillic', cyrillic_lang_list,
             '["ru","rs_cyrillic","be","bg","uk","mn","en"]', 'cyrillic_g1'),
        )
        for script, family, hint, model_key in script_family_models:
            if set(lang_list) & set(family):
                self.setModelLanguage(script, lang_list, family + ['en'], hint)
                return recognition_models['gen1'][model_key], 'generation1'

        self.model_lang = 'latin'
        return recognition_models['gen2']['latin_g2'], 'generation2'

    def setModelLanguage(self, language, lang_list, list_lang, list_lang_string):
        """Record the model language and validate the requested languages.

        Parameters:
            language (string): name stored in `self.model_lang`.
            lang_list (list): languages requested by the caller.
            list_lang (list): languages the chosen model supports.
            list_lang_string: suggestion appended to the error message; a
                string, or any object (it is converted with `str`).

        Raises:
            ValueError: `lang_list` contains a language not in `list_lang`.
        """
        self.model_lang = language
        if set(lang_list) - set(list_lang) != set():
            # Callers pass 'chinese_tra'/'chinese_sim'; the short codes are
            # kept for backward compatibility.
            if language in ('chinese_tra', 'chinese_sim', 'ch_tra', 'ch_sim'):
                language = 'chinese'
            # str() because the user-defined-model path passes a list here.
            raise ValueError(language.capitalize()
                             + ' is only compatible with English, try lang_list='
                             + str(list_lang_string))

    def getChar(self, fileName):
        """Return the lines of BASE_PATH/character/<fileName> joined into one string."""
        char_file = os.path.join(BASE_PATH, 'character', fileName)
        # utf-8-sig drops a leading byte-order mark if the file has one.
        with open(char_file, "r", encoding="utf-8-sig") as input_file:
            lines = input_file.read().splitlines()
        return ''.join(lines)

    def setLanguageList(self, lang_list, model):
        """Build `self.lang_char`, the characters allowed for `lang_list`.

        Collects the lines of every `<lang>_char.txt` file and adds the
        model's symbols (or a default digit/punctuation set when `model` is
        falsy). The result is a string of unique characters in no
        particular order.
        """
        self.lang_char = []
        for lang in lang_list:
            char_file = os.path.join(BASE_PATH, 'character', lang + "_char.txt")
            with open(char_file, "r", encoding="utf-8-sig") as input_file:
                char_list = input_file.read().splitlines()
            self.lang_char += char_list
        if model:
            symbol = model['symbols']
        else:
            symbol = '0123456789!"#$%&\'()*+,-./:;<=>?@[\\]^_`{|}~ '
        self.lang_char = set(self.lang_char).union(set(symbol))
        self.lang_char = ''.join(self.lang_char)

    def detect(self, img, min_size=20, text_threshold=0.7, low_text=0.4,
               link_threshold=0.4, canvas_size=2560, mag_ratio=1.,
               slope_ths=0.1, ycenter_ths=0.5, height_ths=0.5,
               width_ths=0.5, add_margin=0.1, reformat=True,
               optimal_num_chars=None):
        """Find text boxes in an image.

        Parameters:
            img: the image; passed through `reformat_input` first when
                `reformat` is true.
            min_size: boxes whose larger side is not above this value are
                dropped; a falsy value disables the filter.
            optimal_num_chars: forwarded to `get_textbox`; when it is None
                the last argument of `group_text_box` is True.
            Remaining parameters are forwarded to `get_textbox` and
            `group_text_box`.

        Returns:
            (horizontal_list, free_list) as produced by `group_text_box`,
            after size filtering.
        """
        if reformat:
            img, _ = reformat_input(img)

        text_box = get_textbox(self.detector, img, canvas_size, mag_ratio,
                               text_threshold, link_threshold, low_text,
                               False, self.device, optimal_num_chars)
        horizontal_list, free_list = group_text_box(text_box, slope_ths,
                                                    ycenter_ths, height_ths,
                                                    width_ths, add_margin,
                                                    (optimal_num_chars is None))

        if min_size:
            horizontal_list = [i for i in horizontal_list
                               if max(i[1] - i[0], i[3] - i[2]) > min_size]
            free_list = [i for i in free_list
                         if max(diff([c[0] for c in i]), diff([c[1] for c in i])) > min_size]

        return horizontal_list, free_list

    def recognize(self, img_cv_grey, horizontal_list=None, free_list=None,
                  decoder='greedy', beamWidth=5, batch_size=1,
                  workers=0, allowlist=None, blocklist=None, detail=1,
                  rotation_info=None,
                  paragraph=False,
                  contrast_ths=0.1, adjust_contrast=0.5, filter_ths=0.003,
                  reformat=True):
        """Recognize the text inside the given boxes.

        Parameters:
            img_cv_grey: the image; passed through `reformat_input` first
                when `reformat` is true.
            horizontal_list, free_list: boxes to read. When both are None the
                whole image is read as a single box; when only one is given
                the other is treated as empty.
            allowlist / blocklist: characters to keep / to ignore. When
                neither is given, model characters outside the selected
                languages are ignored. `allowlist` takes precedence.
            rotation_info: when truthy, crops are expanded with
                `make_rotated_img_list` and merged back with
                `set_result_with_confidence`.
            paragraph: when true the result is passed through
                `get_paragraph`.
            detail: 0 returns only `item[1]` of every result item; any other
                value returns the full result.
            Remaining parameters are forwarded to `get_text`.
        """
        if reformat:
            _, img_cv_grey = reformat_input(img_cv_grey)

        if allowlist:
            ignore_char = ''.join(set(self.character) - set(allowlist))
        elif blocklist:
            ignore_char = ''.join(set(blocklist))
        else:
            ignore_char = ''.join(set(self.character) - set(self.lang_char))

        if self.model_lang in ['chinese_tra', 'chinese_sim']:
            decoder = 'greedy'

        if horizontal_list is None and free_list is None:
            y_max, x_max = img_cv_grey.shape
            horizontal_list = [[0, x_max, 0, y_max]]
            free_list = []
        elif horizontal_list is None:
            # only free-form boxes were supplied
            horizontal_list = []
        elif free_list is None:
            # only horizontal boxes were supplied
            free_list = []

        img_height = self.imgH

        # without gpu/parallelization, it is faster to process image one by one
        if ((batch_size == 1) or (self.device == 'cpu')) and not rotation_info:
            result = []
            # horizontal boxes first, then free-form ones, one box per call
            single_boxes = [([bbox], []) for bbox in horizontal_list]
            single_boxes += [([], [bbox]) for bbox in free_list]
            for h_list, f_list in single_boxes:
                image_list, max_width = get_image_list(h_list, f_list, img_cv_grey,
                                                       model_height=img_height)
                result += get_text(self.character, img_height, int(max_width),
                                   self.recognizer, self.converter, image_list,
                                   ignore_char, decoder, beamWidth, batch_size,
                                   contrast_ths, adjust_contrast, filter_ths,
                                   workers, self.device)
        # default mode will try to process multiple boxes at the same time
        else:
            image_list, max_width = get_image_list(horizontal_list, free_list,
                                                   img_cv_grey, model_height=img_height)
            image_len = len(image_list)
            if rotation_info and image_list:
                image_list = make_rotated_img_list(rotation_info, image_list)
                max_width = max(max_width, img_height)

            result = get_text(self.character, img_height, int(max_width),
                              self.recognizer, self.converter, image_list,
                              ignore_char, decoder, beamWidth, batch_size,
                              contrast_ths, adjust_contrast, filter_ths,
                              workers, self.device)

            if rotation_info and (horizontal_list + free_list):
                result = set_result_with_confidence(result, image_len)

        if self.model_lang == 'arabic':
            direction_mode = 'rtl'
            # items are made mutable so the text can be replaced in place
            result = [list(item) for item in result]
            for item in result:
                item[1] = get_display(item[1])
        else:
            direction_mode = 'ltr'

        if paragraph:
            result = get_paragraph(result, mode=direction_mode)

        if detail == 0:
            return [item[1] for item in result]
        else:
            return result

    def readtext(self, image, decoder='greedy', beamWidth=5, batch_size=1,
                 workers=0, allowlist=None, blocklist=None, detail=1,
                 rotation_info=None, paragraph=False, min_size=20,
                 contrast_ths=0.1, adjust_contrast=0.5, filter_ths=0.003,
                 text_threshold=0.7, low_text=0.4, link_threshold=0.4,
                 canvas_size=2560, mag_ratio=1.,
                 slope_ths=0.1, ycenter_ths=0.5, height_ths=0.5,
                 width_ths=0.5, add_margin=0.1):
        '''
        Detect and then recognize the text in an image.

        Parameters:
        image: file path or numpy-array or a byte stream object
        The remaining parameters are forwarded to `detect` and `recognize`.

        Returns whatever `recognize` returns for the detected boxes.
        '''
        img, img_cv_grey = reformat_input(image)

        # The input is already reformatted, hence reformat=False in both calls.
        horizontal_list, free_list = self.detect(img, min_size, text_threshold,
                                                 low_text, link_threshold,
                                                 canvas_size, mag_ratio,
                                                 slope_ths, ycenter_ths,
                                                 height_ths, width_ths,
                                                 add_margin, False)

        result = self.recognize(img_cv_grey, horizontal_list, free_list,
                                decoder, beamWidth, batch_size,
                                workers, allowlist, blocklist, detail,
                                rotation_info,
                                paragraph, contrast_ths, adjust_contrast,
                                filter_ths, False)

        return result

Al - Sayed, Turner Et Al. 2014 - Space Syntax Methodology
83% (6)
Al - Sayed, Turner Et Al. 2014 - Space Syntax Methodology
118 pages
Subjective Time. The Philosophy, Psychology, and Neuroscience of Temporality - Arstila, Valtteri
100% (1)
Subjective Time. The Philosophy, Psychology, and Neuroscience of Temporality - Arstila, Valtteri
687 pages
Jungian 16-Type Personality Assessment Questionnaire
0% (1)
Jungian 16-Type Personality Assessment Questionnaire
3 pages
Maintenance 2012
100% (8)
Maintenance 2012
99 pages
autonomous
No ratings yet
autonomous
22 pages
Experimental Pix2pix
No ratings yet
Experimental Pix2pix
5 pages
Python Scripts
No ratings yet
Python Scripts
5 pages
PyTorch Cheat Sheet & Quick Reference
No ratings yet
PyTorch Cheat Sheet & Quick Reference
6 pages
detect
No ratings yet
detect
6 pages
ALL FILES
No ratings yet
ALL FILES
6 pages
ML 1
No ratings yet
ML 1
22 pages
val
No ratings yet
val
9 pages
Karpathy MinGPT Model
No ratings yet
Karpathy MinGPT Model
7 pages
Tutorial Pytorch Best Commands
No ratings yet
Tutorial Pytorch Best Commands
8 pages
intent_recognizer
No ratings yet
intent_recognizer
5 pages
Cv prince
No ratings yet
Cv prince
120 pages
export
No ratings yet
export
13 pages
Deep Learning
No ratings yet
Deep Learning
46 pages
Codeyolov 5
No ratings yet
Codeyolov 5
16 pages
autonomouvvs
No ratings yet
autonomouvvs
53 pages
train
No ratings yet
train
13 pages
hubconf
No ratings yet
hubconf
4 pages
Ilovepdf Merged
No ratings yet
Ilovepdf Merged
10 pages
Ad3511 Deep Learning Lab Manual
No ratings yet
Ad3511 Deep Learning Lab Manual
80 pages
vit32_gptMD
No ratings yet
vit32_gptMD
6 pages
LLM CODE REF
No ratings yet
LLM CODE REF
10 pages
code2pdf_67c73149b96ef
No ratings yet
code2pdf_67c73149b96ef
4 pages
CVDL TAE 63 (1)
No ratings yet
CVDL TAE 63 (1)
9 pages
Train - Model
No ratings yet
Train - Model
2 pages
Creating an AI that can operate without an internet connection
No ratings yet
Creating an AI that can operate without an internet connection
11 pages
Image Caption2
No ratings yet
Image Caption2
9 pages
Training Code
No ratings yet
Training Code
27 pages
Python Deep Learning Lab Programs (2)
No ratings yet
Python Deep Learning Lab Programs (2)
35 pages
dl lab_merged (2)
No ratings yet
dl lab_merged (2)
60 pages
Project Source
No ratings yet
Project Source
21 pages
Deep Learning Manual (1)
No ratings yet
Deep Learning Manual (1)
53 pages
Deep Learning Lab Practicals
No ratings yet
Deep Learning Lab Practicals
24 pages
Assignment3 AL
No ratings yet
Assignment3 AL
23 pages
Deep Neural Network Application
No ratings yet
Deep Neural Network Application
17 pages
Zero
No ratings yet
Zero
27 pages
Aishwarya MiniProjectReport - SC
No ratings yet
Aishwarya MiniProjectReport - SC
6 pages
Deep Learning Practical
No ratings yet
Deep Learning Practical
12 pages
Font Transfer 2 Autoencoders
No ratings yet
Font Transfer 2 Autoencoders
78 pages
ML Code Analysis
No ratings yet
ML Code Analysis
6 pages
cat_dog_classification_CNN_Model
No ratings yet
cat_dog_classification_CNN_Model
13 pages
Predict
No ratings yet
Predict
3 pages
README MD
No ratings yet
README MD
3 pages
PyTorch Workflow Fundamentals
No ratings yet
PyTorch Workflow Fundamentals
1 page
Face - Emotion Recog - Implementation
No ratings yet
Face - Emotion Recog - Implementation
11 pages
command_classifier
No ratings yet
command_classifier
4 pages
Raw Nitex
No ratings yet
Raw Nitex
5 pages
Homework_6
No ratings yet
Homework_6
7 pages
Retorno 1
No ratings yet
Retorno 1
29 pages
Artificial Intelligence May Minor Project
No ratings yet
Artificial Intelligence May Minor Project
8 pages
ilovepdf_merged (3)
No ratings yet
ilovepdf_merged (3)
144 pages
Ai Lab 02
No ratings yet
Ai Lab 02
12 pages
DETECTCAMERA
No ratings yet
DETECTCAMERA
3 pages
Deforum Stable Diffusion - Ipynb
No ratings yet
Deforum Stable Diffusion - Ipynb
12 pages
DL Programs
No ratings yet
DL Programs
12 pages
NN From Scratch
No ratings yet
NN From Scratch
5 pages
Downloaded by R GAYATHRI (R.gayathri@aalimec - Ac.in)
No ratings yet
Downloaded by R GAYATHRI (R.gayathri@aalimec - Ac.in)
56 pages
Assignment 3 DS5620
No ratings yet
Assignment 3 DS5620
11 pages
DL Practical 6,7 Outputs
No ratings yet
DL Practical 6,7 Outputs
9 pages
How to a Developers Guide to 4k: Developer edition, #3
From Everand
How to a Developers Guide to 4k: Developer edition, #3
Xinc Cyberwizard
No ratings yet
Health Solutions SENA
No ratings yet
Health Solutions SENA
4 pages
Mbam Su13
No ratings yet
Mbam Su13
30 pages
Aut Procedure
100% (4)
Aut Procedure
30 pages
PSP
No ratings yet
PSP
18 pages
Drama Notes Own
No ratings yet
Drama Notes Own
44 pages
Dr. Reddy's Laboratories Limited
No ratings yet
Dr. Reddy's Laboratories Limited
9 pages
DPS Deployment
No ratings yet
DPS Deployment
37 pages
MCQ'S On Ms-Excel Part-3
No ratings yet
MCQ'S On Ms-Excel Part-3
43 pages
The Non-Existence of God
No ratings yet
The Non-Existence of God
27 pages
MANUALMBE
90% (10)
MANUALMBE
264 pages
Analytics for Retail - A Step-By-Step Guide to the Statistics Behind a Successful Retail Business
No ratings yet
Analytics for Retail - A Step-By-Step Guide to the Statistics Behind a Successful Retail Business
105 pages
Sifcon Report 1
100% (1)
Sifcon Report 1
27 pages
MYE Datesheet
No ratings yet
MYE Datesheet
1 page
SBS Ferro100 Charger Manual
No ratings yet
SBS Ferro100 Charger Manual
23 pages
Contor Electronic Monofazat de Energie Electrică: Caracteristici Tehnice
No ratings yet
Contor Electronic Monofazat de Energie Electrică: Caracteristici Tehnice
2 pages
Chapter One: Industy Profile
No ratings yet
Chapter One: Industy Profile
23 pages
PDS Stopaq Wrappingband CL V2 en
No ratings yet
PDS Stopaq Wrappingband CL V2 en
2 pages
Numerical Methods
No ratings yet
Numerical Methods
22 pages
Source Data For Product
No ratings yet
Source Data For Product
143 pages
Telepsychology Best Practices 101: Segment 2: Disclaimer/Disclosure
No ratings yet
Telepsychology Best Practices 101: Segment 2: Disclaimer/Disclosure
41 pages
Zheng Word Part Technique
No ratings yet
Zheng Word Part Technique
8 pages
D3165 en
No ratings yet
D3165 en
8 pages
Factitious Disorder Munchausen Syndrome In.22
No ratings yet
Factitious Disorder Munchausen Syndrome In.22
6 pages
Lead Data Engineer
No ratings yet
Lead Data Engineer
4 pages
03 - Building Inspection - Testing
No ratings yet
03 - Building Inspection - Testing
58 pages
MSDS Aplus Gypsumboard
No ratings yet
MSDS Aplus Gypsumboard
5 pages

Easyocr

Uploaded by

Easyocr

Uploaded by

# -*- coding: utf-8 -*-

from .detection import get_detector, get_textbox

def __init__(self, lang_list, gpu=True, model_storage_directory=None,

gpu (bool): Enable GPU support (default)

model_storage_directory (string): Path to directory for model data. If

user_network_directory (string): Path to directory for custom network

download_enabled (bool): Enabled downloading of model data via HTTP

self.user_network_directory = MODULE_PATH + '/user_network'

# check and download detection model

if recog_network in ['standard'] + [model for model in

else: # user-defined model

def setModelLanguage(self, language, lang_list, list_lang, list_lang_string):

def getChar(self, fileName):

def setLanguageList(self, lang_list, model):

def detect(self, img, min_size = 20, text_threshold = 0.7, low_text = 0.4,\

text_box = get_textbox(self.detector, img, canvas_size, mag_ratio,\

return horizontal_list, free_list

def recognize(self, img_cv_grey, horizontal_list=None, free_list=None,\

if self.model_lang in ['chinese_tra','chinese_sim']: decoder = 'greedy'

if (horizontal_list==None) and (free_list==None):

# without gpu/parallelization, it is faster to process image one by one

result = get_text(self.character, imgH, int(max_width),

if rotation_info and (horizontal_list+free_list):

def readtext(self, image, decoder = 'greedy', beamWidth= 5, batch_size = 1,\

horizontal_list, free_list = self.detect(img, min_size, text_threshold,\

result = self.recognize(img_cv_grey, horizontal_list, free_list,\

You might also like

# -*- coding: utf-8 -*-

def __init__(self, lang_list, gpu=True, model_storage_directory=None,