Spaces:
Sleeping
Sleeping
Update app_pages/ocr_comparator.py
Browse files
- app_pages/ocr_comparator.py +10 -6
app_pages/ocr_comparator.py
CHANGED
|
@@ -626,9 +626,6 @@ def app():
|
|
| 626 |
##
|
| 627 |
|
| 628 |
# Create results data frame
|
| 629 |
-
print("list_text_easyocr : ", list_text_easyocr)
|
| 630 |
-
print("list_text_ppocr : ", list_text_ppocr)
|
| 631 |
-
print("lens : ", len(list_cropped_images))
|
| 632 |
out_df_results = pd.DataFrame({'cropped_image': list_cropped_images,
|
| 633 |
'text_easyocr': list_text_easyocr,
|
| 634 |
'confidence_easyocr': list_confidence_easyocr,
|
|
@@ -665,7 +662,8 @@ def app():
|
|
| 665 |
## ------- EasyOCR Text recognition
|
| 666 |
try:
|
| 667 |
step = 0*len(in_list_images) # first recognition process
|
| 668 |
-
nb_steps = 4 * len(in_list_images)
|
|
|
|
| 669 |
for ind_img, cropped in enumerate(in_list_images):
|
| 670 |
result = _in_reader_easyocr.recognize(cropped, **in_params)
|
| 671 |
try:
|
|
@@ -702,7 +700,8 @@ def app():
|
|
| 702 |
try:
|
| 703 |
reader_ppocr = PaddleOCR(**in_params)
|
| 704 |
step = 1*len(in_list_images) # second recognition process
|
| 705 |
-
nb_steps = 4 * len(in_list_images)
|
|
|
|
| 706 |
progress_bar = st.progress(step/nb_steps)
|
| 707 |
|
| 708 |
for ind_img, cropped in enumerate(in_list_images):
|
|
@@ -778,7 +777,8 @@ def app():
|
|
| 778 |
"""
|
| 779 |
## ------- Tesseract Text recognition
|
| 780 |
step = 3*in_nb_images # fourth recognition process
|
| 781 |
-
nb_steps = 4 * in_nb_images
|
|
|
|
| 782 |
progress_bar = st.progress(step/nb_steps)
|
| 783 |
|
| 784 |
try:
|
|
@@ -874,6 +874,10 @@ def app():
|
|
| 874 |
column_width = 400
|
| 875 |
for ind_lig in range(0, reco_lines+1, 2):
|
| 876 |
cols = st.columns(2)
|
|
|
|
|
|
|
|
|
|
|
|
|
| 877 |
for ind_col in range(2):
|
| 878 |
ind = ind_lig + ind_col
|
| 879 |
if ind < len(in_reader_type_list):
|
|
|
|
| 626 |
##
|
| 627 |
|
| 628 |
# Create results data frame
|
|
|
|
|
|
|
|
|
|
| 629 |
out_df_results = pd.DataFrame({'cropped_image': list_cropped_images,
|
| 630 |
'text_easyocr': list_text_easyocr,
|
| 631 |
'confidence_easyocr': list_confidence_easyocr,
|
|
|
|
| 662 |
## ------- EasyOCR Text recognition
|
| 663 |
try:
|
| 664 |
step = 0*len(in_list_images) # first recognition process
|
| 665 |
+
#nb_steps = 4 * len(in_list_images)
|
| 666 |
+
nb_steps = 3 * len(in_list_images)
|
| 667 |
for ind_img, cropped in enumerate(in_list_images):
|
| 668 |
result = _in_reader_easyocr.recognize(cropped, **in_params)
|
| 669 |
try:
|
|
|
|
| 700 |
try:
|
| 701 |
reader_ppocr = PaddleOCR(**in_params)
|
| 702 |
step = 1*len(in_list_images) # second recognition process
|
| 703 |
+
#nb_steps = 4 * len(in_list_images)
|
| 704 |
+
nb_steps = 3 * len(in_list_images)
|
| 705 |
progress_bar = st.progress(step/nb_steps)
|
| 706 |
|
| 707 |
for ind_img, cropped in enumerate(in_list_images):
|
|
|
|
| 777 |
"""
|
| 778 |
## ------- Tesseract Text recognition
|
| 779 |
step = 3*in_nb_images # fourth recognition process
|
| 780 |
+
#nb_steps = 4 * in_nb_images
|
| 781 |
+
nb_steps = 3 * in_nb_images
|
| 782 |
progress_bar = st.progress(step/nb_steps)
|
| 783 |
|
| 784 |
try:
|
|
|
|
| 874 |
column_width = 400
|
| 875 |
for ind_lig in range(0, reco_lines+1, 2):
|
| 876 |
cols = st.columns(2)
|
| 877 |
+
# test
|
| 878 |
+
cols[0].markdown('col 0')
|
| 879 |
+
cols[1].markdown('col 1')
|
| 880 |
+
#
|
| 881 |
for ind_col in range(2):
|
| 882 |
ind = ind_lig + ind_col
|
| 883 |
if ind < len(in_reader_type_list):
|