Spaces:

Loren
/

Streamlit_OCR_comparator

Running

File size: 52,156 Bytes

c957723

import streamlit as st
import cv2
import imutils
from paddleocr import PaddleOCR, draw_ocr
from PIL import Image
import io
import os
import numpy as np
import ast
import operator
import matplotlib.pyplot as plt


# NOTE(review): presumably a workaround for the "duplicate OpenMP runtime" abort
# that can occur when several native libraries are loaded together - confirm it
# is still required.
os.environ["KMP_DUPLICATE_LIB_OK"] = "TRUE"

# Inject a small CSS rule that sets the padding of the first <div> found under
# the ".main" element of the page.
st.markdown("""

    <style>

        .main > div:first-of-type {

            padding: 1em 2em 2em 2em;

        }

    </style>

""", unsafe_allow_html=True)

###################################################################################################
##   INITIALISATIONS
###################################################################################################
###
@st.cache_data(show_spinner=True)
def initializations():
    """Build the lookup tables used by the application.

    Returns:

        dict: language label -> language code (presumably the codes expected
              by PaddleOCR, judging by the variable name)

        dict: interpolation name -> OpenCV interpolation flag

        dict: thresholding type name -> OpenCV thresholding flag

        dict: adaptive method name -> OpenCV adaptive thresholding flag

    """
    print("Initializations ...")

    def _cv2_flags(*names):
        # Map each flag name to the cv2 constant of the same name, keeping order
        return {name: getattr(cv2, name) for name in names}

    languages = {
        'Abaza': 'abq',
        'Adyghe': 'ady',
        'Afrikaans': 'af',
        'Albanian': 'sq',
        'Angika': 'ang',
        'Arabic': 'ar',
        'Avar': 'ava',
        'Azerbaijani': 'az',
        'Belarusian': 'be',
        'Bhojpuri': 'bho',
        'Bihari': 'bh',
        'Bosnian': 'bs',
        'Bulgarian': 'bg',
        'Chinese & English': 'ch',
        'Chinese Traditional': 'chinese_cht',
        'Croatian': 'hr',
        'Czech': 'cs',
        'Danish': 'da',
        'Dargwa': 'dar',
        'Dutch': 'nl',
        'English': 'en',
        'Estonian': 'et',
        'French': 'fr',
        'German': 'german',
        'Goan Konkani': 'gom',
        'Hindi': 'hi',
        'Hungarian': 'hu',
        'Icelandic': 'is',
        'Indonesian': 'id',
        'Ingush': 'inh',
        'Irish': 'ga',
        'Italian': 'it',
        'Japan': 'japan',
        'Kabardian': 'kbd',
        'Korean': 'korean',
        'Kurdish': 'ku',
        'Lak': 'lbe',
        'Latvian': 'lv',
        'Lezghian': 'lez',
        'Lithuanian': 'lt',
        'Magahi': 'mah',
        'Maithili': 'mai',
        'Malay': 'ms',
        'Maltese': 'mt',
        'Maori': 'mi',
        'Marathi': 'mr',
        'Mongolian': 'mn',
        'Nagpur': 'sck',
        'Nepali': 'ne',
        'Newari': 'new',
        'Norwegian': 'no',
        'Occitan': 'oc',
        'Persian': 'fa',
        'Polish': 'pl',
        'Portuguese': 'pt',
        'Romanian': 'ro',
        'Russia': 'ru',
        'Saudi Arabia': 'sa',
        'Serbian(cyrillic)': 'rs_cyrillic',
        'Serbian(latin)': 'rs_latin',
        'Slovak': 'sk',
        'Slovenian': 'sl',
        'Spanish': 'es',
        'Swahili': 'sw',
        'Swedish': 'sv',
        'Tabassaran': 'tab',
        'Tagalog': 'tl',
        'Tamil': 'ta',
        'Telugu': 'te',
        'Turkish': 'tr',
        'Ukranian': 'uk',
        'Urdu': 'ur',
        'Uyghur': 'ug',
        'Uzbek': 'uz',
        'Vietnamese': 'vi',
        'Welsh': 'cy',
    }

    interpolations = _cv2_flags(
        "INTER_LINEAR",
        "INTER_NEAREST",
        "INTER_AREA",
        "INTER_CUBIC",
        "INTER_LANCZOS4",
    )

    thresholding_types = _cv2_flags(
        "THRESH_BINARY",
        "THRESH_BINARY_INV",
        "THRESH_TRUNC",
        "THRESH_TOZERO",
    )

    adaptive_methods = _cv2_flags(
        "ADAPTIVE_THRESH_MEAN_C",
        "ADAPTIVE_THRESH_GAUSSIAN_C",
    )

    return languages, interpolations, thresholding_types, adaptive_methods

###################################################################################################
##   FUNCTIONS
###################################################################################################
###
@st.cache_data(show_spinner=False)
def load_image(in_image_file):
    """Load the input image, keep a local copy and reset the processing state.

    The image is opened with PIL, saved in the working directory as
    "tmp_<original name>", then read back with OpenCV and converted from BGR
    to RGB. Every processing option stored in ``st.session_state`` is reset.

    Args:

        in_image_file (string or Streamlit UploadedFile): image to consider

    Returns:

        matrix      : input file opened with Opencv (RGB channel order)

        string      : path of the local copy of the image

    """
    if isinstance(in_image_file, str):
        out_image_path = "tmp_" + in_image_file
    else:
        out_image_path = "tmp_" + in_image_file.name

    # Save a local copy so that OpenCV can read the image from a path; the
    # context manager releases the file handle PIL may have opened.
    with Image.open(in_image_file) as img:
        img.save(out_image_path)

    out_image_cv2 = cv2.cvtColor(cv2.imread(out_image_path), cv2.COLOR_BGR2RGB)

    # NOTE(review): this function is wrapped by st.cache_data, so the reset
    # below only runs when the body is actually executed (cache miss) -
    # confirm this is the intended behaviour.
    st.session_state.resize = False
    reset_keys = (
        "scaling_factor", "interpolation",
        "rotate", "angle",
        "convolution", "text_convol", "convol_kernel",
        "averaging", "averaging_kernel_size",
        "gaussian_bluring", "gb_kernel_size", "sigmaX", "sigmaY",
        "median_bluring", "mb_kernel_size",
        "bilateral_filtering", "d", "sigma_color", "sigma_space",
        "erosion", "erosion_kernel_size", "nb_iter_erosion",
        "dilation", "dilation_kernel_size", "nb_iter_dilation",
        # bin_value is read by the thresholding step; it was previously never
        # initialised because bin_thresh was reset twice instead.
        "binarization", "bin_thresh", "bin_value", "bin_thresholding_type",
        "bin_otsu", "thresh_typ",
        "adaptative_thresh", "at_thresholding_type", "at_max_value",
        "at_adaptative_method", "at_block_size", "at_const",
        "processed_image",
    )
    for key in reset_keys:
        st.session_state[key] = None

    return out_image_cv2, out_image_path
###
def eval_expr(expr):
    """Safely evaluate a simple numeric expression such as ``1/9``.

    The expression is parsed into an AST and walked by hand; it is never
    passed to ``eval``. Only int/float literals, the binary operators
    ``+ - * / **`` and the unary ``+``/``-`` are accepted.

    Args:

        expr (string): numeric expression

    Returns:

       int or float: eval result, or 1. when the expression is not a string,
       cannot be parsed, uses an unsupported construct, fails arithmetically
       (e.g. division by zero) or does not yield a real number

    """
    fallback = 1.
    # Dictionary of authorized operators
    operators = {
        ast.Add: operator.add,
        ast.Sub: operator.sub,
        ast.Mult: operator.mul,
        ast.Div: operator.truediv,
        ast.Pow: operator.pow,
        ast.USub: operator.neg,
        ast.UAdd: operator.pos,
    }

    def _apply(op_node, *operands):
        func = operators.get(type(op_node))
        if func is None:
            raise TypeError(op_node)
        return func(*operands)

    def _eval(node):
        if isinstance(node, ast.Expression):
            return _eval(node.body)
        if isinstance(node, ast.Constant):  # number
            value = node.value
            # bool is a subclass of int: reject it explicitly, together with
            # strings, bytes, complex, None, ...
            if isinstance(value, bool) or not isinstance(value, (int, float)):
                raise TypeError(node)
            return value
        if isinstance(node, ast.BinOp):  # binary operations
            return _apply(node.op, _eval(node.left), _eval(node.right))
        if isinstance(node, ast.UnaryOp):  # unary operations (-n, +n)
            return _apply(node.op, _eval(node.operand))
        raise TypeError(node)

    if not isinstance(expr, str):
        return fallback
    try:
        result = _eval(ast.parse(expr, mode='eval'))
    except (SyntaxError, ValueError, TypeError, ArithmeticError,
            RecursionError, MemoryError):
        # Deliberate best-effort: any invalid coefficient falls back to 1.
        return fallback
    # A power such as (-8)**0.5 produces a complex number: not usable as a
    # kernel coefficient.
    if isinstance(result, complex):
        return fallback
    return result
###
def text_kernel_to_latex(text_eval):
    """Try to parse a kernel text description like: 1/6 * [[1,1],[1,1]]

    The text is split on its LAST ``*``: everything before it is the
    coefficient (which may itself contain ``*`` or ``**``, e.g. ``2*3`` or
    ``2**-1``), everything after it is the kernel literal.

    Args:

        text_eval (string): the string with the kernel expression

    Returns:

       string: left part of input string before the last * (the float 1. when
               the input has no coefficient part)

       list: right part of input string after the last *, parsed with
             ast.literal_eval

       string: latex expression corresponding to the text kernel input

    Raises:

       ValueError, SyntaxError: the kernel part is not a valid Python literal

       TypeError: a row of the kernel is not iterable

    """
    coeff_part, separator, kernel_part = text_eval.rpartition('*')
    list_kernel = ast.literal_eval(kernel_part.strip())

    # One LaTeX line per kernel row: "a & b & c \\"
    rows = "".join(" & ".join(map(str, row)) + " \\\\\n" for row in list_kernel)
    latex = "\\begin{bmatrix}\n" + rows + "\\end{bmatrix}"

    if not separator:
        # No coefficient given: neutral coefficient, matrix alone
        return 1., list_kernel, latex

    text_coeff = coeff_part.strip()
    return text_coeff, list_kernel, text_coeff + ' ' + latex
###
def get_img_fig(img):
    """Plot image with matplotlib, in order to have image size

    The figure is created as a standalone ``matplotlib.figure.Figure`` rather
    than through ``plt.figure()``: pyplot keeps every figure it creates in a
    global registry until it is explicitly closed, so calling this function
    on each script rerun would accumulate open figures.

    Args:

        img (Image): Image to show (array with a ``shape`` attribute; a
                     3-dimensional array is drawn as is, anything else is
                     drawn with a gray colormap)

    Returns:

        Matplotlib figure

    """
    # Local import: keeps the block self-contained without touching the
    # file-level imports (matplotlib is already a dependency of the file).
    from matplotlib.figure import Figure

    fig = Figure()
    axes = fig.subplots()
    if len(img.shape) == 3:
        axes.imshow(img, cmap=None)
    else:
        axes.imshow(img, cmap='gray')
    return fig

@st.fragment
def show_latex(latex_code):
    """Render a LaTeX expression in the page, as a Streamlit fragment.

    Args:

        latex_code (string): LaTeX expression to display

    """
    st.latex(body=latex_code)
###################################################################################################
##   STREAMLIT APP
###################################################################################################
st.title(''':orange[Image check and enhance for OCR task]''')
st.write("")
st.write("")
st.write("")
st.set_option("client.showErrorDetails", False)

dict_lang_ppocr, dict_interpolation, dict_thresholding_type, dict_adaptative_method = initializations()

cols = st.columns([0.25, 0.25, 0.5])
cols[0].markdown("#### :orange[Choose picture:]")
img_typ = cols[0].radio("#### :orange[Choose picture type:]", ['Upload file', 'Take a picture', 'Use a demo file'], \
                            index=0)
if img_typ == 'Upload file':
    image_file = cols[1].file_uploader("Upload a file:", type=["png","jpg","jpeg"])

if img_typ == 'Take a picture':
    image_file = cols[1].camera_input("Take a picture:")
if img_typ == 'Use a demo file':
    image_file = 'img_demo_enhance.png'

##----------- Process input image -----------------------------------------------------------------
if image_file is not None:
    img_cv2, image_path = load_image(image_file)

    cols[2].markdown('#### :orange[Original image]')
    cnt_img_ori = cols[2].container(height=300, border=False)
    #cnt_img_ori.image(img_cv2) #, use_container_width=True)
    cnt_img_ori.pyplot(get_img_fig(img_cv2))
    col1, col2 = st.columns([0.5, 0.5]) #gap="medium")

    col1.markdown('#### :orange[Processed image]')
    list_op = []

    if col1.checkbox("GrayScale"):
        try:
            img_first = cv2.cvtColor(img_cv2.copy(), cv2.COLOR_BGR2GRAY)
            list_op.append("Grayscale")
        except Exception as e:
            st.exception(e)
    else:
        img_first = img_cv2.copy()

    if col1.checkbox("Bit-wise inversion"):
        try:
            img_first = cv2.bitwise_not(img_first)
            list_op.append("Bit-wise inversion")
        except Exception as e:
            st.exception(e)

    # Processed image construction
    cnt_img_wrk = col1.container(height=500, border=False)
    img_processed = cnt_img_wrk.empty()
    img_wrk = img_first.copy()

    if st.session_state.resize:
        try:
            img_wrk = cv2.resize(img_wrk, None, fx=st.session_state.scaling_factor,
                                 fy=st.session_state.scaling_factor,
                                 interpolation=dict_interpolation[st.session_state.interpolation])
            list_op.append("Resize - fx="+str(st.session_state.scaling_factor)+", fy="+
                           str(st.session_state.scaling_factor)+", interpolation="+
                           st.session_state.interpolation)
        except Exception as e:
            st.exception(e)

    if st.session_state.rotate:
        try:
            img_wrk = imutils.rotate(img_wrk, angle=st.session_state.angle)
            list_op.append("Rotate - angle="+str(st.session_state.angle))
        except Exception as e:
            st.exception(e)

    if st.session_state.convolution:
        try:
            img_wrk = cv2.filter2D(src=img_wrk, ddepth=-1, kernel=st.session_state.convol_kernel)
            list_op.append("Filtering - Custom 2D Convolution - kernel="+ st.session_state.text_convol)
        except Exception as e:
            st.exception(e)

    if st.session_state.averaging:
        try:
            img_wrk = cv2.blur(src=img_wrk, ksize=st.session_state.averaging_kernel_size)
            list_op.append("Filtering - Averaging - kernel_size="+
                           str(st.session_state.averaging_kernel_size))
        except Exception as e:
            st.exception(e)

    if  st.session_state.gaussian_bluring:
        try:
            img_wrk = cv2.GaussianBlur(src=img_wrk, ksize=st.session_state.gb_kernel_size, \
                                    sigmaX=st.session_state.sigmaX, sigmaY=st.session_state.sigmaY)
            list_op.append("Filtering - Gaussian Blurring - ksize="+ \
                        str(st.session_state.gb_kernel_size)+", sigmaX="+
                        str(st.session_state.sigmaX)+", sigmaY="+str(st.session_state.sigmaY))
        except Exception as e:
            st.exception(e)

    if st.session_state.median_bluring:
        try:
            img_wrk = cv2.medianBlur(img_wrk, st.session_state.mb_kernel_size)
            list_op.append("Filtering - Median Blurring - kernel_size="+ \
                           str(st.session_state.mb_kernel_size))
        except Exception as e:
            st.exception(e)

    if st.session_state.bilateral_filtering:
        try:
            img_wrk = cv2.bilateralFilter(img_wrk, st.session_state.d, st.session_state.sigma_color,
                                         st.session_state.sigma_space)
            list_op.append("Filtering - Bilateral Filtering - d="+ str(st.session_state.d)+
                           ", sigma_color="+str(st.session_state.sigma_color)+ \
                           ", sigma_space="+str(st.session_state.sigma_space))
        except Exception as e:
            st.exception(e)

    if st.session_state.erosion:
        try:
            kernel = np.ones((st.session_state.erosion_kernel_size,
                              st.session_state.erosion_kernel_size),
                             np.uint8)
            img_wrk = cv2.erode(img_wrk, kernel, iterations=st.session_state.nb_iter_erosion)
            list_op.append("Erosion - kernel_size="+str(st.session_state.erosion_kernel_size)+ \
                           ", iterations="+str(st.session_state.nb_iter_erosion))
        except Exception as e:
            st.exception(e)

    if st.session_state.dilation:
        try:
            kernel = np.ones((st.session_state.dilation_kernel_size,
                              st.session_state.dilation_kernel_size),
                             np.uint8)
            img_wrk = cv2.dilate(img_wrk, kernel, iterations=st.session_state.nb_iter_dilation)
            list_op.append("Dilation - kernel_size="+str(st.session_state.dilation_kernel_size )+ \
                           ", iterations="+str(st.session_state.nb_iter_dilation))
        except Exception as e:
            st.exception(e)

    if st.session_state.binarization:
        try:
            ret, img_wrk = cv2.threshold(img_wrk, st.session_state.bin_thresh,
                                         st.session_state.bin_value,
                                         st.session_state.thresh_typ)
            list_op.append("Thresholding - thresh="+str(st.session_state.bin_thresh)+ \
                           ", maxval="+str(st.session_state.bin_value)+", type="+ \
                           st.session_state.bin_thresholding_type+", otsu="+ \
                           str(st.session_state.bin_otsu))
        except Exception as e:
            st.exception(e)

    if st.session_state.adaptative_thresh:
        try:
            img_wrk = cv2.adaptiveThreshold(img_wrk, st.session_state.at_max_value,
                                dict_adaptative_method[st.session_state.at_adaptative_method],
                                dict_thresholding_type[st.session_state.at_thresholding_type],
                                st.session_state.at_block_size, st.session_state.at_const)
            list_op.append("Adaptative thresholding - maxValue="+
                           str(st.session_state.at_max_value)+", adaptiveMethod="+
                           st.session_state.at_adaptative_method+", thresholdType"+
                           ", thresholding_type="+st.session_state.at_thresholding_type+
                           ", blockSize="+str(st.session_state.at_block_size)+", C="+
                           str(st.session_state.at_const))
        except Exception as e:
            st.exception(e)

    # Show image
    img_processed.pyplot(get_img_fig(img_wrk))
    st.session_state.processed_image = img_wrk

    # Process
    col2.markdown('#### :orange[Check & enhance]')

    with col2.expander(":blue[Image processing]", expanded=False):
        tab1, tab2, tab3, tab4, tab5 = \
                st.tabs(["Resize", "Rotate", "Filtering",
                          "Morphologie", "Thresholding"])
        with tab1: # Resize
            with tab1.form("Resize parameters"):
                st.session_state.scaling_factor = st.slider("Scaling factor :", 0.1, 20., 1., 0.1)
                cols_tab1 = st.columns([0.1, 0.9], gap="medium", vertical_alignment="center")
                cols_tab1[0].markdown("💬", help="""An interpolation function’s goal is

        to examine neighborhoods of pixels and use these neighborhoods to optically increase or decrease

        the size of the image without introducing distortions (or at least as few distortions

        as possible).\n

        ```cv2.INTER_LINEAR``` This option uses the bilinear interpolation algorithm. Unlike INTER_NEAREST,

        this does the interpolation in two dimensions and predicts the function used to calculate the color

        of a pixel. This algorithm is effective in handling visual distortions while zooming or

        enlarging an image.\n

        ```cv2.INTER_NEAREST``` This option uses the nearest neighbor interpolation algorithm. It retains

        the sharpness of the edges though the overall image may be blurred.\n

        ```cv2.INTER_LINEAR_EXACT```is a modification of ```INTER_LINEAR``` and both uses bilinear

        interpolation algorithm. The only difference is that the calculations in ```INTER_LINEAR_EXACT```

        are accurate to a bit.\n

        ```cv2.INTER_AREA``` option uses resampling using pixel area relation technique. While enlarging

        images, INTER_AREA work same as INTER_NEAREST. In other cases, ```INTER_AREA works``` better in

        image decimation and avoiding false inference patterns in images (moire pattern).\n

        ```cv2.INTER_CUBIC``` option uses bicubic interpolation technique. This is an extension of cubic

        interpolation technique and is used for 2 dimension regular grid patterns.\n

        ```cv2.INTER_LANCZOS4``` option uses Lanczos interpolation over 8 x 8 pixel neighborhood technique.

        It uses Fourier series and Chebyshev polynomials and is suited for images with large number of

        small size details.\n

        ```cv2.INTER_NEAREST_EXACT ``` is a modification of INTER_NEAREST with bit level accuracy.\n

        ```cv2.INTER_MAX ``` option uses mask for interpolation codes.\n

        ```cv2.WARP_FILL_OUTLIERS ``` interpolation technique skips the outliers during interpolation calculations.\n

        ```cv2.WARP_INVERSE_MAP ``` option uses inverse transformation technique for interpolation.\n""")
                cols_tab1[0].link_button("📚", "https://opencv.org/blog/resizing-and-rescaling-images-with-opencv/#h-resizing-with-different-interpolation-methods")
                st.session_state.interpolation = cols_tab1[1].selectbox("Interpolation method:",
                                                            list(dict_interpolation.keys()))
                c1, c2 = st.columns(2)
                apply_tab1 = c1.toggle("Apply", help="Click here to indicate whether the operation should be carried out or not, then validate with Confirm.", key=1)
                with c2:
                    submit_tab1 = st.form_submit_button(":green[Confirm]")

            if submit_tab1:
                st.session_state.resize = apply_tab1
                st.rerun()

        with tab2: # Rotate
            with tab2.form("Rotate parameters"):
                st.session_state.angle = st.slider("Angle :", 0, 360, 0, step=10)
                c1, c2 = st.columns(2)
                apply_tab2 = c1.toggle("Apply", help="Click here to indicate whether the operation should be carried out or not, then validate with Confirm.", key=2)
                with c2:
                    submit_tab2 = st.form_submit_button(":green[Confirm]")

            if submit_tab2:
                st.session_state.rotate = apply_tab2
                st.rerun()

        with tab3: # Filtering
            st.write("📚 :blue[*More about image filtering*]  👉  \

                        [here](https://learnopencv.com/image-filtering-using-convolution-in-opencv/)")
            selection = st.segmented_control("Filtering type",
                                            ["Custom 2D Convolution", "Blurring"],
                                            selection_mode="single")
            match selection:
                case "Custom 2D Convolution":
                    with st.form("tab3_1"):
                        st.write("📚 :blue[*More about convolution matrix*]  👉  \

                                    [here](https://en.wikipedia.org/wiki/Kernel_(image_processing))")
                        text_convol = st.text_input("Write your custom kernel here (example : 1/9 * [[1,1,1], [1,1,1], [1,1,1]]):",
                                                    value=None)
                        kernel = None
                        if text_convol is not None:
                            try:
                                text_coeff, list_kernel, latex_code = text_kernel_to_latex(text_convol)
                                coeff = eval_expr(text_coeff)
                                kernel = coeff * np.array(list_kernel)
                                show_latex(latex_code)
                            except Exception as e:
                                st.exception(e)
                                text_convol = None
                        else:
                            text_coeff, list_kernel, latex_code = \
                                        text_kernel_to_latex("1/9 * [[1,1,1], [1,1,1], [1,1,1]]")
                            show_latex(latex_code)

                        c1, c2 = st.columns(2)
                        apply_tab31 = c1.toggle("Apply", help="Click here to indicate whether the operation should be carried out or not, then validate with Confirm.", key=3)
                        with c2:
                            submit_tab31 = st.form_submit_button(":green[Confirm]")

                    if submit_tab31:
                        st.session_state.convolution = apply_tab31
                        st.session_state.text_convol = text_convol
                        st.session_state.convol_kernel = kernel
                        st.rerun()

                case "Blurring":
                    st.write("📚 :blue[*More about blurring techniques*]  👉  \

                                [here](https://docs.opencv.org/4.x/d4/d13/tutorial_py_filtering.html)")
                    b1, b2, b3, b4 = st.tabs(["Averaging", "Gaussian Blurring", "Median Blurring",
                                        "Bilateral Filtering"])
#                    typ_blurring = st.segmented_control("Bluring type",
#                                        ["Averaging", "Gaussian Blurring", "Median Blurring",
#                                        "Bilateral Filtering"],
#                                        selection_mode="multi")

                    with b1:
                        with st.form("tab_32a"):
                            st.markdown("💬 :green[Averaging?]",
                                            help="This is done by convolving an image with a normalized box filter.\

                                        It simply takes the average of all the pixels under the kernel \

                                        area and replaces the central element."
                                           )
                            kernel_width = st.slider("Kernel size width:", 2, 20, None, 1)
                            kernel_height = st.slider("Kernel size height:", 2, 20, None, 1)

                            c1, c2 = st.columns(2)
                            apply_tab32a = c1.toggle("Apply", help="Click here to indicate whether the operation should be carried out or not, then validate with Confirm.", key=4)
                            with c2:
                                submit_tab32a = st.form_submit_button(":green[Confirm]")

                        if submit_tab32a:
                            st.session_state.averaging = apply_tab32a
                            st.session_state.averaging_kernel_size = (kernel_width, kernel_height)
                            st.rerun()

                    with b2:
                        with st.form("tab_32b"):
                            st.markdown("💬 :green[Gaussian Blurringing?]",
                                                help="In this method, instead of a box filter, a Gaussian kernel is used. \

    We should specify the width and height of the kernel which should be positive and odd. \

    We also should specify the standard deviation in the X and Y directions, `sigmaX` and `sigmaY` respectively. \

    If only `sigmaX` is specified, `sigmaY` is taken as the same as sigmaX. If both are given as zeros, they are \

    calculated from the kernel size.\n \

    Gaussian blurring is highly effective in removing Gaussian noise from an image.")
                            kernel_width = st.slider("Kernel size width:", 2, 20, None, 1,)
                            kernel_height = st.slider("Kernel size height:", 2, 20, None, 1)
                            st.markdown("Standard deviations of the Gaussian kernel:",
                                        help="""The parameters `sigmaX` and `sigmaY` represent the standard deviations

                                                    of the Gaussian kernel in the horizontal (X) and vertical (Y) directions,

                                                    respectively. These values control the extent of blurring applied to the image.\n

    **Typical Values for sigmaX and sigmaY:**

    - Low values (e.g., 1–3): Apply a mild blur, useful for slight noise reduction while preserving image details.

    - Moderate values (e.g., 5–10): Produce a more noticeable blur, helpful for reducing more significant noise or smoothing out textures.

    - High values (e.g., >10): Result in a strong blur, which can be used for artistic effects or to obscure details.

    It's common practice to set sigmaX and sigmaY to 0. In this case, OpenCV calculates the standard deviations based on the kernel size (ksize).

    If only sigmaX is specified and sigmaY is set to 0, OpenCV uses the same value for both directions. \n

    **Recommendations:**

    - Specify sigmaX and sigmaY explicitly: For precise control over the blurring effect, define both parameters based on the desired outcome.

    - Use sigmaX = 0 and sigmaY = 0: To allow OpenCV to compute the standard deviations automatically from the kernel size.

    - Choose an appropriate kernel size: The ksize parameter should be a tuple of positive odd integers (e.g., (3, 3), (5, 5)).

                        """)
                            sigmaX = st.slider("sigmaX:", 0, 20, 0, 1)
                            sigmaY = st.slider("sigmaY:", 0, 20, 0, 1)

                            c1, c2 = st.columns(2)
                            apply_tab32b = c1.toggle("Apply", help="Click here to indicate whether the operation should be carried out or not, then validate with Confirm.", key=5)
                            with c2:
                                submit_tab32b = st.form_submit_button(":green[Confirm]")

                        if submit_tab32b:
                            st.session_state.gaussian_bluring = apply_tab32b
                            st.session_state.gb_kernel_size = (kernel_width, kernel_height)
                            st.session_state.sigmaX = sigmaX
                            st.session_state.sigmaY = sigmaY
                            st.rerun()

                    with b3:
                        with st.form("tab_32c"):
                            st.markdown("💬 :green[Median Blurring?]",
                                            help="It takes the median of all the pixels under the \

    kernel area and the central element is replaced with this median value.  Interestingly, in the above \

    filters, the central element is a newly calculated value which may be a pixel value in the image or a new value. \

    But in median blurring, the central element is always replaced by some pixel value in the image. \

    It reduces the noise effectively. Its kernel size should be a positive odd integer.\n \

    Median blurring is highly effective against salt-and-pepper noise in an image.")
                            kernel_size = st.slider("Kernel size:", 3, 15, None, 2, key=101)

                            c1, c2 = st.columns(2)
                            apply_tab32c = c1.toggle("Apply", help="Click here to indicate whether the operation should be carried out or not, then validate with Confirm.", key=6)
                            with c2:
                                submit_tab32c = st.form_submit_button(":green[Confirm]")

                        if submit_tab32c:
                            st.session_state.median_bluring = apply_tab32c
                            st.session_state.mb_kernel_size = kernel_size
                            st.rerun()

                    with b4:
                        with st.form("tab_32d"):
                            st.markdown("💬 :green[Bilateral Filtering?]",
                                        help="It is highly effective in noise removal while \

    keeping edges sharp. But the operation is slower compared to other filters. We already saw that a \

    Gaussian filter takes the neighbourhood around the pixel and finds its Gaussian weighted average. \

    This Gaussian filter is a function of space alone, that is, nearby pixels are considered while \

    filtering. It doesn't consider whether pixels have almost the same intensity. It doesn't consider \

    whether a pixel is an edge pixel or not. So it blurs the edges also, which we don't want to do.\n \

    Bilateral filtering also takes a Gaussian filter in space, but one more Gaussian filter which is \

    a function of pixel difference. \

    The Gaussian function of space makes sure that only nearby pixels are considered for blurring, \

    while the Gaussian function of intensity difference makes sure that only those pixels with similar \

    intensities to the central pixel are considered for blurring. \

    So it preserves the edges since pixels at edges will have large intensity variation.")
                            st.markdown("Diameter of each pixel neighborhood that is used during filtering:",
                                        help=""" **Effect:**\n

    A larger `d` value means that more neighboring pixels are considered in the filtering process, leading to a more pronounced

    blurring effect. Conversely, a smaller `d` focuses the filter on a tighter area, preserving more details.

    **Automatic Calculation:**\n

    If `d` is set to a non-positive value (e.g., 0 or negative), OpenCV automatically calculates it based on the sigmaSpace parameter.

    Specifically, the radius is computed as `radius = cvRound(sigmaSpace * 1.5)`, and then `d = radius * 2 + 1` to ensure it's an odd

    number. This ensures that the kernel has a central pixel. 

    **Typical Values for `d`:**\n

    The choice of d depends on the desired balance between noise reduction and edge preservation:

    - Small d (e.g., 5 to 9): Suitable for subtle smoothing while maintaining edge sharpness.

    - Medium d (e.g., 9 to 15): Offers a balance between noise reduction and detail preservation.

    - Large d (e.g., 15 and above): Provides stronger blurring, which may be useful for artistic effects but can lead to loss of

    fine details.

    **Recommendations:**\n

    - Large filters (d > 5) are very slow, so it is recommended to use `d=5` for real-time applications, and perhaps

    `d=9` for offline applications that need heavy noise filtering.

    - Start with Moderate Values: Begin with `d=9`, `sigmaColor=75`, and `sigmaSpace=75` as a baseline. Adjust these values based on

    the specific requirements of your application.

    - Consider Image Size: For larger images, you might need to increase `d` to achieve a noticeable effect. Conversely,

    for smaller images, a smaller `d` might suffice.

    - Balance with `sigmaColor` and `sigmaSpace`: Ensure that `d` is appropriately balanced with `sigmaColor` and

    `sigmaSpace`. An excessively large `sigmaSpace` with a small `d` might not utilize the full potential of the spatial filtering.

                                                """)
                            d_value = st.slider("d:", 3, 15, None, 2)
                            st.markdown("`sigmaColor` and `sigmaSpace`:", help="""

    `sigmaColor`: This parameter defines the filter sigma in the color space. A larger value means that pixels with more significant

    color differences will be mixed together, resulting in areas of semi-equal color.

    `sigmaSpace`: This parameter defines the filter sigma in the coordinate space. A larger value means that pixels farther apart

    will influence each other as long as their colors are close enough.\n

    These parameters work together to ensure that the filter smooths the image while preserving edges.

    **Typical Values for `sigmaColor` and `sigmaSpace`:**\n

    The choice of `sigmaColor` and `sigmaSpace` depends on the specific application and the desired effect.

    However, some commonly used values are:

    - `sigmaColor`: Values around 75 are often used for general smoothing while preserving edges.

    - `sigmaSpace`: Similarly, values around 75 are typical for maintaining edge sharpness while reducing noise.

    For example, applying the bilateral filter with `d=9`, `sigmaColor=75`, and `sigmaSpace=75` is a common practice.

    **Recommendations:**`\n

    - Start with Equal Values: Setting `sigmaColor` and `sigmaSpace` to the same value (e.g., 75) is a good starting point.

    - Adjust Based on Results: If the image appears too blurred, reduce the values. If noise is still present, increase them.

    - Consider Image Characteristics: For images with high noise, higher values may be necessary. For images where edge preservation

    is critical, lower values are preferable.""")
                            sigma_color = st.slider("sigmaColor", 1, 255, None, 1)
                            sigma_space = st.slider("sigmaSpace", 1, 255, None, 1)

                            c1, c2 = st.columns(2)
                            apply_tab32d = c1.toggle("Apply", help="Click here to indicate whether the operation should be carried out or not, then validate with Confirm.", key=7)
                            with c2:
                                submit_tab32d = st.form_submit_button(":green[Confirm]")

                        if submit_tab32d:
                            st.session_state.bilateral_filtering = apply_tab32d
                            st.session_state.d = d_value
                            st.session_state.sigma_color = sigma_color
                            st.session_state.sigma_space = sigma_space
                            st.rerun()

        with tab4: # Morphologie
            list_select = st.segmented_control("Morphological operation:",
                                              ["Erosion", 'Dilation'],
                                              selection_mode="multi")
            if "Erosion" in list_select:
                with st.form("tab_4a"):
                    st.markdown("💬 :green[Erosion?]",
                                    help="The basic idea of erosion is just like soil erosion only, it erodes \

    away the boundaries of foreground object (Always try to keep foreground in white). \

    So what it does? The kernel slides through the image (as in 2D convolution). A pixel in the \

    original image (either 1 or 0) will be considered 1 only if all the pixels under the kernel is 1, \

    otherwise it is eroded (made to zero). \n \

    So what happends is that, all the pixels near boundary will be discarded depending upon the \

    size of kernel. So the thickness or size of the foreground object decreases or simply white region \

    decreases in the image. \n\

    It is useful for removing small white noises, detach two connected objects etc. \n \

    :orange[**Best practice :** convert to grayscale before apply erosion.]")
                    kernel_size_ero = st.slider("Kernel size:", 3, 21, 3, 2, key=102)
                    nb_iter = st.slider('Iterations number:', 1, 7, 1, 1, key=201)

                    c1, c2 = st.columns(2)
                    apply_tab4a = c1.toggle("Apply", help="Click here to indicate whether the operation should be carried out or not, then validate with Confirm.", key=8)
                    with c2:
                        submit_tab4a = st.form_submit_button(":green[Confirm]")

                if submit_tab4a:
                    st.session_state.erosion = apply_tab4a
                    st.session_state.erosion_kernel_size = kernel_size_ero
                    st.session_state.nb_iter_erosion = nb_iter
                    st.rerun()

            if "Dilation" in list_select:
                with st.form("tab_4b"):
                    st.markdown("💬 :green[Dilation?]",
                                    help="The opposite of an erosion is a dilation. Just like an \

    erosion will eat away at the foreground pixels, a dilation will grow the foreground pixels. \

    Dilations increase the size of foreground objects and are especially useful for joining broken \

    parts of an image together. Dilations, just as an erosion, also utilize structuring elements \

    — a center pixel p of the structuring element is set to white if ANY pixel in the structuring \

    element is > 0. \n \

    :orange[**Best practice :** convert to grayscale before apply dilation.]")
                    kernel_size_dil = st.slider("Kernel size:", 3, 21, 3, 2, key=103)
                    nb_iter = st.slider('Iterations number:', 1, 7, 1, 1, key=202)
                    kernel = np.ones((kernel_size_dil,kernel_size_dil),np.uint8)

                    c1, c2 = st.columns(2)
                    apply_tab4b = c1.toggle("Apply", help="Click here to indicate whether the operation should be carried out or not, then validate with Confirm.", key=9)
                    with c2:
                        submit_tab4b = st.form_submit_button(":green[Confirm]")

                if submit_tab4b:
                    st.session_state.dilation = apply_tab4b
                    st.session_state.dilation_kernel_size = kernel_size_dil
                    st.session_state.nb_iter_dilation = nb_iter
                    st.rerun()

        with tab5: # Thresholding
            # Selector for the thresholding family; the `match` below renders the
            # configuration form of the chosen one. If `selection` matches neither
            # case, nothing is rendered in this tab.
            selection = st.segmented_control("Type:", ["Binarization", "Adaptative thresholding"])
            match selection:
                case "Binarization":
                    # Form collecting the parameters of a global threshold.
                    with st.form("tab5_a"):
                        st.markdown("💬 :green[What is thresholding?]",
                                    help='''Thresholding is the binarization of an image. In general, we seek to

                                            convert a grayscale image to a binary image, where the pixels are either

                                            0 or 255.

                                            A simple thresholding example would be selecting a threshold value T,

                                            and then setting all pixel intensities less than T to 0, and all pixel

                                            values greater than T to 255. In this way, we are able to create a binary

                                            representation of the image.''')
                        st.markdown("*:orange[⚠ Image must be in gray scale]*")
                        # Narrow left column: info popover; wide right column: type selector.
                        cols_tab1 = st.columns([0.1, 0.9], gap="medium", vertical_alignment="center")
                        with cols_tab1[1]:
                            thresholding_type = cols_tab1[1].selectbox("Thresholding type:",
                                                                    list(dict_thresholding_type.keys()))
                            with cols_tab1[0].popover(":material/info:", help="Help on thresholding type",
                                                    use_container_width=False):
                                st.link_button("📚:blue[cf. OpenCV documentation :]",
                                            "https://docs.opencv.org/3.0-beta/modules/imgproc/doc/miscellaneous_transformations.html#threshold")

                        thresh = st.slider("Thresh :", 0, 255, 255, 1)
                        # The "Value" slider is only created for the two binary types;
                        # every other type uses the fixed value 255.
                        # NOTE(review): assumes the keys of dict_thresholding_type are
                        # spelled "cv.THRESH_..." — confirm against its definition.
                        if thresholding_type in ["cv.THRESH_BINARY", "cv.THRESH_BINARY_INV"]:
                            value = st.slider("Value :", 0, 255, 255, 1)
                        else:
                            value = 255

                        cols_tab3 = st.columns(2, gap="medium", vertical_alignment="center")
                        otsu = cols_tab3[0].checkbox("Optimum Global Thresholding using Otsu’s Method?",
                                                    help='''Otsu’s method tries to find a threshold value

                                                        which minimizes the weighted within-class variance.

                                                        Since Variance is the spread of the distribution

                                                            about the mean. Thus, minimizing the within-class

                                                            variance will tend to make the classes compact.''')
                        cols_tab3[1].link_button("📚:blue[Documentation]",
                                                "https://theailearner.com/2019/07/19/optimum-global-thresholding-using-otsus-method/")

                        # Translate the selected label into the value stored in dict_thresholding_type.
                        thresh_typ = dict_thresholding_type[thresholding_type]

                        c1, c2 = st.columns(2)
                        apply_tab5a = c1.toggle("Apply", help="Click here to indicate whether the operation should be carried out or not, then validate with Confirm.", key=10)
                        with c2:
                            submit_tab5a = st.form_submit_button(":green[Confirm]")

                    # On confirmation: add the Otsu flag if requested, store every
                    # binarization setting in the session state, then rerun the script.
                    if submit_tab5a:
                        if otsu:
                            thresh_typ = thresh_typ+cv2.THRESH_OTSU
                        st.session_state.binarization = apply_tab5a
                        st.session_state.bin_thresh = thresh
                        st.session_state.bin_value = value
                        st.session_state.bin_thresholding_type = thresholding_type
                        st.session_state.bin_otsu = otsu
                        st.session_state.thresh_typ = thresh_typ
                        st.rerun()

                case "Adaptative thresholding":
                    # Form collecting the parameters of a per-pixel (adaptive) threshold.
                    with st.form("tab5_b"):
                        st.markdown("💬 :green[What is adaptative thresholding?]",
                                            help='''This is a usefull technique when dealing with images having non-uniform illumination.

                                            In this, the threshold value is calculated separately for each pixel using

                                            some statistics obtained from its neighborhood. This way we will get different thresholds

                                            for different image regions and thus tackles the problem of varying illumination.''')
                        st.markdown("*:orange[⚠ Image must be in gray scale]*")
                        # Only the first two entries of dict_thresholding_type are offered here.
                        thresholding_type = st.selectbox("Thresholding type:",
                                                        list(dict_thresholding_type.keys())[:2])
                        max_value = st.slider("Max value :", 0, 255, 255, 1,
                                              help="""This is the value assigned to the pixels after thresholding.

                                                This depends on the thresholding type. If the type is cv2.THRESH_BINARY,

                                                all the pixels greater than the threshold are assigned this maxValue.""")
                        adaptative_method = st.selectbox("Adaptative method:",
                                                         list(dict_adaptative_method.keys()),
                                                         help="""This tells us how the threshold is calculated from the pixel neighborhood.

                This currently supports two methods:

                - cv2.ADAPTIVE_THRESH_MEAN_C: In this, the threshold value is the mean of the neighborhood area.\n

                - cv2.ADAPTIVE_THRESH_GAUSSIAN_C: In this, the threshold value is the weighted sum of the

                neighborhood area. This uses Gaussian weights computed using getGaussiankernel() method.""")
                        # Slider runs from 3 in steps of 2, so only odd sizes can be picked
                        # (the help text explains why even sizes are invalid).
                        block_size = st.slider("Block size:", 3, 21, 3, 2,
                                               help='''**🔍 What is blockSize?**\n

                In adaptive thresholding, the threshold for each pixel is determined based on a local neighborhood around it.

                The blockSize parameter specifies the size of this neighborhood.

                Specifically, it defines the dimensions of the square region (of size blockSize × blockSize) centered on the pixel being processed.

                The threshold is then calculated based on the pixel values within this region.\n

                **✅ Acceptable Values for blockSize**\n

                Must be an odd integer greater than 1: This ensures that the neighborhood has a central pixel.

                Common choices: 3, 5, 7, 9, 11, 13, 15, etc.

                Even numbers are invalid: Using an even blockSize (e.g., 2, 4, 6) would result in an error because

                there would be no central pixel in the neighborhood.\n

                **🎯 Impact of blockSize on Thresholding**\n

                Smaller blockSize (e.g., 3 or 5):\n

                - Captures fine details and small variations in illumination.

                - May be more sensitive to noise.\n

                Larger blockSize (e.g., 15 or 21):\n

                - Provides smoother thresholding, reducing the effect of noise.

                - Might overlook small features or details.



                Choosing the appropriate blockSize depends on the specific characteristics of your image and the details you wish to preserve or suppress.''')
                        const = st.slider("C:", -10, 20, 0, 1,
                                          help='''The parameter C serves as a constant subtracted from the computed mean or weighted mean of the

                                                    neighborhood pixels. This subtraction fine-tunes the thresholding process, allowing for better control

                                                    over the binarization outcome.

                **🎯 Typical Values for C**

                The optimal value for C varies depending on the image's characteristics, such as lighting conditions and noise levels. Commonly used values include:

                - 2 to 10: These values are often effective for standard images with moderate lighting variations.

                - Higher values (e.g., 15 or 20): Useful for images with significant noise or when a more aggressive thresholding is needed.

                - Negative values: Occasionally used to make the thresholding more lenient, capturing lighter details that might otherwise be missed.



                It's advisable to experiment with different C values to determine the most suitable one for your specific application. ''')

                        c1, c2 = st.columns(2)
                        apply_tab5b = c1.toggle("Apply", help="Click here to indicate whether the operation should be carried out or not, then validate with Confirm.", key=11)
                        with c2:
                            submit_tab5b = st.form_submit_button(":green[Confirm]")

                    # On confirmation: store every adaptive-thresholding setting in the
                    # session state (labels are stored as selected, not translated),
                    # then rerun the script.
                    if submit_tab5b:
                        st.session_state.adaptative_thresh = apply_tab5b
                        st.session_state.at_max_value = max_value
                        st.session_state.at_adaptative_method = adaptative_method
                        st.session_state.at_thresholding_type = thresholding_type
                        st.session_state.at_block_size = block_size
                        st.session_state.at_const = const
                        st.rerun()

    # Two action buttons side by side under the first column:
    # left shows the list of operations, right prepares a PNG export.
    col1_a, col1_b = col1.columns(2)
    if col1_a.button("📃 :blue[List of operations]"):
        col1_a.write(list_op)

    if col1_b.button("Prepare download"):
        # A 2-D array is exported as 8-bit grayscale; anything else is
        # treated as BGR and reordered to RGB before being handed to PIL.
        is_grayscale = len(img_wrk.shape) == 2
        export_img = (
            Image.fromarray(img_wrk).convert("L")
            if is_grayscale
            else Image.fromarray(cv2.cvtColor(img_wrk, cv2.COLOR_BGR2RGB))
        )
        # Encode to PNG in memory and rewind so the button reads from the start.
        png_buffer = io.BytesIO()
        export_img.save(png_buffer, format='PNG')
        png_buffer.seek(0)
        col1_b.download_button(
            label="Download processed image",
            data=png_buffer,
            file_name="processed_image.png",
            mime="image/png",
            icon=":material/download:",
            on_click="ignore",
        )

    # Quick OCR preview: runs PaddleOCR on the current working image and shows
    # the detected boxes/texts/scores drawn next to the image.
    with col2.expander(":blue[Quick overview of OCR recognition (with PPOCR)]", expanded=True):
        with st.form("form1"):
            # Preselect "English" by name rather than by a fixed position in the
            # dictionary; fall back to the first entry if it is missing.
            lang_names = list(dict_lang_ppocr.keys())
            default_lang_idx = lang_names.index("English") if "English" in lang_names else 0
            key_ppocr_lang = st.selectbox("Choose language: :", lang_names, default_lang_idx)
            # Placeholder reused for the spinners and, finally, the result.
            res_cnt = st.empty()
            submit_detect = st.form_submit_button("Launch overview")

        ##----------- Process OCR --------------------------------------------------------------
        if submit_detect:
            with res_cnt, st.spinner("PPOCR initialization ..."):
                ocr = PaddleOCR(lang=dict_lang_ppocr[key_ppocr_lang])
            with res_cnt, st.spinner("OCR process ..."):
                result = ocr.ocr(img_wrk)

            # `ocr.ocr` returns one entry per image; that entry can be None (or
            # empty) when no text is detected, which must not be iterated.
            page_result = result[0] if result else None
            if not page_result:
                res_cnt.warning("No text detected in the image.")
            else:
                # The drawn image is displayed as RGB. 3-channel working images
                # are handled as BGR elsewhere in this file (the PNG export
                # converts BGR -> RGB), so convert here too to avoid swapped colors.
                if len(img_wrk.shape) == 3:
                    image = cv2.cvtColor(img_wrk, cv2.COLOR_BGR2RGB)
                else:
                    image = cv2.cvtColor(img_wrk, cv2.COLOR_GRAY2RGB)

                # Each detection is [box, (text, score)].
                boxes = [line[0] for line in page_result]
                txts = [line[1][0] for line in page_result]
                scores = [line[1][1] for line in page_result]

                im_show = draw_ocr(image, boxes, txts, scores, font_path='./fonts/french.ttf')
                im_show = Image.fromarray(im_show)
                res_cnt.image(im_show, use_container_width=True)