oya163
diff --git a/‎.gitignore
+2 b/‎.gitignore
+2
diff --git a/‎README.md
+37-13 b/‎README.md
+37-13
diff --git a/‎app.py
+134 b/‎app.py
+134
diff --git a/‎checkbox_detection.ipynb
+401 b/‎checkbox_detection.ipynb
+401
diff --git a/‎images/checkbox_detection_workflow.png
55.7 KB b/‎images/checkbox_detection_workflow.png
55.7 KB
diff --git a/‎images/checked_text_extraction.png
63.8 KB b/‎images/checked_text_extraction.png
63.8 KB
diff --git a/‎images/detected_checkbox_coordinates.png
151 KB b/‎images/detected_checkbox_coordinates.png
151 KB
diff --git a/‎images/sample.png
134 KB b/‎images/sample.png
134 KB
diff --git a/‎models/detector-model.pt
+3 b/‎models/detector-model.pt
+3
diff --git a/‎requirements.txt
+26 b/‎requirements.txt
+26
@@ -0,0 +1,2 @@
+.venv
+flagged/
@@ -1,13 +1,37 @@
----
-title: Checkbox Text Extraction
-emoji: 🔥
-colorFrom: blue
-colorTo: blue
-sdk: gradio
-sdk_version: 4.36.1
-app_file: app.py
-pinned: false
-license: apache-2.0
----
-
-Check out the configuration reference at https://huggingface.co/docs/hub/spaces-config-reference
+# Checkbox Detection and Text Extraction
+
+## Introduction
+
+- This tool helps you extract the checked text (the text next to a checked box).
+- It is built on top of [Checkbox-Detection](https://github.com/LynnHaDo/Checkbox-Detection) by [LynnHaDo](https://github.com/LynnHaDo).
+- It uses the **Euclidean distance** between each checked box found by the checkbox detection model and the text boxes found by the OCR to pick the text that belongs to the checked box.
+![Checkbox Text Extraction](images/checked_text_extraction.png "Checkbox Text Extraction")
+
+## Workflow
+![Checkbox Detection and corresponding text extraction](images/checkbox_detection_workflow.png "Checkbox Detection and Text Extraction Workflow")
+
+## Installation
+
+    # Create virtual environment
+    python3.11 -m venv .venv
+
+    # Activate the virtual environment
+    source .venv/bin/activate
+
+    # Install the requirements from requirements.txt
+    pip install -r requirements.txt
+
+    # Install poppler-utils
+    sudo apt-get install poppler-utils
+
+## Demo
+
+This is currently deployed on [HuggingFace Spaces](https://huggingface.co/spaces/oyashi163/checkbox_text_extraction).
+
+## Note
+
+Please use the sample image provided in the `images` folder for testing purposes.
+You might want to modify the OCR parameters for your own images to get more accurate results.
+
+## References
+- https://github.com/LynnHaDo/Checkbox-Detection
@@ -0,0 +1,134 @@
+import math
+import gradio as gr
+import easyocr
+import cv2
+from ultralytics import YOLO 
+
+# Load OCR model into memory
+reader = easyocr.Reader(['en']) # English-only reader; created once at import time so every call to checkbox_text_extract reuses the loaded model
+
+# Define constants
+# Color per detection class. NOTE: detect_checkbox turns a class index into a
+# class name with list(BOX_COLORS)[index], so the key order must not change.
+# NOTE(review): these tuples are passed to cv2 drawing calls on an image read
+# by cv2.imread, which presumably treats them as (B, G, R) - confirm the colors.
+BOX_COLORS = {
+    "unchecked": (242, 48, 48),
+    "checked": (38, 115, 101),
+    "block": (242, 159, 5)
+}
+# Padding (in pixels) around the confidence label drawn on a detected box
+BOX_PADDING = 2
+
+# Load models
+# Checkbox detector weights, loaded once at import time
+DETECTION_MODEL = YOLO("models/detector-model.pt") 
+
+def detect_checkbox(image_path):
+    """
+    Output inference image with bounding box
+    Args:
+    - image: to check for checkboxes
+    Return: image with bounding boxes drawn and box coordinates
+    """
+    image = cv2.imread(image_path)
+    if image is None:
+        return image
+    
+    # Predict on image
+    results = DETECTION_MODEL.predict(source=image, conf=0.1, iou=0.8) # Predict on image
+    boxes = results[0].boxes # Get bounding boxes
+
+    if len(boxes) == 0:
+        return image
+    
+    box_coordinates = []
+
+    # Get bounding boxes
+    for box in boxes:
+        detection_class_conf = round(box.conf.item(), 2)
+        detection_class = list(BOX_COLORS)[int(box.cls)]
+        # Get start and end points of the current box
+        start_box = (int(box.xyxy[0][0]), int(box.xyxy[0][1]))
+        end_box = (int(box.xyxy[0][2]), int(box.xyxy[0][3]))
+        box = image[start_box[1]:end_box[1], start_box[0]: end_box[0], :]
+        
+        if detection_class == 'checked':
+            box_coordinates.append((start_box, end_box))
+            
+            # 01. DRAW BOUNDING BOX OF OBJECT
+            line_thickness = round(0.002 * (image.shape[0] + image.shape[1]) / 2) + 1
+            image = cv2.rectangle(img=image, 
+                                pt1=start_box, 
+                                pt2=end_box,
+                                color=BOX_COLORS['checked'], 
+                                thickness = line_thickness) # Draw the box with predefined colors
+            
+            image = cv2.putText(img=image, org=start_box, text=detection_class, fontFace=0, color=(0,0,0), fontScale=line_thickness/3)
+
+            # 02. DRAW LABEL
+            text = str(detection_class_conf)
+            # Get text dimensions to draw wrapping box
+            font_thickness =  max(line_thickness - 1, 1)
+            (text_w, text_h), _ = cv2.getTextSize(text=text, fontFace=2, fontScale=line_thickness/3, thickness=font_thickness)
+            # Draw wrapping box for text
+            image = cv2.rectangle(img=image,
+                                  pt1=(start_box[0], start_box[1] - text_h - BOX_PADDING*2),
+                                  pt2=(start_box[0] + text_w + BOX_PADDING * 2, start_box[1]),
+                                  color=BOX_COLORS['checked'],
+                                  thickness=-1)
+            # Put class name on image
+            start_text = (start_box[0] + BOX_PADDING, start_box[1] - BOX_PADDING)
+            image = cv2.putText(img=image, text=text, org=start_text, fontFace=0, color=(255,255,255), fontScale=line_thickness/3, thickness=font_thickness)
+        
+    return image, box_coordinates
+
+def euclidean_distance(coord1, coord2):
+    return math.sqrt((coord1[0] - coord2[0])**2 + (coord1[1] - coord2[1])**2)
+
+def nearest_coordinate(target_coord, coordinates):
+    min_distance = float('inf')
+    nearest_coord = None
+    
+    for coord in coordinates:
+        distance = euclidean_distance(target_coord, coord)
+        if distance < min_distance:
+            min_distance = distance
+            nearest_coord = coord
+    
+    
+    return nearest_coord, euclidean_distance(target_coord, nearest_coord)
+
+def checkbox_text_extract(image_filename):
+    checkbox_img, checkbox_coordinates = detect_checkbox(image_filename)
+    
+    result = reader.readtext(image_filename, decoder = 'beamsearch',
+                    text_threshold = 0.8, low_text = 0.2, link_threshold = 0.4,
+                    canvas_size = 1500, mag_ratio = 1.5,
+                    slope_ths = 0.1, ycenter_ths = 0.8, height_ths = 0.8,
+                    width_ths = 1.0, y_ths = 0.8, x_ths = 1.0, add_margin = 0.1)
+    
+    # Get the bottom right coordinates of the CHECKED checkbox
+    checkbox_bottom_right_coord = []
+
+    for each in checkbox_coordinates:
+        checkbox_bottom_right_coord.append((each[1][0], each[0][1]))
+
+    # Sort based on the coordinates
+    checkbox_bottom_right_coord = sorted(checkbox_bottom_right_coord, key=lambda point: point[1])
+
+    detected_text = {}
+
+    for index, each in enumerate(result):
+        x_coord = int(each[0][0][0])
+        y_coord = int(each[0][0][1])
+        detected_text[(x_coord, y_coord)] = each[1]
+        
+    checked_text = ''
+    for each_checkbox_coord in checkbox_bottom_right_coord:
+        nearest, distance = nearest_coordinate(each_checkbox_coord, list(detected_text.keys()))
+        if distance <= 15:
+            checked_text += f"- {detected_text[nearest]}\n"
+
+    return checked_text
+
+
+iface = gr.Interface(fn=checkbox_text_extract, 
+                     inputs=gr.Image(label="Upload image having checkboxes and text", type="filepath"), 
+                     outputs=gr.Markdown())
+
+iface.launch()
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:9c7c3b6f1858e045cec68db2fd3b2c28c6d67fa937ed34cf2a20231dc3ea2e8e
+size 87617854
@@ -0,0 +1,26 @@
+certifi==2022.9.24
+chardet==5.1.0
+charset-normalizer==3.0.1
+cryptography==38.0.4
+distlib==0.3.6
+filelock==3.9.0
+GDAL==3.6.2
+httplib2==0.20.4
+idna==3.3
+ntpsec==1.2.2
+numpy==1.24.2
+pipenv==2022.12.19
+platformdirs==2.6.0
+pycurl==7.45.2
+pyOpenSSL==23.0.0
+pyparsing==3.0.9
+PySimpleSOAP==1.16.2
+python-apt==2.6.0
+python-debian==0.1.49
+python-debianbts==4.0.1
+reportbug==12.0.0
+requests==2.28.1
+six==1.16.0
+urllib3==1.26.12
+virtualenv==20.17.1+ds
+virtualenv-clone==0.3.0
Original file line number	Diff line number	Diff line change
`@@ -0,0 +1,3 @@`
	`1`	`+version https://git-lfs.github.com/spec/v1`
	`2`	`+oid sha256:9c7c3b6f1858e045cec68db2fd3b2c28c6d67fa937ed34cf2a20231dc3ea2e8e`
	`3`	`+size 87617854`