SHA1
--- a/home/jinja2/home/grid.html
+++ b/home/jinja2/home/grid.html
@@ -0,0 +1,43 @@
 
				+<!DOCTYPE html>
			
 
				+<html>
			
 
				+    <head>
			
 
				+        <meta charset="UTF-8">
			
 
				+        <title>Crossword</title>
			
 
				+        <style>
			
 
				+            .crossword {
			
 
				+                border-right: 1px solid;
			
 
				+                border-bottom: 1px solid;
			
 
				+            }
			
 
				+            .crossword td {
			
 
				+                border-left: 1px solid;
			
 
				+                border-top: 1px solid;
			
 
				+            }
			
 
				+            .crossword td.filled {
			
 
				+                background: black;
			
 
				+            }
			
 
				+        </style>
			
 
				+    </head>
			
 
				+    <body>
			
 
				+        <table border=0 cellspacing=0 cellpadding=0 class="crossword">
			
 
				+            {%- set tab_index = namespace(value=1) %}
			
 
				+            {%- set blank = '&emsp;'|safe %}
			
 
				+            {%- for row in range(num_rows) %}
			
 
				+                <tr>
			
 
				+                    {%- for col in range(num_cols) %}
			
 
				+                        {%- if grid[row][col].filled %}
			
 
				+                            <td class="filled">&emsp;</td>
			
 
				+                        {%- else %}
			
 
				+                            <td class="empty" tabindex="{{ tab_index.value }}">
			
 
				+                                {{ grid[row][col].number|default(blank) }}
			
 
				+                            </td>
			
 
				+                            {%- set tab_index.value = tab_index.value + 1 %}
			
 
				+                        {%- endif %}
			
 
				+                    {%- endfor %}
			
 
				+                </tr>
			
 
				+            {%- endfor %}
			
 
				+        </table>
			
 
				+    </body>
			
 
				+</html>
			
 
				+<!--
			
 
				+vim:ts=4:sw=4:expandtab
			
 
				+-->
			
--- a/home/jinja2/home/index.html
+++ b/home/jinja2/home/index.html
@@ -0,0 +1,16 @@
 
				+<!DOCTYPE html>
			
 
				+<html>
			
 
				+    <head>
			
 
				+        <meta charset="UTF-8">
			
 
				+        <title>Crossword Extractor</title>
			
 
				+    </head>
			
 
				+    <body>
			
 
				+        <form enctype="multipart/form-data" method="post" action="">
			
 
				+            <div>{{ form }}</div>
			
 
				+            <div><input type="submit" value="Upload"></div>
			
 
				+        </form>
			
 
				+    </body>
			
 
				+</html>
			
 
				+<!--
			
 
				+vim:ts=4:sw=4:expandtab
			
 
				+-->
			
--- a/home/jinja2/home/output.html
+++ b/home/jinja2/home/output.html
@@ -0,0 +1,33 @@
 
				+<!DOCTYPE html>
			
 
				+<html>
			
 
				+    <head>
			
 
				+        <meta charset="UTF-8">
			
 
				+        <title>Extracted Crossword</title>
			
 
				+        <style>
			
 
				+            img {
			
 
				+                width: 600px;
			
 
				+            }
			
 
				+        </style>
			
 
				+    </head>
			
 
				+    <body>
			
 
				+        {% if warnings %}
			
 
				+        <div>
			
 
				+            Warnings:
			
 
				+            <ul>
			
 
				+                {% for warning in warnings %}
			
 
				+                    <li>{{ warning }}</li>
			
 
				+                {% endfor %}
			
 
				+            </ul>
			
 
				+        </div>
			
 
				+        {% endif %}
			
 
				+        <div>
			
 
				+            <a href="{{ image_url }}" download="{{ image_file_name }}">Download</a>
			
 
				+        </div>
			
 
				+        <div>
			
 
				+            <img alt="Crossword" src="{{ image_url }}">
			
 
				+        </div>
			
 
				+    </body>
			
 
				+</html>
			
 
				+<!--
			
 
				+vim:ts=4:sw=4:expandtab
			
 
				+-->
			
--- a/home/management/__init__.py
+++ b/home/management/__init__.py
--- a/home/management/commands/__init__.py
+++ b/home/management/commands/__init__.py
--- a/home/management/commands/extract.py
+++ b/home/management/commands/extract.py
@@ -0,0 +1,104 @@
 
				+import cv2
			
 
				+from django.core.management.base import BaseCommand
			
 
				+from django.template.loader import render_to_string
			
 
				+from ...xword import extract_crossword_grid, draw_grid
			
 
				+
			
 
				+
			
 
				+class Command(BaseCommand):
			
 
				+    help = "Extracts a clean crossword image from a photograph."
			
 
				+
			
 
				+    def add_arguments(self, parser):
			
 
				+        parser.add_argument('input_file_name')
			
 
				+
			
 
				+        parser.add_argument('--debug', action='store_true')
			
 
				+
			
 
				+        parser.add_argument('--remove-colours', action='store_true')
			
 
				+        parser.add_argument('--colour-removal-threshold', type=int, default=48)
			
 
				+
			
 
				+        parser.add_argument('--gaussian-blur-size', type=int, default=11)
			
 
				+        parser.add_argument('--adaptive-threshold-block-size', type=int, default=11)
			
 
				+        parser.add_argument('--adaptive-threshold-mean-adjustment', type=int, default=2)
			
 
				+
			
 
				+        parser.add_argument('--not-square', action='store_true')
			
 
				+
			
 
				+        parser.add_argument('--num-dilations', type=int, default=1)
			
 
				+
			
 
				+        parser.add_argument('--contour-erosion-kernel-size', type=int, default=5)
			
 
				+        parser.add_argument('--contour-erosion-iterations', type=int, default=5)
			
 
				+        parser.add_argument('--line-detector-element-size', type=int, default=51)
			
 
				+
			
 
				+        parser.add_argument('--sampling-block-size-ratio', type=float, default=0.25)
			
 
				+        parser.add_argument('--sampling-threshold-quantile', type=float, default=0.3)
			
 
				+        parser.add_argument('--sampling-threshold', type=int)
			
 
				+
			
 
				+        parser.add_argument('--grid-line-thickness', type=int, default=4)
			
 
				+        parser.add_argument('--grid-square-size', type=int, default=64)
			
 
				+        parser.add_argument('--grid-border-size', type=int, default=20)
			
 
				+
			
 
				+        group = parser.add_mutually_exclusive_group()
			
 
				+        group.add_argument('--out')
			
 
				+        group.add_argument('--html')
			
 
				+
			
 
				+    def handle(self, *args, **options):
			
 
				+        warnings, grid, num_rows, num_cols, block_img = extract_crossword_grid(
			
 
				+            options['input_file_name'],
			
 
				+            callback=debug_callback if options['debug'] else None,
			
 
				+            remove_colours=options['remove_colours'],
			
 
				+            colour_removal_threshold=options['colour_removal_threshold'],
			
 
				+            gaussian_blur_size=options['gaussian_blur_size'],
			
 
				+            adaptive_threshold_block_size=options['adaptive_threshold_block_size'],
			
 
				+            adaptive_threshold_mean_adjustment=options['adaptive_threshold_mean_adjustment'],
			
 
				+            square=not options['not_square'],
			
 
				+            num_dilations=options['num_dilations'],
			
 
				+            contour_erosion_kernel_size=options['contour_erosion_kernel_size'],
			
 
				+            contour_erosion_iterations=options['contour_erosion_iterations'],
			
 
				+            line_detector_element_size=options['line_detector_element_size'],
			
 
				+            sampling_block_size_ratio=options['sampling_block_size_ratio'],
			
 
				+            sampling_threshold_quantile=options['sampling_threshold_quantile'],
			
 
				+            sampling_threshold=options['sampling_threshold']
			
 
				+        )
			
 
				+
			
 
				+        if options['debug']:
			
 
				+            debug_callback('square', block_img)
			
 
				+
			
 
				+        for warning in warnings:
			
 
				+            print('WARNING: ' + warning)
			
 
				+
			
 
				+        if options['html'] is not None:
			
 
				+            html = render_to_string('home/grid.html', {
			
 
				+                'grid': grid,
			
 
				+                'num_rows': num_rows,
			
 
				+                'num_cols': num_cols,
			
 
				+            })
			
 
				+
			
 
				+            with open(options['html'], 'w') as f:
			
 
				+                f.write(html)
			
 
				+
			
 
				+        else:
			
 
				+            image = draw_grid(
			
 
				+                grid,
			
 
				+                num_rows,
			
 
				+                num_cols,
			
 
				+                grid_line_thickness=options['grid_line_thickness'],
			
 
				+                grid_square_size=options['grid_square_size'],
			
 
				+                grid_border_size=options['grid_border_size']
			
 
				+            )
			
 
				+
			
 
				+            if options['debug'] or (options['out'] is None):
			
 
				+                debug_callback('output', image)
			
 
				+
			
 
				+            if options['out'] is not None:
			
 
				+                _, png = cv2.imencode('.png', image)
			
 
				+
			
 
				+                with open(options['out'], 'wb') as f:
			
 
				+                    f.write(png.tobytes())
			
 
				+
			
 
				+        if options['debug'] or (options['out'] is None):
			
 
				+            while cv2.waitKey() & 0xFF != ord('q'):
			
 
				+                pass
			
 
				+            cv2.destroyAllWindows()
			
 
				+
			
 
				+
			
 
				+def debug_callback(name, image):
			
 
				+    cv2.namedWindow(name, cv2.WINDOW_NORMAL)
			
 
				+    cv2.imshow(name, image)
			
--- a/home/templates/home/index.html
+++ b/home/templates/home/index.html
@@ -1,16 +0,0 @@
 
				-<!DOCTYPE html>
			
 
				-<html>
			
 
				-  <head>
			
 
				-    <meta charset="UTF-8">
			
 
				-    <title>Crossword Extractor</title>
			
 
				-  </head>
			
 
				-  <body>
			
 
				-    <form enctype="multipart/form-data" method="post" action="">
			
 
				-      <div>{{ form }}</div>
			
 
				-      <div><input type="submit" value="Upload"></div>
			
 
				-    </form>
			
 
				-  </body>
			
 
				-</html>
			
 
				-<!--
			
 
				-vim:ts=2:sw=2:expandtab
			
 
				--->
			
--- a/home/templates/home/output.html
+++ b/home/templates/home/output.html
@@ -1,33 +0,0 @@
 
				-<!DOCTYPE html>
			
 
				-<html>
			
 
				-  <head>
			
 
				-    <meta charset="UTF-8">
			
 
				-    <title>Extracted Crossword</title>
			
 
				-    <style>
			
 
				-      img {
			
 
				-        width: 600px;
			
 
				-      }
			
 
				-    </style>
			
 
				-  </head>
			
 
				-  <body>
			
 
				-    {% if warnings %}
			
 
				-    <div>
			
 
				-      Warnings:
			
 
				-      <ul>
			
 
				-        {% for warning in warnings %}
			
 
				-          <li>{{ warning }}</li>
			
 
				-        {% endfor %}
			
 
				-      </ul>
			
 
				-    </div>
			
 
				-    {% endif %}
			
 
				-    <div>
			
 
				-      <a href="{{ image_url }}" download="{{ image_file_name }}">Download</a>
			
 
				-    </div>
			
 
				-    <div>
			
 
				-      <img alt="Crossword" src="{{ image_url }}">
			
 
				-    </div>
			
 
				-  </body>
			
 
				-</html>
			
 
				-<!--
			
 
				-vim:ts=2:sw=2:expandtab
			
 
				--->
			
--- a/home/views.py
+++ b/home/views.py
@@ -1,10 +1,11 @@
 
				 from base64 import b64encode
			
 
				+import cv2
			
 
				 from datetime import datetime
			
 
				 from django.http import HttpResponse, HttpResponseBadRequest
			
 
				 from django.shortcuts import render
			
 
				 from django.views import View
			
 
				 from .forms import CrosswordForm
			
 
				-from .xword import extract_crossword
			
 
				+from .xword import extract_crossword_grid, draw_grid
			
 
				 
			
 
				 
			
 
				 class HomeView(View):
			
@@ -15,9 +16,14 @@ class HomeView(View):
 
				         form = CrosswordForm(request.POST, request.FILES)
			
 
				         if not form.is_valid():
			
 
				             return HttpResponseBadRequest('Invalid form data')
			
 
				-        image, warnings = extract_crossword(form.cleaned_data['file'].temporary_file_path())
			
 
				+        warnings, grid, num_rows, num_cols, block_img = extract_crossword_grid(
			
 
				+            form.cleaned_data['file'].temporary_file_path(),
			
 
				+            remove_colours=False
			
 
				+        )
			
 
				+        image = draw_grid(grid, num_rows, num_cols)
			
 
				+        _, png = cv2.imencode('.png', image)
			
 
				         return render(request, 'home/output.html', {
			
 
				             'warnings': warnings,
			
 
				             'image_file_name': 'xword_{}.png'.format(datetime.now().strftime('%Y%m%d_%H%M%S')),
			
 
				-            'image_url': 'data:image/png;base64,' + b64encode(image).decode()
			
 
				+            'image_url': 'data:image/png;base64,' + b64encode(png.tobytes()).decode()
			
 
				         })
			
--- a/home/xword.py
+++ b/home/xword.py
@@ -5,6 +5,25 @@ import copy
 
				 import argparse
			
 
				 
			
 
				 
			
 
				+def non_greys_to_white(img, threshold=48):
			
 
				+    b, g, r = cv2.split(img)
			
 
				+    rgb_diff = cv2.subtract(cv2.max(cv2.max(b, g), r), cv2.min(cv2.min(b, g), r))
			
 
				+    filtered = img.copy()
			
 
				+    filtered[np.where(rgb_diff > threshold)] = (255, 255, 255)
			
 
				+    return filtered
			
 
				+
			
 
				+
			
 
				+def load_image_as_greyscale(file_name, filter_colours, colour_filter_threshold):
			
 
				+    img = cv2.imread(file_name)
			
 
				+    if img is None:
			
 
				+        raise RuntimeError("Failed to load image")
			
 
				+
			
 
				+    if filter_colours:
			
 
				+        img = non_greys_to_white(img, colour_filter_threshold)
			
 
				+
			
 
				+    return cv2.cvtColor(img, cv2.COLOR_BGR2GRAY)
			
 
				+
			
 
				+
			
 
				 def preprocess_image(original, gaussian_blur_size, adaptive_threshold_block_size, adaptive_threshold_mean_adjustment, num_dilations):
			
 
				     img = cv2.GaussianBlur(original, (gaussian_blur_size, gaussian_blur_size), 0)
			
 
				     img = cv2.adaptiveThreshold(img, 255, cv2.ADAPTIVE_THRESH_GAUSSIAN_C, cv2.THRESH_BINARY_INV, adaptive_threshold_block_size, adaptive_threshold_mean_adjustment)
			
@@ -136,25 +155,41 @@ def extract_grid_colours(img, num_rows, num_cols, sampling_block_size_ratio):
 
				 def grid_colours_to_blocks(grid_colours, num_rows, num_cols, sampling_threshold):
			
 
				     grid = copy.deepcopy(grid_colours)
			
 
				     warning = False
			
 
				-    for row in range(round(num_rows / 2)):
			
 
				+
			
 
				+    midpoint = num_rows // 2 + (0 if num_rows % 2 == 0 else 1)
			
 
				+    for row in range(midpoint):
			
 
				         for col in range(num_cols):
			
 
				+            # If there is an odd number of rows then row and row2 will point to
			
 
				+            # the same row when we reach the middle. Doesn't seem worth adding a
			
 
				+            # special case.
			
 
				             row2 = num_rows - row - 1
			
 
				             col2 = num_cols - col - 1
			
 
				             delta1 = grid_colours[row][col] - sampling_threshold
			
 
				             delta2 = grid_colours[row2][col2] - sampling_threshold
			
 
				 
			
 
				             if (delta1 > 0) and (delta2 > 0):
			
 
				-                block = 0
			
 
				+                filled = False
			
 
				             elif (delta1 < 0) and (delta2 < 0):
			
 
				-                block = 1
			
 
				+                filled = True
			
 
				             else:
			
 
				                 warning = True
			
 
				                 if abs(delta1) > abs(delta2):
			
 
				-                    block = 1 if delta1 < 0 else 0
			
 
				+                    filled = delta1 < 0
			
 
				                 else:
			
 
				-                    block = 1 if delta2 < 0 else 0
			
 
				+                    filled = delta2 < 0
			
 
				+
			
 
				+            grid[row][col] = {'filled': filled}
			
 
				+            grid[row2][col2] = {'filled': filled}
			
 
				 
			
 
				-            grid[row][col] = grid[row2][col2] = block
			
 
				+    number = 1
			
 
				+    for row in range(num_rows):
			
 
				+        for col in range(num_cols):
			
 
				+            if (not grid[row][col]['filled'] and (
			
 
				+                (((col == 0) or grid[row][col - 1]['filled']) and (col < num_cols - 1) and not grid[row][col + 1]['filled']) or
			
 
				+                (((row == 0) or grid[row - 1][col]['filled']) and (row < num_rows - 1) and not grid[row + 1][col]['filled'])
			
 
				+            )):
			
 
				+                grid[row][col]['number'] = number
			
 
				+                number += 1
			
 
				 
			
 
				     return warning, grid
			
 
				 
			
@@ -169,38 +204,32 @@ def draw_point(image, point, colour):
 
				                 image[y, x] = colour
			
 
				 
			
 
				 
			
 
				-def show_image(image):
			
 
				-    cv2.namedWindow('xword', cv2.WINDOW_NORMAL)
			
 
				-    cv2.imshow('xword', image)
			
 
				-    while cv2.waitKey() & 0xFF != ord('q'):
			
 
				-        pass
			
 
				-    cv2.destroyAllWindows()
			
 
				-
			
 
				-
			
 
				-def extract_crossword(
			
 
				+def extract_crossword_grid(
			
 
				     file_name,
			
 
				+    callback=None,
			
 
				+    remove_colours=False,
			
 
				+    colour_removal_threshold=48,
			
 
				     gaussian_blur_size=11,
			
 
				     adaptive_threshold_block_size=11,
			
 
				     adaptive_threshold_mean_adjustment=2,
			
 
				     square=True,
			
 
				     num_dilations=1,
			
 
				     contour_erosion_kernel_size=5,
			
 
				-    contour_erosion_iterations=6,
			
 
				+    contour_erosion_iterations=5,
			
 
				     line_detector_element_size=51,
			
 
				     sampling_block_size_ratio=0.25,
			
 
				     sampling_threshold_quantile=0.3,
			
 
				-    sampling_threshold=None,
			
 
				-    grid_line_thickness=4,
			
 
				-    grid_square_size=64,
			
 
				-    grid_border_size=20,
			
 
				+    sampling_threshold=None
			
 
				 ):
			
 
				     warnings = []
			
 
				 
			
 
				-    original = cv2.imread(file_name, cv2.IMREAD_GRAYSCALE)
			
 
				-    if original is None:
			
 
				-        raise RuntimeError("Failed to load image")
			
 
				+    original = load_image_as_greyscale(file_name, remove_colours, colour_removal_threshold)
			
 
				+    if callback is not None:
			
 
				+        callback('original', original)
			
 
				 
			
 
				     img = preprocess_image(original, gaussian_blur_size, adaptive_threshold_block_size, adaptive_threshold_mean_adjustment, num_dilations)
			
 
				+    if callback is not None:
			
 
				+        callback('preprocessed', img)
			
 
				 
			
 
				     biggest = find_biggest_contour(img)
			
 
				     biggest = erode_contour(img.shape, biggest, contour_erosion_kernel_size, contour_erosion_iterations)
			
@@ -208,6 +237,8 @@ def extract_crossword(
 
				     top_left, top_right, bottom_right, bottom_left = get_contour_corners(img, biggest)
			
 
				 
			
 
				     img = extract_square(img, top_left, top_right, bottom_right, bottom_left)
			
 
				+    if callback is not None:
			
 
				+        callback('pre-fft', img)
			
 
				 
			
 
				     num_rows = get_line_frequency(img, line_detector_element_size, 1)
			
 
				     num_cols = get_line_frequency(img, line_detector_element_size, 0)
			
@@ -226,6 +257,17 @@ def extract_crossword(
 
				     if warning:
			
 
				         warnings.append("Some blocks may be the wrong colour")
			
 
				 
			
 
				+    return warnings, grid, num_rows, num_cols, block_img
			
 
				+
			
 
				+
			
 
				+def draw_grid(
			
 
				+    grid,
			
 
				+    num_rows,
			
 
				+    num_cols,
			
 
				+    grid_line_thickness=4,
			
 
				+    grid_square_size=64,
			
 
				+    grid_border_size=20
			
 
				+):
			
 
				     step = grid_square_size + grid_line_thickness
			
 
				     grid_height = num_rows * step + grid_line_thickness
			
 
				     grid_width = num_cols * step + grid_line_thickness
			
@@ -234,9 +276,7 @@ def extract_crossword(
 
				     for row in range(num_rows):
			
 
				         y = row * step + grid_line_thickness + grid_border_size
			
 
				         for col in range(num_cols):
			
 
				-            if grid[row][col] == 0:
			
 
				+            if not grid[row][col]['filled']:
			
 
				                 x = col * step + grid_line_thickness + grid_border_size
			
 
				                 cv2.rectangle(output, (x, y), (x + grid_square_size - 1, y + grid_square_size - 1), 255, -1)
			
 
				-
			
 
				-    _, png = cv2.imencode('.png', output)
			
 
				-    return png.tobytes(), warnings
			
 
				+    return output
			
--- a/requirements.in
+++ b/requirements.in
@@ -1,4 +1,6 @@
 
				 chaussette
			
 
				 django
			
 
				+django-extensions
			
 
				+jinja2
			
 
				 opencv-python
			
 
				 pip-tools
			
--- a/requirements.txt
+++ b/requirements.txt
@@ -7,10 +7,13 @@
 
				 asgiref==3.2.3            # via django
			
 
				 chaussette==1.3.0
			
 
				 click==7.0                # via pip-tools
			
 
				+django-extensions==2.2.6
			
 
				 django==3.0.2
			
 
				+jinja2==2.11.0
			
 
				+markupsafe==1.1.1         # via jinja2
			
 
				 numpy==1.18.1             # via opencv-python
			
 
				 opencv-python==4.1.2.30
			
 
				 pip-tools==4.4.0
			
 
				 pytz==2019.3              # via django
			
 
				-six==1.14.0               # via chaussette, pip-tools
			
 
				+six==1.14.0               # via chaussette, django-extensions, pip-tools
			
 
				 sqlparse==0.3.0           # via django
			
--- a/xword/jinja2.py
+++ b/xword/jinja2.py
@@ -0,0 +1,12 @@
 
				+#from django.contrib.staticfiles.storage import staticfiles_storage
			
 
				+#from django.urls import reverse
			
 
				+from jinja2 import Environment
			
 
				+
			
 
				+
			
 
				+def environment(**options):
			
 
				+    env = Environment(**options)
			
 
				+    env.globals.update({
			
 
				+        #‘static’: staticfiles_storage.url,
			
 
				+        #‘url’: reverse,
			
 
				+    })
			
 
				+    return env
			
--- a/xword/settings.py
+++ b/xword/settings.py
@@ -11,6 +11,7 @@ DEBUG = False
 
				 ALLOWED_HOSTS = OVERRIDE_ME
			
 
				 
			
 
				 INSTALLED_APPS = [
			
 
				+    'django_extensions',
			
 
				     'home.apps.HomeConfig',
			
 
				 ]
			
 
				 
			
@@ -24,10 +25,11 @@ ROOT_URLCONF = 'xword.urls'
 
				 
			
 
				 TEMPLATES = [
			
 
				     {
			
 
				-        'BACKEND': 'django.template.backends.django.DjangoTemplates',
			
 
				+        'BACKEND': 'django.template.backends.jinja2.Jinja2',
			
 
				         'DIRS': [],
			
 
				         'APP_DIRS': True,
			
 
				         'OPTIONS': {
			
 
				+            'environment': 'xword.jinja2.environment',
			
 
				             'context_processors': [
			
 
				                 'django.template.context_processors.debug',
			
 
				                 'django.template.context_processors.request',
Автор	SHA1 Сообщение	Дата
Andrew Klopper	a62558add7 Add HTML output.	лет назад: 6
Andrew Klopper	6fdfd76066 Split extract_crossword into extract_crossword_grid and grid_to_png	лет назад: 6
Andrew Klopper	3de3b2f972 Added ability to filter out non-greys before trying to extract the	лет назад: 6
Andrew Klopper	8ab61aeb6d Added 'extract' command.	лет назад: 6