Sub_GUI.py

from tkinter import *
from tkinter.ttk import *
from pathlib import Path
from PIL import Image, ImageTk
import numpy as np
import cv2


def open_tutorial(mst):
    tutorial_window = Toplevel()
    tutorial_window.title("Tutorial")
    tutorial_window.geometry("200x200")
    Label(tutorial_window, text="This is the tutorial").grid(row=0, column=0)


def get_scene(scene):
    return str(puzzle_images / puzzle_dict[scene])


def get_character(character):
    return str(target_images / target_dict[character])


def my_preview(mst, character_dd, scene_dd, scene_label, character_label, zoomed_label):
    print("Searching for {} in {}!".format(character_dd.get(), scene_dd.get()))
    scene = scene_dd.get()
    character = character_dd.get()
    scene_image = cv2.imread(str(puzzle_images / puzzle_dict[scene]))
    scene_image = resize_with_aspect_ratio(scene_image, height=int(mst.winfo_screenheight()*0.8))
    mst.show_scene = process_image(scene_image)
    target_image = cv2.imread(str(target_images / target_dict[character]))
    target_image = resize_with_aspect_ratio(target_image, width=100)
    mst.show_character = process_image(target_image)
    scene_label.configure(image=mst.show_scene)
    character_label.configure(image=mst.show_character)
    zoomed_label.grid_remove()


def search_image(mst, target_pic, puzzle_pic, scene_label, character_label, zoomed_label, search_b):
    search_b.configure(text="Processing...")
    target = cv2.imread(get_character(target_pic.get()))
    puzzle = cv2.imread(get_scene(puzzle_pic.get()))
    target_gray = cv2.cvtColor(target, cv2.COLOR_BGR2GRAY)
    puzzle_gray = cv2.cvtColor(puzzle, cv2.COLOR_BGR2GRAY)
    target_edge = cv2.adaptiveThreshold(target_gray, 255, cv2.ADAPTIVE_THRESH_GAUSSIAN_C, cv2.THRESH_BINARY, 11, 2)
    (height, width) = target.shape[:2]
    found = None
    for scale in np.linspace(0.5, 1.8, 10)[::-1]:
        resized = resize_with_aspect_ratio(puzzle_gray, width=int(puzzle.shape[1] * scale))
        r = puzzle.shape[1] / float(resized.shape[1])
        if resized.shape[0] < height or resized.shape[1] < width:
            break

        edged = cv2.adaptiveThreshold(resized, 255, cv2.ADAPTIVE_THRESH_GAUSSIAN_C, cv2.THRESH_BINARY, 11, 2)
        result = cv2.matchTemplate(edged, target_edge, cv2.TM_CCOEFF)
        (minVal, maxVal, minLoc, maxLoc) = cv2.minMaxLoc(result)

        if found is None or maxVal > found[0]:
            found = (maxVal, maxLoc, r)

    (_, maxLoc, r) = found
    (startX, startY) = (int(maxLoc[0] * r), int(maxLoc[1] * r))
    (endX, endY) = (int((maxLoc[0] + width) * r), int((maxLoc[1] + height) * r))
    roi = puzzle[startY:endY, startX:endX]
    mask = np.zeros(puzzle.shape, dtype="uint8")
    puzzle = cv2.addWeighted(puzzle, 0.25, mask, 0.75, 0)
    puzzle[startY:endY, startX:endX] = roi
    puzzle = cv2.rectangle(puzzle, (startX, startY), (endX, endY), (0, 255, 0), 3)
    zoomed = puzzle[startY-100:endY+100, startX-100:endX+100]
    resize = resize_with_aspect_ratio(puzzle, height=int(mst.winfo_screenheight()*0.8))
    mst.show_scene = process_image(resize)
    target = resize_with_aspect_ratio(target, width=100)
    mst.show_character = process_image(target)
    mst.show_zoomed = process_image(zoomed)
    scene_label.configure(image=mst.show_scene)
    character_label.configure(image=mst.show_character)
    zoomed_label.configure(image=mst.show_zoomed)
    zoomed_label.grid(row=2, column=3, sticky=S, pady=2)
    search_b.configure(text="Search")


def process_image(image):
    # Convert image from openCV BGR to RGB for displaying
    image = cv2.cvtColor(image, cv2.COLOR_BGR2RGB)
    # Convert to PIL format
    image = Image.fromarray(image)
    # ImageTk format
    image = ImageTk.PhotoImage(image)
    return image


def open_wheres_waldo(mst):
    ww = Toplevel()
    ww.title("Where's Waldo")
    screen_width = ww.winfo_screenwidth()
    screen_height = ww.winfo_screenheight()
    ww.geometry(f'{screen_width}x{screen_height}')
    ww.resizable(0, 0)

    scene_dd = StringVar(ww)

    scene_dd.set('Choose Scene')
    s_dd = OptionMenu(ww, scene_dd, *puzzle_dict.keys())
    s_dd.grid(row=0, column=0, sticky=W, pady=2)

    character_dd = StringVar(ww)
    character_dd.set('Choose Character')
    c_dd = OptionMenu(ww, character_dd, *target_dict.keys())
    c_dd.grid(row=1, column=0, sticky=W, pady=2)

    preview_b = Button(ww, text="Preview", command=lambda: my_preview(ww, character_dd, scene_dd, scene_label,
                                                                      character_label, zoomed_label), width=20)
    preview_b.grid(row=0, column=1, sticky=W, pady=2)

    search_b = Button(ww, text="Search", command=lambda: search_image(ww, character_dd, scene_dd, scene_label,
                                                                      character_label, zoomed_label, search_b),
                      width=20)
    search_b.grid(row=1, column=1, sticky=W, pady=2)

    default_image = cv2.imread(str(puzzle_images / puzzle_dict['City']))
    default_image = resize_with_aspect_ratio(default_image, height=int(screen_height * 0.8))
    ww.default = process_image(default_image)

    scene_label = Label(ww, image=ww.default)
    scene_label.grid(row=2, column=0, columnspan=2, rowspan=1, sticky=W, pady=2)

    waldo_image = cv2.imread(str(target_images / target_dict['Waldo']))
    waldo_image = resize_with_aspect_ratio(waldo_image, width=100)
    ww.waldo = process_image(waldo_image)

    character_label = Label(ww, image=ww.waldo)
    character_label.grid(row=2, column=3, sticky=NW, pady=2)

    zoomed_label = Label(ww)
    zoomed_label.grid(row=2, column=3, sticky=S, pady=2)


def make_decision_GUI(mst):
    mst.geometry("400x200")
    mst.title("Main Menu")
    label = Label(mst, text="Please select one of the following options.\n"
                            "Tutorial - This tool will teach you how Computer Vision operates with\n"
                            "with very simple shapes and colors\n"
                            "Where's Waldo - This tool will allow you to play a Where's Waldo game\n"
                            "with computer vision")
    label.grid(row=0, column=0, columnspan=2, pady=10)
    tutorial_btn = Button(mst, text="Tutorial", command=lambda: open_tutorial(mst))
    tutorial_btn.grid(row=1, column=0)
    ww_btn = Button(mst, text="Where's Waldo", command=lambda: open_wheres_waldo(mst))
    ww_btn.grid(row=1, column=1)


def resize_with_aspect_ratio(image, width=None, height=None, inter=cv2.INTER_AREA):
    dim = None
    (h, w) = image.shape[:2]

    if width is None and height is None:
        return image
    if width is None:
        r = height / float(h)
        dim = (int(w * r), height)
    else:
        r = width / float(w)
        dim = (width, int(h * r))

    return cv2.resize(image, dim, interpolation=inter)


def main():
    master = Tk()
    make_decision_GUI(master)
    mainloop()


if __name__ == '__main__':
    target_dict = {'': '', 'Waldo': 'waldo_face.jpeg', 'Wenda': 'wenda.jpg', 'Wizard': 'wizard.jpg', 'Odlaw': 'odlaw.jpg',
                   'Woof': 'woofs_tail.jpg'}

    puzzle_dict = {'': '', 'Beach': 'puzzle3.jpeg', 'City': 'puzzle2.jpeg', 'Zoo': 'zoo.jpeg',
                   'Department Store': 'Waldo_Department_Store.jpeg',
                   'Ski Resort': 'ski.jpeg', 'Train Station': 'train.jpeg', 'Museum': 'museum.jpeg'}
    puzzle_images = Path('Puzzle Images')

    target_images = Path('Target Images')
    main()