이민호

upload report, codes

Showing 156 changed files with 5303 additions and 0 deletions
1 +*.pyc
2 +__pycache__/
3 +/data/
\ No newline at end of file
1 +from __future__ import absolute_import
2 +from __future__ import division
3 +from __future__ import print_function
4 +
5 +import argparse
6 +from functools import partial
7 +from multiprocessing import Pool
8 +import os
9 +import re
10 +
11 +import cropper
12 +import numpy as np
13 +import tqdm
14 +
15 +
16 +# ==============================================================================
17 +# = param =
18 +# ==============================================================================
19 +
20 +parser = argparse.ArgumentParser()
21 +# main
22 +parser.add_argument('--img_dir', dest='img_dir', default='./data/img_celeba')
23 +parser.add_argument('--save_dir', dest='save_dir', default='./data/aligned')
24 +parser.add_argument('--landmark_file', dest='landmark_file', default='./data/landmark.txt')
25 +parser.add_argument('--standard_landmark_file', dest='standard_landmark_file', default='./data/standard_landmark_68pts.txt')
26 +parser.add_argument('--crop_size_h', dest='crop_size_h', type=int, default=572)
27 +parser.add_argument('--crop_size_w', dest='crop_size_w', type=int, default=572)
28 +parser.add_argument('--move_h', dest='move_h', type=float, default=0.25)
29 +parser.add_argument('--move_w', dest='move_w', type=float, default=0.)
30 +parser.add_argument('--save_format', dest='save_format', choices=['jpg', 'png'], default='jpg')
31 +parser.add_argument('--n_worker', dest='n_worker', type=int, default=8)
32 +# others
33 +parser.add_argument('--face_factor', dest='face_factor', type=float, help='The factor of face area relative to the output image.', default=0.45)
34 +parser.add_argument('--align_type', dest='align_type', choices=['affine', 'similarity'], default='similarity')
35 +parser.add_argument('--order', dest='order', type=int, choices=[0, 1, 2, 3, 4, 5], help='The order of interpolation.', default=3)
36 +parser.add_argument('--mode', dest='mode', choices=['constant', 'edge', 'symmetric', 'reflect', 'wrap'], default='edge')
37 +args = parser.parse_args()
38 +
39 +
40 +# ==============================================================================
41 +# = opencv first =
42 +# ==============================================================================
43 +
44 +_DEFAULT_JPG_QUALITY = 95
45 +try:
46 +    import cv2
47 +    imread = cv2.imread
48 +    imwrite = partial(cv2.imwrite, params=[int(cv2.IMWRITE_JPEG_QUALITY), _DEFAULT_JPG_QUALITY])
49 +    align_crop = cropper.align_crop_opencv
50 +    print('Use OpenCV')
51 +except ImportError:
52 +    import skimage.io as io
53 +    imread = io.imread
54 +    imwrite = partial(io.imsave, quality=_DEFAULT_JPG_QUALITY)
55 +    align_crop = cropper.align_crop_skimage
56 +    print('Importing OpenCV failed; using scikit-image')
57 +
58 +
59 +# ==============================================================================
60 +# = run =
61 +# ==============================================================================
62 +
63 +# count landmarks
64 +with open(args.landmark_file) as f:
65 + line = f.readline()
66 +n_landmark = len(re.split('[ ]+', line)[1:]) // 2
67 +
68 +# load standard landmark
69 +standard_landmark = np.genfromtxt(args.standard_landmark_file, dtype=float).reshape(n_landmark, 2)
70 +standard_landmark[:, 0] += args.move_w
71 +standard_landmark[:, 1] += args.move_h
72 +
73 +# data dir
74 +save_dir = os.path.join(args.save_dir, 'align_size(%d,%d)_move(%.3f,%.3f)_face_factor(%.3f)_%s' % (args.crop_size_h, args.crop_size_w, args.move_h, args.move_w, args.face_factor, args.save_format))
75 +data_dir = os.path.join(save_dir, 'data')
76 +if not os.path.isdir(data_dir):
77 + os.makedirs(data_dir)
78 +
79 +
80 +def work(name, landmark) -> str: # a single work
81 + for _ in range(3): # try three times
82 + try:
83 + img = imread(os.path.join(args.img_dir, name))
84 + img_crop, tformed_landmarks = align_crop(img,
85 + landmark,
86 + standard_landmark,
87 + crop_size=(args.crop_size_h, args.crop_size_w),
88 + face_factor=args.face_factor,
89 + align_type=args.align_type,
90 + order=args.order,
91 + mode=args.mode)
92 +
93 + name = os.path.splitext(name)[0] + '.' + args.save_format
94 + path = os.path.join(data_dir, name)
95 + if not os.path.isdir(os.path.split(path)[0]):
96 + os.makedirs(os.path.split(path)[0])
97 + imwrite(path, img_crop)
98 +
99 + tformed_landmarks.shape = -1
100 + name_landmark_str = ('%s' + ' %.1f' * n_landmark * 2) % ((name, ) + tuple(tformed_landmarks))
101 + return name_landmark_str
102 + except:
103 + print('%s fails!' % name)
104 +
105 +
106 +if __name__ == "__main__":
107 +    img_names = np.genfromtxt(args.landmark_file, dtype=str, usecols=0)
108 +    landmarks = np.genfromtxt(args.landmark_file, dtype=float,
109 +                              usecols=range(1, n_landmark * 2 + 1)).reshape(-1, n_landmark, 2)
110 +
111 + n_pics = len(img_names)
112 +
113 + landmarks_path = os.path.join(save_dir, 'landmark.txt')
114 + f = open(landmarks_path, 'w')
115 + pool = Pool(args.n_worker)
116 + bar = tqdm.tqdm(total=n_pics)
117 +
118 +    tasks = []
119 +    for i in range(n_pics):
120 +        tasks.append(pool.apply_async(work, (img_names[i], landmarks[i]), callback=lambda _: bar.update()))
121 +    for task in tasks:  # collect every result, not just the first one
122 +        try:
123 +            result = task.get()
124 +            if result is not None and result != "":
125 +                f.write(result + '\n')
126 +        except:
127 +            pass
128 +
129 + pool.close()
130 + pool.join()
131 + bar.close()
132 + f.close()
\ No newline at end of file
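For reference, the script above expects a landmark file whose lines are an image name followed by whitespace-separated x/y pairs; a minimal parsing sketch with made-up values (the file name and coordinates below are illustrative):

import re
import numpy as np

# Illustrative landmark.txt line: "<image name> x1 y1 x2 y2 ... xn yn"
sample = "000001.jpg 165.0 184.0 244.0 176.0 196.0 249.0 194.0 271.0 266.0 260.0"

# Count landmarks the same way the script does: split on whitespace, drop the name
n_landmark = len(re.split('[ ]+', sample)[1:]) // 2                       # -> 5
coords = np.array(re.split('[ ]+', sample)[1:], dtype=float).reshape(n_landmark, 2)
print(n_landmark, coords.shape)                                           # 5 (5, 2)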
1 +import numpy as np
2 +
3 +
4 +def align_crop_opencv(img,
5 + src_landmarks,
6 + standard_landmarks,
7 + crop_size=512,
8 + face_factor=0.7,
9 + align_type='similarity',
10 + order=3,
11 + mode='edge'):
12 + """Align and crop a face image by landmarks.
13 +
14 + Arguments:
15 + img : Face image to be aligned and cropped.
16 + src_landmarks : [[x_1, y_1], ..., [x_n, y_n]].
17 + standard_landmarks : Standard shape, should be normalized.
18 + crop_size : Output image size, should be 1. int for (crop_size, crop_size)
19 + or 2. (int, int) for (crop_size_h, crop_size_w).
20 + face_factor : The factor of face area relative to the output image.
21 + align_type : 'similarity' or 'affine'.
22 + order : The order of interpolation. The order has to be in the range 0-5:
23 + - 0: INTER_NEAREST
24 + - 1: INTER_LINEAR
25 + - 2: INTER_AREA
26 + - 3: INTER_CUBIC
27 + - 4: INTER_LANCZOS4
28 + - 5: INTER_LANCZOS4
29 + mode : One of ['constant', 'edge', 'symmetric', 'reflect', 'wrap'].
30 + Points outside the boundaries of the input are filled according
31 + to the given mode.
32 + """
33 + # set OpenCV
34 + import cv2
35 + inter = {0: cv2.INTER_NEAREST, 1: cv2.INTER_LINEAR, 2: cv2.INTER_AREA,
36 + 3: cv2.INTER_CUBIC, 4: cv2.INTER_LANCZOS4, 5: cv2.INTER_LANCZOS4}
37 + border = {'constant': cv2.BORDER_CONSTANT, 'edge': cv2.BORDER_REPLICATE,
38 + 'symmetric': cv2.BORDER_REFLECT, 'reflect': cv2.BORDER_REFLECT101,
39 + 'wrap': cv2.BORDER_WRAP}
40 +
41 + # check
42 + assert align_type in ['affine', 'similarity'], 'Invalid `align_type`! Allowed: %s!' % ['affine', 'similarity']
43 + assert order in [0, 1, 2, 3, 4, 5], 'Invalid `order`! Allowed: %s!' % [0, 1, 2, 3, 4, 5]
44 + assert mode in ['constant', 'edge', 'symmetric', 'reflect', 'wrap'], 'Invalid `mode`! Allowed: %s!' % ['constant', 'edge', 'symmetric', 'reflect', 'wrap']
45 +
46 + # crop size
47 + if isinstance(crop_size, (list, tuple)) and len(crop_size) == 2:
48 + crop_size_h = crop_size[0]
49 + crop_size_w = crop_size[1]
50 + elif isinstance(crop_size, int):
51 + crop_size_h = crop_size_w = crop_size
52 + else:
53 + raise Exception('Invalid `crop_size`! `crop_size` should be 1. int for (crop_size, crop_size) or 2. (int, int) for (crop_size_h, crop_size_w)!')
54 +
55 + # estimate transform matrix
56 + trg_landmarks = standard_landmarks * max(crop_size_h, crop_size_w) * face_factor + np.array([crop_size_w // 2, crop_size_h // 2])
57 + if align_type == 'affine':
58 +        tform = cv2.estimateAffine2D(trg_landmarks, src_landmarks, ransacReprojThreshold=np.inf)[0]
59 +    else:
60 +        tform = cv2.estimateAffinePartial2D(trg_landmarks, src_landmarks, ransacReprojThreshold=np.inf)[0]
61 +
62 + # warp image by given transform
63 + output_shape = (crop_size_h, crop_size_w)
64 + img_crop = cv2.warpAffine(img, tform, output_shape[::-1], flags=cv2.WARP_INVERSE_MAP + inter[order], borderMode=border[mode])
65 +
66 + # get transformed landmarks
67 + tformed_landmarks = cv2.transform(np.expand_dims(src_landmarks, axis=0), cv2.invertAffineTransform(tform))[0]
68 +
69 + return img_crop, tformed_landmarks
70 +
71 +
72 +def align_crop_skimage(img,
73 + src_landmarks,
74 + standard_landmarks,
75 + crop_size=512,
76 + face_factor=0.7,
77 + align_type='similarity',
78 + order=3,
79 + mode='edge'):
80 + """Align and crop a face image by landmarks.
81 +
82 + Arguments:
83 + img : Face image to be aligned and cropped.
84 + src_landmarks : [[x_1, y_1], ..., [x_n, y_n]].
85 + standard_landmarks : Standard shape, should be normalized.
86 + crop_size : Output image size, should be 1. int for (crop_size, crop_size)
87 + or 2. (int, int) for (crop_size_h, crop_size_w).
88 + face_factor : The factor of face area relative to the output image.
89 + align_type : 'similarity' or 'affine'.
90 + order : The order of interpolation. The order has to be in the range 0-5:
91 + - 0: INTER_NEAREST
92 + - 1: INTER_LINEAR
93 + - 2: INTER_AREA
94 + - 3: INTER_CUBIC
95 + - 4: INTER_LANCZOS4
96 + - 5: INTER_LANCZOS4
97 + mode : One of ['constant', 'edge', 'symmetric', 'reflect', 'wrap'].
98 + Points outside the boundaries of the input are filled according
99 + to the given mode.
100 + """
101 + raise NotImplementedError("'align_crop_skimage' is not implemented!")
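A minimal usage sketch of align_crop_opencv as defined above; the 5-point landmarks, the normalized standard shape, and the file names are illustrative, and it assumes OpenCV is installed:

import cv2
import numpy as np
from cropper import align_crop_opencv

# Illustrative 5-point source landmarks (eyes, nose tip, mouth corners) in pixel coords
src_landmarks = np.array([[165., 184.], [244., 176.], [196., 249.],
                          [194., 271.], [266., 260.]])
# Normalized standard shape, roughly centered on the origin (illustrative values)
standard_landmarks = np.array([[-0.25, -0.15], [0.25, -0.15], [0., 0.],
                               [-0.15, 0.25], [0.15, 0.25]])

img = cv2.imread('face.jpg')  # illustrative input image
img_crop, tformed = align_crop_opencv(img, src_landmarks, standard_landmarks,
                                      crop_size=(572, 572), face_factor=0.45,
                                      align_type='similarity', order=3, mode='edge')
cv2.imwrite('face_aligned.jpg', img_crop)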
1 +# Auto detect text files and perform LF normalization
2 +* text=auto
1 +*.pyc
2 +docs
3 +data
4 +lfw
5 +lfw_40
6 +.idea
7 +loss
8 +vgg_face_dataset
9 +saved_network
10 +loss
11 +z_detect_face.py
12 +z_main.py
13 +*.npy
14 +*.Lnk
15 +data1
16 +data1_masked
17 +scratch.py
18 +subset
19 +subset_masked
20 +vgg_face_dataset
21 +*.mp4
22 +ML_examples
23 +*.pptx
24 +datasets
25 +*.dat
26 +*.docx
27 +
1 +theme: jekyll-theme-cayman
\ No newline at end of file
1 +# Author: aqeelanwar
2 +# Created: 27 April,2020, 10:22 PM
3 +# Email: aqeel.anwar@gatech.edu
4 +
5 +import argparse
6 +import dlib
7 +from utils.aux_functions import *
8 +
9 +
10 +# Command-line input setup
11 +parser = argparse.ArgumentParser(
12 + description="MaskTheFace - Python code to mask faces dataset"
13 +)
14 +parser.add_argument(
15 + "--path",
16 + type=str,
17 + default="",
18 + help="Path to either the folder containing images or the image itself",
19 +)
20 +parser.add_argument(
21 + "--mask_type",
22 + type=str,
23 + default="surgical",
24 + choices=["surgical", "N95", "KN95", "cloth", "gas", "inpaint", "random", "all"],
25 +    help="Type of the mask to be applied. Available options: surgical, N95, KN95, cloth, gas, inpaint, random, all",
26 +)
27 +
28 +parser.add_argument(
29 + "--pattern",
30 + type=str,
31 + default="",
32 + help="Type of the pattern. Available options in masks/textures",
33 +)
34 +
35 +parser.add_argument(
36 + "--pattern_weight",
37 + type=float,
38 + default=0.5,
39 + help="Weight of the pattern. Must be between 0 and 1",
40 +)
41 +
42 +parser.add_argument(
43 + "--color",
44 + type=str,
45 + default="#0473e2",
46 +    help="Hex color value to be overlaid on the mask",
47 +)
48 +
49 +parser.add_argument(
50 + "--color_weight",
51 + type=float,
52 + default=0.5,
53 + help="Weight of the color intensity. Must be between 0 and 1",
54 +)
55 +
56 +parser.add_argument(
57 + "--code",
58 + type=str,
59 + # default="cloth-masks/textures/check/check_4.jpg, cloth-#e54294, cloth-#ff0000, cloth, cloth-masks/textures/others/heart_1.png, cloth-masks/textures/fruits/pineapple.png, N95, surgical_blue, surgical_green",
60 + default="",
61 + help="Generate specific formats",
62 +)
63 +
64 +
65 +parser.add_argument(
66 + "--verbose", dest="verbose", action="store_true", help="Turn verbosity on"
67 +)
68 +parser.add_argument(
69 + "--write_original_image",
70 + dest="write_original_image",
71 + action="store_true",
72 + help="If true, original image is also stored in the masked folder",
73 +)
74 +parser.set_defaults(feature=False)
75 +
76 +args = parser.parse_args()
77 +args.write_path = args.path + "_masked"
78 +
79 +# Set up dlib face detector and predictor
80 +args.detector = dlib.get_frontal_face_detector()
81 +path_to_dlib_model = "dlib_models/shape_predictor_68_face_landmarks.dat"
82 +if not os.path.exists(path_to_dlib_model):
83 + download_dlib_model()
84 +
85 +args.predictor = dlib.shape_predictor(path_to_dlib_model)
86 +
87 +# Extract data from code
88 +mask_code = "".join(args.code.split()).split(",")
89 +args.code_count = np.zeros(len(mask_code))
90 +args.mask_dict_of_dict = {}
91 +
92 +
93 +for i, entry in enumerate(mask_code):
94 + mask_dict = {}
95 + mask_color = ""
96 + mask_texture = ""
97 + mask_type = entry.split("-")[0]
98 + if len(entry.split("-")) == 2:
99 + mask_variation = entry.split("-")[1]
100 + if "#" in mask_variation:
101 + mask_color = mask_variation
102 + else:
103 + mask_texture = mask_variation
104 + mask_dict["type"] = mask_type
105 + mask_dict["color"] = mask_color
106 + mask_dict["texture"] = mask_texture
107 + args.mask_dict_of_dict[i] = mask_dict
108 +
109 +# Check if path is file or directory or none
110 +is_directory, is_file, is_other = check_path(args.path)
111 +display_MaskTheFace()
112 +
113 +if is_directory:
114 + path, dirs, files = os.walk(args.path).__next__()
115 + file_count = len(files)
116 + dirs_count = len(dirs)
117 + if len(files) > 0:
118 + print_orderly("Masking image files", 60)
119 +
120 + # Process files in the directory if any
121 + for f in tqdm(files):
122 + image_path = path + "/" + f
123 +
124 + write_path = path + "_masked"
125 + if not os.path.isdir(write_path):
126 + os.makedirs(write_path)
127 +
128 + if is_image(image_path):
129 + # Proceed if file is image
130 + if args.verbose:
131 + str_p = "Processing: " + image_path
132 + tqdm.write(str_p)
133 +
134 + split_path = f.rsplit(".")
135 + masked_image, mask, mask_binary_array, original_image = mask_image(
136 + image_path, args
137 + )
138 + for i in range(len(mask)):
139 + w_path = (
140 + write_path
141 + + "/"
142 + + split_path[0]
143 + + "_"
144 + + "masked"
145 + + "."
146 + + split_path[1]
147 + )
148 + img = masked_image[i]
149 + binary_img = mask_binary_array[i]
150 + cv2.imwrite(w_path, img)
151 + cv2.imwrite(
152 + path + "_binary/" + split_path[0] + "_binary" + "." + split_path[1],
153 + binary_img,
154 + )
155 + cv2.imwrite(
156 + path + "_original/" + split_path[0] + "." + split_path[1],
157 + original_image,
158 + )
159 +
160 + print_orderly("Masking image directories", 60)
161 +
162 +    # Process directories within the path provided
163 + for d in tqdm(dirs):
164 + dir_path = args.path + "/" + d
165 + dir_write_path = args.write_path + "/" + d
166 + if not os.path.isdir(dir_write_path):
167 + os.makedirs(dir_write_path)
168 + _, _, files = os.walk(dir_path).__next__()
169 +
170 + # Process each files within subdirectory
171 + for f in files:
172 + image_path = dir_path + "/" + f
173 + if args.verbose:
174 + str_p = "Processing: " + image_path
175 + tqdm.write(str_p)
176 + write_path = dir_write_path
177 + if is_image(image_path):
178 + # Proceed if file is image
179 + split_path = f.rsplit(".")
180 + masked_image, mask, mask_binary, original_image = mask_image(
181 + image_path, args
182 + )
183 + for i in range(len(mask)):
184 + w_path = (
185 + write_path
186 + + "/"
187 + + split_path[0]
188 + + "_"
189 + + "masked"
190 + + "."
191 + + split_path[1]
192 + )
193 + w_path_original = write_path + "/" + f
194 + img = masked_image[i]
195 + binary_img = mask_binary[i]
196 + cv2.imwrite(
197 + path
198 + + "_binary/"
199 + + split_path[0]
200 + + "_binary"
201 + + "."
202 + + split_path[1],
203 + binary_img,
204 + )
205 + # Write the masked image
206 + cv2.imwrite(w_path, img)
207 + if args.write_original_image:
208 + # Write the original image
209 + cv2.imwrite(w_path_original, original_image)
210 +
211 + if args.verbose:
212 + print(args.code_count)
213 +
214 +# Process if the path was a file
215 +elif is_file:
216 + print("Masking image file")
217 + image_path = args.path
218 + write_path = args.path.rsplit(".")[0]
219 + if is_image(image_path):
220 + # Proceed if file is image
221 + # masked_images, mask, mask_binary_array, original_image
222 + masked_image, mask, mask_binary_array, original_image = mask_image(
223 + image_path, args
224 + )
225 + for i in range(len(mask)):
226 + w_path = write_path + "_" + "masked" + "." + args.path.rsplit(".")[1]
227 + img = masked_image[i]
228 + binary_img = mask_binary_array[i]
229 + cv2.imwrite(w_path, img)
230 + cv2.imwrite(write_path + "_binary." + args.path.rsplit(".")[1], binary_img)
231 +else:
232 +    print("Path is neither a valid file nor a valid directory")
233 +print("Processing Done")
1 +[surgical]
2 +template: masks/templates/surgical.png
3 +mask_a: 21, 97
4 +mask_b: 307, 22
5 +mask_c: 600, 99
6 +mask_d: 25, 322
7 +mask_e: 295, 470
8 +mask_f: 600, 323
9 +
10 +[surgical_left]
11 +template: masks/templates/surgical_left.png
12 +mask_a: 39, 27
13 +mask_b: 130, 9
14 +mask_c: 567, 20
15 +mask_d: 87, 207
16 +mask_e: 168, 302
17 +mask_f: 568, 202
18 +
19 +[surgical_right]
20 +template: masks/templates/surgical_right.png
21 +mask_a: 3, 20
22 +mask_b: 440, 9
23 +mask_c: 531, 27
24 +mask_d: 2, 202
25 +mask_e: 402, 302
26 +mask_f: 483, 207
27 +
28 +[surgical_green]
29 +template: masks/templates/surgical_green.png
30 +mask_a: 21, 97
31 +mask_b: 307, 22
32 +mask_c: 600, 99
33 +mask_d: 25, 322
34 +mask_e: 295, 470
35 +mask_f: 600, 323
36 +
37 +[surgical_green_left]
38 +template: masks/templates/surgical_green_left.png
39 +mask_a: 39, 27
40 +mask_b: 130, 9
41 +mask_c: 567, 20
42 +mask_d: 87, 207
43 +mask_e: 168, 302
44 +mask_f: 568, 202
45 +
46 +[surgical_green_right]
47 +template: masks/templates/surgical_green_right.png
48 +mask_a: 3, 20
49 +mask_b: 440, 9
50 +mask_c: 531, 27
51 +mask_d: 2, 202
52 +mask_e: 402, 302
53 +mask_f: 483, 207
54 +
55 +[surgical_blue]
56 +template: masks/templates/surgical_blue.png
57 +mask_a: 21, 97
58 +mask_b: 307, 22
59 +mask_c: 600, 99
60 +mask_d: 25, 322
61 +mask_e: 295, 470
62 +mask_f: 600, 323
63 +
64 +[surgical_blue_left]
65 +template: masks/templates/surgical_blue_left.png
66 +mask_a: 39, 27
67 +mask_b: 130, 9
68 +mask_c: 567, 20
69 +mask_d: 87, 207
70 +mask_e: 168, 302
71 +mask_f: 568, 202
72 +
73 +[surgical_blue_right]
74 +template: masks/templates/surgical_blue_right.png
75 +mask_a: 3, 20
76 +mask_b: 440, 9
77 +mask_c: 531, 27
78 +mask_d: 2, 202
79 +mask_e: 402, 302
80 +mask_f: 483, 207
81 +
82 +
83 +[N95]
84 +template: masks/templates/N95.png
85 +mask_a: 15, 119
86 +mask_b: 327, 5
87 +mask_c: 640, 93
88 +mask_d: 13, 285
89 +mask_e: 351, 518
90 +mask_f: 645, 285
91 +
92 +;[N95_left]
93 +;template: masks/N95_left.png
94 +;mask_a: 176, 121
95 +;mask_b: 313, 46
96 +;mask_c: 799, 135
97 +;mask_d: 97, 438
98 +;mask_e: 329, 627
99 +;mask_f: 791, 401
100 +
101 +[N95_right]
102 +template: masks/templates/N95_right.png
103 +mask_c: 979, 331
104 +mask_b: 806, 172
105 +mask_a: 12, 222
106 +mask_f: 907, 762
107 +mask_e: 577, 875
108 +mask_d: -4, 632
109 +
110 +[N95_left]
111 +template: masks/templates/N95_left.png
112 +mask_a: 193, 331
113 +mask_b: 366, 172
114 +mask_c: 1160, 222
115 +mask_d: 265, 762
116 +mask_e: 595, 875
117 +mask_f: 1176, 632
118 +
119 +
120 +[cloth_left]
121 +template: masks/templates/cloth_left.png
122 +mask_a: 65, 93
123 +mask_b: 162, 15
124 +mask_c: 672, 75
125 +mask_d: 114, 296
126 +mask_e: 207, 443
127 +mask_f: 671, 341
128 +
129 +[cloth_right]
130 +template: masks/templates/cloth_right.png
131 +mask_a: 98, 93
132 +mask_b: 608, 15
133 +mask_c: 705, 75
134 +mask_d: 99, 296
135 +mask_e: 563, 443
136 +mask_f: 656, 341
137 +
138 +[cloth]
139 +template: masks/templates/cloth.png
140 +mask_a: 122, 90
141 +mask_b: 405, 7
142 +mask_c: 686, 79
143 +mask_d: 165, 323
144 +mask_e: 406, 509
145 +mask_f: 653, 311
146 +
147 +[gas]
148 +template: masks/templates/gas.png
149 +mask_a: 330, 431
150 +mask_b: 873, 117
151 +mask_c: 1494, 434
152 +mask_d: 430, 754
153 +mask_e: 869, 1100
154 +mask_f: 1400, 710
155 +
156 +[gas_left]
157 +template: masks/templates/gas_left.png
158 +mask_a: 239, 238
159 +mask_b: 317, 42
160 +mask_c: 965, 239
161 +mask_d: 224, 404
162 +mask_e: 337, 502
163 +mask_f: 963, 406
164 +
165 +[gas_right]
166 +template: masks/templates/gas_right.png
167 +mask_c: 621, 238
168 +mask_b: 543, 60
169 +mask_a: -105, 239
170 +mask_f: 636, 404
171 +mask_e: 523, 502
172 +mask_d: -103, 406
173 +
174 +[KN95]
175 +template: masks/templates/KN95.png
176 +mask_a: 20, 47
177 +mask_b: 410, 5
178 +mask_c: 760, 55
179 +mask_d: 75, 340
180 +mask_e: 398, 600
181 +mask_f: 671, 320
182 +
183 +[KN95_left]
184 +template: masks/templates/KN95_left.png
185 +mask_a: 52, 258
186 +mask_b: 207, 100
187 +mask_c: 730, 80
188 +mask_d: 210, 408
189 +mask_e: 335, 604
190 +mask_f: 770, 270
191 +
192 +[KN95_right]
193 +template: masks/templates/KN95_right.png
194 +mask_c: 664, 258
195 +mask_b: 509, 100
196 +mask_a: -14, 80
197 +mask_f: 506, 408
198 +mask_e: 381, 604
199 +mask_d: -54, 270
200 +
201 +
202 +[empty]
203 +[empty_left]
204 +[empty_right]
205 +
206 +[inpaint]
207 +[inpaint_left]
208 +[inpaint_right]
209 +
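Each section above names a template image and six anchor points (mask_a through mask_f); mask_face in utils/aux_functions.py warps the template onto six matching points on the face with a homography. A minimal sketch of that warp using the [surgical] points above; the face points and file names are illustrative:

import cv2
import numpy as np

# Six template points from the [surgical] section, in the a, b, c, f, e, d order
# that mask_face uses for mask_line
mask_line = np.float32([[21, 97], [307, 22], [600, 99],
                        [600, 323], [295, 470], [25, 322]])
# Six corresponding points on the face (illustrative values)
six_points_on_face = np.float32([[120, 260], [200, 240], [285, 255],
                                 [290, 330], [205, 370], [115, 325]])

template = cv2.imread('masks/templates/surgical.png', cv2.IMREAD_UNCHANGED)  # RGBA template
face_img = cv2.imread('face.jpg')  # illustrative input image

M, _ = cv2.findHomography(mask_line, six_points_on_face)
h, w = face_img.shape[:2]
warped = cv2.warpPerspective(template, M, (w, h))

# Composite using the warped template's alpha channel as a binary mask
alpha = warped[:, :, 3]
bg = cv2.bitwise_and(face_img, face_img, mask=cv2.bitwise_not(alpha))
fg = cv2.bitwise_and(warped[:, :, 0:3], warped[:, :, 0:3], mask=alpha)
out = cv2.add(bg, fg)
cv2.imwrite('face_masked.jpg', out)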
1 +certifi==2020.4.5.1
2 +click==7.1.2
3 +dlib==19.19.0
4 +dotmap==1.3.14
5 +face-recognition==1.3.0
6 +face-recognition-models==0.3.0
7 +numpy==1.18.4
8 +opencv-python==4.2.0.34
9 +Pillow==7.1.2
10 +tqdm==4.46.0
11 +wincertstore==0.2
12 +imutils==0.5.3
13 +requests==2.24.0
1 +# Author: Aqeel Anwar(ICSRL)
2 +# Created: 7/30/2020, 7:43 AM
3 +# Email: aqeel.anwar@gatech.edu
\ No newline at end of file
1 +# Author: aqeelanwar
2 +# Created: 27 April,2020, 10:21 PM
3 +# Email: aqeel.anwar@gatech.edu
4 +
5 +from configparser import ConfigParser
6 +import cv2, math, os
7 +from PIL import Image, ImageDraw
8 +from tqdm import tqdm
9 +from utils.read_cfg import read_cfg
10 +from utils.fit_ellipse import *
11 +import random
12 +from utils.create_mask import texture_the_mask, color_the_mask
13 +from imutils import face_utils
14 +import requests
15 +from zipfile import ZipFile
16 +from tqdm import tqdm
17 +import bz2, shutil
18 +
19 +
20 +def download_dlib_model():
21 + print_orderly("Get dlib model", 60)
22 + dlib_model_link = "http://dlib.net/files/shape_predictor_68_face_landmarks.dat.bz2"
23 + print("Downloading dlib model...")
24 + with requests.get(dlib_model_link, stream=True) as r:
25 + print("Zip file size: ", np.round(len(r.content) / 1024 / 1024, 2), "MB")
26 + destination = (
27 + "dlib_models" + os.path.sep + "shape_predictor_68_face_landmarks.dat.bz2"
28 + )
29 + if not os.path.exists(destination.rsplit(os.path.sep, 1)[0]):
30 + os.mkdir(destination.rsplit(os.path.sep, 1)[0])
31 + print("Saving dlib model...")
32 + with open(destination, "wb") as fd:
33 + for chunk in r.iter_content(chunk_size=32678):
34 + fd.write(chunk)
35 + print("Extracting dlib model...")
36 + with bz2.BZ2File(destination) as fr, open(
37 + "dlib_models/shape_predictor_68_face_landmarks.dat", "wb"
38 + ) as fw:
39 + shutil.copyfileobj(fr, fw)
40 + print("Saved: ", destination)
41 + print_orderly("done", 60)
42 +
43 + os.remove(destination)
44 +
45 +
46 +def get_line(face_landmark, image, type="eye", debug=False):
47 + pil_image = Image.fromarray(image)
48 + d = ImageDraw.Draw(pil_image)
49 + left_eye = face_landmark["left_eye"]
50 + right_eye = face_landmark["right_eye"]
51 + left_eye_mid = np.mean(np.array(left_eye), axis=0)
52 + right_eye_mid = np.mean(np.array(right_eye), axis=0)
53 + eye_line_mid = (left_eye_mid + right_eye_mid) / 2
54 +
55 + if type == "eye":
56 + left_point = left_eye_mid
57 + right_point = right_eye_mid
58 + mid_point = eye_line_mid
59 +
60 + elif type == "nose_mid":
61 + nose_length = (
62 + face_landmark["nose_bridge"][-1][1] - face_landmark["nose_bridge"][0][1]
63 + )
64 + left_point = [left_eye_mid[0], left_eye_mid[1] + nose_length / 2]
65 + right_point = [right_eye_mid[0], right_eye_mid[1] + nose_length / 2]
66 + # mid_point = (
67 + # face_landmark["nose_bridge"][-1][1] + face_landmark["nose_bridge"][0][1]
68 + # ) / 2
69 +
70 + mid_pointY = (
71 + face_landmark["nose_bridge"][-1][1] + face_landmark["nose_bridge"][0][1]
72 + ) / 2
73 + mid_pointX = (
74 + face_landmark["nose_bridge"][-1][0] + face_landmark["nose_bridge"][0][0]
75 + ) / 2
76 + mid_point = (mid_pointX, mid_pointY)
77 +
78 + elif type == "nose_tip":
79 + nose_length = (
80 + face_landmark["nose_bridge"][-1][1] - face_landmark["nose_bridge"][0][1]
81 + )
82 + left_point = [left_eye_mid[0], left_eye_mid[1] + nose_length]
83 + right_point = [right_eye_mid[0], right_eye_mid[1] + nose_length]
84 + mid_point = (
85 + face_landmark["nose_bridge"][-1][1] + face_landmark["nose_bridge"][0][1]
86 + ) / 2
87 +
88 + elif type == "bottom_lip":
89 + bottom_lip = face_landmark["bottom_lip"]
90 + bottom_lip_mid = np.max(np.array(bottom_lip), axis=0)
91 + shiftY = bottom_lip_mid[1] - eye_line_mid[1]
92 + left_point = [left_eye_mid[0], left_eye_mid[1] + shiftY]
93 + right_point = [right_eye_mid[0], right_eye_mid[1] + shiftY]
94 + mid_point = bottom_lip_mid
95 +
96 + elif type == "perp_line":
97 + bottom_lip = face_landmark["bottom_lip"]
98 + bottom_lip_mid = np.mean(np.array(bottom_lip), axis=0)
99 +
100 + left_point = eye_line_mid
101 + left_point = face_landmark["nose_bridge"][0]
102 + right_point = bottom_lip_mid
103 +
104 + mid_point = bottom_lip_mid
105 +
106 + elif type == "nose_long":
107 + nose_bridge = face_landmark["nose_bridge"]
108 + left_point = [nose_bridge[0][0], nose_bridge[0][1]]
109 + right_point = [nose_bridge[-1][0], nose_bridge[-1][1]]
110 +
111 + mid_point = left_point
112 +
113 + # d.line(eye_mid, width=5, fill='red')
114 + y = [left_point[1], right_point[1]]
115 + x = [left_point[0], right_point[0]]
116 + # cv2.imshow('h', image)
117 + # cv2.waitKey(0)
118 + eye_line = fit_line(x, y, image)
119 + d.line(eye_line, width=5, fill="blue")
120 +
121 + # Perpendicular Line
122 + # (midX, midY) and (midX - y2 + y1, midY + x2 - x1)
123 + y = [
124 + (left_point[1] + right_point[1]) / 2,
125 + (left_point[1] + right_point[1]) / 2 + right_point[0] - left_point[0],
126 + ]
127 + x = [
128 + (left_point[0] + right_point[0]) / 2,
129 + (left_point[0] + right_point[0]) / 2 - right_point[1] + left_point[1],
130 + ]
131 + perp_line = fit_line(x, y, image)
132 + if debug:
133 + d.line(perp_line, width=5, fill="red")
134 + pil_image.show()
135 + return eye_line, perp_line, left_point, right_point, mid_point
136 +
137 +
138 +def get_points_on_chin(line, face_landmark, chin_type="chin"):
139 + chin = face_landmark[chin_type]
140 + points_on_chin = []
141 + for i in range(len(chin) - 1):
142 + chin_first_point = [chin[i][0], chin[i][1]]
143 + chin_second_point = [chin[i + 1][0], chin[i + 1][1]]
144 +
145 + flag, x, y = line_intersection(line, (chin_first_point, chin_second_point))
146 + if flag:
147 + points_on_chin.append((x, y))
148 +
149 + return points_on_chin
150 +
151 +
152 +def plot_lines(face_line, image, debug=False):
153 + pil_image = Image.fromarray(image)
154 + if debug:
155 + d = ImageDraw.Draw(pil_image)
156 + d.line(face_line, width=4, fill="white")
157 + pil_image.show()
158 +
159 +
160 +def line_intersection(line1, line2):
161 + # mid = int(len(line1) / 2)
162 + start = 0
163 + end = -1
164 + line1 = ([line1[start][0], line1[start][1]], [line1[end][0], line1[end][1]])
165 +
166 + xdiff = (line1[0][0] - line1[1][0], line2[0][0] - line2[1][0])
167 + ydiff = (line1[0][1] - line1[1][1], line2[0][1] - line2[1][1])
168 + x = []
169 + y = []
170 + flag = False
171 +
172 + def det(a, b):
173 + return a[0] * b[1] - a[1] * b[0]
174 +
175 + div = det(xdiff, ydiff)
176 + if div == 0:
177 + return flag, x, y
178 +
179 + d = (det(*line1), det(*line2))
180 + x = det(d, xdiff) / div
181 + y = det(d, ydiff) / div
182 +
183 + segment_minX = min(line2[0][0], line2[1][0])
184 + segment_maxX = max(line2[0][0], line2[1][0])
185 +
186 + segment_minY = min(line2[0][1], line2[1][1])
187 + segment_maxY = max(line2[0][1], line2[1][1])
188 +
189 + if (
190 + segment_maxX + 1 >= x >= segment_minX - 1
191 + and segment_maxY + 1 >= y >= segment_minY - 1
192 + ):
193 + flag = True
194 +
195 + return flag, x, y
196 +
197 +
198 +def fit_line(x, y, image):
199 + if x[0] == x[1]:
200 + x[0] += 0.1
201 + coefficients = np.polyfit(x, y, 1)
202 + polynomial = np.poly1d(coefficients)
203 + x_axis = np.linspace(0, image.shape[1], 50)
204 + y_axis = polynomial(x_axis)
205 + eye_line = []
206 + for i in range(len(x_axis)):
207 + eye_line.append((x_axis[i], y_axis[i]))
208 +
209 + return eye_line
210 +
211 +
212 +def get_six_points(face_landmark, image):
213 + _, perp_line1, _, _, m = get_line(face_landmark, image, type="nose_mid")
214 + face_b = m
215 +
216 + perp_line, _, _, _, _ = get_line(face_landmark, image, type="perp_line")
217 + points1 = get_points_on_chin(perp_line1, face_landmark)
218 + points = get_points_on_chin(perp_line, face_landmark)
219 + if not points1:
220 + face_e = tuple(np.asarray(points[0]))
221 + elif not points:
222 + face_e = tuple(np.asarray(points1[0]))
223 + else:
224 + face_e = tuple((np.asarray(points[0]) + np.asarray(points1[0])) / 2)
225 + # face_e = points1[0]
226 + nose_mid_line, _, _, _, _ = get_line(face_landmark, image, type="nose_long")
227 +
228 + angle = get_angle(perp_line, nose_mid_line)
229 + # print("angle: ", angle)
230 + nose_mid_line, _, _, _, _ = get_line(face_landmark, image, type="nose_tip")
231 + points = get_points_on_chin(nose_mid_line, face_landmark)
232 + if len(points) < 2:
233 + face_landmark = get_face_ellipse(face_landmark)
234 + # print("extrapolating chin")
235 + points = get_points_on_chin(
236 + nose_mid_line, face_landmark, chin_type="chin_extrapolated"
237 + )
238 + if len(points) < 2:
239 + points = []
240 + points.append(face_landmark["chin"][0])
241 + points.append(face_landmark["chin"][-1])
242 + face_a = points[0]
243 + face_c = points[-1]
244 + # cv2.imshow('j', image)
245 + # cv2.waitKey(0)
246 + nose_mid_line, _, _, _, _ = get_line(face_landmark, image, type="bottom_lip")
247 + points = get_points_on_chin(nose_mid_line, face_landmark)
248 + face_d = points[0]
249 + face_f = points[-1]
250 +
251 + six_points = np.float32([face_a, face_b, face_c, face_f, face_e, face_d])
252 +
253 + return six_points, angle
254 +
255 +
256 +def get_angle(line1, line2):
257 + delta_y = line1[-1][1] - line1[0][1]
258 + delta_x = line1[-1][0] - line1[0][0]
259 + perp_angle = math.degrees(math.atan2(delta_y, delta_x))
260 + if delta_x < 0:
261 + perp_angle = perp_angle + 180
262 + if perp_angle < 0:
263 + perp_angle += 360
264 + if perp_angle > 180:
265 + perp_angle -= 180
266 +
267 + # print("perp", perp_angle)
268 + delta_y = line2[-1][1] - line2[0][1]
269 + delta_x = line2[-1][0] - line2[0][0]
270 + nose_angle = math.degrees(math.atan2(delta_y, delta_x))
271 +
272 + if delta_x < 0:
273 + nose_angle = nose_angle + 180
274 + if nose_angle < 0:
275 + nose_angle += 360
276 + if nose_angle > 180:
277 + nose_angle -= 180
278 + # print("nose", nose_angle)
279 +
280 + angle = nose_angle - perp_angle
281 + return angle
282 +
283 +
284 +def mask_face(image, face_location, six_points, angle, args, type="surgical"):
285 + debug = False
286 +
287 + # Find the face angle
288 + threshold = 13
289 + if angle < -threshold:
290 + type += "_right"
291 + elif angle > threshold:
292 + type += "_left"
293 +
294 + face_height = face_location[2] - face_location[0]
295 + face_width = face_location[1] - face_location[3]
296 + # image = image_raw[
297 + # face_location[0]-int(face_width/2): face_location[2]+int(face_width/2),
298 + # face_location[3]-int(face_height/2): face_location[1]+int(face_height/2),
299 + # :,
300 + # ]
301 + # cv2.imshow('win', image)
302 + # cv2.waitKey(0)
303 + # Read appropriate mask image
304 + w = image.shape[0]
305 + h = image.shape[1]
306 +    if "empty" not in type and "inpaint" not in type:
307 +        cfg = read_cfg(config_filename="masks/masks.cfg", mask_type=type, verbose=False)
308 +    else:
309 +        if "left" in type:
310 +            mask_str = "surgical_blue_left"
311 +        elif "right" in type:
312 +            mask_str = "surgical_blue_right"
313 +        else:
314 +            mask_str = "surgical_blue"
315 +        cfg = read_cfg(config_filename="masks/masks.cfg", mask_type=mask_str, verbose=False)
316 + img = cv2.imread(cfg.template, cv2.IMREAD_UNCHANGED)
317 +
318 + # Process the mask if necessary
319 + if args.pattern:
320 + # Apply pattern to mask
321 + img = texture_the_mask(img, args.pattern, args.pattern_weight)
322 +
323 + if args.color:
324 + # Apply color to mask
325 + img = color_the_mask(img, args.color, args.color_weight)
326 +
327 + mask_line = np.float32(
328 + [cfg.mask_a, cfg.mask_b, cfg.mask_c, cfg.mask_f, cfg.mask_e, cfg.mask_d]
329 + )
330 + # Warp the mask
331 + M, mask = cv2.findHomography(mask_line, six_points)
332 + dst_mask = cv2.warpPerspective(img, M, (h, w))
333 + dst_mask_points = cv2.perspectiveTransform(mask_line.reshape(-1, 1, 2), M)
334 + mask = dst_mask[:, :, 3]
335 + face_height = face_location[2] - face_location[0]
336 + face_width = face_location[1] - face_location[3]
337 + image_face = image[
338 + face_location[0] + int(face_height / 2) : face_location[2],
339 + face_location[3] : face_location[1],
340 + :,
341 + ]
342 +
343 + image_face = image
344 +
345 + # Adjust Brightness
346 + mask_brightness = get_avg_brightness(img)
347 + img_brightness = get_avg_brightness(image_face)
348 + delta_b = 1 + (img_brightness - mask_brightness) / 255
349 + dst_mask = change_brightness(dst_mask, delta_b)
350 +
351 + # Adjust Saturation
352 + mask_saturation = get_avg_saturation(img)
353 + img_saturation = get_avg_saturation(image_face)
354 + delta_s = 1 - (img_saturation - mask_saturation) / 255
355 + dst_mask = change_saturation(dst_mask, delta_s)
356 +
357 + # Apply mask
358 + mask_inv = cv2.bitwise_not(mask)
359 + img_bg = cv2.bitwise_and(image, image, mask=mask_inv)
360 + img_fg = cv2.bitwise_and(dst_mask, dst_mask, mask=mask)
361 + out_img = cv2.add(img_bg, img_fg[:, :, 0:3])
362 + if "empty" in type or "inpaint" in type:
363 + out_img = img_bg
364 + # Plot key points
365 +
366 + if "inpaint" in type:
367 + out_img = cv2.inpaint(out_img, mask, 3, cv2.INPAINT_TELEA)
368 + # dst_NS = cv2.inpaint(img, mask, 3, cv2.INPAINT_NS)
369 +
370 + if debug:
371 + for i in six_points:
372 + cv2.circle(out_img, (i[0], i[1]), radius=4, color=(0, 0, 255), thickness=-1)
373 +
374 + for i in dst_mask_points:
375 + cv2.circle(
376 + out_img, (i[0][0], i[0][1]), radius=4, color=(0, 255, 0), thickness=-1
377 + )
378 +
379 + return out_img, mask
380 +
381 +
382 +def draw_landmarks(face_landmarks, image):
383 + pil_image = Image.fromarray(image)
384 + d = ImageDraw.Draw(pil_image)
385 + for facial_feature in face_landmarks.keys():
386 + d.line(face_landmarks[facial_feature], width=5, fill="white")
387 + pil_image.show()
388 +
389 +
390 +def get_face_ellipse(face_landmark):
391 + chin = face_landmark["chin"]
392 + x = []
393 + y = []
394 + for point in chin:
395 + x.append(point[0])
396 + y.append(point[1])
397 +
398 + x = np.asarray(x)
399 + y = np.asarray(y)
400 +
401 + a = fitEllipse(x, y)
402 + center = ellipse_center(a)
403 + phi = ellipse_angle_of_rotation(a)
404 + axes = ellipse_axis_length(a)
405 + a, b = axes
406 +
407 + arc = 2.2
408 + R = np.arange(0, arc * np.pi, 0.2)
409 + xx = center[0] + a * np.cos(R) * np.cos(phi) - b * np.sin(R) * np.sin(phi)
410 + yy = center[1] + a * np.cos(R) * np.sin(phi) + b * np.sin(R) * np.cos(phi)
411 + chin_extrapolated = []
412 + for i in range(len(R)):
413 + chin_extrapolated.append((xx[i], yy[i]))
414 + face_landmark["chin_extrapolated"] = chin_extrapolated
415 + return face_landmark
416 +
417 +
418 +def get_avg_brightness(img):
419 + img_hsv = cv2.cvtColor(img, cv2.COLOR_BGR2HSV)
420 + h, s, v = cv2.split(img_hsv)
421 + return np.mean(v)
422 +
423 +
424 +def get_avg_saturation(img):
425 + img_hsv = cv2.cvtColor(img, cv2.COLOR_BGR2HSV)
426 + h, s, v = cv2.split(img_hsv)
427 +    return np.mean(s)
428 +
429 +
430 +def change_brightness(img, value=1.0):
431 + img_hsv = cv2.cvtColor(img, cv2.COLOR_BGR2HSV)
432 + h, s, v = cv2.split(img_hsv)
433 + v = value * v
434 + v[v > 255] = 255
435 + v = np.asarray(v, dtype=np.uint8)
436 + final_hsv = cv2.merge((h, s, v))
437 + img = cv2.cvtColor(final_hsv, cv2.COLOR_HSV2BGR)
438 + return img
439 +
440 +
441 +def change_saturation(img, value=1.0):
442 + img_hsv = cv2.cvtColor(img, cv2.COLOR_BGR2HSV)
443 + h, s, v = cv2.split(img_hsv)
444 + s = value * s
445 + s[s > 255] = 255
446 + s = np.asarray(s, dtype=np.uint8)
447 + final_hsv = cv2.merge((h, s, v))
448 + img = cv2.cvtColor(final_hsv, cv2.COLOR_HSV2BGR)
449 + return img
450 +
451 +
452 +def check_path(path):
453 + is_directory = False
454 + is_file = False
455 + is_other = False
456 + if os.path.isdir(path):
457 + is_directory = True
458 + elif os.path.isfile(path):
459 + is_file = True
460 + else:
461 + is_other = True
462 +
463 + return is_directory, is_file, is_other
464 +
465 +
466 +def shape_to_landmarks(shape):
467 + face_landmarks = {}
468 + face_landmarks["left_eyebrow"] = [
469 + tuple(shape[17]),
470 + tuple(shape[18]),
471 + tuple(shape[19]),
472 + tuple(shape[20]),
473 + tuple(shape[21]),
474 + ]
475 + face_landmarks["right_eyebrow"] = [
476 + tuple(shape[22]),
477 + tuple(shape[23]),
478 + tuple(shape[24]),
479 + tuple(shape[25]),
480 + tuple(shape[26]),
481 + ]
482 + face_landmarks["nose_bridge"] = [
483 + tuple(shape[27]),
484 + tuple(shape[28]),
485 + tuple(shape[29]),
486 + tuple(shape[30]),
487 + ]
488 + face_landmarks["nose_tip"] = [
489 + tuple(shape[31]),
490 + tuple(shape[32]),
491 + tuple(shape[33]),
492 + tuple(shape[34]),
493 + tuple(shape[35]),
494 + ]
495 + face_landmarks["left_eye"] = [
496 + tuple(shape[36]),
497 + tuple(shape[37]),
498 + tuple(shape[38]),
499 + tuple(shape[39]),
500 + tuple(shape[40]),
501 + tuple(shape[41]),
502 + ]
503 + face_landmarks["right_eye"] = [
504 + tuple(shape[42]),
505 + tuple(shape[43]),
506 + tuple(shape[44]),
507 + tuple(shape[45]),
508 + tuple(shape[46]),
509 + tuple(shape[47]),
510 + ]
511 + face_landmarks["top_lip"] = [
512 + tuple(shape[48]),
513 + tuple(shape[49]),
514 + tuple(shape[50]),
515 + tuple(shape[51]),
516 + tuple(shape[52]),
517 + tuple(shape[53]),
518 + tuple(shape[54]),
519 + tuple(shape[60]),
520 + tuple(shape[61]),
521 + tuple(shape[62]),
522 + tuple(shape[63]),
523 + tuple(shape[64]),
524 + ]
525 +
526 + face_landmarks["bottom_lip"] = [
527 + tuple(shape[54]),
528 + tuple(shape[55]),
529 + tuple(shape[56]),
530 + tuple(shape[57]),
531 + tuple(shape[58]),
532 + tuple(shape[59]),
533 + tuple(shape[48]),
534 + tuple(shape[64]),
535 + tuple(shape[65]),
536 + tuple(shape[66]),
537 + tuple(shape[67]),
538 + tuple(shape[60]),
539 + ]
540 +
541 + face_landmarks["chin"] = [
542 + tuple(shape[0]),
543 + tuple(shape[1]),
544 + tuple(shape[2]),
545 + tuple(shape[3]),
546 + tuple(shape[4]),
547 + tuple(shape[5]),
548 + tuple(shape[6]),
549 + tuple(shape[7]),
550 + tuple(shape[8]),
551 + tuple(shape[9]),
552 + tuple(shape[10]),
553 + tuple(shape[11]),
554 + tuple(shape[12]),
555 + tuple(shape[13]),
556 + tuple(shape[14]),
557 + tuple(shape[15]),
558 + tuple(shape[16]),
559 + ]
560 + return face_landmarks
561 +
562 +
563 +def rect_to_bb(rect):
564 +    x1 = rect.left()
565 +    x2 = rect.right()
566 +    y1 = rect.top()
567 +    y2 = rect.bottom()
568 +    return (y1, x2, y2, x1)  # (top, right, bottom, left), the order the callers index
569 +
570 +
571 +def mask_image(image_path, args):
572 + # Read the image
573 + image = cv2.imread(image_path)
574 + original_image = image.copy()
575 + # gray = cv2.cvtColor(image, cv2.COLOR_BGR2GRAY)
576 + gray = image
577 + face_locations = args.detector(gray, 1)
578 + mask_type = args.mask_type
579 + verbose = args.verbose
580 + if args.code:
581 + ind = random.randint(0, len(args.code_count) - 1)
582 + mask_dict = args.mask_dict_of_dict[ind]
583 + mask_type = mask_dict["type"]
584 + args.color = mask_dict["color"]
585 + args.pattern = mask_dict["texture"]
586 + args.code_count[ind] += 1
587 +
588 + elif mask_type == "random":
589 + available_mask_types = get_available_mask_types()
590 + mask_type = random.choice(available_mask_types)
591 +
592 + if verbose:
593 + tqdm.write("Faces found: {:2d}".format(len(face_locations)))
594 + # Process each face in the image
595 + masked_images = []
596 + mask_binary_array = []
597 + mask = []
598 + for (i, face_location) in enumerate(face_locations):
599 + shape = args.predictor(gray, face_location)
600 + shape = face_utils.shape_to_np(shape)
601 + face_landmarks = shape_to_landmarks(shape)
602 + face_location = rect_to_bb(face_location)
603 + # draw_landmarks(face_landmarks, image)
604 + six_points_on_face, angle = get_six_points(face_landmarks, image)
605 + mask = []
606 + if mask_type != "all":
607 + if len(masked_images) > 0:
608 + image = masked_images.pop(0)
609 + image, mask_binary = mask_face(
610 + image, face_location, six_points_on_face, angle, args, type=mask_type
611 + )
612 +
613 + # compress to face tight
614 + face_height = face_location[2] - face_location[0]
615 + face_width = face_location[1] - face_location[3]
616 + masked_images.append(image)
617 + mask_binary_array.append(mask_binary)
618 + mask.append(mask_type)
619 + else:
620 + available_mask_types = get_available_mask_types()
621 + for m in range(len(available_mask_types)):
622 + if len(masked_images) == len(available_mask_types):
623 + image = masked_images.pop(m)
624 + img, mask_binary = mask_face(
625 + image,
626 + face_location,
627 + six_points_on_face,
628 + angle,
629 + args,
630 + type=available_mask_types[m],
631 + )
632 + masked_images.insert(m, img)
633 + mask_binary_array.insert(m, mask_binary)
634 + mask = available_mask_types
635 + cc = 1
636 +
637 + return masked_images, mask, mask_binary_array, original_image
638 +
639 +
640 +def is_image(path):
641 + try:
642 + extensions = path[-4:]
643 + image_extensions = ["png", "PNG", "jpg", "JPG"]
644 +
645 + if extensions[1:] in image_extensions:
646 + return True
647 + else:
648 + print("Please input image file. png / jpg")
649 + return False
650 + except:
651 + return False
652 +
653 +
654 +def get_available_mask_types(config_filename="masks/masks.cfg"):
655 + parser = ConfigParser()
656 + parser.optionxform = str
657 + parser.read(config_filename)
658 + available_mask_types = parser.sections()
659 + available_mask_types = [
660 + string for string in available_mask_types if "left" not in string
661 + ]
662 + available_mask_types = [
663 + string for string in available_mask_types if "right" not in string
664 + ]
665 +
666 + return available_mask_types
667 +
668 +
669 +def print_orderly(str, n):
670 + # print("")
671 + hyphens = "-" * int((n - len(str)) / 2)
672 + str_p = hyphens + " " + str + " " + hyphens
673 + hyphens_bar = "-" * len(str_p)
674 + print(hyphens_bar)
675 + print(str_p)
676 + print(hyphens_bar)
677 +
678 +
679 +def display_MaskTheFace():
680 + with open("utils/display.txt", "r") as file:
681 + for line in file:
682 + cc = 1
683 + print(line, end="")
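A minimal end-to-end sketch of the per-face flow in this file (detect with dlib, build the landmark dict, compute the six anchor points, warp one mask type); the image path is illustrative, a SimpleNamespace stands in for the parsed args, and it assumes the dlib model and the masks/ directory are present in the working directory:

import cv2
import dlib
from types import SimpleNamespace
from imutils import face_utils
from utils.aux_functions import shape_to_landmarks, rect_to_bb, get_six_points, mask_face

# Stand-in for the argparse namespace mask_face reads (pattern/color fields only)
args = SimpleNamespace(pattern="", pattern_weight=0.5, color="", color_weight=0.5)

detector = dlib.get_frontal_face_detector()
predictor = dlib.shape_predictor("dlib_models/shape_predictor_68_face_landmarks.dat")

image = cv2.imread("face.jpg")  # illustrative input image
for rect in detector(image, 1):
    shape = face_utils.shape_to_np(predictor(image, rect))
    face_landmarks = shape_to_landmarks(shape)
    six_points, angle = get_six_points(face_landmarks, image)
    masked, _ = mask_face(image, rect_to_bb(rect), six_points, angle, args, type="surgical")
    cv2.imwrite("face_masked.jpg", masked)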
1 +# Author: aqeelanwar
2 +# Created: 6 July,2020, 12:14 AM
3 +# Email: aqeel.anwar@gatech.edu
4 +
5 +from PIL import ImageColor
6 +import cv2
7 +import numpy as np
8 +
9 +COLOR = [
10 + "#fc1c1a",
11 + "#177ABC",
12 + "#94B6D2",
13 + "#A5AB81",
14 + "#DD8047",
15 + "#6b425e",
16 + "#e26d5a",
17 + "#c92c48",
18 + "#6a506d",
19 + "#ffc900",
20 + "#ffffff",
21 + "#000000",
22 + "#49ff00",
23 +]
24 +
25 +
26 +def color_the_mask(mask_image, color, intensity):
27 + assert 0 <= intensity <= 1, "intensity should be between 0 and 1"
28 + RGB_color = ImageColor.getcolor(color, "RGB")
29 + RGB_color = (RGB_color[2], RGB_color[1], RGB_color[0])
30 + orig_shape = mask_image.shape
31 + bit_mask = mask_image[:, :, 3]
32 + mask_image = mask_image[:, :, 0:3]
33 +
34 + color_image = np.full(mask_image.shape, RGB_color, np.uint8)
35 + mask_color = cv2.addWeighted(mask_image, 1 - intensity, color_image, intensity, 0)
36 + mask_color = cv2.bitwise_and(mask_color, mask_color, mask=bit_mask)
37 + colored_mask = np.zeros(orig_shape, dtype=np.uint8)
38 + colored_mask[:, :, 0:3] = mask_color
39 + colored_mask[:, :, 3] = bit_mask
40 + return colored_mask
41 +
42 +
43 +def texture_the_mask(mask_image, texture_path, intensity):
44 + assert 0 <= intensity <= 1, "intensity should be between 0 and 1"
45 + orig_shape = mask_image.shape
46 + bit_mask = mask_image[:, :, 3]
47 + mask_image = mask_image[:, :, 0:3]
48 + texture_image = cv2.imread(texture_path)
49 + texture_image = cv2.resize(texture_image, (orig_shape[1], orig_shape[0]))
50 +
51 + mask_texture = cv2.addWeighted(
52 + mask_image, 1 - intensity, texture_image, intensity, 0
53 + )
54 + mask_texture = cv2.bitwise_and(mask_texture, mask_texture, mask=bit_mask)
55 + textured_mask = np.zeros(orig_shape, dtype=np.uint8)
56 + textured_mask[:, :, 0:3] = mask_texture
57 + textured_mask[:, :, 3] = bit_mask
58 +
59 + return textured_mask
60 +
61 +
62 +
63 +# cloth_mask = cv2.imread("masks/templates/cloth.png", cv2.IMREAD_UNCHANGED)
64 +# # cloth_mask = color_the_mask(cloth_mask, color=COLOR[0], intensity=0.5)
65 +# path = "masks/textures"
66 +# path, dir, files = os.walk(path).__next__()
67 +# first_frame = True
68 +# col_limit = 6
69 +# i = 0
70 +# # img_concat_row=[]
71 +# img_concat = []
72 +# # for f in files:
73 +# # if "._" not in f:
74 +# # print(f)
75 +# # i += 1
76 +# # texture_image = cv2.imread(os.path.join(path, f))
77 +# # m = texture_the_mask(cloth_mask, texture_image, intensity=0.5)
78 +# # if first_frame:
79 +# # img_concat_row = m
80 +# # first_frame = False
81 +# # else:
82 +# # img_concat_row = cv2.hconcat((img_concat_row, m))
83 +# #
84 +# # if i % col_limit == 0:
85 +# # if len(img_concat) > 0:
86 +# # img_concat = cv2.vconcat((img_concat, img_concat_row))
87 +# # else:
88 +# # img_concat = img_concat_row
89 +# # first_frame = True
90 +#
91 +# ## COlor the mask
92 +# thresholds = np.arange(0.1,0.9,0.05)
93 +# for intensity in thresholds:
94 +# c=COLOR[2]
95 +# # intensity = 0.5
96 +# if "._" not in c:
97 +# print(intensity)
98 +# i += 1
99 +# # texture_image = cv2.imread(os.path.join(path, f))
100 +# m = color_the_mask(cloth_mask, c, intensity=intensity)
101 +# if first_frame:
102 +# img_concat_row = m
103 +# first_frame = False
104 +# else:
105 +# img_concat_row = cv2.hconcat((img_concat_row, m))
106 +#
107 +# if i % col_limit == 0:
108 +# if len(img_concat) > 0:
109 +# img_concat = cv2.vconcat((img_concat, img_concat_row))
110 +# else:
111 +# img_concat = img_concat_row
112 +# first_frame = True
113 +#
114 +#
115 +# cv2.imshow("k", img_concat)
116 +# cv2.imwrite("combine_N95_left.png", img_concat)
117 +# cv2.waitKey(0)
118 +# cc = 1
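A minimal usage sketch of color_the_mask and texture_the_mask above; the template and texture paths are the ones referenced elsewhere in the repo, and the output file names are illustrative:

import cv2
from utils.create_mask import color_the_mask, texture_the_mask

# The template must keep its alpha channel, so read it with IMREAD_UNCHANGED
cloth = cv2.imread("masks/templates/cloth.png", cv2.IMREAD_UNCHANGED)

# Tint the mask toward a hex color at 50% intensity
tinted = color_the_mask(cloth, "#0473e2", 0.5)

# Blend a texture image over the mask at 50% intensity
textured = texture_the_mask(cloth, "masks/textures/check/check_4.jpg", 0.5)

cv2.imwrite("cloth_tinted.png", tinted)
cv2.imwrite("cloth_textured.png", textured)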
1 + __ __ _ _______ _ ______
2 +| \/ | | |__ __| | | ____|
3 +| \ / | __ _ ___| | _| | | |__ ___| |__ __ _ ___ ___
4 +| |\/| |/ _` / __| |/ / | | '_ \ / _ \ __/ _` |/ __/ _ \
5 +| | | | (_| \__ \ <| | | | | | __/ | | (_| | (_| __/
6 +|_| |_|\__,_|___/_|\_\_| |_| |_|\___|_| \__,_|\___\___|
1 +# Author: Aqeel Anwar(ICSRL)
2 +# Created: 7/30/2020, 1:44 PM
3 +# Email: aqeel.anwar@gatech.edu
4 +
5 +# Code reused from https://stackoverflow.com/questions/38511444/python-download-files-from-google-drive-using-url
6 +# Make sure you run this from parent folder and not from utils folder i.e.
7 +# python utils/fetch_dataset.py
8 +
9 +import requests, os
10 +from zipfile import ZipFile
11 +import argparse
12 +import urllib
13 +
14 +parser = argparse.ArgumentParser(
15 + description="Download dataset - Python code to download associated datasets"
16 +)
17 +parser.add_argument(
18 + "--dataset",
19 + type=str,
20 + default="mfr2",
21 + help="Name of the dataset - Details on available datasets can be found at GitHub Page",
22 +)
23 +args = parser.parse_args()
24 +
25 +
26 +def download_file_from_google_drive(id, destination):
27 + URL = "https://docs.google.com/uc?export=download"
28 +
29 + session = requests.Session()
30 +
31 + response = session.get(URL, params={"id": id}, stream=True)
32 + token = get_confirm_token(response)
33 +
34 + if token:
35 + params = {"id": id, "confirm": token}
36 + response = session.get(URL, params=params, stream=True)
37 +
38 + save_response_content(response, destination)
39 +
40 +
41 +def get_confirm_token(response):
42 + for key, value in response.cookies.items():
43 + if key.startswith("download_warning"):
44 + return value
45 +
46 + return None
47 +
48 +
49 +def save_response_content(response, destination):
50 + CHUNK_SIZE = 32768
51 + print(destination)
52 + with open(destination, "wb") as f:
53 + for chunk in response.iter_content(CHUNK_SIZE):
54 + if chunk: # filter out keep-alive new chunks
55 + f.write(chunk)
56 +
57 +
58 +def download(t_url):
59 + response = urllib.request.urlopen(t_url)
60 + data = response.read()
61 + txt_str = str(data)
62 + lines = txt_str.split("\\n")
63 + return lines
64 +
65 +
66 +def Convert(lst):
67 + it = iter(lst)
68 + res_dct = dict(zip(it, it))
69 + return res_dct
70 +
71 +
72 +if __name__ == "__main__":
73 + # Fetch the latest download_links.txt file from GitHub
74 + link = "https://raw.githubusercontent.com/aqeelanwar/MaskTheFace/master/datasets/download_links.txt"
75 + links_dict = Convert(
76 + download(link)[0]
77 + .replace(":", "\n")
78 + .replace("b'", "")
79 + .replace("'", "")
80 + .replace(" ", "")
81 + .split("\n")
82 + )
83 + file_id = links_dict[args.dataset]
84 +    destination = os.path.join("datasets", "_.zip")
85 + print("Downloading: ", args.dataset)
86 + download_file_from_google_drive(file_id, destination)
87 + print("Extracting: ", args.dataset)
88 + with ZipFile(destination, "r") as zipObj:
89 + # Extract all the contents of zip file in current directory
90 + zipObj.extractall(destination.rsplit(os.path.sep, 1)[0])
91 +
92 + os.remove(destination)
1 +# Author: aqeelanwar
2 +# Created: 4 May,2020, 1:30 AM
3 +# Email: aqeel.anwar@gatech.edu
4 +
5 +import numpy as np
6 +from numpy.linalg import eig, inv
7 +
8 +def fitEllipse(x,y):
9 + x = x[:,np.newaxis]
10 + y = y[:,np.newaxis]
11 + D = np.hstack((x*x, x*y, y*y, x, y, np.ones_like(x)))
12 + S = np.dot(D.T,D)
13 + C = np.zeros([6,6])
14 + C[0,2] = C[2,0] = 2; C[1,1] = -1
15 + E, V = eig(np.dot(inv(S), C))
16 + n = np.argmax(np.abs(E))
17 + a = V[:,n]
18 + return a
19 +
20 +def ellipse_center(a):
21 + b,c,d,f,g,a = a[1]/2, a[2], a[3]/2, a[4]/2, a[5], a[0]
22 + num = b*b-a*c
23 + x0=(c*d-b*f)/num
24 + y0=(a*f-b*d)/num
25 + return np.array([x0,y0])
26 +
27 +
28 +def ellipse_angle_of_rotation( a ):
29 + b,c,d,f,g,a = a[1]/2, a[2], a[3]/2, a[4]/2, a[5], a[0]
30 + return 0.5*np.arctan(2*b/(a-c))
31 +
32 +
33 +def ellipse_axis_length( a ):
34 + b,c,d,f,g,a = a[1]/2, a[2], a[3]/2, a[4]/2, a[5], a[0]
35 + up = 2*(a*f*f+c*d*d+g*b*b-2*b*d*f-a*c*g)
36 + down1=(b*b-a*c)*( (c-a)*np.sqrt(1+4*b*b/((a-c)*(a-c)))-(c+a))
37 + down2=(b*b-a*c)*( (a-c)*np.sqrt(1+4*b*b/((a-c)*(a-c)))-(c+a))
38 + res1=np.sqrt(up/down1)
39 + res2=np.sqrt(up/down2)
40 + return np.array([res1, res2])
41 +
42 +def ellipse_angle_of_rotation2( a ):
43 + b,c,d,f,g,a = a[1]/2, a[2], a[3]/2, a[4]/2, a[5], a[0]
44 + if b == 0:
45 + if a > c:
46 + return 0
47 + else:
48 + return np.pi/2
49 + else:
50 + if a > c:
51 + return np.arctan(2*b/(a-c))/2
52 + else:
53 + return np.pi/2 + np.arctan(2*b/(a-c))/2
54 +
55 +# a = fitEllipse(x,y)
56 +# center = ellipse_center(a)
57 +# #phi = ellipse_angle_of_rotation(a)
58 +# phi = ellipse_angle_of_rotation2(a)
59 +# axes = ellipse_axis_length(a)
60 +#
61 +# print("center = ", center)
62 +# print("angle of rotation = ", phi)
63 +# print("axes = ", axes)
64 +
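The commented block above sketches the intended call order; a self-contained version on synthetic, lightly noised ellipse points (assuming the module is importable as utils.fit_ellipse):

import numpy as np
from utils.fit_ellipse import fitEllipse, ellipse_center, ellipse_angle_of_rotation2, ellipse_axis_length

# Synthetic points on an ellipse centered at (3, 2), semi-axes 5 and 2, rotated 30 degrees,
# with a little noise so the scatter matrix in fitEllipse stays well-conditioned
rng = np.random.default_rng(0)
t = np.linspace(0, 2 * np.pi, 60)
phi_true = np.deg2rad(30)
x = 3 + 5 * np.cos(t) * np.cos(phi_true) - 2 * np.sin(t) * np.sin(phi_true) + rng.normal(0, 0.01, t.shape)
y = 2 + 5 * np.cos(t) * np.sin(phi_true) + 2 * np.sin(t) * np.cos(phi_true) + rng.normal(0, 0.01, t.shape)

a = fitEllipse(x, y)
print("center =", ellipse_center(a))               # roughly [3, 2]
print("angle  =", ellipse_angle_of_rotation2(a))   # roughly 0.52 rad (30 degrees)
print("axes   =", ellipse_axis_length(a))          # roughly [5, 2] (ordering may vary)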
1 +# Author: aqeelanwar
2 +# Created: 2 May,2020, 2:49 AM
3 +# Email: aqeel.anwar@gatech.edu
4 +
5 +from tkinter import filedialog
6 +from tkinter import *
7 +import cv2, os
8 +
9 +mouse_pts = []
10 +
11 +
12 +def get_mouse_points(event, x, y, flags, param):
13 + global mouseX, mouseY, mouse_pts
14 + if event == cv2.EVENT_LBUTTONDOWN:
15 + mouseX, mouseY = x, y
16 + cv2.circle(mask_im, (x, y), 10, (0, 255, 255), 10)
17 + if "mouse_pts" not in globals():
18 + mouse_pts = []
19 + mouse_pts.append((x, y))
20 + # print("Point detected")
21 + # print((x,y))
22 +
23 +
24 +root = Tk()
25 +filename = filedialog.askopenfilename(
26 + initialdir="/",
27 + title="Select file",
28 + filetypes=(("PNG files", "*.PNG"), ("png files", "*.png"), ("All files", "*.*")),
29 +)
30 +root.destroy()
31 +filename_split = os.path.split(filename)
32 +folder = filename_split[0]
33 +file = filename_split[1]
34 +file_split = file.split(".")
35 +new_filename = folder + "/" + file_split[0] + "_marked." + file_split[-1]
36 +mask_im = cv2.imread(filename)
37 +cv2.namedWindow("Mask")
38 +cv2.setMouseCallback("Mask", get_mouse_points)
39 +
40 +while True:
41 + cv2.imshow("Mask", mask_im)
42 + cv2.waitKey(1)
43 + if len(mouse_pts) == 6:
44 + cv2.destroyWindow("Mask")
45 + break
46 + first_frame_display = False
47 +points = mouse_pts
48 +print(points)
49 +print("----------------------------------------------------------------")
50 +print("Copy the following code and paste it in masks.cfg")
51 +print("----------------------------------------------------------------")
52 +name_points = ["a", "b", "c", "d", "e", "f"]
53 +
54 +mask_title = "[" + file_split[0] + "]"
55 +print(mask_title)
56 +print("template: ", filename)
57 +for i in range(len(mouse_pts)):
58 + name = (
59 + "mask_"
60 + + name_points[i]
61 + + ": "
62 + + str(mouse_pts[i][0])
63 + + ","
64 + + str(mouse_pts[i][1])
65 + )
66 + print(name)
67 +
68 +cv2.imwrite(new_filename, mask_im)
1 +# Author: Aqeel Anwar(ICSRL)
2 +# Created: 9/20/2019, 12:43 PM
3 +# Email: aqeel.anwar@gatech.edu
4 +
5 +from configparser import ConfigParser
6 +from dotmap import DotMap
7 +
8 +
9 +def ConvertIfStringIsInt(input_string):
10 + try:
11 + float(input_string)
12 +
13 + try:
14 + if int(input_string) == float(input_string):
15 + return int(input_string)
16 + else:
17 + return float(input_string)
18 + except ValueError:
19 + return float(input_string)
20 +
21 + except ValueError:
22 + return input_string
23 +
24 +
25 +def read_cfg(config_filename="masks/masks.cfg", mask_type="surgical", verbose=False):
26 + parser = ConfigParser()
27 + parser.optionxform = str
28 + parser.read(config_filename)
29 + cfg = DotMap()
30 + section_name = mask_type
31 +
32 + if verbose:
33 + hyphens = "-" * int((80 - len(config_filename)) / 2)
34 + print(hyphens + " " + config_filename + " " + hyphens)
35 +
36 + # for section_name in parser.sections():
37 +
38 + if verbose:
39 + print("[" + section_name + "]")
40 + for name, value in parser.items(section_name):
41 + value = ConvertIfStringIsInt(value)
42 + if name != "template":
43 + cfg[name] = tuple(int(s) for s in value.split(","))
44 + else:
45 + cfg[name] = value
46 + spaces = " " * (30 - len(name))
47 + if verbose:
48 + print(name + ":" + spaces + str(cfg[name]))
49 +
50 + return cfg
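A minimal usage sketch of read_cfg above: template entries stay strings while mask_* entries become integer tuples (assuming the masks/masks.cfg shipped with the repo):

from utils.read_cfg import read_cfg

cfg = read_cfg(config_filename="masks/masks.cfg", mask_type="surgical", verbose=False)
print(cfg.template)   # masks/templates/surgical.png
print(cfg.mask_a)     # (21, 97)
print(cfg.mask_f)     # (600, 323)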
1 +{
2 + "cells": [
3 + {
4 + "cell_type": "code",
5 + "execution_count": 18,
6 + "metadata": {},
7 + "outputs": [],
8 + "source": [
9 + "import torch\n",
10 + "import torch.nn as nn\n",
11 + "from torch.nn import Parameter\n",
12 + "import torch.nn.functional as F\n",
13 + "from torchvision import transforms as tf\n",
14 + "import torch.utils.data as data\n",
15 + "\n",
16 + "import os\n",
17 + "import cv2\n",
18 + "import functools\n",
19 + "import numpy as np\n",
20 + "from PIL import Image\n",
21 + "import matplotlib.pyplot as plt"
22 + ]
23 + },
24 + {
25 + "cell_type": "code",
26 + "execution_count": 1,
27 + "metadata": {},
28 + "outputs": [],
29 + "source": [
30 + "from models import vgg19"
31 + ]
32 + },
33 + {
34 + "cell_type": "code",
35 + "execution_count": 14,
36 + "metadata": {},
37 + "outputs": [],
38 + "source": [
39 + "model = vgg19(pretrained=True).features[:-2]\n",
40 + "\n",
41 + "model = model.eval()"
42 + ]
43 + },
44 + {
45 + "cell_type": "code",
46 + "execution_count": 15,
47 + "metadata": {},
48 + "outputs": [
49 + {
50 + "data": {
51 + "text/plain": [
52 + "Sequential(\n",
53 + " (0): Conv2d(3, 64, kernel_size=(3, 3), stride=(1, 1), padding=(1, 1))\n",
54 + " (1): ReLU(inplace=True)\n",
55 + " (2): Conv2d(64, 64, kernel_size=(3, 3), stride=(1, 1), padding=(1, 1))\n",
56 + " (3): ReLU(inplace=True)\n",
57 + " (4): MaxPool2d(kernel_size=2, stride=2, padding=0, dilation=1, ceil_mode=False)\n",
58 + " (5): Conv2d(64, 128, kernel_size=(3, 3), stride=(1, 1), padding=(1, 1))\n",
59 + " (6): ReLU(inplace=True)\n",
60 + " (7): Conv2d(128, 128, kernel_size=(3, 3), stride=(1, 1), padding=(1, 1))\n",
61 + " (8): ReLU(inplace=True)\n",
62 + " (9): MaxPool2d(kernel_size=2, stride=2, padding=0, dilation=1, ceil_mode=False)\n",
63 + " (10): Conv2d(128, 256, kernel_size=(3, 3), stride=(1, 1), padding=(1, 1))\n",
64 + " (11): ReLU(inplace=True)\n",
65 + " (12): Conv2d(256, 256, kernel_size=(3, 3), stride=(1, 1), padding=(1, 1))\n",
66 + " (13): ReLU(inplace=True)\n",
67 + " (14): Conv2d(256, 256, kernel_size=(3, 3), stride=(1, 1), padding=(1, 1))\n",
68 + " (15): ReLU(inplace=True)\n",
69 + " (16): Conv2d(256, 256, kernel_size=(3, 3), stride=(1, 1), padding=(1, 1))\n",
70 + " (17): ReLU(inplace=True)\n",
71 + " (18): MaxPool2d(kernel_size=2, stride=2, padding=0, dilation=1, ceil_mode=False)\n",
72 + " (19): Conv2d(256, 512, kernel_size=(3, 3), stride=(1, 1), padding=(1, 1))\n",
73 + " (20): ReLU(inplace=True)\n",
74 + " (21): Conv2d(512, 512, kernel_size=(3, 3), stride=(1, 1), padding=(1, 1))\n",
75 + " (22): ReLU(inplace=True)\n",
76 + " (23): Conv2d(512, 512, kernel_size=(3, 3), stride=(1, 1), padding=(1, 1))\n",
77 + " (24): ReLU(inplace=True)\n",
78 + " (25): Conv2d(512, 512, kernel_size=(3, 3), stride=(1, 1), padding=(1, 1))\n",
79 + " (26): ReLU(inplace=True)\n",
80 + " (27): MaxPool2d(kernel_size=2, stride=2, padding=0, dilation=1, ceil_mode=False)\n",
81 + " (28): Conv2d(512, 512, kernel_size=(3, 3), stride=(1, 1), padding=(1, 1))\n",
82 + " (29): ReLU(inplace=True)\n",
83 + " (30): Conv2d(512, 512, kernel_size=(3, 3), stride=(1, 1), padding=(1, 1))\n",
84 + " (31): ReLU(inplace=True)\n",
85 + " (32): Conv2d(512, 512, kernel_size=(3, 3), stride=(1, 1), padding=(1, 1))\n",
86 + " (33): ReLU(inplace=True)\n",
87 + " (34): Conv2d(512, 512, kernel_size=(3, 3), stride=(1, 1), padding=(1, 1))\n",
88 + ")"
89 + ]
90 + },
91 + "execution_count": 15,
92 + "metadata": {},
93 + "output_type": "execute_result"
94 + }
95 + ],
96 + "source": [
97 + "model"
98 + ]
99 + },
100 + {
101 + "cell_type": "code",
102 + "execution_count": 9,
103 + "metadata": {},
104 + "outputs": [],
105 + "source": [
106 + "img = torch.rand(4,3,256,256)"
107 + ]
108 + },
109 + {
110 + "cell_type": "code",
111 + "execution_count": 10,
112 + "metadata": {},
113 + "outputs": [
114 + {
115 + "data": {
116 + "text/plain": [
117 + "torch.Size([4, 512, 8, 8])"
118 + ]
119 + },
120 + "execution_count": 10,
121 + "metadata": {},
122 + "output_type": "execute_result"
123 + }
124 + ],
125 + "source": [
126 + "out = model(img)\n",
127 + "out.shape"
128 + ]
129 + },
130 + {
131 + "cell_type": "code",
132 + "execution_count": 19,
133 + "metadata": {},
134 + "outputs": [],
135 + "source": [
136 + "class GatedConv2d(nn.Module):\n",
137 + " def __init__(self, in_channels, out_channels, kernel_size, stride = 1, padding = 0, dilation = 1, activation = 'lrelu', norm = 'in'):\n",
138 + " super(GatedConv2d, self).__init__()\n",
139 + " self.pad = nn.ZeroPad2d(padding)\n",
140 + " if norm is not None:\n",
141 + " self.norm = nn.InstanceNorm2d(out_channels)\n",
142 + " else:\n",
143 + " self.norm = None\n",
144 + " \n",
145 + " if activation == 'tanh':\n",
146 + " self.activation = nn.Tanh()\n",
147 + " else:\n",
148 + " self.activation = nn.LeakyReLU(0.2, inplace = True)\n",
149 + " \n",
150 + " \n",
151 + " self.conv2d = nn.Conv2d(in_channels, out_channels, kernel_size, stride, padding = 0, dilation = dilation)\n",
152 + " self.mask_conv2d = nn.Conv2d(in_channels, out_channels, kernel_size, stride, padding = 0, dilation = dilation)\n",
153 + " self.sigmoid = torch.nn.Sigmoid()\n",
154 + " \n",
155 + " def forward(self, x):\n",
156 + " x = self.pad(x)\n",
157 + " conv = self.conv2d(x)\n",
158 + " mask = self.mask_conv2d(x)\n",
159 + " gated_mask = self.sigmoid(mask)\n",
160 + " x = conv * gated_mask\n",
161 + " if self.norm:\n",
162 + " x = self.norm(x)\n",
163 + " if self.activation:\n",
164 + " x = self.activation(x)\n",
165 + " return x\n",
166 + "\n",
167 + "class TransposeGatedConv2d(nn.Module):\n",
168 + " def __init__(self, in_channels, out_channels, kernel_size, stride = 1, padding = 0, dilation = 1, norm=None, scale_factor = 2):\n",
169 + " super(TransposeGatedConv2d, self).__init__()\n",
170 + " # Initialize the conv scheme\n",
171 + " self.scale_factor = scale_factor\n",
172 + " self.gated_conv2d = GatedConv2d(in_channels, out_channels, kernel_size, stride, padding, dilation, norm=norm)\n",
173 + " \n",
174 + " def forward(self, x):\n",
175 + " x = F.interpolate(x, scale_factor = self.scale_factor, mode = 'nearest')\n",
176 + " x = self.gated_conv2d(x)\n",
177 + " return x"
178 + ]
179 + },
180 + {
181 + "cell_type": "code",
182 + "execution_count": 20,
183 + "metadata": {},
184 + "outputs": [],
185 + "source": [
186 + "class GatedGenerator(nn.Module):\n",
187 + " def __init__(self, in_channels=4, latent_channels=64, out_channels=3):\n",
188 + " super(GatedGenerator, self).__init__()\n",
189 + " self.coarse = nn.Sequential(\n",
190 + " # encoder\n",
191 + " GatedConv2d(in_channels, latent_channels, 7, 1, 3, norm = None),\n",
192 + " GatedConv2d(latent_channels, latent_channels * 2, 4, 2, 1),\n",
193 + " GatedConv2d(latent_channels * 2, latent_channels * 4, 3, 1, 1),\n",
194 + " GatedConv2d(latent_channels * 4, latent_channels * 4, 4, 2, 1),\n",
195 + " # Bottleneck\n",
196 + " GatedConv2d(latent_channels * 4, latent_channels * 4, 3, 1, 1),\n",
197 + " GatedConv2d(latent_channels * 4, latent_channels * 4, 3, 1, 1),\n",
198 + " GatedConv2d(latent_channels * 4, latent_channels * 4, 3, 1, 2, dilation = 2),\n",
199 + " GatedConv2d(latent_channels * 4, latent_channels * 4, 3, 1, 4, dilation = 4),\n",
200 + " GatedConv2d(latent_channels * 4, latent_channels * 4, 3, 1, 8, dilation = 8),\n",
201 + " GatedConv2d(latent_channels * 4, latent_channels * 4, 3, 1, 16, dilation = 16),\n",
202 + " GatedConv2d(latent_channels * 4, latent_channels * 4, 3, 1, 1),\n",
203 + " GatedConv2d(latent_channels * 4, latent_channels * 4, 3, 1, 1),\n",
204 + " # decoder\n",
205 + " TransposeGatedConv2d(latent_channels * 4, latent_channels * 2, 3, 1, 1),\n",
206 + " GatedConv2d(latent_channels * 2, latent_channels * 2, 3, 1, 1),\n",
207 + " TransposeGatedConv2d(latent_channels * 2, latent_channels, 3, 1, 1),\n",
208 + " GatedConv2d(latent_channels, out_channels, 7, 1, 3, activation = 'tanh', norm = None)\n",
209 + " )\n",
210 + " self.refinement = nn.Sequential(\n",
211 + " # encoder\n",
212 + " GatedConv2d(in_channels, latent_channels, 7, 1, 3, norm = None),\n",
213 + " GatedConv2d(latent_channels, latent_channels * 2, 4, 2, 1),\n",
214 + " GatedConv2d(latent_channels * 2, latent_channels * 4, 3, 1, 1),\n",
215 + " GatedConv2d(latent_channels * 4, latent_channels * 4, 4, 2, 1),\n",
216 + " # Bottleneck\n",
217 + " GatedConv2d(latent_channels * 4, latent_channels * 4, 3, 1, 1),\n",
218 + " GatedConv2d(latent_channels * 4, latent_channels * 4, 3, 1, 1),\n",
219 + " GatedConv2d(latent_channels * 4, latent_channels * 4, 3, 1, 2, dilation = 2),\n",
220 + " GatedConv2d(latent_channels * 4, latent_channels * 4, 3, 1, 4, dilation = 4),\n",
221 + " GatedConv2d(latent_channels * 4, latent_channels * 4, 3, 1, 8, dilation = 8),\n",
222 + " GatedConv2d(latent_channels * 4, latent_channels * 4, 3, 1, 16, dilation = 16),\n",
223 + " GatedConv2d(latent_channels * 4, latent_channels * 4, 3, 1, 1),\n",
224 + " GatedConv2d(latent_channels * 4, latent_channels * 4, 3, 1, 1),\n",
225 + " # decoder\n",
226 + " TransposeGatedConv2d(latent_channels * 4, latent_channels * 2, 3, 1, 1),\n",
227 + " GatedConv2d(latent_channels * 2, latent_channels * 2, 3, 1, 1),\n",
228 + " TransposeGatedConv2d(latent_channels * 2, latent_channels, 3, 1, 1),\n",
229 + " GatedConv2d(latent_channels, out_channels, 7, 1, 3, activation = 'tanh', norm = None)\n",
230 + " )\n",
231 + " \n",
232 + " def forward(self, img, mask):\n",
233 + " # img: entire img\n",
234 + " # mask: 1 for mask region; 0 for unmask region\n",
235 + " # 1 - mask: unmask\n",
236 + " # img * (1 - mask): ground truth unmask region\n",
237 + " # Coarse\n",
238 + " \n",
239 + " first_masked_img = img * (1 - mask) + mask\n",
240 + " first_in = torch.cat((first_masked_img, mask), 1) # in: [B, 4, H, W]\n",
241 + " first_out = self.coarse(first_in) # out: [B, 3, H, W]\n",
242 + " # Refinement\n",
243 + " second_masked_img = img * (1 - mask) + first_out * mask\n",
244 + " second_in = torch.cat((second_masked_img, mask), 1) # in: [B, 4, H, W]\n",
245 + " second_out = self.refinement(second_in) # out: [B, 3, H, W]\n",
246 + " return first_out, second_out"
247 + ]
248 + },
249 + {
250 + "cell_type": "code",
251 + "execution_count": 21,
252 + "metadata": {},
253 + "outputs": [],
254 + "source": [
255 + "class NLayerDiscriminator(nn.Module):\n",
256 + " def __init__(self, input_nc, ndf=64, n_layers=3, norm_layer=nn.BatchNorm2d, use_sigmoid=False):\n",
257 + " super(NLayerDiscriminator, self).__init__()\n",
258 + " if type(norm_layer) == functools.partial:\n",
259 + " use_bias = norm_layer.func == nn.InstanceNorm2d\n",
260 + " else:\n",
261 + " use_bias = norm_layer == nn.InstanceNorm2d\n",
262 + "\n",
263 + " kw = 4\n",
264 + " padw = 1\n",
265 + " sequence = [\n",
266 + " nn.Conv2d(input_nc, ndf, kernel_size=kw, stride=2, padding=padw),\n",
267 + " nn.LeakyReLU(0.2, True)\n",
268 + " ]\n",
269 + "\n",
270 + " nf_mult = 1\n",
271 + " nf_mult_prev = 1\n",
272 + " for n in range(1, n_layers):\n",
273 + " nf_mult_prev = nf_mult\n",
274 + " nf_mult = min(2**n, 8)\n",
275 + " sequence += [\n",
276 + " nn.Conv2d(ndf * nf_mult_prev, ndf * nf_mult,\n",
277 + " kernel_size=kw, stride=2, padding=padw, bias=use_bias),\n",
278 + " norm_layer(ndf * nf_mult),\n",
279 + " nn.LeakyReLU(0.2, True)\n",
280 + " ]\n",
281 + "\n",
282 + " nf_mult_prev = nf_mult\n",
283 + " nf_mult = min(2**n_layers, 8)\n",
284 + " sequence += [\n",
285 + " nn.Conv2d(ndf * nf_mult_prev, ndf * nf_mult,\n",
286 + " kernel_size=kw, stride=1, padding=padw, bias=use_bias),\n",
287 + " norm_layer(ndf * nf_mult),\n",
288 + " nn.LeakyReLU(0.2, True)\n",
289 + " ]\n",
290 + "\n",
291 + " sequence += [nn.Conv2d(ndf * nf_mult, 1, kernel_size=kw, stride=1, padding=padw)]\n",
292 + "\n",
293 + " if use_sigmoid:\n",
294 + " sequence += [nn.Sigmoid()]\n",
295 + "\n",
296 + " self.model = nn.Sequential(*sequence)\n",
297 + "\n",
298 + " def forward(self, input):\n",
299 + " return self.model(input)"
300 + ]
301 + },
302 + {
303 + "cell_type": "code",
304 + "execution_count": 22,
305 + "metadata": {},
306 + "outputs": [],
307 + "source": [
308 + "class PerceptualNet(nn.Module):\n",
309 + " def __init__(self):\n",
310 + " super(PerceptualNet, self).__init__()\n",
311 + " self.features = nn.Sequential(\n",
312 + " nn.Conv2d(3, 64, 3, 1, 1),\n",
313 + " nn.ReLU(inplace = True),\n",
314 + " nn.Conv2d(64, 64, 3, 1, 1),\n",
315 + " nn.ReLU(inplace = True),\n",
316 + " nn.MaxPool2d(2, 2),\n",
317 + " nn.Conv2d(64, 128, 3, 1, 1),\n",
318 + " nn.ReLU(inplace = True),\n",
319 + " nn.Conv2d(128, 128, 3, 1, 1),\n",
320 + " nn.ReLU(inplace = True),\n",
321 + " nn.MaxPool2d(2, 2),\n",
322 + " nn.Conv2d(128, 256, 3, 1, 1),\n",
323 + " nn.ReLU(inplace = True),\n",
324 + " nn.Conv2d(256, 256, 3, 1, 1),\n",
325 + " nn.ReLU(inplace = True),\n",
326 + " nn.Conv2d(256, 256, 3, 1, 1),\n",
327 + " nn.MaxPool2d(2, 2),\n",
328 + " nn.Conv2d(256, 512, 3, 1, 1),\n",
329 + " nn.ReLU(inplace = True),\n",
330 + " nn.Conv2d(512, 512, 3, 1, 1),\n",
331 + " nn.ReLU(inplace = True),\n",
332 + " nn.Conv2d(512, 512, 3, 1, 1)\n",
333 + " )\n",
334 + "\n",
335 + " def forward(self, x):\n",
336 + " x = self.features(x)\n",
337 + " return x"
338 + ]
339 + },
340 + {
341 + "cell_type": "code",
342 + "execution_count": 6,
343 + "metadata": {},
344 + "outputs": [],
345 + "source": [
346 + "class GANLoss(nn.Module):\n",
347 + " def __init__(self, target_real_label=1.0, target_fake_label=0.0):\n",
348 + " super(GANLoss, self).__init__()\n",
349 + " self.register_buffer('real_label', torch.tensor(target_real_label))\n",
350 + " self.register_buffer('fake_label', torch.tensor(target_fake_label))\n",
351 + " self.loss = nn.BCELoss()\n",
352 + "\n",
353 + " def get_target_tensor(self, input, target_is_real):\n",
354 + " if target_is_real:\n",
355 + " target_tensor = self.real_label\n",
356 + " else:\n",
357 + " target_tensor = self.fake_label\n",
358 + " return target_tensor.expand_as(input)\n",
359 + "\n",
360 + " def __call__(self, input, target_is_real):\n",
361 + " target_tensor = self.get_target_tensor(input, target_is_real)\n",
362 + " return self.loss(input, target_tensor)"
363 + ]
364 + },
365 + {
366 + "cell_type": "code",
367 + "execution_count": 7,
368 + "metadata": {},
369 + "outputs": [],
370 + "source": [
371 + "class InpaintDataset(data.Dataset):\n",
372 + " def __init__(self, img_dir):\n",
373 + " self.img_dir = img_dir\n",
374 + " self.load_images()\n",
375 + " \n",
376 + " def load_images(self):\n",
377 + " self.fns =[]\n",
378 + " img_paths = sorted(os.listdir(self.img_dir))\n",
379 + " for path in img_paths:\n",
380 + " self.fns.append(os.path.join(self.img_dir, path))\n",
381 + " \n",
382 + " def __getitem__(self, index):\n",
383 + " img_path = self.fns[index]\n",
384 + " img = cv2.imread(img_path)\n",
385 + " img = cv2.cvtColor(img, cv2.COLOR_BGR2RGB)\n",
386 + " img = cv2.resize(img, (256,256))\n",
387 + " \n",
388 + " mask = self.random_ff_mask()\n",
389 + " img = torch.from_numpy(img.astype(np.float32) / 255.0).permute(2, 0, 1).contiguous()\n",
390 + " mask = torch.from_numpy(mask.astype(np.float32)).contiguous()\n",
391 + " return img, mask\n",
392 + " \n",
393 + " def collate_fn(self, batch):\n",
394 + " imgs = torch.stack([i[0] for i in batch])\n",
395 + " masks = torch.stack([i[1] for i in batch])\n",
396 + " return {\n",
397 + " 'imgs': imgs,\n",
398 + " 'masks': masks\n",
399 + " }\n",
400 + " \n",
401 + " def __len__(self):\n",
402 + " return len(self.fns)\n",
403 + " \n",
404 + " def random_ff_mask(self, shape =256 , max_angle = 4, max_len = 40, max_width = 10, times = 15):\n",
405 +    "        \"\"\"Generate a random free-form mask by drawing random brush strokes.\n",
406 +    "        Args:\n",
407 +    "            shape: height/width of the square mask; max_angle, max_len, max_width:\n",
408 +    "            bounds on stroke angle, length and width; times: max number of strokes.\n",
409 +    "        Returns:\n",
410 +    "            np.ndarray of shape (1, shape, shape), 1.0 inside the strokes.\n",
411 + " \"\"\"\n",
412 + " height = shape\n",
413 + " width = shape\n",
414 + " mask = np.zeros((height, width), np.float32)\n",
415 + " times = np.random.randint(times)\n",
416 + " for i in range(times):\n",
417 + " start_x = np.random.randint(width)\n",
418 + " start_y = np.random.randint(height)\n",
419 + " for j in range(1 + np.random.randint(5)):\n",
420 + " angle = 0.01 + np.random.randint(max_angle)\n",
421 + " if i % 2 == 0:\n",
422 + " angle = 2 * 3.1415926 - angle\n",
423 + " length = 10 + np.random.randint(max_len)\n",
424 + " brush_w = 5 + np.random.randint(max_width)\n",
425 + " end_x = (start_x + length * np.sin(angle)).astype(np.int32)\n",
426 + " end_y = (start_y + length * np.cos(angle)).astype(np.int32)\n",
427 + " cv2.line(mask, (start_y, start_x), (end_y, end_x), 1.0, brush_w)\n",
428 + " start_x, start_y = end_x, end_y\n",
429 + " return mask.reshape((1, ) + mask.shape).astype(np.float32)"
430 + ]
431 + },
432 + {
433 + "cell_type": "code",
434 + "execution_count": null,
435 + "metadata": {},
436 + "outputs": [],
437 + "source": [
438 + "dataset = InpaintDataset(img_dir='datasets/places365standard_easyformat/places365_standard/train/waterfall')\n",
439 + "dataloader = data.DataLoader(dataset, batch_size=4, collate_fn = dataset.collate_fn)"
440 + ]
441 + },
442 + {
443 + "cell_type": "code",
444 + "execution_count": null,
445 + "metadata": {},
446 + "outputs": [],
447 + "source": [
448 + "for batch in dataloader:\n",
449 + " imgs = batch['imgs']\n",
450 + " masks = batch['masks']\n",
451 + " \n",
452 + " break"
453 + ]
454 + },
455 + {
456 + "cell_type": "code",
457 + "execution_count": 8,
458 + "metadata": {},
459 + "outputs": [],
460 + "source": [
461 + "device = torch.device('cuda')"
462 + ]
463 + },
464 + {
465 + "cell_type": "code",
466 + "execution_count": 23,
467 + "metadata": {},
468 + "outputs": [
469 + {
470 + "ename": "NameError",
471 + "evalue": "name 'GANLoss' is not defined",
472 + "output_type": "error",
473 + "traceback": [
474 + "\u001b[1;31m---------------------------------------------------------------------------\u001b[0m",
475 + "\u001b[1;31mNameError\u001b[0m Traceback (most recent call last)",
476 + "\u001b[1;32m<ipython-input-23-bdcc75eef256>\u001b[0m in \u001b[0;36m<module>\u001b[1;34m\u001b[0m\n\u001b[0;32m 2\u001b[0m \u001b[0mmodel_D\u001b[0m \u001b[1;33m=\u001b[0m \u001b[0mNLayerDiscriminator\u001b[0m\u001b[1;33m(\u001b[0m\u001b[1;36m3\u001b[0m\u001b[1;33m,\u001b[0m \u001b[0muse_sigmoid\u001b[0m\u001b[1;33m=\u001b[0m\u001b[1;32mTrue\u001b[0m\u001b[1;33m)\u001b[0m\u001b[1;33m\u001b[0m\u001b[1;33m\u001b[0m\u001b[0m\n\u001b[0;32m 3\u001b[0m \u001b[0mmodel_P\u001b[0m \u001b[1;33m=\u001b[0m \u001b[0mPerceptualNet\u001b[0m\u001b[1;33m(\u001b[0m\u001b[1;33m)\u001b[0m\u001b[1;33m\u001b[0m\u001b[1;33m\u001b[0m\u001b[0m\n\u001b[1;32m----> 4\u001b[1;33m \u001b[0mcriterion_adv\u001b[0m \u001b[1;33m=\u001b[0m \u001b[0mGANLoss\u001b[0m\u001b[1;33m(\u001b[0m\u001b[1;33m)\u001b[0m\u001b[1;33m\u001b[0m\u001b[1;33m\u001b[0m\u001b[0m\n\u001b[0m\u001b[0;32m 5\u001b[0m \u001b[0mcriterion_rec\u001b[0m \u001b[1;33m=\u001b[0m \u001b[0mnn\u001b[0m\u001b[1;33m.\u001b[0m\u001b[0mMSELoss\u001b[0m\u001b[1;33m(\u001b[0m\u001b[1;33m)\u001b[0m\u001b[1;33m\u001b[0m\u001b[1;33m\u001b[0m\u001b[0m\n\u001b[0;32m 6\u001b[0m \u001b[0mcriterion_per\u001b[0m \u001b[1;33m=\u001b[0m \u001b[0mnn\u001b[0m\u001b[1;33m.\u001b[0m\u001b[0mL1Loss\u001b[0m\u001b[1;33m(\u001b[0m\u001b[1;33m)\u001b[0m\u001b[1;33m\u001b[0m\u001b[1;33m\u001b[0m\u001b[0m\n",
477 + "\u001b[1;31mNameError\u001b[0m: name 'GANLoss' is not defined"
478 + ]
479 + }
480 + ],
481 + "source": [
482 + "model_G = GatedGenerator()\n",
483 + "model_D = NLayerDiscriminator(3, use_sigmoid=True)\n",
484 + "model_P = PerceptualNet()\n",
485 + "criterion_adv = GANLoss()\n",
486 + "criterion_rec = nn.MSELoss()\n",
487 + "criterion_per = nn.L1Loss()\n",
488 + "optimizer_D = torch.optim.Adam(model_D.parameters(), lr=1e-4)\n",
489 + "optimizer_G = torch.optim.Adam(model_G.parameters(), lr=1e-4)"
490 + ]
491 + },
492 + {
493 + "cell_type": "code",
494 + "execution_count": 24,
495 + "metadata": {},
496 + "outputs": [],
497 + "source": [
498 + "torch.save({\n",
499 + " 'D': model_D.state_dict(),\n",
500 + " 'G': model_G.state_dict()\n",
501 + "}, 's.pth')"
502 + ]
503 + },
504 + {
505 + "cell_type": "code",
506 + "execution_count": null,
507 + "metadata": {},
508 + "outputs": [],
509 + "source": [
510 + "def count_params(model):\n",
511 + " return sum(p.numel() for p in model.parameters() if p.requires_grad)"
512 + ]
513 + },
514 + {
515 + "cell_type": "code",
516 + "execution_count": null,
517 + "metadata": {},
518 + "outputs": [],
519 + "source": [
520 + "print(count_params(model_G))\n",
521 + "print(count_params(model_D))\n",
522 + "print(count_params(model_P))"
523 + ]
524 + },
525 + {
526 + "cell_type": "code",
527 + "execution_count": 10,
528 + "metadata": {},
529 + "outputs": [],
530 + "source": [
531 + "def random_ff_mask(shape =256 , max_angle = 4, max_len = 40, max_width = 10, times = 15):\n",
532 +    "    \"\"\"Generate a random free-form mask by drawing random brush strokes.\n",
533 +    "    Args:\n",
534 +    "        shape: height/width of the square mask; max_angle, max_len, max_width:\n",
535 +    "        bounds on stroke angle, length and width; times: max number of strokes.\n",
536 +    "    Returns:\n",
537 +    "        np.ndarray of shape (1, shape, shape), 1.0 inside the strokes.\n",
538 + " \"\"\"\n",
539 + " height = shape\n",
540 + " width = shape\n",
541 + " mask = np.zeros((height, width), np.float32)\n",
542 + " times = np.random.randint(times)\n",
543 + " for i in range(times):\n",
544 + " start_x = np.random.randint(width)\n",
545 + " start_y = np.random.randint(height)\n",
546 + " for j in range(1 + np.random.randint(5)):\n",
547 + " angle = 0.01 + np.random.randint(max_angle)\n",
548 + " if i % 2 == 0:\n",
549 + " angle = 2 * 3.1415926 - angle\n",
550 + " length = 10 + np.random.randint(max_len)\n",
551 + " brush_w = 5 + np.random.randint(max_width)\n",
552 + " end_x = (start_x + length * np.sin(angle)).astype(np.int32)\n",
553 + " end_y = (start_y + length * np.cos(angle)).astype(np.int32)\n",
554 + " cv2.line(mask, (start_y, start_x), (end_y, end_x), 1.0, brush_w)\n",
555 + " start_x, start_y = end_x, end_y\n",
556 + " return mask.reshape((1, ) + mask.shape).astype(np.float32)"
557 + ]
558 + },
559 + {
560 + "cell_type": "code",
561 + "execution_count": 11,
562 + "metadata": {},
563 + "outputs": [],
564 + "source": [
565 + "img = cv2.imread('datasets/places365standard_easyformat/places365_standard/train/waterfall/00000003.jpg')\n",
566 + "img = cv2.cvtColor(img, cv2.COLOR_BGR2RGB)\n",
567 + "img = cv2.resize(img, (256, 256))\n",
568 + "img = torch.from_numpy(img.astype(np.float32) / 255.0).permute(2, 0, 1).contiguous()\n",
569 + "img_tensor = img.unsqueeze(0)\n",
570 + "mask = random_ff_mask()\n",
571 + "mask = torch.from_numpy(mask).contiguous().unsqueeze(0)"
572 + ]
573 + },
574 + {
575 + "cell_type": "code",
576 + "execution_count": null,
577 + "metadata": {},
578 + "outputs": [],
579 + "source": [
580 + "def visualize(img):\n",
581 + " np_img = img.squeeze(0).detach().cpu().numpy()\n",
582 + " return np_img.transpose(1, 2, 0)"
583 + ]
584 + },
585 + {
586 + "cell_type": "code",
587 + "execution_count": null,
588 + "metadata": {},
589 + "outputs": [],
590 + "source": [
591 + "plt.imshow(visualize(first_out_wholeimg))"
592 + ]
593 + },
594 + {
595 + "cell_type": "code",
596 + "execution_count": 12,
597 + "metadata": {},
598 + "outputs": [],
599 + "source": [
600 + "first_out, second_out = model_G(img_tensor, mask)\n",
601 + "\n",
602 + "first_out_wholeimg = img_tensor * (1 - mask) + first_out * mask \n",
603 + "second_out_wholeimg = img_tensor * (1 - mask) + second_out * mask"
604 + ]
605 + },
606 + {
607 + "cell_type": "code",
608 + "execution_count": 13,
609 + "metadata": {},
610 + "outputs": [],
611 + "source": [
612 + "# Train discriminator\n",
613 + "optimizer_D.zero_grad()\n",
614 + "\n",
615 + "fake_D = model_D(second_out_wholeimg.detach())\n",
616 + "real_D = model_D(img_tensor)\n",
617 + "\n",
618 + "loss_fake_D = criterion_adv(fake_D, target_is_real=False)\n",
619 + "loss_real_D = criterion_adv(real_D, target_is_real=True)\n",
620 + "\n",
621 + "loss_D = (loss_fake_D + loss_real_D) *0.5\n",
622 + "\n",
623 + "loss_D.backward()\n",
624 + "optimizer_D.step()"
625 + ]
626 + },
627 + {
628 + "cell_type": "code",
629 + "execution_count": 15,
630 + "metadata": {},
631 + "outputs": [],
632 + "source": [
633 + "# Train Generator\n",
634 + "\n",
635 + "optimizer_G.zero_grad()\n",
636 + "\n",
637 + "fake_D = model_D(second_out_wholeimg)\n",
638 + "G_loss = criterion_adv(fake_D, target_is_real=True)"
639 + ]
640 + },
641 + {
642 + "cell_type": "code",
643 + "execution_count": 16,
644 + "metadata": {},
645 + "outputs": [],
646 + "source": [
647 + "# Reconstruction loss\n",
648 + "\n",
649 + "loss_rec_1 = criterion_rec(first_out_wholeimg, img_tensor)\n",
650 + "loss_rec_2 = criterion_rec(second_out_wholeimg, img_tensor)"
651 + ]
652 + },
653 + {
654 + "cell_type": "code",
655 + "execution_count": 17,
656 + "metadata": {},
657 + "outputs": [],
658 + "source": [
659 + "# Perceptual loss\n",
660 + "\n",
661 + "img_featuremaps = model_P(img_tensor) # feature maps\n",
662 + "second_out_wholeimg_featuremaps = model_P(second_out_wholeimg)\n",
663 + "\n",
664 + "loss_P = criterion_per(second_out_wholeimg_featuremaps, img_featuremaps)"
665 + ]
666 + },
667 + {
668 + "cell_type": "code",
669 + "execution_count": 18,
670 + "metadata": {},
671 + "outputs": [
672 + {
673 + "ename": "NameError",
674 + "evalue": "name 'lambda_G' is not defined",
675 + "output_type": "error",
676 + "traceback": [
677 + "\u001b[1;31m---------------------------------------------------------------------------\u001b[0m",
678 + "\u001b[1;31mNameError\u001b[0m Traceback (most recent call last)",
679 + "\u001b[1;32m<ipython-input-18-dbfe5f51e2fc>\u001b[0m in \u001b[0;36m<module>\u001b[1;34m\u001b[0m\n\u001b[1;32m----> 1\u001b[1;33m \u001b[0mloss\u001b[0m \u001b[1;33m=\u001b[0m \u001b[0mlambda_G\u001b[0m \u001b[1;33m*\u001b[0m \u001b[0mG_loss\u001b[0m \u001b[1;33m+\u001b[0m \u001b[0mlambda_rec_1\u001b[0m \u001b[1;33m*\u001b[0m \u001b[0mloss_rec_1\u001b[0m \u001b[1;33m+\u001b[0m \u001b[0mlambda_rec_2\u001b[0m \u001b[1;33m*\u001b[0m \u001b[0mloss_rec_2\u001b[0m \u001b[1;33m+\u001b[0m \u001b[0mlambda_per\u001b[0m \u001b[1;33m*\u001b[0m \u001b[0mloss_P\u001b[0m\u001b[1;33m\u001b[0m\u001b[1;33m\u001b[0m\u001b[0m\n\u001b[0m\u001b[0;32m 2\u001b[0m \u001b[0mloss\u001b[0m\u001b[1;33m.\u001b[0m\u001b[0mbackward\u001b[0m\u001b[1;33m(\u001b[0m\u001b[1;33m)\u001b[0m\u001b[1;33m\u001b[0m\u001b[1;33m\u001b[0m\u001b[0m\n\u001b[0;32m 3\u001b[0m \u001b[0moptimizer_G\u001b[0m\u001b[1;33m.\u001b[0m\u001b[0mstep\u001b[0m\u001b[1;33m(\u001b[0m\u001b[1;33m)\u001b[0m\u001b[1;33m\u001b[0m\u001b[1;33m\u001b[0m\u001b[0m\n",
680 + "\u001b[1;31mNameError\u001b[0m: name 'lambda_G' is not defined"
681 + ]
682 + }
683 + ],
684 + "source": [
685 + "loss = lambda_G * G_loss + lambda_rec_1 * loss_rec_1 + lambda_rec_2 * loss_rec_2 + lambda_per * loss_P\n",
686 + "loss.backward()\n",
687 + "optimizer_G.step()"
688 + ]
689 + }
690 + ],
691 + "metadata": {
692 + "kernelspec": {
693 + "display_name": "Python 3",
694 + "language": "python",
695 + "name": "python3"
696 + },
697 + "language_info": {
698 + "codemirror_mode": {
699 + "name": "ipython",
700 + "version": 3
701 + },
702 + "file_extension": ".py",
703 + "mimetype": "text/x-python",
704 + "name": "python",
705 + "nbconvert_exporter": "python",
706 + "pygments_lexer": "ipython3",
707 + "version": "3.7.6"
708 + }
709 + },
710 + "nbformat": 4,
711 + "nbformat_minor": 4
712 +}
1 +from .config import Config
...\ No newline at end of file ...\ No newline at end of file
1 +import yaml
2 +
3 +class Config():
4 + def __init__(self, yaml_path):
5 + yaml_file = open(yaml_path)
6 + self._attr = yaml.load(yaml_file, Loader=yaml.FullLoader)['settings']
7 +
8 + def __getattr__(self, attr):
9 + try:
10 + return self._attr[attr]
11 + except KeyError:
12 + return None
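13 +
14 +# Usage sketch (assumption; the yaml filename is illustrative):
15 +#   cfg = Config('./configs/facemask.yaml')
16 +#   cfg.batch_size   -> value read from the 'settings' block
17 +#   cfg.missing_key  -> None (unknown keys fall back to None via __getattr__)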
1 +settings:
2 + root_dir: "./datasets/celeba/images/"
3 + checkpoint_path: "weights"
4 + sample_folder: "sample"
5 +
6 + cuda: True
7 + lr: 0.001
8 + batch_size: 2
9 + num_workers: 4
10 +
11 + step_iters: [10000, 15000, 20000]
12 + gamma: 0.1
13 +
14 + d_num_layers: 3
15 +
16 + visualize_per_iter: 500
17 + save_per_iter: 500
18 + print_per_iter: 10
19 + num_epochs: 100
20 +
21 + lambda_G: 1.0
22 + lambda_rec_1: 100.0
23 + lambda_rec_2: 100.0
24 + lambda_per: 10.0
25 +
26 + img_size: 512
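27 +
28 +  # lambda_G, lambda_rec_1, lambda_rec_2 and lambda_per weight the adversarial, coarse
29 +  # reconstruction, refined reconstruction and perceptual terms of the generator loss:
30 +  # loss = lambda_G * G_loss + lambda_rec_1 * loss_rec_1 + lambda_rec_2 * loss_rec_2 + lambda_per * loss_P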
1 +settings:
2 + root_dir: "./datasets/places365_10classes"
3 + checkpoint_path: "/content/drive/MyDrive/weights/Places365 Inpainting/phase 3"
4 + sample_folder: "/content/drive/MyDrive/results/Places365 Inpainting/phase 3"
5 +
6 + cuda: True
7 + lr: 0.0001
8 + batch_size: 8
9 + num_workers: 4
10 +
11 + step_iters: [50000, 75000, 100000]
12 + gamma: 0.1
13 +
14 + d_num_layers: 3
15 +
16 + visualize_per_iter: 500
17 + save_per_iter: 500
18 + print_per_iter: 10
19 + num_epochs: 100
20 +
21 + lambda_G: 0.3
22 + lambda_rec_1: 10.0
23 + lambda_rec_2: 10.0
24 + lambda_per: 1.0
25 +
26 + img_size: 256
27 + max_angle: 4
28 + max_len: 50
29 + max_width: 30
30 + times: 15
1 +settings:
2 + root_dir: "./datasets/celeba/images/"
3 + train_anns: "./datasets/celeba/annotations/train.csv"
4 + val_anns: "./datasets/celeba/annotations/val.csv"
5 +
6 + checkpoint_path: "weights" #"/content/drive/MyDrive/weights/Places365 Inpainting/unet/phase 1"
7 + sample_folder: "sample" #"/content/drive/MyDrive/results/Places365 Inpainting/unet/phase 1"
8 +
9 + cuda: True
10 + lr: 0.001
11 + batch_size: 4
12 + num_workers: 4
13 +
14 + step_iters: [50000, 75000, 100000]
15 + gamma: 0.1
16 +
17 + visualize_per_iter: 1000
18 + save_per_iter: 1000
19 + print_per_iter: 10
20 + num_epochs: 100
21 +
22 + img_size: 512
1 +from .dataset import Places365Dataset, FacemaskDataset
2 +from .dataset_seg import FacemaskSegDataset
This diff could not be displayed because it is too large.
This diff could not be displayed because it is too large.
1 +import os
2 +import csv
3 +
4 +# List the image folders once instead of calling os.listdir on every loop iteration.
5 +masked_files = os.listdir("./datasets/celeba/images/celeba512_30k_masked")
6 +binary_files = os.listdir("./datasets/celeba/images/celeba512_30k_binary")
7 +
8 +# The first 23304 masked/binary pairs form the training annotations.
9 +f = open("./datasets/celeba/annotations/train.csv", "w", newline="")
10 +wr = csv.writer(f)
11 +wr.writerow(["_", "img_name", "mask_name"])
12 +
13 +for i in range(23304):
14 +    wr.writerow(
15 +        [
16 +            i,
17 +            "celeba512_30k_masked/" + masked_files[i],
18 +            "celeba512_30k_binary/" + binary_files[i],
19 +        ]
20 +    )
21 +
22 +f.close()
23 +
24 +# The remaining pairs (indices 23304-29130) form the validation annotations.
25 +f = open("./datasets/celeba/annotations/val.csv", "w", newline="")
26 +wr = csv.writer(f)
27 +wr.writerow(["_", "img_name", "mask_name"])
28 +
29 +for i in range(23304, 29131):
30 +    wr.writerow(
31 +        [
32 +            i,
33 +            "celeba512_30k_masked/" + masked_files[i],
34 +            "celeba512_30k_binary/" + binary_files[i],
35 +        ]
36 +    )
37 +
38 +f.close()
1 +import os
2 +import torch
3 +import torch.nn as nn
4 +import torch.utils.data as data
5 +import cv2
6 +import numpy as np
7 +from tqdm import tqdm
8 +
9 +class Places365Dataset(data.Dataset):
10 + def __init__(self, cfg):
11 + self.root_dir = cfg.root_dir
12 + self.cfg = cfg
13 + self.load_images()
14 +
15 + def load_images(self):
16 + self.fns =[]
17 + idx = 0
18 + img_paths = os.listdir(self.root_dir)
19 + for cls_id in img_paths:
20 + paths = os.path.join(self.root_dir, cls_id)
21 + file_paths = os.listdir(paths)
22 + for img_name in file_paths:
23 + filename = os.path.join(paths, img_name)
24 + self.fns.append(filename)
25 +
26 + def __getitem__(self, index):
27 + img_path = self.fns[index]
28 + img = cv2.imread(img_path)
29 + img = cv2.cvtColor(img, cv2.COLOR_BGR2RGB)
30 + img = cv2.resize(img, (self.cfg.img_size, self.cfg.img_size))
31 +
32 + mask = self.random_ff_mask(
33 + shape = self.cfg.img_size,
34 + max_angle = self.cfg.max_angle,
35 + max_len = self.cfg.max_len,
36 + max_width = self.cfg.max_width,
37 + times = self.cfg.times)
38 +
39 + img = torch.from_numpy(img.astype(np.float32) / 255.0).permute(2, 0, 1).contiguous()
40 + mask = torch.from_numpy(mask.astype(np.float32)).contiguous()
41 +
42 + return img, mask
43 +
44 + def collate_fn(self, batch):
45 + imgs = torch.stack([i[0] for i in batch])
46 + masks = torch.stack([i[1] for i in batch])
47 + return {
48 + 'imgs': imgs,
49 + 'masks': masks
50 + }
51 +
52 + def __len__(self):
53 + return len(self.fns)
54 +
55 + def random_ff_mask(self, shape = 256 , max_angle = 4, max_len = 50, max_width = 20, times = 15):
56 +        """Generate a random free-form mask by drawing random brush strokes.
57 +        Args:
58 +            shape: height/width of the square mask.
59 +            max_angle, max_len, max_width, times: bounds on stroke angle, length, width and count.
60 +        Returns:
61 +            np.ndarray of shape (1, shape, shape) with 1.0 inside the strokes.
62 +        """
63 + height = shape
64 + width = shape
65 + mask = np.zeros((height, width), np.float32)
66 + times = np.random.randint(10, times)
67 + for i in range(times):
68 + start_x = np.random.randint(width)
69 + start_y = np.random.randint(height)
70 + for j in range(1 + np.random.randint(5)):
71 + angle = 0.01 + np.random.randint(max_angle)
72 + if i % 2 == 0:
73 + angle = 2 * 3.1415926 - angle
74 + length = 10 + np.random.randint(max_len)
75 + brush_w = 5 + np.random.randint(max_width)
76 + end_x = (start_x + length * np.sin(angle)).astype(np.int32)
77 + end_y = (start_y + length * np.cos(angle)).astype(np.int32)
78 + cv2.line(mask, (start_y, start_x), (end_y, end_x), 1.0, brush_w)
79 + start_x, start_y = end_x, end_y
80 + return mask.reshape((1, ) + mask.shape).astype(np.float32)
81 +
82 +
83 +class FacemaskDataset(data.Dataset):
84 + def __init__(self, cfg):
85 + self.root_dir = cfg.root_dir
86 + self.cfg = cfg
87 +
88 + self.mask_folder = os.path.join(self.root_dir, 'celeba512_30k_binary')
89 + self.img_folder = os.path.join(self.root_dir, 'celeba512_30k')
90 + self.load_images()
91 +
92 + def load_images(self):
93 + self.fns = []
94 + idx = 0
95 + img_paths = sorted(os.listdir(self.img_folder))
96 + for img_name in img_paths:
97 + mask_name = img_name.split('.')[0]+'_binary.jpg'
98 + img_path = os.path.join(self.img_folder, img_name)
99 + mask_path = os.path.join(self.mask_folder, mask_name)
100 + if os.path.isfile(mask_path):
101 + self.fns.append([img_path, mask_path])
102 +
103 + def __getitem__(self, index):
104 + img_path, mask_path = self.fns[index]
105 + img = cv2.imread(img_path)
106 + img = cv2.cvtColor(img, cv2.COLOR_BGR2RGB)
107 + img = cv2.resize(img, (self.cfg.img_size, self.cfg.img_size))
108 +
109 +
110 + mask = cv2.imread(mask_path, 0)
111 +
112 + mask[mask>0]=1.0
113 + mask = np.expand_dims(mask, axis=0)
114 +
115 + img = torch.from_numpy(img.astype(np.float32) / 255.0).permute(2, 0, 1).contiguous()
116 + mask = torch.from_numpy(mask.astype(np.float32)).contiguous()
117 + return img, mask
118 +
119 + def collate_fn(self, batch):
120 + imgs = torch.stack([i[0] for i in batch])
121 + masks = torch.stack([i[1] for i in batch])
122 + return {
123 + 'imgs': imgs,
124 + 'masks': masks
125 + }
126 +
127 + def __len__(self):
128 + return len(self.fns)
...\ No newline at end of file ...\ No newline at end of file
1 +import os
2 +import torch
3 +import torch.nn as nn
4 +import torch.utils.data as data
5 +import cv2
6 +import numpy as np
7 +from tqdm import tqdm
8 +import pandas as pd
9 +from PIL import Image
10 +
11 +
12 +class FacemaskSegDataset(data.Dataset):
13 + def __init__(self, cfg, train=True):
14 + self.root_dir = cfg.root_dir
15 + self.cfg = cfg
16 + self.train = train
17 +
18 + if self.train:
19 + self.df = pd.read_csv(cfg.train_anns)
20 + else:
21 + self.df = pd.read_csv(cfg.val_anns)
22 +
23 + self.load_images()
24 +
25 + def load_images(self):
26 + self.fns = []
27 + for idx, rows in self.df.iterrows():
28 + _, img_name, mask_name = rows
29 + img_path = os.path.join(self.root_dir, img_name)
30 + mask_path = os.path.join(self.root_dir, mask_name)
31 + img_path = img_path.replace("\\", "/")
32 + mask_path = mask_path.replace("\\", "/")
33 + if os.path.isfile(mask_path):
34 + self.fns.append([img_path, mask_path])
35 +
36 + def __getitem__(self, index):
37 + img_path, mask_path = self.fns[index]
38 + img = cv2.imread(img_path)
39 + img = cv2.cvtColor(img, cv2.COLOR_BGR2RGB)
40 + img = cv2.resize(img, (self.cfg.img_size, self.cfg.img_size))
41 + mask = cv2.imread(mask_path, 0)
42 + mask[mask > 0] = 1.0
43 + mask = np.expand_dims(mask, axis=0)
44 +
45 + img = (
46 + torch.from_numpy(img.astype(np.float32) / 255.0)
47 + .permute(2, 0, 1)
48 + .contiguous()
49 + )
50 + mask = torch.from_numpy(mask.astype(np.float32)).contiguous()
51 + return img, mask
52 +
53 + def collate_fn(self, batch):
54 + imgs = torch.stack([i[0] for i in batch])
55 + masks = torch.stack([i[1] for i in batch])
56 + return {"imgs": imgs, "masks": masks}
57 +
58 + def __len__(self):
59 + return len(self.fns)
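60 +
61 +# Usage sketch (assumption, mirroring the prototyping notebook): wrap the dataset in a DataLoader
62 +# with its own collate_fn so that batches come out as {'imgs': ..., 'masks': ...}:
63 +#   dataset = FacemaskSegDataset(cfg, train=True)
64 +#   loader = data.DataLoader(dataset, batch_size=cfg.batch_size, collate_fn=dataset.collate_fn)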
1 +import torch
2 +import torch.nn as nn
3 +from torchvision.utils import save_image
4 +
5 +import numpy as np
6 +from PIL import Image
7 +import cv2
8 +from models import UNetSemantic, GatedGenerator
9 +import argparse
10 +from configs import Config
11 +
12 +class Predictor():
13 + def __init__(self, cfg):
14 + self.cfg = cfg
15 + self.device = torch.device('cuda:0' if cfg.cuda else 'cpu')
16 + self.masking = UNetSemantic().to(self.device)
17 +        self.masking.load_state_dict(torch.load('weights/model_segm_19_135000.pth', map_location='cpu'))
18 + #self.masking.eval()
19 +
20 + self.inpaint = GatedGenerator().to(self.device)
21 + self.inpaint.load_state_dict(torch.load('weights/model_6_100000.pth', map_location='cpu')['G'])
22 + self.inpaint.eval()
23 +
24 + def save_image(self, img_list, save_img_path, nrow):
25 + img_list = [i.clone().cpu() for i in img_list]
26 + imgs = torch.stack(img_list, dim=1)
27 + imgs = imgs.view(-1, *list(imgs.size())[2:])
28 + save_image(imgs, save_img_path, nrow = nrow)
29 + print(f"Save image to {save_img_path}")
30 +
31 + def predict(self, image, outpath='sample/results.png'):
32 + outpath=f'sample/results_{image}.png'
33 + image = 'sample/'+image
34 + img = cv2.imread(image+'_masked.jpg')
35 + img = cv2.cvtColor(img, cv2.COLOR_BGR2RGB)
36 + img = cv2.resize(img, (self.cfg.img_size, self.cfg.img_size))
37 + img = torch.from_numpy(img.astype(np.float32) / 255.0).permute(2, 0, 1).contiguous()
38 + img = img.unsqueeze(0).to(self.device)
39 +
40 + img_ori = cv2.imread(image+'.jpg')
41 + img_ori = cv2.cvtColor(img_ori, cv2.COLOR_BGR2RGB)
42 + img_ori = cv2.resize(img_ori, (self.cfg.img_size, self.cfg.img_size))
43 + img_ori = torch.from_numpy(img_ori.astype(np.float32) / 255.0).permute(2, 0, 1).contiguous()
44 + img_ori = img_ori.unsqueeze(0)
45 + with torch.no_grad():
46 + outputs = self.masking(img)
47 + _, out = self.inpaint(img, outputs)
48 + inpaint = img * (1 - outputs) + out * outputs
49 + masks = img * (1 - outputs) + outputs #torch.cat([outputs, outputs, outputs], dim=1)
50 +
51 +
52 +
53 + self.save_image([img, masks, inpaint, img_ori], outpath, nrow=4)
54 +
55 +
56 +
57 +
58 +if __name__ == '__main__':
59 +    parser = argparse.ArgumentParser(description='Inpaint the masked region of a face image')
60 +    parser.add_argument('--image', default=None, type=str, help='image name (without extension) inside the sample folder')
61 +    parser.add_argument('config', default='config', type=str, help='config file name (without .yaml) inside the configs folder')
62 + args = parser.parse_args()
63 +
64 + config = Config(f'./configs/{args.config}.yaml')
65 +
66 +
67 + model = Predictor(config)
68 + model.predict(args.image)
...\ No newline at end of file ...\ No newline at end of file
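69 +
70 +# Example invocation (assumption; the script and config names are illustrative):
71 +#   python predict.py facemask --image case1
72 +# expects sample/case1_masked.jpg and sample/case1.jpg, and writes sample/results_case1.png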
1 +from .loggers import *
...\ No newline at end of file ...\ No newline at end of file
1 +import os
2 +import numpy as np
3 +from torch.utils.tensorboard import SummaryWriter
4 +from datetime import datetime
5 +
6 +class Logger():
7 + """
8 + Logger for Tensorboard visualization
9 +    :param log_dir: directory where the Tensorboard event files are written
10 + """
11 + def __init__(self, log_dir=None):
12 + self.log_dir = log_dir
13 + if self.log_dir is None:
14 + self.log_dir = os.path.join('loggers/runs',datetime.now().strftime('%Y-%m-%d_%H-%M-%S'))
15 + if not os.path.exists(self.log_dir):
16 +            os.makedirs(self.log_dir)
17 + self.writer = SummaryWriter(log_dir=self.log_dir)
18 + self.iters = {}
19 +
20 + def write(self, tags, values):
21 + """
22 + Write a log to specified directory
23 + :param tags: (str) tag for log
24 + :param values: (number) value for corresponding tag
25 + """
26 +        if not isinstance(tags, list):
27 +            tags = [tags]
28 +        if not isinstance(values, list):
29 +            values = [values]
30 +
31 + for i, (tag, value) in enumerate(zip(tags,values)):
32 + if tag not in self.iters.keys():
33 + self.iters[tag] = 0
34 + self.writer.add_scalar(tag, value, self.iters[tag])
35 + self.iters[tag] += 1
36 +
37 +
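38 +# Usage sketch (assumption): tags and values are paired positionally, e.g.
39 +#   logger = Logger()
40 +#   logger.write(['Train/loss_D', 'Train/loss_G'], [loss_D.item(), loss_G.item()])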
1 +from .adversarial import GANLoss
2 +from .ssim import SSIM
3 +from .dice import DiceLoss
...\ No newline at end of file ...\ No newline at end of file
1 +import torch
2 +import torch.nn as nn
3 +
4 +class GANLoss(nn.Module):
5 + def __init__(self, target_real_label=1.0, target_fake_label=0.0):
6 + super(GANLoss, self).__init__()
7 + self.register_buffer('real_label', torch.tensor(target_real_label))
8 + self.register_buffer('fake_label', torch.tensor(target_fake_label))
9 + self.loss = nn.MSELoss()
10 +
11 + def get_target_tensor(self, input, target_is_real):
12 + if target_is_real:
13 + target_tensor = self.real_label
14 + else:
15 + target_tensor = self.fake_label
16 + return target_tensor.expand_as(input)
17 +
18 + def __call__(self, input, target_is_real):
19 + target_tensor = self.get_target_tensor(input, target_is_real).to(input.device)
20 + return self.loss(input, target_tensor)
...\ No newline at end of file ...\ No newline at end of file
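21 +
22 +# Note: unlike the BCE-based GANLoss prototyped in the notebook, this version uses nn.MSELoss
23 +# (an LSGAN-style objective), so it can be applied to discriminator outputs without a final sigmoid.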
1 +import torch
2 +import torch.nn as nn
3 +
4 +
5 +class DiceLoss(nn.Module):
6 + """
7 + Dice loss of binary class
8 + Args:
9 + smooth: A float number to smooth loss, and avoid NaN error, default: 1
10 + p: Denominator value: \sum{x^p} + \sum{y^p}, default: 2
11 + predict: A tensor of shape [N, *]
12 + target: A tensor of shape same with predict
13 + reduction: Reduction method to apply, return mean over batch if 'mean',
14 + return sum if 'sum', return a tensor of shape [N,] if 'none'
15 + Returns:
16 + Loss tensor according to arg reduction
17 + Raise:
18 + Exception if unexpected reduction
19 + """
20 + def __init__(self, smooth=1, p=2, reduction='mean'):
21 + super(DiceLoss, self).__init__()
22 + self.smooth = smooth
23 + self.p = p
24 + self.reduction = reduction
25 +
26 + def forward(self, predict, target):
27 + assert predict.shape[0] == target.shape[0], "predict & target batch size don't match"
28 + predict = predict.contiguous().view(predict.shape[0], -1)
29 + target = target.contiguous().view(target.shape[0], -1)
30 +
31 + num = torch.sum(torch.mul(predict, target), dim=1) + self.smooth
32 + den = torch.sum(predict.pow(self.p) + target.pow(self.p), dim=1) + self.smooth
33 +
34 + loss = 1 - num / den
35 +
36 + if self.reduction == 'mean':
37 + return loss.mean()
38 + elif self.reduction == 'sum':
39 + return loss.sum()
40 + elif self.reduction == 'none':
41 + return loss
42 + else:
43 + raise Exception('Unexpected reduction {}'.format(self.reduction))
1 +#Source: https://github.com/Po-Hsun-Su/pytorch-ssim.git
2 +
3 +import torch
4 +import torch.nn.functional as F
5 +from torch.autograd import Variable
6 +import numpy as np
7 +from math import exp
8 +
9 +def gaussian(window_size, sigma):
10 + gauss = torch.Tensor([exp(-(x - window_size//2)**2/float(2*sigma**2)) for x in range(window_size)])
11 + return gauss/gauss.sum()
12 +
13 +def create_window(window_size, channel):
14 + _1D_window = gaussian(window_size, 1.5).unsqueeze(1)
15 + _2D_window = _1D_window.mm(_1D_window.t()).float().unsqueeze(0).unsqueeze(0)
16 + window = Variable(_2D_window.expand(channel, 1, window_size, window_size).contiguous())
17 + return window
18 +
19 +def _ssim(img1, img2, window, window_size, channel, size_average = True):
20 + mu1 = F.conv2d(img1, window, padding = window_size//2, groups = channel)
21 + mu2 = F.conv2d(img2, window, padding = window_size//2, groups = channel)
22 +
23 + mu1_sq = mu1.pow(2)
24 + mu2_sq = mu2.pow(2)
25 + mu1_mu2 = mu1*mu2
26 +
27 + sigma1_sq = F.conv2d(img1*img1, window, padding = window_size//2, groups = channel) - mu1_sq
28 + sigma2_sq = F.conv2d(img2*img2, window, padding = window_size//2, groups = channel) - mu2_sq
29 + sigma12 = F.conv2d(img1*img2, window, padding = window_size//2, groups = channel) - mu1_mu2
30 +
31 + C1 = 0.01**2
32 + C2 = 0.03**2
33 +
34 + ssim_map = ((2*mu1_mu2 + C1)*(2*sigma12 + C2))/((mu1_sq + mu2_sq + C1)*(sigma1_sq + sigma2_sq + C2))
35 +
36 + if size_average:
37 + return ssim_map.mean()
38 + else:
39 + return ssim_map.mean(1).mean(1).mean(1)
40 +
41 +class SSIM(torch.nn.Module):
42 + def __init__(self, window_size = 11, size_average = True):
43 + super(SSIM, self).__init__()
44 + self.window_size = window_size
45 + self.size_average = size_average
46 + self.channel = 1
47 + self.window = create_window(window_size, self.channel)
48 +
49 + def forward(self, img1, img2):
50 + (_, channel, _, _) = img1.size()
51 +
52 + if channel == self.channel and self.window.data.type() == img1.data.type():
53 + window = self.window
54 + else:
55 + window = create_window(self.window_size, channel)
56 +
57 + if img1.is_cuda:
58 + window = window.cuda(img1.get_device())
59 + window = window.type_as(img1)
60 +
61 + self.window = window
62 + self.channel = channel
63 +
64 +
65 + return _ssim(img1, img2, window, self.window_size, channel, self.size_average)
66 +
67 +def ssim(img1, img2, window_size = 11, size_average = True):
68 + (_, channel, _, _) = img1.size()
69 + window = create_window(window_size, channel)
70 +
71 + if img1.is_cuda:
72 + window = window.cuda(img1.get_device())
73 + window = window.type_as(img1)
74 +
75 + return _ssim(img1, img2, window, window_size, channel, size_average)
...\ No newline at end of file ...\ No newline at end of file
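76 +
77 +# Usage sketch (assumption): SSIM is a similarity score (higher is better) over image batches:
78 +#   criterion = SSIM(window_size=11)
79 +#   score = criterion(pred_imgs, target_imgs)   # both of shape [B, C, H, W]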
1 +from .dicecoeff import DiceScore
2 +from .pixelacc import PixelAccuracy
...\ No newline at end of file ...\ No newline at end of file
1 +import torch
2 +import torch.nn as nn
3 +import numpy as np
4 +
5 +class DiceScore():
6 + def __init__(self, num_classes, ignore_index = None, eps=1e-6, thresh = 0.5):
7 + self.thresh = thresh
8 + self.num_classes = num_classes
9 + self.pred_type = "multi" if num_classes > 1 else "binary"
10 +
11 + if num_classes == 1:
12 + self.num_classes+=1
13 +
14 + self.ignore_index = ignore_index
15 + self.eps = eps
16 +
17 + self.scores_list = np.zeros(self.num_classes)
18 + self.reset()
19 +
20 + def compute(self, outputs, targets):
21 + # outputs: (batch, num_classes, W, H)
22 + # targets: (batch, num_classes, W, H)
23 +
24 + batch_size, _ , w, h = outputs.shape
25 + if len(targets.shape) == 3:
26 + targets = targets.unsqueeze(1)
27 +
28 + one_hot_targets = torch.zeros(batch_size, self.num_classes, h, w)
29 + one_hot_predicts = torch.zeros(batch_size, self.num_classes, h, w)
30 +
31 + if self.pred_type == 'binary':
32 + predicts = (outputs > self.thresh).float()
33 + elif self.pred_type =='multi':
34 + predicts = torch.argmax(outputs, dim=1).unsqueeze(1)
35 +
36 + one_hot_targets.scatter_(1, targets.long(), 1)
37 + one_hot_predicts.scatter_(1, predicts.long(), 1)
38 +
39 + for cl in range(self.num_classes):
40 + cl_pred = one_hot_predicts[:,cl,:,:]
41 + cl_target = one_hot_targets[:,cl,:,:]
42 + score = self.binary_compute(cl_pred, cl_target)
43 + self.scores_list[cl] += sum(score)
44 +
45 +
46 + def binary_compute(self, predict, target):
47 + # outputs: (batch, 1, W, H)
48 + # targets: (batch, 1, W, H)
49 +
50 + intersect = (predict * target).sum((-2,-1))
51 + union = (predict + target).sum((-2,-1))
52 + return (2. * intersect + self.eps) / (union +self.eps)
53 +
54 + def reset(self):
55 + self.scores_list = np.zeros(self.num_classes)
56 + self.sample_size = 0
57 +
58 + def update(self, outputs, targets):
59 + self.sample_size += outputs.shape[0]
60 + self.compute(outputs, targets)
61 +
62 + def value(self):
63 + scores_each_class = self.scores_list / self.sample_size #mean over number of samples
64 + if self.pred_type == 'binary':
65 + scores = scores_each_class[1] # ignore background which is label 0
66 + else:
67 + scores = sum(scores_each_class) / self.num_classes
68 + return np.round(scores, decimals=4)
69 +
70 + def summary(self):
71 + class_iou = self.scores_list / self.sample_size #mean
72 +
73 + print(f'{self.value()}')
74 + for i, x in enumerate(class_iou):
75 + print(f'\tClass {i}: {x:.4f}')
76 +
77 + def __str__(self):
78 + return f'Dice Score: {self.value()}'
79 +
80 + def __len__(self):
81 +        return self.sample_size
82 +
83 +
...\ No newline at end of file ...\ No newline at end of file
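84 +
85 +# Usage sketch (assumption): accumulate over validation batches, then read the mean score:
86 +#   metric = DiceScore(num_classes=1, thresh=0.5)
87 +#   metric.update(outputs, masks)   # repeat per batch
88 +#   print(metric.value())           # mean Dice over all seen samples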
1 +import torch
2 +import torch.nn as nn
3 +import numpy as np
4 +
5 +class PixelAccuracy():
6 + def __init__(self, num_classes, ignore_index=None, eps=1e-6, thresh = 0.5):
7 + self.thresh = thresh
8 + self.num_classes = num_classes
9 + self.pred_type = "multi" if num_classes > 1 else "binary"
10 +
11 + if num_classes == 1:
12 + self.num_classes+=1
13 +
14 + self.ignore_index = ignore_index
15 + self.eps = eps
16 +
17 + self.scores_list = np.zeros(self.num_classes)
18 + self.reset()
19 +
20 + def compute(self, outputs, targets):
21 + # outputs: (batch, num_classes, W, H)
22 + # targets: (batch, num_classes, W, H)
23 +
24 + batch_size, _ , w, h = outputs.shape
25 + if len(targets.shape) == 3:
26 + targets = targets.unsqueeze(1)
27 +
28 + one_hot_targets = torch.zeros(batch_size, self.num_classes, h, w)
29 + one_hot_predicts = torch.zeros(batch_size, self.num_classes, h, w)
30 +
31 + if self.pred_type == 'binary':
32 + predicts = (outputs > self.thresh).float()
33 + elif self.pred_type =='multi':
34 + predicts = torch.argmax(outputs, dim=1).unsqueeze(1)
35 +
36 + one_hot_targets.scatter_(1, targets.long(), 1)
37 + one_hot_predicts.scatter_(1, predicts.long(), 1)
38 +
39 + for cl in range(self.num_classes):
40 + cl_pred = one_hot_predicts[:,cl,:,:]
41 + cl_target = one_hot_targets[:,cl,:,:]
42 + score = self.binary_compute(cl_pred, cl_target)
43 + self.scores_list[cl] += sum(score)
44 +
45 + def binary_compute(self, predict, target):
46 + # predict: (batch, 1, W, H)
47 + # targets: (batch, 1, W, H)
48 +
49 + correct = (predict == target).sum((-2,-1))
50 + total = target.shape[-1] * target.shape[-2]
51 + return (correct + self.eps) *1.0 / (total +self.eps)
52 +
53 + def reset(self):
54 + self.scores_list = np.zeros(self.num_classes)
55 + self.sample_size = 0
56 +
57 + def update(self, outputs, targets):
58 + self.sample_size += outputs.shape[0]
59 + self.compute(outputs, targets)
60 +
61 + def value(self):
62 + scores_each_class = self.scores_list / self.sample_size #mean over number of samples
63 + if self.pred_type == 'binary':
64 + scores = scores_each_class[1] # ignore background which is label 0
65 + else:
66 + scores = sum(scores_each_class) / self.num_classes
67 + return np.round(scores, decimals=4)
68 +
69 + def summary(self):
70 + class_iou = self.scores_list / self.sample_size #mean
71 +
72 + print(f'{self.value()}')
73 + for i, x in enumerate(class_iou):
74 + print(f'\tClass {i}: {x:.4f}')
75 +
76 + def __str__(self):
77 + return f'Pixel Accuracy: {self.value()}'
78 +
79 + def __len__(self):
80 +        return self.sample_size
...\ No newline at end of file ...\ No newline at end of file
1 +from .networks import GatedGenerator, NLayerDiscriminator, PerceptualNet
2 +from .unet import UNetSemantic
1 +import torch
2 +import torch.nn as nn
3 +from torch.nn import Parameter
4 +import torch.nn.functional as F
5 +import torch.utils.data as data
6 +import functools
7 +from torchvision.models import vgg19, vgg16
8 +
9 +class GatedConv2d(nn.Module):
10 + def __init__(self, in_channels, out_channels, kernel_size, stride = 1, padding = 0, dilation = 1, activation = 'lrelu', norm = 'in'):
11 + super(GatedConv2d, self).__init__()
12 + self.pad = nn.ZeroPad2d(padding)
13 + if norm is not None:
14 + self.norm = nn.InstanceNorm2d(out_channels)
15 + else:
16 + self.norm = None
17 +
18 + if activation == 'tanh':
19 + self.activation = nn.Tanh()
20 + else:
21 + self.activation = nn.LeakyReLU(0.2, inplace = True)
22 +
23 +
24 + self.conv2d = nn.Conv2d(in_channels, out_channels, kernel_size, stride, padding = 0, dilation = dilation)
25 + self.mask_conv2d = nn.Conv2d(in_channels, out_channels, kernel_size, stride, padding = 0, dilation = dilation)
26 + self.sigmoid = torch.nn.Sigmoid()
27 +
28 + def forward(self, x):
29 + x = self.pad(x)
30 + conv = self.conv2d(x)
31 + mask = self.mask_conv2d(x)
32 + gated_mask = self.sigmoid(mask)
33 + x = conv * gated_mask
34 + if self.norm:
35 + x = self.norm(x)
36 + if self.activation:
37 + x = self.activation(x)
38 + return x
39 +
40 +class TransposeGatedConv2d(nn.Module):
41 + def __init__(self, in_channels, out_channels, kernel_size, stride = 1, padding = 0, dilation = 1, norm=None, scale_factor = 2):
42 + super(TransposeGatedConv2d, self).__init__()
43 + # Initialize the conv scheme
44 + self.scale_factor = scale_factor
45 + self.gated_conv2d = GatedConv2d(in_channels, out_channels, kernel_size, stride, padding, dilation, norm=norm)
46 +
47 + def forward(self, x):
48 + x = F.interpolate(x, scale_factor = self.scale_factor, mode = 'nearest')
49 + x = self.gated_conv2d(x)
50 + return x
51 +
52 +
53 +class GatedGenerator(nn.Module):
54 + def __init__(self, in_channels=4, latent_channels=64, out_channels=3):
55 + super(GatedGenerator, self).__init__()
56 + self.coarse = nn.Sequential(
57 + # encoder
58 + GatedConv2d(in_channels, latent_channels, 7, 1, 3, norm = None),
59 + GatedConv2d(latent_channels, latent_channels * 2, 4, 2, 1),
60 + GatedConv2d(latent_channels * 2, latent_channels * 4, 3, 1, 1),
61 + GatedConv2d(latent_channels * 4, latent_channels * 4, 4, 2, 1),
62 + # Bottleneck
63 + GatedConv2d(latent_channels * 4, latent_channels * 4, 3, 1, 1),
64 + GatedConv2d(latent_channels * 4, latent_channels * 4, 3, 1, 1),
65 + GatedConv2d(latent_channels * 4, latent_channels * 4, 3, 1, 2, dilation = 2),
66 + GatedConv2d(latent_channels * 4, latent_channels * 4, 3, 1, 4, dilation = 4),
67 + GatedConv2d(latent_channels * 4, latent_channels * 4, 3, 1, 8, dilation = 8),
68 + GatedConv2d(latent_channels * 4, latent_channels * 4, 3, 1, 16, dilation = 16),
69 + GatedConv2d(latent_channels * 4, latent_channels * 4, 3, 1, 1),
70 + GatedConv2d(latent_channels * 4, latent_channels * 4, 3, 1, 1),
71 + # decoder
72 + TransposeGatedConv2d(latent_channels * 4, latent_channels * 2, 3, 1, 1),
73 + GatedConv2d(latent_channels * 2, latent_channels * 2, 3, 1, 1),
74 + TransposeGatedConv2d(latent_channels * 2, latent_channels, 3, 1, 1),
75 + GatedConv2d(latent_channels, out_channels, 7, 1, 3, activation = 'tanh', norm = None)
76 + )
77 + self.refinement = nn.Sequential(
78 + # encoder
79 + GatedConv2d(in_channels, latent_channels, 7, 1, 3, norm = None),
80 + GatedConv2d(latent_channels, latent_channels * 2, 4, 2, 1),
81 + GatedConv2d(latent_channels * 2, latent_channels * 4, 3, 1, 1),
82 + GatedConv2d(latent_channels * 4, latent_channels * 4, 4, 2, 1),
83 + # Bottleneck
84 + GatedConv2d(latent_channels * 4, latent_channels * 4, 3, 1, 1),
85 + GatedConv2d(latent_channels * 4, latent_channels * 4, 3, 1, 1),
86 + GatedConv2d(latent_channels * 4, latent_channels * 4, 3, 1, 2, dilation = 2),
87 + GatedConv2d(latent_channels * 4, latent_channels * 4, 3, 1, 4, dilation = 4),
88 + GatedConv2d(latent_channels * 4, latent_channels * 4, 3, 1, 8, dilation = 8),
89 + GatedConv2d(latent_channels * 4, latent_channels * 4, 3, 1, 16, dilation = 16),
90 + GatedConv2d(latent_channels * 4, latent_channels * 4, 3, 1, 1),
91 + GatedConv2d(latent_channels * 4, latent_channels * 4, 3, 1, 1),
92 + # decoder
93 + TransposeGatedConv2d(latent_channels * 4, latent_channels * 2, 3, 1, 1),
94 + GatedConv2d(latent_channels * 2, latent_channels * 2, 3, 1, 1),
95 + TransposeGatedConv2d(latent_channels * 2, latent_channels, 3, 1, 1),
96 + GatedConv2d(latent_channels, out_channels, 7, 1, 3, activation = 'tanh', norm = None)
97 + )
98 +
99 + def forward(self, img, mask):
100 + # img: entire img
101 + # mask: 1 for mask region; 0 for unmask region
102 + # 1 - mask: unmask
103 + # img * (1 - mask): ground truth unmask region
104 + # Coarse
105 +
106 + first_masked_img = img * (1 - mask) + mask
107 + first_in = torch.cat((first_masked_img, mask), 1) # in: [B, 4, H, W]
108 + first_out = self.coarse(first_in) # out: [B, 3, H, W]
109 + # Refinement
110 + second_masked_img = img * (1 - mask) + first_out * mask
111 + second_in = torch.cat((second_masked_img, mask), 1) # in: [B, 4, H, W]
112 + second_out = self.refinement(second_in) # out: [B, 3, H, W]
113 + return first_out, second_out
114 +
115 +
116 +class NLayerDiscriminator(nn.Module):
117 + def __init__(self, input_nc, ndf=64, n_layers=3, norm_layer=nn.BatchNorm2d, use_sigmoid=False):
118 + super(NLayerDiscriminator, self).__init__()
119 + if type(norm_layer) == functools.partial:
120 + use_bias = norm_layer.func == nn.InstanceNorm2d
121 + else:
122 + use_bias = norm_layer == nn.InstanceNorm2d
123 +
124 + kw = 4
125 + padw = 1
126 + sequence = [
127 + nn.Conv2d(input_nc, ndf, kernel_size=kw, stride=2, padding=padw),
128 + nn.LeakyReLU(0.2, True)
129 + ]
130 +
131 + nf_mult = 1
132 + nf_mult_prev = 1
133 + for n in range(1, n_layers):
134 + nf_mult_prev = nf_mult
135 + nf_mult = min(2**n, 8)
136 + sequence += [
137 + nn.Conv2d(ndf * nf_mult_prev, ndf * nf_mult,
138 + kernel_size=kw, stride=2, padding=padw, bias=use_bias),
139 + norm_layer(ndf * nf_mult),
140 + nn.LeakyReLU(0.2, True)
141 + ]
142 +
143 + nf_mult_prev = nf_mult
144 + nf_mult = min(2**n_layers, 8)
145 + sequence += [
146 + nn.Conv2d(ndf * nf_mult_prev, ndf * nf_mult,
147 + kernel_size=kw, stride=1, padding=padw, bias=use_bias),
148 + norm_layer(ndf * nf_mult),
149 + nn.LeakyReLU(0.2, True)
150 + ]
151 +
152 + sequence += [nn.Conv2d(ndf * nf_mult, 1, kernel_size=kw, stride=1, padding=padw)]
153 +
154 + if use_sigmoid:
155 + sequence += [nn.Sigmoid()]
156 +
157 + self.model = nn.Sequential(*sequence)
158 +
159 + def forward(self, input):
160 + return self.model(input)
161 +
162 +class PerceptualNet(nn.Module):
163 + # https://gist.github.com/alper111/8233cdb0414b4cb5853f2f730ab95a49
164 + def __init__(self, name = "vgg19", resize=True):
165 + super(PerceptualNet, self).__init__()
166 + blocks = []
167 + if name == "vgg19":
168 + blocks.append(vgg19(pretrained=True).features[:4].eval())
169 + blocks.append(vgg19(pretrained=True).features[4:9].eval())
170 + blocks.append(vgg19(pretrained=True).features[9:16].eval())
171 + blocks.append(vgg19(pretrained=True).features[16:23].eval())
172 + elif name == "vgg16":
173 + blocks.append(vgg16(pretrained=True).features[:4].eval())
174 + blocks.append(vgg16(pretrained=True).features[4:9].eval())
175 + blocks.append(vgg16(pretrained=True).features[9:16].eval())
176 + blocks.append(vgg16(pretrained=True).features[16:23].eval())
177 + else:
178 +            raise ValueError("wrong model name")
179 +
180 +        for bl in blocks:
181 +            for p in bl.parameters():
182 +                p.requires_grad = False
183 + self.blocks = torch.nn.ModuleList(blocks)
184 + self.transform = torch.nn.functional.interpolate
185 + self.mean = torch.nn.Parameter(torch.tensor([0.485, 0.456, 0.406]).view(1,3,1,1))
186 + self.std = torch.nn.Parameter(torch.tensor([0.229, 0.224, 0.225]).view(1,3,1,1))
187 + self.resize = resize
188 +
189 + def forward(self, inputs, targets):
190 + if inputs.shape[1] != 3:
191 + inputs = inputs.repeat(1, 3, 1, 1)
192 + targets = targets.repeat(1, 3, 1, 1)
193 + inputs = (inputs-self.mean) / self.std
194 + targets = (targets-self.mean) / self.std
195 + if self.resize:
196 + inputs = self.transform(inputs, mode='bilinear', size=(512, 512), align_corners=False)
197 + targets = self.transform(targets, mode='bilinear', size=(512, 512), align_corners=False)
198 + loss = 0.0
199 + x = inputs
200 + y = targets
201 + for block in self.blocks:
202 + x = block(x)
203 + y = block(y)
204 + loss += torch.nn.functional.l1_loss(x, y)
205 + return loss
206 +
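# Usage sketch (dummy tensors, illustrative only): the perceptual loss is a scalar
# L1 distance accumulated over the selected VGG feature blocks; inputs are expected
# in [0, 1] and are normalized with the ImageNet mean/std above.
#
#     percep = PerceptualNet(name="vgg16", resize=False)
#     pred, target = torch.rand(1, 3, 256, 256), torch.rand(1, 3, 256, 256)
#     loss_p = percep(pred, target)   # scalar tensor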
207 +
208 +
1 +import torch
2 +import torch.nn as nn
3 +from torch.nn import Parameter
4 +import torch.nn.functional as F
5 +import torch.utils.data as data
6 +import functools
7 +
8 +
9 +class conv_block(nn.Module):
10 + """
11 + Convolution Block
12 + """
13 + def __init__(self, in_ch, out_ch):
14 + super(conv_block, self).__init__()
15 +
16 + self.conv = nn.Sequential(
17 + nn.Conv2d(in_ch, out_ch, kernel_size=3, stride=1, padding=1, bias=True),
18 + nn.BatchNorm2d(out_ch),
19 + nn.ReLU(inplace=True),
20 + nn.Conv2d(out_ch, out_ch, kernel_size=3, stride=1, padding=1, bias=True),
21 + nn.BatchNorm2d(out_ch),
22 + nn.ReLU(inplace=True))
23 +
24 + def forward(self, x):
25 +
26 + x = self.conv(x)
27 + return x
28 +
29 +
30 +class up_conv(nn.Module):
31 + """
32 + Up Convolution Block
33 + """
34 + def __init__(self, in_ch, out_ch):
35 + super(up_conv, self).__init__()
36 + self.up = nn.Sequential(
37 + nn.Upsample(scale_factor=2),
38 + nn.Conv2d(in_ch, out_ch, kernel_size=3, stride=1, padding=1, bias=True),
39 + nn.BatchNorm2d(out_ch),
40 + nn.ReLU(inplace=True)
41 + )
42 +
43 + def forward(self, x):
44 + x = self.up(x)
45 + return x
46 +
47 +
48 +
49 +class Recurrent_block(nn.Module):
50 + """
51 + Recurrent Block for R2Unet_CNN
52 + """
53 + def __init__(self, out_ch, t=2):
54 + super(Recurrent_block, self).__init__()
55 +
56 + self.t = t
57 + self.out_ch = out_ch
58 + self.conv = nn.Sequential(
59 + nn.Conv2d(out_ch, out_ch, kernel_size=3, stride=1, padding=1, bias=True),
60 + nn.BatchNorm2d(out_ch),
61 + nn.ReLU(inplace=True)
62 + )
63 +
64 +    def forward(self, x):
65 +        for i in range(self.t):
66 +            if i == 0:
67 +                out = self.conv(x)
68 +            out = self.conv(x + out)  # recurrence: input plus the previous activation
69 +        return out
70 +
71 +
72 +class RRCNN_block(nn.Module):
73 + """
74 + Recurrent Residual Convolutional Neural Network Block
75 + """
76 + def __init__(self, in_ch, out_ch, t=2):
77 + super(RRCNN_block, self).__init__()
78 +
79 + self.RCNN = nn.Sequential(
80 + Recurrent_block(out_ch, t=t),
81 + Recurrent_block(out_ch, t=t)
82 + )
83 + self.Conv = nn.Conv2d(in_ch, out_ch, kernel_size=1, stride=1, padding=0)
84 +
85 + def forward(self, x):
86 + x1 = self.Conv(x)
87 + x2 = self.RCNN(x1)
88 + out = x1 + x2
89 + return out
90 +
91 +class Attention_block(nn.Module):
92 + """
93 + Attention Block
94 + """
95 +
96 + def __init__(self, F_g, F_l, F_int):
97 + super(Attention_block, self).__init__()
98 +
99 + self.W_g = nn.Sequential(
100 + nn.Conv2d(F_l, F_int, kernel_size=1, stride=1, padding=0, bias=True),
101 + nn.BatchNorm2d(F_int)
102 + )
103 +
104 + self.W_x = nn.Sequential(
105 + nn.Conv2d(F_g, F_int, kernel_size=1, stride=1, padding=0, bias=True),
106 + nn.BatchNorm2d(F_int)
107 + )
108 +
109 + self.psi = nn.Sequential(
110 + nn.Conv2d(F_int, 1, kernel_size=1, stride=1, padding=0, bias=True),
111 + nn.BatchNorm2d(1),
112 + nn.Sigmoid()
113 + )
114 +
115 + self.relu = nn.ReLU(inplace=True)
116 +
117 + def forward(self, g, x):
118 + g1 = self.W_g(g)
119 + x1 = self.W_x(x)
120 + psi = self.relu(g1 + x1)
121 + psi = self.psi(psi)
122 + out = x * psi
123 + return out
124 +
125 +class SE_Block(nn.Module):
126 + "credits: https://github.com/moskomule/senet.pytorch/blob/master/senet/se_module.py#L4"
127 + def __init__(self, c, r=16):
128 + super().__init__()
129 + self.squeeze = nn.AdaptiveAvgPool2d(1)
130 + self.excitation = nn.Sequential(
131 + nn.Linear(c, c // r, bias=False),
132 + nn.ReLU(inplace=True),
133 + nn.Linear(c // r, c, bias=False),
134 + nn.Sigmoid()
135 + )
136 +
137 + def forward(self, x):
138 + bs, c, _, _ = x.shape
139 + y = self.squeeze(x).view(bs, c)
140 + y = self.excitation(y).view(bs, c, 1, 1)
141 + return x * y.expand_as(x)
142 +
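# Usage sketch (illustrative): squeeze-and-excitation re-weights channels, so the
# output shape equals the input shape.
#
#     se = SE_Block(c=64)
#     se(torch.randn(2, 64, 32, 32)).shape   # -> torch.Size([2, 64, 32, 32])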
143 +class AtrousConv(nn.Module):
144 + def __init__(self, in_ch):
145 + super().__init__()
146 + self.atrous_conv = nn.Sequential(
147 + nn.Conv2d(in_ch, in_ch, kernel_size=3, stride=1, dilation=2, padding=2),
148 + nn.BatchNorm2d(in_ch),
149 + nn.ReLU(),
150 +
151 + nn.Conv2d(in_ch, in_ch, kernel_size=3, stride=1, dilation=4, padding=4),
152 + nn.BatchNorm2d(in_ch),
153 + nn.ReLU(),
154 +
155 + nn.Conv2d(in_ch, in_ch, kernel_size=3, stride=1, dilation=8, padding=8),
156 + nn.BatchNorm2d(in_ch),
157 + nn.ReLU(),
158 +
159 + nn.Conv2d(in_ch, in_ch, kernel_size=3, stride=1, dilation=16, padding=16),
160 + nn.BatchNorm2d(in_ch),
161 + nn.ReLU(),
162 + )
163 +
164 + def forward(self, x):
165 + return self.atrous_conv(x)
166 +
167 +
168 +class UNetSemantic(nn.Module):
169 + """
170 + UNet - Basic Implementation
171 + Paper : https://arxiv.org/abs/1505.04597
172 + """
173 + def __init__(self, in_ch=3, out_ch=1):
174 + super(UNetSemantic, self).__init__()
175 +
176 + n1 = 32
177 + filters = [n1, n1 * 2, n1 * 4, n1 * 8, n1 * 16]
178 +
179 + self.Maxpool1 = nn.MaxPool2d(kernel_size=2, stride=2)
180 + self.Maxpool2 = nn.MaxPool2d(kernel_size=2, stride=2)
181 + self.Maxpool3 = nn.MaxPool2d(kernel_size=2, stride=2)
182 + self.Maxpool4 = nn.MaxPool2d(kernel_size=2, stride=2)
183 +
184 + self.Conv1 = conv_block(in_ch, filters[0])
185 + self.Conv2 = conv_block(filters[0], filters[1])
186 + self.Conv3 = conv_block(filters[1], filters[2])
187 + self.Conv4 = conv_block(filters[2], filters[3])
188 + self.Conv5 = conv_block(filters[3], filters[4])
189 +
190 + self.Up5 = up_conv(filters[4], filters[3])
191 + self.Up_conv5 = conv_block(filters[4], filters[3])
192 +
193 + self.Up4 = up_conv(filters[3], filters[2])
194 + self.Up_conv4 = conv_block(filters[3], filters[2])
195 +
196 + self.Up3 = up_conv(filters[2], filters[1])
197 + self.Up_conv3 = conv_block(filters[2], filters[1])
198 +
199 + self.Up2 = up_conv(filters[1], filters[0])
200 + self.Up_conv2 = conv_block(filters[1], filters[0])
201 +
202 + self.Conv = nn.Conv2d(filters[0], out_ch, kernel_size=1, stride=1, padding=0)
203 + self.se1 = SE_Block(filters[0])
204 + self.se2 = SE_Block(filters[1])
205 + self.se3 = SE_Block(filters[2])
206 + self.active = torch.nn.Sigmoid()
207 +
208 + def forward(self, x):
209 +
210 + e1 = self.Conv1(x)
211 + e1 = self.se1(e1)
212 +
213 + e2 = self.Maxpool1(e1)
214 + e2 = self.Conv2(e2)
215 + e2 = self.se2(e2)
216 +
217 + e3 = self.Maxpool2(e2)
218 + e3 = self.Conv3(e3)
219 + e3 = self.se3(e3)
220 +
221 + e4 = self.Maxpool3(e3)
222 + e4 = self.Conv4(e4)
223 +
224 + e5 = self.Maxpool4(e4)
225 + e5 = self.Conv5(e5)
226 +
227 + d5 = self.Up5(e5)
228 + d5 = torch.cat((e4, d5), dim=1)
229 +
230 + d5 = self.Up_conv5(d5)
231 +
232 + d4 = self.Up4(d5)
233 + d4 = torch.cat((e3, d4), dim=1)
234 + d4 = self.Up_conv4(d4)
235 +
236 + d3 = self.Up3(d4)
237 + d3 = torch.cat((e2, d3), dim=1)
238 + d3 = self.Up_conv3(d3)
239 +
240 + d2 = self.Up2(d3)
241 + d2 = torch.cat((e1, d2), dim=1)
242 + d2 = self.Up_conv2(d2)
243 +
244 + out = self.Conv(d2)
245 +
246 + out = self.active(out)
247 +
248 + return out
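# Usage sketch (illustrative): UNetSemantic maps an RGB image to a single-channel
# mask in [0, 1]; height and width must be divisible by 16 because of the four
# max-pooling stages.
#
#     net = UNetSemantic(in_ch=3, out_ch=1)
#     net(torch.randn(1, 3, 256, 256)).shape   # -> torch.Size([1, 1, 256, 256])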
...\ No newline at end of file ...\ No newline at end of file
1 +import argparse
2 +from configs import Config
3 +from trainer import Trainer
4 +from unet_trainer import UNetTrainer
5 +
6 +
7 +def main(args, cfg):
8 + if args.config == "segm":
9 + trainer = UNetTrainer(args, cfg)
10 + else:
11 + trainer = Trainer(args, cfg)
12 + trainer.fit()
13 +
14 +
15 +if __name__ == "__main__":
16 + parser = argparse.ArgumentParser(description="Training custom model")
17 +    parser.add_argument("--resume", default=None, type=str, help="path to a checkpoint to resume training from")
18 +    parser.add_argument("config", default="config", type=str, help="name of the YAML config under ./configs (without the .yaml extension)")
19 + args = parser.parse_args()
20 +
21 + config = Config(f"./configs/{args.config}.yaml")
22 + main(args, config)
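# Example invocations (config names other than "segm" are assumptions; any YAML file
# under ./configs/ can be passed by its basename, and --resume takes a checkpoint path):
#
#     python train.py segm                                    # train the UNet segmentation model
#     python train.py facemask                                # any other name runs the inpainting Trainer
#     python train.py segm --resume checkpoints/model_segm_3_5000.pth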
1 +import os
2 +import cv2
3 +import time
4 +import numpy as np
5 +from PIL import Image
6 +import matplotlib.pyplot as plt
7 +
8 +import torch
9 +import torch.nn as nn
10 +import torch.utils.data as data
11 +from torch.optim.lr_scheduler import StepLR
12 +from torchvision.utils import save_image
13 +
14 +
15 +from models import *
16 +from losses import *
17 +from datasets import Places365Dataset, FacemaskDataset
18 +
19 +
20 +def adjust_learning_rate(optimizer, gamma, num_steps=1):
21 + for i in range(num_steps):
22 + for param_group in optimizer.param_groups:
23 + param_group['lr'] *= gamma
24 +
25 +def get_epoch_iters(path):
26 + path = os.path.basename(path)
27 + tokens = path[:-4].split('_')
28 + try:
29 + if tokens[-1] == 'interrupted':
30 + epoch_idx = int(tokens[-3])
31 + iter_idx = int(tokens[-2])
32 + else:
33 + epoch_idx = int(tokens[-2])
34 + iter_idx = int(tokens[-1])
35 +    except (IndexError, ValueError):
36 + return 0, 0
37 +
38 + return epoch_idx, iter_idx
39 +
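# Parsing sketch (filenames are illustrative): checkpoints saved by this trainer are
# named "model_<epoch>_<iters>.pth", so
#     get_epoch_iters("model_4_12000.pth")              -> (4, 12000)
#     get_epoch_iters("model_4_12000_interrupted.pth")  -> (4, 12000)
# and any filename that does not fit this pattern falls back to (0, 0).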
40 +def load_checkpoint(model_G, model_D, path):
41 + state = torch.load(path,map_location='cpu')
42 + model_G.load_state_dict(state['G'])
43 + model_D.load_state_dict(state['D'])
44 + print('Loaded checkpoint successfully')
45 +
46 +class Trainer():
47 + def __init__(self, args, cfg):
48 +
49 + if args.resume is not None:
50 + epoch, iters = get_epoch_iters(args.resume)
51 + else:
52 + epoch = 0
53 + iters = 0
54 +
55 + if not os.path.exists(cfg.checkpoint_path):
56 + os.makedirs(cfg.checkpoint_path)
57 + if not os.path.exists(cfg.sample_folder):
58 + os.makedirs(cfg.sample_folder)
59 +
60 + self.cfg = cfg
61 + self.step_iters = cfg.step_iters
62 + self.gamma = cfg.gamma
63 + self.visualize_per_iter = cfg.visualize_per_iter
64 + self.print_per_iter = cfg.print_per_iter
65 + self.save_per_iter = cfg.save_per_iter
66 +
67 + self.start_iter = iters
68 + self.iters = 0
69 + self.num_epochs = cfg.num_epochs
70 + self.device = torch.device('cuda' if cfg.cuda else 'cpu')
71 +
72 + trainset = FacemaskDataset(cfg) # Places365Dataset(cfg) #
73 +
74 + self.trainloader = data.DataLoader(
75 + trainset,
76 + batch_size=cfg.batch_size,
77 + num_workers = cfg.num_workers,
78 + pin_memory = True,
79 + shuffle=True,
80 + collate_fn = trainset.collate_fn)
81 +
82 + self.epoch = int(self.start_iter / len(self.trainloader))
83 + self.iters = self.start_iter
84 + self.num_iters = (self.num_epochs+1) * len(self.trainloader)
85 +
86 + self.model_G = GatedGenerator().to(self.device)
87 +        self.model_D = NLayerDiscriminator(3, n_layers=cfg.d_num_layers, use_sigmoid=False).to(self.device)  # 3-channel RGB input; cfg value sets the layer count
88 + self.model_P = PerceptualNet(name = "vgg16", resize=False).to(self.device)
89 +
90 + if args.resume is not None:
91 + load_checkpoint(self.model_G, self.model_D, args.resume)
92 +
93 + self.criterion_adv = GANLoss(target_real_label=0.9, target_fake_label=0.1)
94 + self.criterion_rec = nn.SmoothL1Loss()
95 + self.criterion_ssim = SSIM(window_size = 11)
96 + self.criterion_per = nn.SmoothL1Loss()
97 +
98 + self.optimizer_D = torch.optim.Adam(self.model_D.parameters(), lr=cfg.lr)
99 + self.optimizer_G = torch.optim.Adam(self.model_G.parameters(), lr=cfg.lr)
100 +
101 + def validate(self, sample_folder, sample_name, img_list):
102 + save_img_path = os.path.join(sample_folder, sample_name+'.png')
103 + img_list = [i.clone().cpu() for i in img_list]
104 + imgs = torch.stack(img_list, dim=1)
105 +
106 +        # imgs shape: B x 5 x C x H x W
107 +
108 + imgs = imgs.view(-1, *list(imgs.size())[2:])
109 + save_image(imgs, save_img_path, nrow= 5)
110 +        print(f"Saved image to {save_img_path}")
111 +
112 + def fit(self):
113 + self.model_G.train()
114 + self.model_D.train()
115 +
116 + running_loss = {
117 + 'D': 0,
118 + 'G': 0,
119 + 'P': 0,
120 + 'R_1': 0,
121 + 'R_2': 0,
122 + 'T': 0,
123 + }
124 +
125 + running_time = 0
126 + step = 0
127 + try:
128 + for epoch in range(self.epoch, self.num_epochs):
129 + self.epoch = epoch
130 + for i, batch in enumerate(self.trainloader):
131 + start_time = time.time()
132 + imgs = batch['imgs'].to(self.device)
133 + masks = batch['masks'].to(self.device)
134 +
135 + # Train discriminator
136 + self.optimizer_D.zero_grad()
137 + self.optimizer_G.zero_grad()
138 +
139 + first_out, second_out = self.model_G(imgs, masks)
140 +
141 + first_out_wholeimg = imgs * (1 - masks) + first_out * masks
142 + second_out_wholeimg = imgs * (1 - masks) + second_out * masks
143 +
144 + masks = masks.cpu()
145 +
146 + fake_D = self.model_D(second_out_wholeimg.detach())
147 + real_D = self.model_D(imgs)
148 +
149 + loss_fake_D = self.criterion_adv(fake_D, target_is_real=False)
150 + loss_real_D = self.criterion_adv(real_D, target_is_real=True)
151 +
152 + loss_D = (loss_fake_D + loss_real_D) * 0.5
153 +
154 + loss_D.backward()
155 + self.optimizer_D.step()
156 +
157 + real_D = None
158 +
159 + # Train Generator
160 + self.optimizer_D.zero_grad()
161 + self.optimizer_G.zero_grad()
162 +
163 + fake_D = self.model_D(second_out_wholeimg)
164 + loss_G = self.criterion_adv(fake_D, target_is_real=True)
165 +
166 + fake_D = None
167 +
168 + # Reconstruction loss
169 + loss_l1_1 = self.criterion_rec(first_out_wholeimg, imgs)
170 + loss_l1_2 = self.criterion_rec(second_out_wholeimg, imgs)
171 + loss_ssim_1 = self.criterion_ssim(first_out_wholeimg, imgs)
172 + loss_ssim_2 = self.criterion_ssim(second_out_wholeimg, imgs)
173 +
174 + loss_rec_1 = 0.5 * loss_l1_1 + 0.5 * (1 - loss_ssim_1)
175 + loss_rec_2 = 0.5 * loss_l1_2 + 0.5 * (1 - loss_ssim_2)
176 +
177 + # Perceptual loss
178 + loss_P = self.model_P(second_out_wholeimg, imgs)
179 +
180 + loss = self.cfg.lambda_G * loss_G + self.cfg.lambda_rec_1 * loss_rec_1 + self.cfg.lambda_rec_2 * loss_rec_2 + self.cfg.lambda_per * loss_P
181 + loss.backward()
182 + self.optimizer_G.step()
183 +
184 + end_time = time.time()
185 +
186 + imgs = imgs.cpu()
187 +                    # Accumulate losses and timing for logging
188 + running_time += (end_time - start_time)
189 + running_loss['D'] += loss_D.item()
190 + running_loss['G'] += (self.cfg.lambda_G * loss_G.item())
191 + running_loss['P'] += (self.cfg.lambda_per * loss_P.item())
192 + running_loss['R_1'] += (self.cfg.lambda_rec_1 * loss_rec_1.item())
193 + running_loss['R_2'] += (self.cfg.lambda_rec_2 * loss_rec_2.item())
194 + running_loss['T'] += loss.item()
195 +
196 +
197 + if self.iters % self.print_per_iter == 0:
198 + for key in running_loss.keys():
199 + running_loss[key] /= self.print_per_iter
200 + running_loss[key] = np.round(running_loss[key], 5)
201 + loss_string = '{}'.format(running_loss)[1:-1].replace("'",'').replace(",",' ||')
202 + print("[{}|{}] [{}|{}] || {} || Time: {:10.4f}s".format(self.epoch, self.num_epochs, self.iters, self.num_iters, loss_string, running_time))
203 +
204 + running_loss = {
205 + 'D': 0,
206 + 'G': 0,
207 + 'P': 0,
208 + 'R_1': 0,
209 + 'R_2': 0,
210 + 'T': 0,
211 + }
212 + running_time = 0
213 +
214 + if self.iters % self.save_per_iter == 0:
215 + torch.save({
216 + 'D': self.model_D.state_dict(),
217 + 'G': self.model_G.state_dict(),
218 + }, os.path.join(self.cfg.checkpoint_path, f"model_{self.epoch}_{self.iters}.pth"))
219 +
220 + # Step learning rate
221 +                    if step < len(self.step_iters) and self.iters == self.step_iters[step]:
222 + adjust_learning_rate(self.optimizer_D, self.gamma)
223 + adjust_learning_rate(self.optimizer_G, self.gamma)
224 + step+=1
225 +
226 + # Visualize sample
227 + if self.iters % self.visualize_per_iter == 0:
228 + masked_imgs = imgs * (1 - masks) + masks
229 +
230 + img_list = [imgs, masked_imgs, first_out, second_out, second_out_wholeimg]
231 + #name_list = ['gt', 'mask', 'masked_img', 'first_out', 'second_out']
232 + filename = f"{self.epoch}_{str(self.iters)}"
233 + self.validate(self.cfg.sample_folder, filename , img_list)
234 +
235 + self.iters += 1
236 +
237 + except KeyboardInterrupt:
238 + torch.save({
239 + 'D': self.model_D.state_dict(),
240 + 'G': self.model_G.state_dict(),
241 + }, os.path.join(self.cfg.checkpoint_path, f"model_{self.epoch}_{self.iters}.pth"))
242 +
243 +
...\ No newline at end of file ...\ No newline at end of file
1 +import os
2 +import cv2
3 +import time
4 +import numpy as np
5 +from PIL import Image
6 +import matplotlib.pyplot as plt
7 +from tqdm import tqdm
8 +
9 +import torch
10 +import torch.nn as nn
11 +import torch.utils.data as data
12 +from torch.optim.lr_scheduler import StepLR
13 +from torchvision.utils import save_image
14 +
15 +
16 +from models import UNetSemantic
17 +from losses import DiceLoss
18 +from datasets import FacemaskSegDataset
19 +from metrics import *
20 +
21 +
22 +def adjust_learning_rate(optimizer, gamma, num_steps=1):
23 + for i in range(num_steps):
24 + for param_group in optimizer.param_groups:
25 + param_group["lr"] *= gamma
26 +
27 +
28 +def get_epoch_iters(path):
29 + path = os.path.basename(path)
30 + tokens = path[:-4].split("_")
31 + try:
32 + if tokens[-1] == "interrupted":
33 + epoch_idx = int(tokens[-3])
34 + iter_idx = int(tokens[-2])
35 + else:
36 + epoch_idx = int(tokens[-2])
37 + iter_idx = int(tokens[-1])
38 +    except (IndexError, ValueError):
39 + return 0, 0
40 +
41 + return epoch_idx, iter_idx
42 +
43 +
44 +def load_checkpoint(model, path):
45 + state = torch.load(path, map_location="cpu")
46 + model.load_state_dict(state)
47 + print("Loaded checkpoint successfully")
48 +
49 +
50 +class UNetTrainer:
51 + def __init__(self, args, cfg):
52 +
53 + if args.resume is not None:
54 + epoch, iters = get_epoch_iters(args.resume)
55 + else:
56 + epoch = 0
57 + iters = 0
58 +
59 + self.cfg = cfg
60 + self.step_iters = cfg.step_iters
61 + self.gamma = cfg.gamma
62 + self.visualize_per_iter = cfg.visualize_per_iter
63 + self.print_per_iter = cfg.print_per_iter
64 + self.save_per_iter = cfg.save_per_iter
65 +
66 + self.start_iter = iters
67 + self.iters = 0
68 + self.num_epochs = cfg.num_epochs
69 + self.device = torch.device("cuda:0" if cfg.cuda else "cpu")
70 +
71 + trainset = FacemaskSegDataset(cfg)
72 + valset = FacemaskSegDataset(cfg, train=False)
73 +
74 + self.trainloader = data.DataLoader(
75 + trainset,
76 + batch_size=cfg.batch_size,
77 + num_workers=cfg.num_workers,
78 + pin_memory=True,
79 + shuffle=True,
80 + collate_fn=trainset.collate_fn,
81 + )
82 +
83 + self.valloader = data.DataLoader(
84 + valset,
85 + batch_size=cfg.batch_size,
86 + num_workers=cfg.num_workers,
87 + pin_memory=True,
88 + shuffle=True,
89 + collate_fn=valset.collate_fn,
90 + )
91 +
92 + self.epoch = int(self.start_iter / len(self.trainloader))
93 + self.iters = self.start_iter
94 + self.num_iters = (self.num_epochs + 1) * len(self.trainloader)
95 +
96 + self.model = UNetSemantic().to(self.device)
97 + self.criterion_dice = DiceLoss()
98 + self.criterion_bce = nn.BCELoss()
99 +
100 + if args.resume is not None:
101 + load_checkpoint(self.model, args.resume)
102 +
103 + self.optimizer = torch.optim.Adam(self.model.parameters(), lr=cfg.lr)
104 +
105 + def validate(self, sample_folder, sample_name, img_list):
106 + save_img_path = os.path.join(sample_folder, sample_name + ".png")
107 + img_list = [i.clone().cpu() for i in img_list]
108 + imgs = torch.stack(img_list, dim=1)
109 +
110 +        # imgs shape: B x N x C x H x W, where N = len(img_list)
111 +
112 + imgs = imgs.view(-1, *list(imgs.size())[2:])
113 + save_image(imgs, save_img_path, nrow=3)
114 +        print(f"Saved image to {save_img_path}")
115 +
116 + def train_epoch(self):
117 + self.model.train()
118 + running_loss = {
119 + "DICE": 0,
120 + "BCE": 0,
121 + "T": 0,
122 + }
123 + running_time = 0
124 +
125 + for idx, batch in enumerate(self.trainloader):
126 + self.optimizer.zero_grad()
127 + inputs = batch["imgs"].to(self.device)
128 + targets = batch["masks"].to(self.device)
129 +
130 + start_time = time.time()
131 +
132 + outputs = self.model(inputs)
133 +
134 + loss_bce = self.criterion_bce(outputs, targets)
135 + loss_dice = self.criterion_dice(outputs, targets)
136 + loss = loss_bce + loss_dice
137 + loss.backward()
138 + self.optimizer.step()
139 +
140 + end_time = time.time()
141 +
142 + running_loss["T"] += loss.item()
143 + running_loss["DICE"] += loss_dice.item()
144 + running_loss["BCE"] += loss_bce.item()
145 + running_time += end_time - start_time
146 +
147 + if self.iters % self.print_per_iter == 0:
148 + for key in running_loss.keys():
149 + running_loss[key] /= self.print_per_iter
150 + running_loss[key] = np.round(running_loss[key], 5)
151 + loss_string = (
152 + "{}".format(running_loss)[1:-1].replace("'", "").replace(",", " ||")
153 + )
154 + running_time = np.round(running_time, 5)
155 + print(
156 + "[{}/{}][{}/{}] || {} || Time: {}s".format(
157 + self.epoch,
158 + self.num_epochs,
159 + self.iters,
160 + self.num_iters,
161 + loss_string,
162 + running_time,
163 + )
164 + )
165 + running_time = 0
166 + running_loss = {
167 + "DICE": 0,
168 + "BCE": 0,
169 + "T": 0,
170 + }
171 +
172 + if self.iters % self.save_per_iter == 0:
173 + save_path = os.path.join(
174 + self.cfg.checkpoint_path,
175 + f"model_segm_{self.epoch}_{self.iters}.pth",
176 + )
177 + torch.save(self.model.state_dict(), save_path)
178 +                print(f"Saved model to {save_path}")
179 + self.iters += 1
180 +
181 + def validate_epoch(self):
182 + # Validate
183 +
184 + self.model.eval()
185 + metrics = [DiceScore(1), PixelAccuracy(1)]
186 + running_loss = {
187 + "DICE": 0,
188 + "BCE": 0,
189 + "T": 0,
190 + }
191 +
192 + running_time = 0
193 + print(
194 + "=============================EVALUATION==================================="
195 + )
196 + with torch.no_grad():
197 + start_time = time.time()
198 + for idx, batch in enumerate(tqdm(self.valloader)):
199 +
200 + inputs = batch["imgs"].to(self.device)
201 + targets = batch["masks"].to(self.device)
202 + outputs = self.model(inputs)
203 + loss_bce = self.criterion_bce(outputs, targets)
204 + loss_dice = self.criterion_dice(outputs, targets)
205 + loss = loss_bce + loss_dice
206 + running_loss["T"] += loss.item()
207 + running_loss["DICE"] += loss_dice.item()
208 + running_loss["BCE"] += loss_bce.item()
209 + for metric in metrics:
210 + metric.update(outputs.cpu(), targets.cpu())
211 +
212 + end_time = time.time()
213 + running_time += end_time - start_time
214 + running_time = np.round(running_time, 5)
215 + for key in running_loss.keys():
216 + running_loss[key] /= len(self.valloader)
217 + running_loss[key] = np.round(running_loss[key], 5)
218 +
219 + loss_string = (
220 + "{}".format(running_loss)[1:-1].replace("'", "").replace(",", " ||")
221 + )
222 +
223 + print(
224 + "[{}/{}] || Validation || {} || Time: {}s".format(
225 + self.epoch, self.num_epochs, loss_string, running_time
226 + )
227 + )
228 + for metric in metrics:
229 + print(metric)
230 + print(
231 + "=========================================================================="
232 + )
233 +
234 + def fit(self):
235 + try:
236 + for epoch in range(self.epoch, self.num_epochs + 1):
237 + self.epoch = epoch
238 + self.train_epoch()
239 + self.validate_epoch()
240 + except KeyboardInterrupt:
241 + torch.save(
242 + self.model.state_dict(),
243 + os.path.join(
244 + self.cfg.checkpoint_path,
245 + f"model_segm_{self.epoch}_{self.iters}.pth",
246 + ),
247 + )
248 + print("Model saved!")
249 +
1 +# Repo-specific
2 +data/masks/*
3 +.vscode*
4 +
5 +# Byte-compiled / optimized / DLL files
6 +__pycache__/
7 +*.py[cod]
8 +*$py.class
9 +
10 +# C extensions
11 +*.so
12 +
13 +# Distribution / packaging
14 +.Python
15 +build/
16 +develop-eggs/
17 +dist/
18 +downloads/
19 +eggs/
20 +.eggs/
21 +lib/
22 +lib64/
23 +parts/
24 +sdist/
25 +var/
26 +wheels/
27 +*.egg-info/
28 +.installed.cfg
29 +*.egg
30 +MANIFEST
31 +
32 +# PyInstaller
33 +# Usually these files are written by a python script from a template
34 +# before PyInstaller builds the exe, so as to inject date/other infos into it.
35 +*.manifest
36 +*.spec
37 +
38 +# Installer logs
39 +pip-log.txt
40 +pip-delete-this-directory.txt
41 +
42 +# Unit test / coverage reports
43 +htmlcov/
44 +.tox/
45 +.coverage
46 +.coverage.*
47 +.cache
48 +nosetests.xml
49 +coverage.xml
50 +*.cover
51 +.hypothesis/
52 +.pytest_cache/
53 +
54 +# Translations
55 +*.mo
56 +*.pot
57 +
58 +# Django stuff:
59 +*.log
60 +local_settings.py
61 +db.sqlite3
62 +
63 +# Flask stuff:
64 +instance/
65 +.webassets-cache
66 +
67 +# Scrapy stuff:
68 +.scrapy
69 +
70 +# Sphinx documentation
71 +docs/_build/
72 +
73 +# PyBuilder
74 +target/
75 +
76 +# Jupyter Notebook
77 +.ipynb_checkpoints
78 +
79 +# pyenv
80 +.python-version
81 +
82 +# celery beat schedule file
83 +celerybeat-schedule
84 +
85 +# SageMath parsed files
86 +*.sage.py
87 +
88 +# Environments
89 +.env
90 +.venv
91 +env/
92 +venv/
93 +ENV/
94 +env.bak/
95 +venv.bak/
96 +
97 +# Spyder project settings
98 +.spyderproject
99 +.spyproject
100 +
101 +# Rope project settings
102 +.ropeproject
103 +
104 +# mkdocs documentation
105 +/site
106 +
107 +# mypy
108 +.mypy_cache/
109 +
110 +backup*
111 +pexels_royalty_free_photos*
...\ No newline at end of file ...\ No newline at end of file
1 +
2 +from keras.utils import conv_utils
3 +from keras import backend as K
4 +from keras.engine import InputSpec
5 +from keras.layers import Conv2D
6 +
7 +
8 +class PConv2D(Conv2D):
9 + def __init__(self, *args, n_channels=3, mono=False, **kwargs):
10 + super().__init__(*args, **kwargs)
11 + self.input_spec = [InputSpec(ndim=4), InputSpec(ndim=4)]
12 +
13 + def build(self, input_shape):
14 + """Adapted from original _Conv() layer of Keras
15 + param input_shape: list of dimensions for [img, mask]
16 + """
17 +
18 + if self.data_format == 'channels_first':
19 + channel_axis = 1
20 + else:
21 + channel_axis = -1
22 +
23 + if input_shape[0][channel_axis] is None:
24 + raise ValueError('The channel dimension of the inputs should be defined. Found `None`.')
25 +
26 + self.input_dim = input_shape[0][channel_axis]
27 +
28 + # Image kernel
29 + kernel_shape = self.kernel_size + (self.input_dim, self.filters)
30 + self.kernel = self.add_weight(shape=kernel_shape,
31 + initializer=self.kernel_initializer,
32 + name='img_kernel',
33 + regularizer=self.kernel_regularizer,
34 + constraint=self.kernel_constraint)
35 + # Mask kernel
36 + self.kernel_mask = K.ones(shape=self.kernel_size + (self.input_dim, self.filters))
37 +
38 + # Calculate padding size to achieve zero-padding
39 + self.pconv_padding = (
40 + (int((self.kernel_size[0]-1)/2), int((self.kernel_size[0]-1)/2)),
41 +            (int((self.kernel_size[1]-1)/2), int((self.kernel_size[1]-1)/2)),
42 + )
43 +
44 + # Window size - used for normalization
45 + self.window_size = self.kernel_size[0] * self.kernel_size[1]
46 +
47 + if self.use_bias:
48 + self.bias = self.add_weight(shape=(self.filters,),
49 + initializer=self.bias_initializer,
50 + name='bias',
51 + regularizer=self.bias_regularizer,
52 + constraint=self.bias_constraint)
53 + else:
54 + self.bias = None
55 + self.built = True
56 +
57 + def call(self, inputs, mask=None):
58 + '''
59 +        We will be using the Keras conv2d method; essentially all we have
60 +        to do here is multiply the mask with the input X before we apply the
61 + convolutions. For the mask itself, we apply convolutions with all weights
62 + set to 1.
63 + Subsequently, we clip mask values to between 0 and 1
64 + '''
65 +
66 + # Both image and mask must be supplied
67 + if type(inputs) is not list or len(inputs) != 2:
68 + raise Exception('PartialConvolution2D must be called on a list of two tensors [img, mask]. Instead got: ' + str(inputs))
69 +
70 + # Padding done explicitly so that padding becomes part of the masked partial convolution
71 + images = K.spatial_2d_padding(inputs[0], self.pconv_padding, self.data_format)
72 + masks = K.spatial_2d_padding(inputs[1], self.pconv_padding, self.data_format)
73 +
74 + # Apply convolutions to mask
75 + mask_output = K.conv2d(
76 + masks, self.kernel_mask,
77 + strides=self.strides,
78 + padding='valid',
79 + data_format=self.data_format,
80 + dilation_rate=self.dilation_rate
81 + )
82 +
83 + # Apply convolutions to image
84 + img_output = K.conv2d(
85 + (images*masks), self.kernel,
86 + strides=self.strides,
87 + padding='valid',
88 + data_format=self.data_format,
89 + dilation_rate=self.dilation_rate
90 + )
91 +
92 + # Calculate the mask ratio on each pixel in the output mask
93 + mask_ratio = self.window_size / (mask_output + 1e-8)
94 +
95 + # Clip output to be between 0 and 1
96 + mask_output = K.clip(mask_output, 0, 1)
97 +
98 + # Remove ratio values where there are holes
99 + mask_ratio = mask_ratio * mask_output
100 +
101 +        # Normalize image output
102 + img_output = img_output * mask_ratio
103 +
104 + # Apply bias only to the image (if chosen to do so)
105 + if self.use_bias:
106 + img_output = K.bias_add(
107 + img_output,
108 + self.bias,
109 + data_format=self.data_format)
110 +
111 + # Apply activations on the image
112 + if self.activation is not None:
113 + img_output = self.activation(img_output)
114 +
115 + return [img_output, mask_output]
116 +
117 + def compute_output_shape(self, input_shape):
118 + if self.data_format == 'channels_last':
119 + space = input_shape[0][1:-1]
120 + new_space = []
121 + for i in range(len(space)):
122 + new_dim = conv_utils.conv_output_length(
123 + space[i],
124 + self.kernel_size[i],
125 + padding='same',
126 + stride=self.strides[i],
127 + dilation=self.dilation_rate[i])
128 + new_space.append(new_dim)
129 + new_shape = (input_shape[0][0],) + tuple(new_space) + (self.filters,)
130 + return [new_shape, new_shape]
131 + if self.data_format == 'channels_first':
132 + space = input_shape[2:]
133 + new_space = []
134 + for i in range(len(space)):
135 + new_dim = conv_utils.conv_output_length(
136 + space[i],
137 + self.kernel_size[i],
138 + padding='same',
139 + stride=self.strides[i],
140 + dilation=self.dilation_rate[i])
141 + new_space.append(new_dim)
142 + new_shape = (input_shape[0], self.filters) + tuple(new_space)
143 + return [new_shape, new_shape]
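# Normalization sketch (numbers are illustrative): for a 3x3 kernel the window size
# is 9. If only 3 of the 9 positions under the kernel are valid (mask == 1), the
# image convolution at that location is rescaled by 9 / 3 = 3 before the bias is
# added, and the output mask value is clipped to 1 so the position counts as valid
# for the next layer; locations with no valid pixels keep mask 0 and output 0.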
1 +import os
2 +import sys
3 +import numpy as np
4 +from datetime import datetime
5 +
6 +import tensorflow as tf
7 +from keras.models import Model
8 +from keras.models import load_model
9 +from keras.optimizers import Adam
10 +from keras.layers import Input, Conv2D, UpSampling2D, Dropout, LeakyReLU, BatchNormalization, Activation, Lambda
11 +from keras.layers.merge import Concatenate
12 +from keras.applications import VGG16
13 +from keras import backend as K
14 +from keras.utils.multi_gpu_utils import multi_gpu_model
15 +
16 +from libs.pconv_layer import PConv2D
17 +
18 +
19 +class PConvUnet(object):
20 +
21 + def __init__(self, img_rows=512, img_cols=512, vgg_weights="imagenet", inference_only=False, net_name='default', gpus=1, vgg_device=None):
22 + """Create the PConvUnet. If variable image size, set img_rows and img_cols to None
23 +
24 + Args:
25 + img_rows (int): image height.
26 + img_cols (int): image width.
27 + vgg_weights (str): which weights to pass to the vgg network.
28 + inference_only (bool): initialize BN layers for inference.
29 + net_name (str): Name of this network (used in logging).
30 + gpus (int): How many GPUs to use for training.
31 + vgg_device (str): In case of training with multiple GPUs, specify which device to run VGG inference on.
32 + e.g. if training on 8 GPUs, vgg inference could be off-loaded exclusively to one GPU, instead of
33 + running on one of the GPUs which is also training the UNet.
34 + """
35 +
36 + # Settings
37 + self.img_rows = img_rows
38 + self.img_cols = img_cols
39 + self.img_overlap = 30
40 + self.inference_only = inference_only
41 + self.net_name = net_name
42 + self.gpus = gpus
43 + self.vgg_device = vgg_device
44 +
45 + # Scaling for VGG input
46 + self.mean = [0.485, 0.456, 0.406]
47 + self.std = [0.229, 0.224, 0.225]
48 +
49 + # Assertions
50 +        assert self.img_rows >= 256, 'Height must be at least 256 pixels'
51 +        assert self.img_cols >= 256, 'Width must be at least 256 pixels'
52 +
53 + # Set current epoch
54 + self.current_epoch = 0
55 +
56 + # VGG layers to extract features from (first maxpooling layers, see pp. 7 of paper)
57 + self.vgg_layers = [3, 6, 10]
58 +
59 + # Instantiate the vgg network
60 + if self.vgg_device:
61 + with tf.device(self.vgg_device):
62 + self.vgg = self.build_vgg(vgg_weights)
63 + else:
64 + self.vgg = self.build_vgg(vgg_weights)
65 +
66 + # Create UNet-like model
67 + if self.gpus <= 1:
68 + self.model, inputs_mask = self.build_pconv_unet()
69 + self.compile_pconv_unet(self.model, inputs_mask)
70 + else:
71 + with tf.device("/cpu:0"):
72 + self.model, inputs_mask = self.build_pconv_unet()
73 + self.model = multi_gpu_model(self.model, gpus=self.gpus)
74 + self.compile_pconv_unet(self.model, inputs_mask)
75 +
76 + def build_vgg(self, weights="imagenet"):
77 + """
78 + Load pre-trained VGG16 from keras applications
79 + Extract features to be used in loss function from last conv layer, see architecture at:
80 + https://github.com/keras-team/keras/blob/master/keras/applications/vgg16.py
81 + """
82 +
83 + # Input image to extract features from
84 + img = Input(shape=(self.img_rows, self.img_cols, 3))
85 +
86 + # Mean center and rescale by variance as in PyTorch
87 + processed = Lambda(lambda x: (x-self.mean) / self.std)(img)
88 +
89 + # If inference only, just return empty model
90 + if self.inference_only:
91 + model = Model(inputs=img, outputs=[img for _ in range(len(self.vgg_layers))])
92 + model.trainable = False
93 + model.compile(loss='mse', optimizer='adam')
94 + return model
95 +
96 + # Get the vgg network from Keras applications
97 + if weights in ['imagenet', None]:
98 + vgg = VGG16(weights=weights, include_top=False)
99 + else:
100 + vgg = VGG16(weights=None, include_top=False)
101 + vgg.load_weights(weights, by_name=True)
102 +
103 + # Output the first three pooling layers
104 + vgg.outputs = [vgg.layers[i].output for i in self.vgg_layers]
105 +
106 + # Create model and compile
107 + model = Model(inputs=img, outputs=vgg(processed))
108 + model.trainable = False
109 + model.compile(loss='mse', optimizer='adam')
110 +
111 + return model
112 +
113 + def build_pconv_unet(self, train_bn=True):
114 +
115 + # INPUTS
116 + inputs_img = Input((self.img_rows, self.img_cols, 3), name='inputs_img')
117 + inputs_mask = Input((self.img_rows, self.img_cols, 3), name='inputs_mask')
118 +
119 + # ENCODER
120 + def encoder_layer(img_in, mask_in, filters, kernel_size, bn=True):
121 + conv, mask = PConv2D(filters, kernel_size, strides=2, padding='same')([img_in, mask_in])
122 + if bn:
123 + conv = BatchNormalization(name='EncBN'+str(encoder_layer.counter))(conv, training=train_bn)
124 + conv = Activation('relu')(conv)
125 + encoder_layer.counter += 1
126 + return conv, mask
127 + encoder_layer.counter = 0
128 +
129 + e_conv1, e_mask1 = encoder_layer(inputs_img, inputs_mask, 64, 7, bn=False)
130 + e_conv2, e_mask2 = encoder_layer(e_conv1, e_mask1, 128, 5)
131 + e_conv3, e_mask3 = encoder_layer(e_conv2, e_mask2, 256, 5)
132 + e_conv4, e_mask4 = encoder_layer(e_conv3, e_mask3, 512, 3)
133 + e_conv5, e_mask5 = encoder_layer(e_conv4, e_mask4, 512, 3)
134 + e_conv6, e_mask6 = encoder_layer(e_conv5, e_mask5, 512, 3)
135 + e_conv7, e_mask7 = encoder_layer(e_conv6, e_mask6, 512, 3)
136 + e_conv8, e_mask8 = encoder_layer(e_conv7, e_mask7, 512, 3)
137 +
138 + # DECODER
139 + def decoder_layer(img_in, mask_in, e_conv, e_mask, filters, kernel_size, bn=True):
140 + up_img = UpSampling2D(size=(2,2))(img_in)
141 + up_mask = UpSampling2D(size=(2,2))(mask_in)
142 + concat_img = Concatenate(axis=3)([e_conv,up_img])
143 + concat_mask = Concatenate(axis=3)([e_mask,up_mask])
144 + conv, mask = PConv2D(filters, kernel_size, padding='same')([concat_img, concat_mask])
145 + if bn:
146 + conv = BatchNormalization()(conv)
147 + conv = LeakyReLU(alpha=0.2)(conv)
148 + return conv, mask
149 +
150 + d_conv9, d_mask9 = decoder_layer(e_conv8, e_mask8, e_conv7, e_mask7, 512, 3)
151 + d_conv10, d_mask10 = decoder_layer(d_conv9, d_mask9, e_conv6, e_mask6, 512, 3)
152 + d_conv11, d_mask11 = decoder_layer(d_conv10, d_mask10, e_conv5, e_mask5, 512, 3)
153 + d_conv12, d_mask12 = decoder_layer(d_conv11, d_mask11, e_conv4, e_mask4, 512, 3)
154 + d_conv13, d_mask13 = decoder_layer(d_conv12, d_mask12, e_conv3, e_mask3, 256, 3)
155 + d_conv14, d_mask14 = decoder_layer(d_conv13, d_mask13, e_conv2, e_mask2, 128, 3)
156 + d_conv15, d_mask15 = decoder_layer(d_conv14, d_mask14, e_conv1, e_mask1, 64, 3)
157 + d_conv16, d_mask16 = decoder_layer(d_conv15, d_mask15, inputs_img, inputs_mask, 3, 3, bn=False)
158 + outputs = Conv2D(3, 1, activation = 'sigmoid', name='outputs_img')(d_conv16)
159 +
160 + # Setup the model inputs / outputs
161 + model = Model(inputs=[inputs_img, inputs_mask], outputs=outputs)
162 +
163 + return model, inputs_mask
164 +
165 + def compile_pconv_unet(self, model, inputs_mask, lr=0.0002):
166 + model.compile(
167 + optimizer = Adam(lr=lr),
168 + loss=self.loss_total(inputs_mask),
169 + metrics=[self.PSNR]
170 + )
171 +
172 + def loss_total(self, mask):
173 + """
174 + Creates a loss function which sums all the loss components
175 + and multiplies by their weights. See paper eq. 7.
176 + """
177 + def loss(y_true, y_pred):
178 +
179 + # Compute predicted image with non-hole pixels set to ground truth
180 + y_comp = mask * y_true + (1-mask) * y_pred
181 +
182 + # Compute the vgg features.
183 + if self.vgg_device:
184 + with tf.device(self.vgg_device):
185 + vgg_out = self.vgg(y_pred)
186 + vgg_gt = self.vgg(y_true)
187 + vgg_comp = self.vgg(y_comp)
188 + else:
189 + vgg_out = self.vgg(y_pred)
190 + vgg_gt = self.vgg(y_true)
191 + vgg_comp = self.vgg(y_comp)
192 +
193 + # Compute loss components
194 + l1 = self.loss_valid(mask, y_true, y_pred)
195 + l2 = self.loss_hole(mask, y_true, y_pred)
196 + l3 = self.loss_perceptual(vgg_out, vgg_gt, vgg_comp)
197 + l4 = self.loss_style(vgg_out, vgg_gt)
198 + l5 = self.loss_style(vgg_comp, vgg_gt)
199 + l6 = self.loss_tv(mask, y_comp)
200 +
201 + # Return loss function
202 + return l1 + 6*l2 + 0.05*l3 + 120*(l4+l5) + 0.1*l6
203 +
204 + return loss
205 +
206 + def loss_hole(self, mask, y_true, y_pred):
207 + """Pixel L1 loss within the hole / mask"""
208 + return self.l1((1-mask) * y_true, (1-mask) * y_pred)
209 +
210 + def loss_valid(self, mask, y_true, y_pred):
211 + """Pixel L1 loss outside the hole / mask"""
212 + return self.l1(mask * y_true, mask * y_pred)
213 +
214 + def loss_perceptual(self, vgg_out, vgg_gt, vgg_comp):
215 + """Perceptual loss based on VGG16, see. eq. 3 in paper"""
216 + loss = 0
217 + for o, c, g in zip(vgg_out, vgg_comp, vgg_gt):
218 + loss += self.l1(o, g) + self.l1(c, g)
219 + return loss
220 +
221 + def loss_style(self, output, vgg_gt):
222 + """Style loss based on output/computation, used for both eq. 4 & 5 in paper"""
223 + loss = 0
224 + for o, g in zip(output, vgg_gt):
225 + loss += self.l1(self.gram_matrix(o), self.gram_matrix(g))
226 + return loss
227 +
228 + def loss_tv(self, mask, y_comp):
229 + """Total variation loss, used for smoothing the hole region, see. eq. 6"""
230 +
231 + # Create dilated hole region using a 3x3 kernel of all 1s.
232 + kernel = K.ones(shape=(3, 3, mask.shape[3], mask.shape[3]))
233 + dilated_mask = K.conv2d(1-mask, kernel, data_format='channels_last', padding='same')
234 +
235 + # Cast values to be [0., 1.], and compute dilated hole region of y_comp
236 + dilated_mask = K.cast(K.greater(dilated_mask, 0), 'float32')
237 + P = dilated_mask * y_comp
238 +
239 + # Calculate total variation loss
240 + a = self.l1(P[:,1:,:,:], P[:,:-1,:,:])
241 + b = self.l1(P[:,:,1:,:], P[:,:,:-1,:])
242 + return a+b
243 +
244 + def fit_generator(self, generator, *args, **kwargs):
245 + """Fit the U-Net to a (images, targets) generator
246 +
247 + Args:
248 + generator (generator): generator supplying input image & mask, as well as targets.
249 + *args: arguments to be passed to fit_generator
250 + **kwargs: keyword arguments to be passed to fit_generator
251 + """
252 + self.model.fit_generator(
253 + generator,
254 + *args, **kwargs
255 + )
256 +
257 + def summary(self):
258 + """Get summary of the UNet model"""
259 + print(self.model.summary())
260 +
261 + def load(self, filepath, train_bn=True, lr=0.0002):
262 +
263 + # Create UNet-like model
264 + self.model, inputs_mask = self.build_pconv_unet(train_bn)
265 + self.compile_pconv_unet(self.model, inputs_mask, lr)
266 +
267 + # Load weights into model
268 + epoch = int(os.path.basename(filepath).split('.')[1].split('-')[0])
269 + assert epoch > 0, "Could not parse weight file. Should include the epoch"
270 + self.current_epoch = epoch
271 + self.model.load_weights(filepath)
272 +
273 + @staticmethod
274 + def PSNR(y_true, y_pred):
275 + """
276 +        PSNR is Peak Signal to Noise Ratio, see https://en.wikipedia.org/wiki/Peak_signal-to-noise_ratio
277 + The equation is:
278 + PSNR = 20 * log10(MAX_I) - 10 * log10(MSE)
279 +
280 +        Our input is scaled to be within the range -2.11 to 2.64 (imagenet value scaling). We use the difference between these
281 + two values (4.75) as MAX_I
282 + """
283 + #return 20 * K.log(4.75) / K.log(10.0) - 10.0 * K.log(K.mean(K.square(y_pred - y_true))) / K.log(10.0)
284 + return - 10.0 * K.log(K.mean(K.square(y_pred - y_true))) / K.log(10.0)
285 +
286 + @staticmethod
287 + def current_timestamp():
288 + return datetime.now().strftime('%Y-%m-%d-%H-%M-%S')
289 +
290 + @staticmethod
291 + def l1(y_true, y_pred):
292 + """Calculate the L1 loss used in all loss calculations"""
293 + if K.ndim(y_true) == 4:
294 + return K.mean(K.abs(y_pred - y_true), axis=[1,2,3])
295 + elif K.ndim(y_true) == 3:
296 + return K.mean(K.abs(y_pred - y_true), axis=[1,2])
297 + else:
298 + raise NotImplementedError("Calculating L1 loss on 1D tensors? should not occur for this network")
299 +
300 + @staticmethod
301 + def gram_matrix(x, norm_by_channels=False):
302 + """Calculate gram matrix used in style loss"""
303 +
304 + # Assertions on input
305 + assert K.ndim(x) == 4, 'Input tensor should be a 4d (B, H, W, C) tensor'
306 + assert K.image_data_format() == 'channels_last', "Please use channels-last format"
307 +
308 + # Permute channels and get resulting shape
309 + x = K.permute_dimensions(x, (0, 3, 1, 2))
310 + shape = K.shape(x)
311 + B, C, H, W = shape[0], shape[1], shape[2], shape[3]
312 +
313 + # Reshape x and do batch dot product
314 + features = K.reshape(x, K.stack([B, C, H*W]))
315 + gram = K.batch_dot(features, features, axes=2)
316 +
317 + # Normalize with channels, height and width
318 + gram = gram / K.cast(C * H * W, x.dtype)
319 +
320 + return gram
321 +
322 + # Prediction functions
323 + ######################
324 + def predict(self, sample, **kwargs):
325 + """Run prediction using this model"""
326 + return self.model.predict(sample, **kwargs)
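# Inference sketch (variable names are illustrative): the model expects a masked
# image and its mask, both scaled to [0, 1] with shape (B, 512, 512, 3), and returns
# the completed images in the same shape; trained weights would be loaded with load().
#
#     model = PConvUnet(vgg_weights=None, inference_only=True)
#     pred = model.predict([masked_batch, mask_batch])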
1 +import os
2 +from random import randint, seed
3 +import itertools
4 +import numpy as np
5 +import cv2
6 +
7 +
8 +class MaskGenerator():
9 +
10 + def __init__(self, height, width, channels=3, rand_seed=None, filepath=None):
11 + """Convenience functions for generating masks to be used for inpainting training
12 +
13 + Arguments:
14 + height {int} -- Mask height
15 +            width {int} -- Mask width
16 +
17 + Keyword Arguments:
18 + channels {int} -- Channels to output (default: {3})
19 + rand_seed {[type]} -- Random seed (default: {None})
20 + filepath {[type]} -- Load masks from filepath. If None, generate masks with OpenCV (default: {None})
21 + """
22 +
23 + self.height = height
24 + self.width = width
25 + self.channels = channels
26 + self.filepath = filepath
27 +
28 + # If filepath supplied, load the list of masks within the directory
29 + self.mask_files = []
30 + if self.filepath:
31 + filenames = [f for f in os.listdir(self.filepath)]
32 + self.mask_files = [f for f in filenames if any(filetype in f.lower() for filetype in ['.jpeg', '.png', '.jpg'])]
33 + print(">> Found {} masks in {}".format(len(self.mask_files), self.filepath))
34 +
35 + # Seed for reproducibility
36 + if rand_seed:
37 + seed(rand_seed)
38 +
39 + def _generate_mask(self):
40 +        """Generates a random irregular mask with lines, circles and ellipses"""
41 +
42 + img = np.zeros((self.height, self.width, self.channels), np.uint8)
43 +
44 + # Set size scale
45 + size = int((self.width + self.height) * 0.03)
46 + if self.width < 64 or self.height < 64:
47 + raise Exception("Width and Height of mask must be at least 64!")
48 +
49 + # Draw random lines
50 + for _ in range(randint(1, 20)):
51 + x1, x2 = randint(1, self.width), randint(1, self.width)
52 + y1, y2 = randint(1, self.height), randint(1, self.height)
53 + thickness = randint(3, size)
54 + cv2.line(img,(x1,y1),(x2,y2),(1,1,1),thickness)
55 +
56 + # Draw random circles
57 + for _ in range(randint(1, 20)):
58 + x1, y1 = randint(1, self.width), randint(1, self.height)
59 + radius = randint(3, size)
60 + cv2.circle(img,(x1,y1),radius,(1,1,1), -1)
61 +
62 + # Draw random ellipses
63 + for _ in range(randint(1, 20)):
64 + x1, y1 = randint(1, self.width), randint(1, self.height)
65 + s1, s2 = randint(1, self.width), randint(1, self.height)
66 + a1, a2, a3 = randint(3, 180), randint(3, 180), randint(3, 180)
67 + thickness = randint(3, size)
68 + cv2.ellipse(img, (x1,y1), (s1,s2), a1, a2, a3,(1,1,1), thickness)
69 +
70 + return 1-img
71 +
72 + def _load_mask(self, rotation=True, dilation=True, cropping=True):
73 + """Loads a mask from disk, and optionally augments it"""
74 +
75 + # Read image
76 + mask = cv2.imread(os.path.join(self.filepath, np.random.choice(self.mask_files, 1, replace=False)[0]))
77 +
78 + # Random rotation
79 + if rotation:
80 + rand = np.random.randint(-180, 180)
81 + M = cv2.getRotationMatrix2D((mask.shape[1]/2, mask.shape[0]/2), rand, 1.5)
82 + mask = cv2.warpAffine(mask, M, (mask.shape[1], mask.shape[0]))
83 +
84 +        # Random dilation of the hole region (eroding the 1-valued background grows the 0-valued holes)
85 + if dilation:
86 + rand = np.random.randint(5, 47)
87 + kernel = np.ones((rand, rand), np.uint8)
88 + mask = cv2.erode(mask, kernel, iterations=1)
89 +
90 + # Random cropping
91 + if cropping:
92 + x = np.random.randint(0, mask.shape[1] - self.width)
93 + y = np.random.randint(0, mask.shape[0] - self.height)
94 + mask = mask[y:y+self.height, x:x+self.width]
95 +
96 + return (mask > 1).astype(np.uint8)
97 +
98 + def sample(self, random_seed=None):
99 + """Retrieve a random mask"""
100 + if random_seed:
101 + seed(random_seed)
102 + if self.filepath and len(self.mask_files) > 0:
103 + return self._load_mask()
104 + else:
105 + return self._generate_mask()
106 +
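# Usage sketch (illustrative): sampled masks are uint8 arrays of shape
# (height, width, channels) with 1 for kept pixels and 0 inside the random holes.
#
#     gen = MaskGenerator(512, 512, 3)
#     mask = gen.sample()   # ones everywhere except the drawn lines, circles and ellipses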
107 +
108 +class ImageChunker(object):
109 +
110 + def __init__(self, rows, cols, overlap):
111 + self.rows = rows
112 + self.cols = cols
113 + self.overlap = overlap
114 +
115 + def perform_chunking(self, img_size, chunk_size):
116 + """
117 + Given an image dimension img_size, return list of (start, stop)
118 + tuples to perform chunking of chunk_size
119 + """
120 + chunks, i = [], 0
121 + while True:
122 + chunks.append((i*(chunk_size - self.overlap/2), i*(chunk_size - self.overlap/2)+chunk_size))
123 + i+=1
124 + if chunks[-1][1] > img_size:
125 + break
126 + n_count = len(chunks)
127 + chunks[-1] = tuple(x - (n_count*chunk_size - img_size - (n_count-1)*self.overlap/2) for x in chunks[-1])
128 + chunks = [(int(x), int(y)) for x, y in chunks]
129 + return chunks
130 +
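    # Worked example (illustrative numbers): with rows = cols = 512 and overlap = 30,
    # an image of height 768 is split as
    #     perform_chunking(768, 512)  ->  [(0, 512), (256, 768)]
    # i.e. two 512-pixel windows, the second shifted back so both fit inside the
    # image (they overlap by 256 pixels).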
131 + def get_chunks(self, img, scale=1):
132 + """
133 + Get width and height lists of (start, stop) tuples for chunking of img.
134 + """
135 + x_chunks, y_chunks = [(0, self.rows)], [(0, self.cols)]
136 + if img.shape[0] > self.rows:
137 + x_chunks = self.perform_chunking(img.shape[0], self.rows)
138 + else:
139 + x_chunks = [(0, img.shape[0])]
140 + if img.shape[1] > self.cols:
141 + y_chunks = self.perform_chunking(img.shape[1], self.cols)
142 + else:
143 + y_chunks = [(0, img.shape[1])]
144 + return x_chunks, y_chunks
145 +
146 + def dimension_preprocess(self, img, padding=True):
147 + """
148 + In case of prediction on image of different size than 512x512,
149 + this function is used to add padding and chunk up the image into pieces
150 + of 512x512, which can then later be reconstructed into the original image
151 + using the dimension_postprocess() function.
152 + """
153 +
154 + # Assert single image input
155 + assert len(img.shape) == 3, "Image dimension expected to be (H, W, C)"
156 +
157 + # Check if we are adding padding for too small images
158 + if padding:
159 +
160 + # Check if height is too small
161 + if img.shape[0] < self.rows:
162 + padding = np.ones((self.rows - img.shape[0], img.shape[1], img.shape[2]))
163 + img = np.concatenate((img, padding), axis=0)
164 +
165 + # Check if width is too small
166 + if img.shape[1] < self.cols:
167 + padding = np.ones((img.shape[0], self.cols - img.shape[1], img.shape[2]))
168 + img = np.concatenate((img, padding), axis=1)
169 +
170 + # Get chunking of the image
171 + x_chunks, y_chunks = self.get_chunks(img)
172 +
173 + # Chunk up the image
174 + images = []
175 + for x in x_chunks:
176 + for y in y_chunks:
177 + images.append(
178 + img[x[0]:x[1], y[0]:y[1], :]
179 + )
180 + images = np.array(images)
181 + return images
182 +
183 + def dimension_postprocess(self, chunked_images, original_image, scale=1, padding=True):
184 + """
185 + In case of prediction on image of different size than 512x512,
186 + the dimension_preprocess function is used to add padding and chunk
187 + up the image into pieces of 512x512, and this function is used to
188 + reconstruct these pieces into the original image.
189 + """
190 +
191 + # Assert input dimensions
192 + assert len(original_image.shape) == 3, "Image dimension expected to be (H, W, C)"
193 + assert len(chunked_images.shape) == 4, "Chunked images dimension expected to be (B, H, W, C)"
194 +
195 + # Check if we are adding padding for too small images
196 + if padding:
197 +
198 + # Check if height is too small
199 + if original_image.shape[0] < self.rows:
200 + new_images = []
201 + for img in chunked_images:
202 + new_images.append(img[0:scale*original_image.shape[0], :, :])
203 + chunked_images = np.array(new_images)
204 +
205 + # Check if width is too small
206 + if original_image.shape[1] < self.cols:
207 + new_images = []
208 + for img in chunked_images:
209 + new_images.append(img[:, 0:scale*original_image.shape[1], :])
210 + chunked_images = np.array(new_images)
211 +
212 + # Put reconstruction into this array
213 + new_shape = (
214 + original_image.shape[0]*scale,
215 + original_image.shape[1]*scale,
216 + original_image.shape[2]
217 + )
218 + reconstruction = np.zeros(new_shape)
219 +
220 + # Get the chunks for this image
221 + x_chunks, y_chunks = self.get_chunks(original_image)
222 +
223 + i = 0
224 + s = scale
225 + for x in x_chunks:
226 + for y in y_chunks:
227 +
228 + prior_fill = reconstruction != 0
229 + chunk = np.zeros(new_shape)
230 + chunk[x[0]*s:x[1]*s, y[0]*s:y[1]*s, :] += chunked_images[i]
231 + chunk_fill = chunk != 0
232 +
233 + reconstruction += chunk
234 + reconstruction[prior_fill & chunk_fill] = reconstruction[prior_fill & chunk_fill] / 2
235 +
236 + i += 1
237 +
238 + return reconstruction
...\ No newline at end of file ...\ No newline at end of file
1 +import os
2 +import gc
3 +import datetime
4 +import numpy as np
5 +import pandas as pd
6 +import cv2
7 +
8 +from argparse import ArgumentParser
9 +from copy import deepcopy
10 +from tqdm import tqdm
11 +
12 +from keras.preprocessing.image import ImageDataGenerator
13 +from keras.callbacks import TensorBoard, ModelCheckpoint, LambdaCallback
14 +from keras import backend as K
15 +from keras.utils import Sequence
16 +from keras_tqdm import TQDMCallback
17 +
18 +import matplotlib.pyplot as plt
19 +from matplotlib.ticker import NullFormatter
20 +
21 +from libs.pconv_model import PConvUnet
22 +from libs.util import MaskGenerator
23 +
24 +
25 +# Sample call
26 +r"""
27 +# Train on CelebaHQ
28 +python main.py --name CelebHQ --train C:\Documents\Kaggle\celebaHQ-512\train\ --validation C:\Documents\Kaggle\celebaHQ-512\val\ --test C:\Documents\Kaggle\celebaHQ-512\test\ --checkpoint "C:\Users\Mathias Felix Gruber\Documents\GitHub\PConv-Keras\data\logs\imagenet_phase1_paperMasks\weights.35-0.70.h5"
29 +"""
30 +
31 +
32 +def parse_args():
33 + parser = ArgumentParser(description="Training script for PConv inpainting")
34 +
35 + parser.add_argument(
36 + "-stage",
37 + "--stage",
38 + type=str,
39 + default="train",
40 + help="Which stage of training to run",
41 + choices=["train", "finetune"],
42 + )
43 +
44 + parser.add_argument(
45 + "-train", "--train", type=str, help="Folder with training images"
46 + )
47 +
48 + parser.add_argument(
49 + "-validation", "--validation", type=str, help="Folder with validation images"
50 + )
51 +
52 + parser.add_argument("-test", "--test", type=str, help="Folder with testing images")
53 +
54 + parser.add_argument(
55 + "-name",
56 + "--name",
57 + type=str,
58 + default="myDataset",
59 + help="Dataset name, e.g. 'imagenet'",
60 + )
61 +
62 + parser.add_argument(
63 + "-batch_size",
64 + "--batch_size",
65 + type=int,
66 + default=4,
67 + help="What batch-size should we use",
68 + )
69 +
70 + parser.add_argument(
71 + "-test_path",
72 + "--test_path",
73 + type=str,
74 + default="./data/test_samples/",
75 + help="Where to output test images during training",
76 + )
77 +
78 + parser.add_argument(
79 + "-weight_path",
80 + "--weight_path",
81 + type=str,
82 + default="./data/logs/",
83 + help="Where to output weights during training",
84 + )
85 +
86 + parser.add_argument(
87 + "-log_path",
88 + "--log_path",
89 + type=str,
90 + default="./data/logs/",
91 + help="Where to output tensorboard logs during training",
92 + )
93 +
94 + parser.add_argument(
95 + "-vgg_path",
96 + "--vgg_path",
97 + type=str,
98 + default="./data/logs/pytorch_to_keras_vgg16.h5",
99 + help="VGG16 weights trained on PyTorch with pixel scaling 1/255.",
100 + )
101 +
102 + parser.add_argument(
103 + "-checkpoint",
104 + "--checkpoint",
105 + type=str,
106 + help="Previous weights to be loaded onto model",
107 + )
108 +
109 + return parser.parse_args()
110 +
111 +
112 +class AugmentingDataGenerator(ImageDataGenerator):
113 + """Wrapper for ImageDataGenerator to return mask & image"""
114 +
115 + def flow_from_directory(self, directory, mask_generator, *args, **kwargs):
116 + generator = super().flow_from_directory(
117 + directory, class_mode=None, *args, **kwargs
118 + )
119 + seed = None if "seed" not in kwargs else kwargs["seed"]
120 + while True:
121 +
122 +            # Get augmented image samples
123 + ori = next(generator)
124 +
125 + # Get masks for each image sample
126 + mask = np.stack(
127 + [mask_generator.sample(seed) for _ in range(ori.shape[0])], axis=0
128 + )
129 +
130 +            # Apply masks to all image samples
131 + masked = deepcopy(ori)
132 + masked[mask == 0] = 1
133 +
134 +            # Yield ([masked, mask], ori) training batches
135 + # print(masked.shape, ori.shape)
136 + gc.collect()
137 + yield [masked, mask], ori
138 +
139 +
140 +# Run script
141 +if __name__ == "__main__":
142 +
143 + # Parse command-line arguments
144 + args = parse_args()
145 +
146 + if args.stage == "finetune" and not args.checkpoint:
147 + raise AttributeError(
148 + "If you are finetuning your model, you must supply a checkpoint file"
149 + )
150 +
151 + # Create training generator
152 + train_datagen = AugmentingDataGenerator(
153 + rotation_range=10,
154 + width_shift_range=0.1,
155 + height_shift_range=0.1,
156 + rescale=1.0 / 255,
157 + horizontal_flip=True,
158 + )
159 + train_generator = train_datagen.flow_from_directory(
160 + args.train,
161 + MaskGenerator(512, 512, 3),
162 + target_size=(512, 512),
163 + batch_size=args.batch_size,
164 + )
165 +
166 + # Create validation generator
167 + val_datagen = AugmentingDataGenerator(rescale=1.0 / 255)
168 + val_generator = val_datagen.flow_from_directory(
169 + args.validation,
170 + MaskGenerator(512, 512, 3),
171 + target_size=(512, 512),
172 + batch_size=args.batch_size,
173 + classes=["val"],
174 + seed=42,
175 + )
176 +
177 + # Create testing generator
178 + test_datagen = AugmentingDataGenerator(rescale=1.0 / 255)
179 + test_generator = test_datagen.flow_from_directory(
180 + args.test,
181 + MaskGenerator(512, 512, 3),
182 + target_size=(512, 512),
183 + batch_size=args.batch_size,
184 + seed=42,
185 + )
186 +
187 +    # Pick out an example to be sent to the test samples folder
188 + test_data = next(test_generator)
189 + (masked, mask), ori = test_data
190 +
191 + def plot_callback(model, path):
192 + """Called at the end of each epoch, displaying our previous test images,
193 + as well as their masked predictions and saving them to disk"""
194 +
195 + # Get samples & Display them
196 + pred_img = model.predict([masked, mask])
197 + pred_time = datetime.datetime.now().strftime("%Y-%m-%d-%H-%M-%S")
198 +
199 + # Clear current output and display test images
200 + for i in range(len(ori)):
201 + _, axes = plt.subplots(1, 3, figsize=(20, 5))
202 + axes[0].imshow(masked[i, :, :, :])
203 + axes[1].imshow(pred_img[i, :, :, :] * 1.0)
204 + axes[2].imshow(ori[i, :, :, :])
205 + axes[0].set_title("Masked Image")
206 + axes[1].set_title("Predicted Image")
207 + axes[2].set_title("Original Image")
208 +
209 +            plt.savefig(os.path.join(path, "img_{}_{}.png".format(i, pred_time)))  # no leading slash, otherwise os.path.join discards path
210 + plt.close()
211 +
212 + # Load the model
213 + if args.vgg_path:
214 + model = PConvUnet(vgg_weights=args.vgg_path)
215 + else:
216 + model = PConvUnet()
217 +
218 + # Loading of checkpoint
219 + if args.checkpoint:
220 + if args.stage == "train":
221 + model.load(args.checkpoint)
222 + elif args.stage == "finetune":
223 + model.load(args.checkpoint, train_bn=False, lr=0.00005)
224 +
225 + # Fit model
226 + model.fit_generator(
227 + train_generator,
228 + steps_per_epoch=10000,
229 + validation_data=val_generator,
230 + validation_steps=1000,
231 + epochs=100,
232 + verbose=0,
233 + callbacks=[
234 + TensorBoard(
235 + log_dir=os.path.join(args.log_path, args.name + "_phase1"),
236 + write_graph=False,
237 + ),
238 + ModelCheckpoint(
239 + os.path.join(
240 + args.log_path,
241 + args.name + "_phase1",
242 + "weights.{epoch:02d}-{loss:.2f}.h5",
243 + ),
244 + monitor="val_loss",
245 + save_best_only=True,
246 + save_weights_only=True,
247 + ),
248 + LambdaCallback(
249 + on_epoch_end=lambda epoch, logs: plot_callback(model, args.test_path)
250 + ),
251 + TQDMCallback(),
252 + ],
253 + )
254 +
1 +h5py==2.8.0
2 +Keras==2.2.4
3 +Keras-Applications==1.0.6
4 +Keras-Preprocessing==1.0.5
5 +keras-tqdm==2.0.1
6 +matplotlib==3.0.2
7 +numpy==1.15.4
8 +pandas==0.23.4
9 +scipy==1.1.0
10 +seaborn==0.9.0
11 +tables==3.4.4
12 +tensorboard==1.12.2
13 +tensorflow==1.12.0
14 +tqdm==4.28.1
...\ No newline at end of file ...\ No newline at end of file