srijaydeshpande committed
Commit 4473449 • Parent(s): 9c3c6ce

Upload 4 files

Files changed:
- Assistance/SingleImageCropper.py (+79, -0)
- Assistance/join_images.py (+61, -0)
- segment2tissue_safron_media.py (+683, -0)
- tools/process.py (+310, -0)
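Taken together, the four scripts form a patch-based pipeline: Assistance/SingleImageCropper.py tiles a large image into overlapping 296x296 patches, tools/process.py prepares data (including side-by-side A|B pairs), segment2tissue_safron_media.py trains or runs the generator, and Assistance/join_images.py stitches generated patches back into a full image. The sketch below is a hypothetical driver showing how the scripts might be chained from Python; every path and size in it is a placeholder, not a value taken from this commit.

# Hypothetical end-to-end driver for the uploaded scripts (all paths are placeholders).
import subprocess

def run(args):
    # Each script is a stand-alone CLI, so we simply shell out to it.
    subprocess.run(["python"] + args, check=True)

# 1. Tile a large test image into 296x296 patches (stride 236).
run(["Assistance/SingleImageCropper.py",
     "--image_path", "data/test/slide.png",
     "--output_dir", "work/patches"])

# 2. Run the trained generator over the patches in test mode.  Depending on how
#    the model was trained, the patches may first need to be combined into
#    paired A|B images with tools/process.py --operation combine.
run(["segment2tissue_safron_media.py",
     "--mode", "test",
     "--input_dir", "work/patches",
     "--output_dir", "work/results",
     "--checkpoint", "checkpoints/safron"])

# 3. Average the overlapping "-outputs" patches back into one image.
run(["Assistance/join_images.py",
     "--patches_dir", "work/results/images",
     "--output_file", "work/stitched.png",
     "--im_height", "2960",
     "--im_width", "2960"])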
Assistance/SingleImageCropper.py
ADDED
@@ -0,0 +1,79 @@
import glob
import os
from PIL import Image
import numpy as np
import time
import PIL
import matplotlib.pyplot as plt
import argparse

patchsize = 296
stride = 236
pad = 0

PIL.Image.MAX_IMAGE_PIXELS = 933120000

def CropImage(image_path, output_dir, pad):
    image_name = os.path.split(image_path)[1].split('.')[0]
    im = Image.open(image_path)

    size = im.size
    # new_size = (size[0]+40, size[1]+40)
    new_size = size

    if (pad):
        new_im = Image.new("RGB", new_size)  # luckily, this is already black!
        new_im.paste(im, ((new_size[0] - size[0]) // 2,
                          (new_size[1] - size[1]) // 2))
        # plt.imshow(new_im)
        # plt.show()
    else:
        new_im = im

    width, height = new_im.size

    x = 0
    y = 0
    right = 0
    bottom = 0

    while (bottom < height):
        while (right < width):
            left = x
            top = y
            right = left + patchsize
            bottom = top + patchsize
            if (right > width):
                offset = right - width
                right -= offset
                left -= offset
            if (bottom > height):
                offset = bottom - height
                bottom -= offset
                top -= offset
            im_crop = new_im.crop((left, top, right, bottom))
            im_crop_name = image_name + "_" + str(left) + "_" + str(top) + ".png"
            output_path = os.path.join(output_dir, im_crop_name)
            im_crop.save(output_path)
            x += stride
        x = 0
        right = 0
        y += stride

start_time = time.time()

parser = argparse.ArgumentParser()
parser.add_argument("--image_path", help="path to image to crop",
                    default=r"F:\Datasets\DigestPath\safron\Benign\test\3\ablation_study_neg_46\neg_46.png")
parser.add_argument("--output_dir", help="path to output folder",
                    default=r"F:\Datasets\DigestPath\safron\Benign\test\3\ablation_study_neg_46\cropped_safron_patchadv")
parser.add_argument("--pad", type=int, default=0, help="pad the image borders")

args = parser.parse_args()

if not os.path.exists(args.output_dir):
    os.makedirs(args.output_dir)

CropImage(args.image_path, args.output_dir, args.pad)

print("--- %s seconds ---" % (time.time() - start_time))
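One detail worth noting in CropImage: when a tile would run past the right or bottom edge of the image, it is shifted back inside the image rather than padded, so the last tile in each row or column overlaps its neighbour by more than the usual patchsize - stride = 60 pixels. A small stand-alone sketch of the tile origins this produces for a hypothetical 600-pixel-wide image:

# Tile origins produced by the shift-back logic for a hypothetical 600-px-wide image
# (patchsize 296, stride 236): the last tile is clamped to width - patchsize.
patchsize, stride, width = 296, 236, 600

xs, x = [], 0
while True:
    left = min(x, width - patchsize)   # shift the last tile back inside the image
    xs.append(left)
    if x + patchsize >= width:
        break
    x += stride

print(xs)   # [0, 236, 304]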
Assistance/join_images.py
ADDED
@@ -0,0 +1,61 @@
import os
import glob
import numpy as np
from PIL import Image
import PIL
import matplotlib.pyplot as plt
import matplotlib
import time
import argparse

PIL.Image.MAX_IMAGE_PIXELS = 933120000

def join_images(input_dir, output_file, height, width):

    start_time = time.time()

    paths = glob.glob(os.path.join(input_dir, "*.png"))

    patch = 256

    image = np.zeros((height, width, 3))
    count_masks = np.zeros((height, width, 3))
    k = 0
    for path in paths:
        if ('outputs' in path):
            imname = os.path.split(path)[1].replace("-outputs", "").split(".")[0]
            imname = imname.split("_")
            y, x = int(imname[-2]), int(imname[-1])
            img = Image.open(path)
            img = np.asarray(img)
            # print("X => ", x, " Y => ", y)
            image[x:x + patch, y:y + patch, :] += img
            count_masks[x:x + patch, y:y + patch, :] += 1.0
            k += 1

    count_masks = count_masks.clip(min=1)

    image = image / count_masks

    image = image / 255.0

    # im = Image.fromarray(image)
    # im.save(output_file)

    matplotlib.image.imsave(output_file, image)

    print("--- %s seconds ---" % (time.time() - start_time))

    print("Done")

parser = argparse.ArgumentParser()
parser.add_argument("--patches_dir", help="path to generated patches to join",
                    default="./tmp/results/images")
parser.add_argument("--output_file", help="path to output file",
                    default="F:/Datasets/DigestPath/safron/test/single/outputs/sample.jpeg")
parser.add_argument("--im_height", type=int, help="image height")
parser.add_argument("--im_width", type=int, help="image width")

args = parser.parse_args()

join_images(args.patches_dir, args.output_file, args.im_height, args.im_width)
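The sizes used across the scripts are consistent, assuming the defaults: SingleImageCropper.py saves 296x296 tiles at stride 236, the generator's initial 41x41 VALID convolution in segment2tissue_safron_media.py reduces each tile to 256x256, and join_images.py pastes those 256x256 outputs back at the saved tile origins, averaging the 20-pixel overlaps via count_masks. A quick arithmetic check of that relationship:

# Sanity check of the default patch geometry shared by the three scripts.
ksize, stride, kernel = 296, 236, 41

gen_out = ksize - kernel + 1      # VALID conv: 296 - 41 + 1 = 256 (generator output per tile)
overlap = gen_out - stride        # 256 - 236 = 20 px shared between neighbouring outputs

assert gen_out == 256 and overlap == 20
print("output per tile:", gen_out, "px; overlap between tiles:", overlap, "px")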
segment2tissue_safron_media.py
ADDED
@@ -0,0 +1,683 @@
from __future__ import absolute_import
from __future__ import division
from __future__ import print_function

import tensorflow.compat.v1 as tf
import numpy as np
import argparse
import os
import json
import glob
import random
import collections
import math
import time
# visualize image
import matplotlib.pyplot as plt

# disable v2 behaviour
tf.disable_v2_behavior()

# enable eager execution
# tf.compat.v1.enable_eager_execution()

parser = argparse.ArgumentParser()
parser.add_argument("--input_dir", help="path to folder containing images")
parser.add_argument("--mode", required=True, choices=["train", "test", "export"])
parser.add_argument("--output_dir", required=True, help="where to put output files")
parser.add_argument("--seed", type=int)
parser.add_argument("--checkpoint", default=None,
                    help="directory with checkpoint to resume training from or use for testing")

parser.add_argument("--max_steps", type=int, help="number of training steps (0 to disable)")
parser.add_argument("--max_epochs", type=int, help="number of training epochs")
parser.add_argument("--summary_freq", type=int, default=10000, help="update summaries every summary_freq steps")
parser.add_argument("--progress_freq", type=int, default=50, help="display progress every progress_freq steps")
parser.add_argument("--trace_freq", type=int, default=0, help="trace execution every trace_freq steps")
parser.add_argument("--display_freq", type=int, default=1000, help="write current training images every display_freq steps")
parser.add_argument("--save_freq", type=int, default=1000, help="save model every save_freq steps, 0 to disable")
parser.add_argument("--separable_conv", action="store_true", help="use separable convolutions in the generator")
parser.add_argument("--aspect_ratio", type=float, default=1.0, help="aspect ratio of output images (width/height)")
parser.add_argument("--batch_size", type=int, default=1, help="number of images in batch")
parser.add_argument("--which_direction", type=str, default="BtoA", choices=["AtoB", "BtoA"])
parser.add_argument("--ngf", type=int, default=64, help="number of generator filters in first conv layer")
parser.add_argument("--ndf", type=int, default=64, help="number of discriminator filters in first conv layer")
parser.add_argument("--scale_size", type=int, default=728, help="scale images to this size before cropping to 256x256")
parser.add_argument("--flip", dest="flip", action="store_true", help="flip images horizontally")
parser.add_argument("--no_flip", dest="flip", action="store_false", help="don't flip images horizontally")
# parser.set_defaults(flip=True)
parser.add_argument("--lr", type=float, default=0.0001, help="initial learning rate for adam")
parser.add_argument("--beta1", type=float, default=0.5, help="momentum term of adam")
parser.add_argument("--l1_weight", type=float, default=100.0, help="weight on L1 term for generator gradient")
parser.add_argument("--gan_weight", type=float, default=1.0, help="weight on GAN term for generator gradient")

# export options
parser.add_argument("--output_filetype", default="png", choices=["png", "jpeg"])
a = parser.parse_args()

EPS = 1e-12

Examples = collections.namedtuple("Examples", "paths, inputs, targets, count, steps_per_epoch")
Model = collections.namedtuple("Model",
                               "outputs, predict_real, predict_fake, discrim_loss, discrim_grads_and_vars, gen_loss_GAN, gen_loss_L1, gen_grads_and_vars, train")

def preprocess(image):
    with tf.name_scope("preprocess"):
        # [0, 1] => [-1, 1]
        return image * 2 - 1


def deprocess(image):
    with tf.name_scope("deprocess"):
        # [-1, 1] => [0, 1]
        return (image + 1) / 2


def discrim_conv(batch_input, out_channels, stride):
    padded_input = tf.pad(batch_input, [[0, 0], [1, 1], [1, 1], [0, 0]], mode="CONSTANT")
    return tf.layers.conv2d(padded_input, out_channels, kernel_size=4, strides=(stride, stride), padding="valid",
                            kernel_initializer=tf.random_normal_initializer(0, 0.02))


def gen_conv(batch_input, out_channels):
    # [batch, in_height, in_width, in_channels] => [batch, out_height, out_width, out_channels]
    initializer = tf.random_normal_initializer(0, 0.02)
    if a.separable_conv:
        return tf.layers.separable_conv2d(batch_input, out_channels, kernel_size=4, strides=(2, 2), padding="same",
                                          depthwise_initializer=initializer, pointwise_initializer=initializer)
    else:
        return tf.layers.conv2d(batch_input, out_channels, kernel_size=4, strides=(2, 2), padding="same",
                                kernel_initializer=initializer)


def gen_deconv(batch_input, out_channels):
    # [batch, in_height, in_width, in_channels] => [batch, out_height, out_width, out_channels]
    initializer = tf.random_normal_initializer(0, 0.02)
    if a.separable_conv:
        _b, h, w, _c = batch_input.shape
        resized_input = tf.image.resize_images(batch_input, [h * 2, w * 2],
                                               method=tf.image.ResizeMethod.NEAREST_NEIGHBOR)
        return tf.layers.separable_conv2d(resized_input, out_channels, kernel_size=4, strides=(1, 1), padding="same",
                                          depthwise_initializer=initializer, pointwise_initializer=initializer)
    else:
        return tf.layers.conv2d_transpose(batch_input, out_channels, kernel_size=4, strides=(2, 2), padding="same",
                                          kernel_initializer=initializer)


def lrelu(x, a):
    with tf.name_scope("lrelu"):
        # adding these together creates the leak part and linear part
        # then cancels them out by subtracting/adding an absolute value term
        # leak: a*x/2 - a*abs(x)/2
        # linear: x/2 + abs(x)/2

        # this block looks like it has 2 inputs on the graph unless we do this
        x = tf.identity(x)
        return (0.5 * (1 + a)) * x + (0.5 * (1 - a)) * tf.abs(x)


def batchnorm(inputs):
    return tf.layers.batch_normalization(inputs, axis=3, epsilon=1e-5, momentum=0.1, training=True,
                                         gamma_initializer=tf.random_normal_initializer(1.0, 0.02))


def check_image(image):
    assertion = tf.assert_equal(tf.shape(image)[-1], 3, message="image must have 3 color channels")
    with tf.control_dependencies([assertion]):
        image = tf.identity(image)

    if image.get_shape().ndims not in (3, 4):
        raise ValueError("image must be either 3 or 4 dimensions")

    # make the last dimension 3 so that you can unstack the colors
    shape = list(image.get_shape())
    shape[-1] = 3
    image.set_shape(shape)
    return image


def load_examples():

    if a.input_dir is None or not os.path.exists(a.input_dir):
        raise Exception("input_dir does not exist")

    input_paths = glob.glob(os.path.join(a.input_dir, "*.jpg"))
    decode = tf.image.decode_jpeg
    if len(input_paths) == 0:
        input_paths = glob.glob(os.path.join(a.input_dir, "*.png"))
        decode = tf.image.decode_png

    if len(input_paths) == 0:
        raise Exception("input_dir contains no image files")

    def get_name(path):
        name, _ = os.path.splitext(os.path.basename(path))
        return name

    # if the image names are numbers, sort by the value rather than asciibetically
    # having sorted inputs means that the outputs are sorted in test mode
    if all(get_name(path).isdigit() for path in input_paths):
        input_paths = sorted(input_paths, key=lambda path: int(get_name(path)))
    else:
        input_paths = sorted(input_paths)

    with tf.name_scope("load_images"):
        path_queue = tf.train.string_input_producer(input_paths, shuffle=a.mode == "train")
        reader = tf.WholeFileReader()
        paths, contents = reader.read(path_queue)
        raw_input = decode(contents)
        raw_input = tf.image.convert_image_dtype(raw_input, dtype=tf.float32)

        assertion = tf.assert_equal(tf.shape(raw_input)[2], 3, message="image does not have 3 channels")

        with tf.control_dependencies([assertion]):
            raw_input = tf.identity(raw_input)

        raw_input.set_shape([None, None, 3])

        # break apart image pair and move to range [-1, 1]
        width = tf.shape(raw_input)[1]  # [height, width, channels]

        a_images = preprocess(raw_input[:, :width // 2, :])
        b_images = preprocess(raw_input[:, width // 2:, :])

    if a.which_direction == "AtoB":
        inputs, targets = [a_images, b_images]
    elif a.which_direction == "BtoA":
        inputs, targets = [b_images, a_images]
    else:
        raise Exception("invalid direction")

    # synchronize seed for image operations so that we do the same operations to both
    # input and output images
    def transform(image):
        r = image
        r.set_shape([a.scale_size, a.scale_size, 3])
        # r = tf.image.resize_images(r, [a.scale_size, a.scale_size], method=tf.image.ResizeMethod.AREA)
        return r

    with tf.name_scope("input_images"):
        input_images = transform(inputs)

    with tf.name_scope("target_images"):
        target_images = transform(targets)

    paths_batch, inputs_batch, targets_batch = tf.train.batch([paths, input_images, target_images],
                                                              batch_size=a.batch_size)

    steps_per_epoch = int(math.ceil(len(input_paths) / a.batch_size))

    return Examples(
        paths=paths_batch,
        inputs=inputs_batch,
        targets=targets_batch,
        count=len(input_paths),
        steps_per_epoch=steps_per_epoch,
    )


def create_generator(generator_inputs, generator_outputs_channels):
    layers = []

    # Add filter to detect edges
    filter_shape = [41, 41, 3, a.ngf]
    with tf.variable_scope("encoder_1"):
        filter = tf.get_variable('edge_detector', filter_shape, initializer=tf.random_normal_initializer(stddev=0.02))
        strides = [1, 1, 1, 1]
        output = tf.nn.conv2d(generator_inputs, filter, strides=strides, padding='VALID')
        output = lrelu(output, 0.2)
        layers.append(output)

    # encoder_1: [batch, 256, 256, in_channels] => [batch, 128, 128, ngf]
    with tf.variable_scope("encoder_1"):
        output = gen_conv(output, a.ngf)
        layers.append(output)

    layer_specs = [
        a.ngf * 2,  # encoder_2: [batch, 128, 128, ngf] => [batch, 64, 64, ngf * 2]
        a.ngf * 4,  # encoder_3: [batch, 64, 64, ngf * 2] => [batch, 32, 32, ngf * 4]
        a.ngf * 8,  # encoder_4: [batch, 32, 32, ngf * 4] => [batch, 16, 16, ngf * 8]
        a.ngf * 8,  # encoder_5: [batch, 16, 16, ngf * 8] => [batch, 8, 8, ngf * 8]
        a.ngf * 8,  # encoder_6: [batch, 8, 8, ngf * 8] => [batch, 4, 4, ngf * 8]
        a.ngf * 8,  # encoder_7: [batch, 4, 4, ngf * 8] => [batch, 2, 2, ngf * 8]
        a.ngf * 8,  # encoder_8: [batch, 2, 2, ngf * 8] => [batch, 1, 1, ngf * 8]
    ]

    for out_channels in layer_specs:
        with tf.variable_scope("encoder_%d" % (len(layers) + 1)):
            rectified = lrelu(layers[-1], 0.2)
            # [batch, in_height, in_width, in_channels] => [batch, in_height/2, in_width/2, out_channels]
            convolved = gen_conv(rectified, out_channels)
            output = batchnorm(convolved)
            layers.append(output)

    layer_specs = [
        (a.ngf * 8, 0.5),  # decoder_8: [batch, 1, 1, ngf * 8] => [batch, 2, 2, ngf * 8 * 2]
        (a.ngf * 8, 0.5),  # decoder_7: [batch, 2, 2, ngf * 8 * 2] => [batch, 4, 4, ngf * 8 * 2]
        (a.ngf * 8, 0.5),  # decoder_6: [batch, 4, 4, ngf * 8 * 2] => [batch, 8, 8, ngf * 8 * 2]
        (a.ngf * 8, 0.0),  # decoder_5: [batch, 8, 8, ngf * 8 * 2] => [batch, 16, 16, ngf * 8 * 2]
        (a.ngf * 4, 0.0),  # decoder_4: [batch, 16, 16, ngf * 8 * 2] => [batch, 32, 32, ngf * 4 * 2]
        (a.ngf * 2, 0.0),  # decoder_3: [batch, 32, 32, ngf * 4 * 2] => [batch, 64, 64, ngf * 2 * 2]
        (a.ngf, 0.0),      # decoder_2: [batch, 64, 64, ngf * 2 * 2] => [batch, 128, 128, ngf * 2]
    ]

    num_encoder_layers = len(layers)
    for decoder_layer, (out_channels, dropout) in enumerate(layer_specs):
        skip_layer = num_encoder_layers - decoder_layer - 1
        with tf.variable_scope("decoder_%d" % (skip_layer + 1)):
            if decoder_layer == 0:
                # first decoder layer doesn't have skip connections
                # since it is directly connected to the skip_layer
                input = layers[-1]
            else:
                input = tf.concat([layers[-1], layers[skip_layer]], axis=3)
                # input = layers[-1]

            rectified = tf.nn.relu(input)
            # [batch, in_height, in_width, in_channels] => [batch, in_height*2, in_width*2, out_channels]
            output = gen_deconv(rectified, out_channels)
            output = batchnorm(output)

            if dropout > 0.0:
                output = tf.nn.dropout(output, keep_prob=1 - dropout)

            layers.append(output)

    # decoder_1: [batch, 128, 128, ngf * 2] => [batch, 256, 256, generator_outputs_channels]
    with tf.variable_scope("decoder_1"):
        input = tf.concat([layers[-1], layers[1]], axis=3)
        rectified = tf.nn.relu(input)
        output = gen_deconv(rectified, generator_outputs_channels)
        output = tf.tanh(output)
        layers.append(output)

    return layers[-1]


ksize_rows = 296
ksize_cols = 296
strides_rows = 236
strides_cols = 236
num_patches = int(a.scale_size / strides_rows)
ksizes = [1, ksize_rows, ksize_cols, 1]
ksizes_output = [1, 256, 256, 1]
strides = [1, strides_rows, strides_cols, 1]
rates = [1, 1, 1, 1]
padding = 'VALID'


def extract_patches(x, ksizes, strides, rates):
    return tf.extract_image_patches(
        x,
        ksizes, strides, rates,
        padding="VALID"
    )


def extract_patches_inverse(x, y):
    _x = tf.zeros_like(x)
    _y = extract_patches(_x, ksizes_output, strides, rates)
    grad = tf.gradients(_y, _x)[0]
    # Divide by grad, to "average" together the overlapping patches
    # otherwise they would simply sum up
    return tf.gradients(_y, _x, grad_ys=y)[0] / grad


def create_model(inputs, targets):

    out_channels = int(targets.get_shape()[-1])

    if (a.mode == "train" or a.scale_size != 296):  # scale_size = 296 while testing

        def create_discriminator(discrim_inputs, discrim_targets):
            n_layers = 5
            layers = []

            # 2x [batch, height, width, in_channels] => [batch, height, width, in_channels * 2]
            input = tf.concat([discrim_inputs, discrim_targets], axis=3)

            # layer_1: [batch, 256, 256, in_channels * 2] => [batch, 128, 128, ndf]
            with tf.variable_scope("layer_1"):
                convolved = discrim_conv(input, a.ndf, stride=2)
                rectified = lrelu(convolved, 0.2)
                layers.append(rectified)

            # layer_2: [batch, 128, 128, ndf] => [batch, 64, 64, ndf * 2]
            # layer_3: [batch, 64, 64, ndf * 2] => [batch, 32, 32, ndf * 4]
            # layer_4: [batch, 32, 32, ndf * 4] => [batch, 31, 31, ndf * 8]
            for i in range(n_layers):
                with tf.variable_scope("layer_%d" % (len(layers) + 1)):
                    out_channels = a.ndf * min(2 ** (i + 1), 8)
                    stride = 1 if i == n_layers - 1 else 2  # last layer here has stride 1
                    convolved = discrim_conv(layers[-1], out_channels, stride=stride)
                    normalized = batchnorm(convolved)
                    rectified = lrelu(normalized, 0.2)
                    layers.append(rectified)

            # layer_5: [batch, 31, 31, ndf * 8] => [batch, 30, 30, 1]
            with tf.variable_scope("layer_%d" % (len(layers) + 1)):
                convolved = discrim_conv(rectified, out_channels=1, stride=1)
                output = tf.sigmoid(convolved)
                layers.append(output)
            print(layers)
            return layers[-1]

        # Pad the inputs so that edge patches also get surrounding context as input to the generator
        # (context around the target patch)
        inputs_bounded = tf.image.pad_to_bounding_box(inputs, 20, 20, a.scale_size + 40, a.scale_size + 40)

        # Extract patches
        with tf.variable_scope("extract_patches"):
            inputs_patches = extract_patches(inputs_bounded, ksizes, strides, rates)

        with tf.name_scope("patches_generator"):
            with tf.variable_scope("generator", reuse=tf.AUTO_REUSE):
                output_patches = []
                patch_size_len = 256 * 256 * 3
                # Get the output for each patch via the same (shared) generator
                for i in range(0, num_patches):
                    for j in range(0, num_patches):
                        patch = inputs_patches[0, i, j]
                        # patch_size_len = int(patch.get_shape()[0])  # defined above
                        # reshape
                        patch = tf.reshape(patch, [ksize_rows, ksize_cols, 3])
                        patch = tf.expand_dims(patch, 0)
                        patch_output = create_generator(patch, out_channels)
                        output_patches.append(tf.reshape(patch_output, [patch_size_len]))
                output_patches = tf.stack(output_patches)
                output_patches = tf.reshape(output_patches, [1, num_patches, num_patches, patch_size_len])

        # Stitch all patches back
        k = tf.constant(0.1, shape=[1, a.scale_size, a.scale_size, 3])
        outputs = extract_patches_inverse(k, output_patches)

        # create two copies of discriminator, one for real pairs and one for fake pairs
        # they share the same underlying variables
        with tf.name_scope("real_discriminator"):
            with tf.variable_scope("discriminator"):
                # 2x [batch, height, width, channels] => [batch, 30, 30, 1]
                predict_real = create_discriminator(inputs, targets)

        with tf.name_scope("fake_discriminator"):
            with tf.variable_scope("discriminator", reuse=True):
                # 2x [batch, height, width, channels] => [batch, 30, 30, 1]
                predict_fake = create_discriminator(inputs, outputs)

        with tf.name_scope("discriminator_loss"):
            # minimizing -tf.log will try to get inputs to 1
            # predict_real => 1
            # predict_fake => 0
            discrim_loss = tf.reduce_mean(-(tf.log(tf.clip_by_value((predict_real + EPS), 1e-12, 1.0)) + tf.log(tf.clip_by_value((1 - predict_fake + EPS), 1e-12, 1.0))))

        with tf.name_scope("generator_loss"):
            # predict_fake => 1
            # abs(targets - outputs) => 0
            gen_loss_GAN = tf.reduce_mean(-tf.log(tf.clip_by_value((predict_fake + EPS), 1e-12, 1.0)))
            gen_loss_L1 = tf.reduce_mean(tf.abs(targets - outputs))
            gen_loss = gen_loss_GAN * a.gan_weight + gen_loss_L1 * a.l1_weight

        with tf.name_scope("discriminator_train"):
            discrim_tvars = [var for var in tf.trainable_variables() if var.name.startswith("discriminator")]
            discrim_optim = tf.train.AdamOptimizer(a.lr, a.beta1)
            discrim_grads_and_vars = discrim_optim.compute_gradients(discrim_loss, var_list=discrim_tvars)
            discrim_train = discrim_optim.apply_gradients(discrim_grads_and_vars)

        with tf.name_scope("generator_train"):
            with tf.control_dependencies([discrim_train]):
                gen_tvars = [var for var in tf.trainable_variables() if var.name.startswith("generator")]
                gen_optim = tf.train.AdamOptimizer(a.lr, a.beta1)
                gen_grads_and_vars = gen_optim.compute_gradients(gen_loss, var_list=gen_tvars)
                gen_train = gen_optim.apply_gradients(gen_grads_and_vars)

        ema = tf.train.ExponentialMovingAverage(decay=0.99)
        update_losses = ema.apply([discrim_loss, gen_loss_GAN, gen_loss_L1])
        global_step = tf.train.get_or_create_global_step()
        incr_global_step = tf.assign(global_step, global_step + 1)
        discrim_loss = ema.average(discrim_loss)
        gen_loss_GAN = ema.average(gen_loss_GAN)
        gen_loss_L1 = ema.average(gen_loss_L1)
        update_ops = [update_losses, incr_global_step, gen_train]
        train = tf.group(update_ops)

    elif (a.mode == "test"):
        predict_real = None
        predict_fake = None
        discrim_loss = None
        discrim_grads_and_vars = None
        gen_loss_GAN = None
        gen_loss_L1 = None
        gen_grads_and_vars = None
        train = None
        with tf.name_scope("patches_generator"):
            with tf.variable_scope("generator", reuse=tf.AUTO_REUSE):
                outputs = create_generator(inputs, out_channels)
    else:
        print("Give correct mode")
        exit(0)

    return Model(
        predict_real=predict_real,
        predict_fake=predict_fake,
        discrim_loss=discrim_loss,
        discrim_grads_and_vars=discrim_grads_and_vars,
        gen_loss_GAN=gen_loss_GAN,
        gen_loss_L1=gen_loss_L1,
        gen_grads_and_vars=gen_grads_and_vars,
        outputs=outputs,
        train=train
    )


def save_images(fetches, step=None):
    image_dir = os.path.join(a.output_dir, "images")
    if not os.path.exists(image_dir):
        os.makedirs(image_dir)
    filesets = []
    for i, in_path in enumerate(fetches["paths"]):
        name, _ = os.path.splitext(os.path.basename(in_path.decode("utf8")))
        fileset = {"name": name, "step": step}
        for kind in ["inputs", "outputs", "targets"]:
            filename = name + "-" + kind + ".png"
            if step is not None:
                filename = "%08d-%s" % (step, filename)
            fileset[kind] = filename
            out_path = os.path.join(image_dir, filename)
            contents = fetches[kind][i]
            with open(out_path, "wb") as f:
                f.write(contents)
        filesets.append(fileset)
    return filesets


def append_index(filesets, step=False):
    index_path = os.path.join(a.output_dir, "index.html")
    if os.path.exists(index_path):
        index = open(index_path, "a")
    else:
        index = open(index_path, "w")
        index.write("<html><body><table><tr>")
        if step:
            index.write("<th>step</th>")
        index.write("<th>name</th><th>input</th><th>output</th><th>target</th></tr>")

    for fileset in filesets:
        index.write("<tr>")

        if step:
            index.write("<td>%d</td>" % fileset["step"])
        index.write("<td>%s</td>" % fileset["name"])

        for kind in ["inputs", "outputs", "targets"]:
            index.write("<td><img src='images/%s'></td>" % fileset[kind])

        index.write("</tr>")
    return index_path


def main():
    if a.seed is None:
        a.seed = random.randint(0, 2 ** 31 - 1)

    tf.set_random_seed(a.seed)
    np.random.seed(a.seed)
    random.seed(a.seed)

    if not os.path.exists(a.output_dir):
        os.makedirs(a.output_dir)

    if a.mode == "test" or a.mode == "export":
        if a.checkpoint is None:
            raise Exception("checkpoint required for test mode")

        # load some options from the checkpoint
        options = {"which_direction", "ngf", "ndf"}
        with open(os.path.join(a.checkpoint, "options.json")) as f:
            for key, val in json.loads(f.read()).items():
                if key in options:
                    print("loaded", key, "=", val)
                    setattr(a, key, val)
        # disable these features in test mode
        # a.scale_size = CROP_SIZE
        a.flip = False

    for k, v in a._get_kwargs():
        print(k, "=", v)

    with open(os.path.join(a.output_dir, "options.json"), "w") as f:
        f.write(json.dumps(vars(a), sort_keys=True, indent=4))

    examples = load_examples()

    # inputs and targets are [batch_size, height, width, channels]
    model = create_model(examples.inputs, examples.targets)

    inputs = deprocess(examples.inputs)
    targets = deprocess(examples.targets)

    outputs = deprocess(model.outputs)

    def convert(image):
        return tf.image.convert_image_dtype(image, dtype=tf.uint8, saturate=True)

    # reverse any processing on images so they can be written to disk or displayed to user
    with tf.name_scope("convert_inputs"):
        converted_inputs = convert(inputs)

    with tf.name_scope("convert_targets"):
        converted_targets = convert(targets)

    with tf.name_scope("convert_outputs"):
        converted_outputs = convert(outputs)

    with tf.name_scope("encode_images"):
        display_fetches = {
            "paths": examples.paths,
            "inputs": tf.map_fn(tf.image.encode_png, converted_inputs, dtype=tf.string, name="input_pngs"),
            "targets": tf.map_fn(tf.image.encode_png, converted_targets, dtype=tf.string, name="target_pngs"),
            "outputs": tf.map_fn(tf.image.encode_png, converted_outputs, dtype=tf.string, name="output_pngs"),
        }

    with tf.name_scope("parameter_count"):
        parameter_count = tf.reduce_sum([tf.reduce_prod(tf.shape(v)) for v in tf.trainable_variables()])

    saver = tf.train.Saver(max_to_keep=1)

    logdir = a.output_dir if (a.trace_freq > 0 or a.summary_freq > 0) else None
    sv = tf.train.Supervisor(logdir=logdir, save_summaries_secs=0, saver=None)

    with sv.managed_session() as sess:
        print("parameter_count =", sess.run(parameter_count))

        if a.checkpoint is not None:
            print("loading model from checkpoint")
            print(a.checkpoint)
            checkpoint = tf.train.latest_checkpoint(a.checkpoint)
            saver.restore(sess, checkpoint)

        max_steps = 2 ** 32

        if a.max_epochs is not None:
            max_steps = examples.steps_per_epoch * a.max_epochs
        if a.max_steps is not None:
            max_steps = a.max_steps

        if a.mode == "test":
            # testing
            # at most, process the test data once
            start = time.time()
            max_steps = min(examples.steps_per_epoch, max_steps)
            for step in range(max_steps):
                results = sess.run(display_fetches)
                filesets = save_images(results)
                for i, f in enumerate(filesets):
                    print("evaluated image", f["name"])
                index_path = append_index(filesets)
            print("wrote index at", index_path)
            print("rate", (time.time() - start) / max_steps)
        else:
            # training
            start = time.time()

            for step in range(max_steps):
                def should(freq):
                    return freq > 0 and ((step + 1) % freq == 0 or step == max_steps - 1)

                options = None
                run_metadata = None
                if should(a.trace_freq):
                    options = tf.RunOptions(trace_level=tf.RunOptions.FULL_TRACE)
                    run_metadata = tf.RunMetadata()

                fetches = {
                    "train": model.train,
                    "global_step": sv.global_step,
                }

                if should(a.progress_freq):
                    fetches["discrim_loss"] = model.discrim_loss
                    fetches["gen_loss_GAN"] = model.gen_loss_GAN
                    fetches["gen_loss_L1"] = model.gen_loss_L1

                if should(a.summary_freq):
                    fetches["summary"] = sv.summary_op

                if should(a.display_freq):
                    fetches["display"] = display_fetches

                results = sess.run(fetches, options=options, run_metadata=run_metadata)

                if should(a.summary_freq):
                    print("recording summary")
                    sv.summary_writer.add_summary(results["summary"], results["global_step"])

                if should(a.display_freq):
                    print("saving display images")
                    filesets = save_images(results["display"], step=results["global_step"])
                    append_index(filesets, step=True)

                if should(a.trace_freq):
                    print("recording trace")
                    sv.summary_writer.add_run_metadata(run_metadata, "step_%d" % results["global_step"])

                if should(a.progress_freq):
                    # global_step will have the correct step count if we resume from a checkpoint
                    train_epoch = math.ceil(results["global_step"] / examples.steps_per_epoch)
                    train_step = (results["global_step"] - 1) % examples.steps_per_epoch + 1
                    rate = (step + 1) * a.batch_size / (time.time() - start)
                    remaining = (max_steps - step) * a.batch_size / rate
                    print("progress epoch %d step %d image/sec %0.1f remaining %dm" % (
                        train_epoch, train_step, rate, remaining / 60))
                    print("discrim_loss", results["discrim_loss"])
                    print("gen_loss_GAN", results["gen_loss_GAN"])
                    print("gen_loss_L1", results["gen_loss_L1"])

                if should(a.save_freq):
                    print("saving model")
                    saver.save(sess, os.path.join(a.output_dir, "model"), global_step=sv.global_step)

                if sv.should_stop():
                    break


main()
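For reference, the model script is driven entirely by its argparse flags. A hypothetical training invocation might look like the following; the paths and epoch count are placeholders, and the input directory must contain side-by-side A|B image pairs whose total width is twice --scale_size:

# Hypothetical training run; adjust paths and hyper-parameters to your data.
import subprocess

subprocess.run(["python", "segment2tissue_safron_media.py",
                "--mode", "train",
                "--input_dir", "data/train_pairs",      # paired A|B images (width = 2 * scale_size)
                "--output_dir", "checkpoints/safron",
                "--which_direction", "BtoA",            # BtoA: right half of each pair is the input, left half the target
                "--scale_size", "728",
                "--max_epochs", "200"],
               check=True)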
tools/process.py
ADDED
@@ -0,0 +1,310 @@
from __future__ import absolute_import
from __future__ import division
from __future__ import print_function

import tensorflow.compat.v1 as tf
tf.disable_v2_behavior()

import argparse
import os
import tempfile
import subprocess
# import tensorflow as tf
import numpy as np
import tfimage as im
import threading
import time
import multiprocessing


edge_pool = None


parser = argparse.ArgumentParser()
parser.add_argument("--input_dir", required=True, help="path to folder containing images")
parser.add_argument("--output_dir", required=True, help="output path")
parser.add_argument("--operation", required=True, choices=["grayscale", "resize", "blank", "combine", "edges"])
parser.add_argument("--workers", type=int, default=1, help="number of workers")
# resize
parser.add_argument("--pad", action="store_true", help="pad instead of crop for resize operation")
parser.add_argument("--size", type=int, default=256, help="size to use for resize operation")
# combine
parser.add_argument("--b_dir", type=str, help="path to folder containing B images for combine operation")
a = parser.parse_args()


def resize(src):
    height, width, _ = src.shape
    dst = src
    if height != width:
        if a.pad:
            size = max(height, width)
            # pad to correct ratio
            oh = (size - height) // 2
            ow = (size - width) // 2
            dst = im.pad(image=dst, offset_height=oh, offset_width=ow, target_height=size, target_width=size)
        else:
            # crop to correct ratio
            size = min(height, width)
            oh = (height - size) // 2
            ow = (width - size) // 2
            dst = im.crop(image=dst, offset_height=oh, offset_width=ow, target_height=size, target_width=size)

    assert (dst.shape[0] == dst.shape[1])

    size, _, _ = dst.shape
    if size > a.size:
        dst = im.downscale(images=dst, size=[a.size, a.size])
    elif size < a.size:
        dst = im.upscale(images=dst, size=[a.size, a.size])
    return dst


def blank(src):
    height, width, _ = src.shape
    if height != width:
        raise Exception("non-square image")

    image_size = width
    size = int(image_size * 0.3)
    offset = int(image_size / 2 - size / 2)

    dst = src
    dst[offset:offset + size, offset:offset + size, :] = np.ones([size, size, 3])
    return dst


def combine(src, src_path):
    if a.b_dir is None:
        raise Exception("missing b_dir")

    # find corresponding file in b_dir, could have a different extension
    basename, _ = os.path.splitext(os.path.basename(src_path))
    for ext in [".png", ".jpg"]:
        sibling_path = os.path.join(a.b_dir, basename + ext)
        if os.path.exists(sibling_path):
            sibling = im.load(sibling_path)
            break
    else:
        raise Exception("could not find sibling image for " + src_path)

    # make sure that dimensions are correct
    height, width, _ = src.shape
    if height != sibling.shape[0] or width != sibling.shape[1]:
        raise Exception("differing sizes")

    # convert both images to RGB if necessary
    if src.shape[2] == 1:
        src = im.grayscale_to_rgb(images=src)

    if sibling.shape[2] == 1:
        sibling = im.grayscale_to_rgb(images=sibling)

    # remove alpha channel
    if src.shape[2] == 4:
        src = src[:, :, :3]

    if sibling.shape[2] == 4:
        sibling = sibling[:, :, :3]

    return np.concatenate([src, sibling], axis=1)


def grayscale(src):
    return im.grayscale_to_rgb(images=im.rgb_to_grayscale(images=src))


net = None
def run_caffe(src):
    # lazy load caffe and create net
    global net
    if net is None:
        # don't require caffe unless we are doing edge detection
        os.environ["GLOG_minloglevel"] = "2"  # disable logging from caffe
        import caffe
        # using this requires using the docker image or assembling a bunch of dependencies
        # and then changing these hardcoded paths
        net = caffe.Net("/opt/caffe/examples/hed/deploy.prototxt", "/opt/caffe/hed_pretrained_bsds.caffemodel", caffe.TEST)

    net.blobs["data"].reshape(1, *src.shape)
    net.blobs["data"].data[...] = src
    net.forward()
    return net.blobs["sigmoid-fuse"].data[0][0, :, :]


def edges(src):
    # based on https://github.com/phillipi/pix2pix/blob/master/scripts/edges/batch_hed.py
    # and https://github.com/phillipi/pix2pix/blob/master/scripts/edges/PostprocessHED.m
    import scipy.io
    src = src * 255
    border = 128  # put a padding around images since edge detection seems to detect edge of image
    src = src[:, :, :3]  # remove alpha channel if present
    src = np.pad(src, ((border, border), (border, border), (0, 0)), "reflect")
    src = src[:, :, ::-1]
    src -= np.array((104.00698793, 116.66876762, 122.67891434))
    src = src.transpose((2, 0, 1))

    # [height, width, channels] => [batch, channel, height, width]
    fuse = edge_pool.apply(run_caffe, [src])
    fuse = fuse[border:-border, border:-border]

    with tempfile.NamedTemporaryFile(suffix=".png") as png_file, tempfile.NamedTemporaryFile(suffix=".mat") as mat_file:
        scipy.io.savemat(mat_file.name, {"input": fuse})

        octave_code = r"""
E = 1-load(input_path).input;
E = imresize(E, [image_width,image_width]);
E = 1 - E;
E = single(E);
[Ox, Oy] = gradient(convTri(E, 4), 1);
[Oxx, ~] = gradient(Ox, 1);
[Oxy, Oyy] = gradient(Oy, 1);
O = mod(atan(Oyy .* sign(-Oxy) ./ (Oxx + 1e-5)), pi);
E = edgesNmsMex(E, O, 1, 5, 1.01, 1);
E = double(E >= max(eps, threshold));
E = bwmorph(E, 'thin', inf);
E = bwareaopen(E, small_edge);
E = 1 - E;
E = uint8(E * 255);
imwrite(E, output_path);
"""

        config = dict(
            input_path="'%s'" % mat_file.name,
            output_path="'%s'" % png_file.name,
            image_width=256,
            threshold=25.0 / 255.0,
            small_edge=5,
        )

        args = ["octave"]
        for k, v in config.items():
            args.extend(["--eval", "%s=%s;" % (k, v)])

        args.extend(["--eval", octave_code])
        try:
            subprocess.check_output(args, stderr=subprocess.STDOUT)
        except subprocess.CalledProcessError as e:
            print("octave failed")
            print("returncode:", e.returncode)
            print("output:", e.output)
            raise
        return im.load(png_file.name)


def process(src_path, dst_path):
    src = im.load(src_path)

    if a.operation == "grayscale":
        dst = grayscale(src)
    elif a.operation == "resize":
        dst = resize(src)
    elif a.operation == "blank":
        dst = blank(src)
    elif a.operation == "combine":
        dst = combine(src, src_path)
    elif a.operation == "edges":
        dst = edges(src)
    else:
        raise Exception("invalid operation")

    im.save(dst, dst_path)


complete_lock = threading.Lock()
start = None
num_complete = 0
total = 0

def complete():
    global num_complete, rate, last_complete

    with complete_lock:
        num_complete += 1
        now = time.time()
        elapsed = now - start
        rate = num_complete / elapsed
        if rate > 0:
            remaining = (total - num_complete) / rate
        else:
            remaining = 0

        print("%d/%d complete %0.2f images/sec %dm%ds elapsed %dm%ds remaining" % (num_complete, total, rate, elapsed // 60, elapsed % 60, remaining // 60, remaining % 60))

        last_complete = now


def main():
    if not os.path.exists(a.output_dir):
        os.makedirs(a.output_dir)

    src_paths = []
    dst_paths = []

    skipped = 0
    for src_path in im.find(a.input_dir):
        name, _ = os.path.splitext(os.path.basename(src_path))
        dst_path = os.path.join(a.output_dir, name + ".png")
        if os.path.exists(dst_path):
            skipped += 1
        else:
            src_paths.append(src_path)
            dst_paths.append(dst_path)

    print("skipping %d files that already exist" % skipped)

    global total
    total = len(src_paths)

    print("processing %d files" % total)

    global start
    start = time.time()

    if a.operation == "edges":
        # use a multiprocessing pool for this operation so it can use multiple CPUs
        # create the pool before we launch processing threads
        global edge_pool
        edge_pool = multiprocessing.Pool(a.workers)

    if a.workers == 1:
        with tf.Session() as sess:
            for src_path, dst_path in zip(src_paths, dst_paths):
                process(src_path, dst_path)
                complete()
    else:
        queue = tf.train.input_producer(zip(src_paths, dst_paths), shuffle=False, num_epochs=1)
        dequeue_op = queue.dequeue()

        def worker(coord):
            with sess.as_default():
                while not coord.should_stop():
                    try:
                        src_path, dst_path = sess.run(dequeue_op)
                    except tf.errors.OutOfRangeError:
                        coord.request_stop()
                        break

                    process(src_path, dst_path)
                    complete()

        # init epoch counter for the queue
        local_init_op = tf.local_variables_initializer()
        with tf.Session() as sess:
            sess.run(local_init_op)

            coord = tf.train.Coordinator()
            threads = tf.train.start_queue_runners(coord=coord)
            for i in range(a.workers):
                t = threading.Thread(target=worker, args=(coord,))
                t.start()
                threads.append(t)

            try:
                coord.join(threads)
            except KeyboardInterrupt:
                coord.request_stop()
                coord.join(threads)

main()
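tools/process.py is the pix2pix-style data-preparation helper; its combine operation builds the side-by-side A|B pairs that load_examples() in the main script later splits down the middle. A minimal sketch of how it might be invoked (folder names are placeholders; the files in --input_dir and --b_dir must share base names and dimensions):

# Hypothetical data-preparation step: concatenate matching images from two
# folders into single A|B pairs for training.
import subprocess

subprocess.run(["python", "tools/process.py",
                "--operation", "combine",
                "--input_dir", "data/A",          # left half of each output pair
                "--b_dir", "data/B",              # right half, matched by file name
                "--output_dir", "data/train_pairs"],
               check=True)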