Spaces:
Runtime error
Runtime error
| # Copyright 2017 Google Inc. | |
| # | |
| # Licensed under the Apache License, Version 2.0 (the "License"); | |
| # you may not use this file except in compliance with the License. | |
| # You may obtain a copy of the License at | |
| # | |
| # http://www.apache.org/licenses/LICENSE-2.0 | |
| # | |
| # Unless required by applicable law or agreed to in writing, software | |
| # distributed under the License is distributed on an "AS IS" BASIS, | |
| # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. | |
| # See the License for the specific language governing permissions and | |
| # limitations under the License. | |
| """Utilities for PixelDA model.""" | |
| import math | |
| # Dependency imports | |
| import tensorflow as tf | |
| slim = tf.contrib.slim | |
| flags = tf.app.flags | |
| FLAGS = flags.FLAGS | |
| def remove_depth(images): | |
| """Takes a batch of images and remove depth channel if present.""" | |
| if images.shape.as_list()[-1] == 4: | |
| return images[:, :, :, 0:3] | |
| return images | |
| def image_grid(images, max_grid_size=4): | |
| """Given images and N, return first N^2 images as an NxN image grid. | |
| Args: | |
| images: a `Tensor` of size [batch_size, height, width, channels] | |
| max_grid_size: Maximum image grid height/width | |
| Returns: | |
| Single image batch, of dim [1, h*n, w*n, c] | |
| """ | |
| images = remove_depth(images) | |
| batch_size = images.shape.as_list()[0] | |
| grid_size = min(int(math.sqrt(batch_size)), max_grid_size) | |
| assert images.shape.as_list()[0] >= grid_size * grid_size | |
| # If we have a depth channel | |
| if images.shape.as_list()[-1] == 4: | |
| images = images[:grid_size * grid_size, :, :, 0:3] | |
| depth = tf.image.grayscale_to_rgb(images[:grid_size * grid_size, :, :, 3:4]) | |
| images = tf.reshape(images, [-1, images.shape.as_list()[2], 3]) | |
| split = tf.split(0, grid_size, images) | |
| depth = tf.reshape(depth, [-1, images.shape.as_list()[2], 3]) | |
| depth_split = tf.split(0, grid_size, depth) | |
| grid = tf.concat(split + depth_split, 1) | |
| return tf.expand_dims(grid, 0) | |
| else: | |
| images = images[:grid_size * grid_size, :, :, :] | |
| images = tf.reshape( | |
| images, [-1, images.shape.as_list()[2], | |
| images.shape.as_list()[3]]) | |
| split = tf.split(images, grid_size, 0) | |
| grid = tf.concat(split, 1) | |
| return tf.expand_dims(grid, 0) | |
| def source_and_output_image_grid(output_images, | |
| source_images=None, | |
| max_grid_size=4): | |
| """Create NxN image grid for output, concatenate source grid if given. | |
| Makes grid out of output_images and, if provided, source_images, and | |
| concatenates them. | |
| Args: | |
| output_images: [batch_size, h, w, c] tensor of images | |
| source_images: optional[batch_size, h, w, c] tensor of images | |
| max_grid_size: Image grid height/width | |
| Returns: | |
| Single image batch, of dim [1, h*n, w*n, c] | |
| """ | |
| output_grid = image_grid(output_images, max_grid_size=max_grid_size) | |
| if source_images is not None: | |
| source_grid = image_grid(source_images, max_grid_size=max_grid_size) | |
| # Make sure they have the same # of channels before concat | |
| # Assumes either 1 or 3 channels | |
| if output_grid.shape.as_list()[-1] != source_grid.shape.as_list()[-1]: | |
| if output_grid.shape.as_list()[-1] == 1: | |
| output_grid = tf.tile(output_grid, [1, 1, 1, 3]) | |
| if source_grid.shape.as_list()[-1] == 1: | |
| source_grid = tf.tile(source_grid, [1, 1, 1, 3]) | |
| output_grid = tf.concat([output_grid, source_grid], 1) | |
| return output_grid | |
| def summarize_model(end_points): | |
| """Summarizes the given model via its end_points. | |
| Args: | |
| end_points: A dictionary of end_point names to `Tensor`. | |
| """ | |
| tf.summary.histogram('domain_logits_transferred', | |
| tf.sigmoid(end_points['transferred_domain_logits'])) | |
| tf.summary.histogram('domain_logits_target', | |
| tf.sigmoid(end_points['target_domain_logits'])) | |
| def summarize_transferred_grid(transferred_images, | |
| source_images=None, | |
| name='Transferred'): | |
| """Produces a visual grid summarization of the image transferrence. | |
| Args: | |
| transferred_images: A `Tensor` of size [batch_size, height, width, c]. | |
| source_images: A `Tensor` of size [batch_size, height, width, c]. | |
| name: Name to use in summary name | |
| """ | |
| if source_images is not None: | |
| grid = source_and_output_image_grid(transferred_images, source_images) | |
| else: | |
| grid = image_grid(transferred_images) | |
| tf.summary.image('%s_Images_Grid' % name, grid, max_outputs=1) | |
| def summarize_transferred(source_images, | |
| transferred_images, | |
| max_images=20, | |
| name='Transferred'): | |
| """Produces a visual summary of the image transferrence. | |
| This summary displays the source image, transferred image, and a grayscale | |
| difference image which highlights the differences between input and output. | |
| Args: | |
| source_images: A `Tensor` of size [batch_size, height, width, channels]. | |
| transferred_images: A `Tensor` of size [batch_size, height, width, channels] | |
| max_images: The number of images to show. | |
| name: Name to use in summary name | |
| Raises: | |
| ValueError: If number of channels in source and target are incompatible | |
| """ | |
| source_channels = source_images.shape.as_list()[-1] | |
| transferred_channels = transferred_images.shape.as_list()[-1] | |
| if source_channels < transferred_channels: | |
| if source_channels != 1: | |
| raise ValueError( | |
| 'Source must be 1 channel or same # of channels as target') | |
| source_images = tf.tile(source_images, [1, 1, 1, transferred_channels]) | |
| if transferred_channels < source_channels: | |
| if transferred_channels != 1: | |
| raise ValueError( | |
| 'Target must be 1 channel or same # of channels as source') | |
| transferred_images = tf.tile(transferred_images, [1, 1, 1, source_channels]) | |
| diffs = tf.abs(source_images - transferred_images) | |
| diffs = tf.reduce_max(diffs, reduction_indices=[3], keep_dims=True) | |
| diffs = tf.tile(diffs, [1, 1, 1, max(source_channels, transferred_channels)]) | |
| transition_images = tf.concat([ | |
| source_images, | |
| transferred_images, | |
| diffs, | |
| ], 2) | |
| tf.summary.image( | |
| '%s_difference' % name, transition_images, max_outputs=max_images) | |
| def summaries_color_distributions(images, name): | |
| """Produces a histogram of the color distributions of the images. | |
| Args: | |
| images: A `Tensor` of size [batch_size, height, width, 3]. | |
| name: The name of the images being summarized. | |
| """ | |
| tf.summary.histogram('color_values/%s' % name, images) | |
| def summarize_images(images, name): | |
| """Produces a visual summary of the given images. | |
| Args: | |
| images: A `Tensor` of size [batch_size, height, width, 3]. | |
| name: The name of the images being summarized. | |
| """ | |
| grid = image_grid(images) | |
| tf.summary.image('%s_Images' % name, grid, max_outputs=1) | |