# Large resolution style transfer
# -*- coding: utf-8 -*-
# style_transfer.py <content> <style>
# CUDA_VISIBLE_DEVICES=3 python style_transfer.py walk.jpg kandinsky.jpg
import sys
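# A minimal usage guard (not in the original gist): fail fast with a
# usage message instead of an IndexError when arguments are missing.
if len(sys.argv) != 3:
    sys.exit("usage: python style_transfer.py <content> <style>")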
content_path = sys.argv[1]
style_path = sys.argv[2]
max_dim = 1024
total_variation_weight = 30
# style_weight depends on the output resolution; values used at different sizes:
#   150px:  style_weight = 1e-2
#   1024px: style_weight = 1e-1
#   3000px: style_weight = 1
style_weight = 1e-1
content_weight = 1e4
"""style_transfer.ipynb
Automatically generated by Colaboratory.
Original file is located at
https://colab.research.google.com/github/tensorflow/docs/blob/master/site/en/tutorials/generative/style_transfer.ipynb
##### Copyright 2018 The TensorFlow Authors.
"""
#@title Licensed under the Apache License, Version 2.0 (the "License");
# you may not use this file except in compliance with the License.
# You may obtain a copy of the License at
#
# https://www.apache.org/licenses/LICENSE-2.0
#
# Unless required by applicable law or agreed to in writing, software
# distributed under the License is distributed on an "AS IS" BASIS,
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
# See the License for the specific language governing permissions and
# limitations under the License.
"""# Neural style transfer
This tutorial uses deep learning to compose one image in the style of another image (ever wish you could paint like Picasso or Van Gogh?). This is known as *neural style transfer* and the technique is outlined in <a href="https://arxiv.org/abs/1508.06576" class="external">A Neural Algorithm of Artistic Style</a> (Gatys et al.).
Note: This tutorial demonstrates the original style-transfer algorithm. It optimizes the image content to a particular style. Modern approaches train a model to generate the stylized image directly (similar to [cyclegan](cyclegan.ipynb)). This approach is much faster (up to 1000x). A pretrained [Arbitrary Image Stylization module](https://colab.research.google.com/github/tensorflow/hub/blob/master/examples/colab/tf2_arbitrary_image_stylization.ipynb) is available in [TensorFlow Hub](https://tensorflow.org/hub), and for [TensorFlow Lite](https://www.tensorflow.org/lite/models/style_transfer/overview).
Neural style transfer is an optimization technique used to take two images—a *content* image and a *style reference* image (such as an artwork by a famous painter)—and blend them together so the output image looks like the content image, but “painted” in the style of the style reference image.
This is implemented by optimizing the output image to match the content statistics of the content image and the style statistics of the style reference image. These statistics are extracted from the images using a convolutional network.
For example, let’s take an image of this dog and Wassily Kandinsky's Composition 7:
<img src="https://storage.googleapis.com/download.tensorflow.org/example_images/YellowLabradorLooking_new.jpg" width="500px"/>
[Yellow Labrador Looking](https://commons.wikimedia.org/wiki/File:YellowLabradorLooking_new.jpg), from Wikimedia Commons
<img src="https://storage.googleapis.com/download.tensorflow.org/example_images/Vassily_Kandinsky%2C_1913_-_Composition_7.jpg" width="500px"/>
Now, what would it look like if Kandinsky decided to paint the picture of this dog exclusively in this style? Something like this?
<img src="https://tensorflow.org/tutorials/generative/images/stylized-image.png" style="width: 500px;"/>
## Setup
### Import and configure modules
"""
import tensorflow as tf
import IPython.display as display
import matplotlib.pyplot as plt
import matplotlib as mpl
mpl.rcParams['figure.figsize'] = (12,12)
mpl.rcParams['axes.grid'] = False
import numpy as np
import PIL.Image
import time
import functools
def tensor_to_image(tensor):
    tensor = tensor*255
    tensor = np.array(tensor, dtype=np.uint8)
    if np.ndim(tensor) > 3:
        assert tensor.shape[0] == 1
        tensor = tensor[0]
    return PIL.Image.fromarray(tensor)
"""## Visualize the input
Define a function to load an image and limit its maximum dimension to `max_dim` pixels (set at the top of the script).
"""
def load_img(path_to_img, max_dim):
    img = tf.io.read_file(path_to_img)
    img = tf.image.decode_image(img, channels=3)
    img = tf.image.convert_image_dtype(img, tf.float32)

    shape = tf.cast(tf.shape(img)[:-1], tf.float32)
    long_dim = max(shape)
    scale = max_dim / long_dim

    new_shape = tf.cast(shape * scale, tf.int32)

    img = tf.image.resize(img, new_shape)
    img = img[tf.newaxis, :]
    return img
content_image = load_img(content_path, max_dim)
style_image = load_img(style_path, max_dim)
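# Quick sanity check (illustrative, not in the original gist): both images
# should load as batched float32 tensors with values in [0, 1].
print("content image:", content_image.shape, "style image:", style_image.shape)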
"""## Fast Style Transfer using TF-Hub
This tutorial demonstrates the original style-transfer algorithm, which optimizes the image content to a particular style. Before getting into the details, let's see how the [TensorFlow Hub](https://tensorflow.org/hub) module does:
"""
"""## Define content and style representations
Use the intermediate layers of the model to get the *content* and *style* representations of the image. Starting from the network's input layer, the first few layer activations represent low-level features like edges and textures. As you step through the network, the final few layers represent higher-level features—object parts like *wheels* or *eyes*. In this case, you are using the VGG19 network architecture, a pretrained image classification network. These intermediate layers are necessary to define the representation of content and style from the images. For an input image, try to match the corresponding style and content target representations at these intermediate layers.
Load a [VGG19](https://keras.io/applications/#vgg19) and run it on our image to check that it's being used correctly:
"""
x = tf.keras.applications.vgg19.preprocess_input(content_image*255)
x = tf.image.resize(x, (224, 224))
vgg = tf.keras.applications.VGG19(include_top=True, weights='imagenet')
prediction_probabilities = vgg(x)
print(prediction_probabilities.shape)
predicted_top_5 = tf.keras.applications.vgg19.decode_predictions(prediction_probabilities.numpy())[0]
print([(class_name, prob) for (number, class_name, prob) in predicted_top_5])
"""Now load a `VGG19` without the classification head, and list the layer names"""
vgg = tf.keras.applications.VGG19(include_top=False, weights='imagenet')
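# List the layer names, as promised above, so the content and style layers
# below can be chosen by name.
for layer in vgg.layers:
    print(layer.name)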
"""Choose intermediate layers from the network to represent the style and content of the image:"""
content_layers = ['block5_conv2']
style_layers = ['block1_conv1',
                'block2_conv1',
                'block3_conv1',
                'block4_conv1',
                'block5_conv1']
num_content_layers = len(content_layers)
num_style_layers = len(style_layers)
"""#### Intermediate layers for style and content
So why do these intermediate outputs within our pretrained image classification network allow us to define style and content representations?
At a high level, in order for a network to perform image classification (which this network has been trained to do), it must understand the image. This requires taking the raw image as input pixels and building an internal representation that converts the raw image pixels into a complex understanding of the features present within the image.
This is also a reason why convolutional neural networks are able to generalize well: they’re able to capture the invariances and defining features within classes (e.g. cats vs. dogs) that are agnostic to background noise and other nuisances. Thus, somewhere between where the raw image is fed into the model and the output classification label, the model serves as a complex feature extractor. By accessing intermediate layers of the model, you're able to describe the content and style of input images.
## Build the model
The networks in `tf.keras.applications` are designed so you can easily extract the intermediate layer values using the Keras functional API.
To define a model using the functional API, specify the inputs and outputs:
`model = Model(inputs, outputs)`
This following function builds a VGG19 model that returns a list of intermediate layer outputs:
"""
def vgg_layers(layer_names):
    """Creates a VGG model that returns a list of intermediate output values."""
    # Load our model. Load pretrained VGG, trained on imagenet data
    vgg = tf.keras.applications.VGG19(include_top=False, weights='imagenet')
    vgg.trainable = False

    outputs = [vgg.get_layer(name).output for name in layer_names]

    model = tf.keras.Model([vgg.input], outputs)
    return model
"""And to create the model:"""
style_extractor = vgg_layers(style_layers)
style_outputs = style_extractor(style_image*255)
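"""Look at the statistics of each layer's output (a small diagnostic in the spirit of the original tutorial):"""
for name, output in zip(style_layers, style_outputs):
    print(name)
    print("  shape: ", output.numpy().shape)
    print("  min: ", output.numpy().min())
    print("  max: ", output.numpy().max())
    print("  mean: ", output.numpy().mean())
    print()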
"""## Calculate style
The content of an image is represented by the values of the intermediate feature maps.
It turns out, the style of an image can be described by the means and correlations across the different feature maps. Calculate a Gram matrix that includes this information by taking the outer product of the feature vector with itself at each location, and averaging that outer product over all locations. This Gram matrix can be calculated for a particular layer as:
$$G^l_{cd} = \frac{\sum_{ij} F^l_{ijc}(x)F^l_{ijd}(x)}{IJ}$$
This can be implemented concisely using the `tf.linalg.einsum` function:
"""
def gram_matrix(input_tensor):
    result = tf.linalg.einsum('bijc,bijd->bcd', input_tensor, input_tensor)
    input_shape = tf.shape(input_tensor)
    num_locations = tf.cast(input_shape[1]*input_shape[2], tf.float32)
    return result/(num_locations)
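"""For intuition, the same Gram matrix can be computed without `einsum` by flattening the spatial dimensions and taking a batched matrix product. This hypothetical helper is a sketch for illustration only; the `einsum` version above is what the script uses:"""
def gram_matrix_matmul(input_tensor):
    # Flatten (batch, h, w, c) -> (batch, h*w, c), then contract over locations.
    shape = tf.shape(input_tensor)
    b, h, w, c = shape[0], shape[1], shape[2], shape[3]
    features = tf.reshape(input_tensor, (b, h*w, c))
    gram = tf.matmul(features, features, transpose_a=True)  # (batch, c, c)
    return gram / tf.cast(h*w, tf.float32)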
"""## Extract style and content
Build a model that returns the style and content tensors.
"""
class StyleContentModel(tf.keras.models.Model):
    def __init__(self, style_layers, content_layers):
        super(StyleContentModel, self).__init__()
        self.vgg = vgg_layers(style_layers + content_layers)
        self.style_layers = style_layers
        self.content_layers = content_layers
        self.num_style_layers = len(style_layers)
        self.vgg.trainable = False

    def call(self, inputs):
        "Expects float input in [0,1]"
        inputs = inputs*255.0
        preprocessed_input = tf.keras.applications.vgg19.preprocess_input(inputs)
        outputs = self.vgg(preprocessed_input)
        style_outputs, content_outputs = (outputs[:self.num_style_layers],
                                          outputs[self.num_style_layers:])

        style_outputs = [gram_matrix(style_output)
                         for style_output in style_outputs]

        content_dict = {content_name: value
                        for content_name, value
                        in zip(self.content_layers, content_outputs)}

        style_dict = {style_name: value
                      for style_name, value
                      in zip(self.style_layers, style_outputs)}

        return {'content': content_dict, 'style': style_dict}
"""When called on an image, this model returns the gram matrix (style) of the `style_layers` and content of the `content_layers`:"""
extractor = StyleContentModel(style_layers, content_layers)
results = extractor(tf.constant(content_image))
style_results = results['style']
print('Styles:')
for name, output in sorted(results['style'].items()):
    print("  ", name)
    print("    shape: ", output.numpy().shape)
    print()

print("Contents:")
for name, output in sorted(results['content'].items()):
    print("  ", name)
    print("    shape: ", output.numpy().shape)
    print()
"""## Run gradient descent
With this style and content extractor, you can now implement the style transfer algorithm. Do this by calculating the mean square error for your image's output relative to each target, then taking the weighted sum of these losses.
Set your style and content target values:
"""
style_targets = extractor(style_image)['style']
content_targets = extractor(content_image)['content']
"""Define a `tf.Variable` to contain the image to optimize. To make this quick, initialize it with the content image (the `tf.Variable` must be the same shape as the content image):"""
image = tf.Variable(content_image)
"""Since this is a float image, define a function to keep the pixel values between 0 and 1:"""
def clip_0_1(image):
    return tf.clip_by_value(image, clip_value_min=0.0, clip_value_max=1.0)
"""Create an optimizer. The paper recommends LBFGS, but `Adam` works okay, too:"""
opt = tf.optimizers.Adam(learning_rate=0.02, beta_1=0.99, epsilon=1e-1)
def style_content_loss(outputs):
    style_outputs = outputs['style']
    content_outputs = outputs['content']
    style_loss = tf.add_n([tf.reduce_mean((style_outputs[name]-style_targets[name])**2)
                           for name in style_outputs.keys()])
    # Apply the weights defined at the top of the script; without these
    # lines, style_weight and content_weight would have no effect.
    style_loss *= style_weight / num_style_layers

    content_loss = tf.add_n([tf.reduce_mean((content_outputs[name]-content_targets[name])**2)
                             for name in content_outputs.keys()])
    content_loss *= content_weight / num_content_layers
    loss = style_loss + content_loss
    return loss
"""Now include it in the `train_step` function:"""
@tf.function()
def train_step(image):
    with tf.GradientTape() as tape:
        outputs = extractor(image)
        loss = style_content_loss(outputs)
        loss += total_variation_weight*tf.image.total_variation(image)

    grad = tape.gradient(loss, image)
    opt.apply_gradients([(grad, image)])
    image.assign(clip_0_1(image))
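"""The `total_variation_weight` term above penalizes high-frequency artifacts in the generated image. `tf.image.total_variation` sums the absolute differences between neighboring pixel values; the hypothetical helper below is an illustrative sketch of that computation, not the library implementation:"""
def total_variation_sketch(image):
    # Differences between horizontally and vertically adjacent pixels.
    x_deltas = image[:, :, 1:, :] - image[:, :, :-1, :]
    y_deltas = image[:, 1:, :, :] - image[:, :-1, :, :]
    # tf.image.total_variation returns one value per image in the batch;
    # this sketch sums over the whole batch for simplicity.
    return tf.reduce_sum(tf.abs(x_deltas)) + tf.reduce_sum(tf.abs(y_deltas))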
"""Reinitialize the optimization variable:"""
image = tf.Variable(content_image)
"""And run the optimization:"""
start = time.time()
epochs = 10
steps_per_epoch = 100
step = 0
print("Train step: 0", end='')
for n in range(epochs):
    for m in range(steps_per_epoch):
        step += 1
        train_step(image)
        print(".", end='', flush=True)
    print("\nTrain step: {}".format(step), end='')
end = time.time()
print("\nTotal time: {:.1f}".format(end-start))
"""Finally, save the result:"""
from pathlib import Path
file_name = "{}_{}_{}.png".format(
Path(content_path).with_suffix(''),
Path(style_path).with_suffix(''),
max_dim
)
print("Saving to {}".format(file_name))
tensor_to_image(image).save(file_name)