GitHub gists of Xuechen Li (lxuechen)
lxuechen / ft_t5.py
Last active February 3, 2023 20:42
# Copyright (C) Xuechen Li
#
# This program is free software: you can redistribute it and/or modify
# it under the terms of the GNU General Public License as published by
# the Free Software Foundation, either version 3 of the License, or
# (at your option) any later version.
#
# This program is distributed in the hope that it will be useful,
# but WITHOUT ANY WARRANTY; without even the implied warranty of
# MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
# GNU General Public License for more details.
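Only the license header survives in this preview; the filename suggests T5 fine-tuning. A minimal sketch of supervised T5 fine-tuning with HuggingFace transformers (the model name, data, and hyperparameters below are assumptions, not taken from the gist):

import torch
from transformers import T5ForConditionalGeneration, T5Tokenizer

tokenizer = T5Tokenizer.from_pretrained("t5-small")  # model size is an assumption
model = T5ForConditionalGeneration.from_pretrained("t5-small")
optimizer = torch.optim.AdamW(model.parameters(), lr=1e-4)

# One toy step: T5 trains as text-to-text with teacher forcing.
batch = tokenizer("summarize: a long input document", return_tensors="pt")
labels = tokenizer("a short summary", return_tensors="pt").input_ids
loss = model(input_ids=batch.input_ids,
             attention_mask=batch.attention_mask,
             labels=labels).loss
loss.backward()
optimizer.step()
optimizer.zero_grad()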
lxuechen / vae.py
Last active November 15, 2018 20:44
testing vae on fashion mnist with different binarization schemes
from __future__ import absolute_import
from __future__ import division
from __future__ import print_function

import gzip
import os
import urllib.request as req

import tqdm
from absl import flags
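The preview stops at the imports. The two binarization schemes most commonly compared on (Fashion-)MNIST are static and dynamic; a sketch of both (which schemes the gist actually compares is an assumption):

import numpy as np
import tensorflow as tf

(train_x, _), _ = tf.keras.datasets.fashion_mnist.load_data()
train_x = train_x.astype(np.float32) / 255.0

# Static binarization: threshold once; the dataset is fixed thereafter.
static_x = (train_x >= 0.5).astype(np.float32)

# Dynamic binarization: treat intensities as Bernoulli means and
# resample fresh binary images each epoch, which regularizes the VAE.
def dynamic_binarize(x):
    return (np.random.uniform(size=x.shape) < x).astype(np.float32)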
lxuechen / unit_test.py
Last active August 7, 2018 23:04
fast prototyping with eager
import numpy as np
import tensorflow as tf
tf.enable_eager_execution()

N, C, H, W = 4, 16, 32, 32  # example shapes; the actual values are not in the preview
block = Residual(filters=C)  # Residual (defined in residual.py below) requires `filters`
x = tf.random_normal(shape=(N, C, H, W))
dy = tf.random_normal(shape=(N, C, H, W))
with tf.GradientTape() as tape:
    tape.watch(x)
    y = block(x)
# Compute true grads
dx_true = tape.gradient(y, x, output_gradients=dy)
# Compute grads from reconstruction
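The preview cuts off before the reconstruction side of the check. Assuming the block exposes a method that recomputes gradients from its outputs (the name backward_grads and its signature are assumptions), the test would finish along these lines:

# Hypothetical API: recompute gradients from y and dy without stored
# activations; the real method name is not shown in the preview.
dx_recon = block.backward_grads(y, dy, training=True)
# Both gradient paths should agree up to numerical error.
np.testing.assert_allclose(dx_true.numpy(), dx_recon.numpy(), rtol=1e-4, atol=1e-4)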
lxuechen / defun_vs_ag.py
Created August 3, 2018 20:39
defun vs autograph
import tensorflow as tf

def tensor_square(x, stop_when):  # x is a scalar Tensor
    cnt = 0
    while x < stop_when:
        x = tf.square(x)
        cnt += 1
    return cnt
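Only the function itself appears in the preview; the title suggests staging it both ways. A sketch of that comparison (assumed, not shown in the preview): defun traces Python control flow once, so the data-dependent while cannot be staged, whereas autograph rewrites it into tf.while_loop.

tfe = tf.contrib.eager
ag = tf.contrib.autograph

square_defun = tfe.defun(tensor_square)  # tracing fails on the data-dependent `while`
square_ag = ag.to_graph(tensor_square)   # the loop is converted to tf.while_loop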
lxuechen / residual.py
Last active August 3, 2018 19:42
define residual block
class Residual(tf.keras.Model):
    def __init__(self, filters):
        super(Residual, self).__init__()
        self.axis = 1  # channel axis; assumes NCHW inputs as in unit_test.py above
        self.f = ResidualInner(filters=filters, strides=(1, 1))
        self.g = ResidualInner(filters=filters, strides=(1, 1))

    def call(self, x, training=True):
        x1, x2 = tf.split(x, num_or_size_splits=2, axis=self.axis)
        f_x2 = self.f(x2, training=training)
        y1 = f_x2 + x1
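The preview ends mid-forward. The standard reversible coupling (as in the RevNet paper) finishes call() like this (a sketch of the remaining lines, not taken from the preview):

        g_y1 = self.g(y1, training=training)
        y2 = g_y1 + x2
        return tf.concat([y1, y2], axis=self.axis)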
lxuechen / estimator.py
Created August 3, 2018 19:41
wrapping in estimator
def model_fn(features, labels, mode, params):
    model = RevNet(params["hyperparameters"])
    if mode == tf.estimator.ModeKeys.TRAIN:
        # learning_rate and momentum are presumably defined elsewhere in the gist
        optimizer = tf.train.MomentumOptimizer(learning_rate, momentum)
        logits, saved_hidden = model(features, training=True)
        grads, loss = model.compute_gradients(saved_hidden, labels, training=True)
        with tf.control_dependencies(model.get_updates_for(features)):
            train_op = optimizer.apply_gradients(
                zip(grads, model.trainable_variables))
        return tf.estimator.EstimatorSpec(mode=mode, loss=loss, train_op=train_op)
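A model_fn like this is driven by a tf.estimator.Estimator; a usage sketch (model_dir, config, and input_fn below are assumptions):

estimator = tf.estimator.Estimator(
    model_fn=model_fn,
    model_dir="/tmp/revnet",             # hypothetical checkpoint directory
    params={"hyperparameters": config})  # `config` stands in for the real hparams
estimator.train(input_fn=input_fn, max_steps=10000)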
lxuechen / loop_ds.py
Created August 3, 2018 19:41
simple looping over dataset in eager
for image, label in dataset:
    logits = model(image, training=True)
    ...
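The ellipsis stands for the rest of the training step; a sketch of how the loop commonly continues in eager mode (the loss and optimizer choices are assumptions):

optimizer = tf.train.GradientDescentOptimizer(learning_rate=0.01)
for image, label in dataset:
    with tf.GradientTape() as tape:
        logits = model(image, training=True)
        loss = tf.losses.sparse_softmax_cross_entropy(labels=label, logits=logits)
    grads = tape.gradient(loss, model.variables)
    optimizer.apply_gradients(zip(grads, model.variables))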
lxuechen / init_ds.py
Created August 3, 2018 19:40
initialize dataset object
dataset = tf.data.TFRecordDataset(filename)
dataset = dataset.repeat(epochs).map(parser).batch(batch_size)
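The parser passed to map is not shown; a hypothetical one for image/label TFRecords (the feature schema is an assumption):

def parser(serialized):
    features = tf.parse_single_example(
        serialized,
        features={
            "image": tf.FixedLenFeature([], tf.string),
            "label": tf.FixedLenFeature([], tf.int64),
        })
    image = tf.decode_raw(features["image"], tf.uint8)
    image = tf.cast(image, tf.float32) / 255.0
    return image, features["label"]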
lxuechen / defun_optim.py
Created August 3, 2018 19:39
defun optimizer
def apply_gradients(optimizer, gradients, variables, global_step=None):
    optimizer.apply_gradients(
        zip(gradients, variables), global_step=global_step)

apply_gradients = tfe.defun(apply_gradients)
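Usage is unchanged after wrapping; a sketch of one apply step (the surrounding tape, loss, and model are assumptions):

grads = tape.gradient(loss, model.variables)
apply_gradients(optimizer, grads, model.variables,
                global_step=tf.train.get_or_create_global_step())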
lxuechen / defun.py
Created August 3, 2018 19:39
general defun
tfe = tf.contrib.eager
model.call = tfe.defun(model.call)
model.compute_gradients = tfe.defun(model.compute_gradients)
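The wrapped methods are called exactly as before; the first call traces a graph and later calls reuse it. For example:

logits, saved_hidden = model.call(features, training=True)  # runs the compiled graph function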