Ajout RandAug (Before train) (Work in progress)

2025-06-27 23:45:25 +02:00 · 2019-12-02 06:38:13 -05:00 · 2019-12-02 06:38:13 -05:00 · 31f0b745b5
commit 31f0b745b5
parent 3ec99bf729
86 changed files with 256531 additions and 0 deletions
--- a/UDA/LeNet.py
+++ b/UDA/LeNet.py
@ -0,0 +1,73 @@
+import numpy as np
+import tensorflow as tf
+
+## build the neural network class
+# weight initialization
+def weight_variable(shape, name = None):
+    """Create a tf.Variable of `shape` initialised from a truncated normal (stddev 0.1)."""
+    return tf.Variable(tf.truncated_normal(shape, stddev=0.1), name=name)
+
+# bias initialization
+def bias_variable(shape, name = None):
+    """Create a tf.Variable of `shape` whose entries all start at 0.1."""
+    # Every bias starts at the same small positive value.
+    return tf.Variable(tf.constant(0.1, shape=shape), name=name)
+
+# 2D convolution
+def conv2d(x, W, name = None):
+    """Convolve `x` with filter `W` using stride 1 and VALID (no) padding."""
+    unit_strides = [1, 1, 1, 1]
+    return tf.nn.conv2d(x, W, strides=unit_strides, padding='VALID', name=name)
+
+# max pooling
+def max_pool_2x2(x, name = None):
+    """Max-pool `x` with a 2x2 window, stride 2 and SAME padding."""
+    window = [1, 2, 2, 1]
+    stride = [1, 2, 2, 1]
+    return tf.nn.max_pool(x, ksize=window, strides=stride, padding='SAME', name=name)
+
+def LeNet(images, num_classes):
+    """Build a LeNet-style convolutional classifier and return its logits.
+
+    The graph is two (5x5 VALID convolution + ReLU + 2x2 max-pool) stages,
+    one 500-unit fully connected ReLU layer and a linear output layer.
+    No softmax is applied; the raw logits are returned.
+
+    Args:
+        images: 4-D image tensor. The size of its 4th dimension is read
+            statically and used as the input channel count, and the spatial
+            dimensions must be statically known so the fully connected layer
+            can be sized. (presumably NHWC, the tf.nn.conv2d default --
+            confirm against the input pipeline)
+        num_classes: number of units of the output layer.
+
+    Returns:
+        The logits tensor produced by the op named 'z_pred_tf'.
+    """
+    # Architecture hyperparameters.
+    s_f_conv1 = 5   # filter size of the first convolution layer
+    n_f_conv1 = 20  # number of feature maps of the first convolution layer
+    s_f_conv2 = 5   # filter size of the second convolution layer
+    n_f_conv2 = 50  # number of feature maps of the second convolution layer
+    n_n_fc1 = 500   # number of units of the first fully connected layer
+
+    # 1st layer: convolution + max pooling.
+    W_conv1_tf = weight_variable(
+        [s_f_conv1, s_f_conv1, int(images.shape[3]), n_f_conv1],
+        name='W_conv1_tf')
+    b_conv1_tf = bias_variable([n_f_conv1], name='b_conv1_tf')
+    h_conv1_tf = tf.nn.relu(conv2d(images, W_conv1_tf) + b_conv1_tf,
+                            name='h_conv1_tf')
+    h_pool1_tf = max_pool_2x2(h_conv1_tf, name='h_pool1_tf')
+
+    # 2nd layer: convolution + max pooling.
+    W_conv2_tf = weight_variable(
+        [s_f_conv2, s_f_conv2, n_f_conv1, n_f_conv2], name='W_conv2_tf')
+    b_conv2_tf = bias_variable([n_f_conv2], name='b_conv2_tf')
+    h_conv2_tf = tf.nn.relu(conv2d(h_pool1_tf, W_conv2_tf) + b_conv2_tf,
+                            name='h_conv2_tf')
+    h_pool2_tf = max_pool_2x2(h_conv2_tf, name='h_pool2_tf')
+
+    # 3rd layer: fully connected.
+    # Derive the flattened feature size from the static shape instead of
+    # hard-coding 5*5*n_f_conv2 (which is what this evaluates to for 32x32
+    # inputs), and let tf.reshape infer the batch dimension so the graph also
+    # builds when the batch size is not statically known.
+    flat_dim = int(np.prod(h_pool2_tf.get_shape().as_list()[1:]))
+    W_fc1_tf = weight_variable([flat_dim, n_n_fc1], name='W_fc1_tf')
+    b_fc1_tf = bias_variable([n_n_fc1], name='b_fc1_tf')
+    h_pool2_flat_tf = tf.reshape(h_pool2_tf, [-1, flat_dim],
+                                 name='h_pool3_flat_tf')
+    h_fc1_tf = tf.nn.relu(tf.matmul(h_pool2_flat_tf, W_fc1_tf) + b_fc1_tf,
+                          name='h_fc1_tf')
+
+    # 4th layer: fully connected, linear output (no dropout, no softmax).
+    W_fc2_tf = weight_variable([n_n_fc1, num_classes], name='W_fc2_tf')
+    b_fc2_tf = bias_variable([num_classes], name='b_fc2_tf')
+    logits = tf.add(tf.matmul(h_fc1_tf, W_fc2_tf), b_fc2_tf, name='z_pred_tf')
+    return logits
--- a/UDA/main.py
+++ b/UDA/main.py
@ -0,0 +1,620 @@
+# coding=utf-8
+# Copyright 2019 The Google UDA Team Authors.
+#
+# Licensed under the Apache License, Version 2.0 (the "License");
+# you may not use this file except in compliance with the License.
+# You may obtain a copy of the License at
+#
+#     http://www.apache.org/licenses/LICENSE-2.0
+#
+# Unless required by applicable law or agreed to in writing, software
+# distributed under the License is distributed on an "AS IS" BASIS,
+# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+# See the License for the specific language governing permissions and
+# limitations under the License.
+"""UDA on CIFAR-10 and SVHN.
+"""
+
+from __future__ import absolute_import
+from __future__ import division
+from __future__ import print_function
+
+import contextlib
+import os
+import time
+import json
+
+import numpy as np
+
+from absl import flags
+import absl.logging as _logging  # pylint: disable=unused-import
+
+import tensorflow as tf
+
+from randaugment import custom_ops as ops
+import data
+import utils
+
+from randaugment.wrn import build_wrn_model
+from randaugment.shake_drop import build_shake_drop_model
+from randaugment.shake_shake import build_shake_shake_model
+
+from randaugment.LeNet import LeNet
+
+
+# TPU related flags. The dataset selector `task_name` is also defined in
+# this group.
+flags.DEFINE_string(
+    "master", default=None,
+    help="the TPU address. This should be set when using Cloud TPU")
+flags.DEFINE_string(
+    "tpu", default=None,
+    help="The Cloud TPU to use for training. This should be either the name "
+    "used when creating the Cloud TPU, or a grpc://ip.address.of.tpu:8470 url.")
+flags.DEFINE_string(
+    "gcp_project", default=None,
+    help="Project name for the Cloud TPU-enabled project. If not specified, "
+    "we will attempt to automatically detect the GCE project from metadata.")
+flags.DEFINE_string(
+    "tpu_zone", default=None,
+    help="GCE zone where the Cloud TPU is located in. If not specified, we "
+    "will attempt to automatically detect the GCE project from metadata.")
+flags.DEFINE_bool(
+    "use_tpu", default=False,
+    help="Use TPUs rather than GPU/CPU.")
+# Only "cifar10" and "svhn" are accepted; train() maps each of them to a
+# fixed test-set size.
+flags.DEFINE_enum(
+    "task_name", "cifar10",
+    enum_values=["cifar10", "svhn"],
+    help="The task to use")
+
+# UDA config. Adjacent help-string literals are concatenated by Python, so
+# each fragment ends with an explicit space to keep the rendered help readable.
+flags.DEFINE_integer(
+    "sup_size", default=4000,
+    help="Number of supervised pairs to use. "
+    "-1: all training samples. 4000: 4000 supervised examples.")
+flags.DEFINE_integer(
+    "aug_copy", default=0,
+    help="Number of different augmented data generated.")
+flags.DEFINE_integer(
+    "unsup_ratio", default=0,
+    help="The ratio between batch size of unlabeled data and labeled data, "
+    "i.e., unsup_ratio * train_batch_size is the batch_size for unlabeled "
+    "data. Do not use the unsupervised objective if set to 0.")
+flags.DEFINE_enum(
+    "tsa", "",
+    enum_values=["", "linear_schedule", "log_schedule", "exp_schedule"],
+    help="anneal schedule of training signal annealing. "
+    "tsa='' means not using TSA. See the paper for other schedules.")
+flags.DEFINE_float(
+    "uda_confidence_thresh", default=-1,
+    help="The threshold on predicted probability on unsupervised data. If "
+    "set, UDA loss will only be calculated on unlabeled examples whose "
+    "largest probability is larger than the threshold. "
+    "-1 disables the threshold.")
+flags.DEFINE_float(
+    "uda_softmax_temp", -1,
+    help="The temperature of the Softmax when making prediction on unlabeled "
+    "examples. -1 means to use normal Softmax")
+flags.DEFINE_float(
+    "ent_min_coeff", default=0,
+    help="The coefficient on the entropy of the predictions on the original "
+    "unlabeled examples, added to the training loss. "
+    "Only used when larger than 0 and unsup_ratio > 0.")
+flags.DEFINE_integer(
+    "unsup_coeff", default=1,
+    help="The coefficient on the UDA loss. "
+    "setting unsup_coeff to 1 works for most settings. "
+    "When you have extremely few samples, consider increasing unsup_coeff")
+
+# Experiment (data/checkpoint/directory) config.
+# Note: train() forces both do_train and do_eval to True whenever dev_size
+# is not -1, regardless of the values given on the command line.
+flags.DEFINE_string(
+    "data_dir", default=None,
+    help="Path to data directory containing `*.tfrecords`.")
+flags.DEFINE_string(
+    "model_dir", default=None,
+    help="model dir of the saved checkpoints.")
+flags.DEFINE_bool(
+    "do_train", default=True,
+    help="Whether to run training.")
+flags.DEFINE_bool(
+    "do_eval", default=False,
+    help="Whether to run eval on the test set.")
+# -1 means "no dev set": evaluation then runs on the "test" split.
+flags.DEFINE_integer(
+    "dev_size", default=-1,
+    help="dev set size.")
+flags.DEFINE_bool(
+    "verbose", default=False,
+    help="Whether to print additional information.")
+
+# Training config
+flags.DEFINE_integer(
+    "train_batch_size", default=32,
+    help="Size of train batch.")
+flags.DEFINE_integer(
+    "eval_batch_size", default=8,
+    help="Size of evaluation batch.")
+flags.DEFINE_integer(
+    "train_steps", default=100000,
+    help="Total number of training steps.")
+# Also used by model_fn as the logging interval (every_n_iter) of the
+# non-TPU training logging hook.
+flags.DEFINE_integer(
+    "iterations", default=10000,
+    help="Number of iterations per repeat loop.")
+# Also the number of training steps between two evaluations when a dev set
+# is used (see train()).
+flags.DEFINE_integer(
+    "save_steps", default=10000,
+    help="number of steps for model checkpointing.")
+flags.DEFINE_integer(
+    "max_save", default=10,
+    help="Maximum number of checkpoints to save.")
+
+# Model config
+# main() maps the three shake_shake_* names onto the single "shake_shake"
+# architecture with widen factors 2, 6 and 7 respectively.
+flags.DEFINE_enum(
+    "model_name", default="wrn",
+    enum_values=["wrn", "shake_shake_32", "shake_shake_96", "shake_shake_112", "pyramid_net", "LeNet"],
+    help="Name of the model")
+flags.DEFINE_integer(
+    "num_classes", default=10,
+    help="Number of categories for classification.")
+flags.DEFINE_integer(
+    "wrn_size", default=32,
+    help="The size of WideResNet. It should be set to 32 for WRN-28-2 "
+    "and should be set to 160 for WRN-28-10")
+
+# Optimization config. model_fn combines these into a linear warmup followed
+# by a cosine decay of the learning rate.
+flags.DEFINE_float(
+    "learning_rate", default=0.03,
+    help="Maximum learning rate.")
+flags.DEFINE_float(
+    "weight_decay_rate", default=5e-4,
+    help="Weight decay rate.")
+# Passed as `alpha` to tf.train.cosine_decay.
+flags.DEFINE_float(
+    "min_lr_ratio", default=0.004,
+    help="Minimum ratio learning rate.")
+flags.DEFINE_integer(
+    "warmup_steps", default=20000,
+    help="Number of steps for linear lr warmup.")
+
+
+
+# Handle to the command-line flag values, read throughout this module.
+FLAGS = tf.flags.FLAGS
+
+# Short alias used by setup_arg_scopes().
+arg_scope = tf.contrib.framework.arg_scope
+
+
+def get_tsa_threshold(schedule, global_step, num_train_steps, start, end):
+  """Returns the training-signal-annealing threshold for the current step.
+
+  A schedule coefficient is computed from the training progress
+  `global_step / num_train_steps` and used to interpolate between `start`
+  and `end`.
+
+  Args:
+    schedule: "linear_schedule", "exp_schedule" or "log_schedule".
+    global_step: current training step.
+    num_train_steps: total number of training steps.
+    start: threshold returned when the coefficient is 0.
+    end: threshold returned when the coefficient is 1.
+
+  Returns:
+    A float tensor equal to `coeff * (end - start) + start`.
+
+  Raises:
+    ValueError: if `schedule` is not one of the supported schedule names.
+  """
+  step_ratio = tf.to_float(global_step) / tf.to_float(num_train_steps)
+  if schedule == "linear_schedule":
+    coeff = step_ratio
+  elif schedule == "exp_schedule":
+    scale = 5
+    # [exp(-5), exp(0)] = [1e-2, 1]
+    coeff = tf.exp((step_ratio - 1) * scale)
+  elif schedule == "log_schedule":
+    scale = 5
+    # [1 - exp(0), 1 - exp(-5)] = [0, 0.99]
+    coeff = 1 - tf.exp((-step_ratio) * scale)
+  else:
+    # Previously an unknown name fell through and failed later with an
+    # unbound `coeff`; fail early with an explicit message instead.
+    raise ValueError("Not Valid TSA Schedule: %s" % schedule)
+  return coeff * (end - start) + start
+
+
+def setup_arg_scopes(is_training):
+  """Builds the arg scopes to wrap around the image model construction.
+
+  Args:
+    is_training: whether the model is being built for training; forwarded to
+      `ops.batch_norm` as `is_training`.
+
+  Returns:
+    A list holding a single arg scope that sets the batch-norm defaults.
+  """
+  batch_norm_params = dict(
+      decay=0.9,      # decay for the moving averages
+      epsilon=1e-5,   # epsilon to prevent 0s in variance
+      scale=True,
+      is_training=is_training,
+  )
+  return [arg_scope([ops.batch_norm], **batch_norm_params)]
+
+
+def build_model(inputs, num_classes, is_training, update_bn, hparams):
+  """Constructs the vision model being trained/evaled.
+
+  Args:
+    inputs: input features/images being fed to the image model being built.
+    num_classes: number of output classes being predicted.
+    is_training: is the model training or not.
+    update_bn: forwarded to `build_wrn_model`; only the "wrn" model uses it.
+    hparams: hyperparameters of the image model. `hparams.model_name` selects
+      the architecture and must be one of "pyramid_net", "wrn", "shake_shake"
+      or "LeNet".
+
+  Returns:
+    The logits of the image model.
+
+  Raises:
+    ValueError: if `hparams.model_name` is not a supported model name.
+  """
+  scopes = setup_arg_scopes(is_training)
+
+  # `contextlib.nested` is only importable on Python 2; on Python 3 an
+  # equivalent is built on top of ExitStack.
+  try:
+    from contextlib import nested
+  except ImportError:
+    from contextlib import ExitStack, contextmanager
+
+    @contextmanager
+    def nested(*contexts):
+      with ExitStack() as stack:
+        for ctx in contexts:
+          stack.enter_context(ctx)
+        yield contexts
+
+  with nested(*scopes):
+    if hparams.model_name == "pyramid_net":
+      logits = build_shake_drop_model(
+          inputs, num_classes, is_training)
+    elif hparams.model_name == "wrn":
+      logits = build_wrn_model(
+          inputs, num_classes, hparams.wrn_size, update_bn)
+    elif hparams.model_name == "shake_shake":
+      logits = build_shake_shake_model(
+          inputs, num_classes, hparams, is_training)
+    elif hparams.model_name == "LeNet":
+      logits = LeNet(inputs, num_classes)
+    else:
+      # Previously an unknown name fell through to `return logits` with
+      # `logits` unbound.
+      raise ValueError("Not Valid Model Name: %s" % hparams.model_name)
+
+  return logits
+
+
+def _kl_divergence_with_logits(p_logits, q_logits):
+  """Returns KL(p || q) summed over the last axis, with both given as logits."""
+  p_probs = tf.nn.softmax(p_logits)
+  log_ratio = tf.nn.log_softmax(p_logits) - tf.nn.log_softmax(q_logits)
+  return tf.reduce_sum(p_probs * log_ratio, -1)
+
+
+def anneal_sup_loss(sup_logits, sup_labels, sup_loss, global_step, metric_dict):
+  """Applies training signal annealing (TSA) to the supervised loss.
+
+  Examples whose predicted probability for the correct label already exceeds
+  the current TSA threshold are masked out of the loss.
+
+  Args:
+    sup_logits: logits of the supervised examples.
+    sup_labels: integer class labels of the supervised examples.
+    sup_loss: per-example supervised loss.
+    global_step: current training step, drives the threshold schedule.
+    metric_dict: dict updated in place with "sup/sup_trained_ratio" and
+      "sup/eff_train_prob_threshold".
+
+  Returns:
+    A `(masked_per_example_loss, avg_loss)` pair; the average is taken over
+    the examples that were kept (at least 1, to avoid dividing by zero).
+  """
+  num_classes = FLAGS.num_classes
+  # The threshold starts at chance level (1 / num_classes) and anneals to 1.
+  threshold = get_tsa_threshold(
+      FLAGS.tsa, global_step, FLAGS.train_steps, 1. / num_classes, end=1)
+
+  labels_one_hot = tf.one_hot(sup_labels, depth=num_classes, dtype=tf.float32)
+  probs = tf.nn.softmax(sup_logits, axis=-1)
+  prob_of_true_label = tf.reduce_sum(labels_one_hot * probs, axis=-1)
+
+  # 1 for examples that are still trained on, 0 for confident ones; the mask
+  # itself must not receive gradients.
+  is_confident = tf.greater(prob_of_true_label, threshold)
+  keep_mask = tf.stop_gradient(1 - tf.cast(is_confident, tf.float32))
+
+  masked_loss = sup_loss * keep_mask
+  num_kept = tf.maximum(tf.reduce_sum(keep_mask), 1)
+  avg_sup_loss = tf.reduce_sum(masked_loss) / num_kept
+
+  metric_dict["sup/sup_trained_ratio"] = tf.reduce_mean(keep_mask)
+  metric_dict["sup/eff_train_prob_threshold"] = threshold
+  return masked_loss, avg_sup_loss
+
+
+def get_ent(logits, return_mean=True):
+  """Returns the entropy of softmax(logits) taken over the last axis.
+
+  Args:
+    logits: unnormalized class scores.
+    return_mean: if True, return the mean of the per-example entropies;
+      otherwise return the per-example entropies.
+  """
+  log_p = tf.nn.log_softmax(logits, axis=-1)
+  p = tf.exp(log_p)
+  entropy = tf.reduce_sum(-p * log_p, axis=-1)
+  return tf.reduce_mean(entropy) if return_mean else entropy
+
+
+def get_model_fn(hparams):
+  """Returns a `model_fn` closure that builds the model described by `hparams`."""
+  def model_fn(features, labels, mode, params):
+    """Builds the graph for `mode` and returns a TPUEstimatorSpec.
+
+    Args:
+      features: dict of tensors. "image" and "label" are always read;
+        "ori_image" and "aug_image" are additionally read when training with
+        FLAGS.unsup_ratio > 0.
+      labels: not used in this function; labels are read from
+        features["label"].
+      mode: a tf.estimator.ModeKeys value. Only EVAL is handled specially;
+        every other mode goes down the training path.
+      params: dict; params["model_dir"] is read when FLAGS.use_tpu is set.
+
+    Returns:
+      A tf.contrib.tpu.TPUEstimatorSpec for evaluation or for training.
+    """
+    sup_labels = tf.reshape(features["label"], [-1])
+
+    #### Global step, mode and model inputs
+    global_step = tf.train.get_global_step()
+    metric_dict = {}
+    is_training = (mode == tf.estimator.ModeKeys.TRAIN)
+    if FLAGS.unsup_ratio > 0 and is_training:
+      # Run labeled, original-unlabeled and augmented-unlabeled images through
+      # the model in one batch. The slicing of `all_logits` below relies on
+      # exactly this order.
+      all_images = tf.concat([features["image"],
+                              features["ori_image"],
+                              features["aug_image"]], 0)
+    else:
+      all_images = features["image"]
+
+    with tf.variable_scope("model", reuse=tf.AUTO_REUSE):
+      all_logits = build_model(
+          inputs=all_images,
+          num_classes=FLAGS.num_classes,
+          is_training=is_training,
+          update_bn=True and is_training,
+          hparams=hparams,
+      )
+
+      # The first `sup_bsz` rows belong to the labeled images.
+      sup_bsz = tf.shape(features["image"])[0]
+      sup_logits = all_logits[:sup_bsz]
+
+      # Per-example supervised cross entropy.
+      sup_loss = tf.nn.sparse_softmax_cross_entropy_with_logits(
+          labels=sup_labels,
+          logits=sup_logits)
+      sup_prob = tf.nn.softmax(sup_logits, axis=-1)
+      metric_dict["sup/pred_prob"] = tf.reduce_mean(
+          tf.reduce_max(sup_prob, axis=-1))
+    # With TSA enabled (non-empty FLAGS.tsa) confident examples are masked
+    # out of the supervised loss; otherwise a plain mean is used.
+    if FLAGS.tsa:
+      sup_loss, avg_sup_loss = anneal_sup_loss(sup_logits, sup_labels, sup_loss,
+                                               global_step, metric_dict)
+    else:
+      avg_sup_loss = tf.reduce_mean(sup_loss)
+    total_loss = avg_sup_loss
+
+    #### Unsupervised (consistency) objective, training only
+    if FLAGS.unsup_ratio > 0 and is_training:
+      aug_bsz = tf.shape(features["ori_image"])[0]
+
+      ori_logits = all_logits[sup_bsz : sup_bsz + aug_bsz]
+      aug_logits = all_logits[sup_bsz + aug_bsz:]
+      # Dividing the target logits by the temperature changes the sharpness
+      # of the target distribution; -1 leaves the logits unchanged.
+      if FLAGS.uda_softmax_temp != -1:
+        ori_logits_tgt = ori_logits / FLAGS.uda_softmax_temp
+      else:
+        ori_logits_tgt = ori_logits
+      ori_prob = tf.nn.softmax(ori_logits, axis=-1)
+      aug_prob = tf.nn.softmax(aug_logits, axis=-1)
+      metric_dict["unsup/ori_prob"] = tf.reduce_mean(
+          tf.reduce_max(ori_prob, axis=-1))
+      metric_dict["unsup/aug_prob"] = tf.reduce_mean(
+          tf.reduce_max(aug_prob, axis=-1))
+
+      # KL(original || augmented); no gradient flows through the target
+      # (original) distribution.
+      aug_loss = _kl_divergence_with_logits(
+          p_logits=tf.stop_gradient(ori_logits_tgt),
+          q_logits=aug_logits)
+
+      # Optionally keep only unlabeled examples whose largest predicted
+      # probability (without temperature) exceeds the confidence threshold.
+      if FLAGS.uda_confidence_thresh != -1:
+        # NOTE(review): recomputes the same softmax as `ori_prob` above.
+        ori_prob = tf.nn.softmax(ori_logits, axis=-1)
+        largest_prob = tf.reduce_max(ori_prob, axis=-1)
+        loss_mask = tf.cast(tf.greater(
+            largest_prob, FLAGS.uda_confidence_thresh), tf.float32)
+        metric_dict["unsup/high_prob_ratio"] = tf.reduce_mean(loss_mask)
+        loss_mask = tf.stop_gradient(loss_mask)
+        aug_loss = aug_loss * loss_mask
+        metric_dict["unsup/high_prob_loss"] = tf.reduce_mean(aug_loss)
+
+      # Optional entropy minimization on the original unlabeled predictions.
+      if FLAGS.ent_min_coeff > 0:
+        ent_min_coeff = FLAGS.ent_min_coeff
+        metric_dict["unsup/ent_min_coeff"] = ent_min_coeff
+        # NOTE(review): get_ent() is called with its default
+        # return_mean=True, so this is already a mean and the reduce_mean
+        # below is applied to that mean, not to per-example values.
+        per_example_ent = get_ent(ori_logits)
+        ent_min_loss = tf.reduce_mean(per_example_ent)
+        total_loss = total_loss + ent_min_coeff * ent_min_loss
+
+      avg_unsup_loss = tf.reduce_mean(aug_loss)
+      total_loss += FLAGS.unsup_coeff * avg_unsup_loss
+      metric_dict["unsup/loss"] = avg_unsup_loss
+
+    # Weight decay is added to the loss by the project helper.
+    total_loss = utils.decay_weights(
+        total_loss,
+        FLAGS.weight_decay_rate)
+
+    #### Check model parameters
+    num_params = sum([np.prod(v.shape) for v in tf.trainable_variables()])
+    tf.logging.info("#params: {}".format(num_params))
+
+    if FLAGS.verbose:
+      # Left-align variable names in a column as wide as the longest name.
+      format_str = "{{:<{0}s}}\t{{}}".format(
+          max([len(v.name) for v in tf.trainable_variables()]))
+      for v in tf.trainable_variables():
+        tf.logging.info(format_str.format(v.name, v.get_shape()))
+
+    #### Evaluation mode
+    if mode == tf.estimator.ModeKeys.EVAL:
+      #### Metric function for classification
+      def metric_fn(per_example_loss, label_ids, logits):
+        """Returns the streaming mean loss and accuracy metrics for eval."""
+        # classification loss & accuracy
+        loss = tf.metrics.mean(per_example_loss)
+
+        predictions = tf.argmax(logits, axis=-1, output_type=tf.int32)
+        accuracy = tf.metrics.accuracy(label_ids, predictions)
+
+        ret_dict = {
+            "eval/classify_loss": loss,
+            "eval/classify_accuracy": accuracy
+        }
+
+        return ret_dict
+
+      eval_metrics = (metric_fn, [sup_loss, sup_labels, sup_logits])
+
+      #### Constructing evaluation TPUEstimatorSpec.
+      eval_spec = tf.contrib.tpu.TPUEstimatorSpec(
+          mode=mode,
+          loss=total_loss,
+          eval_metrics=eval_metrics)
+
+      return eval_spec
+
+    # increase the learning rate linearly
+    if FLAGS.warmup_steps > 0:
+      warmup_lr = tf.to_float(global_step) / tf.to_float(FLAGS.warmup_steps) \
+                  * FLAGS.learning_rate
+    else:
+      warmup_lr = 0.0
+
+    # decay the learning rate using the cosine schedule
+    # (step counts are shifted so that the decay starts after the warmup)
+    decay_lr = tf.train.cosine_decay(
+        FLAGS.learning_rate,
+        global_step=global_step-FLAGS.warmup_steps,
+        decay_steps=FLAGS.train_steps-FLAGS.warmup_steps,
+        alpha=FLAGS.min_lr_ratio)
+
+    # Use the warmup rate before `warmup_steps`, the cosine rate afterwards.
+    learning_rate = tf.where(global_step < FLAGS.warmup_steps,
+                             warmup_lr, decay_lr)
+
+    optimizer = tf.train.MomentumOptimizer(
+        learning_rate=learning_rate,
+        momentum=0.9,
+        use_nesterov=True)
+
+    if FLAGS.use_tpu:
+      optimizer = tf.contrib.tpu.CrossShardOptimizer(optimizer)
+
+    grads_and_vars = optimizer.compute_gradients(total_loss)
+    gradients, variables = zip(*grads_and_vars)
+    # Run the ops collected in UPDATE_OPS together with the gradient step.
+    update_ops = tf.get_collection(tf.GraphKeys.UPDATE_OPS)
+    with tf.control_dependencies(update_ops):
+      train_op = optimizer.apply_gradients(
+          zip(gradients, variables), global_step=tf.train.get_global_step())
+
+    #### Creating training logging hook
+    # compute accuracy
+    sup_pred = tf.argmax(sup_logits, axis=-1, output_type=sup_labels.dtype)
+    is_correct = tf.to_float(tf.equal(sup_pred, sup_labels))
+    acc = tf.reduce_mean(is_correct)
+    metric_dict["sup/sup_loss"] = avg_sup_loss
+    metric_dict["training/loss"] = total_loss
+    metric_dict["sup/acc"] = acc
+    metric_dict["training/lr"] = learning_rate
+    metric_dict["training/step"] = global_step
+
+    if not FLAGS.use_tpu:
+      # The placeholders in the format string are keys of `metric_dict`.
+      log_info = ("step [{training/step}] lr {training/lr:.6f} "
+                  "loss {training/loss:.4f} "
+                  "sup/acc {sup/acc:.4f} sup/loss {sup/sup_loss:.6f} ")
+      if FLAGS.unsup_ratio > 0:
+        log_info += "unsup/loss {unsup/loss:.6f} "
+      formatter = lambda kwargs: log_info.format(**kwargs)
+      logging_hook = tf.train.LoggingTensorHook(
+          tensors=metric_dict,
+          every_n_iter=FLAGS.iterations,
+          formatter=formatter)
+      training_hooks = [logging_hook]
+      #### Constructing training TPUEstimatorSpec.
+      train_spec = tf.contrib.tpu.TPUEstimatorSpec(
+          mode=mode, loss=total_loss, train_op=train_op,
+          training_hooks=training_hooks)
+    else:
+      #### Constructing training TPUEstimatorSpec.
+      # On TPU the metrics are reported through a host call instead of a
+      # logging hook.
+      host_call = utils.construct_scalar_host_call(
+          metric_dict=metric_dict,
+          model_dir=params["model_dir"],
+          prefix="",
+          reduce_fn=tf.reduce_mean)
+      train_spec = tf.contrib.tpu.TPUEstimatorSpec(
+          mode=mode, loss=total_loss, train_op=train_op,
+          host_call=host_call)
+
+    return train_spec
+
+  return model_fn
+
+
+def train(hparams):
+  """Runs training and/or evaluation as selected by the command-line flags.
+
+  With a dev set (FLAGS.dev_size != -1) training and evaluation on the "dev"
+  split alternate in rounds of FLAGS.save_steps steps. Without one, a single
+  training run is optionally followed by one evaluation on the "test" split,
+  whose accuracy is written to `<model_dir>/results.txt`.
+
+  Args:
+    hparams: model hyperparameters, forwarded to `get_model_fn`.
+  """
+  def make_input_fn(split, sup_size, unsup_ratio, aug_copy):
+    # All input functions share the data directory and the task.
+    return data.get_input_fn(
+        data_dir=FLAGS.data_dir,
+        split=split,
+        task_name=FLAGS.task_name,
+        sup_size=sup_size,
+        unsup_ratio=unsup_ratio,
+        aug_copy=aug_copy,
+    )
+
+  ##### Reconcile interdependent flags
+  if FLAGS.unsup_ratio == 0:
+    FLAGS.aug_copy = 0
+  with_dev_set = FLAGS.dev_size != -1
+  if with_dev_set:
+    FLAGS.do_train = True
+    FLAGS.do_eval = True
+
+  ##### Create input functions
+  if FLAGS.do_train:
+    train_input_fn = make_input_fn(
+        "train", FLAGS.sup_size, FLAGS.unsup_ratio, FLAGS.aug_copy)
+
+  if FLAGS.do_eval:
+    if with_dev_set:
+      eval_input_fn = make_input_fn("dev", FLAGS.dev_size, 0, 0)
+      eval_size = FLAGS.dev_size
+    else:
+      eval_input_fn = make_input_fn("test", -1, 0, 0)
+      if FLAGS.task_name == "cifar10":
+        eval_size = 10000
+      elif FLAGS.task_name == "svhn":
+        eval_size = 26032
+      else:
+        assert False, "You need to specify the size of your test set."
+    eval_steps = eval_size // FLAGS.eval_batch_size
+
+  ##### Get model function
+  estimator = utils.get_TPU_estimator(FLAGS, get_model_fn(hparams))
+
+  #### Training interleaved with validation
+  if with_dev_set:
+    tf.logging.info("***** Running training and validation *****")
+    tf.logging.info("  Supervised batch size = %d", FLAGS.train_batch_size)
+    tf.logging.info("  Unsupervised batch size = %d",
+                    FLAGS.train_batch_size * FLAGS.unsup_ratio)
+    tf.logging.info("  Num train steps = %d", FLAGS.train_steps)
+    curr_step = 0
+    while curr_step < FLAGS.train_steps:
+      tf.logging.info("Current step {}".format(curr_step))
+      # The last round may be shorter than save_steps.
+      steps_this_round = min(FLAGS.save_steps, FLAGS.train_steps - curr_step)
+      estimator.train(input_fn=train_input_fn, steps=steps_this_round)
+      estimator.evaluate(input_fn=eval_input_fn, steps=eval_steps)
+      curr_step += FLAGS.save_steps
+    return
+
+  #### Plain training, then optional evaluation
+  if FLAGS.do_train:
+    tf.logging.info("***** Running training *****")
+    tf.logging.info("  Supervised batch size = %d", FLAGS.train_batch_size)
+    tf.logging.info("  Unsupervised batch size = %d",
+                    FLAGS.train_batch_size * FLAGS.unsup_ratio)
+    estimator.train(input_fn=train_input_fn, max_steps=FLAGS.train_steps)
+  if FLAGS.do_eval:
+    tf.logging.info("***** Running evaluation *****")
+    results = estimator.evaluate(input_fn=eval_input_fn, steps=eval_steps)
+    tf.logging.info(">> Results:")
+    for key in results:
+      tf.logging.info("  %s = %s", key, str(results[key]))
+      # Replace each value by the result of its .item() call.
+      results[key] = results[key].item()
+    acc = results["eval/classify_accuracy"]
+    with tf.gfile.Open("{}/results.txt".format(FLAGS.model_dir), "w") as ouf:
+      ouf.write(str(acc))
+
+
+def main(_):
+  """Saves the flag values, builds the model hparams and runs `train`.
+
+  When training, the model directory is created and all flag values are
+  dumped to `<model_dir>/FLAGS.json` before anything else happens.
+
+  Raises:
+    ValueError: if FLAGS.model_name is not a known model name.
+  """
+  if FLAGS.do_train:
+    tf.gfile.MakeDirs(FLAGS.model_dir)
+    flags_dict = tf.app.flags.FLAGS.flag_values_dict()
+    flags_path = os.path.join(FLAGS.model_dir, "FLAGS.json")
+    with tf.gfile.Open(flags_path, "w") as ouf:
+      json.dump(flags_dict, ouf)
+
+  # The three shake-shake variants share one architecture name and differ
+  # only in their widen factor.
+  shake_shake_widen_factors = {
+      "shake_shake_32": 2,
+      "shake_shake_96": 6,
+      "shake_shake_112": 7,
+  }
+
+  selected = FLAGS.model_name
+  hparams = tf.contrib.training.HParams()
+  if selected in shake_shake_widen_factors:
+    hparams.add_hparam("model_name", "shake_shake")
+    hparams.add_hparam("shake_shake_widen_factor",
+                       shake_shake_widen_factors[selected])
+  elif selected in ("wrn", "pyramid_net", "LeNet"):
+    hparams.add_hparam("model_name", selected)
+    if selected == "wrn":
+      hparams.add_hparam("wrn_size", FLAGS.wrn_size)
+  else:
+    raise ValueError("Not Valid Model Name: %s" % FLAGS.model_name)
+
+  train(hparams)
+
+
+# Script entry point: enable INFO logging, then let tf.app.run() start the
+# program.
+if __name__ == "__main__":
+  tf.logging.set_verbosity(tf.logging.INFO)
+  tf.app.run()
--- a/UDA/run_cifar10_gpu.sh
+++ b/UDA/run_cifar10_gpu.sh
@ -0,0 +1,31 @@
+# coding=utf-8
+# Copyright 2019 The Google UDA Team Authors.
+#
+# Licensed under the Apache License, Version 2.0 (the "License");
+# you may not use this file except in compliance with the License.
+# You may obtain a copy of the License at
+#
+#     http://www.apache.org/licenses/LICENSE-2.0
+#
+# Unless required by applicable law or agreed to in writing, software
+# distributed under the License is distributed on an "AS IS" BASIS,
+# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+# See the License for the specific language governing permissions and
+# limitations under the License.
+#!/bin/bash
+
+task_name=cifar10
+
+# Train and evaluate LeNet with UDA on CIFAR-10 without a TPU.
+# Extra command-line arguments are forwarded to main.py; "$@" is quoted so
+# that arguments containing spaces are passed through unchanged.
+python main.py \
+  --model_name="LeNet" \
+  --use_tpu=False \
+  --do_train=True \
+  --do_eval=True \
+  --task_name="${task_name}" \
+  --sup_size=4000 \
+  --unsup_ratio=5 \
+  --train_batch_size=32 \
+  --data_dir="data/proc_data/${task_name}" \
+  --model_dir=ckpt/cifar10_gpu \
+  --train_steps=400000 \
+  "$@"
--- a/higher/augmentation_transforms.py
+++ b/higher/augmentation_transforms.py
@ -0,0 +1,490 @@
+# coding=utf-8
+# Copyright 2019 The Google UDA Team Authors.
+#
+# Licensed under the Apache License, Version 2.0 (the "License");
+# you may not use this file except in compliance with the License.
+# You may obtain a copy of the License at
+#
+#     http://www.apache.org/licenses/LICENSE-2.0
+#
+# Unless required by applicable law or agreed to in writing, software
+# distributed under the License is distributed on an "AS IS" BASIS,
+# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+# See the License for the specific language governing permissions and
+# limitations under the License.
+"""Transforms used in the Augmentation Policies.
+
+Copied from AutoAugment: https://github.com/tensorflow/models/blob/master/research/autoaugment/
+"""
+
+from __future__ import absolute_import
+from __future__ import division
+from __future__ import print_function
+
+import random
+import numpy as np
+# pylint:disable=g-multiple-import
+from PIL import ImageOps, ImageEnhance, ImageFilter, Image
+# pylint:enable=g-multiple-import
+
+#import tensorflow as tf
+
+#FLAGS = tf.flags.FLAGS
+
+
+# NOTE(review): IMAGE_SIZE is not referenced anywhere else in this module (the
+# transforms receive the image shape as an argument) -- confirm whether any
+# external code still imports it.
+IMAGE_SIZE = 32
+# The dataset mean and std of the training images are no longer module
+# constants; they are returned by get_mean_and_std() below.
+# Upper bound of the 'level' (strength) scale; float_parameter and
+# int_parameter divide by it to rescale a level into an operation's own range.
+PARAMETER_MAX = 10  # What is the max 'level' a transform could be predicted
+
+
+def get_mean_and_std():
+  #if FLAGS.task_name == "cifar10":
+  means = [0.49139968, 0.48215841, 0.44653091]
+  stds = [0.24703223, 0.24348513, 0.26158784]
+  #elif FLAGS.task_name == "svhn":
+  #  means = [0.4376821, 0.4437697, 0.47280442]
+  #  stds = [0.19803012, 0.20101562, 0.19703614]
+  #else:
+  #  assert False
+  return means, stds
+
+
+def random_flip(x):
+  """Flip the input x horizontally with 50% probability."""
+  if np.random.rand(1)[0] > 0.5:
+    return np.fliplr(x)
+  return x
+
+
+def zero_pad_and_crop(img, amount=4):
+  """Zero pad by `amount` zero pixels on each side then take a random crop.
+
+  Args:
+    img: numpy image that will be zero padded and cropped.
+    amount: amount of zeros to pad `img` with horizontally and verically.
+
+  Returns:
+    The cropped zero padded img. The returned numpy array will be of the same
+    shape as `img`.
+  """
+  padded_img = np.zeros((img.shape[0] + amount * 2, img.shape[1] + amount * 2,
+                         img.shape[2]))
+  padded_img[amount:img.shape[0] + amount, amount:
+             img.shape[1] + amount, :] = img
+  top = np.random.randint(low=0, high=2 * amount)
+  left = np.random.randint(low=0, high=2 * amount)
+  new_img = padded_img[top:top + img.shape[0], left:left + img.shape[1], :]
+  return new_img
+
+
+def create_cutout_mask(img_height, img_width, num_channels, size):
+  """Creates a zero mask used for cutout of shape `img_height` x `img_width`.
+
+  Args:
+    img_height: Height of image cutout mask will be applied to.
+    img_width: Width of image cutout mask will be applied to.
+    num_channels: Number of channels in the image.
+    size: Size of the zeros mask.
+
+  Returns:
+    A mask of shape `img_height` x `img_width` with all ones except for a
+    square of zeros of shape `size` x `size`. This mask is meant to be
+    elementwise multiplied with the original image. Additionally returns
+    the `upper_coord` and `lower_coord` which specify where the cutout mask
+    will be applied.
+  """
+  assert img_height == img_width
+
+  # Sample center where cutout mask will be applied
+  height_loc = np.random.randint(low=0, high=img_height)
+  width_loc = np.random.randint(low=0, high=img_width)
+
+  # Determine upper right and lower left corners of patch
+  upper_coord = (max(0, height_loc - size // 2), max(0, width_loc - size // 2))
+  lower_coord = (min(img_height, height_loc + size // 2),
+                 min(img_width, width_loc + size // 2))
+  mask_height = lower_coord[0] - upper_coord[0]
+  mask_width = lower_coord[1] - upper_coord[1]
+  assert mask_height > 0
+  assert mask_width > 0
+
+  mask = np.ones((img_height, img_width, num_channels))
+  zeros = np.zeros((mask_height, mask_width, num_channels))
+  mask[upper_coord[0]:lower_coord[0], upper_coord[1]:lower_coord[1], :] = (
+      zeros)
+  return mask, upper_coord, lower_coord
+
+
+def cutout_numpy(img, size=16):
+  """Apply cutout with mask of shape `size` x `size` to `img`.
+
+  The cutout operation is from the paper https://arxiv.org/abs/1708.04552.
+  This operation applies a `size`x`size` mask of zeros to a random location
+  within `img`.
+
+  Args:
+    img: Numpy image that cutout will be applied to.
+    size: Height/width of the cutout mask that will be
+
+  Returns:
+    A numpy tensor that is the result of applying the cutout mask to `img`.
+  """
+  img_height, img_width, num_channels = (img.shape[0], img.shape[1],
+                                         img.shape[2])
+  assert len(img.shape) == 3
+  mask, _, _ = create_cutout_mask(img_height, img_width, num_channels, size)
+  return img * mask
+
+
+def float_parameter(level, maxval):
+  """Helper function to scale `val` between 0 and maxval .
+
+  Args:
+    level: Level of the operation that will be between [0, `PARAMETER_MAX`].
+    maxval: Maximum value that the operation can have. This will be scaled
+      to level/PARAMETER_MAX.
+
+  Returns:
+    A float that results from scaling `maxval` according to `level`.
+  """
+  return float(level) * maxval / PARAMETER_MAX
+
+
+def int_parameter(level, maxval):
+  """Helper function to scale `val` between 0 and maxval .
+
+  Args:
+    level: Level of the operation that will be between [0, `PARAMETER_MAX`].
+    maxval: Maximum value that the operation can have. This will be scaled
+      to level/PARAMETER_MAX.
+
+  Returns:
+    An int that results from scaling `maxval` according to `level`.
+  """
+  return int(level * maxval / PARAMETER_MAX)
+
+
+def pil_wrap(img, use_mean_std):
+  """Convert the `img` numpy tensor to a PIL Image."""
+
+  if use_mean_std:
+    MEANS, STDS = get_mean_and_std()
+  else:
+    MEANS = [0, 0, 0]
+    STDS = [1, 1, 1]
+  img_ori = (img * STDS + MEANS) * 255
+
+  return Image.fromarray(
+      np.uint8((img * STDS + MEANS) * 255.0)).convert('RGBA')
+
+
+def pil_unwrap(pil_img, use_mean_std, img_shape):
+  """Converts the PIL img to a numpy array."""
+  if use_mean_std:
+    MEANS, STDS = get_mean_and_std()
+  else:
+    MEANS = [0, 0, 0]
+    STDS = [1, 1, 1]
+  pic_array = np.array(pil_img.getdata()).reshape((img_shape[0], img_shape[1], 4)) / 255.0
+  i1, i2 = np.where(pic_array[:, :, 3] == 0)
+  pic_array = (pic_array[:, :, :3] - MEANS) / STDS
+  pic_array[i1, i2] = [0, 0, 0]
+  return pic_array
+
+
+def apply_policy(policy, img, use_mean_std=True):
+  """Apply the `policy` to the numpy `img`.
+
+  Args:
+    policy: A list of tuples with the form (name, probability, level) where
+      `name` is the name of the augmentation operation to apply, `probability`
+      is the probability of applying the operation and `level` is what strength
+      the operation to apply.
+    img: Numpy image that will have `policy` applied to it.
+
+  Returns:
+    The result of applying `policy` to `img`.
+  """
+  img_shape = img.shape
+  pil_img = pil_wrap(img, use_mean_std)
+  for xform in policy:
+    assert len(xform) == 3
+    name, probability, level = xform
+    xform_fn = NAME_TO_TRANSFORM[name].pil_transformer(
+        probability, level, img_shape)
+    pil_img = xform_fn(pil_img)
+  return pil_unwrap(pil_img, use_mean_std, img_shape)
+
+
+class TransformFunction(object):
+  """Wraps the Transform function for pretty printing options."""
+
+  def __init__(self, func, name):
+    self.f = func
+    self.name = name
+
+  def __repr__(self):
+    return '<' + self.name + '>'
+
+  def __call__(self, pil_img):
+    return self.f(pil_img)
+
+
+class TransformT(object):
+  """Each instance of this class represents a specific transform."""
+
+  def __init__(self, name, xform_fn):
+    self.name = name
+    self.xform = xform_fn
+
+  def pil_transformer(self, probability, level, img_shape):
+
+    def return_function(im):
+      if random.random() < probability:
+        im = self.xform(im, level, img_shape)
+      return im
+
+    name = self.name + '({:.1f},{})'.format(probability, level)
+    return TransformFunction(return_function, name)
+
+
+################## Transform Functions ##################
+# The transforms in this group ignore both `level` and the image-shape
+# argument: each one applies a fixed PIL operation.
+
+# Returns the image unchanged.
+identity = TransformT('identity', lambda pil_img, level, _: pil_img)
+# Mirrors the image left-to-right.
+flip_lr = TransformT(
+    'FlipLR',
+    lambda pil_img, level, _: pil_img.transpose(Image.FLIP_LEFT_RIGHT))
+# Mirrors the image top-to-bottom.
+flip_ud = TransformT(
+    'FlipUD',
+    lambda pil_img, level, _: pil_img.transpose(Image.FLIP_TOP_BOTTOM))
+# The three ImageOps transforms below run on an 'RGB' copy of the image and
+# convert the result back to 'RGBA'.
+# pylint:disable=g-long-lambda
+auto_contrast = TransformT(
+    'AutoContrast',
+    lambda pil_img, level, _: ImageOps.autocontrast(
+        pil_img.convert('RGB')).convert('RGBA'))
+equalize = TransformT(
+    'Equalize',
+    lambda pil_img, level, _: ImageOps.equalize(
+        pil_img.convert('RGB')).convert('RGBA'))
+invert = TransformT(
+    'Invert',
+    lambda pil_img, level, _: ImageOps.invert(
+        pil_img.convert('RGB')).convert('RGBA'))
+# pylint:enable=g-long-lambda
+# Applies PIL's predefined BLUR filter.
+blur = TransformT(
+    'Blur', lambda pil_img, level, _: pil_img.filter(ImageFilter.BLUR))
+# Applies PIL's predefined SMOOTH filter.
+smooth = TransformT(
+    'Smooth',
+    lambda pil_img, level, _: pil_img.filter(ImageFilter.SMOOTH))
+
+
+def _rotate_impl(pil_img, level, _):
+  """Rotates `pil_img` from -30 to 30 degrees depending on `level`."""
+  degrees = int_parameter(level, 30)
+  if random.random() > 0.5:
+    degrees = -degrees
+  return pil_img.rotate(degrees)
+
+
+rotate = TransformT('Rotate', _rotate_impl)
+
+
+def _posterize_impl(pil_img, level, _):
+  """Applies PIL Posterize to `pil_img`."""
+  level = int_parameter(level, 4)
+  return ImageOps.posterize(pil_img.convert('RGB'), 4 - level).convert('RGBA')
+
+
+posterize = TransformT('Posterize', _posterize_impl)
+
+
+def _shear_x_impl(pil_img, level, img_shape):
+  """Applies PIL ShearX to `pil_img`.
+
+  The ShearX operation shears the image along the horizontal axis with `level`
+  magnitude.
+
+  Args:
+    pil_img: Image in PIL object.
+    level: Strength of the operation specified as an Integer from
+      [0, `PARAMETER_MAX`].
+
+  Returns:
+    A PIL Image that has had ShearX applied to it.
+  """
+  level = float_parameter(level, 0.3)
+  if random.random() > 0.5:
+    level = -level
+  return pil_img.transform(
+      (img_shape[0], img_shape[1]),
+      Image.AFFINE,
+      (1, level, 0, 0, 1, 0))
+
+
+shear_x = TransformT('ShearX', _shear_x_impl)
+
+
+def _shear_y_impl(pil_img, level, img_shape):
+  """Applies PIL ShearY to `pil_img`.
+
+  The ShearY operation shears the image along the vertical axis with `level`
+  magnitude.
+
+  Args:
+    pil_img: Image in PIL object.
+    level: Strength of the operation specified as an Integer from
+      [0, `PARAMETER_MAX`].
+
+  Returns:
+    A PIL Image that has had ShearX applied to it.
+  """
+  level = float_parameter(level, 0.3)
+  if random.random() > 0.5:
+    level = -level
+  return pil_img.transform(
+      (img_shape[0], img_shape[1]),
+      Image.AFFINE,
+      (1, 0, 0, level, 1, 0))
+
+
+shear_y = TransformT('ShearY', _shear_y_impl)
+
+
+def _translate_x_impl(pil_img, level, img_shape):
+  """Applies PIL TranslateX to `pil_img`.
+
+  Translate the image in the horizontal direction by `level`
+  number of pixels.
+
+  Args:
+    pil_img: Image in PIL object.
+    level: Strength of the operation specified as an Integer from
+      [0, `PARAMETER_MAX`].
+
+  Returns:
+    A PIL Image that has had TranslateX applied to it.
+  """
+  level = int_parameter(level, 10)
+  if random.random() > 0.5:
+    level = -level
+  return pil_img.transform(
+      (img_shape[0], img_shape[1]),
+      Image.AFFINE,
+      (1, 0, level, 0, 1, 0))
+
+
+translate_x = TransformT('TranslateX', _translate_x_impl)
+
+
+def _translate_y_impl(pil_img, level, img_shape):
+  """Applies PIL TranslateY to `pil_img`.
+
+  Translate the image in the vertical direction by `level`
+  number of pixels.
+
+  Args:
+    pil_img: Image in PIL object.
+    level: Strength of the operation specified as an Integer from
+      [0, `PARAMETER_MAX`].
+
+  Returns:
+    A PIL Image that has had TranslateY applied to it.
+  """
+  level = int_parameter(level, 10)
+  if random.random() > 0.5:
+    level = -level
+  return pil_img.transform(
+      (img_shape[0], img_shape[1]),
+      Image.AFFINE,
+      (1, 0, 0, 0, 1, level))
+
+
+translate_y = TransformT('TranslateY', _translate_y_impl)
+
+
+def _crop_impl(pil_img, level, img_shape, interpolation=Image.BILINEAR):
+  """Applies a crop to `pil_img` with the size depending on the `level`."""
+  cropped = pil_img.crop((level, level, img_shape[0] - level, img_shape[1] - level))
+  resized = cropped.resize((img_shape[0], img_shape[1]), interpolation)
+  return resized
+
+
+crop_bilinear = TransformT('CropBilinear', _crop_impl)
+
+
+def _solarize_impl(pil_img, level, _):
+  """Applies PIL Solarize to `pil_img`.
+
+  Translate the image in the vertical direction by `level`
+  number of pixels.
+
+  Args:
+    pil_img: Image in PIL object.
+    level: Strength of the operation specified as an Integer from
+      [0, `PARAMETER_MAX`].
+
+  Returns:
+    A PIL Image that has had Solarize applied to it.
+  """
+  level = int_parameter(level, 256)
+  return ImageOps.solarize(pil_img.convert('RGB'), 256 - level).convert('RGBA')
+
+
+solarize = TransformT('Solarize', _solarize_impl)
+
+
+def _cutout_pil_impl(pil_img, level, img_shape):
+  """Apply cutout to pil_img at the specified level."""
+  size = int_parameter(level, 20)
+  if size <= 0:
+    return pil_img
+  img_height, img_width, num_channels = (img_shape[0], img_shape[1], 3)
+  _, upper_coord, lower_coord = (
+      create_cutout_mask(img_height, img_width, num_channels, size))
+  pixels = pil_img.load()  # create the pixel map
+  for i in range(upper_coord[0], lower_coord[0]):  # for every col:
+    for j in range(upper_coord[1], lower_coord[1]):  # For every row
+      pixels[i, j] = (125, 122, 113, 0)  # set the colour accordingly
+  return pil_img
+
+cutout = TransformT('Cutout', _cutout_pil_impl)
+
+
+def _enhancer_impl(enhancer):
+  """Sets level to be between 0.1 and 1.8 for ImageEnhance transforms of PIL."""
+  def impl(pil_img, level, _):
+    v = float_parameter(level, 1.8) + .1  # going to 0 just destroys it
+    return enhancer(pil_img).enhance(v)
+  return impl
+
+
+color = TransformT('Color', _enhancer_impl(ImageEnhance.Color))
+contrast = TransformT('Contrast', _enhancer_impl(ImageEnhance.Contrast))
+brightness = TransformT('Brightness', _enhancer_impl(
+    ImageEnhance.Brightness))
+sharpness = TransformT('Sharpness', _enhancer_impl(ImageEnhance.Sharpness))
+
+ALL_TRANSFORMS = [
+    flip_lr,
+    flip_ud,
+    auto_contrast,
+    equalize,
+    invert,
+    rotate,
+    posterize,
+    crop_bilinear,
+    solarize,
+    color,
+    contrast,
+    brightness,
+    sharpness,
+    shear_x,
+    shear_y,
+    translate_x,
+    translate_y,
+    cutout,
+    blur,
+    smooth
+]
+
+NAME_TO_TRANSFORM = {t.name: t for t in ALL_TRANSFORMS}
+TRANSFORM_NAMES = NAME_TO_TRANSFORM.keys()
--- a/higher/res/Aug_mod(Data_augV5(Uniform-13TFx1-MagFxSh)-LeNet)-100
+++ b/higher/res/Aug_mod(Data_augV5(Uniform-13TFx1-MagFxSh)-LeNet)-100
--- a/higher/res/Aug_mod(Data_augV5(Uniform-13TFx1-MagFxSh)-LeNet)-100
+++ b/higher/res/Aug_mod(Data_augV5(Uniform-13TFx1-MagFxSh)-LeNet)-100
--- a/higher/res/Aug_mod(Data_augV5(Uniform-13TFx2-MagFxSh)-LeNet)-100
+++ b/higher/res/Aug_mod(Data_augV5(Uniform-13TFx2-MagFxSh)-LeNet)-100
--- a/higher/res/Aug_mod(Data_augV5(Uniform-13TFx2-MagFxSh)-LeNet)-100
+++ b/higher/res/Aug_mod(Data_augV5(Uniform-13TFx2-MagFxSh)-LeNet)-100
--- a/higher/res/Aug_mod(Data_augV5(Uniform-14TFx2-Mag)-LeNet)-100
+++ b/higher/res/Aug_mod(Data_augV5(Uniform-14TFx2-Mag)-LeNet)-100
--- a/higher/res/Aug_mod(Data_augV5(Uniform-14TFx2-MagFxSh)-LeNet)-100
+++ b/higher/res/Aug_mod(Data_augV5(Uniform-14TFx2-MagFxSh)-LeNet)-100
--- a/higher/res/Aug_mod(Data_augV5(Uniform-14TFx2-MagFxSh)-LeNet)-100
+++ b/higher/res/Aug_mod(Data_augV5(Uniform-14TFx2-MagFxSh)-LeNet)-100
--- a/higher/res/Aug_mod(Data_augV5(Uniform-15TFx1-MagFxSh)-LeNet)-100
+++ b/higher/res/Aug_mod(Data_augV5(Uniform-15TFx1-MagFxSh)-LeNet)-100
--- a/higher/res/Aug_mod(Data_augV5(Uniform-15TFx1-MagFxSh)-LeNet)-100
+++ b/higher/res/Aug_mod(Data_augV5(Uniform-15TFx1-MagFxSh)-LeNet)-100
--- a/higher/res/Aug_mod(Data_augV5(Uniform-15TFx1-MagFxSh)-LeNet)-100
+++ b/higher/res/Aug_mod(Data_augV5(Uniform-15TFx1-MagFxSh)-LeNet)-100
--- a/higher/res/Aug_mod(Data_augV5(Uniform-20TFx1-MagFxSh)-LeNet)-100
+++ b/higher/res/Aug_mod(Data_augV5(Uniform-20TFx1-MagFxSh)-LeNet)-100
--- a/higher/res/Aug_mod(Data_augV5(Uniform-3TFx1-MagFxSh)-LeNet)-100
+++ b/higher/res/Aug_mod(Data_augV5(Uniform-3TFx1-MagFxSh)-LeNet)-100
--- a/higher/res/Aug_mod(Data_augV5(Uniform-4TFx1-MagFxSh)-LeNet)-100
+++ b/higher/res/Aug_mod(Data_augV5(Uniform-4TFx1-MagFxSh)-LeNet)-100
--- a/higher/res/Aug_mod(Data_augV5(Uniform-7TFx1-MagFxSh)-LeNet)-100
+++ b/higher/res/Aug_mod(Data_augV5(Uniform-7TFx1-MagFxSh)-LeNet)-100
--- a/higher/res/Aug_mod(Data_augV5(Uniform-7TFx2-MagFxSh)-LeNet)-100
+++ b/higher/res/Aug_mod(Data_augV5(Uniform-7TFx2-MagFxSh)-LeNet)-100
--- a/higher/res/Aug_mod(Data_augV5(Uniform-9TFx1-MagFxSh)-LeNet)-100
+++ b/higher/res/Aug_mod(Data_augV5(Uniform-9TFx1-MagFxSh)-LeNet)-100
--- a/higher/res/Aug_mod(Data_augV5(Uniform-9TFx1-MagFxSh)-LeNet)-100
+++ b/higher/res/Aug_mod(Data_augV5(Uniform-9TFx1-MagFxSh)-LeNet)-100
--- a/higher/res/Aug_mod(Data_augV5(Uniform-9TFx1-MagFxSh)rand0,5-LeNet)-100
+++ b/higher/res/Aug_mod(Data_augV5(Uniform-9TFx1-MagFxSh)rand0,5-LeNet)-100
--- a/higher/res/Aug_mod(Data_augV5(UniformFx-14TFx1-Mag)-LeNet)-100
+++ b/higher/res/Aug_mod(Data_augV5(UniformFx-14TFx1-Mag)-LeNet)-100
--- a/higher/res/Aug_mod(Data_augV5(UniformFx-14TFx2-Mag)-LeNet)-100
+++ b/higher/res/Aug_mod(Data_augV5(UniformFx-14TFx2-Mag)-LeNet)-100
--- a/higher/res/Aug_mod(Data_augV5(UniformFx-17TFx1-Mag)-LeNet)-100
+++ b/higher/res/Aug_mod(Data_augV5(UniformFx-17TFx1-Mag)-LeNet)-100
--- a/higher/res/Aug_mod(Data_augV5(UniformFx-17TFx1-MagSh)-LeNet)-100
+++ b/higher/res/Aug_mod(Data_augV5(UniformFx-17TFx1-MagSh)-LeNet)-100
--- a/higher/res/Aug_mod(Data_augV5(UniformFx-17TFx2-MagSh)-LeNet)-100
+++ b/higher/res/Aug_mod(Data_augV5(UniformFx-17TFx2-MagSh)-LeNet)-100
--- a/higher/res/Aug_mod(Data_augV5(UniformFx-7TFx1-MagFxSh)-LeNet)-100
+++ b/higher/res/Aug_mod(Data_augV5(UniformFx-7TFx1-MagFxSh)-LeNet)-100
--- a/higher/res/Aug_mod(Data_augV5(UniformFx-7TFx2-MagFxSh)-LeNet)-100
+++ b/higher/res/Aug_mod(Data_augV5(UniformFx-7TFx2-MagFxSh)-LeNet)-100
--- a/higher/res/Aug_mod(Data_augV5(UniformFx-9TFx1-MagFxSh)-LeNet)-100
+++ b/higher/res/Aug_mod(Data_augV5(UniformFx-9TFx1-MagFxSh)-LeNet)-100
--- a/higher/res/Aug_mod(Data_augV6(Uniform-18TF(2)x1-MagFxSh)-LeNet)-100
+++ b/higher/res/Aug_mod(Data_augV6(Uniform-18TF(2)x1-MagFxSh)-LeNet)-100
--- a/higher/res/Aug_mod(Data_augV6(Uniform-18TF(2)x2-MagFxSh)-LeNet)-100
+++ b/higher/res/Aug_mod(Data_augV6(Uniform-18TF(2)x2-MagFxSh)-LeNet)-100
--- a/higher/res/Aug_mod(Data_augV6(Uniform-18TF(3)x1-MagFxSh)-LeNet)-100
+++ b/higher/res/Aug_mod(Data_augV6(Uniform-18TF(3)x1-MagFxSh)-LeNet)-100
--- a/higher/res/Aug_mod(Data_augV6(Uniform-18TF(3)x2-MagFxSh)-LeNet)-100
+++ b/higher/res/Aug_mod(Data_augV6(Uniform-18TF(3)x2-MagFxSh)-LeNet)-100
--- a/higher/res/Aug_mod(Data_augV6(Uniform-18TF(3)x2-MagFxSh)-LeNet)-100
+++ b/higher/res/Aug_mod(Data_augV6(Uniform-18TF(3)x2-MagFxSh)-LeNet)-100
--- a/higher/res/Aug_mod(RandAug(14TFx1-Mag1)-LeNet)-150
+++ b/higher/res/Aug_mod(RandAug(14TFx1-Mag1)-LeNet)-150
--- a/higher/res/Aug_mod(RandAug(14TFx2-Mag1)-LeNet)-150
+++ b/higher/res/Aug_mod(RandAug(14TFx2-Mag1)-LeNet)-150
--- a/higher/res/Aug_mod(RandAug(18TFx2-Mag1)-LeNet)-100
+++ b/higher/res/Aug_mod(RandAug(18TFx2-Mag1)-LeNet)-100
--- a/higher/res/Aug_mod(RandAugUDA(14TFx2-Mag1)-LeNet)-150
+++ b/higher/res/Aug_mod(RandAugUDA(14TFx2-Mag1)-LeNet)-150
--- a/higher/res/Aug_mod(RandAugUDA(18TFx2-Mag1)-LeNet)-100
+++ b/higher/res/Aug_mod(RandAugUDA(18TFx2-Mag1)-LeNet)-100
--- a/higher/res/brutus-tests/Aug_mod(Data_augV5(Mix0,5-14TFx1-Mag)-LeNet)-150epochs(dataug:0)-0in_it-0.png
+++ b/higher/res/brutus-tests/Aug_mod(Data_augV5(Mix0,5-14TFx1-Mag)-LeNet)-150epochs(dataug:0)-0in_it-0.png
--- a/higher/res/brutus-tests/Aug_mod(Data_augV5(Mix0,5-14TFx1-Mag)-LeNet)-150epochs(dataug:0)-1in_it-0.png
+++ b/higher/res/brutus-tests/Aug_mod(Data_augV5(Mix0,5-14TFx1-Mag)-LeNet)-150epochs(dataug:0)-1in_it-0.png
--- a/higher/res/brutus-tests/Aug_mod(Data_augV5(Uniform-14TFx4-MagFxSh)-LeNet)-150epochs(dataug:0)-0in_it-2.png
+++ b/higher/res/brutus-tests/Aug_mod(Data_augV5(Uniform-14TFx4-MagFxSh)-LeNet)-150epochs(dataug:0)-0in_it-2.png
--- a/higher/res/good_TF_tests/log/Aug_mod(Data_augV5(Mix0.5-6TFx1-MagFxSh)-LeNet)-100epochs(dataug:0)-0in_it-0.json
+++ b/higher/res/good_TF_tests/log/Aug_mod(Data_augV5(Mix0.5-6TFx1-MagFxSh)-LeNet)-100epochs(dataug:0)-0in_it-0.json
--- a/higher/res/good_TF_tests/log/Aug_mod(Data_augV5(Mix0.5-6TFx1-MagFxSh)-LeNet)-100epochs(dataug:0)-10in_it-0.json
+++ b/higher/res/good_TF_tests/log/Aug_mod(Data_augV5(Mix0.5-6TFx1-MagFxSh)-LeNet)-100epochs(dataug:0)-10in_it-0.json
--- a/higher/res/good_TF_tests/log/Aug_mod(Data_augV5(Uniform-6TFx1-MagFxSh)-LeNet)-100epochs(dataug:0)-0in_it-0.json
+++ b/higher/res/good_TF_tests/log/Aug_mod(Data_augV5(Uniform-6TFx1-MagFxSh)-LeNet)-100epochs(dataug:0)-0in_it-0.json
--- a/higher/res/good_TF_tests/log/Aug_mod(Data_augV5(Uniform-6TFx1-MagFxSh)-LeNet)-100epochs(dataug:0)-10in_it-0.json
+++ b/higher/res/good_TF_tests/log/Aug_mod(Data_augV5(Uniform-6TFx1-MagFxSh)-LeNet)-100epochs(dataug:0)-10in_it-0.json
--- a/higher/res/log/Aug_mod(Data_augV5(Uniform-13TFx1-MagFxSh)-LeNet)-100
+++ b/higher/res/log/Aug_mod(Data_augV5(Uniform-13TFx1-MagFxSh)-LeNet)-100
--- a/higher/res/log/Aug_mod(Data_augV5(Uniform-13TFx1-MagFxSh)-LeNet)-100
+++ b/higher/res/log/Aug_mod(Data_augV5(Uniform-13TFx1-MagFxSh)-LeNet)-100
--- a/higher/res/log/Aug_mod(Data_augV5(Uniform-13TFx2-MagFxSh)-LeNet)-100
+++ b/higher/res/log/Aug_mod(Data_augV5(Uniform-13TFx2-MagFxSh)-LeNet)-100
--- a/higher/res/log/Aug_mod(Data_augV5(Uniform-13TFx2-MagFxSh)-LeNet)-100
+++ b/higher/res/log/Aug_mod(Data_augV5(Uniform-13TFx2-MagFxSh)-LeNet)-100
--- a/higher/res/log/Aug_mod(Data_augV5(Uniform-14TFx2-Mag)-LeNet)-100
+++ b/higher/res/log/Aug_mod(Data_augV5(Uniform-14TFx2-Mag)-LeNet)-100
--- a/higher/res/log/Aug_mod(Data_augV5(Uniform-14TFx2-MagFxSh)-LeNet)-100
+++ b/higher/res/log/Aug_mod(Data_augV5(Uniform-14TFx2-MagFxSh)-LeNet)-100
--- a/higher/res/log/Aug_mod(Data_augV5(Uniform-14TFx2-MagFxSh)-LeNet)-100
+++ b/higher/res/log/Aug_mod(Data_augV5(Uniform-14TFx2-MagFxSh)-LeNet)-100
--- a/higher/res/log/Aug_mod(Data_augV5(Uniform-15TFx1-MagFxSh)-LeNet)-100
+++ b/higher/res/log/Aug_mod(Data_augV5(Uniform-15TFx1-MagFxSh)-LeNet)-100
--- a/higher/res/log/Aug_mod(Data_augV5(Uniform-15TFx1-MagFxSh)-LeNet)-100
+++ b/higher/res/log/Aug_mod(Data_augV5(Uniform-15TFx1-MagFxSh)-LeNet)-100
--- a/higher/res/log/Aug_mod(Data_augV5(Uniform-15TFx1-MagFxSh)-LeNet)-100
+++ b/higher/res/log/Aug_mod(Data_augV5(Uniform-15TFx1-MagFxSh)-LeNet)-100
--- a/higher/res/log/Aug_mod(Data_augV5(Uniform-20TFx1-MagFxSh)-LeNet)-100
+++ b/higher/res/log/Aug_mod(Data_augV5(Uniform-20TFx1-MagFxSh)-LeNet)-100
--- a/higher/res/log/Aug_mod(Data_augV5(Uniform-3TFx1-MagFxSh)-LeNet)-100
+++ b/higher/res/log/Aug_mod(Data_augV5(Uniform-3TFx1-MagFxSh)-LeNet)-100
--- a/higher/res/log/Aug_mod(Data_augV5(Uniform-4TFx1-MagFxSh)-LeNet)-100
+++ b/higher/res/log/Aug_mod(Data_augV5(Uniform-4TFx1-MagFxSh)-LeNet)-100
--- a/higher/res/log/Aug_mod(Data_augV5(Uniform-7TFx1-MagFxSh)-LeNet)-100
+++ b/higher/res/log/Aug_mod(Data_augV5(Uniform-7TFx1-MagFxSh)-LeNet)-100
--- a/higher/res/log/Aug_mod(Data_augV5(Uniform-7TFx2-MagFxSh)-LeNet)-100
+++ b/higher/res/log/Aug_mod(Data_augV5(Uniform-7TFx2-MagFxSh)-LeNet)-100
--- a/higher/res/log/Aug_mod(Data_augV5(Uniform-9TFx1-MagFxSh)-LeNet)-100
+++ b/higher/res/log/Aug_mod(Data_augV5(Uniform-9TFx1-MagFxSh)-LeNet)-100
--- a/higher/res/log/Aug_mod(Data_augV5(Uniform-9TFx1-MagFxSh)-LeNet)-100
+++ b/higher/res/log/Aug_mod(Data_augV5(Uniform-9TFx1-MagFxSh)-LeNet)-100
--- a/higher/res/log/Aug_mod(Data_augV5(Uniform-9TFx1-MagFxSh)rand0.5-LeNet)-100
+++ b/higher/res/log/Aug_mod(Data_augV5(Uniform-9TFx1-MagFxSh)rand0.5-LeNet)-100
--- a/higher/res/log/Aug_mod(Data_augV5(UniformFx-14TFx1-Mag)-LeNet)-100
+++ b/higher/res/log/Aug_mod(Data_augV5(UniformFx-14TFx1-Mag)-LeNet)-100
--- a/higher/res/log/Aug_mod(Data_augV5(UniformFx-14TFx2-Mag)-LeNet)-100
+++ b/higher/res/log/Aug_mod(Data_augV5(UniformFx-14TFx2-Mag)-LeNet)-100
--- a/higher/res/log/Aug_mod(Data_augV5(UniformFx-17TFx1-Mag)-LeNet)-100
+++ b/higher/res/log/Aug_mod(Data_augV5(UniformFx-17TFx1-Mag)-LeNet)-100
--- a/higher/res/log/Aug_mod(Data_augV5(UniformFx-17TFx1-MagSh)-LeNet)-100
+++ b/higher/res/log/Aug_mod(Data_augV5(UniformFx-17TFx1-MagSh)-LeNet)-100
--- a/higher/res/log/Aug_mod(Data_augV5(UniformFx-17TFx2-MagSh)-LeNet)-100
+++ b/higher/res/log/Aug_mod(Data_augV5(UniformFx-17TFx2-MagSh)-LeNet)-100
--- a/higher/res/log/Aug_mod(Data_augV5(UniformFx-7TFx1-MagFxSh)-LeNet)-100
+++ b/higher/res/log/Aug_mod(Data_augV5(UniformFx-7TFx1-MagFxSh)-LeNet)-100
--- a/higher/res/log/Aug_mod(Data_augV5(UniformFx-7TFx2-MagFxSh)-LeNet)-100
+++ b/higher/res/log/Aug_mod(Data_augV5(UniformFx-7TFx2-MagFxSh)-LeNet)-100
--- a/higher/res/log/Aug_mod(Data_augV5(UniformFx-9TFx1-MagFxSh)-LeNet)-100
+++ b/higher/res/log/Aug_mod(Data_augV5(UniformFx-9TFx1-MagFxSh)-LeNet)-100
--- a/higher/res/log/Aug_mod(Data_augV6(Uniform-14TFx1-MagFxSh)-LeNet)-100
+++ b/higher/res/log/Aug_mod(Data_augV6(Uniform-14TFx1-MagFxSh)-LeNet)-100
--- a/higher/res/log/Aug_mod(Data_augV6(Uniform-18TF(2)x1-MagFxSh)-LeNet)-100
+++ b/higher/res/log/Aug_mod(Data_augV6(Uniform-18TF(2)x1-MagFxSh)-LeNet)-100
--- a/higher/res/log/Aug_mod(Data_augV6(Uniform-18TF(2)x2-MagFxSh)-LeNet)-100
+++ b/higher/res/log/Aug_mod(Data_augV6(Uniform-18TF(2)x2-MagFxSh)-LeNet)-100
--- a/higher/res/log/Aug_mod(Data_augV6(Uniform-18TF(3)x1-MagFxSh)-LeNet)-100
+++ b/higher/res/log/Aug_mod(Data_augV6(Uniform-18TF(3)x1-MagFxSh)-LeNet)-100
--- a/higher/res/log/Aug_mod(Data_augV6(Uniform-18TF(3)x2-MagFxSh)-LeNet)-100
+++ b/higher/res/log/Aug_mod(Data_augV6(Uniform-18TF(3)x2-MagFxSh)-LeNet)-100
--- a/higher/res/log/Aug_mod(Data_augV6(Uniform-18TF(3)x2-MagFxSh)-LeNet)-100
+++ b/higher/res/log/Aug_mod(Data_augV6(Uniform-18TF(3)x2-MagFxSh)-LeNet)-100
--- a/higher/res/log/Aug_mod(Data_augV6(Uniform-18TFx1-MagFxSh)-LeNet)-100
+++ b/higher/res/log/Aug_mod(Data_augV6(Uniform-18TFx1-MagFxSh)-LeNet)-100
--- a/higher/res/log/Aug_mod(Data_augV6(Uniform-18TFx2-MagFxSh)-LeNet)-100
+++ b/higher/res/log/Aug_mod(Data_augV6(Uniform-18TFx2-MagFxSh)-LeNet)-100
--- a/higher/res/log/Aug_mod(RandAug(14TFx1-Mag1)-LeNet)-150
+++ b/higher/res/log/Aug_mod(RandAug(14TFx1-Mag1)-LeNet)-150
--- a/higher/res/log/Aug_mod(RandAug(14TFx2-Mag1)-LeNet)-150
+++ b/higher/res/log/Aug_mod(RandAug(14TFx2-Mag1)-LeNet)-150
--- a/higher/res/log/Aug_mod(RandAug(18TFx2-Mag1)-LeNet)-100
+++ b/higher/res/log/Aug_mod(RandAug(18TFx2-Mag1)-LeNet)-100
--- a/higher/res/log/Aug_mod(RandAugUDA(14TFx2-Mag1)-LeNet)-150
+++ b/higher/res/log/Aug_mod(RandAugUDA(14TFx2-Mag1)-LeNet)-150
--- a/higher/res/log/Aug_mod(RandAugUDA(18TFx2-Mag1)-LeNet)-100
+++ b/higher/res/log/Aug_mod(RandAugUDA(18TFx2-Mag1)-LeNet)-100