Convert RNN generation to TF v2. #1978

Merged
merged 19 commits into from Aug 19, 2020
263 changes: 128 additions & 135 deletions src/python/bot/fuzzers/ml/rnn/train.py
@@ -26,10 +26,6 @@
import tensorflow as tf
import time

# TODO(mmoroz): Use replacements for Tensorflow 2.x
from tensorflow.contrib import layers
from tensorflow.contrib import rnn

from bot.fuzzers.ml.rnn import constants
from bot.fuzzers.ml.rnn import utils

@@ -49,6 +45,77 @@
# to use an insufficient amount of training data.


def build_model(num_rnn_cells, dropout_pkeep, batch_size, debug):
"""Build the RNN model.

Since we use a stateful Keras sequential model and different batch sizes for
training, validation and demo output generation, we use this function to
rebuild the model at the batch size each stage needs.

Args:
num_rnn_cells: number of RNN cells to use.
dropout_pkeep: probability of keeping a node in dropout.
batch_size: batch size used by the model layer.
debug: if True, print a summary of the model.

Returns:
Keras Sequential RNN model.
"""
dropout_pdrop = 1 - dropout_pkeep
model = tf.keras.Sequential([
tf.keras.layers.Embedding(
constants.ALPHA_SIZE,
constants.ALPHA_SIZE,
batch_input_shape=[batch_size, None]),
tf.keras.layers.GRU(
num_rnn_cells,
return_sequences=True,
stateful=True,
dropout=dropout_pdrop),
tf.keras.layers.Dense(constants.ALPHA_SIZE),
])

# Display a summary of the model to debug shapes.
if debug:
model.summary()

return model
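
# A minimal sketch of the rebatching pattern this function enables; the cell
# count, dropout value and checkpoint prefix below are hypothetical, not part
# of this PR. The weights are independent of the batch dimension, so they can
# be saved from a large-batch training model and loaded into a batch-size-1
# generation model.
sketch_train_model = build_model(
    num_rnn_cells=384, dropout_pkeep=0.8, batch_size=100, debug=False)
sketch_train_model.save_weights('/tmp/rnn_sketch_ckpt')
sketch_demo_model = build_model(
    num_rnn_cells=384, dropout_pkeep=0.8, batch_size=1, debug=False)
sketch_demo_model.load_weights('/tmp/rnn_sketch_ckpt')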


@tf.function
def train_step(model, optimizer, input_data, expected_data, train=False):
"""Train the model for one step.

Args:
model: RNN model to train/predict.
optimizer: optimizer to use to train the model.
input_data: input sequence to the model.
expected_data: expected output of the model.
train: whether to apply gradient updates (True) or run inference only.

Returns:
Tuple containing the per-sequence loss between the expected and predicted
outputs, the mean loss over the batch, the accuracy metric value, and the
most likely predicted output bytes.
"""
with tf.GradientTape() as tape:
predicted_data = model(input_data)
loss = tf.keras.losses.sparse_categorical_crossentropy(
expected_data, predicted_data, from_logits=True)
seq_loss = tf.reduce_mean(input_tensor=loss, axis=1)
batch_loss = tf.reduce_mean(input_tensor=seq_loss)

output_bytes = tf.cast(
tf.argmax(predicted_data, axis=-1), expected_data.dtype)
accuracy = tf.reduce_mean(
tf.cast(tf.equal(expected_data, output_bytes), tf.float32))

if train:
grads = tape.gradient(loss, model.trainable_variables)
optimizer.apply_gradients(zip(grads, model.trainable_variables))

return seq_loss, batch_loss, accuracy, output_bytes
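
# A usage sketch for train_step; the shapes and constants here are
# illustrative assumptions, not values from this PR. input_data and
# expected_data are integer byte tensors of shape [batch_size, seqlen], with
# expected_data shifted one byte ahead since the model predicts the next byte.
sketch_model = build_model(
    num_rnn_cells=384, dropout_pkeep=0.8, batch_size=2, debug=False)
sketch_optimizer = tf.keras.optimizers.Adam(0.001)
sketch_x = tf.zeros([2, 16], dtype=tf.int32)  # placeholder input bytes
sketch_y = tf.zeros([2, 16], dtype=tf.int32)  # placeholder next-byte targets
seq_loss, batch_loss, accuracy, predicted = train_step(
    sketch_model, sketch_optimizer, sketch_x, sketch_y, train=True)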


def main(args):
"""Main function to train the model.

@@ -101,90 +168,27 @@ def main(args):
epoch_size = len(code_text) // (batch_size * constants.TRAINING_SEQLEN)
utils.print_data_stats(len(code_text), len(validation_text), epoch_size)

# Set graph-level random seed, so any random sequence generated in this
# graph is repeatable. It could also be removed.
tf.compat.v1.set_random_seed(0)

# Define placeholder for learning rate, dropout and batch size.
lr = tf.compat.v1.placeholder(tf.float32, name='lr')
pkeep = tf.compat.v1.placeholder(tf.float32, name='pkeep')
batchsize = tf.compat.v1.placeholder(tf.int32, name='batchsize')

# Input data.
input_bytes = tf.compat.v1.placeholder(
tf.uint8, [None, None], name='input_bytes')
input_onehot = tf.one_hot(input_bytes, constants.ALPHA_SIZE, 1.0, 0.0)

# Expected outputs = same sequence shifted by 1, since we are trying to
# predict the next character.
expected_bytes = tf.compat.v1.placeholder(
tf.uint8, [None, None], name='expected_bytes')
expected_onehot = tf.one_hot(expected_bytes, constants.ALPHA_SIZE, 1.0, 0.0)

# Input state.
hidden_state = tf.compat.v1.placeholder(
tf.float32, [None, hidden_state_size * hidden_layer_size],
name='hidden_state')

# "naive dropout" implementation.
cells = [rnn.GRUCell(hidden_state_size) for _ in range(hidden_layer_size)]
dropcells = [
rnn.DropoutWrapper(cell, input_keep_prob=pkeep) for cell in cells
]
multicell = rnn.MultiRNNCell(dropcells, state_is_tuple=False)
multicell = rnn.DropoutWrapper(multicell, output_keep_prob=pkeep)

output_raw, next_state = tf.compat.v1.nn.dynamic_rnn(
multicell, input_onehot, dtype=tf.float32, initial_state=hidden_state)
next_state = tf.identity(next_state, name='next_state')

# Reshape training outputs.
output_flat = tf.reshape(output_raw, [-1, hidden_state_size])
output_logits = layers.linear(output_flat, constants.ALPHA_SIZE)

# Reshape expected outputs.
expected_flat = tf.reshape(expected_onehot, [-1, constants.ALPHA_SIZE])

# Compute training loss.
loss = tf.nn.softmax_cross_entropy_with_logits(
logits=output_logits, labels=expected_flat)
loss = tf.reshape(loss, [batchsize, -1])

# Use softmax to normalize training outputs.
output_onehot = tf.nn.softmax(output_logits, name='output_onehot')

# Use argmax to get the max value, which is the predicted bytes.
output_bytes = tf.argmax(input=output_onehot, axis=1)
output_bytes = tf.reshape(output_bytes, [batchsize, -1], name='output_bytes')
# Set global random seed, so any random sequence generated is repeatable.
# It could also be removed.
tf.random.set_seed(0)

# Build the RNN model.
model = build_model(hidden_layer_size * hidden_state_size, dropout_pkeep,
batch_size, debug)

# Choose Adam optimizer to compute gradients.
optimizer = tf.compat.v1.train.AdamOptimizer(lr).minimize(loss)

# Stats for display.
seqloss = tf.reduce_mean(input_tensor=loss, axis=1)
batchloss = tf.reduce_mean(input_tensor=seqloss)
accuracy = tf.reduce_mean(
input_tensor=tf.cast(
tf.equal(expected_bytes, tf.cast(output_bytes, tf.uint8)),
tf.float32))
loss_summary = tf.compat.v1.summary.scalar('batch_loss', batchloss)
acc_summary = tf.compat.v1.summary.scalar('batch_accuracy', accuracy)
summaries = tf.compat.v1.summary.merge([loss_summary, acc_summary])
optimizer = tf.keras.optimizers.Adam(learning_rate)

# Init Tensorboard stuff.
# This will save Tensorboard information in folder specified in command line.
# Two sets of data are saved so that you can compare training and
# validation curves visually in Tensorboard.
timestamp = str(math.trunc(time.time()))
summary_writer = tf.compat.v1.summary.FileWriter(
summary_writer = tf.summary.create_file_writer(
os.path.join(log_dir, timestamp + '-training'))
validation_writer = tf.compat.v1.summary.FileWriter(
validation_writer = tf.summary.create_file_writer(
os.path.join(log_dir, timestamp + '-validation'))

# Init for saving models.
# They will be saved into a directory specified in command line.
saver = tf.compat.v1.train.Saver(max_to_keep=constants.MAX_TO_KEEP)

# For display: init the progress bar.
step_size = batch_size * constants.TRAINING_SEQLEN
frequency = constants.DISPLAY_FREQ * step_size
@@ -193,15 +197,11 @@ def main(args):
size=constants.DISPLAY_LEN,
msg='Training on next {} batches'.format(constants.DISPLAY_FREQ))

# Set initial state.
state = np.zeros([batch_size, hidden_state_size * hidden_layer_size])
session = tf.compat.v1.Session()

# We continue training on exsiting model, or start with a new model.
# We continue training on existing model, or start with a new model.
if existing_model:
print('Continue training on existing model: {}'.format(existing_model))
try:
saver.restore(session, existing_model)
model.load_weights(existing_model)
except:
print(
('Failed to restore existing model since model '
@@ -210,7 +210,6 @@
return constants.ExitCode.TENSORFLOW_ERROR
else:
print('No existing model provided. Start training with a new model.')
session.run(tf.compat.v1.global_variables_initializer())

# Num of bytes we have trained so far.
steps = 0
@@ -223,35 +222,19 @@
nb_epochs=constants.EPOCHS):

# Train on one mini-batch.
feed_dict = {
input_bytes: input_batch,
expected_bytes: expected_batch,
hidden_state: state,
lr: learning_rate,
pkeep: dropout_pkeep,
batchsize: batch_size
}

_, predicted, new_state = session.run(
[optimizer, output_bytes, next_state], feed_dict=feed_dict)
seq_loss, batch_loss, accuracy, output_bytes = train_step(
model, optimizer, input_batch, expected_batch, train=True)

# Log training data for Tensorboard display a mini-batch of sequences
# every `frequency` batches.
if debug and steps % frequency == 0:
feed_dict = {
input_bytes: input_batch,
expected_bytes: expected_batch,
hidden_state: state,
pkeep: 1.0,
batchsize: batch_size
}
predicted, seq_loss, batch_loss, acc_value, summaries_value = session.run(
[output_bytes, seqloss, batchloss, accuracy, summaries],
feed_dict=feed_dict)
utils.print_learning_learned_comparison(
input_batch, predicted, seq_loss, input_ranges, batch_loss, acc_value,
epoch_size, steps, epoch)
summary_writer.add_summary(summaries_value, steps)
input_batch, output_bytes, seq_loss, input_ranges, batch_loss,
accuracy, epoch_size, steps, epoch)
with summary_writer.as_default(): # pylint: disable=not-context-manager
tf.summary.scalar('batch_loss', batch_loss, step=steps)
tf.summary.scalar('batch_accuracy', accuracy, step=steps)
summary_writer.flush()

# Run a validation step every `frequency` batches.
# The validation text should be a single sequence but that's too slow.
@@ -261,21 +244,27 @@ def main(args):
validation_x, validation_y, _ = next(
utils.rnn_minibatch_sequencer(validation_text, validation_batch_size,
constants.VALIDATION_SEQLEN, 1))
null_state = np.zeros(
[validation_batch_size, hidden_state_size * hidden_layer_size])
feed_dict = {
input_bytes: validation_x,
expected_bytes: validation_y,
hidden_state: null_state,
pkeep: 1.0,
batchsize: validation_batch_size
}
batch_loss, acc_value, summaries_value = session.run(
[batchloss, accuracy, summaries], feed_dict=feed_dict)
utils.print_validation_stats(batch_loss, acc_value)

validation_model = build_model(hidden_layer_size * hidden_state_size,
dropout_pkeep, validation_batch_size,
False)
last_weights = tf.train.latest_checkpoint(model_dir)
if last_weights:
validation_model.load_weights(last_weights)
validation_model.build(tf.TensorShape([validation_batch_size, None]))
validation_model.reset_states()

# Run a single inference step.
_, batch_loss, accuracy, _ = train_step(
validation_model, optimizer, validation_x, validation_y, train=False)

utils.print_validation_stats(batch_loss, accuracy)

# Save validation data for Tensorboard.
validation_writer.add_summary(summaries_value, steps)
with validation_writer.as_default(): # pylint: disable=not-context-manager
tf.summary.scalar('batch_loss', batch_loss, step=steps)
tf.summary.scalar('batch_accuracy', accuracy, step=steps)
validation_writer.flush()
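
# A sketch of the checkpoint-discovery guard above, assuming nothing beyond
# the documented TF API: tf.train.latest_checkpoint returns the prefix of the
# newest checkpoint in model_dir, or None before the first save, so loading
# must be skipped on the first validation pass.
sketch_ckpt = tf.train.latest_checkpoint(model_dir)
if sketch_ckpt is None:
  print('No checkpoint written yet; validating with fresh weights.')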

# Display a short text generated with the current weights and biases.
# If enabled, there will be a large output.
@@ -284,19 +273,24 @@
file_info = utils.random_element_from_list(files_info_list)
first_byte, file_size = file_info['first_byte'], file_info['file_size']
ry = np.array([[first_byte]])
rh = np.zeros([1, hidden_state_size * hidden_layer_size])
sample = [first_byte]

generation_model = build_model(hidden_layer_size * hidden_state_size,
dropout_pkeep, 1, False)
last_weights = tf.train.latest_checkpoint(model_dir)
if last_weights:
generation_model.load_weights(last_weights)
generation_model.build(tf.TensorShape([1, None]))
generation_model.reset_states()

for _ in range(file_size - 1):
feed_dict = {
input_bytes: ry,
pkeep: 1.0,
hidden_state: rh,
batchsize: 1
}
ryo, rh = session.run([output_onehot, next_state], feed_dict=feed_dict)
rc = utils.sample_from_probabilities(ryo, topn=10 if epoch <= 1 else 2)
prediction = generation_model(ry)
prediction = tf.squeeze(prediction, 0).numpy()
rc = utils.sample_from_probabilities(
prediction, topn=10 if epoch <= 1 else 2)
sample.append(rc)
ry = np.array([[rc]])

print(repr(utils.decode_to_text(sample)))
utils.print_text_generation_footer()
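
# A hedged sketch of the top-n sampling used above; this is an assumed
# implementation of utils.sample_from_probabilities, not the actual one, and
# it expects a probability (not logit) vector over the alphabet.
def sketch_sample_topn(probabilities, topn):
  p = np.squeeze(probabilities).astype(np.float64)
  p[np.argsort(p)[:-topn]] = 0  # keep only the topn most likely bytes
  p /= np.sum(p)  # renormalize to a valid distribution
  return np.random.choice(constants.ALPHA_SIZE, p=p)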

@@ -305,22 +299,21 @@
if steps // 10 % frequency == 0:
saved_model_name = constants.RNN_MODEL_NAME + '_' + timestamp
saved_model_path = os.path.join(model_dir, saved_model_name)
saved_model = saver.save(session, saved_model_path, global_step=steps)
print('Saved model: {}'.format(saved_model))
model.save_weights(saved_model_path)
print('Saved model: {}'.format(saved_model_path))

# Display progress bar.
if debug:
progress.step(reset=steps % frequency == 0)

# Update state.
state = new_state
steps += step_size

# Save the model after training is done.
saved_model_name = constants.RNN_MODEL_NAME + '_' + timestamp
saved_model_path = os.path.join(model_dir, saved_model_name)
saved_model = saver.save(session, saved_model_path, global_step=steps)
print('Saved model: {}'.format(saved_model))
model.save_weights(saved_model_path)
print('Saved model: {}'.format(saved_model_path))

return constants.ExitCode.SUCCESS

3 changes: 1 addition & 2 deletions src/python/bot/fuzzers/ml/rnn/utils.py
@@ -32,7 +32,6 @@
def validate_model_path(model_path):
"""RNN model consists of three files. This validates if they all exist."""
model_exists = (
os.path.exists(model_path + constants.MODEL_META_SUFFIX) and
os.path.exists(model_path + constants.MODEL_DATA_SUFFIX) and
os.path.exists(model_path + constants.MODEL_INDEX_SUFFIX))
return model_exists
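
# Context, stated as an assumption about the TF2 checkpoint format rather
# than something from this PR: model.save_weights('<prefix>') writes
# '<prefix>.index' and '<prefix>.data-*' files, and the legacy TF1
# '<prefix>.meta' graph file is no longer produced, which is why the META
# suffix check is dropped above. A hypothetical round trip:
#
#   model.save_weights('/tmp/rnn_model')
#   validate_model_path('/tmp/rnn_model')  # True once both files exist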
@@ -283,7 +282,7 @@ def print_progress():
for _ in range(maxi):
k = 0
while d >= 0:
print('=', end=' ')
print('=', end='')
sys.stdout.write('')
sys.stdout.flush()
k += 1