From charlesreid1

No edit summary
 
(9 intermediate revisions by the same user not shown)
Line 1: Line 1:
=MNIST Convolutional Neural Network=
=Simple MNIST Convolutional Network=


Concept: Simple, end-to-end, LeNet-5-like convolutional MNIST model example. Meant as a tutorial for simple convolutional models.
==Input Function==


Link to code: https://github.com/tensorflow/models/blob/master/tutorials/image/mnist/convolutional.py
Define an input function. This has an internal function that parses the example data (one piece of data at a time) and one-hot encodes the labeled images with the digit it corresponds to.
 
Link to tutorial(s): https://www.tensorflow.org/tutorials/
 
Link to original data set: http://yann.lecun.com/exdb/mnist/
 
==License==


<pre>
<pre>
# Copyright 2015 The TensorFlow Authors. All Rights Reserved.
def input_fn(mode, batch_size=1):
#
  """A simple input_fn using the contrib.data input pipeline."""
# Licensed under the Apache License, Version 2.0 (the "License");
# you may not use this file except in compliance with the License.
# You may obtain a copy of the License at
#
#    http://www.apache.org/licenses/LICENSE-2.0
#
# Unless required by applicable law or agreed to in writing, software
# distributed under the License is distributed on an "AS IS" BASIS,
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
# See the License for the specific language governing permissions and
# limitations under the License.
# ==============================================================================
</pre>


==Import Statements and Variables==
  def example_parser(serialized_example):
    """Parses a single tf.Example into image and label tensors."""
    features = tf.parse_single_example(
        serialized_example,
        features={
            'image_raw': tf.FixedLenFeature([], tf.string),
            'label': tf.FixedLenFeature([], tf.int64),
        })
    image = tf.decode_raw(features['image_raw'], tf.uint8)
    image.set_shape([28 * 28])


Import statements:
    # Normalize the values of the image from the range [0, 255] to [-0.5, 0.5]
    image = tf.cast(image, tf.float32) / 255 - 0.5
    label = tf.cast(features['label'], tf.int32)
    return image, tf.one_hot(label, 10)


<pre>
  if mode == tf.estimator.ModeKeys.TRAIN:
from __future__ import absolute_import
    tfrecords_file = os.path.join(FLAGS.data_dir, 'train.tfrecords')
from __future__ import division
  else:
from __future__ import print_function
    assert mode == tf.estimator.ModeKeys.EVAL, 'invalid mode'
    tfrecords_file = os.path.join(FLAGS.data_dir, 'test.tfrecords')


import argparse
  assert tf.gfile.Exists(tfrecords_file), (
import gzip
      'Run convert_to_records.py first to convert the MNIST data to TFRecord '
import os
      'file format.')
import sys
import time


import numpy
  dataset = tf.contrib.data.TFRecordDataset([tfrecords_file])
from six.moves import urllib
from six.moves import xrange  # pylint: disable=redefined-builtin
import tensorflow as tf
</pre>
 
Variable definitions for use in the rest of the model:
 
<pre>
SOURCE_URL = 'http://yann.lecun.com/exdb/mnist/'
WORK_DIRECTORY = 'data'
IMAGE_SIZE = 28
NUM_CHANNELS = 1
PIXEL_DEPTH = 255
NUM_LABELS = 10
VALIDATION_SIZE = 5000  # Size of the validation set.
SEED = 66478  # Set to None for random seed.
BATCH_SIZE = 64
NUM_EPOCHS = 10
EVAL_BATCH_SIZE = 64
EVAL_FREQUENCY = 100  # Number of steps between evaluations.
FLAGS = None
</pre>


==Obtaining the Data==
  # For training, repeat the dataset forever
  if mode == tf.estimator.ModeKeys.TRAIN:
    dataset = dataset.repeat()


Several functions are defined to help obtain the data. First, define the variable types we will use in the model:
  # Map example_parser over dataset, and batch results by up to batch_size
  dataset = dataset.map(
      example_parser, num_threads=1, output_buffer_size=batch_size)
  dataset = dataset.batch(batch_size)
  images, labels = dataset.make_one_shot_iterator().get_next()


<pre>
   return images, labels
def data_type():
   """Return the type of the activations, weights, and placeholder variables."""
  if FLAGS.use_fp16:
    return tf.float16
  else:
    return tf.float32
</pre>
</pre>


Now define a function that will attempt to download the data if it does not already exist on disk. This uses urllib to obtain the MNIST files, and TensorFlow's gfile module to interact with the file and filesystem.
==Prepare Model==


<pre>
<pre>
def maybe_download(filename):
def mnist_model(inputs, mode):
   """Download the data from Yann's website, unless it's already here."""
   """Takes the MNIST inputs and mode and outputs a tensor of logits."""
   if not tf.gfile.Exists(WORK_DIRECTORY):
   # Input Layer
    tf.gfile.MakeDirs(WORK_DIRECTORY)
  # Reshape X to 4-D tensor: [batch_size, width, height, channels]
   filepath = os.path.join(WORK_DIRECTORY, filename)
   # MNIST images are 28x28 pixels, and have one color channel
   if not tf.gfile.Exists(filepath):
   inputs = tf.reshape(inputs, [-1, 28, 28, 1])
    filepath, _ = urllib.request.urlretrieve(SOURCE_URL + filename, filepath)
   data_format = FLAGS.data_format
    with tf.gfile.GFile(filepath) as f:
      size = f.size()
    print('Successfully downloaded', filename, size, 'bytes.')
   return filepath
</pre>
 
Once the data is downloaded, it must be converted to a format convenient for Tensorflow - in particular, a 4D tensor in which the first index is the image number, the second and third are the width and height, and the fourth dimension is each channel of the image.


These values are then normalized and re-scaled.
  if data_format is None:
    # When running on GPU, transpose the data from channels_last (NHWC) to
    # channels_first (NCHW) to improve performance.
    # See https://www.tensorflow.org/performance/performance_guide#data_formats
    data_format = ('channels_first' if tf.test.is_built_with_cuda() else
                  'channels_last')


<pre>
   if data_format == 'channels_first':
def extract_data(filename, num_images):
     inputs = tf.transpose(inputs, [0, 3, 1, 2])
   """Extract the images into a 4D tensor [image index, y, x, channels].
  Values are rescaled from [0, 255] down to [-0.5, 0.5].
  """
  print('Extracting', filename)
  with gzip.open(filename) as bytestream:
     bytestream.read(16)
    buf = bytestream.read(IMAGE_SIZE * IMAGE_SIZE * num_images * NUM_CHANNELS)
    data = numpy.frombuffer(buf, dtype=numpy.uint8).astype(numpy.float32)
    data = (data - (PIXEL_DEPTH / 2.0)) / PIXEL_DEPTH
    data = data.reshape(num_images, IMAGE_SIZE, IMAGE_SIZE, NUM_CHANNELS)
    return data
</pre>
</pre>


The labels - the predictions - must also be put into a format conducive for TensorFlow - a 1D vector:
==Construct Model==


<pre>
<pre>
def extract_labels(filename, num_images):
  # Convolutional Layer #1
   """Extract the labels into a vector of int64 label IDs."""
   # Computes 32 features using a 5x5 filter with ReLU activation.
   print('Extracting', filename)
  # Padding is added to preserve width and height.
   with gzip.open(filename) as bytestream:
   # Input Tensor Shape: [batch_size, 28, 28, 1]
    bytestream.read(8)
   # Output Tensor Shape: [batch_size, 28, 28, 32]
    buf = bytestream.read(1 * num_images)
  conv1 = tf.layers.conv2d(
    labels = numpy.frombuffer(buf, dtype=numpy.uint8).astype(numpy.int64)
      inputs=inputs,
  return labels
      filters=32,
</pre>
      kernel_size=[5, 5],
      padding='same',
      activation=tf.nn.relu,
      data_format=data_format)


There's also a utility for creating a fake data set.
  # Pooling Layer #1
  # First max pooling layer with a 2x2 filter and stride of 2
  # Input Tensor Shape: [batch_size, 28, 28, 32]
  # Output Tensor Shape: [batch_size, 14, 14, 32]
  pool1 = tf.layers.max_pooling2d(inputs=conv1, pool_size=[2, 2], strides=2,
                                  data_format=data_format)


==Error Rate==
  # Convolutional Layer #2
  # Computes 64 features using a 5x5 filter.
  # Padding is added to preserve width and height.
  # Input Tensor Shape: [batch_size, 14, 14, 32]
  # Output Tensor Shape: [batch_size, 14, 14, 64]
  conv2 = tf.layers.conv2d(
      inputs=pool1,
      filters=64,
      kernel_size=[5, 5],
      padding='same',
      activation=tf.nn.relu,
      data_format=data_format)


There is a function defined to compute the error rate. It computes the accuracy first: sums up the number of correctly-labeled digits, divides by the total number of digits, multiplies by 100 to convert to percent. Last, it subtracts the accuracy from 100 to get a percent error.
  # Pooling Layer #2
  # Second max pooling layer with a 2x2 filter and stride of 2
  # Input Tensor Shape: [batch_size, 14, 14, 64]
  # Output Tensor Shape: [batch_size, 7, 7, 64]
  pool2 = tf.layers.max_pooling2d(inputs=conv2, pool_size=[2, 2], strides=2,
                                  data_format=data_format)


<pre>
  # Flatten tensor into a batch of vectors
def error_rate(predictions, labels):
  # Input Tensor Shape: [batch_size, 7, 7, 64]
   """Return the error rate based on dense predictions and sparse labels."""
   # Output Tensor Shape: [batch_size, 7 * 7 * 64]
   return 100.0 - (
   pool2_flat = tf.reshape(pool2, [-1, 7 * 7 * 64])
      100.0 *
      numpy.sum(numpy.argmax(predictions, 1) == labels) /
      predictions.shape[0])
</pre>


Note that this metric is NOT used for training the convolutional network, it is only used for printing purposes.
  # Dense Layer
  # Densely connected layer with 1024 neurons
  # Input Tensor Shape: [batch_size, 7 * 7 * 64]
  # Output Tensor Shape: [batch_size, 1024]
  dense = tf.layers.dense(inputs=pool2_flat, units=1024,
                          activation=tf.nn.relu)


==Main Method==
  # Add dropout operation; 0.6 probability that element will be kept
  dropout = tf.layers.dropout(
      inputs=dense, rate=0.4, training=(mode == tf.estimator.ModeKeys.TRAIN))


===Get Data===
  # Logits layer
 
  # Input Tensor Shape: [batch_size, 1024]
The main method starts by checking if it is in self-test mode (debug mode), in which case, it generates fake data:
  # Output Tensor Shape: [batch_size, 10]
 
   logits = tf.layers.dense(inputs=dropout, units=10)
<pre>
  return logits
   if FLAGS.self_test:
    print('Running self-test.')
    train_data, train_labels = fake_data(256)
    validation_data, validation_labels = fake_data(EVAL_BATCH_SIZE)
    test_data, test_labels = fake_data(EVAL_BATCH_SIZE)
    num_epochs = 1
</pre>
</pre>


Otherwise, it extracts data from the downloaded training/testing MNIST images. None of this is using TensorFlow functionality yet.
==Get Estimator==


<pre>
<pre>
  else:
def mnist_model_fn(features, labels, mode):
    # Get the data.
  """Model function for MNIST."""
    train_data_filename = maybe_download('train-images-idx3-ubyte.gz')
  logits = mnist_model(features, mode)
    train_labels_filename = maybe_download('train-labels-idx1-ubyte.gz')
    test_data_filename = maybe_download('t10k-images-idx3-ubyte.gz')
    test_labels_filename = maybe_download('t10k-labels-idx1-ubyte.gz')


    # Extract it into numpy arrays.
  predictions = {
    train_data = extract_data(train_data_filename, 60000)
      'classes': tf.argmax(input=logits, axis=1),
    train_labels = extract_labels(train_labels_filename, 60000)
      'probabilities': tf.nn.softmax(logits, name='softmax_tensor')
    test_data = extract_data(test_data_filename, 10000)
  }
    test_labels = extract_labels(test_labels_filename, 10000)


    # Generate a validation set.
  if mode == tf.estimator.ModeKeys.PREDICT:
    validation_data = train_data[:VALIDATION_SIZE, ...]
     return tf.estimator.EstimatorSpec(mode=mode, predictions=predictions)
    validation_labels = train_labels[:VALIDATION_SIZE]
     train_data = train_data[VALIDATION_SIZE:, ...]
    train_labels = train_labels[VALIDATION_SIZE:]
    num_epochs = NUM_EPOCHS
  train_size = train_labels.shape[0]
</pre>


===Variable Definitions===
  loss = tf.losses.softmax_cross_entropy(onehot_labels=labels, logits=logits)


To use the input variables we have on the computational graph that TensorFlow will build, we have to declare those input variables. We do that using a TensorFlow placeholder type.
  # Configure the training op
 
  if mode == tf.estimator.ModeKeys.TRAIN:
We also created a placeholder variable in the [[TensorFlow/Adversarial Crypto]] class, in the [[TensorFlow/Adversarial_Crypto#AdversarialCrypto_Class_-_Creation_of_Message_and_Key|Creation of Message and Key]] section. There, the placeholder variable was batch size. (However, the input variables in that network were different because we used that somewhat mysterious function, "tf.contrib.framework.arg_scope()", and passed it TensorFlow variables to initialize on each of the three graph we had.)
    optimizer = tf.train.AdamOptimizer(learning_rate=1e-4)
    train_op = optimizer.minimize(loss, tf.train.get_or_create_global_step())
  else:
    train_op = None


Here, we are explicitly creating a variable placeholder for the trianing data (inputs), training labels (outputs), and evaluation data. (Remember, the data_type() function was defined above and just returns a float16 or float32 type.)
  accuracy = tf.metrics.accuracy(
      tf.argmax(labels, axis=1), predictions['classes'])
  metrics = {'accuracy': accuracy}


Again, notice the four dimensions - meaning train_data_node is a placeholder representing a 4D tensor.
  # Create a tensor named train_accuracy for logging purposes
  tf.identity(accuracy[1], name='train_accuracy')
  tf.summary.scalar('train_accuracy', accuracy[1])


<pre>
   return tf.estimator.EstimatorSpec(
   # This is where training samples and labels are fed to the graph.
       mode=mode,
  # These placeholder nodes will be fed a batch of training data at each
       predictions=predictions,
  # training step using the {feed_dict} argument to the Run() call below.
      loss=loss,
  train_data_node = tf.placeholder(
      train_op=train_op,
       data_type(),
       eval_metric_ops=metrics)
       shape=(BATCH_SIZE, IMAGE_SIZE, IMAGE_SIZE, NUM_CHANNELS))
  train_labels_node = tf.placeholder(tf.int64, shape=(BATCH_SIZE,))
  eval_data = tf.placeholder(
      data_type(),
       shape=(EVAL_BATCH_SIZE, IMAGE_SIZE, IMAGE_SIZE, NUM_CHANNELS))
</pre>
</pre>


Next, we create a set of tensors that will hold the weights and biases of the convolutional neural network layers. (When we use high-level neural net APIs like [[Keras]], this is all taken care of for us, but here we do it all manually.)
==Main Function==
 
====Convolutional Layers====
 
First, convolutional layer 1: in this layer we are defining a 5 x 5 filter - meaning the 28 x 28 pixel images in the NIST data set will be convoluted down to a 5 x 5 image set. But the number of feature maps is 32, meaning we're going to convolute the 28 x 28 pixel images down into 32 different 5 x 5 pixel images. The idea is that each of those feature maps will pick out a particular feature about the image topology that is important, and "represent" it, or "allow" that signal to pass through the first layer of the convolutional neural network.
 
The bias determines the importance of each of those feature maps, so we need the number of biases to match the number of feature maps (32).


<pre>
<pre>
  # The variables below hold all the trainable weights. They are passed an
def main(unused_argv):
  # initial value which will be assigned when we call:
   # Create the Estimator
   # {tf.global_variables_initializer().run()}
   mnist_classifier = tf.estimator.Estimator(
   conv1_weights = tf.Variable(
       model_fn=mnist_model_fn, model_dir=FLAGS.model_dir)
       tf.truncated_normal([5, 5, NUM_CHANNELS, 32],  # 5x5 filter, depth 32.
                          stddev=0.1,
                          seed=SEED, dtype=data_type()))
  conv1_biases = tf.Variable(tf.zeros([32], dtype=data_type()))
</pre>


We do the same thing with the second convolutional layer. This time there is no number of channels showing up in the size.
  # Train the model
  tensors_to_log = {
      'train_accuracy': 'train_accuracy'
  }


<pre>
   logging_hook = tf.train.LoggingTensorHook(
   conv2_weights = tf.Variable(tf.truncated_normal(
       tensors=tensors_to_log, every_n_iter=100)
       [5, 5, 32, 64], stddev=0.1,
      seed=SEED, dtype=data_type()))
  conv2_biases = tf.Variable(tf.constant(0.1, shape=[64], dtype=data_type()))
</pre>


The truncated_normal variable types refer to how the variables are initialized - they are initialized with values drawn from a (truncated) normal distribution. Truncated simply means that they cannot go above 1 or below 0, which makes it easier for the machine learning algorithm.  
  batches_per_epoch = _NUM_IMAGES['train'] / FLAGS.batch_size


Link to truncated_normal documentation: https://www.tensorflow.org/api_docs/python/tf/truncated_normal
  mnist_classifier.train(
      input_fn=lambda: input_fn(tf.estimator.ModeKeys.TRAIN, FLAGS.batch_size),
      steps=FLAGS.train_epochs * batches_per_epoch,
      hooks=[logging_hook])


====Variables for Fully Connected Layers====
  # Evaluate the model and print results
 
   eval_results = mnist_classifier.evaluate(
Next come the two fully connected (FC) layers, which re-assemble the feature maps that were detected in the convolutional layers. The fully connected layer creates 64 neurons for every 4 x 4 square of pixels in the original image, with a depth of 512 neurons each.
       input_fn=lambda: input_fn(tf.estimator.ModeKeys.EVAL))
 
   print()
(NOTE: This doesn't make sense. There's waaaaaay too many neurons here.)
  print('Evaluation results:\n    %s' % eval_results)
 
(It may be that this is the number of inputs, then the number of outputs - as in, there are (size/4)*(size/4)*64 inputs on one side, 512 outputs on the other side.)
 
<pre>
   fc1_weights = tf.Variable( # fully connected, depth 512.
       tf.truncated_normal([IMAGE_SIZE // 4 * IMAGE_SIZE // 4 * 64, 512],
                          stddev=0.1,
                          seed=SEED,
                          dtype=data_type()))
</pre>
 
The second (last) fully connected layer is a 512-wide layer that has a depth equal to the number of labels - in this case, 10 corresponding to 10 digits.
 
(Again, this looks like 512 inputs connecting to NUM_LABELS outputs.)
 
<pre>
  fc2_weights = tf.Variable(tf.truncated_normal([512, NUM_LABELS],
                                                stddev=0.1,
                                                seed=SEED,
                                                dtype=data_type()))
   fc2_biases = tf.Variable(tf.constant(
      0.1, shape=[NUM_LABELS], dtype=data_type()))
</pre>
</pre>



Latest revision as of 01:44, 28 October 2017

Simple MNIST Convolutional Network

Input Function

Define an input function. This has an internal function that parses the example data (one piece of data at a time) and one-hot encodes the labeled images with the digit it corresponds to.

def input_fn(mode, batch_size=1):
  """A simple input_fn using the contrib.data input pipeline."""

  def example_parser(serialized_example):
    """Parses a single tf.Example into image and label tensors."""
    features = tf.parse_single_example(
        serialized_example,
        features={
            'image_raw': tf.FixedLenFeature([], tf.string),
            'label': tf.FixedLenFeature([], tf.int64),
        })
    image = tf.decode_raw(features['image_raw'], tf.uint8)
    image.set_shape([28 * 28])

    # Normalize the values of the image from the range [0, 255] to [-0.5, 0.5]
    image = tf.cast(image, tf.float32) / 255 - 0.5
    label = tf.cast(features['label'], tf.int32)
    return image, tf.one_hot(label, 10)

  if mode == tf.estimator.ModeKeys.TRAIN:
    tfrecords_file = os.path.join(FLAGS.data_dir, 'train.tfrecords')
  else:
    assert mode == tf.estimator.ModeKeys.EVAL, 'invalid mode'
    tfrecords_file = os.path.join(FLAGS.data_dir, 'test.tfrecords')

  assert tf.gfile.Exists(tfrecords_file), (
      'Run convert_to_records.py first to convert the MNIST data to TFRecord '
      'file format.')

  dataset = tf.contrib.data.TFRecordDataset([tfrecords_file])

  # For training, repeat the dataset forever
  if mode == tf.estimator.ModeKeys.TRAIN:
    dataset = dataset.repeat()

  # Map example_parser over dataset, and batch results by up to batch_size
  dataset = dataset.map(
      example_parser, num_threads=1, output_buffer_size=batch_size)
  dataset = dataset.batch(batch_size)
  images, labels = dataset.make_one_shot_iterator().get_next()

  return images, labels

Prepare Model

def mnist_model(inputs, mode):
  """Takes the MNIST inputs and mode and outputs a tensor of logits."""
  # Input Layer
  # Reshape X to 4-D tensor: [batch_size, width, height, channels]
  # MNIST images are 28x28 pixels, and have one color channel
  inputs = tf.reshape(inputs, [-1, 28, 28, 1])
  data_format = FLAGS.data_format

  if data_format is None:
    # When running on GPU, transpose the data from channels_last (NHWC) to
    # channels_first (NCHW) to improve performance.
    # See https://www.tensorflow.org/performance/performance_guide#data_formats
    data_format = ('channels_first' if tf.test.is_built_with_cuda() else
                   'channels_last')

  if data_format == 'channels_first':
    inputs = tf.transpose(inputs, [0, 3, 1, 2])

Construct Model

  # Convolutional Layer #1
  # Computes 32 features using a 5x5 filter with ReLU activation.
  # Padding is added to preserve width and height.
  # Input Tensor Shape: [batch_size, 28, 28, 1]
  # Output Tensor Shape: [batch_size, 28, 28, 32]
  conv1 = tf.layers.conv2d(
      inputs=inputs,
      filters=32,
      kernel_size=[5, 5],
      padding='same',
      activation=tf.nn.relu,
      data_format=data_format)

  # Pooling Layer #1
  # First max pooling layer with a 2x2 filter and stride of 2
  # Input Tensor Shape: [batch_size, 28, 28, 32]
  # Output Tensor Shape: [batch_size, 14, 14, 32]
  pool1 = tf.layers.max_pooling2d(inputs=conv1, pool_size=[2, 2], strides=2,
                                  data_format=data_format)

  # Convolutional Layer #2
  # Computes 64 features using a 5x5 filter.
  # Padding is added to preserve width and height.
  # Input Tensor Shape: [batch_size, 14, 14, 32]
  # Output Tensor Shape: [batch_size, 14, 14, 64]
  conv2 = tf.layers.conv2d(
      inputs=pool1,
      filters=64,
      kernel_size=[5, 5],
      padding='same',
      activation=tf.nn.relu,
      data_format=data_format)

  # Pooling Layer #2
  # Second max pooling layer with a 2x2 filter and stride of 2
  # Input Tensor Shape: [batch_size, 14, 14, 64]
  # Output Tensor Shape: [batch_size, 7, 7, 64]
  pool2 = tf.layers.max_pooling2d(inputs=conv2, pool_size=[2, 2], strides=2,
                                  data_format=data_format)

  # Flatten tensor into a batch of vectors
  # Input Tensor Shape: [batch_size, 7, 7, 64]
  # Output Tensor Shape: [batch_size, 7 * 7 * 64]
  pool2_flat = tf.reshape(pool2, [-1, 7 * 7 * 64])

  # Dense Layer
  # Densely connected layer with 1024 neurons
  # Input Tensor Shape: [batch_size, 7 * 7 * 64]
  # Output Tensor Shape: [batch_size, 1024]
  dense = tf.layers.dense(inputs=pool2_flat, units=1024,
                          activation=tf.nn.relu)

  # Add dropout operation; 0.6 probability that element will be kept
  dropout = tf.layers.dropout(
      inputs=dense, rate=0.4, training=(mode == tf.estimator.ModeKeys.TRAIN))

  # Logits layer
  # Input Tensor Shape: [batch_size, 1024]
  # Output Tensor Shape: [batch_size, 10]
  logits = tf.layers.dense(inputs=dropout, units=10)
  return logits

Get Estimator

def mnist_model_fn(features, labels, mode):
  """Model function for MNIST."""
  logits = mnist_model(features, mode)

  predictions = {
      'classes': tf.argmax(input=logits, axis=1),
      'probabilities': tf.nn.softmax(logits, name='softmax_tensor')
  }

  if mode == tf.estimator.ModeKeys.PREDICT:
    return tf.estimator.EstimatorSpec(mode=mode, predictions=predictions)

  loss = tf.losses.softmax_cross_entropy(onehot_labels=labels, logits=logits)

  # Configure the training op
  if mode == tf.estimator.ModeKeys.TRAIN:
    optimizer = tf.train.AdamOptimizer(learning_rate=1e-4)
    train_op = optimizer.minimize(loss, tf.train.get_or_create_global_step())
  else:
    train_op = None

  accuracy = tf.metrics.accuracy(
      tf.argmax(labels, axis=1), predictions['classes'])
  metrics = {'accuracy': accuracy}

  # Create a tensor named train_accuracy for logging purposes
  tf.identity(accuracy[1], name='train_accuracy')
  tf.summary.scalar('train_accuracy', accuracy[1])

  return tf.estimator.EstimatorSpec(
      mode=mode,
      predictions=predictions,
      loss=loss,
      train_op=train_op,
      eval_metric_ops=metrics)

Main Function

def main(unused_argv):
  # Create the Estimator
  mnist_classifier = tf.estimator.Estimator(
      model_fn=mnist_model_fn, model_dir=FLAGS.model_dir)

  # Train the model
  tensors_to_log = {
      'train_accuracy': 'train_accuracy'
  }

  logging_hook = tf.train.LoggingTensorHook(
      tensors=tensors_to_log, every_n_iter=100)

  batches_per_epoch = _NUM_IMAGES['train'] / FLAGS.batch_size

  mnist_classifier.train(
      input_fn=lambda: input_fn(tf.estimator.ModeKeys.TRAIN, FLAGS.batch_size),
      steps=FLAGS.train_epochs * batches_per_epoch,
      hooks=[logging_hook])

  # Evaluate the model and print results
  eval_results = mnist_classifier.evaluate(
      input_fn=lambda: input_fn(tf.estimator.ModeKeys.EVAL))
  print()
  print('Evaluation results:\n    %s' % eval_results)

Flags