A sheet of Tensorflow snippets/tips

`tf.where` can spawn NaN in gradients:

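If either branch in tf.where evaluates to Inf/NaN, the gradients can become NaN even when that branch is not the one selected: the zero gradient routed to the unselected branch is multiplied by that branch's Inf/NaN local derivative (0 * Inf = NaN), e.g.: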

# log_stddev = log(stddev).
log_stddev = tf.constant([-100., 100.], dtype=tf.float32)
# Computes 1.0 / stddev. The selected forward values are finite, but each
# element's unselected branch overflows to Inf, which poisons the gradients.
inv_stddev = tf.where(log_stddev >= 0.,
                      tf.exp(-log_stddev),  # Creates Inf when -log_stddev is very large.
                      1. / (tf.exp(log_stddev) + 1e-6))  # tf.exp(log_stddev) creates Inf when log_stddev is very large.
# tf.where passes a zero gradient to the unselected branch, but that zero is
# then multiplied by the branch's Inf local derivative: 0 * Inf = NaN.
grad_log_stddev = tf.gradients(inv_stddev, [log_stddev])
with tf.Session() as sess:
    inv_s, grad_log_s = sess.run([inv_stddev, grad_log_stddev])
    print(inv_s)  # [  1.00000000e+06   3.78350585e-44]
    print(grad_log_s)  # [array([ nan,  nan], dtype=float32)]

Shapes:

tensor.shape returns tensor's static shape, while the graph is being built.
tensor.shape.as_list() returns the static shape as a list of integers (None for unknown dimensions).
tensor.shape[i].value returns the static shape's i-th dimension size as an integer.
tf.shape(t) returns t's run-time shape as a tensor.
An example:

x = tf.placeholder(tf.float32, shape=[None, 8]) # x's first dimension is unknown (None) while building the graph.
print(x.shape) # Outputs static shape (?, 8).
shape_t = tf.shape(x)
with tf.Session() as sess:
    print(sess.run(shape_t, feed_dict={x: np.random.random(size=[4, 8])})) # Outputs run-time shape [4 8] (a NumPy array).

[] (empty square brackets) as a shape denotes a scalar (0 dim). E.g. tf.FixedLenFeature([], ..) is a scalar feature.

Tensor contraction (more generalized matrix multiplication):

# Matrix multiplication
tf.einsum('ij,jk->ik', m0, m1)  # output[i, k] = sum_j m0[i, j] * m1[j, k]

# Dot product
tf.einsum('i,i->', u, v)  # output = sum_i u[i] * v[i]

# Outer product
tf.einsum('i,j->ij', u, v)  # output[i, j] = u[i] * v[j]

# Transpose
tf.einsum('ij->ji', m)  # output[j, i] = m[i, j]

# Batch matrix multiplication (each matrix s[a] is multiplied by the same matrix t)
tf.einsum('aij,jk->aik', s, t)  # output[a, i, k] = sum_j s[a, i, j] * t[j, k]

# Batch tensor contraction (sums over both w and c)
tf.einsum('nhwc,nwcd->nhd', s, t)  # output[n, h, d] = sum_{w, c} s[n, h, w, c] * t[n, w, c, d]

A typical input_fn (used for train/eval) for tf.estimator API:

def make_input_fn(mode, ...):
    """Return an input_fn for train/eval in the tf.estimator API.

    Args:
        mode: Must be tf.estimator.ModeKeys.TRAIN or tf.estimator.ModeKeys.EVAL.
        ...
    Returns:
        The input_fn, a zero-argument callable returning (features, labels).
    """
    def _input_fn():
        """The input function.

        Returns:
            features: A dict of {'feature_name': feature_tensor}.
            labels: A tensor of labels.
        Raises:
            ValueError: If mode is neither ModeKeys.TRAIN nor ModeKeys.EVAL.
        """
        if mode == tf.estimator.ModeKeys.TRAIN:
            features = ...
            labels = ...
        elif mode == tf.estimator.ModeKeys.EVAL:
            features = ...
            labels = ...
        else:
            # Any other mode (e.g. PREDICT) is not served by this input_fn.
            raise ValueError(mode)
        return features, labels

    return _input_fn

A typical model_fn for tf.estimator API:

def make_model_fn(...):
    """Return a model_fn used to build a tf.estimator.Estimator.

    Args:
        ...
    Returns:
        The model_fn.
    """
    def _model_fn(features, labels, mode):
        """Model function.

        Args:
            features: The first item returned from the input_fn for train/eval, a dict of {'feature_name': feature_tensor}. If mode is ModeKeys.PREDICT, same as in serving_input_receiver_fn.
            labels: The second item returned from the input_fn, a single Tensor or dict. If mode is ModeKeys.PREDICT, labels=None will be passed.
            mode: Optional. Specifies whether this is training, evaluation or prediction. See ModeKeys.
        Returns:
            A tf.estimator.EstimatorSpec. Fields that do not apply to the
            given mode (predictions, export_outputs, loss, train_op) are None.
        """
        if mode == tf.estimator.ModeKeys.PREDICT:
            # Calculate the predictions.
            predictions = ...
            # For inference/prediction outputs.
            # The 'output_*' keys are the names a client uses to fetch the
            # outputs from the exported signature.
            export_outputs = {
                tf.saved_model.signature_constants.PREDICT_METHOD_NAME: tf.estimator.export.PredictOutput({
                    'output_1': predict_output_1,
                    'output_2': predict_output_2,
                    ...
                }),
            }
            ...
        else:
            predictions = None
            export_outputs = None

        # A loss is only built for training and evaluation.
        if (mode == tf.estimator.ModeKeys.TRAIN or mode == tf.estimator.ModeKeys.EVAL):
            loss = ...
        else:
            loss = None

        # A train_op is only built for training.
        if mode == tf.estimator.ModeKeys.TRAIN:
            train_op = ...
            # Can use tf.group(..) to group multiple train_op as a single train_op.
        else:
            train_op = None

        return tf.estimator.EstimatorSpec(
            mode=mode,
            predictions=predictions,
            loss=loss,
            train_op=train_op,
            export_outputs=export_outputs)

    return _model_fn

Use tf.estimator.Estimator to export a saved_model:

# serving_features must match features in model_fn when mode == tf.estimator.ModeKeys.PREDICT.
serving_features = {'serving_input_1': tf.placeholder(...), 'serving_input_2': tf.placeholder(...), ...}
estimator.export_savedmodel(export_dir,
                            tf.estimator.export.build_raw_serving_input_receiver_fn(serving_features))

Use tf.contrib.learn.Experiment to export a saved_model:

# serving_features must match features in model_fn when mode == tf.estimator.ModeKeys.PREDICT.
serving_features = {'serving_input_1': tf.placeholder(...), 'serving_input_2': tf.placeholder(...), ...}
export_strategy = tf.contrib.learn.utils.make_export_strategy(tf.estimator.export.build_raw_serving_input_receiver_fn(serving_features))
expriment = tf.contrib.learn.Experiment(..., export_strategies=[export_strategy], ...)

Load a saved_model and run inference (in Python):

with tf.Session(...) as sess:
    # Load saved_model MetaGraphDef from export_dir.
    meta_graph_def = tf.saved_model.loader.load(sess, [tf.saved_model.tag_constants.SERVING], export_dir)
    
    # Get SignatureDef for serving (here PREDICT_METHOD_NAME is used as export_outputs key in model_fn).
    sigs = meta_graph_def.signature_def[tf.saved_model.signature_constants.PREDICT_METHOD_NAME]
    
    # Get the graph for retrieving input/output tensors.
    g = tf.get_default_graph()
    
    # Retrieve serving input tensors, keys must match keys defined in serving_features (when building input receiver fn).
    input_1 = g.get_tensor_by_name(sigs.inputs['input_1'].name)
    input_2 = g.get_tensor_by_name(sigs.inputs['input_2'].name)
    ...
    
    # Retrieve serving output tensors, keys must match keys defined in ExportOutput (e.g. PredictOutput) in export_outputs.
    output_1 = g.get_tensor_by_name(sigs.outputs['output_1'].name)
    output_2 = g.get_tensor_by_name(sigs.outputs['output_2'].name)
    ...
    
    # Run inferences.
    outputs_values = sess.run([output_1, output_2, ...], feed_dict={input_1: ..., input_2: ..., ...})

Build a tf.train.Example in Python:

# ==================== Build in one line ====================
example = tf.train.Example(features=tf.train.Features(feature={
    'bytes_values': tf.train.Feature(
        bytes_list=tf.train.BytesList(value=[bytes_feature])),
    'float_values': tf.train.Feature(
        float_list=tf.train.FloatList(value=[float_feature])),
    'int64_values': tf.train.Feature(
        int64_list=tf.train.Int64List(value=[int64_feature])),
    ...
}))
# ==================== OR progressivly ====================
example = tf.train.Example()
example.features.feature['bytes_feature'].bytes_list.value.extend(bytes_values)
example.features.feature['float_feature'].float_list.value.extend(float_values)
example.features.feature['int64_feature'].int64_list.value.extend(int64_values)
...

Build a tf.train.SequenceExample in Python:

sequence_example = tf.train.SequenceExample()

# Populate context data.
sequence_example.context.feature[
    'context_bytes_values_1'].bytes_list.value.extend(bytes_values)
sequence_example.context.feature[
    'context_float_values_1'].float_list.value.extend(float_values)
sequence_example.context.feature[
    'context_int64_values_1'].int64_list.value.extend(int64_values)
...

# Populate sequence data: look up the FeatureList named 'feature_list_1'.
feature_list_1 = sequence_example.feature_lists.feature_list['feature_list_1']
# Append a new tf.train.Feature to feature_list_1.
feature_1 = feature_list_1.feature.add()
# Populate feature_1, e.g. feature_1.float_list.value.extend(float_values)
# Repeat add() + populate for every further tf.train.Feature in feature_list_1, if any.
...

Example is roughly a map of {feature_name: value_list}.

SequenceExample is roughly a map of {feature_name: list_of_value_lists}.

To parse a SequenceExample:

tf.parse_single_sequence_example(serialized,
    context_features={
        'context_feature_1': tf.FixedLenFeature([], dtype=...),
        ...
    },
    sequence_features={
        # For the 'sequence_features_1' shape, [] results in [?] and [k] results in [?, k], where:
        # ?: timesteps, i.e. number of tf.train.Feature in the 'sequence_features_1' list, can be variable.
        # k: number of elements in each tf.train.Feature in 'sequence_features_1'.
        'sequence_features_1': tf.FixedLenSequenceFeature([], dtype=...),
        ...
    },)

Writes a sequence/iterator of tfrecords into multiple sharded files, round-robin:

class TFRecordsWriter:
    """Writes Example/SequenceExample protos to one or several TFRecord files.

    Records are spread over the shard files round-robin. The rotation carries
    on across successive write() calls, so many small writes still fill all
    shards evenly instead of piling up in the first shard.

    Typical usage:
    with TFRecordsWriter(<file_path>) as writer:
        writer.write(tfrecords)
    """

    def __init__(self, file_path):
        """Constructs a TFRecordsWriter that supports writing to sharded files.

        No file is opened here; the shard files are opened on entering the
        `with` block.

        :param file_path: Destination file path, with '@<num_shards>' at the
        end to produce sharded files.
        :raises ValueError: If the text after the last '@' is not a positive
        integer.
        """
        base_path, at_sign, shard_spec = file_path.rpartition('@')
        if at_sign:
            self._num_shards = int(shard_spec)
            if self._num_shards <= 0:
                raise ValueError('Number of shards must be a positive integer.')
            self._file_path = base_path
        else:
            self._num_shards = 1
            self._file_path = file_path
        # Writers only exist between __enter__ and __exit__.
        self._writers = None
        # Index of the shard that receives the next record.
        self._next_shard = 0

    def __enter__(self):
        """Opens one tf.python_io.TFRecordWriter per shard and returns self.

        With a single shard the records go to the path as given. With N > 1
        shards the files are named '<path>-<index>-of-<N>', the index being
        zero-padded to the number of digits of N.
        """
        if self._num_shards > 1:
            index_width = len(str(self._num_shards))
            shard_paths = [
                '{path}-{index:0>{width}}-of-{total}'.format(
                    path=self._file_path,
                    index=index,
                    width=index_width,
                    total=self._num_shards)
                for index in range(self._num_shards)]
        else:
            shard_paths = [self._file_path]
        self._writers = [
            tf.python_io.TFRecordWriter(path) for path in shard_paths]
        self._next_shard = 0
        return self

    def __exit__(self, exc_type, exc_val, exc_tb):
        """Flushes and closes every shard writer; exceptions are not suppressed."""
        # Drop the references first so a later write() cannot hit a closed writer.
        writers, self._writers = self._writers, None
        for writer in writers or ():
            writer.flush()
            writer.close()

    def write(self, tfrecords):
        """Writes a sequence/iterator of Example or SequenceExample to file(s).

        :param tfrecords: A sequence/iterator of Example or SequenceExample.
        :return:
        :raises RuntimeError: If called while no shard writer is open, i.e.
        outside the `with` block.
        """
        if not self._writers:
            raise RuntimeError(
                'TFRecordsWriter.write() must be called inside a `with` block.')
        for tfrecord in tfrecords:
            self._writers[self._next_shard].write(tfrecord.SerializeToString())
            # Persist the position so the next call continues the rotation.
            self._next_shard = (self._next_shard + 1) % self._num_shards

Visualize Tensorflow graph in jupyter/ipython:

import numpy as np
from IPython import display

def strip_consts(graph_def, max_const_size=32):
    """Strip large constant values from graph_def.

    Args:
        graph_def: The GraphDef whose nodes are copied.
        max_const_size: Largest `tensor_content` size, in bytes, that a
            'Const' node may keep.
    Returns:
        A new tf.GraphDef with the same nodes, in which every 'Const' node
        whose `tensor_content` is longer than max_const_size has that content
        replaced by a short '<stripped N bytes>' marker. graph_def itself is
        not modified.
    """
    strip_def = tf.GraphDef()
    for n0 in graph_def.node:
        n = strip_def.node.add()
        n.MergeFrom(n0)
        if n.op == 'Const':
            tensor = n.attr['value'].tensor
            size = len(tensor.tensor_content)
            if size > max_const_size:
                # tensor_content is a protobuf bytes field: assigning a text
                # string raises TypeError on Python 3, so encode the marker.
                tensor.tensor_content = "<stripped {} bytes>".format(
                    size).encode('ascii')
    return strip_def


def show_graph(graph_def, max_const_size=32):
    """Visualize TensorFlow graph.

    Args:
        graph_def: A GraphDef, or any object exposing as_graph_def() (it is
            converted first).
        max_const_size: Passed to strip_consts; constants larger than this
            many bytes are stripped before rendering.

    Displays an iframe that renders the graph with the hosted
    tf-graph-basic component.
    """
    if hasattr(graph_def, 'as_graph_def'):
        graph_def = graph_def.as_graph_def()
    strip_def = strip_consts(graph_def, max_const_size=max_const_size)
    # The href must stay on a single line: a line break inside the attribute
    # would put whitespace into the URL and break the import.
    code = """
        <script>
          function load() {{
            document.getElementById("{id}").pbtxt = {data};
          }}
        </script>
        <link rel="import" href="https://tensorboard.appspot.com/tf-graph-basic.build.html" onload=load()>
        <div style="height:600px">
          <tf-graph-basic id="{id}"></tf-graph-basic>
        </div>
    """.format(data=repr(str(strip_def)), id='graph' + str(np.random.rand()))

    # The page is embedded through srcdoc, so its double quotes are escaped.
    iframe = """
        <iframe seamless style="width:1200px;height:620px;border:0" srcdoc="{}"></iframe>
    """.format(code.replace('"', '&quot;'))
    display.display(display.HTML(iframe))

Then call show_graph(tf.get_default_graph()) to show in your Jupyter/IPython notebook.

liuyongwei / tensorflow_snippets Goto Github PK

tensorflow_snippets's Introduction

A sheet of Tensorflow snippets/tips

tf.where can spawn NaN in gradients:

Shapes:

Tensor contraction (more generalized matrix multiplication):

A typical input_fn (used for train/eval) for tf.estimator API:

A typical model_fn for tf.estimator API:

Use tf.estimator.Estimator to export a saved_model:

Use tf.contrib.learn.Experiment to export a saved_model:

Load a saved_model and run inference (in Python):

Build a tf.train.Example in Python:

Build a tf.train.SequenceExample in Python:

Example is roughly a map of {feature_name: value_list}.

SequenceExample is roughly a map of {feature_name: list_of_value_lists}.

To parse a SequenceExample:

Writes a sequence/iterator of tfrecords into multiple sharded files, round-robin:

Visualize Tensorflow graph in jupyter/ipython:

tensorflow_snippets's People

Contributors

Watchers

Recommend Projects

Recommend Topics

Recommend Org

`tf.where` can spawn NaN in gradients: