    yield _LayerMatch(layer_op, weight_tensor, activation_op, bypass_op,
                      bias_add_op)
+  # Match the final layer, which has no activation; the output of its
+  # BiasAdd must be quantized instead, so we treat the BiasAdd as the
+  # 'activation_op' in the _LayerMatch.
+  # TODO(suharshs): Figure out how to quantize this final layer across many
+  # models.
+  final_layer_matcher = graph_matcher.GraphMatcher(bias_add_pattern)
+  for match_result in final_layer_matcher.match_graph(graph):
+    layer_op = match_result.get_op(layer_pattern)
+    weight_tensor = match_result.get_tensor(weight_pattern)
+    activation_op = match_result.get_op(bias_add_pattern)
+    yield _LayerMatch(layer_op, weight_tensor, activation_op, None, None)
+
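For context (not part of this change): `bias_add_pattern`, `layer_pattern`, and `weight_pattern` are `graph_matcher.OpTypePattern` objects defined earlier in the same function. A minimal sketch of their assumed shape follows; the op-type strings and wildcards here are illustrative assumptions, not the actual definitions:

# Hypothetical reconstruction of the patterns the matcher above relies on;
# the real definitions live earlier in this function and may differ.
weight_pattern = graph_matcher.OpTypePattern('*')
layer_pattern = graph_matcher.OpTypePattern(
    'Conv2D|DepthwiseConv2dNative|MatMul', inputs=['*', weight_pattern])
# A BiasAdd whose first input is the layer output; for the final layer its
# output is quantized in place of an activation.
bias_add_pattern = graph_matcher.OpTypePattern(
    'BiasAdd', inputs=[layer_pattern, '*'])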
class _LayerMatch(object):
"""Contains all information related to a matched Layer."""
                                              quantization_node_name)
      self.assertEqual(add_quant.type, quantization_node_name)
+  def testFinalLayerQuantized(self):
+    self._RunTestOverParameters(self._TestFinalLayerQuantized)
+
+  def _TestFinalLayerQuantized(self, is_training):
+    graph = ops.Graph()
+    with graph.as_default():
+      batch_size, height, width, depth = 5, 128, 128, 3
+      input1 = array_ops.zeros((batch_size, height, width, depth))
+      _ = conv2d(
+          input1,
+          32, [5, 5],
+          stride=2,
+          padding='SAME',
+          weights_initializer=self._WeightInit(0.09),
+          activation_fn=None,
+          scope='test')
+      # Ensure that a FakeQuant operation is among the consumers of the
+      # BiasAdd's output.
+      bias_add_op = graph.get_operation_by_name('test/BiasAdd')
+      quantize.Quantize(graph, is_training, weight_bits=8, activation_bits=8)
+      self.assertTrue('FakeQuantWithMinMaxVars' in
+                      [op.type for op in bias_add_op.outputs[0].consumers()])
+
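To see concretely what the assertion above verifies (an illustrative snippet, not part of the test): after `quantize.Quantize` rewrites the graph, the BiasAdd's output tensor should gain a FakeQuant consumer.

# Illustrative sketch, assuming 'graph' was rewritten as in the test above.
bias_add_op = graph.get_operation_by_name('test/BiasAdd')
consumer_types = [op.type for op in bias_add_op.outputs[0].consumers()]
print(consumer_types)  # expect 'FakeQuantWithMinMaxVars' among these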
  def _WeightInit(self, stddev):
    """Returns truncated normal variable initializer.