+# Copyright 2016 The TensorFlow Authors. All Rights Reserved.
+#
+# Licensed under the Apache License, Version 2.0 (the "License");
+# you may not use this file except in compliance with the License.
+# You may obtain a copy of the License at
+#
+# http://www.apache.org/licenses/LICENSE-2.0
+#
+# Unless required by applicable law or agreed to in writing, software
+# distributed under the License is distributed on an "AS IS" BASIS,
+# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+# See the License for the specific language governing permissions and
+# limitations under the License.
+# ==============================================================================
+"""Contains the definition for inception v1 classification network."""
+
+from __future__ import absolute_import
+from __future__ import division
+from __future__ import print_function
+
+import tensorflow as tf
+
+from nets import inception_utils
+
+slim = tf.contrib.slim
+trunc_normal = lambda stddev: tf.truncated_normal_initializer(0.0, stddev)
+
+
+def inception_v1_base(inputs,
+ final_endpoint='Mixed_5c',
+ scope='InceptionV1'):
+ """Defines the Inception V1 base architecture.
+
+ This architecture is defined in:
+ Going deeper with convolutions
+ Christian Szegedy, Wei Liu, Yangqing Jia, Pierre Sermanet, Scott Reed,
+ Dragomir Anguelov, Dumitru Erhan, Vincent Vanhoucke, Andrew Rabinovich.
+ http://arxiv.org/pdf/1409.4842v1.pdf.
+
+ Args:
+ inputs: a tensor of size [batch_size, height, width, channels].
+ final_endpoint: specifies the endpoint to construct the network up to. It
+ can be one of ['Conv2d_1a_7x7', 'MaxPool_2a_3x3', 'Conv2d_2b_1x1',
+ 'Conv2d_2c_3x3', 'MaxPool_3a_3x3', 'Mixed_3b', 'Mixed_3c',
+ 'MaxPool_4a_3x3', 'Mixed_4b', 'Mixed_4c', 'Mixed_4d', 'Mixed_4e',
+ 'Mixed_4f', 'MaxPool_5a_2x2', 'Mixed_5b', 'Mixed_5c']
+ scope: Optional variable_scope.
+
+ Returns:
+ A dictionary from components of the network to the corresponding activation.
+
+ Raises:
+ ValueError: if final_endpoint is not set to one of the predefined values.
+ """
+ end_points = {}
+ with tf.variable_scope(scope, 'InceptionV1', [inputs]):
+ with slim.arg_scope(
+ [slim.conv2d, slim.fully_connected],
+ weights_initializer=trunc_normal(0.01)):
+ with slim.arg_scope([slim.conv2d, slim.max_pool2d],
+ stride=1, padding='SAME'):
+ end_point = 'Conv2d_1a_7x7'
+ net = slim.conv2d(inputs, 64, [7, 7], stride=2, scope=end_point)
+ end_points[end_point] = net
+ if final_endpoint == end_point: return net, end_points
+ end_point = 'MaxPool_2a_3x3'
+ net = slim.max_pool2d(net, [3, 3], stride=2, scope=end_point)
+ end_points[end_point] = net
+ if final_endpoint == end_point: return net, end_points
+ end_point = 'Conv2d_2b_1x1'
+ net = slim.conv2d(net, 64, [1, 1], scope=end_point)
+ end_points[end_point] = net
+ if final_endpoint == end_point: return net, end_points
+ end_point = 'Conv2d_2c_3x3'
+ net = slim.conv2d(net, 192, [3, 3], scope=end_point)
+ end_points[end_point] = net
+ if final_endpoint == end_point: return net, end_points
+ end_point = 'MaxPool_3a_3x3'
+ net = slim.max_pool2d(net, [3, 3], stride=2, scope=end_point)
+ end_points[end_point] = net
+ if final_endpoint == end_point: return net, end_points
+
+ end_point = 'Mixed_3b'
+ with tf.variable_scope(end_point):
+ with tf.variable_scope('Branch_0'):
+ branch_0 = slim.conv2d(net, 64, [1, 1], scope='Conv2d_0a_1x1')
+ with tf.variable_scope('Branch_1'):
+ branch_1 = slim.conv2d(net, 96, [1, 1], scope='Conv2d_0a_1x1')
+ branch_1 = slim.conv2d(branch_1, 128, [3, 3], scope='Conv2d_0b_3x3')
+ with tf.variable_scope('Branch_2'):
+ branch_2 = slim.conv2d(net, 16, [1, 1], scope='Conv2d_0a_1x1')
+ branch_2 = slim.conv2d(branch_2, 32, [3, 3], scope='Conv2d_0b_3x3')
+ with tf.variable_scope('Branch_3'):
+ branch_3 = slim.max_pool2d(net, [3, 3], scope='MaxPool_0a_3x3')
+ branch_3 = slim.conv2d(branch_3, 32, [1, 1], scope='Conv2d_0b_1x1')
+ net = tf.concat(axis=3, values=[branch_0, branch_1, branch_2, branch_3])
+ end_points[end_point] = net
+ if final_endpoint == end_point: return net, end_points
+
+ end_point = 'Mixed_3c'
+ with tf.variable_scope(end_point):
+ with tf.variable_scope('Branch_0'):
+ branch_0 = slim.conv2d(net, 128, [1, 1], scope='Conv2d_0a_1x1')
+ with tf.variable_scope('Branch_1'):
+ branch_1 = slim.conv2d(net, 128, [1, 1], scope='Conv2d_0a_1x1')
+ branch_1 = slim.conv2d(branch_1, 192, [3, 3], scope='Conv2d_0b_3x3')
+ with tf.variable_scope('Branch_2'):
+ branch_2 = slim.conv2d(net, 32, [1, 1], scope='Conv2d_0a_1x1')
+ branch_2 = slim.conv2d(branch_2, 96, [3, 3], scope='Conv2d_0b_3x3')
+ with tf.variable_scope('Branch_3'):
+ branch_3 = slim.max_pool2d(net, [3, 3], scope='MaxPool_0a_3x3')
+ branch_3 = slim.conv2d(branch_3, 64, [1, 1], scope='Conv2d_0b_1x1')
+ net = tf.concat(axis=3, values=[branch_0, branch_1, branch_2, branch_3])
+ end_points[end_point] = net
+ if final_endpoint == end_point: return net, end_points
+
+ end_point = 'MaxPool_4a_3x3'
+ net = slim.max_pool2d(net, [3, 3], stride=2, scope=end_point)
+ end_points[end_point] = net
+ if final_endpoint == end_point: return net, end_points
+
+ end_point = 'Mixed_4b'
+ with tf.variable_scope(end_point):
+ with tf.variable_scope('Branch_0'):
+ branch_0 = slim.conv2d(net, 192, [1, 1], scope='Conv2d_0a_1x1')
+ with tf.variable_scope('Branch_1'):
+ branch_1 = slim.conv2d(net, 96, [1, 1], scope='Conv2d_0a_1x1')
+ branch_1 = slim.conv2d(branch_1, 208, [3, 3], scope='Conv2d_0b_3x3')
+ with tf.variable_scope('Branch_2'):
+ branch_2 = slim.conv2d(net, 16, [1, 1], scope='Conv2d_0a_1x1')
+ branch_2 = slim.conv2d(branch_2, 48, [3, 3], scope='Conv2d_0b_3x3')
+ with tf.variable_scope('Branch_3'):
+ branch_3 = slim.max_pool2d(net, [3, 3], scope='MaxPool_0a_3x3')
+ branch_3 = slim.conv2d(branch_3, 64, [1, 1], scope='Conv2d_0b_1x1')
+ net = tf.concat(axis=3, values=[branch_0, branch_1, branch_2, branch_3])
+ end_points[end_point] = net
+ if final_endpoint == end_point: return net, end_points
+
+ end_point = 'Mixed_4c'
+ with tf.variable_scope(end_point):
+ with tf.variable_scope('Branch_0'):
+ branch_0 = slim.conv2d(net, 160, [1, 1], scope='Conv2d_0a_1x1')
+ with tf.variable_scope('Branch_1'):
+ branch_1 = slim.conv2d(net, 112, [1, 1], scope='Conv2d_0a_1x1')
+ branch_1 = slim.conv2d(branch_1, 224, [3, 3], scope='Conv2d_0b_3x3')
+ with tf.variable_scope('Branch_2'):
+ branch_2 = slim.conv2d(net, 24, [1, 1], scope='Conv2d_0a_1x1')
+ branch_2 = slim.conv2d(branch_2, 64, [3, 3], scope='Conv2d_0b_3x3')
+ with tf.variable_scope('Branch_3'):
+ branch_3 = slim.max_pool2d(net, [3, 3], scope='MaxPool_0a_3x3')
+ branch_3 = slim.conv2d(branch_3, 64, [1, 1], scope='Conv2d_0b_1x1')
+ net = tf.concat(axis=3, values=[branch_0, branch_1, branch_2, branch_3])
+ end_points[end_point] = net
+ if final_endpoint == end_point: return net, end_points
+
+ end_point = 'Mixed_4d'
+ with tf.variable_scope(end_point):
+ with tf.variable_scope('Branch_0'):
+ branch_0 = slim.conv2d(net, 128, [1, 1], scope='Conv2d_0a_1x1')
+ with tf.variable_scope('Branch_1'):
+ branch_1 = slim.conv2d(net, 128, [1, 1], scope='Conv2d_0a_1x1')
+ branch_1 = slim.conv2d(branch_1, 256, [3, 3], scope='Conv2d_0b_3x3')
+ with tf.variable_scope('Branch_2'):
+ branch_2 = slim.conv2d(net, 24, [1, 1], scope='Conv2d_0a_1x1')
+ branch_2 = slim.conv2d(branch_2, 64, [3, 3], scope='Conv2d_0b_3x3')
+ with tf.variable_scope('Branch_3'):
+ branch_3 = slim.max_pool2d(net, [3, 3], scope='MaxPool_0a_3x3')
+ branch_3 = slim.conv2d(branch_3, 64, [1, 1], scope='Conv2d_0b_1x1')
+ net = tf.concat(axis=3, values=[branch_0, branch_1, branch_2, branch_3])
+ end_points[end_point] = net
+ if final_endpoint == end_point: return net, end_points
+
+ end_point = 'Mixed_4e'
+ with tf.variable_scope(end_point):
+ with tf.variable_scope('Branch_0'):
+ branch_0 = slim.conv2d(net, 112, [1, 1], scope='Conv2d_0a_1x1')
+ with tf.variable_scope('Branch_1'):
+ branch_1 = slim.conv2d(net, 144, [1, 1], scope='Conv2d_0a_1x1')
+ branch_1 = slim.conv2d(branch_1, 288, [3, 3], scope='Conv2d_0b_3x3')
+ with tf.variable_scope('Branch_2'):
+ branch_2 = slim.conv2d(net, 32, [1, 1], scope='Conv2d_0a_1x1')
+ branch_2 = slim.conv2d(branch_2, 64, [3, 3], scope='Conv2d_0b_3x3')
+ with tf.variable_scope('Branch_3'):
+ branch_3 = slim.max_pool2d(net, [3, 3], scope='MaxPool_0a_3x3')
+ branch_3 = slim.conv2d(branch_3, 64, [1, 1], scope='Conv2d_0b_1x1')
+ net = tf.concat(axis=3, values=[branch_0, branch_1, branch_2, branch_3])
+ end_points[end_point] = net
+ if final_endpoint == end_point: return net, end_points
+
+ end_point = 'Mixed_4f'
+ with tf.variable_scope(end_point):
+ with tf.variable_scope('Branch_0'):
+ branch_0 = slim.conv2d(net, 256, [1, 1], scope='Conv2d_0a_1x1')
+ with tf.variable_scope('Branch_1'):
+ branch_1 = slim.conv2d(net, 160, [1, 1], scope='Conv2d_0a_1x1')
+ branch_1 = slim.conv2d(branch_1, 320, [3, 3], scope='Conv2d_0b_3x3')
+ with tf.variable_scope('Branch_2'):
+ branch_2 = slim.conv2d(net, 32, [1, 1], scope='Conv2d_0a_1x1')
+ branch_2 = slim.conv2d(branch_2, 128, [3, 3], scope='Conv2d_0b_3x3')
+ with tf.variable_scope('Branch_3'):
+ branch_3 = slim.max_pool2d(net, [3, 3], scope='MaxPool_0a_3x3')
+ branch_3 = slim.conv2d(branch_3, 128, [1, 1], scope='Conv2d_0b_1x1')
+ net = tf.concat(axis=3, values=[branch_0, branch_1, branch_2, branch_3])
+ end_points[end_point] = net
+ if final_endpoint == end_point: return net, end_points
+
+ end_point = 'MaxPool_5a_2x2'
+ net = slim.max_pool2d(net, [2, 2], stride=2, scope=end_point)
+ end_points[end_point] = net
+ if final_endpoint == end_point: return net, end_points
+
+ end_point = 'Mixed_5b'
+ with tf.variable_scope(end_point):
+ with tf.variable_scope('Branch_0'):
+ branch_0 = slim.conv2d(net, 256, [1, 1], scope='Conv2d_0a_1x1')
+ with tf.variable_scope('Branch_1'):
+ branch_1 = slim.conv2d(net, 160, [1, 1], scope='Conv2d_0a_1x1')
+ branch_1 = slim.conv2d(branch_1, 320, [3, 3], scope='Conv2d_0b_3x3')
+ with tf.variable_scope('Branch_2'):
+ branch_2 = slim.conv2d(net, 32, [1, 1], scope='Conv2d_0a_1x1')
+ branch_2 = slim.conv2d(branch_2, 128, [3, 3], scope='Conv2d_0a_3x3')
+ with tf.variable_scope('Branch_3'):
+ branch_3 = slim.max_pool2d(net, [3, 3], scope='MaxPool_0a_3x3')
+ branch_3 = slim.conv2d(branch_3, 128, [1, 1], scope='Conv2d_0b_1x1')
+ net = tf.concat(axis=3, values=[branch_0, branch_1, branch_2, branch_3])
+ end_points[end_point] = net
+ if final_endpoint == end_point: return net, end_points
+
+ end_point = 'Mixed_5c'
+ with tf.variable_scope(end_point):
+ with tf.variable_scope('Branch_0'):
+ branch_0 = slim.conv2d(net, 384, [1, 1], scope='Conv2d_0a_1x1')
+ with tf.variable_scope('Branch_1'):
+ branch_1 = slim.conv2d(net, 192, [1, 1], scope='Conv2d_0a_1x1')
+ branch_1 = slim.conv2d(branch_1, 384, [3, 3], scope='Conv2d_0b_3x3')
+ with tf.variable_scope('Branch_2'):
+ branch_2 = slim.conv2d(net, 48, [1, 1], scope='Conv2d_0a_1x1')
+ branch_2 = slim.conv2d(branch_2, 128, [3, 3], scope='Conv2d_0b_3x3')
+ with tf.variable_scope('Branch_3'):
+ branch_3 = slim.max_pool2d(net, [3, 3], scope='MaxPool_0a_3x3')
+ branch_3 = slim.conv2d(branch_3, 128, [1, 1], scope='Conv2d_0b_1x1')
+ net = tf.concat(axis=3, values=[branch_0, branch_1, branch_2, branch_3])
+ end_points[end_point] = net
+ if final_endpoint == end_point: return net, end_points
+ raise ValueError('Unknown final endpoint %s' % final_endpoint)
+
+
+def inception_v1(inputs,
+ num_classes=1000,
+ is_training=True,
+ dropout_keep_prob=0.8,
+ prediction_fn=slim.softmax,
+ spatial_squeeze=True,
+ reuse=None,
+ scope='InceptionV1'):
+ """Defines the Inception V1 architecture.
+
+ This architecture is defined in:
+
+ Going deeper with convolutions
+ Christian Szegedy, Wei Liu, Yangqing Jia, Pierre Sermanet, Scott Reed,
+ Dragomir Anguelov, Dumitru Erhan, Vincent Vanhoucke, Andrew Rabinovich.
+ http://arxiv.org/pdf/1409.4842v1.pdf.
+
+ The default image size used to train this network is 224x224.
+
+ Args:
+ inputs: a tensor of size [batch_size, height, width, channels].
+ num_classes: number of predicted classes.
+ is_training: whether is training or not.
+ dropout_keep_prob: the percentage of activation values that are retained.
+ prediction_fn: a function to get predictions out of logits.
+ spatial_squeeze: if True, logits is of shape [B, C], if false logits is
+ of shape [B, 1, 1, C], where B is batch_size and C is number of classes.
+ reuse: whether or not the network and its variables should be reused. To be
+ able to reuse 'scope' must be given.
+ scope: Optional variable_scope.
+
+ Returns:
+ logits: the pre-softmax activations, a tensor of size
+ [batch_size, num_classes]
+ end_points: a dictionary from components of the network to the corresponding
+ activation.
+ """
+ # Final pooling and prediction
+ with tf.variable_scope(scope, 'InceptionV1', [inputs, num_classes],
+ reuse=reuse) as scope:
+ with slim.arg_scope([slim.batch_norm, slim.dropout],
+ is_training=is_training):
+ net, end_points = inception_v1_base(inputs, scope=scope)
+ with tf.variable_scope('Logits'):
+ net = slim.avg_pool2d(net, [7, 7], stride=1, scope='AvgPool_0a_7x7')
+ net = slim.dropout(net,
+ dropout_keep_prob, scope='Dropout_0b')
+ logits = slim.conv2d(net, num_classes, [1, 1], activation_fn=None,
+ normalizer_fn=None, scope='Conv2d_0c_1x1')
+ if spatial_squeeze:
+ logits = tf.squeeze(logits, [1, 2], name='SpatialSqueeze')
+
+ end_points['Logits'] = logits
+ end_points['Predictions'] = prediction_fn(logits, scope='Predictions')
+ return logits, end_points
+inception_v1.default_image_size = 224
+
+inception_v1_arg_scope = inception_utils.inception_arg_scope