tkdrgithub
diff --git a/examples/vgg_cifar.py b/examples/inception_cifar.py
rename from examples/vgg_cifar.py
rename to examples/inception_cifar.py
Lines changed: 15 additions & 14 deletions
diff --git a/src/models/inception_module.py b/src/models/inception_module.py
Lines changed: 23 additions & 43 deletions
diff --git a/src/models/vgg_module.py b/src/models/vgg_module.py
Lines changed: 0 additions & 154 deletions
diff --git a/src/nets/googlenet.py b/src/nets/googlenet.py
Lines changed: 37 additions & 4 deletions
@@ -1,6 +1,6 @@
 #!/usr/bin/env python
 # -*- coding: utf-8 -*-
-# File: vgg_cifar.py
+# File: inception_cifar.py
 # Author: Qian Ge <geqian1001@gmail.com>
 
 import os
@@ -12,14 +12,15 @@
 
 sys.path.append('../')
 import loader as loader
-from src.nets.vgg import VGG_CIFAR10
+from src.nets.googlenet import GoogleNet_cifar
 from src.helper.trainer import Trainer
 from src.helper.evaluator import Evaluator
 
 
 DATA_PATH = '/home/qge2/workspace/data/dataset/cifar/'
-SAVE_PATH = '/home/qge2/workspace/data/out/vgg/cifar/final/'
-VGG_PATH = '/home/qge2/workspace/data/pretrain/vgg/vgg19.npy'
+# DATA_PATH = '/Users/gq/workspace/Dataset/cifar-10-batches-py/'
+SAVE_PATH = '/home/qge2/workspace/data/out/googlenet/cifar/'
+PRETRINED_PATH = '/home/qge2/workspace/data/pretrain/inception/googlenet.npy'
 
 def get_args():
     parser = argparse.ArgumentParser()
@@ -51,14 +52,14 @@ def train():
 
     pre_trained_path=None
     if FLAGS.finetune:
-        pre_trained_path = VGG_PATH
-    train_model = VGG_CIFAR10(
+        pre_trained_path = PRETRINED_PATH
+    train_model = GoogleNet_cifar(
         n_channel=3, n_class=10, pre_trained_path=pre_trained_path,
-        bn=True, wd=5e-3, trainable=True, sub_vgg_mean=False)
+        bn=True, wd=0, trainable=True, sub_imagenet_mean=False)
     train_model.create_train_model()
 
-    valid_model = VGG_CIFAR10(
-        n_channel=3, n_class=10, bn=True, sub_vgg_mean=False)
+    valid_model = GoogleNet_cifar(
+        n_channel=3, n_class=10, bn=True, sub_imagenet_mean=False)
     valid_model.create_test_model()
 
     trainer = Trainer(train_model, valid_model, train_data, init_lr=FLAGS.lr)
@@ -71,24 +72,24 @@ def train():
         for epoch_id in range(FLAGS.maxepoch):
             trainer.train_epoch(sess, keep_prob=FLAGS.keep_prob, summary_writer=writer)
             trainer.valid_epoch(sess, dataflow=valid_data, summary_writer=writer)
-            saver.save(sess, '{}vgg-cifar-epoch-{}'.format(SAVE_PATH, epoch_id))
-        saver.save(sess, '{}vgg-cifar-epoch-{}'.format(SAVE_PATH, epoch_id))
+        #     saver.save(sess, '{}inception-cifar-epoch-{}'.format(SAVE_PATH, epoch_id))
+        # saver.save(sess, '{}inception-cifar-epoch-{}'.format(SAVE_PATH, epoch_id))
 
 def evaluate():
     FLAGS = get_args()
     train_data, valid_data = loader.load_cifar(
         cifar_path=DATA_PATH, batch_size=FLAGS.bsize, substract_mean=True)
 
-    valid_model = VGG_CIFAR10(
-        n_channel=3, n_class=10, bn=True, sub_vgg_mean=False)
+    valid_model = GoogleNet(
+        n_channel=3, n_class=10, bn=True, sub_imagenet_mean=False)
     valid_model.create_test_model()
 
     evaluator = Evaluator(valid_model)
 
     with tf.Session() as sess:
         saver = tf.train.Saver()
         sess.run(tf.global_variables_initializer())
-        saver.restore(sess, '{}vgg-cifar-epoch-{}'.format(SAVE_PATH, FLAGS.load))
+        saver.restore(sess, '{}inception-cifar-epoch-{}'.format(SAVE_PATH, FLAGS.load))
         print('training set:', end='')
         evaluator.accuracy(sess, train_data)
         print('testing set:', end='')
 
@@ -61,19 +61,6 @@ def inception_layer(conv_11_size, conv_33_reduce_size, conv_33_size,
         convpool = L.conv(filter_size=1, out_dim=pool_size,
                           name='{}_pool_proj'.format(name))
 
-        # conv_11 = conv(inputs, 1, conv_11_size, '{}_1x1'.format(name))
-
-        # conv_33_reduce = conv(inputs, 1, conv_33_reduce_size,
-        #                       '{}_3x3_reduce'.format(name))
-        # conv_33 = conv(conv_33_reduce, 3, conv_33_size, '{}_3x3'.format(name))
-
-        # conv_55_reduce = conv(inputs, 1, conv_55_reduce_size,
-        #                       '{}_5x5_reduce'.format(name))
-        # conv_55 = conv(conv_55_reduce, 5, conv_55_size, '{}_5x5'.format(name))
-
-        # pool = max_pool(inputs, '{}_pool'.format(name), stride=1,
-        #                 padding='SAME', filter_size=3)
-        # convpool = conv(pool, 1, pool_size, '{}_pool_proj'.format(name))
         output = tf.concat([conv_11, conv_33, conv_55, convpool], 3,
                            name='{}_concat'.format(name))
         layer_dict['cur_input'] = output
@@ -143,7 +130,7 @@ def inception_layers(layer_dict, inputs=None, pretrained_dict=None,
 
     return layer_dict['cur_input']
 
-def inception_fc(layer_dict, n_class, keep_prob, inputs=None,
+def inception_fc(layer_dict, n_class, keep_prob=1., inputs=None,
                  pretrained_dict=None, is_training=True,
                  bn=False, init_w=None, trainable=True, wd=0):
 
@@ -161,36 +148,29 @@ def inception_fc(layer_dict, n_class, keep_prob, inputs=None,
 
     return layer_dict['cur_input']
 
+def auxiliary_classifier(layer_dict, n_class, keep_prob=1., inputs=None,
+                         pretrained_dict=None, is_training=True,
+                         bn=False, init_w=None, trainable=True, wd=0):
+    
+    if inputs is not None:
+        layer_dict['cur_input'] = inputs
 
-    # with arg_scope([inception_layer],
-    #                    trainable=self._trainable,
-    #                    data_dict=data_dict):
-    #         # inception3a = inception_layer(
-    #         #     pool2_lrn, 64, 96, 128, 16, 32, 32, name='inception_3a')
-    #         # inception3b = inception_layer(
-    #         #     inception3a, 128, 128, 192, 32, 96, 64, name='inception_3b')
-    #         # pool3 = max_pool(
-    #         #     inception3b, 'pool3', padding='SAME', filter_size=3, stride=2)
-
-    #         # inception4a = inception_layer(
-    #         #     pool3, 192, 96, 208, 16, 48, 64, name='inception_4a')
-    #         # inception4b = inception_layer(
-    #         #     inception4a, 160, 112, 224, 24, 64, 64, name='inception_4b')
-    #         # inception4c = inception_layer(
-    #         #     inception4b, 128, 128, 256, 24, 64, 64, name='inception_4c')
-    #         # inception4d = inception_layer(
-    #         #     inception4c, 112, 144, 288, 32, 64, 64, name='inception_4d')
-    #         # inception4e = inception_layer(
-    #         #     inception4d, 256, 160, 320, 32, 128, 128, name='inception_4e')
-    #         # pool4 = max_pool(
-    #         #     inception4e, 'pool4', padding='SAME', filter_size=3, stride=2)
-
-    #         inception5a = inception_layer(
-    #             pool4, 256, 160, 320, 32, 128, 128, name='inception_5a')
-    #         inception5b = inception_layer(
-    #             inception5a, 384, 192, 384, 48, 128, 128, name='inception_5b')
-
-
+    layer_dict['cur_input'] = tf.layers.average_pooling2d(
+        inputs=layer_dict['cur_input'],
+        pool_size=5, strides=3,
+        padding='valid', name='averagepool')
 
+    arg_scope = tf.contrib.framework.arg_scope
+    with arg_scope([L.conv], layer_dict=layer_dict, pretrained_dict=pretrained_dict,
+                   bn=bn, init_w=init_w, trainable=trainable,
+                   is_training=is_training, wd=wd, add_summary=False):
 
+        L.conv(1, 128, name='conv', stride=1, nl=tf.nn.relu)
+        L.conv(4, 1024, name='fc_1', stride=1, padding='VALID')
+        L.drop_out(layer_dict, is_training, keep_prob=keep_prob)
+        L.conv(1, 1024, name='fc_2', stride=1, padding='VALID', nl=tf.nn.relu)
+        L.drop_out(layer_dict, is_training, keep_prob=keep_prob)
+        L.conv(1, n_class, name='classifier', stride=1, padding='VALID')
+        layer_dict['cur_input'] = tf.squeeze(layer_dict['cur_input'], [1, 2])
+    return layer_dict['cur_input']
 
@@ -60,6 +60,13 @@ def create_train_model(self):
         with tf.variable_scope('fc_layers', reuse=tf.AUTO_REUSE):   
             self.layers['logits'] = self._fc_layers(self.layers['inception_out'])
 
+        with tf.variable_scope('auxiliary_classifier_0'):
+            self.layers['auxiliary_logits_0'] = self._auxiliary_classifier(
+                self.layers['inception_4a'])
+        with tf.variable_scope('auxiliary_classifier_1'):
+            self.layers['auxiliary_logits_1'] = self._auxiliary_classifier(
+                self.layers['inception_4d'])
+
     def create_test_model(self):
         self.set_is_training(is_training=False)
         self._create_test_input()
@@ -101,24 +108,50 @@ def _fc_layers(self, inputs):
             is_training=self.is_training, wd=self._wd)
         return fc_out
 
+    def _auxiliary_classifier(self, inputs):
+        logits = auxiliary_classifier(
+            layer_dict=self.layers, n_class=self.n_class, keep_prob=self.keep_prob,
+            inputs=inputs, pretrained_dict=None, is_training=self.is_training,
+            bn=self._bn, init_w=INIT_W, trainable=self._trainable, wd=self._wd)
+        return logits
+
     def _get_loss(self):
         with tf.name_scope('loss'):
             labels = self.label
-            logits = self.layers['gap_out']
-            # logits = tf.squeeze(logits, axis=1)
+            logits = self.layers['logits']
+            cross_entropy = tf.nn.sparse_softmax_cross_entropy_with_logits(
+                labels=labels,
+                logits=logits,
+                name='cross_entropy')
+        auxilarity_loss = self._get_auxiliary_loss(0) + self._get_auxiliary_loss(1)
+        return tf.reduce_mean(cross_entropy) + 0.3 * auxilarity_loss
+
+    def _get_auxiliary_loss(self, loss_id):
+        with tf.name_scope('auxilarity_loss_{}'.format(loss_id)):
+            labels = self.label
+            logits = self.layers['auxiliary_logits_{}'.format(loss_id)]
             cross_entropy = tf.nn.sparse_softmax_cross_entropy_with_logits(
                 labels=labels,
                 logits=logits,
                 name='cross_entropy')
-            return tf.reduce_mean(cross_entropy)
+        return tf.reduce_mean(cross_entropy)
 
     def _get_optimizer(self):
         return tf.train.AdamOptimizer(self.lr)
 
     def get_accuracy(self):
         with tf.name_scope('accuracy'):
-            prediction = tf.argmax(self.layers['gap_out'], axis=1)
+            prediction = tf.argmax(self.layers['logits'], axis=1)
             correct_prediction = tf.equal(prediction, self.label)
             return tf.reduce_mean(
                 tf.cast(correct_prediction, tf.float32), 
                 name = 'result')
+
+class GoogleNet_cifar(GoogleNet):
+    def _fc_layers(self, inputs):
+        fc_out = module.inception_fc(
+            layer_dict=self.layers, n_class=self.n_class, keep_prob=self.keep_prob,
+            inputs=inputs, pretrained_dict=None,
+            bn=self._bn, init_w=INIT_W, trainable=self._trainable,
+            is_training=self.is_training, wd=self._wd)
+        return fc_out