forked from WZMIAOMIAO/deep-learning-for-image-processing
Commit
wz authored and committed on Jul 24, 2020
1 parent 697520a · commit 3cf29a3
Showing 3 changed files with 338 additions and 0 deletions.
141 changes: 141 additions & 0 deletions
tensorflow_classification/Test4_goolenet/model_add_bn.py
@@ -0,0 +1,141 @@
from tensorflow.keras import layers, models, Model, Sequential


def InceptionV1(im_height=224, im_width=224, class_num=1000, aux_logits=False):
    # the tensor channel ordering in TensorFlow is NHWC
    input_image = layers.Input(shape=(im_height, im_width, 3), dtype="float32")
    # (None, 224, 224, 3)
    x = layers.Conv2D(64, kernel_size=7, strides=2, padding="SAME", use_bias=False, name="conv1/conv")(input_image)
    x = layers.BatchNormalization(momentum=0.9, epsilon=1e-5, name="conv1/bn")(x)
    x = layers.ReLU()(x)
    # (None, 112, 112, 64)
    x = layers.MaxPool2D(pool_size=3, strides=2, padding="SAME", name="maxpool_1")(x)
    # (None, 56, 56, 64)
    x = layers.Conv2D(64, kernel_size=1, use_bias=False, name="conv2/conv")(x)
    x = layers.BatchNormalization(momentum=0.9, epsilon=1e-5, name="conv2/bn")(x)
    x = layers.ReLU()(x)
    # (None, 56, 56, 64)
    x = layers.Conv2D(192, kernel_size=3, padding="SAME", use_bias=False, name="conv3/conv")(x)
    x = layers.BatchNormalization(momentum=0.9, epsilon=1e-5, name="conv3/bn")(x)
    x = layers.ReLU()(x)
    # (None, 56, 56, 192)
    x = layers.MaxPool2D(pool_size=3, strides=2, padding="SAME", name="maxpool_2")(x)

    # (None, 28, 28, 192)
    x = Inception(64, 96, 128, 16, 32, 32, name="inception3a")(x)
    # (None, 28, 28, 256)
    x = Inception(128, 128, 192, 32, 96, 64, name="inception3b")(x)

    # (None, 28, 28, 480)
    x = layers.MaxPool2D(pool_size=3, strides=2, padding="SAME", name="maxpool_3")(x)
    # (None, 14, 14, 480)
    x = Inception(192, 96, 208, 16, 48, 64, name="inception4a")(x)
    if aux_logits:
        aux1 = InceptionAux(class_num, name="aux1")(x)

    # (None, 14, 14, 512)
    x = Inception(160, 112, 224, 24, 64, 64, name="inception4b")(x)
    # (None, 14, 14, 512)
    x = Inception(128, 128, 256, 24, 64, 64, name="inception4c")(x)
    # (None, 14, 14, 512)
    x = Inception(112, 144, 288, 32, 64, 64, name="inception4d")(x)
    if aux_logits:
        aux2 = InceptionAux(class_num, name="aux2")(x)

    # (None, 14, 14, 528)
    x = Inception(256, 160, 320, 32, 128, 128, name="inception4e")(x)
    # (None, 14, 14, 832)
    x = layers.MaxPool2D(pool_size=2, strides=2, padding="SAME", name="maxpool_4")(x)

    # (None, 7, 7, 832)
    x = Inception(256, 160, 320, 32, 128, 128, name="inception5a")(x)
    # (None, 7, 7, 832)
    x = Inception(384, 192, 384, 48, 128, 128, name="inception5b")(x)
    # (None, 7, 7, 1024)
    x = layers.AvgPool2D(pool_size=7, strides=1, name="avgpool_1")(x)

    # (None, 1, 1, 1024)
    x = layers.Flatten(name="output_flatten")(x)
    # (None, 1024)
    x = layers.Dropout(rate=0.4, name="output_dropout")(x)
    x = layers.Dense(class_num, name="fc")(x)
    # (None, class_num)
    aux3 = layers.Softmax()(x)

    if aux_logits:
        model = models.Model(inputs=input_image, outputs=[aux1, aux2, aux3])
    else:
        model = models.Model(inputs=input_image, outputs=aux3)
    return model


class Inception(layers.Layer):
    def __init__(self, ch1x1, ch3x3red, ch3x3, ch5x5red, ch5x5, pool_proj, **kwargs):
        super(Inception, self).__init__(**kwargs)
        self.branch1 = Sequential([
            layers.Conv2D(ch1x1, kernel_size=1, use_bias=False, name="conv"),
            layers.BatchNormalization(momentum=0.9, epsilon=1e-5, name="bn"),
            layers.ReLU()], name="branch1")

        self.branch2 = Sequential([
            layers.Conv2D(ch3x3red, kernel_size=1, use_bias=False, name="0/conv"),
            layers.BatchNormalization(momentum=0.9, epsilon=1e-5, name="0/bn"),
            layers.ReLU(),
            layers.Conv2D(ch3x3, kernel_size=3, padding="SAME", use_bias=False, name="1/conv"),
            layers.BatchNormalization(momentum=0.9, epsilon=1e-5, name="1/bn"),
            layers.ReLU()], name="branch2")  # output_size = input_size

        self.branch3 = Sequential([
            layers.Conv2D(ch5x5red, kernel_size=1, use_bias=False, name="0/conv"),
            layers.BatchNormalization(momentum=0.9, epsilon=1e-5, name="0/bn"),
            layers.ReLU(),
            # note: kernel_size=3 (rather than 5) in this branch mirrors torchvision's
            # GoogLeNet implementation, so the converted pretrained weights line up
            layers.Conv2D(ch5x5, kernel_size=3, padding="SAME", use_bias=False, name="1/conv"),
            layers.BatchNormalization(momentum=0.9, epsilon=1e-5, name="1/bn"),
            layers.ReLU()], name="branch3")  # output_size = input_size

        self.branch4 = Sequential([
            layers.MaxPool2D(pool_size=3, strides=1, padding="SAME"),  # caution: default strides == pool_size
            layers.Conv2D(pool_proj, kernel_size=1, use_bias=False, name="1/conv"),
            layers.BatchNormalization(momentum=0.9, epsilon=1e-5, name="1/bn"),
            layers.ReLU()], name="branch4")  # output_size = input_size

    def call(self, inputs, **kwargs):
        branch1 = self.branch1(inputs)
        branch2 = self.branch2(inputs)
        branch3 = self.branch3(inputs)
        branch4 = self.branch4(inputs)
        outputs = layers.concatenate([branch1, branch2, branch3, branch4])
        return outputs


class InceptionAux(layers.Layer):
    def __init__(self, num_classes, **kwargs):
        super(InceptionAux, self).__init__(**kwargs)
        self.averagePool = layers.AvgPool2D(pool_size=5, strides=3)
        self.conv = layers.Conv2D(128, kernel_size=1, use_bias=False, name="conv/conv")
        self.bn1 = layers.BatchNormalization(momentum=0.9, epsilon=1e-5, name="conv/bn")
        self.relu1 = layers.ReLU()

        self.fc1 = layers.Dense(1024, activation="relu", name="fc1")
        self.fc2 = layers.Dense(num_classes, name="fc2")
        self.softmax = layers.Softmax()

    def call(self, inputs, **kwargs):
        # aux1: N x 14 x 14 x 512, aux2: N x 14 x 14 x 528
        x = self.averagePool(inputs)
        # aux1: N x 4 x 4 x 512, aux2: N x 4 x 4 x 528
        x = self.conv(x)
        x = self.bn1(x)
        x = self.relu1(x)
        # N x 4 x 4 x 128
        x = layers.Flatten()(x)
        x = layers.Dropout(rate=0.5)(x)
        # N x 2048
        x = self.fc1(x)
        x = layers.Dropout(rate=0.5)(x)
        # N x 1024
        x = self.fc2(x)
        # N x num_classes
        x = self.softmax(x)

        return x
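For reference, a minimal smoke test of this model (not part of the commit; it assumes model_add_bn.py is importable and TensorFlow 2.x is installed) builds the network with both auxiliary heads enabled and checks the shapes of the three softmax outputs:

import tensorflow as tf
from model_add_bn import InceptionV1

# build the network with both auxiliary classifiers enabled
model = InceptionV1(im_height=224, im_width=224, class_num=5, aux_logits=True)
# run a dummy NHWC batch of two images through the graph
dummy = tf.random.normal((2, 224, 224, 3))
aux1, aux2, main_out = model(dummy, training=False)
print(aux1.shape, aux2.shape, main_out.shape)  # each should be (2, 5)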
71 changes: 71 additions & 0 deletions
@@ -0,0 +1,71 @@
import torch
import numpy as np
import tensorflow as tf


def rename_var(pth_path, new_ckpt_path, num_classes):
    pytorch_dict = torch.load(pth_path)

    with tf.Graph().as_default(), tf.compat.v1.Session().as_default() as sess:
        new_var_list = []

        for key, value in pytorch_dict.items():
            if key in except_list:
                continue

            new_name = key
            value = value.detach().numpy()

            new_name = new_name.replace(".", "/")

            # reorder the conv kernels from PyTorch's (OIHW) layout to TensorFlow's (HWIO)
            if 'conv/weight' in new_name:
                new_name = new_name.replace("weight", "kernel")
                value = np.transpose(value, (2, 3, 1, 0)).astype(np.float32)
            elif 'bn' in new_name:
                if "num_batches_tracked" in new_name:
                    continue

                new_name = new_name.replace("weight", "gamma")
                new_name = new_name.replace("bias", "beta")
                new_name = new_name.replace("running_mean", "moving_mean")
                new_name = new_name.replace("running_var", "moving_variance")

                value = np.transpose(value).astype(np.float32)
            elif 'fc1' in new_name:
                new_name = new_name.replace("weight", "kernel")
                value = np.transpose(value).astype(np.float32)

            re_var = tf.Variable(value, name=new_name)
            new_var_list.append(re_var)

        # aux1
        re_var = tf.Variable(tf.keras.initializers.he_uniform()([1024, num_classes]), name="aux1/fc2/kernel")
        new_var_list.append(re_var)
        re_var = tf.Variable(tf.keras.initializers.he_uniform()([num_classes]), name="aux1/fc2/bias")
        new_var_list.append(re_var)

        # aux2
        re_var = tf.Variable(tf.keras.initializers.he_uniform()([1024, num_classes]), name="aux2/fc2/kernel")
        new_var_list.append(re_var)
        re_var = tf.Variable(tf.keras.initializers.he_uniform()([num_classes]), name="aux2/fc2/bias")
        new_var_list.append(re_var)

        # fc
        re_var = tf.Variable(tf.keras.initializers.he_uniform()([1024, num_classes]), name="fc/kernel")
        new_var_list.append(re_var)
        re_var = tf.Variable(tf.keras.initializers.he_uniform()([num_classes]), name="fc/bias")
        new_var_list.append(re_var)

        saver = tf.compat.v1.train.Saver(new_var_list)
        sess.run(tf.compat.v1.global_variables_initializer())
        saver.save(sess, save_path=new_ckpt_path, write_meta_graph=False, write_state=False)


# this script is only meant for use with model_add_bn.py
except_list = ['aux1.fc2.weight', 'aux1.fc2.bias', 'aux2.fc2.weight', 'aux2.fc2.bias', 'fc.weight', 'fc.bias']
# https://download.pytorch.org/models/googlenet-1378be20.pth
pth_path = './googlenet-1378be20.pth'
new_ckpt_path = './pretrain_weights.ckpt'
num_classes = 5
rename_var(pth_path, new_ckpt_path, num_classes)
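As a quick sanity check (not part of the commit), the renamed variables in the converted checkpoint can be listed with tf.train.list_variables; the conv kernel shapes should already be in TensorFlow's HWIO layout:

import tensorflow as tf

# print every variable stored in the converted checkpoint together with its shape
for name, shape in tf.train.list_variables('./pretrain_weights.ckpt'):
    print(name, shape)  # e.g. conv1/conv/kernel [7, 7, 3, 64], conv1/bn/gamma [64]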
126 changes: 126 additions & 0 deletions
tensorflow_classification/Test4_goolenet/train_add_bn.py
@@ -0,0 +1,126 @@
from tensorflow.keras.preprocessing.image import ImageDataGenerator
import matplotlib.pyplot as plt
from model_add_bn import InceptionV1
import tensorflow as tf
import json
import os
import numpy as np

data_root = os.path.abspath(os.path.join(os.getcwd(), "../.."))  # get data root path
image_path = data_root + "/data_set/flower_data/"  # flower data set path
train_dir = image_path + "train"
validation_dir = image_path + "val"

# create directory for saving weights
if not os.path.exists("save_weights"):
    os.makedirs("save_weights")

im_height = 224
im_width = 224
batch_size = 16
epochs = 30


def pre_function(img: np.ndarray):
    # img = im.open('test.jpg')
    # img = np.array(img).astype(np.float32)
    img = img / 255.
    img = img - [0.485, 0.456, 0.406]
    img = img / [0.229, 0.224, 0.225]

    return img


# data generator with data augmentation
train_image_generator = ImageDataGenerator(preprocessing_function=pre_function,
                                           horizontal_flip=True)
validation_image_generator = ImageDataGenerator(preprocessing_function=pre_function)

train_data_gen = train_image_generator.flow_from_directory(directory=train_dir,
                                                            batch_size=batch_size,
                                                            shuffle=True,
                                                            target_size=(im_height, im_width),
                                                            class_mode='categorical')
total_train = train_data_gen.n

# get class dict
class_indices = train_data_gen.class_indices

# transform value and key of dict
inverse_dict = dict((val, key) for key, val in class_indices.items())
# write dict into json file
json_str = json.dumps(inverse_dict, indent=4)
with open('class_indices.json', 'w') as json_file:
    json_file.write(json_str)

# use the non-augmenting validation generator for the validation set
val_data_gen = validation_image_generator.flow_from_directory(directory=validation_dir,
                                                               batch_size=batch_size,
                                                               shuffle=True,
                                                               target_size=(im_height, im_width),
                                                               class_mode='categorical')
total_val = val_data_gen.n

model = InceptionV1(im_height=im_height, im_width=im_width, class_num=5, aux_logits=True)
# model.build((batch_size, 224, 224, 3))  # when using subclass model
model.load_weights("pretrain_weights.ckpt")
model.summary()

# using keras low-level api for training
loss_object = tf.keras.losses.CategoricalCrossentropy(from_logits=False)
optimizer = tf.keras.optimizers.Adam(learning_rate=0.0005)

train_loss = tf.keras.metrics.Mean(name='train_loss')
train_accuracy = tf.keras.metrics.CategoricalAccuracy(name='train_accuracy')

test_loss = tf.keras.metrics.Mean(name='test_loss')
test_accuracy = tf.keras.metrics.CategoricalAccuracy(name='test_accuracy')


@tf.function
def train_step(images, labels):
    with tf.GradientTape() as tape:
        aux1, aux2, output = model(images, training=True)
        loss1 = loss_object(labels, aux1)
        loss2 = loss_object(labels, aux2)
        loss3 = loss_object(labels, output)
        # weight the two auxiliary losses by 0.3, as in the original GoogLeNet paper
        loss = loss1 * 0.3 + loss2 * 0.3 + loss3
    gradients = tape.gradient(loss, model.trainable_variables)
    optimizer.apply_gradients(zip(gradients, model.trainable_variables))

    train_loss(loss)
    train_accuracy(labels, output)


@tf.function
def test_step(images, labels):
    _, _, output = model(images, training=False)
    t_loss = loss_object(labels, output)

    test_loss(t_loss)
    test_accuracy(labels, output)


best_test_loss = float('inf')
for epoch in range(1, epochs + 1):
    train_loss.reset_states()      # clear history info
    train_accuracy.reset_states()  # clear history info
    test_loss.reset_states()       # clear history info
    test_accuracy.reset_states()   # clear history info

    for step in range(total_train // batch_size):
        images, labels = next(train_data_gen)
        train_step(images, labels)

    for step in range(total_val // batch_size):
        test_images, test_labels = next(val_data_gen)
        test_step(test_images, test_labels)

    template = 'Epoch {}, Loss: {}, Accuracy: {}, Test Loss: {}, Test Accuracy: {}'
    print(template.format(epoch,
                          train_loss.result(),
                          train_accuracy.result() * 100,
                          test_loss.result(),
                          test_accuracy.result() * 100))
    if test_loss.result() < best_test_loss:
        best_test_loss = test_loss.result()
        model.save_weights("./save_weights/myInceptionV1.h5")
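After training, a minimal inference sketch along these lines could classify a single image (not part of the commit; test.jpg and the file locations are assumptions, and the network must be rebuilt with aux_logits=True so the saved weights match the architecture):

import json
import numpy as np
from PIL import Image
from model_add_bn import InceptionV1

# rebuild the exact architecture that produced the saved weights
model = InceptionV1(im_height=224, im_width=224, class_num=5, aux_logits=True)
model.load_weights("./save_weights/myInceptionV1.h5")

# preprocess one image the same way as pre_function above
img = Image.open("test.jpg").resize((224, 224))  # hypothetical RGB test image
img = np.array(img, dtype=np.float32) / 255.
img = (img - [0.485, 0.456, 0.406]) / [0.229, 0.224, 0.225]
img = np.expand_dims(img.astype(np.float32), axis=0)

# only the main head is used at inference time
_, _, output = model(img, training=False)
with open("class_indices.json", "r") as f:
    class_dict = json.load(f)
print(class_dict[str(int(np.argmax(output)))])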