Classifier_Model.py

""" train and test for a convolutional neural network for predicting face attrubute for celebA """

import os
import time
import glob
import numpy as np
import pandas as pd
import PIL
from keras.applications.inception_v3 import preprocess_input
from keras.applications.inception_v3 import InceptionV3
from keras.models import Model
from keras.layers import Dense, GlobalAveragePooling2D

import tensorflow as tf
import keras.backend.tensorflow_backend as KTF

config = tf.ConfigProto()
config.gpu_options.allow_growth = True  # 不全部占满显存, 按需分配
session = tf.Session(config=config)

# 设置session
KTF.set_session(session)

path_celeba_img = '/home1/yuanye/data/celebahq/celebahq/'
path_celeba_att = '/home1/yuanye/data/celebahq/new_att.txt'
path_model_save = '/home1/Nan_Y/stylegan2/stylegan2_pytorch-master/result'

""" create path if not exist """
for path_used in [path_celeba_img, path_celeba_att, path_model_save]:
    if not os.path.exists(path_used):
        os.mkdir(path_used)


def create_cnn_model(size_output=None, tf_print=False):
    """
    create keras model with convolution layers of MobileNet and added fully connected layers on to top
    :param size_output: number of nodes in the output layer
    :param tf_print:    True/False to print
    :return: keras model object
    """

    if size_output is None:
        # get number of attrubutes, needed for defining the final layer size of network
        df_attr = pd.read_csv(path_celeba_att, sep='\s+', header=1, index_col=0)
        size_output = df_attr.shape[1]

    # Load the convolutional layers of pretrained model: mobilenet
    base_model = InceptionV3(include_top=False, input_shape=(1024, 1024, 3), weights="imagenet")

    # add fully connected layers
    fc0 = base_model.output
    fc0_pool = GlobalAveragePooling2D(data_format='channels_last', name='fc0_pool')(fc0)
    fc1 = Dense(256, activation='relu', name='fc1_dense')(fc0_pool)
    fc2 = Dense(size_output, activation='tanh', name='fc2_dense')(fc1)

    model = Model(inputs=base_model.input, outputs=fc2)

    # freeze the early layers
    for layer in base_model.layers:
        layer.trainable = False

    model.compile(optimizer='sgd', loss='binary_crossentropy', metrics=['accuracy'])

    if tf_print:
        print('use convolution layers of MobileNet, add fully connected layers')
        print(model.summary())

    return model


def get_data_info(path_celeba_img=path_celeba_img, path_celeba_att=path_celeba_att, yn_print_head_tail=False):
    """
    function to get names of images files and and pandas data-frame containing face attributes

    :param path_celeba_img: path to image files directory (cropped to 128*128)
    :param path_celeba_att: path to face attribute file (the original txt)
    :param yn_print_head_tail: true/false to print head and tail of data
    :return: img_names(list of file names of images), df_attr (pandas dataframe of face attributes)
    """
    df_attr = pd.read_csv(path_celeba_att, sep='\s+', header=1, index_col=0)

    img_names = os.listdir(path_celeba_img)
    img_names = [img_name for img_name in img_names if img_name[-4:] == '.jpg']
    img_names.sort()

    assert df_attr.shape[0] == len(img_names), 'images number does not match attribute table'

    if yn_print_head_tail:
        print(df_attr.head(3))
        print(df_attr.tail(3))
        print(img_names[:3])
        print(img_names[-3:])

    assert df_attr.shape[0] == len(img_names), \
        'images number does not match attribute table'
    assert set(img_names) == set(df_attr.index.tolist()), \
        'image names are not consistent between image files and attribute table '

    return img_names, df_attr


try:
    img_names, df_attr = get_data_info()
    num_image, num_attr = df_attr.shape
    # print(len(img_names), img_names[0], num_image, num_attr)
except:
    raise Exception('can not reach data needed for training, here we can only do test')


def get_data_sample(img_name, yn_interactive_plot=False):
    """
    function to load one image and the corresponding attributes, either using idx_img or img_name

    :param img_idx:    index of image
    :param img_name:   name of image, will overwrite img_idx if given
    :param yn_interactive_plot: True/False to print the sample
    :return:           image (3d array, H*W*RGB), attributes (1d array)
    """

    # if img_name is None:  # if not given, use img_idx to find the name
    #     if img_idx is None:  # if not given, randomly select one
    #         img_idx = np.random.randint(num_image)
    #     img_name = img_names[img_idx]

    img = np.asarray(PIL.Image.open(os.path.join(path_celeba_img, img_name))).astype(np.float32)  # load image
    labels = df_attr.loc[img_name]  # get labels

    if yn_interactive_plot:  # if show things interactively for verification
        import matplotlib.pyplot as plt
        print(labels)
        print("image file name: {}".format(img_name))
        plt.imshow(img)
        plt.show()

    x = img
    y = np.array(labels)
    return x, y


def load_data_batch(batch_size, num_images_total=None):
    """
    load data and preprocess before feeding it to Keras model
    :param num_images_total:
    :return:
    """

    list_x, list_y = [], []

    if num_images_total is None:
        image_names_select = img_names
    else:
        image_names_select = np.random.choice(img_names, num_images_total, replace=False)

    batch_num = int(len(image_names_select) / batch_size)
    max_len = batch_num * batch_size
    X_samples = np.array(image_names_select[:max_len])

    # print(type(X_samples), X_samples.shape, X_samples[0])

    X_batches = np.split(X_samples, batch_num)  # 10000个图片分成了batch_size=10的1000份
    # print(type(X_batches) ,len(X_batches), X_batches[0], type(X_batches[0]))

    for i in range(len(X_batches)):
        for j in range(batch_size):
            x, y = get_data_sample(X_batches[i][j])
            list_x.append(x)
            list_y.append(y)
        x_batch = np.stack(list_x, axis=0)
        y_batch = np.stack(list_y, axis=0)
        x_batch_ready = preprocess_input(x_batch)
        y_batch_ready = np.array(y_batch, dtype='float32')
        yield x_batch_ready, y_batch_ready

    # for img_name in image_names_select:
    #     x, y = get_data_sample(img_name=img_name, yn_interactive_plot=False)
    #     list_x.append(x)
    #     list_y.append(y)
    #
    # x_batch = np.stack(list_x, axis=0)
    # y_batch = np.stack(list_y, axis=0)
    #
    # x_batch_ready = preprocess_input(x_batch)
    # y_batch_ready = np.array(y_batch, dtype='float32')

    # return x_batch_ready, y_batch_ready


##
def train_protocol():
    """ train the model with model.fit() """

    model = create_cnn_model(tf_print=True)

    model.compile(optimizer='adam', loss='binary_crossentropy', metrics=['accuracy'])

    # x_all, y_all = load_data_batch(num_images_total=30000)

    # model.fit(x=x_all, y=y_all, batch_size=32, epochs=50, verbose=2,
    #           validation_split=0.125, shuffle=True)

    model.fit_generator(
        load_data_batch(batch_size=5, num_images_total=len(img_names)),
        epochs=50,
        steps_per_epoch=int(len(img_names) / 5))

    name_model_save = os.path.join(path_model_save, 'model_{}.h5'.format(gen_time_str()))
    model.save(filepath=name_model_save)


##
def gen_time_str():
    return time.strftime("%Y%m%d_%H%M%S", time.gmtime())


def get_list_model_save(path_model_save=path_model_save):
    return glob.glob(os.path.join(path_model_save, 'model*.h5'))


if __name__ == '__main__':
    train_protocol()
    # data_ier = load_data_batch(batch_size=10, num_images_total=10000)
    # x_batch, y_batch = next(data_ier)
    # print(x_batch.shape, y_batch.shape)