An AlexNet Implementation Based on TensorFlow


import random

import cv2 as cv
import numpy as np
import tensorflow as tf

# local helpers: parse_new_data, alignment_data, approximate_normalization,
# random_sample, random_shuffle, batch_norm
from test import *


ABS_PATH = "/home/elvis/work/ML/tensorflow/separa/"


SIZE = 4743
# SIZE = 828


LABEL = 5
# LABEL = 6
TRAIN_SIZE = 768
# ACCELERATION_FACTOR = 256
ACCELERATION_FACTOR = 2048
BASE_DIVIDE = 2048
# TRAIN_SIZE = 3200
BATCH_SIZE = 128
GLOBAL_STEP = 200000000
DECAY_STEPS = 100
EVAL_SIZE = SIZE - TRAIN_SIZE
# IMAGE_SIZE = 645 - 60
IMAGE_SIZE = 227
NUM_CHANNEL = 3
REPORT_CONTROL = 10
TRAIN_SLICE = (int(SIZE / LABEL * round((float(TRAIN_SIZE) / SIZE), 1)))


LEARNING_RATE = 0.001
# REGULAR = 3e-3
REGULAR = 3e-4
DROP_OUT = 80e-2
DECAY_RATE = 0.9995
MOMENTUM = 99e-2
SEED = int(random.random() * 1000)
BATCH_NORMALIZATION = 1e-3


# SEED = 295.730694719
# SEED = 935.121374578
# SEED = 149.555544719
# SEED = 266.751015428  # worked well for this data


out_file = "./cleaned_data_1.csv"


def data_clean(img, filename, label):
    """Interactively review one image: press 'a' to accept the current label,
    'b' to type in a corrected one; the result is appended to out_file."""
    window_name = "IMG"
    label = np.argmax(label)
    print (filename)
    print (label)
    cv.namedWindow(window_name)
    while True:
        cv.imshow(window_name, img)
        character = cv.waitKey(100)
        if int(character) == ord('a'):  # accept the label as-is
            with open(out_file, 'a+') as f:
                f.writelines(str(filename) + "," + str(label) + "\n")
            break
        elif int(character) == ord('b'):  # override with a manual label
            label = input("Enter the label you want: ")
            with open(out_file, 'a+') as f:
                f.writelines(str(filename) + "," + str(label) + "\n")
            break
        else:
            continue


def main(argv=None):
    if argv is None:
        print ("ERROR: argv is None")
    else:
        print (argv)
    global SIZE


    data, label, fileset = parse_new_data(SIZE=SIZE, IMAGE_SIZE=IMAGE_SIZE, NUM_CHANNEL=NUM_CHANNEL, LABEL=LABEL,
                                          BASE_DIVIDE=BASE_DIVIDE)


    # for x in range(SIZE):
    #     data_clean(data[x], fileset[x], label[x])


    print (data.shape)
    print (data.dtype)


    print (fileset[0])
    print (label[0])


    print (fileset[1])
    print (label[1])


    print (fileset[-1])
    print (label[-1])


    SIZE = label.shape[0]


    data, label = alignment_data(data=data, label=label, LABEL=LABEL, BASE_DIVIDE=BASE_DIVIDE)


    data = approximate_normalization(data)
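    # approximate_normalization comes from the local `test` module, whose
    # source is not shown here. As a hedged sketch only (an assumption, not
    # the module's actual code), a typical normalization for uint8 images is:
    #
    #   def approximate_normalization(x):
    #       return x / 255.0 - 0.5  # center pixel values roughly in [-0.5, 0.5]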


    train_data, train_label, eval_data, eval_label = random_sample(data, label, ACCELERATION_FACTOR, LABEL)


    TRAIN_SIZE = train_label.shape[0]
    EVAL_SIZE = eval_label.shape[0]


    train_data, train_label = random_shuffle(train_data, train_label)
    eval_data, eval_label = random_shuffle(eval_data, eval_label)


    train_data = train_data.astype(np.float32)
    eval_data = eval_data.astype(np.float32)


    train_label = train_label.astype(np.int64)
    eval_label = eval_label.astype(np.int64)


    print ("TOTAL SIZE: %d " % SIZE)
    print ("TRAIN SIZE: %d " % TRAIN_SIZE)


    feed_eval_data = tf.placeholder(dtype=tf.float32, shape=[None, IMAGE_SIZE, IMAGE_SIZE, NUM_CHANNEL],
                                    name="feed_eval_data")
    feed_eval_label = tf.placeholder(dtype=tf.int64, shape=[None, LABEL], name="feed_eval_label")


    feed_train_data = tf.placeholder(dtype=tf.float32, shape=[None, IMAGE_SIZE, IMAGE_SIZE, NUM_CHANNEL],
                                     name="feed_train_data")


    feed_train_label = tf.placeholder(dtype=tf.int64, shape=[None, LABEL], name="feed_train_label")


    convolution_weights_1 = tf.Variable(initial_value=tf.truncated_normal(shape=[11, 11, NUM_CHANNEL, 96], seed=SEED,
                                                                          stddev=0.01, dtype=tf.float32), name="conv1")


    convolution_biases_1 = tf.Variable(initial_value=tf.zeros(shape=[96], dtype=tf.float32), name="conv1_bias")


    convolution_weights2 = tf.Variable(initial_value=tf.truncated_normal(shape=[5, 5, 96, 256], seed=SEED,
                                                                         stddev=0.01, dtype=tf.float32), name="conv2")


    convolution_biases2 = tf.Variable(initial_value=tf.zeros(shape=[256], dtype=tf.float32), name="conv2_bias")


    convolution_weights3 = tf.Variable(initial_value=tf.truncated_normal(shape=[3, 3, 256, 384], seed=SEED,
                                                                         stddev=0.01, dtype=tf.float32), name="conv3")


    convolution_biases3 = tf.Variable(initial_value=tf.zeros(shape=[384], dtype=tf.float32), name="conv3_bias")


    convolution_weights4 = tf.Variable(initial_value=tf.truncated_normal(shape=[3, 3, 384, 384], seed=SEED,
                                                                         stddev=0.01, dtype=tf.float32), name="conv4")


    convolution_biases4 = tf.Variable(initial_value=tf.zeros(shape=[384], dtype=tf.float32), name="conv4_bias")


    convolution_weights5 = tf.Variable(initial_value=tf.truncated_normal(shape=[3, 3, 384, 256], seed=SEED,
                                                                         stddev=0.01, dtype=tf.float32), name="conv5")


    convolution_biases5 = tf.Variable(initial_value=tf.zeros(shape=[256], dtype=tf.float32), name="conv5_bias")


    fc1_weights = tf.Variable(
        initial_value=tf.truncated_normal(shape=[9216, 4096], stddev=0.01, seed=SEED, dtype=tf.float32), name="fc1")


    fc1_biases = tf.Variable(initial_value=tf.zeros(shape=[4096], dtype=tf.float32), name="fc1_bias")


    fc2_weights = tf.Variable(
        initial_value=tf.truncated_normal(shape=[4096, 4096], stddev=0.01, seed=SEED, dtype=tf.float32), name="fc2")


    fc2_biases = tf.Variable(initial_value=tf.zeros(shape=[4096], dtype=tf.float32), name="fc2_bias")


    fc3_weights = tf.Variable(
        initial_value=tf.truncated_normal(shape=[4096, LABEL], stddev=0.01, seed=SEED, dtype=tf.float32), name="fc3")


    # fc3_biases = tf.Variable(initial_value=tf.zeros(shape=[5], dtype=tf.float32))


    def forward(info=None, flag=False):


        info = tf.reshape(info, [-1, IMAGE_SIZE, IMAGE_SIZE, NUM_CHANNEL])


        print (info.get_shape())


        conv1 = tf.nn.conv2d(input=info,
                             filter=convolution_weights_1,
                             padding="VALID",
                             strides=[1, 4, 4, 1])


        print (conv1.get_shape())


        # conv1_bn = batch_normalization(x=conv1, depth=conv1.get_shape()[-1], phase_train=flag)


        relu1 = tf.nn.relu(tf.nn.bias_add(conv1, convolution_biases_1))


        print (relu1.get_shape())


        pool1 = tf.nn.avg_pool(value=relu1,
                               ksize=[1, 3, 3, 1],
                               strides=[1, 2, 2, 1],
                               padding="VALID")
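        # Note: the original AlexNet uses overlapping max pooling for all
        # pooling layers; this implementation substitutes average pooling for
        # pool1 (and applies LRN after pooling rather than before, as the
        # paper does).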


        print (pool1.get_shape())


        norm1 = tf.nn.local_response_normalization(pool1)
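        # tf.nn.local_response_normalization with its defaults
        # (depth_radius=5, bias=1.0, alpha=1.0, beta=0.5) normalizes each
        # activation across neighboring channels:
        #   sqr_sum[d] = sum(input[d - 5 : d + 6] ** 2)
        #   output[d]  = input[d] / (bias + alpha * sqr_sum[d]) ** beta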


        # norm1 = batch_norm(pool1, flag)


        print (norm1.get_shape())


        conv2 = tf.nn.conv2d(input=norm1,
                             strides=[1, 1, 1, 1],
                             padding="SAME",
                             filter=convolution_weights2)


        # tf.nn.batch_normalization()


        # conv2_bn = batch_normalization(x=conv2, depth=conv2.get_shape()[-1], phase_train=flag)


        print (conv2.get_shape())


        relu2 = tf.nn.relu(tf.nn.bias_add(conv2, convolution_biases2))


        print (relu2.get_shape())


        pool2 = tf.nn.max_pool(value=relu2,
                               ksize=[1, 3, 3, 1],
                               strides=[1, 2, 2, 1],
                               padding="VALID")


        print (pool2.get_shape())


        norm2 = tf.nn.local_response_normalization(pool2)


        # norm2 = batch_norm(pool2, flag)


        print (norm2.get_shape())


        conv3 = tf.nn.conv2d(input=norm2,
                             strides=[1, 1, 1, 1],
                             padding="SAME",
                             filter=convolution_weights3)


        print (conv3.get_shape())


        relu3 = tf.nn.relu(tf.nn.bias_add(conv3, convolution_biases3))


        print (relu3.get_shape())


        conv4 = tf.nn.conv2d(input=relu3,
                             strides=[1, 1, 1, 1],
                             padding="SAME",
                             filter=convolution_weights4)


        print (conv4.get_shape())


        relu4 = tf.nn.relu(tf.nn.bias_add(conv4, convolution_biases4))


        print (relu4.get_shape())


        conv5 = tf.nn.conv2d(input=relu4,
                             strides=[1, 1, 1, 1],
                             padding="SAME",
                             filter=convolution_weights5)


        print (conv5.get_shape())


        relu5 = tf.nn.relu(tf.nn.bias_add(conv5, convolution_biases5))


        print (relu5.get_shape())


        pool5 = tf.nn.max_pool(value=relu5,
                               ksize=[1, 3, 3, 1],
                               strides=[1, 2, 2, 1],
                               padding="VALID")


        fc = tf.reshape(pool5, [-1, fc1_weights.get_shape().as_list()[0]])


        # fc = batch_normalization(fc, depth=fc.get_shape()[-1], phase_train=flag)


        hidden_1 = tf.matmul(fc, fc1_weights) + fc1_biases


        hidden_1_relu = tf.nn.relu(hidden_1)


        # hidden_1_relu_bn = batch_norm(hidden_1_relu, flag)


        if flag:
            hidden_1_relu = tf.nn.dropout(hidden_1_relu, keep_prob=DROP_OUT)
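        # tf.nn.dropout keeps each unit with probability keep_prob and scales
        # kept activations by 1 / keep_prob, so no extra rescaling is needed
        # at evaluation time (when flag is False and dropout is skipped).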


        hidden_2 = tf.matmul(a=hidden_1_relu, b=fc2_weights) + fc2_biases


        hidden_2_relu = tf.nn.relu(hidden_2)


        hidden_2_relu_bn = batch_norm(hidden_2_relu, flag)


        if flag:
            hidden_2_relu_bn = tf.nn.dropout(hidden_2_relu_bn, keep_prob=DROP_OUT)


        hidden_3 = tf.matmul(hidden_2_relu_bn, fc3_weights)


        network = hidden_3


        return network
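    # Shape trace for forward() with IMAGE_SIZE = 227 (standard AlexNet):
    #   conv1, 11x11 stride 4, VALID: (227 - 11) / 4 + 1 = 55 -> 55x55x96
    #   pool1, 3x3 stride 2, VALID:   (55 - 3) / 2 + 1 = 27   -> 27x27x96
    #   conv2, 5x5 SAME + pool2:      (27 - 3) / 2 + 1 = 13   -> 13x13x256
    #   conv3/conv4/conv5, 3x3 SAME:  13x13x384, 13x13x384, 13x13x256
    #   pool5, 3x3 stride 2, VALID:   (13 - 3) / 2 + 1 = 6    -> 6x6x256
    # Flattened size: 6 * 6 * 256 = 9216, matching fc1_weights' first dim.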


    logits = forward(feed_train_data, True)


    loss = tf.reduce_mean(tf.nn.softmax_cross_entropy_with_logits(logits=logits, labels=feed_train_label))


    regularizers = (tf.nn.l2_loss(fc1_weights) + tf.nn.l2_loss(fc1_biases) +
                    tf.nn.l2_loss(fc2_weights) + tf.nn.l2_loss(fc2_biases) +
                    tf.nn.l2_loss(fc3_weights))


    loss += REGULAR * regularizers
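    # tf.nn.l2_loss(t) returns sum(t ** 2) / 2, so the line above adds
    # (REGULAR / 2) * the sum of squared fc weights and biases to the loss,
    # i.e. standard L2 weight decay on the fully connected layers only.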


    train_predict = tf.nn.softmax(logits)


    eval_logits = forward(feed_eval_data, False)


    eval_loss = tf.reduce_mean(tf.nn.softmax_cross_entropy_with_logits(logits=eval_logits, labels=feed_eval_label))


    eval_predict = tf.nn.softmax(eval_logits)


    TENSOR_GLOBAL_STEP = tf.Variable(0, dtype=tf.int64)
    learning_rate = tf.train.exponential_decay(
        LEARNING_RATE,  # Base learning rate.
        TENSOR_GLOBAL_STEP,  # Current index into the dataset.
        DECAY_STEPS,  # Decay step.
        DECAY_RATE,  # Decay rate.
        staircase=True)
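    # With staircase=True the schedule above is equivalent to
    #   learning_rate = LEARNING_RATE * DECAY_RATE ** (global_step // DECAY_STEPS)
    # A minimal pure-Python sketch of the same schedule:
    #   def decayed_lr(step):
    #       return LEARNING_RATE * DECAY_RATE ** (step // DECAY_STEPS)
    # e.g. decayed_lr(0) == 0.001 and decayed_lr(1000) == 0.001 * 0.9995 ** 10.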


    # optimizer = tf.train.GradientDescentOptimizer(learning_rate=learning_rate).minimize(loss=loss)
    # optimizer = tf.train.RMSPropOptimizer(learning_rate=learning_rate, decay=DECAY_RATE).minimize(loss)


    optimizer = tf.train.MomentumOptimizer(learning_rate=learning_rate,
                                           momentum=MOMENTUM).minimize(loss=loss,
                                                                       global_step=TENSOR_GLOBAL_STEP)
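    # tf.train.MomentumOptimizer (use_nesterov=False) applies, per variable:
    #   accumulation = MOMENTUM * accumulation + gradient
    #   variable    -= learning_rate * accumulation
    # MOMENTUM = 0.99 is unusually high; the original AlexNet paper uses 0.9.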


    # optimizer = tf.train.AdamOptimizer(learning_rate=learning_rate).minimize(loss)
    # optimizer = tf.train.AdagradOptimizer(learning_rate=learning_rate).minimize(loss=eval_loss)
    # optimizer = tf.train.FtrlOptimizer(learning_rate=learning_rate).minimize(loss)
    # optimizer = tf.train.ProximalGradientDescentOptimizer(learning_rate).minimize(loss)


    with tf.Session() as sess:
        print ("INIT.")
        print (SEED)


        init = tf.global_variables_initializer()


        sess.run(init)


        tf.summary.scalar(name="learning", tensor=learning_rate)
        tf.summary.histogram(name="learning", values=learning_rate)


        tf.summary.scalar(name="regularizers", tensor=regularizers * REGULAR)
        tf.summary.histogram(name="regularizers", values=regularizers * REGULAR)


        tf.summary.scalar(name="loss", tensor=loss - REGULAR * regularizers)
        tf.summary.histogram(name="loss", values=loss - REGULAR * regularizers)


        tf.summary.scalar(name="eval_loss", tensor=eval_loss)
        tf.summary.histogram(name="eval_loss", values=eval_loss)


        merge_op = tf.summary.merge_all()


        train_writer = tf.summary.FileWriter(logdir="./log/train/", graph=sess.graph)
        valid_writer = tf.summary.FileWriter(logdir="./log/valid")
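        # NOTE: merge_op and the two writers are created, but the training
        # loop below never runs merge_op or calls add_summary(), so no
        # TensorBoard events are actually written to ./log/.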


        limit = TRAIN_SIZE // BATCH_SIZE + 1
        limit_eval = EVAL_SIZE // BATCH_SIZE + 1


        acc_loss = 1000


        saver = tf.train.Saver()


        while acc_loss > 0.2:
            for step in range(GLOBAL_STEP):


                if step % REPORT_CONTROL == 0:


                    ave_eval_loss = 0.0
                    ave_eval_acc = 0.0


                    print ("STEP %d " % step)
                    print ("------------------------------------>")
                    for batch in range(limit_eval):
                        print ("EVAL BATCH %d " % batch)
                        if batch == limit_eval - 1:
                            start = batch * BATCH_SIZE
                            end = EVAL_SIZE
                            if end - start == 0:
                                continue
                        else:
                            start = batch * BATCH_SIZE
                            end = start + BATCH_SIZE


                        input = eval_data[start:end]
                        input_label = eval_label[start:end]


                        feed_dict = {feed_eval_data: input,
                                     feed_eval_label: input_label}


                        _eval_predict, _eval_loss, _regularizers = sess.run(
                            [eval_predict, eval_loss, regularizers],
                            feed_dict=feed_dict)


                        media = np.argmax(_eval_predict, 1)
                        array = np.argmax(input_label, 1)


                        acc_sum = np.sum(media == array)
                        accurate = (acc_sum / float(end - start))


                        acc_loss = _eval_loss
                        _regularizers *= REGULAR


                        print (media)
                        print (array)


                        ave_eval_loss += _eval_loss
                        ave_eval_acc += accurate


                        print ("accuracy %f " % accurate)
                        print ("loss %s " % str(_eval_loss))
                        print ("regularizers %f " % _regularizers)
                        print ("------------------------------------>")


                    if end == EVAL_SIZE:


                        # Average over the number of non-empty eval batches;
                        # the loop above skips an empty final batch, so the
                        # original division by `batch` was off by one whenever
                        # EVAL_SIZE is not a multiple of BATCH_SIZE.
                        num_eval_batches = (EVAL_SIZE + BATCH_SIZE - 1) // BATCH_SIZE
                        ave_eval_loss = ave_eval_loss / num_eval_batches
                        ave_eval_acc = ave_eval_acc / num_eval_batches


                        print ("average eval acc %f " % ave_eval_acc)
                        print ("average eval loss %f " % ave_eval_loss)


                        if ave_eval_loss > 0:
                            if ave_eval_acc >= 0.95 or ave_eval_loss <= 0.15:
                                model = "alexnet-eval-acc-" + str(ave_eval_acc) + "-loss-" + str(
                                    ave_eval_loss) + ".model"
                                path = saver.save(sess, model)
                                print ("saved model to %s " % path)


                ave_train_loss = 0.0
                ave_train_acc = 0.0


                for batch in range(limit):


                    if batch == limit - 1:
                        start = batch * BATCH_SIZE
                        end = TRAIN_SIZE
                        if end - start == 0:
                            continue
                    else:
                        start = batch * BATCH_SIZE
                        end = start + BATCH_SIZE


                    input = train_data[start:end]
                    input_label = train_label[start:end]


                    feed_dict = {feed_train_data: input,
                                 feed_train_label: input_label}


                    _loss, _optimizer, _train_predict, _regular, _learn_rate = sess.run(
                        [loss, optimizer, train_predict, regularizers, learning_rate],
                        feed_dict=feed_dict)


                    _adjust_regular = _regular * np.float16(REGULAR)


                    media = np.argmax(_train_predict, 1)
                    array = np.argmax(input_label, 1)


                    temp = np.sum(media == array)


                    if step % REPORT_CONTROL == 0:
                        accurate = (temp / float(end - start))


                        print ("*************************>")
                        print ("batch %d " % batch)
                        print ("loss %f" % _loss)
                        print ("regular %f" % _adjust_regular)
                        print ("accuracy %f " % accurate)
                        print ("learn_rate %f " % _learn_rate)
                        print ("*************************<")


                        ave_train_loss += _loss - float(_adjust_regular)
                        ave_train_acc += accurate


                        if end == TRAIN_SIZE:


                            ave_train_loss = ave_train_loss / (batch + 1)
                            ave_train_acc = ave_train_acc / (batch + 1)


                            print ("average train acc : %f " % ave_train_acc)
                            print ("average train loss : %f " % ave_train_loss)


                            if ave_train_loss > 0:
                                if ave_train_acc >= 0.95 or ave_train_loss <= 0.15:
                                    model = "alexnet-train-acc-" + str(ave_train_acc) + "-loss-" + str(
                                        ave_train_loss) + ".ckpt"
                                    path = saver.save(sess, model)
                                    print ("saved model to %s " % path)
        print ("train over.")
    return


if __name__ == '__main__':
    tf.app.run()
