keras tensorboard的使用, 设置GPU使用的内存, 强制只使用cpu

# Force TensorFlow/Keras to run on the CPU only by hiding every CUDA device.
# These variables must be set before TensorFlow is imported/initialized.
import os

os.environ["CUDA_DEVICE_ORDER"] = "PCI_BUS_ID"   # see issue #152
os.environ["CUDA_VISIBLE_DEVICES"] = ""  # empty string -> no GPU is visible


直接上例子:   (注意: 调用tensorboard后,训练速度似乎被拖慢了不少。其实也可以记录model.fit返回的history对象,自己写几行代码来显示训练曲线,参见: 点击打开链接)

# coding: utf-8
import numpy as np
from keras.datasets import mnist
from keras.models import Sequential
from keras.layers.core import Dense, Dropout, Activation
from keras.optimizers import SGD
from keras.utils import np_utils
import keras.callbacks
import os
import tensorflow as tf
import keras.backend.tensorflow_backend as KTF


######################################
# TODO: set the gpu memory using fraction
######################################
def get_session(gpu_fraction=0.3):
    """Create a TensorFlow session limited to a fraction of the GPU memory.

    For example, with 6GB of GPU memory, ``gpu_fraction=0.3`` allocates
    roughly 2GB to this process.

    Args:
        gpu_fraction: value passed as ``per_process_gpu_memory_fraction``.

    Returns:
        A ``tf.Session``. If the ``OMP_NUM_THREADS`` environment variable is
        set, its value is also used as ``intra_op_parallelism_threads``.
    """
    num_threads = os.environ.get('OMP_NUM_THREADS')
    gpu_options = tf.GPUOptions(per_process_gpu_memory_fraction=gpu_fraction)
    if num_threads:
        # Environment variables are strings, but the config field is an
        # integer, so convert explicitly.
        config = tf.ConfigProto(
            gpu_options=gpu_options,
            intra_op_parallelism_threads=int(num_threads))
    else:
        config = tf.ConfigProto(gpu_options=gpu_options)
    return tf.Session(config=config)


KTF.set_session(get_session(0.6))  # using 60% of total GPU Memory
os.system("nvidia-smi")  # Execute the command (a string) in a subshell

# Pause so the nvidia-smi output can be inspected before training starts.
# `raw_input` only exists on Python 2; fall back to `input` on Python 3.
try:
    _prompt = raw_input
except NameError:
    _prompt = input
_prompt("Press Enter to continue...")

######################
batch_size = 128
nb_classes = 10
nb_epoch = 10
nb_data = 28 * 28
log_filepath = '/tmp/keras_log'

# load data
(X_train, y_train), (X_test, y_test) = mnist.load_data()

# reshape: flatten every image into a single row vector
print(X_train.shape)
X_train = X_train.reshape(X_train.shape[0], X_train.shape[1] * X_train.shape[2])
X_test = X_test.reshape(X_test.shape[0], X_test.shape[1] * X_test.shape[2])

# rescale pixel values to [0, 1]
X_train = X_train.astype(np.float32)
X_train /= 255
X_test = X_test.astype(np.float32)
X_test /= 255

# convert class vectors to binary class matrices (one hot vectors)
Y_train = np_utils.to_categorical(y_train, nb_classes)
Y_test = np_utils.to_categorical(y_test, nb_classes)

# Every layer gets an explicit name so it is easy to find in TensorBoard.
model = Sequential()
model.add(Dense(512, input_shape=(nb_data,), init='normal', name='dense1'))  # a sample is a row 28*28
model.add(Activation('relu', name='relu1'))
model.add(Dropout(0.2, name='dropout1'))
model.add(Dense(512, init='normal', name='dense2'))
model.add(Activation('relu', name='relu2'))
model.add(Dropout(0.2, name='dropout2'))
model.add(Dense(10, init='normal', name='dense3'))
model.add(Activation('softmax', name='softmax1'))
model.summary()

model.compile(loss='categorical_crossentropy', optimizer=SGD(lr=0.001), metrics=['accuracy'])

# Set where the logs are stored, show the network weights as images in
# TensorBoard, and compute the histograms of the weights and of every layer's
# output once per epoch.
tb_cb = keras.callbacks.TensorBoard(log_dir=log_filepath, write_images=1, histogram_freq=1)
cbks = [tb_cb]

history = model.fit(X_train, Y_train, batch_size=batch_size, nb_epoch=nb_epoch,
                    verbose=1, callbacks=cbks, validation_data=(X_test, Y_test))

score = model.evaluate(X_test, Y_test, verbose=0)
print('Test score:', score[0])
print('Test accuracy;', score[1])
其实可以自己给每一层layer命名一个name, 也可以由keras根据自己的命名规则自动取名,自动命名的规则在Layer类中,代码如下:
# Excerpt from the Keras Layer constructor: use the caller-supplied name, or
# build one from the snake_case class name plus a per-prefix unique id.
name = kwargs.get('name')
if not name:
    prefix = self.__class__.__name__
    name = _to_snake_case(prefix) + '_' + str(K.get_uid(prefix))
self.name = name
而在keras的callbacks模块中,从TensorBoard类的实现源码可以看出,keras默认将模型所有层的所有weights、bias以及每一层输出的distribution、histogram等传送到tensorboard,方便在浏览器中观察网络的运行情况。实现源码如下:

def set_model(self, model):
    """Attach ``model`` to the callback and register its TensorBoard summaries.

    Stores the model and the current backend session on the callback. When
    ``histogram_freq`` is truthy and no merged summary exists yet, a histogram
    summary is added for every weight of every layer (plus an image summary
    when ``write_images`` is set) and for every layer output. Finally all
    summaries are merged into ``self.merged``.

    Args:
        model: the model whose layers are inspected.
    """
    self.model = model
    self.sess = K.get_session()
    if self.histogram_freq and self.merged is None:
        for layer in self.model.layers:

            for weight in layer.weights:
                tf.summary.histogram(weight.name, weight)
                if self.write_images:
                    w_img = tf.squeeze(weight)
                    shape = w_img.get_shape()
                    # Lay out 2-D weights with the longer axis horizontal.
                    if len(shape) > 1 and shape[0] > shape[1]:
                        w_img = tf.transpose(w_img)
                    # Turn a 1-D weight (e.g. a bias) into a single row.
                    if len(shape) == 1:
                        w_img = tf.expand_dims(w_img, 0)
                    # Add a leading and a trailing axis for the image summary.
                    w_img = tf.expand_dims(tf.expand_dims(w_img, 0), -1)
                    tf.summary.image(weight.name, w_img)

            if hasattr(layer, 'output'):
                tf.summary.histogram('{}_out'.format(layer.name),
                                     layer.output)
    self.merged = tf.summary.merge_all()


embeddings_freq: frequency (in epochs) at which selected embedding layers will be saved.
embeddings_layer_names: a list of names of layers to keep an eye on. If None or an empty list, all the embedding layers will be watched.


tensorboard --logdir=/tmp/keras_log

在浏览器中打开terminal里显示的地址,进入tensorboard后可以随意浏览graph, distribution, histogram, 以及scalar列表中的loss, acc等等。

以下摘录自: 这里

TensorBoard will automatically include all runs logged within the sub-directories of the specified log_dir. For example, if you logged another run using:

callback_tensorboard(log_dir = "logs/run_b")

Then the TensorBoard visualization would look like this:

You can use the unique_log_dir function if you want to record every training run in its own directory:

callback_tensorboard(log_dir = unique_log_dir())

Once again, note that it’s not required to record every training run in its own directory. Using the default “logs” directory will work just fine; you’ll just only be able to visualize the most recent run using TensorBoard.


    # Compile with MAE and accuracy as metrics so that both are visualized.
    model.compile(
        loss='mean_squared_error',
        optimizer='sgd',
        metrics=['mae', 'acc'],  # visualize mae and acc
    )

