
Updates

Merged Tiago de Freitas Pereira requested to merge updates into master
2 files  +43  −54

Files

@@ -23,7 +23,7 @@ step2_path = os.path.join(directory, "step2")
 slim = tf.contrib.slim

-def base_network(train_data_shuffler, reuse=False, get_embedding=False):
+def base_network(train_data_shuffler, reuse=False, get_embedding=False, trainable=True):
     if isinstance(train_data_shuffler, tf.Tensor):
         inputs = train_data_shuffler
@@ -33,11 +33,11 @@ def base_network(train_data_shuffler, reuse=False, get_embedding=False):
     # Creating a random network
     initializer = tf.contrib.layers.xavier_initializer(seed=seed)
     graph = slim.conv2d(inputs, 10, [3, 3], activation_fn=tf.nn.relu, stride=1, scope='conv1',
-                        weights_initializer=initializer, reuse=reuse)
+                        weights_initializer=initializer, reuse=reuse, trainable=trainable)
     graph = slim.max_pool2d(graph, [4, 4], scope='pool1')
     graph = slim.flatten(graph, scope='flatten1')
     graph = slim.fully_connected(graph, 30, activation_fn=None, scope='fc1',
-                                 weights_initializer=initializer, reuse=reuse)
+                                 weights_initializer=initializer, reuse=reuse, trainable=trainable)

     if get_embedding:
         graph = graph
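For readers unfamiliar with the slim API: the new `trainable` flag controls whether a layer's weights are added to the TRAINABLE_VARIABLES collection, which is what optimizers minimize over by default. A minimal sketch (TF 1.x, not part of this change) illustrating the effect:

# Sketch: `trainable=False` keeps a slim layer's weights out of
# tf.trainable_variables(), so a default-built optimizer never updates them.
import tensorflow as tf

slim = tf.contrib.slim

inputs = tf.placeholder(tf.float32, shape=(None, 28, 28, 1))
frozen = slim.conv2d(inputs, 10, [3, 3], scope='conv1', trainable=False)
head = slim.fully_connected(slim.flatten(frozen), 30, scope='fc1')  # trainable

trainable_names = [v.name for v in tf.trainable_variables()]
assert not any('conv1' in n for n in trainable_names)  # conv1 is frozen
assert any('fc1' in n for n in trainable_names)        # fc1 still trains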
@@ -95,17 +95,11 @@ def test_trainable_variables():
     writer.close()

-    # 1 - Create
-    # 2 - Initialize
-    # 3 - Minimize with certain variables
-    # 4 - Load the last checkpoint
-    ######## BASE NETWORK #########
+    ######## 1 - BASE NETWORK #########
     tfrecords_filename = "mnist_train.tfrecords"
-    #create_tf_record(tfrecords_filename, train_data, train_labels)
+    create_tf_record(tfrecords_filename, train_data, train_labels)
     filename_queue = tf.train.string_input_producer([tfrecords_filename], num_epochs=1, name="input")

     # Doing the first training
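The previously commented-out create_tf_record call is re-enabled here, so the MNIST fixture is regenerated on each run. Its implementation lives in the test module; for orientation only, a hypothetical helper of the same shape might look like this (the function name, feature keys, and argument layout are assumptions, TF 1.x API):

# Hypothetical sketch of a TFRecord-writing helper like create_tf_record.
import tensorflow as tf

def create_tf_record(tfrecords_filename, data, labels):
    writer = tf.python_io.TFRecordWriter(tfrecords_filename)
    for img, label in zip(data, labels):
        # One tf.train.Example per sample: raw image bytes plus an int label.
        example = tf.train.Example(features=tf.train.Features(feature={
            'data': tf.train.Feature(
                bytes_list=tf.train.BytesList(value=[img.tostring()])),
            'label': tf.train.Feature(
                int64_list=tf.train.Int64List(value=[int(label)])),
        }))
        writer.write(example.SerializeToString())
    writer.close()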
@@ -128,21 +122,22 @@ def test_trainable_variables():
                                         )
     trainer.train()

-    conv1_trained = tf.get_collection(tf.GraphKeys.GLOBAL_VARIABLES, scope='conv1')[0].eval(session=trainer.session)[0]
+    # Saving the conv1 kernel after the first training
+    conv1_after_first_train = tf.get_collection(tf.GraphKeys.GLOBAL_VARIABLES, scope='conv1')[0].eval(session=trainer.session)[0]

     del trainer
     del filename_queue
     del train_data_shuffler
     tf.reset_default_graph()

-    ##### Creating an amendment network
+    ######## 2 - AMENDING NETWORK #########
     filename_queue = tf.train.string_input_producer([tfrecords_filename], num_epochs=1, name="input")
     train_data_shuffler = TFRecord(filename_queue=filename_queue,
                                    batch_size=batch_size)
-    graph = base_network(train_data_shuffler, get_embedding=True)
+    # Here I'm creating the base network as non-trainable
+    graph = base_network(train_data_shuffler, get_embedding=True, trainable=False)
     graph = amendment_network(graph)
     loss = MeanSoftMaxLoss(add_regularization_losses=False)
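The snapshot-and-compare pattern introduced above, reading the conv1 kernel before and after training to verify it stayed frozen, generalizes beyond this test. A small sketch assuming a live session `sess` and a 'conv1' scope in the current graph:

# Sketch: snapshot a variable, train, snapshot again, compare.
import numpy
import tensorflow as tf

def conv1_kernel(sess):
    # First GLOBAL_VARIABLES entry under the 'conv1' scope is the kernel.
    var = tf.get_collection(tf.GraphKeys.GLOBAL_VARIABLES, scope='conv1')[0]
    return var.eval(session=sess)

# before = conv1_kernel(sess)
# ... run some training ...
# after = conv1_kernel(sess)
# numpy.allclose(before, after)  # True iff conv1 was frozen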
@@ -151,7 +146,6 @@ def test_trainable_variables():
                       analizer=None,
                       temp_dir=step2_path)
-
     learning_rate = constant(0.01, name="regular_lr")
     trainer.create_network_from_scratch(graph=graph,
                                         loss=loss,
@@ -159,45 +153,18 @@ def test_trainable_variables():
                                         optimizer=tf.train.GradientDescentOptimizer(learning_rate),
                                         )

-    conv1_before_load = tf.get_collection(tf.GraphKeys.GLOBAL_VARIABLES, scope='conv1')[0].eval(session=trainer.session)[0]
-    var_list = tf.get_collection(tf.GraphKeys.GLOBAL_VARIABLES, scope='conv1') + \
-               tf.get_collection(tf.GraphKeys.GLOBAL_VARIABLES, scope='fc1')
-    saver = tf.train.Saver(var_list)
-    saver.restore(trainer.session, os.path.join(step1_path, "model.ckp"))
+    # Loading two layers from the "old" model
+    external_model = os.path.join(step1_path, "model.ckp")
+    trainer.load_variables_from_external_model(external_model, var_list=['conv1', 'fc1'])

     conv1_restored = tf.get_collection(tf.GraphKeys.GLOBAL_VARIABLES, scope='conv1')[0].eval(session=trainer.session)[0]

+    assert numpy.allclose(conv1_after_first_train, conv1_restored)
+
+    # Second round of training
     trainer.train()

-    conv1_after_train = tf.get_collection(tf.GraphKeys.GLOBAL_VARIABLES, scope='conv1')[0].eval(session=trainer.session)[0]
-    print(conv1_trained - conv1_before_load)
-    print(conv1_trained - conv1_restored)
-    print(conv1_trained - conv1_after_train)
-    import ipdb; ipdb.set_trace();
-    x = 0
-    #var_list = tf.get_collection(tf.GraphKeys.VARIABLES, scope='fc1') + tf.get_collection(tf.GraphKeys.VARIABLES, scope='logits')
-    #optimizer = tf.train.GradientDescentOptimizer(0.01).minimize(loss, global_step=global_step, var_list=var_list)
-    #print("Go ...")
-    """
-    last_iteration = numpy.sum(tf.trainable_variables()[0].eval(session=session)[0])
-    for i in range(10):
-        _, l = session.run([optimizer, loss])
-        current_iteration = numpy.sum(tf.trainable_variables()[0].eval(session=session)[0])
-        print numpy.abs(current_iteration - last_iteration)
-        current_iteration = last_iteration
-        print l
-    thread_pool.request_stop()
-    """
-    #x = 0
+    conv1_after_second_train = tf.get_collection(tf.GraphKeys.GLOBAL_VARIABLES, scope='conv1')[0].eval(session=trainer.session)[0]
+
+    # Since conv1 was set as NON TRAINABLE, both have to match
+    assert numpy.allclose(conv1_after_first_train, conv1_after_second_train)
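The removed block did the restore by hand with tf.train.Saver; this MR delegates that to trainer.load_variables_from_external_model. Assuming that method restores only the variables under the named scopes from the checkpoint (a sketch of that assumption in plain TensorFlow, not the trainer's actual code):

# Sketch: restore only the variables under selected scopes from a checkpoint.
import tensorflow as tf

def load_scopes_from_checkpoint(sess, checkpoint_path, scopes):
    var_list = []
    for scope in scopes:
        var_list += tf.get_collection(tf.GraphKeys.GLOBAL_VARIABLES, scope=scope)
    # Saver built over a restricted var_list touches nothing else in the graph.
    saver = tf.train.Saver(var_list=var_list)
    saver.restore(sess, checkpoint_path)

# e.g. load_scopes_from_checkpoint(trainer.session, external_model, ['conv1', 'fc1'])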