Fix:minor

abilng · abilng · commit 7d597b522914 · 2014-08-28T13:39:05.000+05:30
diff --git a/config/CNN/conv_spec.json b/config/CNN/conv_spec.json
@@ -1,26 +1,35 @@
 {
-
-   "comment" : "layers :: convolution layer configuration",
-   "layers": [
-		{
-			"convmat_dim" : [5,5],
-			"num_filters" : 100,
-			"poolsize" :  [2,2],
-			"flatten" : false,
-			"update" : true
-		},
-		{
-			"convmat_dim" : [4,4],
-			"num_filters" : 200,
-			"poolsize" :  [2,2],
-			"flatten" : true,
-			"update" : true
-		}
+    "conv_spec":{
+	"comment" : "layers :: convolution layer configuration",
+	"layers": [
+	    {
+		"convmat_dim" : [5,5],
+		"num_filters" : 100,
+		"poolsize" :  [2,2],
+		"flatten" : false,
+		"update" : true
+	    },
+	    {
+		"convmat_dim" : [4,4],
+		"num_filters" : 200,
+		"poolsize" :  [2,2],
+		"flatten" : true,
+		"update" : true
+	    }
 	],
 
-   "comment" : "activation :: sigmoid or tanh",
-   "activation" : "tanh",
+	"comment" : "activation :: sigmoid or tanh",
+	"activation" : "tanh",
+
+	"comment" : "use_fast :: To use pylearn2 library for faster computation or not",
+	"use_fast" : false
+    },
+    "mlp_spec":{
+
+	"comment" : "layers :: hidden layer configuration",
+	"layers": [500,200],
 
-  "comment" : "use_fast :: To use pylearn2 library for faster computation or not",
-  "use_fast" : false
+	"comment" : "activation :: sigmoid or tanh",
+	"activation" : "tanh"
+    }
 }
diff --git a/config/CNN/model_conf.json b/config/CNN/model_conf.json
@@ -8,18 +8,18 @@
 	"comment" : "valid_data (Mandatory) specify the path of the validation data relative to the working directory",
 	"data_spec" : "data_spec.json",
 	
-	"comment" : "hidden_nnet_spec :: (Mandatory) specify the path of hidden network configuration specification relative to working directory",
-	"hidden_nnet_spec" : "mlp_spec.json",
-	
-	"comment" : "conv_nnet_spec :: (Mandatory) specify the path of convolution network configuration specification relative to working directory",
-	"conv_nnet_spec" : "conv_spec.json",
+	"comment" : "nnet_spec :: (Mandatory) specify the path of network configuration specification relative to working directory",
+	"nnet_spec" : "conv_spec.json",
 
 	"comment" : "hidden_output_file :: (Mandatory) specify the path of convolution network output file relative to working directory",
 	"hidden_output_file" : "hidden_out.model",
 	
 	"comment" : "conv_output_file :: (Mandatory) specify the path of convolution network output file relative to working directory",
 	"conv_output_file" : "conv_out.model",
 	
+	"comment" : "output_file :: (Mandatory) specify the path of convolution network output file relative to working directory",
+	"output_file" : "conv_out.model",
+	
 	"comment" : "input_shape :: (Mandatory) specify the input shape of a given feature vector" ,
 	"input_shape" : [3,28,28],
 	
@@ -47,5 +47,13 @@
 			"min_epoch_decay_start" : 15,
 			"init_error" :100
 		},
+
+	"processes":{
+		"pretraining":false,
+		"finetuning":true,
+		"testing":true,
+		"export_data":false
+	},
+	
 	"export_path" : "data/export"
 }
diff --git a/config/CNN1/model_conf.json b/config/CNN1/model_conf.json
@@ -8,11 +8,8 @@
 	"comment" : "valid_data (Mandatory) specify the path of the validation data relative to the working directory",
 	"data_spec" : "data_spec.json",
 	
-	"comment" : "hidden_nnet_spec :: (Mandatory) specify the path of hidden network configuration specification relative to working directory",
-	"hidden_nnet_spec" : "mlp_spec.json",
-	
 	"comment" : "conv_nnet_spec :: (Mandatory) specify the path of convolution network configuration specification relative to working directory",
-	"conv_nnet_spec" : "conv_spec.json",
+	"nnet_spec" : "conv_spec.json",
 
 	"comment" : "hidden_output_file :: (Mandatory) specify the path of convolution network output file relative to working directory",
 	"hidden_output_file" : "hidden_out.model",
@@ -47,5 +44,13 @@
 			"min_epoch_decay_start" : 15,
 			"init_error" :100
 	},
+
+	"processes":{
+		"pretraining":false,
+		"finetuning":true,
+		"testing":true,
+		"export_data":false
+	},
+
 	"export_path" : "data/export"
 }
diff --git a/config/DBN/model_conf.json b/config/DBN/model_conf.json
@@ -9,7 +9,7 @@
 	"data_spec" : "data_spec.json",
 	
 	"comment" : "rbm_nnet_spec:: (Mandatory) specify the path of RBM network configuration specification relative to working directory",
-	"rbm_nnet_spec" : "rbm_spec.json",
+	"nnet_spec" : "rbm_spec.json",
 
 	"comment" : "output_file :: (Mandatory) specify the path of RBM network output file relative to working directory",
 	"output_file" : "rbm_out.model",
@@ -44,7 +44,13 @@
 	},
 
 	"comment" : "finetune_momentum ::  Specify the momentum factor while finetuning",
-	"finetune_momentum": 0.5
-
+	"finetune_momentum": 0.5,
+
+	"processes":{
+		"pretraining":false,
+		"finetuning":true,
+		"testing":true,
+		"export_data":false
+	}
 
 }
diff --git a/config/DBN/rbm_spec.json b/config/DBN/rbm_spec.json
@@ -10,7 +10,7 @@
   "n_outs":200,
 
   "comment" : "activation :: sigmoid or tanh",
-  "activation" : "tanh",
+  "activation" : "sigmoid",
 
   "comment" : "pretrained_layers:number of layers to be pre-trained",
   "pretrained_layers" : 5,
diff --git a/config/SDA/model_conf.json b/config/SDA/model_conf.json
@@ -9,7 +9,7 @@
 	"data_spec" : "data_spec.json",
 	
 	"comment" : "sda_nnet_spec:: (Mandatory) specify the path of SDA network configuration specification relative to working directory",
-	"sda_nnet_spec" : "sda_spec.json",
+	"nnet_spec" : "sda_spec.json",
 
 	"comment" : "output_file :: (Mandatory) specify the path of SDA network output file relative to working directory",
 	"output_file" : "sda_out.model",
@@ -41,6 +41,12 @@
 	},
 
 	"comment" : "finetune_momentum ::  Specify the momentum factor while finetuning",
-	"finetune_momentum": 0.5
-
+	"finetune_momentum": 0.5,
+
+	"processes":{
+		"pretraining":true,
+		"finetuning":true,
+		"testing":true,
+		"export_data":false
+	}
 }
diff --git a/layers/rbm.py b/layers/rbm.py
@@ -4,16 +4,17 @@
 from theano.sandbox.rng_mrg import MRG_RandomStreams as RandomStreams
 from collections import OrderedDict
 
+
 class RBM(object):
     """Bernoulli-bernoulli restricted Boltzmann machine (RBM)  """
     
     def __init__(self, input=None, n_visible=1024, n_hidden=1024,
                  W = None, hbias = None, vbias = None, numpy_rng = None,
-                 theano_rng = None,activation=T.nnet.sigmoid):
+                 theano_rng = None):
                
         self.n_visible = n_visible
         self.n_hidden  = n_hidden
-        self.activation = activation
+
 
         if numpy_rng is None:
             numpy_rng = numpy.random.RandomState(1234)
@@ -44,9 +45,12 @@ def __init__(self, input=None, n_visible=1024, n_hidden=1024,
         if not input:
             self.input = T.matrix('input')
         
-        self.delta_W = theano.shared(value=numpy.zeros_like(W.get_value(borrow=True), dtype=theano.config.floatX), name='delta_W')
-        self.delta_hbias = theano.shared(value=numpy.zeros_like(hbias.get_value(borrow=True), dtype=theano.config.floatX), name='delta_hbias')
-        self.delta_vbias = theano.shared(value=numpy.zeros_like(vbias.get_value(borrow=True), dtype=theano.config.floatX), name='delta_vbias')
+        self.delta_W = theano.shared(value=numpy.zeros_like(W.get_value(borrow=True),
+            dtype=theano.config.floatX), name='delta_W')
+        self.delta_hbias = theano.shared(value=numpy.zeros_like(hbias.get_value(borrow=True),
+            dtype=theano.config.floatX), name='delta_hbias')
+        self.delta_vbias = theano.shared(value=numpy.zeros_like(vbias.get_value(borrow=True),
+            dtype=theano.config.floatX), name='delta_vbias')
         
         self.W = W
         self.hbias = hbias
@@ -67,7 +71,7 @@ def free_energy(self, v_sample):
     def propup(self, vis):
         ''' Propagate the visible activations up to the hidden units '''
         pre_sigmoid_activation = T.dot(vis, self.W) + self.hbias
-        return [pre_sigmoid_activation, self.activation(pre_sigmoid_activation)]
+        return [pre_sigmoid_activation, T.nnet.sigmoid(pre_sigmoid_activation)]
 
     def sample_h_given_v(self, v0_sample):
         ''' Generates hidden unit outputs given visible inputs '''
@@ -82,7 +86,7 @@ def sample_h_given_v(self, v0_sample):
     def propdown(self, hid):
         '''Propagates the hidden activation downwards to the visible units'''
         pre_sigmoid_activation = T.dot(hid, self.W.T) + self.vbias
-        return [pre_sigmoid_activation, self.activation(pre_sigmoid_activation)]
+        return [pre_sigmoid_activation, T.nnet.sigmoid(pre_sigmoid_activation)]
 
     def sample_v_given_h(self, h0_sample):
         ''' Generates visible units given hidden units '''
@@ -106,7 +110,8 @@ def gibbs_vhv(self, v0_sample):
         pre_sigmoid_v1, v1_mean, v1_sample = self.sample_v_given_h(h1_sample)
         return [pre_sigmoid_h1, h1_mean, h1_sample, pre_sigmoid_v1, v1_mean, v1_sample]
 
-#    def get_cost_updates(self, batch_size = 128, lr = 0.0001, momentum=0.5, weight_cost=0.00001, persistent=None, k=1):        
+#    def get_cost_updates(self, batch_size = 128, lr = 0.0001, momentum=0.5, 
+#    weight_cost=0.00001, persistent=None, k=1):        
     def get_cost_updates(self, batch_size = 128, lr = 0.0001, momentum=0.5, weight_cost=0.00001):
         """
         get the cost and the gradient corresponding to one step of CD-k (k=1)
@@ -117,9 +122,15 @@ def get_cost_updates(self, batch_size = 128, lr = 0.0001, momentum=0.5, weight_c
                 
         # gradient of parameters
         updates=OrderedDict()
-        updates[self.delta_W] = momentum * self.delta_W + lr * (1.0/batch_size) * (T.dot(self.input.T, hp_data) - T.dot(v_rec_sigm.T, hp_rec)) - lr * weight_cost * self.W
-        updates[self.delta_hbias] = momentum * self.delta_hbias + lr * (1.0/batch_size) * (T.sum(h_data, axis=0) - T.sum(hp_rec, axis=0))
-        updates[self.delta_vbias] = momentum * self.delta_vbias + lr * (1.0/batch_size) * (T.sum(self.input, axis=0) - T.sum(v_rec_sigm, axis=0))
+        updates[self.delta_W] = (
+            momentum * self.delta_W + lr * (1.0/batch_size) *(T.dot(self.input.T, hp_data) -
+             T.dot(v_rec_sigm.T, hp_rec)) - lr * weight_cost * self.W)
+        updates[self.delta_hbias] = (
+            momentum * self.delta_hbias + lr * (1.0/batch_size) *
+            (T.sum(h_data, axis=0) - T.sum(hp_rec, axis=0)))
+        updates[self.delta_vbias] = (
+            momentum * self.delta_vbias + lr * (1.0/batch_size) *
+            (T.sum(self.input, axis=0) - T.sum(v_rec_sigm, axis=0)))
         
         for param, dparam in zip(self.params, self.delta_params):
             updates[param] = param + updates[dparam]
@@ -138,14 +149,13 @@ class GBRBM(RBM):
     
     def __init__(self, input=None, n_visible=351, n_hidden=1000,
                  W = None, hbias = None, vbias = None, numpy_rng = None,
-                 theano_rng = None,activation=T.nnet.sigmoid):
+                 theano_rng = None):
         
         super(GBRBM, self).__init__(input=input, n_visible=n_visible,
                     n_hidden=n_hidden,
                     W=W, hbias=hbias,
                     vbias=vbias, numpy_rng=numpy_rng, 
-                    theano_rng=theano_rng,
-                    activation=activation)
+                    theano_rng=theano_rng)
     
     def free_energy(self, v_sample):
         ''' Compute the free energy '''
@@ -163,7 +173,8 @@ def sample_v_given_h(self, h0_sample):
 
         return [pre_sigmoid_v1, v1_mean, v1_sample]
 
-#    def get_cost_updates(self, batch_size = 128, lr = 0.0001, momentum=0.5, weight_cost=0.00001, persistent=None, k = 1):    
+#    def get_cost_updates(self, batch_size = 128, lr = 0.0001, 
+#    momentum=0.5, weight_cost=0.00001, persistent=None, k = 1):    
     def get_cost_updates(self, batch_size = 128, lr = 0.0001, momentum=0.5, weight_cost=0.00001):
         
         x, hp_data, h_data = self.sample_h_given_v(self.input)
@@ -172,9 +183,15 @@ def get_cost_updates(self, batch_size = 128, lr = 0.0001, momentum=0.5, weight_c
                 
         updates=OrderedDict()
         
-        updates[self.delta_W] = momentum * self.delta_W + lr * (1.0/batch_size) * (T.dot(self.input.T, hp_data) - T.dot(v_rec.T, hp_rec)) - lr * weight_cost * self.W
-        updates[self.delta_hbias] = momentum * self.delta_hbias + lr * (1.0/batch_size) * (T.sum(h_data, axis=0) - T.sum(hp_rec, axis=0))
-        updates[self.delta_vbias] = momentum * self.delta_vbias + lr * (1.0/batch_size) * (T.sum(self.input, axis=0) - T.sum(v_rec, axis=0))
+        updates[self.delta_W] = (
+            momentum * self.delta_W + lr * (1.0/batch_size) * (T.dot(self.input.T, hp_data) -
+            T.dot(v_rec.T, hp_rec)) - lr * weight_cost * self.W)
+        updates[self.delta_hbias] = (
+            momentum * self.delta_hbias + lr * (1.0/batch_size) * 
+            (T.sum(h_data, axis=0) - T.sum(hp_rec, axis=0)))
+        updates[self.delta_vbias] = (
+            momentum * self.delta_vbias + lr * (1.0/batch_size) *
+            (T.sum(self.input, axis=0) - T.sum(v_rec, axis=0)))
             
         updates[self.W] = self.W + updates[self.delta_W]
         updates[self.hbias] = self.hbias + updates[self.delta_hbias]
diff --git a/models/dbn.py b/models/dbn.py
@@ -122,17 +122,15 @@ def __init__(self, numpy_rng, theano_rng=None, n_ins=784,
                               n_visible=input_size,
                               n_hidden=hidden_layers_sizes[i],
                               W=sigmoid_layer.W,
-                              hbias=sigmoid_layer.b,
-                              activation=activation)
+                              hbias=sigmoid_layer.b)
             else:
                 rbm_layer = RBM(numpy_rng=numpy_rng,
                               theano_rng=theano_rng,
                               input=layer_input,
                               n_visible=input_size,
                               n_hidden=hidden_layers_sizes[i],
                               W=sigmoid_layer.W,
-                              hbias=sigmoid_layer.b,
-                              activation=activation)
+                              hbias=sigmoid_layer.b)
             self.rbm_layers.append(rbm_layer)            
 
         # We now need to add a logistic layer on top of the MLP
diff --git a/run/run_DBN.py b/run/run_DBN.py
@@ -97,7 +97,7 @@ def runRBM(arg):
     else :
         model_config = load_model(arg,'RBM')
 
-    rbm_config = load_rbm_spec(model_config['rbm_nnet_spec'])
+    rbm_config = load_rbm_spec(model_config['nnet_spec'])
     data_spec =  load_data_spec(model_config['data_spec']);
 
 
@@ -110,19 +110,21 @@ def runRBM(arg):
     createDir(model_config['wdir']);
     #create working dir
 
+    keep_layer_num = model_config['keep_layer_num']
+    batch_size = model_config['batch_size']
+    wdir = model_config['wdir']
+    
+
     dbn = DBN(numpy_rng=numpy_rng, theano_rng = theano_rng, n_ins=rbm_config['n_ins'],
             hidden_layers_sizes=rbm_config['hidden_layers'],n_outs=rbm_config['n_outs'],
             first_layer_gb = rbm_config['first_layer_gb'],
             pretrainedLayers=rbm_config['pretrained_layers'],
             activation=activationFn)
 
+
     train_sets, train_xy, train_x, train_y = read_dataset(data_spec['training'],
         model_config['batch_size'])
 
-    keep_layer_num = model_config['keep_layer_num']
-    batch_size = model_config['batch_size']
-    wdir = model_config['wdir']
-    
     if keep_layer_num > 0:
         current_nnet = wdir + '/nnet.ptr.current'
         logger.info('Initializing model from ' + str(current_nnet) + '....')
@@ -132,10 +134,6 @@ def runRBM(arg):
 
     preTraining(dbn,train_sets,train_xy,train_x,train_y,model_config)
 
-    # save the pretrained nnet to file
-    logger.info('Saving model to ' + str(model_config['output_file']) + '....')
-    _nnet2file(dbn.sigmoid_layers, filename=model_config['output_file'], withfinal=True)
-    
 
     ########################
     # FINETUNING THE MODEL #
@@ -164,8 +162,6 @@ def runRBM(arg):
     fineTunning(dbn,train_sets,train_xy,train_x,train_y,
         valid_sets,valid_xy,valid_x,valid_y,lrate,momentum,batch_size)
 
-    logger.info('Saving model to ' + str(model_config['output_file']) + '.final ....')
-    _nnet2file(dbn.sigmoid_layers, filename=model_config['output_file']+'.final', withfinal=True)
 
     try:
         test_sets, test_xy, test_x, test_y = read_dataset(data_spec['testing'],
@@ -178,6 +174,9 @@ def runRBM(arg):
 
     testing(dbn,test_sets, test_xy, test_x, test_y,batch_size)
 
+    logger.info('Saving model to ' + str(model_config['output_file']) + ' ....')
+    _nnet2file(dbn.sigmoid_layers, filename=model_config['output_file'], withfinal=True)
+
 
 
 if __name__ == '__main__':
diff --git a/run/run_SDA.py b/run/run_SDA.py
diff --git a/utils/load_conf.py b/utils/load_conf.py