
Commit 445e9a5

Set dtype consistently for all features.

1 parent 5e4be25  commit 445e9a5

4 files changed: +81 -76 lines changed

ocr_utils.py  (+14 -13)

@@ -156,7 +156,7 @@ class TruthedCharacters(object):
    Holds the training features and size information

    """
-    def __init__(self, features, output_feature_list, one_hot_map, engine_type,h,w):
+    def __init__(self, features, output_feature_list, one_hot_map, engine_type,h,w, dtype):

        self._num_examples = features[0].shape[0]
        self._nRows = h
@@ -168,6 +168,7 @@ def __init__(self, features, output_feature_list, one_hot_map, engine_type,h,w)
        self._num_features = len(features)
        self._one_hot_map = one_hot_map # list >0 for each feature that is one_hot
        self._engine_type= engine_type
+        self._dtype = dtype

        self._feature_width=[]
        for i in range(self._num_features ):
@@ -210,7 +211,7 @@ def get_features(self, i, start, end):
        if n_hots==0:
            rtn=self.engine_conversion(t1, self._feature_names[i])
        else:
-            rtn= self.engine_conversion(np.eye(n_hots )[t1], self._feature_names[i])
+            rtn= self.engine_conversion(np.eye(n_hots, dtype=self._dtype )[t1], self._feature_names[i])
        return rtn

    @property
@@ -222,7 +223,7 @@ def features(self):
                rtn.append(self.engine_conversion(t1, nm) )
                #assert(np.all(rtn[-1]==t1))
            else:
-                rtn.append( self.engine_conversion(np.eye(n_hots )[t1], nm) )
+                rtn.append( self.engine_conversion(np.eye(n_hots, dtype=self._dtype )[t1], nm) )
        return rtn

    @property
@@ -271,7 +272,7 @@ def next_batch(self, batch_size):
        outs = []
        for i in range(self._num_features):
            outs += [self.get_features(i,start,end)]
-
+
        return outs

    def dump_values(self):
@@ -500,19 +501,19 @@ class DataSets(object):
    feature_name=[]
    one_hot_map = []

-    for colName in output_feature_list:
+    for colName in output_feature_list:
        one_hot_map.append(0)
        if colName=="aspect_ratio":
-            t1 = np.array(df['originalW'] ,dtype=np.float32)
-            t2 = np.array(df['originalH'] ,dtype=np.float32)
+            t1 = np.array(df['originalW'] ,dtype=dtype)
+            t2 = np.array(df['originalH'] ,dtype=dtype)
            t1 = t1[:]/t2[:]
            feature_name.append(colName)

        elif colName=="upper_case":
            boolDF1 = df['m_label']>=64
            boolDF2 = df['m_label']<=90
            boolDF = boolDF1 & boolDF2
-            t1 = np.array(boolDF,dtype=np.float32)
+            t1 = np.array(boolDF,dtype=dtype)
            feature_name.append(colName)

        elif colName=='image':
@@ -521,7 +522,7 @@ class DataSets(object):
            feature_name.append(colName)

        elif colName=='m_label_one_hot':
-            t1 = np.array(df['m_label'] )
+            t1 = np.array(df['m_label'])
            t1 = convert_to_unique(t1)
            one_hot_map[-1] = len(np.unique(t1))
            feature_name.append(colName)
@@ -561,7 +562,7 @@ class DataSets(object):

        else:
            if colName in df.columns :
-                t1=np.array(df[colName])
+                t1=np.array(df[colName], dtype=dtype)
                feature_name.append(colName)
            else:
                raise ValueError('Invalid ouput_feature_name: {}: it is not in the the database'.format(colName))
@@ -576,9 +577,9 @@ class DataSets(object):
        outvars_test.append( ot[:nTestCount])
        outvars_evaluation.append(ot[nTestCount:nTestCount+nEvaluationCount])

-    data_sets.train = TruthedCharacters(outvars_train, feature_name, one_hot_map, engine_type, h, w)
-    data_sets.test = TruthedCharacters(outvars_test, feature_name, one_hot_map, engine_type, h, w)
-    data_sets.evaluation = TruthedCharacters(outvars_evaluation,feature_name, one_hot_map, engine_type, h, w)
+    data_sets.train = TruthedCharacters(outvars_train, feature_name, one_hot_map, engine_type, h, w, dtype)
+    data_sets.test = TruthedCharacters(outvars_test, feature_name, one_hot_map, engine_type, h, w, dtype)
+    data_sets.evaluation = TruthedCharacters(outvars_evaluation,feature_name, one_hot_map, engine_type, h, w, dtype)
    print ('feature results:')
    print ('\tnumber of train Images = ',nTrainCount)
    print ('\tnumber of test Images = ',nTestCount)
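The ocr_utils.py change threads the caller's dtype down into TruthedCharacters so the one-hot expansion no longer falls back to NumPy's float64 default. A minimal standalone sketch of that pattern (the label values below are made-up examples, not repository data):

import numpy as np

dtype = np.float32                          # same module-level choice the training scripts make
labels = np.array([2, 0, 1])                # hypothetical class indices
one_hot = np.eye(3, dtype=dtype)[labels]    # np.eye() would default to float64 without dtype=

print(one_hot.dtype)                        # float32, matching every other feature array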

q2_tensorflow_mnist.py  (+22 -20)

@@ -33,14 +33,16 @@
import pandas as pd

import tensorflow as tf
+dtype=np.float32
#with tf.device('/gpu:0'):
#with tf.device('/cpu:0'):
def train_a_font(input_filters_dict,output_feature_list, nEpochs=5000):

    ds = ocr_utils.read_data(input_filters_dict = input_filters_dict,
                             output_feature_list=output_feature_list,
                             test_size = .1,
-                             engine_type='tensorflow')
+                             engine_type='tensorflow',
+                             dtype=dtype)


    """# ==============================================================================
@@ -85,7 +87,7 @@ def train_a_font(input_filters_dict,output_feature_list, nEpochs=5000):
        nm = 'x_'+nm
        if i>1:
            extra_features_width += ds.train.feature_width[i]
-        lst.append(tf.placeholder(tf.float32, shape=[None, ds.train.feature_width[i]], name=nm))
+        lst.append(tf.placeholder(dtype, shape=[None, ds.train.feature_width[i]], name=nm))

    # ph is a named tuple with key names like 'image', 'm_label', and values that
    # are tensors. The display name on the Chrome graph are 'y_m_label', 'x_image,
@@ -110,13 +112,13 @@ def train_a_font(input_filters_dict,output_feature_list, nEpochs=5000):

    """# ==============================================================================

-    def weight_variable(shape):
-        initial = tf.truncated_normal(shape, stddev=0.1)
+    def weight_variable(shape, dtype):
+        initial = tf.truncated_normal(shape, stddev=0.1,dtype=dtype)
        return tf.Variable(initial)

-    def bias_variable(shape):
-        initial = tf.constant(0.1, shape=shape)
-        return tf.Variable(initial)
+    def bias_variable(shape, dtype):
+        initial = tf.constant(0.1, shape=shape, dtype=dtype)
+        return tf.Variable(initial)

    """# ==============================================================================

@@ -139,8 +141,8 @@ def max_pool_2x2(x):

    """# ==============================================================================
    with tf.name_scope("w_conv1") as scope:
-        W_conv1 = weight_variable([5, 5, 1, nConv1])
-        b_conv1 = bias_variable([nConv1])
+        W_conv1 = weight_variable([5, 5, 1, nConv1],dtype)
+        b_conv1 = bias_variable([nConv1],dtype)

    with tf.name_scope("reshape_x_image") as scope:
        x_image = tf.reshape(ph.image, [-1,nCols,nRows,1])
@@ -170,8 +172,8 @@ def max_pool_2x2(x):
    """# ==============================================================================

    with tf.name_scope("convolve_2") as scope:
-        W_conv2 = weight_variable([5, 5, nConv1, nConv2])
-        b_conv2 = bias_variable([64])
+        W_conv2 = weight_variable([5, 5, nConv1, nConv2],dtype)
+        b_conv2 = bias_variable([64],dtype)
        h_conv2 = tf.nn.relu(conv2d(h_pool1, W_conv2) + b_conv2)

    with tf.name_scope("pool_2") as scope:
@@ -189,8 +191,8 @@ def max_pool_2x2(x):
    """# ==============================================================================

    with tf.name_scope("W_fc1_b") as scope:
-        W_fc1 = weight_variable([n_h_pool2_outputsx, nFc])
-        b_fc1 = bias_variable([nFc])
+        W_fc1 = weight_variable([n_h_pool2_outputsx, nFc],dtype)
+        b_fc1 = bias_variable([nFc],dtype)

        h_pool2_flat = tf.reshape(h_pool2, [-1, n_h_pool2_outputs])

@@ -204,7 +206,7 @@ def max_pool_2x2(x):
    Dropout

    """# ==============================================================================
-    keep_prob = tf.placeholder(tf.float32,name='keep_prob')
+    keep_prob = tf.placeholder(dtype,name='keep_prob')

    with tf.name_scope("drop") as scope:
        h_fc1_drop = tf.nn.dropout(h_fc1, keep_prob)
@@ -215,8 +217,8 @@ def max_pool_2x2(x):

    """# ==============================================================================
    with tf.name_scope("softmax") as scope:
-        W_fc2 = weight_variable([nFc, nTarget])
-        b_fc2 = bias_variable([nTarget])
+        W_fc2 = weight_variable([nFc, nTarget],dtype)
+        b_fc2 = bias_variable([nTarget],dtype)
        y_conv=tf.nn.softmax(tf.matmul(h_fc1_drop, W_fc2) + b_fc2)

    """# ==============================================================================
@@ -236,7 +238,7 @@ def max_pool_2x2(x):
    with tf.name_scope("test") as scope:
        correct_prediction = tf.equal(tf.argmax(y_conv,1), tf.argmax(ph[0],1))

-        accuracy = tf.reduce_mean(tf.cast(correct_prediction, tf.float32))
+        accuracy = tf.reduce_mean(tf.cast(correct_prediction, dtype))
        accuracy_summary = tf.scalar_summary("accuracy", accuracy)

    merged = tf.merge_all_summaries()
@@ -340,7 +342,7 @@ def computeSize(s,tens):
    # input_filters_dict = {'font': ('OCRA','OCRB'), 'fontVariant':('scanned',)}

    # select everything; all fonts , font variants, etc.
-    input_filters_dict = {}
+    #input_filters_dict = {}

    # select the digits 0 through 9 in the E13B font
    # input_filters_dict = {'m_label': range(48,58), 'font': 'E13B'}
@@ -358,9 +360,9 @@ def computeSize(s,tens):
    #output_feature_list = ['font_one_hot','image','italic','aspect_ratio','upper_case']

    # train the digits 0-9 for all fonts
-    #input_filters_dict = {'m_label': range(48,58)}
+    input_filters_dict = {'m_label': range(48,58)}
    output_feature_list = ['m_label_one_hot','image','italic','aspect_ratio','upper_case']
-    train_a_font(input_filters_dict, output_feature_list, nEpochs = 50000)
+    train_a_font(input_filters_dict, output_feature_list, nEpochs = 5000)

else:
    # loop through all the fonts and train individually
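In q2_tensorflow_mnist.py the same module-level constant now reaches the graph-building helpers, so placeholders, weights, biases, and the accuracy cast all share one precision. A hedged sketch of how the parameterized helpers are used after this change (old graph-mode TensorFlow API, as in the script; the [5, 5, 1, 32] shape is illustrative only):

import numpy as np
import tensorflow as tf

dtype = np.float32     # flip this one constant to change the whole graph's precision

def weight_variable(shape, dtype):
    # truncated-normal initializer built in the requested precision
    initial = tf.truncated_normal(shape, stddev=0.1, dtype=dtype)
    return tf.Variable(initial)

def bias_variable(shape, dtype):
    initial = tf.constant(0.1, shape=shape, dtype=dtype)
    return tf.Variable(initial)

W_conv1 = weight_variable([5, 5, 1, 32], dtype)       # illustrative filter shape
b_conv1 = bias_variable([32], dtype)
keep_prob = tf.placeholder(dtype, name='keep_prob')   # dropout keep probability in the same dtype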

q5_tensorflow_residual.py  (+24 -22)

@@ -35,14 +35,16 @@
import pandas as pd

import tensorflow as tf
+dtype = np.float32
#with tf.device('/GPU:0'):
#with tf.device('/cpu:0'):
def train_a_font(input_filters_dict,output_feature_list, nEpochs=5000):

    ds = ocr_utils.read_data(input_filters_dict = input_filters_dict,
                             output_feature_list=output_feature_list,
                             test_size = .1,
-                             engine_type='tensorflow')
+                             engine_type='tensorflow',
+                             dtype=dtype)


    """# ==============================================================================
@@ -86,7 +88,7 @@ def train_a_font(input_filters_dict,output_feature_list, nEpochs=5000):
        nm = 'x_'+nm
        if i>1:
            extra_features_width += ds.train.feature_width[i]
-        lst.append(tf.placeholder(tf.float32, shape=[None, ds.train.feature_width[i]], name=nm))
+        lst.append(tf.placeholder(dtype, shape=[None, ds.train.feature_width[i]], name=nm))

    # ph is a named tuple with key names like 'image', 'm_label', and values that
    # are tensors. The display name on the Chrome graph are 'y_m_label', 'x_image,
@@ -113,13 +115,13 @@ def train_a_font(input_filters_dict,output_feature_list, nEpochs=5000):

    """# ==============================================================================

-    def weight_variable(shape):
-        initial = tf.truncated_normal(shape, stddev=0.1)
+    def weight_variable(shape, dtype):
+        initial = tf.truncated_normal(shape, stddev=0.1,dtype=dtype)
        return tf.Variable(initial)

-    def bias_variable(shape):
-        initial = tf.constant(0.1, shape=shape)
-        return tf.Variable(initial)
+    def bias_variable(shape, dtype):
+        initial = tf.constant(0.1, shape=shape, dtype=dtype)
+        return tf.Variable(initial)

    """# ==============================================================================

@@ -142,8 +144,8 @@ def max_pool_2x2(x):

    """# ==============================================================================
    with tf.name_scope("w_conv1") as scope:
-        W_conv1 = weight_variable([5, 5, 1, nConv1])
-        b_conv1 = bias_variable([nConv1])
+        W_conv1 = weight_variable([5, 5, 1, nConv1],dtype)
+        b_conv1 = bias_variable([nConv1],dtype)

    with tf.name_scope("reshape_x_image") as scope:
        x_image = tf.reshape(ph.image, [-1,nCols,nRows,1])
@@ -173,8 +175,8 @@ def max_pool_2x2(x):
    """# ==============================================================================

    with tf.name_scope("convolve_2") as scope:
-        W_conv2 = weight_variable([5, 5, nConv1, nConv2])
-        b_conv2 = bias_variable([64])
+        W_conv2 = weight_variable([5, 5, nConv1, nConv2],dtype)
+        b_conv2 = bias_variable([64],dtype)
        h_conv2 = tf.nn.relu(conv2d(h_pool1, W_conv2) + b_conv2)

    with tf.name_scope("pool_2") as scope:
@@ -192,8 +194,8 @@ def max_pool_2x2(x):
    """# ==============================================================================

    with tf.name_scope("W_fc0_b") as scope:
-        W_fc0 = weight_variable([n_h_pool2_outputsx, nFc0])
-        b_fc0 = bias_variable([nFc0])
+        W_fc0 = weight_variable([n_h_pool2_outputsx, nFc0],dtype)
+        b_fc0 = bias_variable([nFc0],dtype)

        h_pool2_flat = tf.reshape(h_pool2, [-1, n_h_pool2_outputs])

@@ -213,8 +215,8 @@ def max_pool_2x2(x):
    """# ==============================================================================

    with tf.name_scope("W_fc1_b") as scope:
-        W_fc1 = weight_variable([nFc0, nFc1])
-        b_fc1 = bias_variable([nFc1])
+        W_fc1 = weight_variable([nFc0, nFc1],dtype)
+        b_fc1 = bias_variable([nFc1],dtype)

        h_fc1 = tf.nn.relu(tf.matmul(h_fc0, W_fc1) + b_fc1)

@@ -230,16 +232,16 @@ def max_pool_2x2(x):
    """# ==============================================================================

    with tf.name_scope("W_fc2_b") as scope:
-        W_fc2 = weight_variable([nFc1, nFc2])
-        b_fc2 = bias_variable([nFc2])
+        W_fc2 = weight_variable([nFc1, nFc2],dtype)
+        b_fc2 = bias_variable([nFc2],dtype)

        h_fc2 = tf.nn.relu(tf.matmul(h_fc1, W_fc2) + b_fc2)

    """# ==============================================================================
    Dropout

    """# ==============================================================================
-    keep_prob = tf.placeholder(tf.float32,name='keep_prob')
+    keep_prob = tf.placeholder(dtype,name='keep_prob')

    with tf.name_scope("drop") as scope:
        h_fc2_drop = tf.nn.dropout(h_fc2, keep_prob)
@@ -250,8 +252,8 @@ def max_pool_2x2(x):

    """# ==============================================================================
    with tf.name_scope("softmax") as scope:
-        W_fc3 = weight_variable([nFc2, nTarget])
-        b_fc3 = bias_variable([nTarget])
+        W_fc3 = weight_variable([nFc2, nTarget],dtype)
+        b_fc3 = bias_variable([nTarget],dtype)
        y_conv=tf.nn.softmax(tf.matmul(h_fc2_drop, W_fc3) + b_fc3)

    """# ==============================================================================
@@ -271,7 +273,7 @@ def max_pool_2x2(x):
    with tf.name_scope("test") as scope:
        correct_prediction = tf.equal(tf.argmax(y_conv,1), tf.argmax(ph[0],1))

-        accuracy = tf.reduce_mean(tf.cast(correct_prediction, tf.float32))
+        accuracy = tf.reduce_mean(tf.cast(correct_prediction,dtype))
        accuracy_summary = tf.scalar_summary("accuracy", accuracy)

    merged = tf.merge_all_summaries()
@@ -399,7 +401,7 @@ def computeSize(s,tens):
    #output_feature_list = ['font_one_hot','image','italic','aspect_ratio','upper_case']

    # train the digits 0-9 for all fonts
-    input_filters_dict = {'m_label': list(range(48,58))+list(range(65,91))+list(range(97,123))}
+    input_filters_dict = {'m_label': list(range(48,58))+list(range(65,91))+list(range(97,123)),'fontVariant':'scanned'}
    #input_filters_dict = {}
    output_feature_list = ['m_label_one_hot','image','italic','aspect_ratio','upper_case']
    train_a_font(input_filters_dict, output_feature_list, nEpochs = 20000)
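Both training scripts now pass the dtype through ocr_utils.read_data, the single entry point this commit extends. A usage sketch based on the calls shown above (the filter and feature values are examples taken from the scripts; the only behavior assumed is that batches come back in the requested precision):

import numpy as np
import ocr_utils

dtype = np.float32
ds = ocr_utils.read_data(input_filters_dict={'m_label': range(48, 58)},   # digits 0-9, as in q2
                         output_feature_list=['m_label_one_hot', 'image'],
                         test_size=.1,
                         engine_type='tensorflow',
                         dtype=dtype)

batch = ds.train.next_batch(100)   # each feature array should now be float32, not float64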
