@@ -31,7 +31,9 @@ def __init__(self, options):
         self.options = options

         # Char embeddings
-        self.char_emb_mat = self.random_weight(self.options['char_vocab_size'], self.options['char_emb_mat_dim'], name='char_emb_matrix')
+        if options['char_emb']:
+            self.char_emb_mat = self.random_weight(self.options['char_vocab_size'],
+                                                   self.options['char_emb_mat_dim'], name='char_emb_matrix')

         # Weights
         self.W_uQ = self.random_weight(2 * options['state_size'], options['state_size'], name='W_uQ')
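The cells created in the next hunk and the matching layers further down call two helpers that this diff does not touch, self.DropoutWrappedGRUCell and self.mat_weight_mul. A minimal sketch of both, assuming the former pairs tf.contrib.rnn.GRUCell with a DropoutWrapper on its inputs and the latter flattens the batch and time axes before a single tf.matmul (the names and call signatures come from this file, the bodies are assumptions):

    def DropoutWrappedGRUCell(self, hidden_size, in_keep_prob):
        # GRU cell with dropout applied to its inputs; in_keep_prob=1.0 disables dropout,
        # which is what the lines this patch removes were doing.
        cell = tf.contrib.rnn.GRUCell(hidden_size)
        return tf.contrib.rnn.DropoutWrapper(cell, input_keep_prob=in_keep_prob)

    def mat_weight_mul(self, mat, weight):
        # mat: [batch_size, n, m], weight: [m, k] -> [batch_size, n, k]
        mat_shape = mat.get_shape().as_list()
        weight_shape = weight.get_shape().as_list()
        flat = tf.reshape(mat, [-1, mat_shape[-1]])
        return tf.reshape(tf.matmul(flat, weight), [-1, mat_shape[1], weight_shape[-1]])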
@@ -55,86 +57,98 @@ def __init__(self, options):

         # QP_match
         with tf.variable_scope('QP_match') as scope:
-            self.QPmatch_cell = self.DropoutWrappedGRUCell(self.options['state_size'], 1.0)
+            self.QPmatch_cell = self.DropoutWrappedGRUCell(self.options['state_size'], self.options['in_keep_prob'])
             self.QPmatch_state = self.QPmatch_cell.zero_state(self.options['batch_size'], dtype=tf.float32)

         # Ans Ptr
         with tf.variable_scope('Ans_ptr') as scope:
-            self.AnsPtr_cell = self.DropoutWrappedGRUCell(2 * self.options['state_size'], 1.0)
+            self.AnsPtr_cell = self.DropoutWrappedGRUCell(2 * self.options['state_size'], self.options['in_keep_prob'])

     def build_model(self):
-        paragraph = tf.placeholder(tf.float32, [self.options['batch_size'], self.options['p_length'], self.options['emb_dim']])
-        paragraph_c = tf.placeholder(tf.int32, [self.options['batch_size'], self.options['p_length'], self.options['char_max_length']])
-        question = tf.placeholder(tf.float32, [self.options['batch_size'], self.options['q_length'], self.options['emb_dim']])
-        question_c = tf.placeholder(tf.int32, [self.options['batch_size'], self.options['q_length'], self.options['char_max_length']])
-        answer_si = tf.placeholder(tf.float32, [self.options['batch_size'], self.options['p_length']])
-        answer_ei = tf.placeholder(tf.float32, [self.options['batch_size'], self.options['p_length']])
+        opts = self.options
+
+        # placeholders
+        paragraph = tf.placeholder(tf.float32, [opts['batch_size'], opts['p_length'], opts['emb_dim']])
+        question = tf.placeholder(tf.float32, [opts['batch_size'], opts['q_length'], opts['emb_dim']])
+        answer_si = tf.placeholder(tf.float32, [opts['batch_size'], opts['p_length']])
+        answer_ei = tf.placeholder(tf.float32, [opts['batch_size'], opts['p_length']])
+        if opts['char_emb']:
+            paragraph_c = tf.placeholder(tf.int32, [opts['batch_size'], opts['p_length'], opts['char_max_length']])
+            question_c = tf.placeholder(tf.int32, [opts['batch_size'], opts['q_length'], opts['char_max_length']])

         print('Question and Passage Encoding')
-        # char embedding -> word level char embedding
-        paragraph_c_emb = tf.nn.embedding_lookup(self.char_emb_mat, paragraph_c)  # [batch_size, p_length, char_max_length, char_emb_dim]
-        question_c_emb = tf.nn.embedding_lookup(self.char_emb_mat, question_c)
-        paragraph_c_list = [tf.squeeze(w, [1]) for w in tf.split(paragraph_c_emb, self.options['p_length'], axis=1)]
-        question_c_list = [tf.squeeze(w, [1]) for w in tf.split(question_c_emb, self.options['q_length'], axis=1)]
+        if opts['char_emb']:
+            # char embedding -> word level char embedding
+            paragraph_c_emb = tf.nn.embedding_lookup(self.char_emb_mat, paragraph_c)  # [batch_size, p_length, char_max_length, char_emb_dim]
+            question_c_emb = tf.nn.embedding_lookup(self.char_emb_mat, question_c)
+            paragraph_c_list = [tf.squeeze(w, [1]) for w in tf.split(paragraph_c_emb, opts['p_length'], axis=1)]
+            question_c_list = [tf.squeeze(w, [1]) for w in tf.split(question_c_emb, opts['q_length'], axis=1)]
+
+            c_Q = []
+            c_P = []
+            with tf.variable_scope('char_emb_rnn') as scope:
+                char_emb_fw_cell = self.DropoutWrappedGRUCell(opts['emb_dim'], 1.0)
+                char_emb_bw_cell = self.DropoutWrappedGRUCell(opts['emb_dim'], 1.0)
+                for t in range(opts['q_length']):
+                    unstacked_q_c = tf.unstack(question_c_list[t], opts['char_max_length'], 1)
+                    if t > 0:
+                        tf.get_variable_scope().reuse_variables()
+                    q_c_e_outputs, q_c_e_final_fw, q_c_e_final_bw = tf.contrib.rnn.static_bidirectional_rnn(
+                        char_emb_fw_cell, char_emb_bw_cell, unstacked_q_c, dtype=tf.float32, scope='char_emb')
+                    c_q_t = tf.concat([q_c_e_final_fw[1], q_c_e_final_bw[1]], 1)
+                    c_Q.append(c_q_t)
+                for t in range(opts['p_length']):
+                    unstacked_p_c = tf.unstack(paragraph_c_list[t], opts['char_max_length'], 1)
+                    p_c_e_outputs, p_c_e_final_fw, p_c_e_final_bw = tf.contrib.rnn.static_bidirectional_rnn(
+                        char_emb_fw_cell, char_emb_bw_cell, unstacked_p_c, dtype=tf.float32, scope='char_emb')
+                    c_p_t = tf.concat([p_c_e_final_fw[1], p_c_e_final_bw[1]], 1)
+                    c_P.append(c_p_t)
+            c_Q = tf.stack(c_Q, 1)
+            c_P = tf.stack(c_P, 1)
+            print('c_Q', c_Q)
+            print('c_P', c_P)
+
+            # Concat e and c
+            eQcQ = tf.concat([question, c_Q], 2)
+            ePcP = tf.concat([paragraph, c_P], 2)
+        else:
+            eQcQ = question
+            ePcP = paragraph

-        c_Q = []
-        c_P = []
-        with tf.variable_scope('char_emb_rnn') as scope:
-            char_emb_fw_cell = self.DropoutWrappedGRUCell(self.options['emb_dim'], 1.0)
-            char_emb_bw_cell = self.DropoutWrappedGRUCell(self.options['emb_dim'], 1.0)
-            for t in range(self.options['q_length']):
-                unstacked_q_c = tf.unstack(question_c_list[t], self.options['char_max_length'], 1)
-                if t > 0:
-                    tf.get_variable_scope().reuse_variables()
-                q_c_e_outputs, q_c_e_final_fw, q_c_e_final_bw = tf.contrib.rnn.static_bidirectional_rnn(
-                    char_emb_fw_cell, char_emb_bw_cell, unstacked_q_c, dtype=tf.float32, scope='char_emb')
-                c_q_t = tf.concat([q_c_e_final_fw[1], q_c_e_final_bw[1]], 1)
-                c_Q.append(c_q_t)
-            for t in range(self.options['p_length']):
-                unstacked_p_c = tf.unstack(paragraph_c_list[t], self.options['char_max_length'], 1)
-                p_c_e_outputs, p_c_e_final_fw, p_c_e_final_bw = tf.contrib.rnn.static_bidirectional_rnn(
-                    char_emb_fw_cell, char_emb_bw_cell, unstacked_p_c, dtype=tf.float32, scope='char_emb')
-                c_p_t = tf.concat([p_c_e_final_fw[1], p_c_e_final_bw[1]], 1)
-                c_P.append(c_p_t)
-        c_Q = tf.stack(c_Q, 1)
-        c_P = tf.stack(c_P, 1)
-        print('c_Q', c_Q)
-        print('c_P', c_P)
-        # Concat e and c
-        eQcQ = tf.concat([question, c_Q], 2)
-        ePcP = tf.concat([paragraph, c_P], 2)
-        unstacked_eQcQ = tf.unstack(eQcQ, self.options['q_length'], 1)
-        unstacked_ePcP = tf.unstack(ePcP, self.options['p_length'], 1)
+        unstacked_eQcQ = tf.unstack(eQcQ, opts['q_length'], 1)
+        unstacked_ePcP = tf.unstack(ePcP, opts['p_length'], 1)

         with tf.variable_scope('encoding') as scope:
-            enc_fw_cell = self.DropoutWrappedGRUCell(self.options['state_size'], 1.0)
-            enc_bw_cell = self.DropoutWrappedGRUCell(self.options['state_size'], 1.0)
-            q_enc_outputs, q_enc_final_fw, q_enc_final_bw = tf.contrib.rnn.static_bidirectional_rnn(
-                enc_fw_cell, enc_bw_cell, unstacked_eQcQ, dtype=tf.float32, scope='context_encoding')
+            stacked_enc_fw_cells = [self.DropoutWrappedGRUCell(opts['state_size'], opts['in_keep_prob']) for _ in range(2)]
+            stacked_enc_bw_cells = [self.DropoutWrappedGRUCell(opts['state_size'], opts['in_keep_prob']) for _ in range(2)]
+            q_enc_outputs, q_enc_final_fw, q_enc_final_bw = tf.contrib.rnn.stack_bidirectional_rnn(
+                stacked_enc_fw_cells, stacked_enc_bw_cells, unstacked_eQcQ, dtype=tf.float32, scope='context_encoding')
             tf.get_variable_scope().reuse_variables()
-            p_enc_outputs, p_enc_final_fw, p_enc_final_bw = tf.contrib.rnn.static_bidirectional_rnn(
-                enc_fw_cell, enc_bw_cell, unstacked_ePcP, dtype=tf.float32, scope='context_encoding')
+            p_enc_outputs, p_enc_final_fw, p_enc_final_bw = tf.contrib.rnn.stack_bidirectional_rnn(
+                stacked_enc_fw_cells, stacked_enc_bw_cells, unstacked_ePcP, dtype=tf.float32, scope='context_encoding')
         u_Q = tf.stack(q_enc_outputs, 1)
         u_P = tf.stack(p_enc_outputs, 1)
+        u_Q = tf.nn.dropout(u_Q, opts['in_keep_prob'])
+        u_P = tf.nn.dropout(u_P, opts['in_keep_prob'])
         print(u_Q)
         print(u_P)

         v_P = []
         print('Question-Passage Matching')
-        for t in range(self.options['p_length']):
+        for t in range(opts['p_length']):
             # Calculate c_t
             W_uQ_u_Q = self.mat_weight_mul(u_Q, self.W_uQ)  # [batch_size, q_length, state_size]
-            tiled_u_tP = tf.concat([tf.reshape(u_P[:, t, :], [self.options['batch_size'], 1, -1])] * self.options['q_length'], 1)
+            tiled_u_tP = tf.concat([tf.reshape(u_P[:, t, :], [opts['batch_size'], 1, -1])] * opts['q_length'], 1)
             W_uP_u_tP = self.mat_weight_mul(tiled_u_tP, self.W_uP)

             if t == 0:
                 tanh = tf.tanh(W_uQ_u_Q + W_uP_u_tP)
             else:
-                tiled_v_t1P = tf.concat([tf.reshape(v_P[t - 1], [self.options['batch_size'], 1, -1])] * self.options['q_length'], 1)
+                tiled_v_t1P = tf.concat([tf.reshape(v_P[t - 1], [opts['batch_size'], 1, -1])] * opts['q_length'], 1)
                 W_vP_v_t1P = self.mat_weight_mul(tiled_v_t1P, self.W_vP)
                 tanh = tf.tanh(W_uQ_u_Q + W_uP_u_tP + W_vP_v_t1P)
             s_t = tf.squeeze(self.mat_weight_mul(tanh, tf.reshape(self.B_v_QP, [-1, 1])))
             a_t = tf.nn.softmax(s_t, 1)
-            tiled_a_t = tf.concat([tf.reshape(a_t, [self.options['batch_size'], -1, 1])] * 2 * self.options['state_size'], 2)
+            tiled_a_t = tf.concat([tf.reshape(a_t, [opts['batch_size'], -1, 1])] * 2 * opts['state_size'], 2)
             c_t = tf.reduce_sum(tf.multiply(tiled_a_t, u_Q), 1)  # [batch_size, 2 * state_size]

             # gate
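The gate body itself falls in the lines this hunk elides; from the context that follows (u_tP_c_t_star feeding QPmatch_cell) it is the R-Net gated attention input, roughly as below. This is a reconstruction, not part of the diff, and the weight name self.W_g is an assumption:

    u_tP_c_t = tf.expand_dims(tf.concat([u_P[:, t, :], c_t], 1), 1)  # word encoding + attended question vector
    g_t = tf.sigmoid(self.mat_weight_mul(u_tP_c_t, self.W_g))        # element-wise sigmoid gate
    u_tP_c_t_star = tf.squeeze(tf.multiply(u_tP_c_t, g_t))           # gated input, consumed by QPmatch_cell below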
@@ -148,20 +162,21 @@ def build_model(self):
                 output, self.QPmatch_state = self.QPmatch_cell(u_tP_c_t_star, self.QPmatch_state)
             v_P.append(output)
         v_P = tf.stack(v_P, 1)
+        v_P = tf.nn.dropout(v_P, opts['in_keep_prob'])
         print('v_P', v_P)

         print('Self-Matching Attention')
         SM_star = []
-        for t in range(self.options['p_length']):
+        for t in range(opts['p_length']):
             # Calculate s_t
             W_p1_v_P = self.mat_weight_mul(v_P, self.W_smP1)  # [batch_size, p_length, state_size]
-            tiled_v_tP = tf.concat([tf.reshape(v_P[:, t, :], [self.options['batch_size'], 1, -1])] * self.options['p_length'], 1)
+            tiled_v_tP = tf.concat([tf.reshape(v_P[:, t, :], [opts['batch_size'], 1, -1])] * opts['p_length'], 1)
             W_p2_v_tP = self.mat_weight_mul(tiled_v_tP, self.W_smP2)

             tanh = tf.tanh(W_p1_v_P + W_p2_v_tP)
             s_t = tf.squeeze(self.mat_weight_mul(tanh, tf.reshape(self.B_v_SM, [-1, 1])))
             a_t = tf.nn.softmax(s_t, 1)
-            tiled_a_t = tf.concat([tf.reshape(a_t, [self.options['batch_size'], -1, 1])] * self.options['state_size'], 2)
+            tiled_a_t = tf.concat([tf.reshape(a_t, [opts['batch_size'], -1, 1])] * opts['state_size'], 2)
             c_t = tf.reduce_sum(tf.multiply(tiled_a_t, v_P), 1)  # [batch_size, 2 * state_size]

             # gate
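For reference, the self-matching attention that the loop above computes position by position can also be written as one batched operation; a sketch of the equivalent vectorized form, shown only to clarify what the loop does (not part of the diff, and memory-hungry because it materialises a [batch, p_length, p_length, state_size] intermediate):

    # scores[b, i, j] = B_v_SM . tanh(W_smP1 v_P[b, j] + W_smP2 v_P[b, i])
    W1_vP = self.mat_weight_mul(v_P, self.W_smP1)                             # [batch, p_length, state]
    W2_vP = self.mat_weight_mul(v_P, self.W_smP2)                             # [batch, p_length, state]
    pair = tf.tanh(tf.expand_dims(W2_vP, 2) + tf.expand_dims(W1_vP, 1))       # [batch, p_length, p_length, state]
    scores = tf.reduce_sum(pair * tf.reshape(self.B_v_SM, [1, 1, 1, -1]), 3)  # [batch, p_length, p_length]
    alpha = tf.nn.softmax(scores, 2)
    c_all = tf.matmul(alpha, v_P)                                             # attended context for every position at once

The looped form used here avoids that large intermediate at the price of a much bigger graph.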
@@ -170,25 +185,27 @@ def build_model(self):
             v_tP_c_t_star = tf.squeeze(tf.multiply(v_tP_c_t, g_t))
             SM_star.append(v_tP_c_t_star)
         SM_star = tf.stack(SM_star, 1)
-        unstacked_SM_star = tf.unstack(SM_star, self.options['p_length'], 1)
+        unstacked_SM_star = tf.unstack(SM_star, opts['p_length'], 1)

         with tf.variable_scope('Self_match') as scope:
-            SM_fw_cell = self.DropoutWrappedGRUCell(self.options['state_size'], 1.0)
-            SM_bw_cell = self.DropoutWrappedGRUCell(self.options['state_size'], 1.0)
+            SM_fw_cell = self.DropoutWrappedGRUCell(opts['state_size'], opts['in_keep_prob'])
+            SM_bw_cell = self.DropoutWrappedGRUCell(opts['state_size'], opts['in_keep_prob'])
             SM_outputs, SM_final_fw, SM_final_bw = tf.contrib.rnn.static_bidirectional_rnn(SM_fw_cell, SM_bw_cell, unstacked_SM_star, dtype=tf.float32)
         h_P = tf.stack(SM_outputs, 1)
+        h_P = tf.nn.dropout(h_P, opts['in_keep_prob'])
         print('h_P', h_P)

         print('Output Layer')
         # calculate r_Q
         W_ruQ_u_Q = self.mat_weight_mul(u_Q, self.W_ruQ)  # [batch_size, q_length, 2 * state_size]
         W_vQ_V_rQ = tf.matmul(self.W_VrQ, self.W_vQ)
-        W_vQ_V_rQ = tf.stack([W_vQ_V_rQ] * self.options['batch_size'], 0)  # stack -> [batch_size, state_size, state_size]
+        W_vQ_V_rQ = tf.stack([W_vQ_V_rQ] * opts['batch_size'], 0)  # stack -> [batch_size, state_size, state_size]

         tanh = tf.tanh(W_ruQ_u_Q + W_vQ_V_rQ)
         s_t = tf.squeeze(self.mat_weight_mul(tanh, tf.reshape(self.B_v_rQ, [-1, 1])))
         a_t = tf.nn.softmax(s_t, 1)
-        tiled_a_t = tf.concat([tf.reshape(a_t, [self.options['batch_size'], -1, 1])] * 2 * self.options['state_size'], 2)
+        tiled_a_t = tf.concat([tf.reshape(a_t, [opts['batch_size'], -1, 1])] * 2 * opts['state_size'], 2)
         r_Q = tf.reduce_sum(tf.multiply(tiled_a_t, u_Q), 1)  # [batch_size, 2 * state_size]
+        r_Q = tf.nn.dropout(r_Q, opts['in_keep_prob'])
         print('r_Q', r_Q)

         # r_Q as initial state of ans ptr
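The lines elided between this hunk and the next set up the two-step pointer loop that the context below continues; roughly as follows (reconstructed from the surrounding context, the exact elided code may differ):

    p = [None, None]                                # p[0]: start distribution, p[1]: end distribution
    W_hP_h_P = self.mat_weight_mul(h_P, self.W_hP)  # [batch_size, p_length, state_size], reused in both steps
    for t in range(2):
        if t == 0:
            h_t1a = r_Q                             # the question summary r_Q seeds the pointer GRU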
@@ -202,19 +219,19 @@ def build_model(self):
             else:
                 h_t1a = h_a
             print('h_t1a', h_t1a)
-            tiled_h_t1a = tf.concat([tf.reshape(h_t1a, [self.options['batch_size'], 1, -1])] * self.options['p_length'], 1)
+            tiled_h_t1a = tf.concat([tf.reshape(h_t1a, [opts['batch_size'], 1, -1])] * opts['p_length'], 1)
             W_ha_h_t1a = self.mat_weight_mul(tiled_h_t1a, self.W_ha)

             tanh = tf.tanh(W_hP_h_P + W_ha_h_t1a)
             s_t = tf.squeeze(self.mat_weight_mul(tanh, tf.reshape(self.B_v_ap, [-1, 1])))
             a_t = tf.nn.softmax(s_t, 1)
             p[t] = a_t

-            tiled_a_t = tf.concat([tf.reshape(a_t, [self.options['batch_size'], -1, 1])] * 2 * self.options['state_size'], 2)
+            tiled_a_t = tf.concat([tf.reshape(a_t, [opts['batch_size'], -1, 1])] * 2 * opts['state_size'], 2)
             c_t = tf.reduce_sum(tf.multiply(tiled_a_t, h_P), 1)  # [batch_size, 2 * state_size]

             if t == 0:
-                AnsPtr_state = self.AnsPtr_cell.zero_state(self.options['batch_size'], dtype=tf.float32)
+                AnsPtr_state = self.AnsPtr_cell.zero_state(opts['batch_size'], dtype=tf.float32)
             h_a, _ = self.AnsPtr_cell(c_t, (AnsPtr_state, r_Q))
             h_a = h_a[1]
             print(h_a)
@@ -234,7 +251,7 @@ def build_model(self):
         loss = loss_si + loss_ei
         """

-        batch_idx = tf.reshape(tf.range(0, self.options['batch_size']), [-1, 1])
+        batch_idx = tf.reshape(tf.range(0, opts['batch_size']), [-1, 1])
         answer_si_re = tf.reshape(answer_si_idx, [-1, 1])
         batch_idx_si = tf.concat([batch_idx, answer_si_re], 1)
         answer_ei_re = tf.reshape(answer_ei_idx, [-1, 1])
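The index pairs built above are presumably consumed by the elided lines that follow, which gather each example's predicted probability at the gold start and end positions to form the loss; a hedged sketch of that pattern (the elided code may differ in reduction or smoothing):

    batch_idx_ei = tf.concat([batch_idx, answer_ei_re], 1)
    # pick p1[b, answer_si_idx[b]] and p2[b, answer_ei_idx[b]] for every row b
    loss_si = -tf.reduce_mean(tf.log(tf.gather_nd(p1, batch_idx_si) + 1e-8))
    loss_ei = -tf.reduce_mean(tf.log(tf.gather_nd(p2, batch_idx_ei) + 1e-8))
    loss = loss_si + loss_ei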
@@ -245,26 +262,26 @@ def build_model(self):

         # Search
         prob = []
-        search_range = self.options['p_length'] - self.options['span_length']
+        search_range = opts['p_length'] - opts['span_length']
         for i in range(search_range):
-            for j in range(self.options['span_length']):
+            for j in range(opts['span_length']):
                 prob.append(tf.multiply(p1[:, i], p2[:, i + j]))
         prob = tf.stack(prob, axis=1)
         argmax_idx = tf.argmax(prob, axis=1)
-        pred_si = argmax_idx / self.options['span_length']
-        pred_ei = pred_si + tf.cast(tf.mod(argmax_idx, self.options['span_length']), tf.float64)
+        pred_si = argmax_idx / opts['span_length']
+        pred_ei = pred_si + tf.cast(tf.mod(argmax_idx, opts['span_length']), tf.float64)
         correct = tf.logical_and(tf.equal(tf.cast(pred_si, tf.int64), tf.cast(answer_si_idx, tf.int64)),
                                  tf.equal(tf.cast(pred_ei, tf.int64), tf.cast(answer_ei_idx, tf.int64)))
         accuracy = tf.reduce_mean(tf.cast(correct, tf.float32))

         input_tensors = {
             'p': paragraph,
             'q': question,
-            'pc': paragraph_c,
-            'qc': question_c,
             'a_si': answer_si,
             'a_ei': answer_ei,
         }
+        if opts['char_emb']:
+            input_tensors.update({'pc': paragraph_c, 'qc': question_c})

         print('Model built')
         for v in tf.global_variables():
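For reference, entry k of the flattened prob tensor built by the search loop corresponds to start i = k // span_length and end i + (k % span_length), which is exactly what the pred_si and pred_ei lines recover (in Python 3, // rather than / would keep pred_si integral). The same arithmetic outside the graph, assuming span_length = 5 purely for illustration:

    span_length = 5          # assumed value for illustration
    k = 23                   # index returned by argmax over the flattened (start, offset) grid
    pred_si = k // span_length             # 4  -> answer starts at token 4
    pred_ei = pred_si + k % span_length    # 7  -> answer ends at token 7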