commit 710220adbe by waynesun, 4 years ago

+ 5 - 9
sqlnet/model/modules/aggregator_predict.py

@@ -4,7 +4,7 @@ import torch.nn as nn
 import torch.nn.functional as F
 from torch.autograd import Variable
 import numpy as np
-from net_utils import run_lstm, col_name_encode
+from sqlnet.model.modules.net_utils import run_lstm, col_name_encode
 
 
 
@@ -13,17 +13,13 @@ class AggPredictor(nn.Module):
         super(AggPredictor, self).__init__()
         self.use_ca = use_ca
 
-        self.agg_lstm = nn.LSTM(input_size=N_word, hidden_size=N_h/2,
-                num_layers=N_depth, batch_first=True,
-                dropout=0.3, bidirectional=True)
+        self.agg_lstm = nn.LSTM(input_size=N_word, hidden_size=int(N_h/2), num_layers=N_depth, batch_first=True, dropout=0.3, bidirectional=True)
         if use_ca:
-            print "Using column attention on aggregator predicting"
-            self.agg_col_name_enc = nn.LSTM(input_size=N_word,
-                    hidden_size=N_h/2, num_layers=N_depth,
-                    batch_first=True, dropout=0.3, bidirectional=True)
+            print ("Using column attention on aggregator predicting")
+            self.agg_col_name_enc = nn.LSTM(input_size=N_word, hidden_size=int(N_h/2), num_layers=N_depth, batch_first=True, dropout=0.3, bidirectional=True)
             self.agg_att = nn.Linear(N_h, N_h)
         else:
-            print "Not using column attention on aggregator predicting"
+            print ("Not using column attention on aggregator predicting")
             self.agg_att = nn.Linear(N_h, 1)
         self.agg_out = nn.Sequential(nn.Linear(N_h, N_h), nn.Tanh(), nn.Linear(N_h, 6))
         self.softmax = nn.Softmax(dim=-1)
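
For context on the int(N_h/2) wrapping that recurs throughout these hunks: under Python 3, / is true division, so N_h/2 is a float and is rejected by nn.LSTM, which expects an integer hidden_size. A minimal sketch of the pattern, with illustrative sizes (not taken from the repo):

import torch.nn as nn

# Illustrative sizes only; N_h // 2 equals int(N_h / 2) for positive N_h.
N_word, N_h, N_depth = 300, 100, 2
lstm = nn.LSTM(input_size=N_word, hidden_size=N_h // 2,
               num_layers=N_depth, batch_first=True,
               dropout=0.3, bidirectional=True)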

+ 10 - 13
sqlnet/model/modules/select_number.py

@@ -4,7 +4,8 @@ import torch.nn as nn
 import torch.nn.functional as F
 from torch.autograd import Variable
 import numpy as np
-from net_utils import run_lstm, col_name_encode
+
+from sqlnet.model.modules.net_utils import run_lstm, col_name_encode
 
 class SelNumPredictor(nn.Module):
     def __init__(self, N_word, N_h, N_depth, use_ca):
@@ -12,20 +13,18 @@ class SelNumPredictor(nn.Module):
         self.N_h = N_h
         self.use_ca = use_ca
 
-        self.sel_num_lstm = nn.LSTM(input_size=N_word, hidden_size=N_h/2,
-                                    num_layers=N_depth, batch_first=True,
-                                    dropout=0.3, bidirectional=True)
+        self.sel_num_lstm = nn.LSTM(input_size=N_word, hidden_size=int(N_h/2), num_layers=N_depth, batch_first=True, dropout=0.3, bidirectional=True)
+
         self.sel_num_att = nn.Linear(N_h, 1)
         self.sel_num_col_att = nn.Linear(N_h, 1)
-        self.sel_num_out = nn.Sequential(nn.Linear(N_h, N_h),
-                                         nn.Tanh(), nn.Linear(N_h,4))
+        self.sel_num_out = nn.Sequential(nn.Linear(N_h, N_h), nn.Tanh(), nn.Linear(N_h,4))
         self.softmax = nn.Softmax(dim=-1)
         self.sel_num_col2hid1 = nn.Linear(N_h, 2 * N_h)
         self.sel_num_col2hid2 = nn.Linear(N_h, 2 * N_h)
 
 
         if self.use_ca:
-            print "Using column attention on select number predicting"
+            print ("Using column attention on select number predicting")
 
     def forward(self, x_emb_var, x_len, col_inp_var, col_name_len, col_len, col_num):
         B = len(x_len)
@@ -42,11 +41,10 @@ class SelNumPredictor(nn.Module):
                 num_col_att_val[idx, num:] = -1000000
         num_col_att = self.softmax(num_col_att_val)
         K_num_col = (e_num_col * num_col_att.unsqueeze(2)).sum(1)
-        sel_num_h1 = self.sel_num_col2hid1(K_num_col).view(B, 4, self.N_h/2).transpose(0,1).contiguous()
-        sel_num_h2 = self.sel_num_col2hid2(K_num_col).view(B, 4, self.N_h/2).transpose(0,1).contiguous()
+        sel_num_h1 = self.sel_num_col2hid1(K_num_col).view((B, 4, self.N_h//2)).transpose(0,1).contiguous()
+        sel_num_h2 = self.sel_num_col2hid2(K_num_col).view((B, 4, self.N_h//2)).transpose(0,1).contiguous()
 
-        h_num_enc, _ = run_lstm(self.sel_num_lstm, x_emb_var, x_len,
-                                hidden=(sel_num_h1, sel_num_h2))
+        h_num_enc, _ = run_lstm(self.sel_num_lstm, x_emb_var, x_len,hidden=(sel_num_h1, sel_num_h2))
 
         num_att_val = self.sel_num_att(h_num_enc).squeeze()
         for idx, num in enumerate(x_len):
@@ -54,8 +52,7 @@ class SelNumPredictor(nn.Module):
                 num_att_val[idx, num:] = -1000000
         num_att = self.softmax(num_att_val)
 
-        K_sel_num = (h_num_enc * num_att.unsqueeze(2).expand_as(
-            h_num_enc)).sum(1)
+        K_sel_num = (h_num_enc * num_att.unsqueeze(2).expand_as(h_num_enc)).sum(1)
         sel_num_score = self.sel_num_out(K_sel_num)
         return sel_num_score
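
The view(B, 4, self.N_h//2).transpose(0,1) lines build the initial hidden and cell states that run_lstm hands to the bidirectional, two-layer LSTM from the attention-pooled column encoding. A minimal sketch with assumed shapes (the factor 4 is num_layers * num_directions = 2 * 2; names and sizes are illustrative, not lifted from the repo):

import torch
import torch.nn as nn

B, N_h = 8, 100
K_num_col = torch.randn(B, N_h)          # attention-weighted column summary, (B, N_h)
col2hid1 = nn.Linear(N_h, 2 * N_h)
col2hid2 = nn.Linear(N_h, 2 * N_h)

# Each of the 4 (layer, direction) slots gets an N_h // 2-dimensional initial state.
h0 = col2hid1(K_num_col).view(B, 4, N_h // 2).transpose(0, 1).contiguous()
c0 = col2hid2(K_num_col).view(B, 4, N_h // 2).transpose(0, 1).contiguous()
print(h0.shape)   # torch.Size([4, 8, 50]) -> (num_layers * num_directions, B, hidden)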
 

+ 5 - 9
sqlnet/model/modules/selection_predict.py

@@ -4,25 +4,21 @@ import torch.nn as nn
 import torch.nn.functional as F
 from torch.autograd import Variable
 import numpy as np
-from net_utils import run_lstm, col_name_encode
+from sqlnet.model.modules.net_utils import run_lstm, col_name_encode
 
 class SelPredictor(nn.Module):
     def __init__(self, N_word, N_h, N_depth, max_tok_num, use_ca):
         super(SelPredictor, self).__init__()
         self.use_ca = use_ca
         self.max_tok_num = max_tok_num
-        self.sel_lstm = nn.LSTM(input_size=N_word, hidden_size=N_h/2,
-                num_layers=N_depth, batch_first=True,
-                dropout=0.3, bidirectional=True)
+        self.sel_lstm = nn.LSTM(input_size=N_word, hidden_size=int(N_h/2), num_layers=N_depth, batch_first=True, dropout=0.3, bidirectional=True)
         if use_ca:
-            print "Using column attention on selection predicting"
+            print ("Using column attention on selection predicting")
             self.sel_att = nn.Linear(N_h, N_h)
         else:
-            print "Not using column attention on selection predicting"
+            print ("Not using column attention on selection predicting")
             self.sel_att = nn.Linear(N_h, 1)
-        self.sel_col_name_enc = nn.LSTM(input_size=N_word, hidden_size=N_h/2,
-                num_layers=N_depth, batch_first=True,
-                dropout=0.3, bidirectional=True)
+        self.sel_col_name_enc = nn.LSTM(input_size=N_word, hidden_size=int(N_h/2), num_layers=N_depth, batch_first=True, dropout=0.3, bidirectional=True)
         self.sel_out_K = nn.Linear(N_h, N_h)
         self.sel_out_col = nn.Linear(N_h, N_h)
         self.sel_out = nn.Sequential(nn.Tanh(), nn.Linear(N_h, 1))

+ 16 - 36
sqlnet/model/modules/sqlnet_condition_predict.py

@@ -4,7 +4,7 @@ import torch.nn as nn
 import torch.nn.functional as F
 from torch.autograd import Variable
 import numpy as np
-from net_utils import run_lstm, col_name_encode
+from sqlnet.model.modules.net_utils import run_lstm, col_name_encode
 
 class SQLNetCondPredictor(nn.Module):
     def __init__(self, N_word, N_h, N_depth, max_col_num, max_tok_num, use_ca, gpu):
@@ -15,59 +15,41 @@ class SQLNetCondPredictor(nn.Module):
         self.gpu = gpu
         self.use_ca = use_ca
 
-        self.cond_num_lstm = nn.LSTM(input_size=N_word, hidden_size=N_h/2,
-                num_layers=N_depth, batch_first=True,
-                dropout=0.3, bidirectional=True)
+        self.cond_num_lstm = nn.LSTM(input_size=N_word, hidden_size=int(N_h/2), num_layers=N_depth, batch_first=True, dropout=0.3, bidirectional=True)
         self.cond_num_att = nn.Linear(N_h, 1)
         self.cond_num_out = nn.Sequential(nn.Linear(N_h, N_h),
                 nn.Tanh(), nn.Linear(N_h, 5))
-        self.cond_num_name_enc = nn.LSTM(input_size=N_word, hidden_size=N_h/2,
-                num_layers=N_depth, batch_first=True,
-                dropout=0.3, bidirectional=True)
+        self.cond_num_name_enc = nn.LSTM(input_size=N_word, hidden_size=int(N_h/2), num_layers=N_depth, batch_first=True, dropout=0.3, bidirectional=True)
         self.cond_num_col_att = nn.Linear(N_h, 1)
         self.cond_num_col2hid1 = nn.Linear(N_h, 2*N_h)
         self.cond_num_col2hid2 = nn.Linear(N_h, 2*N_h)
 
-        self.cond_col_lstm = nn.LSTM(input_size=N_word, hidden_size=N_h/2,
-                num_layers=N_depth, batch_first=True,
-                dropout=0.3, bidirectional=True)
+        self.cond_col_lstm = nn.LSTM(input_size=N_word, hidden_size=int(N_h/2), num_layers=N_depth, batch_first=True, dropout=0.3, bidirectional=True)
         if use_ca:
-            print "Using column attention on where predicting"
+            print ("Using column attention on where predicting")
             self.cond_col_att = nn.Linear(N_h, N_h)
         else:
-            print "Not using column attention on where predicting"
+            print ("Not using column attention on where predicting")
             self.cond_col_att = nn.Linear(N_h, 1)
-        self.cond_col_name_enc = nn.LSTM(input_size=N_word, hidden_size=N_h/2,
-                num_layers=N_depth, batch_first=True,
-                dropout=0.3, bidirectional=True)
+        self.cond_col_name_enc = nn.LSTM(input_size=N_word, hidden_size=int(N_h/2), num_layers=N_depth, batch_first=True, dropout=0.3, bidirectional=True)
         self.cond_col_out_K = nn.Linear(N_h, N_h)
         self.cond_col_out_col = nn.Linear(N_h, N_h)
         self.cond_col_out = nn.Sequential(nn.ReLU(), nn.Linear(N_h, 1))
 
-        self.cond_op_lstm = nn.LSTM(input_size=N_word, hidden_size=N_h/2,
-                num_layers=N_depth, batch_first=True,
-                dropout=0.3, bidirectional=True)
+        self.cond_op_lstm = nn.LSTM(input_size=N_word, hidden_size=int(N_h/2), num_layers=N_depth, batch_first=True, dropout=0.3, bidirectional=True)
         if use_ca:
             self.cond_op_att = nn.Linear(N_h, N_h)
         else:
             self.cond_op_att = nn.Linear(N_h, 1)
         self.cond_op_out_K = nn.Linear(N_h, N_h)
-        self.cond_op_name_enc = nn.LSTM(input_size=N_word, hidden_size=N_h/2,
-                num_layers=N_depth, batch_first=True,
-                dropout=0.3, bidirectional=True)
+        self.cond_op_name_enc = nn.LSTM(input_size=N_word, hidden_size=int(N_h/2), num_layers=N_depth, batch_first=True, dropout=0.3, bidirectional=True)
         self.cond_op_out_col = nn.Linear(N_h, N_h)
         self.cond_op_out = nn.Sequential(nn.Linear(N_h, N_h), nn.Tanh(),
                 nn.Linear(N_h, 4))
 
-        self.cond_str_lstm = nn.LSTM(input_size=N_word, hidden_size=N_h/2,
-                num_layers=N_depth, batch_first=True,
-                dropout=0.3, bidirectional=True)
-        self.cond_str_decoder = nn.LSTM(input_size=self.max_tok_num,
-                hidden_size=N_h, num_layers=N_depth,
-                batch_first=True, dropout=0.3)
-        self.cond_str_name_enc = nn.LSTM(input_size=N_word, hidden_size=N_h/2,
-                num_layers=N_depth, batch_first=True,
-                dropout=0.3, bidirectional=True)
+        self.cond_str_lstm = nn.LSTM(input_size=N_word, hidden_size=int(N_h/2), num_layers=N_depth, batch_first=True, dropout=0.3, bidirectional=True)
+        self.cond_str_decoder = nn.LSTM(input_size=self.max_tok_num, hidden_size=N_h, num_layers=N_depth, batch_first=True, dropout=0.3)
+        self.cond_str_name_enc = nn.LSTM(input_size=N_word, hidden_size=int(N_h/2), num_layers=N_depth, batch_first=True, dropout=0.3, bidirectional=True)
         self.cond_str_out_g = nn.Linear(N_h, N_h)
         self.cond_str_out_h = nn.Linear(N_h, N_h)
         self.cond_str_out_col = nn.Linear(N_h, N_h)
@@ -78,7 +60,7 @@ class SQLNetCondPredictor(nn.Module):
 
     def gen_gt_batch(self, split_tok_seq):
         B = len(split_tok_seq)
-        max_len = max([max([len(tok) for tok in tok_seq]+[0]) for 
+        max_len = max([max([len(tok) for tok in tok_seq]+[0]) for
             tok_seq in split_tok_seq]) - 1 # The max seq len in the batch.
         if max_len < 1:
             max_len = 1
@@ -121,10 +103,8 @@ class SQLNetCondPredictor(nn.Module):
                 num_col_att_val[idx, num:] = -100
         num_col_att = self.softmax(num_col_att_val)
         K_num_col = (e_num_col * num_col_att.unsqueeze(2)).sum(1)
-        cond_num_h1 = self.cond_num_col2hid1(K_num_col).view(
-                B, 4, self.N_h/2).transpose(0, 1).contiguous()
-        cond_num_h2 = self.cond_num_col2hid2(K_num_col).view(
-                B, 4, self.N_h/2).transpose(0, 1).contiguous()
+        cond_num_h1 = self.cond_num_col2hid1(K_num_col).view(B, 4, self.N_h//2).transpose(0, 1).contiguous()
+        cond_num_h2 = self.cond_num_col2hid2(K_num_col).view(B, 4, self.N_h//2).transpose(0, 1).contiguous()
 
         h_num_enc, _ = run_lstm(self.cond_num_lstm, x_emb_var, x_len,
                 hidden=(cond_num_h1, cond_num_h2))
@@ -185,7 +165,7 @@ class SQLNetCondPredictor(nn.Module):
         h_op_enc, _ = run_lstm(self.cond_op_lstm, x_emb_var, x_len)
         col_emb = []
         for b in range(B):
-            cur_col_emb = torch.stack([e_cond_col[b, x] 
+            cur_col_emb = torch.stack([e_cond_col[b, x]
                 for x in chosen_col_gt[b]] + [e_cond_col[b, 0]] *
                 (4 - len(chosen_col_gt[b])))  # Pad the columns to maximum (4)
             col_emb.append(cur_col_emb)
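
The N_h-by-N_h attention layers that appear when use_ca is set (cond_col_att, agg_att, sel_att) implement SQLNet's column attention: each column name attends over the encoded question to produce a column-conditioned question summary. A minimal sketch of that pattern, with illustrative shapes and names (not lifted from the repo):

import torch
import torch.nn as nn

B, L, C, N_h = 8, 20, 5, 100
h_enc = torch.randn(B, L, N_h)           # question tokens encoded by a BiLSTM
e_col = torch.randn(B, C, N_h)           # column-name encodings (col_name_encode)
col_att = nn.Linear(N_h, N_h)

att_val = torch.bmm(e_col, col_att(h_enc).transpose(1, 2))    # (B, C, L)
# padded question positions would be masked with a large negative value here
att_prob = torch.softmax(att_val, dim=-1)                     # (B, C, L)
K_col = (h_enc.unsqueeze(1) * att_prob.unsqueeze(3)).sum(2)   # (B, C, N_h)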

+ 5 - 7
sqlnet/model/modules/where_relation.py

@@ -4,7 +4,7 @@ import torch.nn as nn
 import torch.nn.functional as F
 from torch.autograd import Variable
 import numpy as np
-from net_utils import run_lstm, col_name_encode
+from sqlnet.model.modules.net_utils import run_lstm, col_name_encode
 
 class WhereRelationPredictor(nn.Module):
     def __init__(self, N_word, N_h, N_depth, use_ca):
@@ -12,9 +12,7 @@ class WhereRelationPredictor(nn.Module):
         self.N_h = N_h
         self.use_ca = use_ca
 
-        self.where_rela_lstm = nn.LSTM(input_size=N_word, hidden_size=N_h/2,
-                                    num_layers=N_depth, batch_first=True,
-                                    dropout=0.3, bidirectional=True)
+        self.where_rela_lstm = nn.LSTM(input_size=N_word, hidden_size=int(N_h/2), num_layers=N_depth, batch_first=True, dropout=0.3, bidirectional=True)
         self.where_rela_att = nn.Linear(N_h, 1)
         self.where_rela_col_att = nn.Linear(N_h, 1)
         self.where_rela_out = nn.Sequential(nn.Linear(N_h, N_h), nn.Tanh(), nn.Linear(N_h,3))
@@ -23,7 +21,7 @@ class WhereRelationPredictor(nn.Module):
         self.col2hid2 = nn.Linear(N_h, 2 * N_h)
 
         if self.use_ca:
-            print "Using column attention on where relation predicting"
+            print ("Using column attention on where relation predicting")
 
     def forward(self, x_emb_var, x_len, col_inp_var, col_name_len, col_len, col_num):
         B = len(x_len)
@@ -40,8 +38,8 @@ class WhereRelationPredictor(nn.Module):
                 col_att_val[idx, num:] = -1000000
         num_col_att = self.softmax(col_att_val)
         K_num_col = (e_num_col * num_col_att.unsqueeze(2)).sum(1)
-        h1 = self.col2hid1(K_num_col).view(B, 4, self.N_h/2).transpose(0,1).contiguous()
-        h2 = self.col2hid2(K_num_col).view(B, 4, self.N_h/2).transpose(0,1).contiguous()
+        h1 = self.col2hid1(K_num_col).view(B, 4, self.N_h//2).transpose(0,1).contiguous()
+        h2 = self.col2hid2(K_num_col).view(B, 4, self.N_h//2).transpose(0,1).contiguous()
 
         h_enc, _ = run_lstm(self.where_rela_lstm, x_emb_var, x_len, hidden=(h1, h2))
 

+ 13 - 22
sqlnet/model/modules/word_embedding.py

@@ -15,15 +15,14 @@ class WordEmbedding(nn.Module):
         self.SQL_TOK = SQL_TOK
 
         if trainable:
-            print "Using trainable embedding"
+            print ("Using trainable embedding")
             self.w2i, word_emb_val = word_emb
             self.embedding = nn.Embedding(len(self.w2i), N_word)
             self.embedding.weight = nn.Parameter(
                     torch.from_numpy(word_emb_val.astype(np.float32)))
         else:
             self.word_emb = word_emb
-            print "Using fixed embedding"
-
+            print ("Using fixed embedding")
 
     def gen_x_batch(self, q, col):
         B = len(q)
@@ -31,24 +30,17 @@ class WordEmbedding(nn.Module):
         val_len = np.zeros(B, dtype=np.int64)
         for i, (one_q, one_col) in enumerate(zip(q, col)):
             if self.trainable:
-                q_val = map(lambda x:self.w2i.get(x, 0), one_q)
-            else:
-                q_val = map(lambda x:self.word_emb.get(x, np.zeros(self.N_word, dtype=np.float32)), one_q)
-            if self.our_model:
-                if self.trainable:
-                    val_embs.append([1] + q_val + [2])  #<BEG> and <END>
-                else:
-                    val_embs.append([np.zeros(self.N_word, dtype=np.float32)] + q_val + [np.zeros(self.N_word, dtype=np.float32)])  #<BEG> and <END>
-                val_len[i] = 1 + len(q_val) + 1
+                q_val = [self.w2i.get(x,0) for x in one_q]
+                val_embs.append([1] + q_val + [2])  #<BEG> and <END>
             else:
-                one_col_all = [x for toks in one_col for x in toks+[',']]
-                if self.trainable:
-                    col_val = map(lambda x:self.w2i.get(x, 0), one_col_all)
-                    val_embs.append( [0 for _ in self.SQL_TOK] + col_val + [0] + q_val+ [0])
-                else:
-                    col_val = map(lambda x:self.word_emb.get(x, np.zeros(self.N_word, dtype=np.float32)), one_col_all)
-                    val_embs.append( [np.zeros(self.N_word, dtype=np.float32) for _ in self.SQL_TOK] + col_val + [np.zeros(self.N_word, dtype=np.float32)] + q_val+ [np.zeros(self.N_word, dtype=np.float32)])
-                val_len[i] = len(self.SQL_TOK) + len(col_val) + 1 + len(q_val) + 1
+                # print (i)
+                # print ([x.encode('utf-8') for x in one_q])
+                q_val = [self.word_emb.get(x, np.zeros(self.N_word, dtype=np.float32)) for x in one_q]
+                # print (q_val)
+                # print ("#"*60)
+                val_embs.append([np.zeros(self.N_word, dtype=np.float32)] + q_val + [np.zeros(self.N_word, dtype=np.float32)])  #<BEG> and <END>
+            # exit(0)
+            val_len[i] = len(q_val) + 2
         max_len = max(val_len)
 
         if self.trainable:
@@ -93,8 +85,7 @@ class WordEmbedding(nn.Module):
             if self.trainable:
                 val = [self.w2i.get(x, 0) for x in one_str]
             else:
-                val = [self.word_emb.get(x, np.zeros(
-                    self.N_word, dtype=np.float32)) for x in one_str]
+                val = [self.word_emb.get(x, np.zeros(self.N_word, dtype=np.float32)) for x in one_str]
             val_embs.append(val)
             val_len[i] = len(val)
         max_len = max(val_len)
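
The map-to-list-comprehension changes in gen_x_batch are not cosmetic: under Python 3, map() returns a lazy iterator, so the old [1] + q_val + [2] concatenation and the later len(q_val) both fail. A toy sketch of the difference:

w2i = {'select': 3, 'name': 4}                    # toy vocabulary
one_q = ['select', 'name', 'from']

q_val_lazy = map(lambda x: w2i.get(x, 0), one_q)  # iterator in Python 3, list in Python 2
# [1] + q_val_lazy + [2]  and  len(q_val_lazy)    # both raise TypeError in Python 3
q_val = [w2i.get(x, 0) for x in one_q]            # list comprehension works in both
print([1] + q_val + [2])                          # [1, 3, 4, 0, 2]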

+ 20 - 17
sqlnet/model/sqlnet.py

@@ -3,12 +3,12 @@ import torch.nn as nn
 import torch.nn.functional as F
 from torch.autograd import Variable
 import numpy as np
-from modules.word_embedding import WordEmbedding
-from modules.aggregator_predict import AggPredictor
-from modules.selection_predict import SelPredictor
-from modules.sqlnet_condition_predict import SQLNetCondPredictor
-from modules.select_number import SelNumPredictor
-from modules.where_relation import WhereRelationPredictor
+from sqlnet.model.modules.word_embedding import WordEmbedding
+from sqlnet.model.modules.aggregator_predict import AggPredictor
+from sqlnet.model.modules.selection_predict import SelPredictor
+from sqlnet.model.modules.sqlnet_condition_predict import SQLNetCondPredictor
+from sqlnet.model.modules.select_number import SelNumPredictor
+from sqlnet.model.modules.where_relation import WhereRelationPredictor
 
 
 class SQLNet(nn.Module):
@@ -140,7 +140,8 @@ class SQLNet(nn.Module):
         loss = 0
 
         # Evaluate select number
-        sel_num_truth = map(lambda x:x[0], truth_num)
+        # sel_num_truth = map(lambda x:x[0], truth_num)
+        sel_num_truth = [x[0] for x in truth_num]
         sel_num_truth = torch.from_numpy(np.array(sel_num_truth))
         if self.gpu:
             sel_num_truth = Variable(sel_num_truth.cuda())
@@ -173,20 +174,21 @@ class SQLNet(nn.Module):
                 sel_agg_truth_var = Variable(data.cuda())
             else:
                 sel_agg_truth_var = Variable(data)
-            sel_agg_pred = agg_score[b, :len(truth_num[b][1])]
-            loss += (self.CE(sel_agg_pred, sel_agg_truth_var)) / len(truth_num)
+        sel_agg_pred = agg_score[b, :len(truth_num[b][1])]
+        loss += (self.CE(sel_agg_pred, sel_agg_truth_var)) / len(truth_num)
 
         cond_num_score, cond_col_score, cond_op_score, cond_str_score = cond_score
 
         # Evaluate the number of conditions
-        cond_num_truth = map(lambda x:x[3], truth_num)
+        # cond_num_truth = map(lambda x:x[3], truth_num)
+        cond_num_truth = [x[3] for x in truth_num]
         data = torch.from_numpy(np.array(cond_num_truth))
         if self.gpu:
             try:
                 cond_num_truth_var = Variable(data.cuda())
             except:
-                print "cond_num_truth_var error"
-                print data
+                print ("cond_num_truth_var error")
+                print (data)
                 exit(0)
         else:
             cond_num_truth_var = Variable(data)
@@ -224,8 +226,8 @@ class SQLNet(nn.Module):
             try:
                 loss += (self.CE(cond_op_pred, cond_op_truth_var) / len(truth_num))
             except:
-                print cond_op_pred
-                print cond_op_truth_var
+                print (cond_op_pred)
+                print (cond_op_truth_var)
                 exit(0)
 
         #Evaluate the strings of conditions
@@ -245,14 +247,15 @@ class SQLNet(nn.Module):
                         / (len(gt_where) * len(gt_where[b])))
 
         # Evaluate condition relationship, and / or
-        where_rela_truth = map(lambda x:x[6], truth_num)
+        # where_rela_truth = map(lambda x:x[6], truth_num)
+        where_rela_truth = [x[6] for x in truth_num]
         data = torch.from_numpy(np.array(where_rela_truth))
         if self.gpu:
             try:
                 where_rela_truth = Variable(data.cuda())
             except:
-                print "where_rela_truth error"
-                print data
+                print ("where_rela_truth error")
+                print (data)
                 exit(0)
         else:
             where_rela_truth = Variable(data)

+ 18 - 13
sqlnet/utils.py

@@ -1,5 +1,5 @@
 import json
-from lib.dbengine import DBEngine
+from sqlnet.lib.dbengine import DBEngine
 import numpy as np
 from tqdm import tqdm
 
@@ -12,20 +12,20 @@ def load_data(sql_paths, table_paths, use_small=False):
     table_data = {}
 
     for SQL_PATH in sql_paths:
-        with open(SQL_PATH) as inf:
+        with open(SQL_PATH, encoding='utf-8') as inf:
             for idx, line in enumerate(inf):
                 sql = json.loads(line.strip())
                 if use_small and idx >= 1000:
                     break
                 sql_data.append(sql)
-        print "Loaded %d data from %s" % (len(sql_data), SQL_PATH)
+        print ("Loaded %d data from %s" % (len(sql_data), SQL_PATH))
 
     for TABLE_PATH in table_paths:
-        with open(TABLE_PATH) as inf:
+        with open(TABLE_PATH, encoding='utf-8') as inf:
             for line in inf:
                 tab = json.loads(line.strip())
                 table_data[tab[u'id']] = tab
-        print "Loaded %d data from %s" % (len(table_data), TABLE_PATH)
+        print ("Loaded %d data from %s" % (len(table_data), TABLE_PATH))
 
     ret_sql_data = []
     for sql in sql_data:
@@ -35,7 +35,7 @@ def load_data(sql_paths, table_paths, use_small=False):
     return ret_sql_data, table_data
 
 def load_dataset(toy=False, use_small=False, mode='train'):
-    print "Loading dataset"
+    print ("Loading dataset")
     dev_sql, dev_table = load_data('data/val/val.json', 'data/val/val.tables.json', use_small=use_small)
     dev_db = 'data/val/val.db'
     if mode == 'train':
@@ -107,6 +107,7 @@ def to_batch_query(sql_data, idxes, st, ed):
 def epoch_train(model, optimizer, batch_size, sql_data, table_data):
     model.train()
     perm=np.random.permutation(len(sql_data))
+    perm = list(range(len(sql_data)))
     cum_loss = 0.0
     for st in tqdm(range(len(sql_data)//batch_size+1)):
         ed = (st+1)*batch_size if (st+1)*batch_size < len(perm) else len(perm)
@@ -173,7 +174,7 @@ def epoch_acc(model, batch_size, sql_data, table_data, db_path):
             one_err, tot_err = model.check_acc(raw_data, pred_queries, query_gt)
         except:
             badcase += 1
-            print 'badcase', badcase
+            print ('badcase', badcase)
             continue
         one_acc_num += (ed-st-one_err)
         tot_acc_num += (ed-st-tot_err)
@@ -191,10 +192,14 @@ def epoch_acc(model, batch_size, sql_data, table_data, db_path):
 
 def load_word_emb(file_name):
     print ('Loading word embedding from %s'%file_name)
-    ret = {}
-    with open(file_name) as inf:
-        for idx, line in enumerate(inf):
-            info = line.strip().split(' ')
-            if info[0].lower() not in ret:
-                ret[info[0].decode('utf-8')] = np.array(map(lambda x:float(x), info[1:]))
+    f = open(file_name)
+    ret = json.load(f)
+    f.close()
+    # ret = {}
+    # with open(file_name, encoding='latin') as inf:
+    #     ret = json.load(inf)
+    #     for idx, line in enumerate(inf):
+    #         info = line.strip().split(' ')
+    #         if info[0].lower() not in ret:
+    #             ret[info[0]] = np.array([float(x) for x in info[1:]])
     return ret
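
The rewritten load_word_emb reads the whole file with json.load instead of parsing space-separated GloVe-style lines, which implies (an assumption; the expected file format is not shown in this diff) a single JSON object mapping each token to its embedding vector. A toy sketch of writing and reading such a file; the path and tokens are hypothetical:

import json
import numpy as np

emb = {'select': [0.1, 0.2, 0.3], 'name': [0.0, 0.5, -0.1]}   # toy 3-dim vectors
with open('word_emb.json', 'w', encoding='utf-8') as f:       # hypothetical path
    json.dump(emb, f)

with open('word_emb.json') as f:                              # mirrors the new loader
    ret = json.load(f)
vec = np.array(ret.get('select', np.zeros(3, dtype=np.float32)))
print(vec.shape)   # (3,)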