bigfreecoder
diff --git a/‎.gitignore
Lines changed: 1 addition & 1 deletion b/‎.gitignore
Lines changed: 1 addition & 1 deletion
diff --git a/‎__pycache__/models.cpython-36.pyc
287 Bytes b/‎__pycache__/models.cpython-36.pyc
287 Bytes
diff --git a/‎models.py
Lines changed: 19 additions & 11 deletions b/‎models.py
Lines changed: 19 additions & 11 deletions
diff --git a/‎run.py
Lines changed: 5 additions & 1 deletion b/‎run.py
Lines changed: 5 additions & 1 deletion
diff --git a/‎run_test_ConvMF.sh renamed to ‎run_ConvMF.sh
Lines changed: 4 additions & 2 deletions b/‎run_test_ConvMF.sh renamed to ‎run_ConvMF.sh
Lines changed: 4 additions & 2 deletions
diff --git a/‎run_test_preprocess.sh renamed to ‎run_preprocess.sh
Lines changed: 3 additions & 3 deletions b/‎run_test_preprocess.sh renamed to ‎run_preprocess.sh
Lines changed: 3 additions & 3 deletions
diff --git a/‎text_analysis/__pycache__/models.cpython-36.pyc
-4.02 KB b/‎text_analysis/__pycache__/models.cpython-36.pyc
-4.02 KB
diff --git a/‎text_analysis/cnn_model.py
Lines changed: 17 additions & 42 deletions b/‎text_analysis/cnn_model.py
Lines changed: 17 additions & 42 deletions
diff --git a/‎text_analysis/models.py
Lines changed: 0 additions & 144 deletions b/‎text_analysis/models.py
Lines changed: 0 additions & 144 deletions
diff --git a/‎text_analysis/models.pyc
-5.1 KB b/‎text_analysis/models.pyc
-5.1 KB
@@ -1,6 +1,6 @@
 *.pyc
 data/
+.data/
 .idea/
 result/
-venv/
 .ipynb_checkpoints/
@@ -16,11 +16,13 @@
 2、batch
 3、give_item_weight到底是做什么用的
 4、模型中seed的用法
+5、一些参数的设置
+6、添加cuda参数来控制是否使用GPU
 '''
 
 
 def ConvMF(res_dir, train_user, train_item, valid_user, test_user,
-           R, CNN_X, vocab_size, init_W=None, give_item_weight=True,
+           R, CNN_X, vocab_size, if_cuda, init_W=None, give_item_weight=True,
            max_iter=50, lambda_u=1, lambda_v=100, dimension=50,
            dropout_rate=0.2, emb_dim=200, max_len=300, num_kernel_per_ws=100):
     # explicit setting
@@ -40,7 +42,6 @@ def ConvMF(res_dir, train_user, train_item, valid_user, test_user,
     Test_R = test_user[1]
     Valid_R = valid_user[1]
 
-    # 这一部分到底是做什么用的
     if give_item_weight is True:
         item_weight = np.array([math.sqrt(len(i))
                                 for i in Train_R_J], dtype=float)
@@ -49,15 +50,18 @@ def ConvMF(res_dir, train_user, train_item, valid_user, test_user,
         item_weight = np.ones(num_item, dtype=float)
 
     pre_val_eval = 1e10
+    best_tr_eval, best_val_eval, best_te_eval = 1e10, 1e10, 1e10
 
     # dimension: 用户和物品的隐特征维数
     # emb_dim: 词向量的维数
+    # if_cuda: 是否用GPU训练CNN
     cnn_module = CNN(dimension, vocab_size, dropout_rate,
-                     emb_dim, max_len, num_kernel_per_ws, init_W)
+                     emb_dim, max_len, num_kernel_per_ws, if_cuda, init_W)
 
-    # return the output of CNN
+    # 返回CNN的output
     # size of V is (num_item, dimension)
-    cnn_module = cnn_module.cuda()
+    if if_cuda:
+        cnn_module = cnn_module.cuda()
     theta = cnn_module.get_projection_layer(CNN_X)
     U = np.random.uniform(size=(num_user, dimension))
     V = theta
@@ -104,7 +108,6 @@ def ConvMF(res_dir, train_user, train_item, valid_user, test_user,
             sub_loss[j] = sub_loss[j] - 0.5 * np.dot(V[j].dot(tmp_A), V[j])
 
         loss = loss + np.sum(sub_loss)
-        seed = np.random.randint(100000)
 
         # 用V训练CNN模型，更新V
         cnn_module.train(CNN_X, V)
@@ -126,9 +129,10 @@ def ConvMF(res_dir, train_user, train_item, valid_user, test_user,
         # 计算Loss下降率
         converge = abs((loss - PREV_LOSS) / PREV_LOSS)
 
-        # 存储模型参数
+        # 存储效果最好的模型参数
         if val_eval < pre_val_eval:
-            # cnn_module.save_model(res_dir + '/CNN_weights.hdf5')
+            torch.save(cnn_module, res_dir+'CNN_model.pt')
+            best_tr_eval, best_val_eval, best_te_eval = tr_eval, val_eval, te_eval
             np.savetxt(res_dir + '/U.dat', U)
             np.savetxt(res_dir + '/V.dat', V)
             np.savetxt(res_dir + '/theta.dat', theta)
@@ -137,13 +141,17 @@ def ConvMF(res_dir, train_user, train_item, valid_user, test_user,
 
         pre_val_eval = val_eval
 
-        print("Elpased: %.4fs Converge: %.6f Tr: %.5f Val: %.5f Te: %.5f" % (
-             elapsed, converge, tr_eval, val_eval, te_eval))
-        f1.write("Elpased: %.4fs Converge: %.6f Tr: %.5f Val: %.5f Te: %.5f\n" % (
+        print("Elpased: %.4fs Converge: %.6f Train: %.5f Valid: %.5f Test: %.5f" % (
+            elapsed, converge, tr_eval, val_eval, te_eval))
+        f1.write("Elpased: %.4fs Converge: %.6f Train: %.5f Valid: %.5f Test: %.5f\n" % (
             elapsed, converge, tr_eval, val_eval, te_eval))
 
         # 超过五次则退出迭代训练
         if count == endure_count:
+            print("\n\nBest Model: Train: %.5f Valid: %.5f Test: %.5f" % (
+                best_tr_eval, best_val_eval, best_te_eval))
+            f1.write("\n\nBest Model: Train: %.5f Valid: %.5f Test: %.5f\n" % (
+                best_tr_eval, best_val_eval, best_te_eval))
             break
 
         PREV_LOSS = loss
 
@@ -35,6 +35,8 @@
 parser.add_argument("-a", "--aux_path", type=str, help="Path to R, D_all sets")
 
 # Option for running ConvMF
+parser.add_argument("-cu", "--if_cuda", type=bool,
+                    help="if use GPU to train in pytorch", default=False)
 parser.add_argument("-o", "--res_dir", type=str,
                     help="Path to ConvMF's result")
 parser.add_argument("-e", "--emb_dim", type=int,
@@ -110,6 +112,7 @@
     print("\t aux path - %s" % aux_path)
     print("\t data path - %s" % data_path)
     print("\t result path - %s" % res_dir)
+    print("\t if cuda - %s" % args.if_cuda)
     print("\t pretrained w2v data path - %s" % pretrain_w2v)
     print("\t dimension: %d\n\t lambda_u: %.4f\n\t lambda_v: %.4f\n\t max_iter: %d\n\t num_kernel_per_ws: %d" %
           (dimension, lambda_u, lambda_v, max_iter, num_kernel_per_ws))
@@ -147,4 +150,5 @@
     ConvMF(max_iter=max_iter, res_dir=res_dir,
            lambda_u=lambda_u, lambda_v=lambda_v, dimension=dimension, vocab_size=vocab_size, init_W=init_W,
            give_item_weight=give_item_weight, CNN_X=input_array, emb_dim=emb_dim, num_kernel_per_ws=num_kernel_per_ws,
-           train_user=train_user, train_item=train_item, valid_user=valid_user, test_user=test_user, R=R)
+           train_user=train_user, train_item=train_item, valid_user=valid_user, test_user=test_user, R=R,
+           if_cuda=args.if_cuda)
@@ -1,11 +1,13 @@
 #!/usr/bin/env bash
 python ./run.py \
+-cu True \
 -d ./data/preprocessed/ml-1m/0.2/ \
 -a ./data/preprocessed/ml-1m/ \
 -o ./result/ml-1m/1_100_200 \
 -e 50 \
--u 10 \
--v 100 \
+-u 100 \
+-v 10 \
+-w 100 \
 -g True
 
 
 
@@ -1,8 +1,8 @@
 #!/usr/bin/env bash
 python ./run.py \
--d ./data/preprocessed/ml-1m/0.2/ \
--a ./data/preprocessed/ml-1m/ \
 -c True \
 -r ./data/movielens/ml-1m_ratings.dat \
 -i ./data/movielens/ml_plot.dat \
--m 1
+-m 1 \
+-d ./data/preprocessed/ml-1m/0.2/ \
+-a ./data/preprocessed/ml-1m/ 
@@ -1,6 +1,6 @@
 # coding:utf-8
 
-# Pytorch
+# 导入Pytorch相关模块
 import torch
 import torch.nn as nn
 import torch.nn.functional as F
@@ -14,13 +14,14 @@ class CNN(nn.Module):
     # More than this epoch cause easily over-fitting on our data sets
     nb_epoch = 5
 
-    def __init__(self, output_dimesion, vocab_size, dropout_rate, emb_dim, max_len, n_filters, init_W=None):
+    def __init__(self, output_dimesion, vocab_size, dropout_rate, emb_dim, max_len, n_filters, if_cuda, init_W=None):
         # n_filter为卷积核个数
         super(CNN, self).__init__()
 
         self.max_len = max_len
         self.emb_dim = emb_dim
-        vanila_dimension = 200  # 倒数第二层的节点数
+        self.if_cuda = if_cuda
+        vanila_dimension = 2*n_filters  # 倒数第二层的节点数
         projection_dimension = output_dimesion  # 输出层的节点数
         self.qual_conv_set = {}
 
@@ -49,13 +50,10 @@ def __init__(self, output_dimesion, vocab_size, dropout_rate, emb_dim, max_len,
         )
 
         '''Dropout Layer'''
-        # layer = Dense(vanila_dimension, activation='tanh')(flatten_layer)
-        # layer = Dropout(dropout_rate)(layer)
-        self.layer = nn.Linear(300, vanila_dimension)
+        self.layer = nn.Linear(n_filters*3, vanila_dimension)
         self.dropout = nn.Dropout(dropout_rate)
 
         '''Projection Layer & Output Layer'''
-        # output_layer = Dense(projection_dimension, activation='tanh')(layer)
         self.output_layer = nn.Linear(vanila_dimension, projection_dimension)
 
     def forward(self, inputs):
@@ -82,19 +80,23 @@ def train(self, X_train, V):
         optimizer = torch.optim.Adam(self.parameters(), lr=0.001)
 
         for epoch in range(1, self.nb_epoch + 1):
-
-            print('<---epoch' + str(epoch))
             n_batch = len(X_train) // self.batch_size
 
             # 这里会漏掉一些训练集，先这样写
-            for i in range(n_batch):
+            for i in range(n_batch+1):
                 begin_idx, end_idx = i * self.batch_size, (i + 1) * self.batch_size
-                feature = X_train[begin_idx:end_idx][...]
-                target = V[begin_idx:end_idx][...]
+
+                if i<n_batch:
+                    feature = X_train[begin_idx:end_idx][...]
+                    target = V[begin_idx:end_idx][...]
+                else:
+                    feature = X_train[begin_idx:][...]
+                    target = V[begin_idx:][...]
 
                 feature = Variable(torch.from_numpy(feature.astype('int64')).long())
                 target = Variable(torch.from_numpy(target))
-                feature, target = feature.cuda(), target.cuda()
+                if self.if_cuda:
+                    feature, target = feature.cuda(), target.cuda()
 
                 optimizer.zero_grad()
                 logit = self(feature)
@@ -105,34 +107,7 @@ def train(self, X_train, V):
 
     def get_projection_layer(self, X_train):
         inputs = Variable(torch.from_numpy(X_train.astype('int64')).long())
-        inputs = inputs.cuda()
+        if self.if_cuda:
+            inputs = inputs.cuda()
         outputs = self(inputs)
         return outputs.cpu().data.numpy()
-
-
-    # 获取CNN模型的输出
-
-    # def train(self, X_train, V, item_weight, seed):
-    #     # X_train is CNN_X
-    #     X_train = sequence.pad_sequences(X_train, maxlen=self.max_len)
-    #     np.random.seed(seed)
-    #     X_train = np.random.permutation(X_train)
-    #     np.random.seed(seed)
-    #     V = np.random.permutation(V)ojecti
-    #     np.random.seed(seed)
-    #     item_weight = np.random.permutation(item_weight)
-    #
-    #     print("Train...CNN module")
-    #     history = self.model.fit(X_train, V, verbose=0, batch_size=self.batch_size,
-    #                              epochs=self.nb_epoch, sample_weight=item_weight)
-    #
-    #     # cnn_loss_his = history.history['loss']
-    #     # cmp_cnn_loss = sorted(cnn_loss_his)[::-1]
-    #     # if cnn_loss_his != cmp_cnn_loss:
-    #     #     self.nb_epoch = 1
-    #     return history
-    #
-    # def get_projection_layer(self, X_train):
-    #     X_train = sequence.pad_sequences(X_train, maxlen=self.max_len)
-    #     Y = self.model.predict(X_train, batch_size=len(X_train))
-    #     return Y
-Original file line number
+Diff line change
@@ @@ -1,6 +1,6 @@ @@
 *.pyc
 data/
 +.data/
 .idea/
 result/
 -venv/
 .ipynb_checkpoints/