@@ -136,17 +136,11 @@ def init_nodes(self):
             config.decay_rate,
             staircase=True
         )
-        if config.optimizer == "adamax":
-            print "\nUsing AdaMax Optimizer with lr: %f, decay_steps: %d, decay_rate: %f\n" \
-                % (config.learning_rate, config.decay_steps, config.decay_rate)
 
-            self.optimizer = tf.keras.optimizers.Adamax(learning_rate)
+        print "\nUsing Adam Optimizer with lr: %f, decay_steps: %d, decay_rate: %f\n" \
+            % (config.learning_rate, config.decay_steps, config.decay_rate)
 
-        else:
-            print "\nUsing Adam Optimizer with lr: %f, decay_steps: %d, decay_rate: %f\n" \
-                % (config.learning_rate, config.decay_steps, config.decay_rate)
-
-            self.optimizer = tf.train.AdamOptimizer(learning_rate)
+        self.optimizer = tf.train.AdamOptimizer(learning_rate)
 
         gradients = self.optimizer.compute_gradients(self.loss)
         clipped_gradients = [
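For context, the surviving branch is the standard TF 1.x pattern of an exponentially decayed learning rate fed into Adam. A minimal self-contained sketch of that setup follows; the `Config` class and `global_step` variable here are hypothetical stand-ins for the repo's own objects, not code from this commit:

```python
# Sketch of the post-change optimizer setup, assuming TF 1.x APIs.
import tensorflow as tf

class Config(object):
    learning_rate = 0.001  # initial Adam learning rate (illustrative value)
    decay_steps = 1000     # decay interval, in training steps
    decay_rate = 0.96      # multiplicative decay factor per interval

config = Config()

# Counter incremented once per optimizer step; drives the schedule.
global_step = tf.Variable(0, trainable=False, name="global_step")

# With staircase=True the rate drops in discrete jumps:
# lr = learning_rate * decay_rate ** floor(global_step / decay_steps)
learning_rate = tf.train.exponential_decay(
    config.learning_rate,
    global_step,
    config.decay_steps,
    config.decay_rate,
    staircase=True
)

optimizer = tf.train.AdamOptimizer(learning_rate)
```

Note that the schedule only advances if `global_step` is passed along when gradients are applied, e.g. `optimizer.apply_gradients(clipped_gradients, global_step=global_step)`.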
@@ -183,40 +177,44 @@ def predict(self, sess, dataset, msg):
         answers = []
         ground_answers = []
 
-        with tqdm(dataset, desc=msg) as pbar:
-            for batch in pbar:
-                questions_padded, questions_length = pad_sequences(
-                    batch[:, 0], config.max_question_length
-                )
-                contexts_padded, contexts_length = pad_sequences(
-                    batch[:, 1], config.max_context_length
-                )
+        if msg != None:
+            pbar = tqdm(dataset, desc=msg)
+        else:
+            pbar = dataset
 
-                labels = np.zeros(
-                    (len(batch), config.n_clusters), dtype=np.float32
-                )
-                if config.clustering:
-                    for j, el in enumerate(batch):
-                        labels[j, el[3]] = 1
-                else:
-                    labels[:, 0] = 1
+        for batch in pbar:
+            questions_padded, questions_length = pad_sequences(
+                batch[:, 0], config.max_question_length
+            )
+            contexts_padded, contexts_length = pad_sequences(
+                batch[:, 1], config.max_context_length
+            )
 
-                predictions = sess.run(
-                    self.predictions,
-                    feed_dict={
-                        self.questions_ids: questions_padded,
-                        self.questions_length: questions_length,
-                        self.questions_mask: masks(questions_length, config.max_question_length),
-                        self.contexts_ids: contexts_padded,
-                        self.contexts_length: contexts_length,
-                        self.contexts_mask: masks(contexts_length, config.max_context_length),
-                        self.labels: labels,
-                        self.dropout: 1.0
-                    }
-                )
+            labels = np.zeros(
+                (len(batch), config.n_clusters), dtype=np.float32
+            )
+            if config.clustering:
+                for j, el in enumerate(batch):
+                    labels[j, el[3]] = 1
+            else:
+                labels[:, 0] = 1
+
+            predictions = sess.run(
+                self.predictions,
+                feed_dict={
+                    self.questions_ids: questions_padded,
+                    self.questions_length: questions_length,
+                    self.questions_mask: masks(questions_length, config.max_question_length),
+                    self.contexts_ids: contexts_padded,
+                    self.contexts_length: contexts_length,
+                    self.contexts_mask: masks(contexts_length, config.max_context_length),
+                    self.labels: labels,
+                    self.dropout: 1.0
+                }
+            )
 
-                answers += get_answers(predictions[0], predictions[1])
-                ground_answers += [np.array(el[2]) for el in batch]
+            answers += get_answers(predictions[0], predictions[1])
+            ground_answers += [np.array(el[2]) for el in batch]
 
         return np.array(answers, dtype=np.float32), np.array(ground_answers, dtype=np.float32)
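This hunk replaces the unconditional `with tqdm(...)` wrapper with an optional one, so `predict` can run silently when no description is passed. A minimal sketch of the same pattern in isolation; the function and variable names below are illustrative only, not the repo's:

```python
from tqdm import tqdm

def iter_batches(dataset, msg=None):
    # Wrap the iterable in a tqdm progress bar only when a description
    # is supplied; otherwise iterate it directly, with no console output.
    pbar = tqdm(dataset, desc=msg) if msg is not None else dataset
    for batch in pbar:
        yield batch

# Noisy when a message is given, silent otherwise.
for _ in iter_batches(range(1000), msg="Predicting"):
    pass
for _ in iter_batches(range(1000)):
    pass
```

(`msg is not None` is the idiomatic spelling of the diff's `msg != None` check.)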