Added a verbosity flag, --verbose, which enables printing of model
variables and other diagnostic output.
This commit is contained in:
Alexander Munch-Hansen 2018-05-10 10:39:22 +02:00
parent 6429e0732c
commit 9cfdd7e2b2
2 changed files with 25 additions and 9 deletions

View File

@ -38,6 +38,8 @@ parser.add_argument('--board-rep', action='store', dest='board_rep',
help='name of board representation to use as input to neural network')
parser.add_argument('--use-baseline', action='store_true',
help='use the baseline model, note, has size 28')
parser.add_argument('--verbose', action='store_true',
help='If set, a lot of stuff will be printed')
args = parser.parse_args()
@ -61,7 +63,9 @@ config = {
'board_representation': args.board_rep,
'force_creation': args.force_creation,
'use_baseline': args.use_baseline,
'global_step': 0
'global_step': 0,
'verbose': args.verbose
}
# Create models folder

View File

@ -98,10 +98,20 @@ class Network:
def print_variables(self):
    """Print every variable of the underlying model, one per line."""
    for variable in self.model.variables:
        print(variable)
def eval_state(self, state):
    """Evaluate a single board state with the model.

    The state is reshaped into a 1-row batch before being fed to the
    network, and the model's output is returned unchanged.
    """
    batched = state.reshape(1, -1)
    return self.model(batched)
def save_model(self, episode_count):
"""
:param episode_count:
:return:
"""
tfe.Saver(self.model.variables).save(os.path.join(self.checkpoint_path, 'model.ckpt'))
#self.saver.save(sess, os.path.join(self.checkpoint_path, 'model.ckpt'), global_step=global_step)
with open(os.path.join(self.checkpoint_path, "episodes_trained"), 'w+') as f:
@ -113,6 +123,8 @@ class Network:
print("[NETWK] ({name}) Saving global step to:".format(name=self.name),
os.path.join(self.checkpoint_path, 'model.ckpt'))
f.write(str(self.global_step) + "\n")
if self.config['verbose']:
self.print_variables()
def calc_vals(self, states):
@ -150,6 +162,8 @@ class Network:
with open(global_step_path, 'r') as f:
self.config['global_step'] = int(f.read())
if self.config['verbose']:
self.print_variables()
@ -489,19 +503,13 @@ class Network:
in self.config['eval_methods'] ]
return outcomes
def train_model(self, episodes=1000, save_step_size=100, trained_eps=0):
with tf.Session() as sess:
difference_in_vals = 0
self.restore_model()
#variables_names = [v.name for v in tf.trainable_variables()]
#values = sess.run(variables_names)
#for k, v in zip(variables_names, values):
# print("Variable: ", k)
# print("Shape: ", v.shape)
# print(v)
start_time = time.time()
def print_time_estimate(eps_completed):
@ -537,9 +545,13 @@ class Network:
difference_in_vals += abs((cur_board_value - self.eval_state(self.board_trans_func(prev_board, player))))
if self.config['verbose']:
print("Difference in values:", difference_in_vals)
print("Current board value :", cur_board_value)
print("Current board is :\n",cur_board)
# adjust weights
#print(cur_board)
if Board.outcome(cur_board) is None:
self.do_backprop(self.board_trans_func(prev_board, player), cur_board_value)
player *= -1