# backgammon/main.py

import argparse
import sys
import os
import time

# Define helper functions
def log_train_outcome(outcome, trained_eps = 0):
    """Append a one-line summary of a training session to ``logs/train.log``.

    The line has the form ``time;trained_eps;count;sum;mean`` and is appended
    to ``<config['model_path']>/logs/train.log`` (``config`` is the
    module-level configuration dict).

    Args:
        outcome: sized collection of numeric results; ``len()`` and ``sum()``
            are applied to it.
        trained_eps: value written to the ``trained_eps`` field of the line.
    """
    # Summarise the argument itself rather than a module-level variable, so
    # the function works for every caller regardless of its variable names.
    count = len(outcome)
    total = sum(outcome)
    format_vars = { 'trained_eps': trained_eps,
                    'count': count,
                    'sum': total,
                    # An empty session has no mean: log NaN instead of
                    # raising ZeroDivisionError.
                    'mean': total / count if count else float('nan'),
                    'time': int(time.time())
    }
    with open(os.path.join(config['model_path'], 'logs', "train.log"), 'a+') as f:
        f.write("{time};{trained_eps};{count};{sum};{mean}".format(**format_vars) + "\n")
    

def log_eval_outcomes(outcomes, trained_eps = 0):
    """Append one summary line per evaluation result to ``logs/eval.log``.

    Every element of ``outcomes`` is indexed positionally: item 0 is written
    to the ``method`` field and item 1 is a sized collection of numeric
    scores. Lines have the form ``time;method;trained_eps;count;sum;mean``
    and go to ``<config['model_path']>/logs/eval.log``.

    Args:
        outcomes: iterable of indexable ``(method, scores)`` entries.
        trained_eps: value written to the ``trained_eps`` field of each line.
    """
    line_template = "{time};{method};{trained_eps};{count};{sum};{mean}"
    for entry in outcomes:
        results = entry[1]
        method_name = entry[0]
        n_results = len(results)
        total = sum(results)
        average = total / n_results
        stamp = int(time.time())
        # The log is reopened in append mode for every entry, so nothing is
        # created or touched when `outcomes` is empty.
        target = os.path.join(config['model_path'], 'logs', "eval.log")
        with open(target, 'a+') as log_file:
            record = line_template.format(time=stamp,
                                          method=method_name,
                                          trained_eps=trained_eps,
                                          count=n_results,
                                          sum=total,
                                          mean=average)
            log_file.write(record + "\n")

            
# Parse command line arguments
# Table of (flag, add_argument keyword arguments). The order is significant:
# argparse lists options in --help in the order they are registered.
_cli_options = (
    ('--episodes', dict(action='store', dest='episode_count',
                        type=int, default=1000,
                        help='number of episodes to train')),
    ('--model-path', dict(action='store', dest='model_path',
                          default='./model',
                          help='path to Tensorflow model')),
    ('--eval-methods', dict(action='store',
                            default=['random'], nargs='*',
                            help='specifies evaluation methods')),
    ('--eval', dict(action='store_true',
                    help='whether to evaluate the neural network with a random choice bot')),
    ('--train', dict(action='store_true',
                     help='whether to train the neural network')),
    ('--eval-after-train', dict(action='store_true', dest='eval_after_train',
                                help='whether to evaluate after each training session')),
    ('--play', dict(action='store_true',
                    help='whether to play with the neural network')),
    ('--start-episode', dict(action='store', dest='start_episode',
                             type=int, default=0,
                             help='episode count to start at; purely for display purposes')),
)

parser = argparse.ArgumentParser(description="Backgammon games")
for _flag, _spec in _cli_options:
    parser.add_argument(_flag, **_spec)

# Reads the process command line; exits with a usage message on bad input.
args = parser.parse_args()

# Plain-dict snapshot of the parsed options. Keys are exactly the argparse
# destination names listed here, in this order.
config = {
    option: getattr(args, option)
    for option in (
        'model_path',
        'episode_count',
        'eval_methods',
        'train',
        'play',
        'eval',
        'eval_after_train',
        'start_episode',
    )
}

# Make sure the model directory and its logs/ subdirectory exist before
# anything tries to write into them.
model_path = config['model_path']
log_path   = os.path.join(model_path, 'logs')
try:
    # makedirs creates model_path (and any missing parents) on the way to
    # logs/, so a nested --model-path such as runs/exp1/model works too.
    os.makedirs(log_path)
except OSError:
    # Already existing is fine (including when another process created it
    # concurrently); anything else (permissions, a file in the way) is not.
    if not os.path.isdir(log_path):
        raise
    

# Set up game
# `game` is imported here, after argument parsing and directory creation,
# rather than at the top of the file.
# NOTE(review): presumably so that --help and argument errors do not pay for
# importing the model stack -- confirm before moving this import.
import game
g = game.Game(config = config)
g.set_up_bots()


# Set up variables
# Number of episodes per training session (the --episodes option).
episode_count = config['episode_count']


# Do actions specified by command-line
# --train takes precedence over --eval; the two branches are exclusive.
if args.train:
    # Running total of trained episodes, seeded from --start-episode.
    eps = config['start_episode']
    # There is no exit condition: sessions repeat until the process is
    # stopped from outside or an exception propagates.
    while True:
        train_outcome = g.train_model(episodes = episode_count, trained_eps = eps)
        # Advance the counter first so the log lines below record the total
        # *after* this session.
        eps += episode_count
        log_train_outcome(train_outcome, trained_eps = eps)
        if config['eval_after_train']:
            eval_outcomes = g.eval(trained_eps = eps)
            log_eval_outcomes(eval_outcomes, trained_eps = eps)
elif args.eval:
    eps = config['start_episode']
    # Unlike the training branch, g.eval() is called without trained_eps
    # here; only the log line carries the --start-episode value.
    outcomes = g.eval()
    log_eval_outcomes(outcomes, trained_eps = eps)
# The --play option is parsed above but its branch is disabled, so passing
# --play on its own currently does nothing beyond setting up the game.
#elif args.play:
#    g.play(episodes = episode_count)
woooow 2018-03-08 15:27:16 +00:00			`import argparse`
plot-plot 2018-03-08 16:13:25 +00:00			`import sys`
training and evaluation stats are now logged by default to model/logs/ 2018-03-09 23:39:55 +00:00			`import os`
train and eval now outputs proper number of training episodes to log 2018-03-09 20:05:38 +00:00			`import time`
woooow 2018-03-08 15:27:16 +00:00
training and evaluation stats are now logged by default to model/logs/ 2018-03-09 23:39:55 +00:00			`# Define helper functions`
			`def log_train_outcome(outcome, trained_eps = 0):`
train and eval now outputs proper number of training episodes to log 2018-03-09 20:05:38 +00:00			`format_vars = { 'trained_eps': trained_eps,`
woooow 2018-03-08 15:27:16 +00:00			`'count': len(train_outcome),`
			`'sum': sum(train_outcome),`
train and eval now outputs proper number of training episodes to log 2018-03-09 20:05:38 +00:00			`'mean': sum(train_outcome) / len(train_outcome),`
			`'time': int(time.time())`
			`}`
training and evaluation stats are now logged by default to model/logs/ 2018-03-09 23:39:55 +00:00			`with open(os.path.join(config['model_path'], 'logs', "train.log"), 'a+') as f:`
			`f.write("{time};{trained_eps};{count};{sum};{mean}".format(**format_vars) + "\n")`

woooow 2018-03-08 15:27:16 +00:00
training and evaluation stats are now logged by default to model/logs/ 2018-03-09 23:39:55 +00:00			`def log_eval_outcomes(outcomes, trained_eps = 0):`
small fixes 2018-03-08 16:51:32 +00:00			`for outcome in outcomes:`
training and evaluation stats are now logged by default to model/logs/ 2018-03-09 23:39:55 +00:00			`scores = outcome[1]`
			`format_vars = { 'trained_eps': trained_eps,`
			`'method': outcome[0],`
			`'count': len(scores),`
			`'sum': sum(scores),`
			`'mean': sum(scores) / len(scores),`
			`'time': int(time.time())`
			`}`
			`with open(os.path.join(config['model_path'], 'logs', "eval.log"), 'a+') as f:`
			`f.write("{time};{method};{trained_eps};{count};{sum};{mean}".format(**format_vars) + "\n")`
woooow 2018-03-08 15:27:16 +00:00
training and evaluation stats are now logged by default to model/logs/ 2018-03-09 23:39:55 +00:00
			`# Parse command line arguments`
woooow 2018-03-08 15:27:16 +00:00			`parser = argparse.ArgumentParser(description="Backgammon games")`
			`parser.add_argument('--episodes', action='store', dest='episode_count',`
			`type=int, default=1000,`
			`help='number of episodes to train')`
			`parser.add_argument('--model-path', action='store', dest='model_path',`
			`default='./model',`
			`help='path to Tensorflow model')`
			`parser.add_argument('--eval-methods', action='store',`
			`default=['random'], nargs='*',`
			`help='specifies evaluation methods')`
			`parser.add_argument('--eval', action='store_true',`
			`help='whether to evaluate the neural network with a random choice bot')`
			`parser.add_argument('--train', action='store_true',`
			`help='whether to train the neural network')`
training and evaluation stats are now logged by default to model/logs/ 2018-03-09 23:39:55 +00:00			`parser.add_argument('--eval-after-train', action='store_true', dest='eval_after_train',`
			`help='whether to evaluate after each training session')`
woooow 2018-03-08 15:27:16 +00:00			`parser.add_argument('--play', action='store_true',`
			`help='whether to play with the neural network')`
save and restore number of trained episodes 2018-03-09 23:22:20 +00:00			`parser.add_argument('--start-episode', action='store', dest='start_episode',`
			`type=int, default=0,`
			`help='episode count to start at; purely for display purposes')`
woooow 2018-03-08 15:27:16 +00:00
			`args = parser.parse_args()`

			`config = {`
			`'model_path': args.model_path,`
			`'episode_count': args.episode_count,`
			`'eval_methods': args.eval_methods,`
			`'train': args.train,`
			`'play': args.play,`
save and restore number of trained episodes 2018-03-09 23:22:20 +00:00			`'eval': args.eval,`
training and evaluation stats are now logged by default to model/logs/ 2018-03-09 23:39:55 +00:00			`'eval_after_train': args.eval_after_train,`
save and restore number of trained episodes 2018-03-09 23:22:20 +00:00			`'start_episode': args.start_episode`
woooow 2018-03-08 15:27:16 +00:00			`}`

training and evaluation stats are now logged by default to model/logs/ 2018-03-09 23:39:55 +00:00			`# Make sure directories exist`
			`model_path = os.path.join(config['model_path'])`
			`log_path = os.path.join(model_path, 'logs')`
			`if not os.path.isdir(model_path):`
			`os.mkdir(model_path)`
			`if not os.path.isdir(log_path):`
			`os.mkdir(log_path)`

woooow 2018-03-08 15:27:16 +00:00
training and evaluation stats are now logged by default to model/logs/ 2018-03-09 23:39:55 +00:00			`# Set up game`
woooow 2018-03-08 15:27:16 +00:00			`import game`
			`g = game.Game(config = config)`
			`g.set_up_bots()`


training and evaluation stats are now logged by default to model/logs/ 2018-03-09 23:39:55 +00:00			`# Set up variables`
			`episode_count = config['episode_count']`


			`# Do actions specified by command-line`
woooow 2018-03-08 15:27:16 +00:00			`if args.train:`
save and restore number of trained episodes 2018-03-09 23:22:20 +00:00			`eps = config['start_episode']`
woooow 2018-03-08 15:27:16 +00:00			`while True:`
train and eval now outputs proper number of training episodes to log 2018-03-09 20:05:38 +00:00			`train_outcome = g.train_model(episodes = episode_count, trained_eps = eps)`
woooow 2018-03-08 15:27:16 +00:00			`eps += episode_count`
training and evaluation stats are now logged by default to model/logs/ 2018-03-09 23:39:55 +00:00			`log_train_outcome(train_outcome, trained_eps = eps)`
			`if config['eval_after_train']:`
train and eval now outputs proper number of training episodes to log 2018-03-09 20:05:38 +00:00			`eval_outcomes = g.eval(trained_eps = eps)`
training and evaluation stats are now logged by default to model/logs/ 2018-03-09 23:39:55 +00:00			`log_eval_outcomes(eval_outcomes, trained_eps = eps)`
woooow 2018-03-08 15:27:16 +00:00			`elif args.eval:`
training and evaluation stats are now logged by default to model/logs/ 2018-03-09 23:39:55 +00:00			`eps = config['start_episode']`
woooow 2018-03-08 15:27:16 +00:00			`outcomes = g.eval()`
training and evaluation stats are now logged by default to model/logs/ 2018-03-09 23:39:55 +00:00			`log_eval_outcomes(outcomes, trained_eps = eps)`
woooow 2018-03-08 15:27:16 +00:00			`#elif args.play:`
			`# g.play(episodes = episode_count)`