# Tunable settings, one assignment per line.
# NOTE(review): the code that consumes these values is not visible here; the
# descriptions below are inferred from the names only and should be confirmed.

# Learning hyperparameters (presumably exploration rate, learning rate and
# discount factor of a reinforcement-learning agent - TODO confirm).
EPSILON = 0.005
ALPHA = 0.2
GAMMA = 0.8

# Iteration counts (presumably number of runs and tries per run - TODO confirm).
AMOUNT_RUNS = 5000
AMOUNT_TRIES = 5

# Reward values for the win / half / lose outcomes.
REWARD_ON_WIN = 400
REWARD_ON_HALF = 50
REWARD_ON_LOSE = -250

# Boolean toggles (presumably control plotting and game display - TODO confirm).
plot_result = True
show_game = False
show_trained = False