MLE-Pacman/main.py

31 lines
679 B
Python

# TMP: force matplotlib's non-interactive Agg backend; set before the project imports below.
import os
os.environ['MPLBACKEND'] = 'Agg'
from GenTunic.gen_tuning import gen_tuning_main
from ReinforcmentLearning.learning import multipleTries, oneTry
from ReinforcmentLearning.util import calc_time_reward
# ---------------------------------------------------------------------------
# Run settings.
#
# NOTE(review): the meanings below are inferred from the names only
# (presumably epsilon = exploration rate, alpha = learning rate,
# gamma = discount factor) -- confirm against ReinforcmentLearning.learning.
# ---------------------------------------------------------------------------
EPSILON = 0.01  # previously tried alternative: 0.005
# ALPHA and GAMMA are not passed to gen_tuning_main; in this file they are
# only referenced by the commented-out oneTry / multipleTries calls in main().
ALPHA = 0.2
GAMMA = 0.8

AMOUNT_RUNS = 5000
AMOUNT_TRIES = 5

REWARD_ON_WIN = 400
REWARD_ON_LOSE = -250

# Only referenced by the commented-out oneTry(...) call in main().
plot_result = False
show_game = False


def main():
    """Start a run using the module-level settings defined above.

    Calls ``gen_tuning_main`` with AMOUNT_TRIES, AMOUNT_RUNS, REWARD_ON_WIN,
    REWARD_ON_LOSE and EPSILON, in that order. The call lives in a function
    behind a ``__main__`` guard so that importing this module (for example
    from a spawned worker process or a test) does not start a run.
    """
    # Alternative entry points; swap one in for the call below if needed:
    # oneTry(EPSILON, ALPHA, GAMMA, AMOUNT_RUNS, REWARD_ON_WIN, REWARD_ON_LOSE, plot_result, show_game)
    # multipleTries(EPSILON, ALPHA, GAMMA, AMOUNT_TRIES, AMOUNT_RUNS, REWARD_ON_WIN, REWARD_ON_LOSE)
    gen_tuning_main(AMOUNT_TRIES, AMOUNT_RUNS, REWARD_ON_WIN, REWARD_ON_LOSE, EPSILON)


if __name__ == "__main__":
    main()