from util import epsilon_greedy, get_start_state

# Number of runs performed by the outer loop.
AMOUNT_RUNS = 10
# Passed as the third argument to epsilon_greedy (presumably the exploration
# rate -- confirm against util.epsilon_greedy).
EPSILON = 0.1

# Data layout, as described by the original author:
#   state:   (x_distance_to_ghost, y_distance_to_ghost, next_cookie_Direction)
#   action:  Direction
#   q_value: (state, action)
# NOTE(review): presumably q_values is keyed by (state, action) -- confirm
# against util.epsilon_greedy.
q_values = {}

# Amount of single runs.
for x in range(AMOUNT_RUNS):
    # Every run begins from a fresh start state.
    state = get_start_state()

    # Single run, until win or death.
    # NOTE(review): no exit condition is visible in this part of the file.
    while True:
        action = epsilon_greedy(q_values, state, EPSILON)