Guard board writes against a -1 move index.

play_rl() in agents/reinforcement_learning.c and play_game() in elo.c now
write table[move] only when move != -1.

NOTE(review): this patch was recovered from a copy that had been collapsed
onto a single line; leading indentation and blank context lines are
reconstructed. Verify against the tree before applying.

diff --git a/agents/reinforcement_learning.c b/agents/reinforcement_learning.c
index 5466519..ce009a1 100644
--- a/agents/reinforcement_learning.c
+++ b/agents/reinforcement_learning.c
@@ -96,7 +96,8 @@ int get_action_exploit(char *table, rl_agent_t *agent)
 int play_rl(char *table, rl_agent_t *agent)
 {
     int move = get_action_exploit(table, agent);
-    table[move] = agent->player;
+    if (move != -1)
+        table[move] = agent->player;
     return move;
 }
 
diff --git a/elo.c b/elo.c
index f4110e1..a28406d 100644
--- a/elo.c
+++ b/elo.c
@@ -63,7 +63,8 @@ static int play_game(int player1, int player2)
         else
             move = play_rl(table, &agent);
 
-        table[move] = player == player1 ? 'X' : 'O';
+        if (move != -1)
+            table[move] = player == player1 ? 'X' : 'O';
         player ^= player1 ^ player2;
     }
 