/* Q-learning-in-C/q-learning.h */

#ifndef Q_LEARNING_H
#define Q_LEARNING_H

/* `bool` appears in the run() prototype, so this header must pull in its
 * definition itself instead of relying on the includer's include order. */
#include <stdbool.h>

/*
 * Public prototypes of the Q-learning module.
 *
 * NOTE(review): only the declarations are visible in this header. Every
 * behavioural remark below is inferred from the identifier names and the
 * parameter types and must be confirmed against the definitions. In
 * particular, the required sizes of the `table` and `board` buffers and the
 * valid range of `state` are not stated anywhere in this header.
 */

/*
 * Takes a float buffer `arr` and a count `length`; returns a short.
 * Presumably the index of the largest of the first `length` elements --
 * confirm, including what is returned for ties or for length <= 0.
 */
short float_argmax(float* arr, short length);

/*
 * Takes the float table, the board buffer and an integer state; returns a
 * short. Presumably the action picked for the learning agent -- confirm.
 */
short bot_choose_action(float* table, short* board, int state);

/*
 * Same parameter list and return type as bot_choose_action().
 * Presumably a randomly chosen action for the opposing player -- confirm,
 * including whether `table` is actually read.
 */
short opponent_random_action(float* table, short* board, int state);

/*
 * Takes the float table and returns nothing. Presumably fills the table
 * with its starting values -- confirm how many elements are written.
 */
void init_table(float* table);

/*
 * Takes the float table, the board buffer and an integer state; returns a
 * float. Presumably the reward estimate used by the learning update --
 * confirm.
 */
float get_estimate_reward(float* table, short* board, int state);

/*
 * Takes the float table, the board buffer, two flags and an integer count;
 * returns nothing. Presumably runs `times` games/episodes, updating the
 * table when `train` is true and emitting plot output when `plot` is true
 * -- confirm.
 */
void run(float* table, short* board, bool train, int times, bool plot);

#endif /* Q_LEARNING_H */