Q-learning-in-C/q-learning.h

6 lines
347 B
C

#ifndef Q_LEARNING_H
#define Q_LEARNING_H

/* `bool` appears in the prototype of run(); include its definition here so
 * this header compiles regardless of what the including file pulled in. */
#include <stdbool.h>

/*
 * Public prototypes of the Q-learning module.
 *
 * NOTE(review): only the declarations are visible from this header. The
 * descriptions below are inferred from identifier names and must be
 * confirmed against the implementation file. None of the pointer parameters
 * carries an explicit element count except `arr`; the expected sizes of
 * `table` and `board` are defined by the implementation, not by this header.
 */

/**
 * @param arr    Array of floats to inspect.
 * @param length Presumably the number of elements in `arr` -- TODO confirm.
 * @return Presumably the index of the largest element -- TODO confirm
 *         (including tie-breaking and behavior for length <= 0).
 */
short float_argmax(float *arr, short length);

/**
 * @param table Presumably the Q-value table -- TODO confirm layout.
 * @param board Presumably the current game board -- TODO confirm encoding.
 * @param state Presumably an index identifying the current state.
 * @return Presumably the action selected for the learning agent.
 */
short bot_choose_action(float *table, short *board, int state);

/**
 * Takes the same parameters as bot_choose_action().
 *
 * @return Presumably a randomly chosen action for the opponent -- TODO
 *         confirm whether `table` and `state` are actually consulted.
 */
short opponent_random_action(float *table, short *board, int state);

/**
 * @param table Presumably the Q-value table to initialize; initial values
 *              and required size are set by the implementation -- TODO confirm.
 */
void init_table(float *table);

/**
 * @param table Presumably the Q-value table.
 * @param board Presumably the current game board.
 * @param state Presumably an index identifying the state to evaluate.
 * @return Presumably an estimated reward for `state` -- TODO confirm.
 */
float get_estimate_reward(float *table, short *board, int state);

/**
 * @param table Presumably the Q-value table, read and/or updated.
 * @param board Presumably the working game board.
 * @param train Presumably selects training mode when true -- TODO confirm.
 * @param times Presumably the number of games/episodes to run.
 * @param plot  Presumably enables some plotting/reporting output when true.
 */
void run(float *table, short *board, bool train, int times, bool plot);

#endif /* Q_LEARNING_H */