/* File-viewer metadata (not part of the program): 14 lines, 300 B, C */
/*
 * Compile-time configuration constants.
 *
 * Stray `|` separator lines (extraction residue) were removed, including the
 * one that had leaked into the replacement list of COL_NUM and made it expand
 * to `7 |`. All macro names and values are otherwise unchanged.
 */

/* Cell/player markers. */
#define BOT_SYMBOL 1
#define OPPONENT_SYMBOL 2

/* Learning hyper-parameters. */
#define EPSILON 0.9 /* epsilon-greedy parameter; NOTE(review): confirm at the
                       use site whether this is the explore or exploit
                       probability */
#define LR 0.1      /* learning rate */
#define LAMBDA 0.9  /* discount factor */

/* Table dimensions and training length. */
#define STATE_NUM 19683    /* numerically equal to 3^9; presumably one of three
                              values per each of 9 cells - TODO confirm */
#define ACTION_NUM 9       /* number of actions */
#define EPISODE_NUM 100000 /* number of episodes */

/*
 * Expands to `true`, so <stdbool.h> must be included before use when building
 * as pre-C23 C. NOTE(review): presumably selects which side moves first -
 * confirm against the code that reads it.
 */
#define FIRST true

/* Grid dimensions. */
#define ROW_NUM 6
#define COL_NUM 7