-
Notifications
You must be signed in to change notification settings - Fork 0
Expand file tree
/
Copy pathconstants.py
More file actions
56 lines (55 loc) · 2.79 KB
/
constants.py
File metadata and controls
56 lines (55 loc) · 2.79 KB
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
# Flat mapping of setting name -> value. Every value is a plain literal; how
# each one is interpreted is decided by the code that reads CONSTANTS, which
# is not part of this file.
#
# NOTE: each key must appear exactly once. A repeated key in a dict literal is
# not an error in Python -- the later entry silently replaces the earlier one.
CONSTANTS = {
    "NUM_ENVS": 4,
    "NUM_SKILLS": 22,
    "STATE_SIZE": 22,
    "ACTION_SIZE": 43,
    "TARGET_P_KNOW": 0.8,
    "NUM_OBS": "all",
    "VILLAGE": "130",
    "STUDENT_ID": "new_student",
    "STUDENT_MODEL_NAME": "hotDINA_skill",
    "AREA_ROTATION": "L-N-L-S",
    "START_POS": "0,0",
    "ALGO": "DQN",
    "AVG_OVER_RUNS": 500,
    "AGENT_TYPE": None,
    "AREA_ROTATION_CONSTRAINT": True,
    "TRANSITION_CONSTRAINT": True,
    "FC1_DIMS": 1024,
    "FC2_DIMS": 2048,
    "FC3_DIMS": 1024,
    "NUM_TESTS": 10,
    # Previously listed twice (both 0.95); kept once so the value has a
    # single source of truth.
    "GAE_LAMBDA": 0.95,
    "GAMMA": 0.99,
    "PPO_EPSILON": 0.2,
    "CRITIC_DISCOUNT": 0.5,
    "ENTROPY_BETA": 0.001,
    "RUN_NUM": 0,
    "PRINT_STUDENT_PARAMS": True,
    "CLEAR_LOGS": True,
    "EPSILON": 0.95,  # explore-exploit coefficient for DQN
    "LOAD": False,
    "RUN": 0,
    "DETERMINISTIC": False,
    "ANTI_RL": False,
    # Current RoboTutor Thresholds
    "LOW_PERFORMANCE_THRESHOLD": 0.5,
    "MID_PERFORMANCE_THRESHOLD": 0.83,
    "HIGH_PERFORMANCE_THRESHOLD": 0.9,
    "LOW_LENIENT_PERFORMANCE_THRESHOLD": 0.4,
    "MID_LENIENT_PERFORMANCE_THRESHOLD": 0.55,
    "HIGH_LENIENT_PERFORMANCE_THRESHOLD": 0.7,
    "LEARNING_RATE": 7e-4,
    "DQ_LEARNING_RATE": 1e-4,
    "AC_LEARNING_RATE": 5e-4,
    "NUM_EPISODES": 1750,  # For dqn and actor_critic
    "MAX_TIMESTEPS": 200,
    "BATCH_SIZE": 64,
    "PPO_EPOCHS": 10,
    "TEST_EPOCHS": 5,
    "PPO_STEPS": 64,  # Must be a multiple of MINI_BATCH_SIZE
    "MINI_BATCH_SIZE": 32,
    "NEW_STUDENT_PARAMS": "5A27001753",
}
# village 130: ['5A27001753', '5A27001932', '5A28002555', '5A29000477', '6105000515', '6112001212', '6115000404', '6116002085', 'new_student']