Upload policy_config.py with huggingface_hub
Browse files
- policy_config.py +4 -3
policy_config.py
CHANGED
@@ -11,10 +11,10 @@ exp_config = {
|
|
11 |
'cfg_type': 'BaseEnvManagerDict'
|
12 |
},
|
13 |
'stop_value': 240,
|
|
|
14 |
'env_id': 'LunarLanderContinuous-v2',
|
15 |
'collector_env_num': 4,
|
16 |
'evaluator_env_num': 8,
|
17 |
-
'n_evaluator_episode': 8,
|
18 |
'act_scale': True
|
19 |
},
|
20 |
'policy': {
|
@@ -67,9 +67,10 @@ exp_config = {
|
|
67 |
'render_freq': -1,
|
68 |
'mode': 'train_iter'
|
69 |
},
|
|
|
70 |
'cfg_type': 'InteractionSerialEvaluatorDict',
|
71 |
-
'
|
72 |
-
'
|
73 |
}
|
74 |
},
|
75 |
'other': {
|
|
|
11 |
'cfg_type': 'BaseEnvManagerDict'
|
12 |
},
|
13 |
'stop_value': 240,
|
14 |
+
'n_evaluator_episode': 8,
|
15 |
'env_id': 'LunarLanderContinuous-v2',
|
16 |
'collector_env_num': 4,
|
17 |
'evaluator_env_num': 8,
|
|
|
18 |
'act_scale': True
|
19 |
},
|
20 |
'policy': {
|
|
|
67 |
'render_freq': -1,
|
68 |
'mode': 'train_iter'
|
69 |
},
|
70 |
+
'figure_path': None,
|
71 |
'cfg_type': 'InteractionSerialEvaluatorDict',
|
72 |
+
'stop_value': 240,
|
73 |
+
'n_episode': 8
|
74 |
}
|
75 |
},
|
76 |
'other': {
|