aarongrainer committed on
Commit
7bf81c1
1 Parent(s): 710bc7d

Initial commit

Browse files
README.md CHANGED
@@ -16,7 +16,7 @@ model-index:
16
  type: BreakoutNoFrameskip-v4
17
  metrics:
18
  - type: mean_reward
19
- value: 2.00 +/- 0.00
20
  name: mean_reward
21
  verified: false
22
  ---
@@ -72,7 +72,7 @@ OrderedDict([('batch_size', 32),
72
  ('gradient_steps', 1),
73
  ('learning_rate', 0.0001),
74
  ('learning_starts', 100000),
75
- ('n_timesteps', 100000.0),
76
  ('optimize_memory_usage', False),
77
  ('policy', 'CnnPolicy'),
78
  ('target_update_interval', 1000),
 
16
  type: BreakoutNoFrameskip-v4
17
  metrics:
18
  - type: mean_reward
19
+ value: 110.70 +/- 67.19
20
  name: mean_reward
21
  verified: false
22
  ---
 
72
  ('gradient_steps', 1),
73
  ('learning_rate', 0.0001),
74
  ('learning_starts', 100000),
75
+ ('n_timesteps', 1000000.0),
76
  ('optimize_memory_usage', False),
77
  ('policy', 'CnnPolicy'),
78
  ('target_update_interval', 1000),
args.yml CHANGED
@@ -54,7 +54,7 @@
54
  - - save_replay_buffer
55
  - false
56
  - - seed
57
- - 17702433
58
  - - storage
59
  - null
60
  - - study_name
 
54
  - - save_replay_buffer
55
  - false
56
  - - seed
57
+ - 2684586546
58
  - - storage
59
  - null
60
  - - study_name
config.yml CHANGED
@@ -18,7 +18,7 @@
18
  - - learning_starts
19
  - 100000
20
  - - n_timesteps
21
- - 100000.0
22
  - - optimize_memory_usage
23
  - false
24
  - - policy
 
18
  - - learning_starts
19
  - 100000
20
  - - n_timesteps
21
+ - 1000000.0
22
  - - optimize_memory_usage
23
  - false
24
  - - policy
dqn-BreakoutNoFrameskip-v4.zip CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:6a44048879dd24833bf206e18eeb1af9167e2746470c040e93782f327e4e5cf7
3
- size 13706816
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:13a4f1cf7859facf7c2ede5b306de317d1206a2634d425cc871bee45b19b7379
3
+ size 27203748
dqn-BreakoutNoFrameskip-v4/data CHANGED
The diff for this file is too large to render. See raw diff
 
dqn-BreakoutNoFrameskip-v4/policy.optimizer.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:e3fc84919e676e2bdcaa04814c7dfa2b7625d8d53a818418c6db25771364db93
3
- size 1120
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b261e00a4a8d4a55e0e18103c8a192f8e08559e9f41cb88248b8fefad4cb8632
3
+ size 13498044
dqn-BreakoutNoFrameskip-v4/policy.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:82f6d1110ed4e24eeeb04e16f36ea61db415c64a0235c359525a7d7d4dce5592
3
  size 13497178
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c720de912a19a70dcef1598c672c785e1efa4a10b99b1429fd6d3fbdc99dd3e2
3
  size 13497178
replay.mp4 CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:1dd1f72ac713964fdd75c7b097fe8e5be066dd20a65dbfa925d4036fa4cc1121
3
- size 55866
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d4481187ab9168cf2a89acab711c9b5c6fda5f351176cf1b7a4e23f7d689b134
3
+ size 73210
results.json CHANGED
@@ -1 +1 @@
1
- {"mean_reward": 2.0, "std_reward": 0.0, "is_deterministic": false, "n_eval_episodes": 10, "eval_datetime": "2024-01-07T04:24:00.513106"}
 
1
+ {"mean_reward": 110.7, "std_reward": 67.18638254884691, "is_deterministic": false, "n_eval_episodes": 10, "eval_datetime": "2024-01-07T05:52:18.496806"}
train_eval_metrics.zip CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:f8630cff8ef80708566a655b651eb9bfefdf52b45971e678b7c8d23d5fafc052
3
- size 13154
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7ec6c59330cb6b711e7dc7d9dfc1b94728c22d2ed695d9e7d010cd05586cc504
3
+ size 46904