tweak epsilon, lr
Browse files- q-learning.pkl +2 -2
- replay.mp4 +2 -2
- results.json +1 -1
q-learning.pkl
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
-
size
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:3ab81d101ceb6dbe3b391f1ba0a72fbe604c5f192192b601f987e9dd89b83363
|
3 |
+
size 24591
|
replay.mp4
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
-
size
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:ad491fb74154a91ec663b210ace8d1a58b855066eec0f35df120ae0e4ecdbc9d
|
3 |
+
size 110581
|
results.json
CHANGED
@@ -1 +1 @@
|
|
1 |
-
{"env_id": "Taxi-v3", "mean_reward": 7.56, "n_eval_episodes": 100, "eval_datetime": "2022-05-22T09:
|
|
|
1 |
+
{"env_id": "Taxi-v3", "mean_reward": 7.56, "n_eval_episodes": 100, "eval_datetime": "2022-05-22T09:19:22.584046"}
|