sdpkjc committed on
Commit
82dcb58
·
1 Parent(s): 899ebe5

pushing model

Browse files
.gitattributes CHANGED
@@ -37,3 +37,6 @@ videos/HalfCheetah-v2__ddpg_continuous_action_jax__1__1688050725-eval/rl-video-e
37
  videos/HalfCheetah-v2__ddpg_continuous_action_jax__1__1688050725-eval/rl-video-episode-1.mp4 filter=lfs diff=lfs merge=lfs -text
38
  videos/HalfCheetah-v2__ddpg_continuous_action_jax__1__1688050725-eval/rl-video-episode-8.mp4 filter=lfs diff=lfs merge=lfs -text
39
  replay.mp4 filter=lfs diff=lfs merge=lfs -text
 
 
 
 
37
  videos/HalfCheetah-v2__ddpg_continuous_action_jax__1__1688050725-eval/rl-video-episode-1.mp4 filter=lfs diff=lfs merge=lfs -text
38
  videos/HalfCheetah-v2__ddpg_continuous_action_jax__1__1688050725-eval/rl-video-episode-8.mp4 filter=lfs diff=lfs merge=lfs -text
39
  replay.mp4 filter=lfs diff=lfs merge=lfs -text
40
+ videos/HalfCheetah-v2__ddpg_continuous_action_jax__1__1688131116-eval/rl-video-episode-0.mp4 filter=lfs diff=lfs merge=lfs -text
41
+ videos/HalfCheetah-v2__ddpg_continuous_action_jax__1__1688131116-eval/rl-video-episode-1.mp4 filter=lfs diff=lfs merge=lfs -text
42
+ videos/HalfCheetah-v2__ddpg_continuous_action_jax__1__1688131116-eval/rl-video-episode-8.mp4 filter=lfs diff=lfs merge=lfs -text
README.md CHANGED
@@ -16,7 +16,7 @@ model-index:
16
  type: HalfCheetah-v2
17
  metrics:
18
  - type: mean_reward
19
- value: 8342.83 +/- 244.76
20
  name: mean_reward
21
  verified: false
22
  ---
@@ -46,7 +46,7 @@ curl -OL https://huggingface.co/cleanrl/HalfCheetah-v2-ddpg_continuous_action_ja
46
  curl -OL https://huggingface.co/cleanrl/HalfCheetah-v2-ddpg_continuous_action_jax-seed1/raw/main/pyproject.toml
47
  curl -OL https://huggingface.co/cleanrl/HalfCheetah-v2-ddpg_continuous_action_jax-seed1/raw/main/poetry.lock
48
  poetry install --all-extras
49
- python ddpg_continuous_action_jax.py --track --capture-video --save-model --hf-entity cleanrl --upload-mode --env-id HalfCheetah-v2 --seed 1
50
  ```
51
 
52
  # Hyperparameters
 
16
  type: HalfCheetah-v2
17
  metrics:
18
  - type: mean_reward
19
+ value: 10083.75 +/- 205.96
20
  name: mean_reward
21
  verified: false
22
  ---
 
46
  curl -OL https://huggingface.co/cleanrl/HalfCheetah-v2-ddpg_continuous_action_jax-seed1/raw/main/pyproject.toml
47
  curl -OL https://huggingface.co/cleanrl/HalfCheetah-v2-ddpg_continuous_action_jax-seed1/raw/main/poetry.lock
48
  poetry install --all-extras
49
+ python ddpg_continuous_action_jax.py --track --capture-video --save-model --hf-entity cleanrl --upload-mode --env-id HalfCheetah-v2
50
  ```
51
 
52
  # Hyperparameters
ddpg_continuous_action_jax.cleanrl_model CHANGED
Binary files a/ddpg_continuous_action_jax.cleanrl_model and b/ddpg_continuous_action_jax.cleanrl_model differ
 
events.out.tfevents.1688050742.3090-172.1323964.0 → events.out.tfevents.1688131132.3090-172.1375710.0 RENAMED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:179074f19d98c7e1a00475b179492d75439f798e9c9f63d2ee4b62f8b6be55ba
3
  size 2260134
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:fb68444ec727fbc36dfa5a8731989d09d4823abe0549c8420d6ac93846b860c0
3
  size 2260134
pyproject.toml CHANGED
@@ -105,9 +105,4 @@ qdagger_dqn_atari_impalacnn = [
105
  qdagger_dqn_atari_jax_impalacnn = [
106
  "ale-py", "AutoROM", "opencv-python", # atari
107
  "jax", "jaxlib", "flax", # jax
108
- ]
109
-
110
- [[tool.poetry.source]]
111
- name = "tsinghua"
112
- url = "https://pypi.tuna.tsinghua.edu.cn/simple"
113
- default = true
 
105
  qdagger_dqn_atari_jax_impalacnn = [
106
  "ale-py", "AutoROM", "opencv-python", # atari
107
  "jax", "jaxlib", "flax", # jax
108
+ ]
 
 
 
 
 
replay.mp4 CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:ba88e953fcb7bb22bbc2b9169117d43e990f23f8da1b0576d2ce3f7f0330185e
3
- size 1315247
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:18de031e41a6d2e3e6001718b48e618ff2ecf6d8aed6c31a1674242ccf781639
3
+ size 1376105
videos/{HalfCheetah-v2__ddpg_continuous_action_jax__1__1688050725-eval → HalfCheetah-v2__ddpg_continuous_action_jax__1__1688131116-eval}/rl-video-episode-0.mp4 RENAMED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:5ba8762e75acd1e202b038f341e9f8896c57d90383e4c96d62f70db06eac2d52
3
- size 1377406
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b80b13117ad53c2443373326a5d2d2c6032ffc0a57142d9bff1b6639726825b4
3
+ size 1376629
videos/{HalfCheetah-v2__ddpg_continuous_action_jax__1__1688050725-eval → HalfCheetah-v2__ddpg_continuous_action_jax__1__1688131116-eval}/rl-video-episode-1.mp4 RENAMED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:8a45a425289b8f647ab157de95d613bb4cce8c435ce5ea612f3bd4536ca92cda
3
- size 1343876
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:545b2fc1ba7da357d4ed37fe7a80b012817829fb4d57cb71ffe22aa6a0543fb4
3
+ size 1362075
videos/{HalfCheetah-v2__ddpg_continuous_action_jax__1__1688050725-eval → HalfCheetah-v2__ddpg_continuous_action_jax__1__1688131116-eval}/rl-video-episode-8.mp4 RENAMED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:ba88e953fcb7bb22bbc2b9169117d43e990f23f8da1b0576d2ce3f7f0330185e
3
- size 1315247
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:18de031e41a6d2e3e6001718b48e618ff2ecf6d8aed6c31a1674242ccf781639
3
+ size 1376105