hishamcse committed on
Commit
9222647
·
verified ·
1 Parent(s): 70583fb

Upload config.json with huggingface_hub

Browse files
Files changed (1) hide show
  1. config.json +32 -16
config.json CHANGED
@@ -4,7 +4,7 @@
4
  "env": "doom_health_gathering_supreme",
5
  "experiment": "default_experiment",
6
  "train_dir": "/kaggle/working/train_dir",
7
- "restart_behavior": "resume",
8
  "device": "gpu",
9
  "seed": null,
10
  "num_policies": 1,
@@ -15,9 +15,9 @@
15
  "worker_num_splits": 2,
16
  "policy_workers_per_policy": 1,
17
  "max_policy_lag": 1000,
18
- "num_workers": 8,
19
- "num_envs_per_worker": 4,
20
- "batch_size": 1024,
21
  "num_batches_per_epoch": 1,
22
  "num_epochs": 1,
23
  "rollout": 32,
@@ -42,7 +42,7 @@
42
  "adam_eps": 1e-06,
43
  "adam_beta1": 0.9,
44
  "adam_beta2": 0.999,
45
- "max_grad_norm": 4.0,
46
  "learning_rate": 0.0001,
47
  "lr_schedule": "constant",
48
  "lr_schedule_kl_threshold": 0.008,
@@ -50,7 +50,7 @@
50
  "obs_scale": 255.0,
51
  "normalize_input": true,
52
  "normalize_input_keys": null,
53
- "decorrelate_experience_max_seconds": 0,
54
  "decorrelate_envs_on_one_worker": true,
55
  "actor_worker_gpus": [],
56
  "set_workers_cpu_affinity": true,
@@ -61,10 +61,10 @@
61
  "flush_summaries_interval": 30,
62
  "stats_avg": 100,
63
  "summaries_use_frameskip": true,
64
- "heartbeat_interval": 20,
65
- "heartbeat_reporting_interval": 600,
66
- "train_for_env_steps": 10000000,
67
- "train_for_seconds": 10000000000,
68
  "save_every_sec": 120,
69
  "keep_checkpoints": 2,
70
  "load_checkpoint_kind": "latest",
@@ -83,10 +83,10 @@
83
  ],
84
  "use_rnn": true,
85
  "rnn_size": 512,
86
- "rnn_type": "gru",
87
  "rnn_num_layers": 1,
88
  "decoder_mlp_layers": [],
89
- "nonlinearity": "elu",
90
  "policy_initialization": "orthogonal",
91
  "policy_init_gain": 1.0,
92
  "actor_critic_share_weights": true,
@@ -128,12 +128,28 @@
128
  "wide_aspect_ratio": false,
129
  "eval_env_frameskip": 1,
130
  "fps": 35,
131
- "command_line": "--env=doom_health_gathering_supreme --num_workers=8 --num_envs_per_worker=4 --train_for_env_steps=10000000",
132
  "cli_args": {
133
  "env": "doom_health_gathering_supreme",
134
- "num_workers": 8,
135
- "num_envs_per_worker": 4,
136
- "train_for_env_steps": 10000000
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
137
  },
138
  "git_hash": "unknown",
139
  "git_repo_name": "not a git repository",
 
4
  "env": "doom_health_gathering_supreme",
5
  "experiment": "default_experiment",
6
  "train_dir": "/kaggle/working/train_dir",
7
+ "restart_behavior": "restart",
8
  "device": "gpu",
9
  "seed": null,
10
  "num_policies": 1,
 
15
  "worker_num_splits": 2,
16
  "policy_workers_per_policy": 1,
17
  "max_policy_lag": 1000,
18
+ "num_workers": 20,
19
+ "num_envs_per_worker": 12,
20
+ "batch_size": 2048,
21
  "num_batches_per_epoch": 1,
22
  "num_epochs": 1,
23
  "rollout": 32,
 
42
  "adam_eps": 1e-06,
43
  "adam_beta1": 0.9,
44
  "adam_beta2": 0.999,
45
+ "max_grad_norm": 0.0,
46
  "learning_rate": 0.0001,
47
  "lr_schedule": "constant",
48
  "lr_schedule_kl_threshold": 0.008,
 
50
  "obs_scale": 255.0,
51
  "normalize_input": true,
52
  "normalize_input_keys": null,
53
+ "decorrelate_experience_max_seconds": 1,
54
  "decorrelate_envs_on_one_worker": true,
55
  "actor_worker_gpus": [],
56
  "set_workers_cpu_affinity": true,
 
61
  "flush_summaries_interval": 30,
62
  "stats_avg": 100,
63
  "summaries_use_frameskip": true,
64
+ "heartbeat_interval": 10,
65
+ "heartbeat_reporting_interval": 300,
66
+ "train_for_env_steps": 1000000000,
67
+ "train_for_seconds": 360000,
68
  "save_every_sec": 120,
69
  "keep_checkpoints": 2,
70
  "load_checkpoint_kind": "latest",
 
83
  ],
84
  "use_rnn": true,
85
  "rnn_size": 512,
86
+ "rnn_type": "lstm",
87
  "rnn_num_layers": 1,
88
  "decoder_mlp_layers": [],
89
+ "nonlinearity": "relu",
90
  "policy_initialization": "orthogonal",
91
  "policy_init_gain": 1.0,
92
  "actor_critic_share_weights": true,
 
128
  "wide_aspect_ratio": false,
129
  "eval_env_frameskip": 1,
130
  "fps": 35,
131
+ "command_line": "--env=doom_health_gathering_supreme --restart_behavior=restart --num_workers=20 --num_envs_per_worker=12 --batch_size=2048 --recurrence=32 --exploration_loss_coeff=0.001 --exploration_loss=symmetric_kl --ppo_clip_value=0.2 --max_grad_norm=0.0 --obs_scale=255.0 --decorrelate_experience_max_seconds=1 --heartbeat_interval=10 --heartbeat_reporting_interval=300 --train_for_env_steps=1000000000 --train_for_seconds=360000 --benchmark=false --use_rnn=true --rnn_type=lstm --nonlinearity=relu",
132
  "cli_args": {
133
  "env": "doom_health_gathering_supreme",
134
+ "restart_behavior": "restart",
135
+ "num_workers": 20,
136
+ "num_envs_per_worker": 12,
137
+ "batch_size": 2048,
138
+ "recurrence": 32,
139
+ "exploration_loss_coeff": 0.001,
140
+ "exploration_loss": "symmetric_kl",
141
+ "ppo_clip_value": 0.2,
142
+ "max_grad_norm": 0.0,
143
+ "obs_scale": 255.0,
144
+ "decorrelate_experience_max_seconds": 1,
145
+ "heartbeat_interval": 10,
146
+ "heartbeat_reporting_interval": 300,
147
+ "train_for_env_steps": 1000000000,
148
+ "train_for_seconds": 360000,
149
+ "benchmark": false,
150
+ "use_rnn": true,
151
+ "rnn_type": "lstm",
152
+ "nonlinearity": "relu"
153
  },
154
  "git_hash": "unknown",
155
  "git_repo_name": "not a git repository",