jaymanvirk committed on
Commit
5f86876
1 Parent(s): 444e5c9

Upload folder using huggingface_hub

Browse files
.summary/0/events.out.tfevents.1715928454.f186c3f8af36 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b703eebcfbe830ecbbc87c2b6342e1b51cd12991a83a0c0eb90fc97ede7891f9
3
+ size 439460
README.md CHANGED
@@ -15,7 +15,7 @@ model-index:
15
  type: doom_health_gathering_supreme
16
  metrics:
17
  - type: mean_reward
18
- value: 8.36 +/- 4.79
19
  name: mean_reward
20
  verified: false
21
  ---
 
15
  type: doom_health_gathering_supreme
16
  metrics:
17
  - type: mean_reward
18
+ value: 9.46 +/- 5.33
19
  name: mean_reward
20
  verified: false
21
  ---
checkpoint_p0/best_000000727_2977792_reward_22.923.pth ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:edb709545039827fac47c97b0e58f7096f5d310bfe3f1856f3b6c7f4c215589d
3
+ size 34929051
checkpoint_p0/checkpoint_000000934_3825664.pth ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4a08a1930c15f41cf3d62ee404714b54d1845d0a261573ac48d837ec71341264
3
+ size 34929477
checkpoint_p0/checkpoint_000000978_4005888.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:ab8d153277fc0035347bc05b18fa6f49391f445404ed649821d601f9bf260a51
3
  size 34929477
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0fc3c91f45dddb59a50df15bcdedf79b96730793505c3ea1539061166caac640
3
  size 34929477
config.json CHANGED
@@ -6,7 +6,7 @@
6
  "train_dir": "/kaggle/working/train_dir",
7
  "restart_behavior": "resume",
8
  "device": "gpu",
9
- "seed": null,
10
  "num_policies": 1,
11
  "async_rl": true,
12
  "serial_mode": false,
@@ -16,7 +16,7 @@
16
  "policy_workers_per_policy": 1,
17
  "max_policy_lag": 1000,
18
  "num_workers": 8,
19
- "num_envs_per_worker": 4,
20
  "batch_size": 1024,
21
  "num_batches_per_epoch": 1,
22
  "num_epochs": 1,
@@ -30,7 +30,7 @@
30
  "normalize_returns": true,
31
  "exploration_loss_coeff": 0.001,
32
  "value_loss_coeff": 0.5,
33
- "kl_loss_coeff": 0.0,
34
  "exploration_loss": "symmetric_kl",
35
  "gae_lambda": 0.95,
36
  "ppo_clip_ratio": 0.1,
@@ -130,11 +130,13 @@
130
  "wide_aspect_ratio": false,
131
  "eval_env_frameskip": 1,
132
  "fps": 35,
133
- "command_line": "--env=doom_health_gathering_supreme --num_workers=8 --num_envs_per_worker=4 --train_for_env_steps=4000000",
134
  "cli_args": {
135
  "env": "doom_health_gathering_supreme",
 
136
  "num_workers": 8,
137
- "num_envs_per_worker": 4,
 
138
  "train_for_env_steps": 4000000
139
  },
140
  "git_hash": "unknown",
 
6
  "train_dir": "/kaggle/working/train_dir",
7
  "restart_behavior": "resume",
8
  "device": "gpu",
9
+ "seed": 0,
10
  "num_policies": 1,
11
  "async_rl": true,
12
  "serial_mode": false,
 
16
  "policy_workers_per_policy": 1,
17
  "max_policy_lag": 1000,
18
  "num_workers": 8,
19
+ "num_envs_per_worker": 8,
20
  "batch_size": 1024,
21
  "num_batches_per_epoch": 1,
22
  "num_epochs": 1,
 
30
  "normalize_returns": true,
31
  "exploration_loss_coeff": 0.001,
32
  "value_loss_coeff": 0.5,
33
+ "kl_loss_coeff": 0.3,
34
  "exploration_loss": "symmetric_kl",
35
  "gae_lambda": 0.95,
36
  "ppo_clip_ratio": 0.1,
 
130
  "wide_aspect_ratio": false,
131
  "eval_env_frameskip": 1,
132
  "fps": 35,
133
+ "command_line": "--env=doom_health_gathering_supreme --seed=0 --kl_loss_coeff=0.3 --num_workers=8 --num_envs_per_worker=8 --train_for_env_steps=4000000",
134
  "cli_args": {
135
  "env": "doom_health_gathering_supreme",
136
+ "seed": 0,
137
  "num_workers": 8,
138
+ "num_envs_per_worker": 8,
139
+ "kl_loss_coeff": 0.3,
140
  "train_for_env_steps": 4000000
141
  },
142
  "git_hash": "unknown",
replay.mp4 CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:aefb90d9d9fc0a9d21e8d66140b485b21cd5696a30c9d972a2b2c01f8c381788
3
- size 16378745
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f5a3b35f488a265d644abd68809e7dce7747cf58e06d9b565a3b67aeb10a55c6
3
+ size 18095784
sf_log.txt CHANGED
The diff for this file is too large to render. See raw diff