Kevin King
committed on
Upload folder using huggingface_hub
Browse files
- README.md +1 -1
- replay.mp4 +2 -2
- sf_log.txt +107 -0
README.md
CHANGED
@@ -15,7 +15,7 @@ model-index:
|
|
15 |
type: doom_health_gathering_supreme
|
16 |
metrics:
|
17 |
- type: mean_reward
|
18 |
-
value:
|
19 |
name: mean_reward
|
20 |
verified: false
|
21 |
---
|
|
|
15 |
type: doom_health_gathering_supreme
|
16 |
metrics:
|
17 |
- type: mean_reward
|
18 |
+
value: 6.43 +/- 1.43
|
19 |
name: mean_reward
|
20 |
verified: false
|
21 |
---
|
replay.mp4
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
-
size
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:7c2846299f6fafb81feed852f02a6a4c6c95525c15ccf9bdb42848a1dce510f9
|
3 |
+
size 11960428
|
sf_log.txt
CHANGED
@@ -1121,3 +1121,110 @@ main_loop: 1150.4710
|
|
1121 |
[2024-07-24 19:33:15,594][02885] Avg episode rewards: #0: 22.838, true rewards: #0: 9.938
|
1122 |
[2024-07-24 19:33:15,596][02885] Avg episode reward: 22.838, avg true_objective: 9.938
|
1123 |
[2024-07-24 19:34:17,803][02885] Replay video saved to /content/train_dir/default_experiment/replay.mp4!
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1121 |
[2024-07-24 19:33:15,594][02885] Avg episode rewards: #0: 22.838, true rewards: #0: 9.938
|
1122 |
[2024-07-24 19:33:15,596][02885] Avg episode reward: 22.838, avg true_objective: 9.938
|
1123 |
[2024-07-24 19:34:17,803][02885] Replay video saved to /content/train_dir/default_experiment/replay.mp4!
|
1124 |
+
[2024-07-24 19:34:23,227][02885] The model has been pushed to https://huggingface.co/dergky1/rl_course_vizdoom_health_gathering_supreme
|
1125 |
+
[2024-07-24 19:42:02,699][02885] Loading existing experiment configuration from /content/train_dir/default_experiment/config.json
|
1126 |
+
[2024-07-24 19:42:02,704][02885] Overriding arg 'num_workers' with value 1 passed from command line
|
1127 |
+
[2024-07-24 19:42:02,706][02885] Adding new argument 'no_render'=True that is not in the saved config file!
|
1128 |
+
[2024-07-24 19:42:02,707][02885] Adding new argument 'save_video'=True that is not in the saved config file!
|
1129 |
+
[2024-07-24 19:42:02,709][02885] Adding new argument 'video_frames'=1000000000.0 that is not in the saved config file!
|
1130 |
+
[2024-07-24 19:42:02,714][02885] Adding new argument 'video_name'=None that is not in the saved config file!
|
1131 |
+
[2024-07-24 19:42:02,715][02885] Adding new argument 'max_num_frames'=100000 that is not in the saved config file!
|
1132 |
+
[2024-07-24 19:42:02,717][02885] Adding new argument 'max_num_episodes'=10 that is not in the saved config file!
|
1133 |
+
[2024-07-24 19:42:02,718][02885] Adding new argument 'push_to_hub'=True that is not in the saved config file!
|
1134 |
+
[2024-07-24 19:42:02,720][02885] Adding new argument 'hf_repository'='dergky1/rl_course_vizdoom_health_gathering_supreme' that is not in the saved config file!
|
1135 |
+
[2024-07-24 19:42:02,724][02885] Adding new argument 'policy_index'=0 that is not in the saved config file!
|
1136 |
+
[2024-07-24 19:42:02,725][02885] Adding new argument 'eval_deterministic'=False that is not in the saved config file!
|
1137 |
+
[2024-07-24 19:42:02,730][02885] Adding new argument 'train_script'=None that is not in the saved config file!
|
1138 |
+
[2024-07-24 19:42:02,734][02885] Adding new argument 'enjoy_script'=None that is not in the saved config file!
|
1139 |
+
[2024-07-24 19:42:02,736][02885] Using frameskip 1 and render_action_repeat=4 for evaluation
|
1140 |
+
[2024-07-24 19:42:02,779][02885] RunningMeanStd input shape: (3, 72, 128)
|
1141 |
+
[2024-07-24 19:42:02,782][02885] RunningMeanStd input shape: (1,)
|
1142 |
+
[2024-07-24 19:42:02,801][02885] ConvEncoder: input_channels=3
|
1143 |
+
[2024-07-24 19:42:02,865][02885] Conv encoder output size: 512
|
1144 |
+
[2024-07-24 19:42:02,868][02885] Policy head output size: 512
|
1145 |
+
[2024-07-24 19:42:02,903][02885] Loading state from checkpoint /content/train_dir/default_experiment/checkpoint_p0/checkpoint_000000978_4005888.pth...
|
1146 |
+
[2024-07-24 19:42:03,570][02885] Num frames 100...
|
1147 |
+
[2024-07-24 19:42:03,752][02885] Num frames 200...
|
1148 |
+
[2024-07-24 19:42:03,929][02885] Num frames 300...
|
1149 |
+
[2024-07-24 19:42:04,126][02885] Num frames 400...
|
1150 |
+
[2024-07-24 19:42:04,273][02885] Avg episode rewards: #0: 5.480, true rewards: #0: 4.480
|
1151 |
+
[2024-07-24 19:42:04,275][02885] Avg episode reward: 5.480, avg true_objective: 4.480
|
1152 |
+
[2024-07-24 19:42:04,372][02885] Num frames 500...
|
1153 |
+
[2024-07-24 19:42:04,563][02885] Num frames 600...
|
1154 |
+
[2024-07-24 19:42:04,751][02885] Num frames 700...
|
1155 |
+
[2024-07-24 19:42:04,957][02885] Num frames 800...
|
1156 |
+
[2024-07-24 19:42:05,188][02885] Num frames 900...
|
1157 |
+
[2024-07-24 19:42:05,343][02885] Num frames 1000...
|
1158 |
+
[2024-07-24 19:42:05,469][02885] Num frames 1100...
|
1159 |
+
[2024-07-24 19:42:05,593][02885] Num frames 1200...
|
1160 |
+
[2024-07-24 19:42:05,767][02885] Avg episode rewards: #0: 10.950, true rewards: #0: 6.450
|
1161 |
+
[2024-07-24 19:42:05,769][02885] Avg episode reward: 10.950, avg true_objective: 6.450
|
1162 |
+
[2024-07-24 19:42:05,785][02885] Num frames 1300...
|
1163 |
+
[2024-07-24 19:42:05,922][02885] Num frames 1400...
|
1164 |
+
[2024-07-24 19:42:06,060][02885] Num frames 1500...
|
1165 |
+
[2024-07-24 19:42:06,187][02885] Num frames 1600...
|
1166 |
+
[2024-07-24 19:42:06,315][02885] Num frames 1700...
|
1167 |
+
[2024-07-24 19:42:06,440][02885] Num frames 1800...
|
1168 |
+
[2024-07-24 19:42:06,578][02885] Avg episode rewards: #0: 10.553, true rewards: #0: 6.220
|
1169 |
+
[2024-07-24 19:42:06,580][02885] Avg episode reward: 10.553, avg true_objective: 6.220
|
1170 |
+
[2024-07-24 19:42:06,628][02885] Num frames 1900...
|
1171 |
+
[2024-07-24 19:42:06,757][02885] Num frames 2000...
|
1172 |
+
[2024-07-24 19:42:06,883][02885] Num frames 2100...
|
1173 |
+
[2024-07-24 19:42:07,024][02885] Num frames 2200...
|
1174 |
+
[2024-07-24 19:42:07,165][02885] Num frames 2300...
|
1175 |
+
[2024-07-24 19:42:07,240][02885] Avg episode rewards: #0: 9.285, true rewards: #0: 5.785
|
1176 |
+
[2024-07-24 19:42:07,242][02885] Avg episode reward: 9.285, avg true_objective: 5.785
|
1177 |
+
[2024-07-24 19:42:07,353][02885] Num frames 2400...
|
1178 |
+
[2024-07-24 19:42:07,483][02885] Num frames 2500...
|
1179 |
+
[2024-07-24 19:42:07,606][02885] Num frames 2600...
|
1180 |
+
[2024-07-24 19:42:07,736][02885] Num frames 2700...
|
1181 |
+
[2024-07-24 19:42:07,863][02885] Num frames 2800...
|
1182 |
+
[2024-07-24 19:42:08,001][02885] Num frames 2900...
|
1183 |
+
[2024-07-24 19:42:08,140][02885] Num frames 3000...
|
1184 |
+
[2024-07-24 19:42:08,261][02885] Avg episode rewards: #0: 9.900, true rewards: #0: 6.100
|
1185 |
+
[2024-07-24 19:42:08,264][02885] Avg episode reward: 9.900, avg true_objective: 6.100
|
1186 |
+
[2024-07-24 19:42:08,331][02885] Num frames 3100...
|
1187 |
+
[2024-07-24 19:42:08,460][02885] Num frames 3200...
|
1188 |
+
[2024-07-24 19:42:08,585][02885] Num frames 3300...
|
1189 |
+
[2024-07-24 19:42:08,716][02885] Num frames 3400...
|
1190 |
+
[2024-07-24 19:42:08,844][02885] Num frames 3500...
|
1191 |
+
[2024-07-24 19:42:09,015][02885] Avg episode rewards: #0: 9.805, true rewards: #0: 5.972
|
1192 |
+
[2024-07-24 19:42:09,017][02885] Avg episode reward: 9.805, avg true_objective: 5.972
|
1193 |
+
[2024-07-24 19:42:09,042][02885] Num frames 3600...
|
1194 |
+
[2024-07-24 19:42:09,178][02885] Num frames 3700...
|
1195 |
+
[2024-07-24 19:42:09,304][02885] Num frames 3800...
|
1196 |
+
[2024-07-24 19:42:09,429][02885] Num frames 3900...
|
1197 |
+
[2024-07-24 19:42:09,557][02885] Num frames 4000...
|
1198 |
+
[2024-07-24 19:42:09,683][02885] Num frames 4100...
|
1199 |
+
[2024-07-24 19:42:09,808][02885] Num frames 4200...
|
1200 |
+
[2024-07-24 19:42:09,892][02885] Avg episode rewards: #0: 9.889, true rewards: #0: 6.031
|
1201 |
+
[2024-07-24 19:42:09,898][02885] Avg episode reward: 9.889, avg true_objective: 6.031
|
1202 |
+
[2024-07-24 19:42:10,010][02885] Num frames 4300...
|
1203 |
+
[2024-07-24 19:42:10,151][02885] Num frames 4400...
|
1204 |
+
[2024-07-24 19:42:10,281][02885] Num frames 4500...
|
1205 |
+
[2024-07-24 19:42:10,407][02885] Num frames 4600...
|
1206 |
+
[2024-07-24 19:42:10,532][02885] Num frames 4700...
|
1207 |
+
[2024-07-24 19:42:10,664][02885] Num frames 4800...
|
1208 |
+
[2024-07-24 19:42:10,796][02885] Avg episode rewards: #0: 9.828, true rewards: #0: 6.077
|
1209 |
+
[2024-07-24 19:42:10,798][02885] Avg episode reward: 9.828, avg true_objective: 6.077
|
1210 |
+
[2024-07-24 19:42:10,849][02885] Num frames 4900...
|
1211 |
+
[2024-07-24 19:42:10,982][02885] Num frames 5000...
|
1212 |
+
[2024-07-24 19:42:11,111][02885] Num frames 5100...
|
1213 |
+
[2024-07-24 19:42:11,246][02885] Num frames 5200...
|
1214 |
+
[2024-07-24 19:42:11,371][02885] Num frames 5300...
|
1215 |
+
[2024-07-24 19:42:11,500][02885] Num frames 5400...
|
1216 |
+
[2024-07-24 19:42:11,626][02885] Num frames 5500...
|
1217 |
+
[2024-07-24 19:42:11,754][02885] Num frames 5600...
|
1218 |
+
[2024-07-24 19:42:11,883][02885] Num frames 5700...
|
1219 |
+
[2024-07-24 19:42:12,023][02885] Avg episode rewards: #0: 10.953, true rewards: #0: 6.398
|
1220 |
+
[2024-07-24 19:42:12,025][02885] Avg episode reward: 10.953, avg true_objective: 6.398
|
1221 |
+
[2024-07-24 19:42:12,082][02885] Num frames 5800...
|
1222 |
+
[2024-07-24 19:42:12,220][02885] Num frames 5900...
|
1223 |
+
[2024-07-24 19:42:12,345][02885] Num frames 6000...
|
1224 |
+
[2024-07-24 19:42:12,471][02885] Num frames 6100...
|
1225 |
+
[2024-07-24 19:42:12,601][02885] Num frames 6200...
|
1226 |
+
[2024-07-24 19:42:12,729][02885] Num frames 6300...
|
1227 |
+
[2024-07-24 19:42:12,868][02885] Num frames 6400...
|
1228 |
+
[2024-07-24 19:42:12,973][02885] Avg episode rewards: #0: 10.930, true rewards: #0: 6.430
|
1229 |
+
[2024-07-24 19:42:12,976][02885] Avg episode reward: 10.930, avg true_objective: 6.430
|
1230 |
+
[2024-07-24 19:42:51,453][02885] Replay video saved to /content/train_dir/default_experiment/replay.mp4!
|