Efferbach commited on
Commit
8de13bf
1 Parent(s): 7656836

End of training

Browse files
all_results.json ADDED
@@ -0,0 +1,20 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "epoch": 25.97,
3
+ "eval_accuracy_background": NaN,
4
+ "eval_accuracy_left": 0.0,
5
+ "eval_accuracy_right": 0.0,
6
+ "eval_iou_background": 0.0,
7
+ "eval_iou_left": 0.0,
8
+ "eval_iou_right": 0.0,
9
+ "eval_loss": 0.08214545249938965,
10
+ "eval_mean_accuracy": 0.0,
11
+ "eval_mean_iou": 0.0,
12
+ "eval_overall_accuracy": 0.0,
13
+ "eval_runtime": 145.4719,
14
+ "eval_samples_per_second": 0.887,
15
+ "eval_steps_per_second": 0.117,
16
+ "train_loss": 0.10369874272346497,
17
+ "train_runtime": 11613.3095,
18
+ "train_samples_per_second": 6.889,
19
+ "train_steps_per_second": 0.861
20
+ }
eval_results.json ADDED
@@ -0,0 +1,16 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "epoch": 25.97,
3
+ "eval_accuracy_background": NaN,
4
+ "eval_accuracy_left": 0.0,
5
+ "eval_accuracy_right": 0.0,
6
+ "eval_iou_background": 0.0,
7
+ "eval_iou_left": 0.0,
8
+ "eval_iou_right": 0.0,
9
+ "eval_loss": 0.08214545249938965,
10
+ "eval_mean_accuracy": 0.0,
11
+ "eval_mean_iou": 0.0,
12
+ "eval_overall_accuracy": 0.0,
13
+ "eval_runtime": 145.4719,
14
+ "eval_samples_per_second": 0.887,
15
+ "eval_steps_per_second": 0.117
16
+ }
runs/Apr08_12-03-00_0ab892ee8a37/events.out.tfevents.1680967161.0ab892ee8a37.47320.2 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:52538990dab7ad84623fda3160d24659ff02802c2d349d17172094bab7d9f3ce
3
+ size 869
train_results.json ADDED
@@ -0,0 +1,7 @@
 
 
 
 
 
 
 
 
1
+ {
2
+ "epoch": 25.97,
3
+ "train_loss": 0.10369874272346497,
4
+ "train_runtime": 11613.3095,
5
+ "train_samples_per_second": 6.889,
6
+ "train_steps_per_second": 0.861
7
+ }
trainer_state.json ADDED
@@ -0,0 +1,1067 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "best_metric": null,
3
+ "best_model_checkpoint": null,
4
+ "epoch": 25.974025974025974,
5
+ "global_step": 10000,
6
+ "is_hyper_param_search": false,
7
+ "is_local_process_zero": true,
8
+ "is_world_process_zero": true,
9
+ "log_history": [
10
+ {
11
+ "epoch": 0.26,
12
+ "learning_rate": 5.9401e-05,
13
+ "loss": 0.9514,
14
+ "step": 100
15
+ },
16
+ {
17
+ "epoch": 0.52,
18
+ "learning_rate": 5.8802000000000004e-05,
19
+ "loss": 0.7058,
20
+ "step": 200
21
+ },
22
+ {
23
+ "epoch": 0.78,
24
+ "learning_rate": 5.8203e-05,
25
+ "loss": 0.5041,
26
+ "step": 300
27
+ },
28
+ {
29
+ "epoch": 1.0,
30
+ "eval_accuracy_background": NaN,
31
+ "eval_accuracy_left": 0.0,
32
+ "eval_accuracy_right": 0.0,
33
+ "eval_iou_background": 0.0,
34
+ "eval_iou_left": 0.0,
35
+ "eval_iou_right": 0.0,
36
+ "eval_loss": 0.33822229504585266,
37
+ "eval_mean_accuracy": 0.0,
38
+ "eval_mean_iou": 0.0,
39
+ "eval_overall_accuracy": 0.0,
40
+ "eval_runtime": 142.7389,
41
+ "eval_samples_per_second": 0.904,
42
+ "eval_steps_per_second": 0.119,
43
+ "step": 385
44
+ },
45
+ {
46
+ "epoch": 1.04,
47
+ "learning_rate": 5.7604e-05,
48
+ "loss": 0.3458,
49
+ "step": 400
50
+ },
51
+ {
52
+ "epoch": 1.3,
53
+ "learning_rate": 5.7005e-05,
54
+ "loss": 0.2466,
55
+ "step": 500
56
+ },
57
+ {
58
+ "epoch": 1.56,
59
+ "learning_rate": 5.6406e-05,
60
+ "loss": 0.19,
61
+ "step": 600
62
+ },
63
+ {
64
+ "epoch": 1.82,
65
+ "learning_rate": 5.5806999999999996e-05,
66
+ "loss": 0.1553,
67
+ "step": 700
68
+ },
69
+ {
70
+ "epoch": 2.0,
71
+ "eval_accuracy_background": NaN,
72
+ "eval_accuracy_left": 0.0,
73
+ "eval_accuracy_right": 0.0,
74
+ "eval_iou_background": 0.0,
75
+ "eval_iou_left": 0.0,
76
+ "eval_iou_right": 0.0,
77
+ "eval_loss": 0.13873086869716644,
78
+ "eval_mean_accuracy": 0.0,
79
+ "eval_mean_iou": 0.0,
80
+ "eval_overall_accuracy": 0.0,
81
+ "eval_runtime": 145.3756,
82
+ "eval_samples_per_second": 0.887,
83
+ "eval_steps_per_second": 0.117,
84
+ "step": 770
85
+ },
86
+ {
87
+ "epoch": 2.08,
88
+ "learning_rate": 5.5208000000000004e-05,
89
+ "loss": 0.1338,
90
+ "step": 800
91
+ },
92
+ {
93
+ "epoch": 2.34,
94
+ "learning_rate": 5.4609000000000005e-05,
95
+ "loss": 0.1184,
96
+ "step": 900
97
+ },
98
+ {
99
+ "epoch": 2.6,
100
+ "learning_rate": 5.401e-05,
101
+ "loss": 0.1087,
102
+ "step": 1000
103
+ },
104
+ {
105
+ "epoch": 2.86,
106
+ "learning_rate": 5.3411e-05,
107
+ "loss": 0.1019,
108
+ "step": 1100
109
+ },
110
+ {
111
+ "epoch": 3.0,
112
+ "eval_accuracy_background": NaN,
113
+ "eval_accuracy_left": 0.0,
114
+ "eval_accuracy_right": 0.0,
115
+ "eval_iou_background": 0.0,
116
+ "eval_iou_left": 0.0,
117
+ "eval_iou_right": 0.0,
118
+ "eval_loss": 0.1036786362528801,
119
+ "eval_mean_accuracy": 0.0,
120
+ "eval_mean_iou": 0.0,
121
+ "eval_overall_accuracy": 0.0,
122
+ "eval_runtime": 143.5246,
123
+ "eval_samples_per_second": 0.899,
124
+ "eval_steps_per_second": 0.118,
125
+ "step": 1155
126
+ },
127
+ {
128
+ "epoch": 3.12,
129
+ "learning_rate": 5.2812e-05,
130
+ "loss": 0.097,
131
+ "step": 1200
132
+ },
133
+ {
134
+ "epoch": 3.38,
135
+ "learning_rate": 5.2213e-05,
136
+ "loss": 0.093,
137
+ "step": 1300
138
+ },
139
+ {
140
+ "epoch": 3.64,
141
+ "learning_rate": 5.1614000000000004e-05,
142
+ "loss": 0.0906,
143
+ "step": 1400
144
+ },
145
+ {
146
+ "epoch": 3.9,
147
+ "learning_rate": 5.1015e-05,
148
+ "loss": 0.0882,
149
+ "step": 1500
150
+ },
151
+ {
152
+ "epoch": 4.0,
153
+ "eval_accuracy_background": NaN,
154
+ "eval_accuracy_left": 0.0,
155
+ "eval_accuracy_right": 0.0,
156
+ "eval_iou_background": 0.0,
157
+ "eval_iou_left": 0.0,
158
+ "eval_iou_right": 0.0,
159
+ "eval_loss": 0.08832325041294098,
160
+ "eval_mean_accuracy": 0.0,
161
+ "eval_mean_iou": 0.0,
162
+ "eval_overall_accuracy": 0.0,
163
+ "eval_runtime": 143.2361,
164
+ "eval_samples_per_second": 0.901,
165
+ "eval_steps_per_second": 0.119,
166
+ "step": 1540
167
+ },
168
+ {
169
+ "epoch": 4.16,
170
+ "learning_rate": 5.0416e-05,
171
+ "loss": 0.0867,
172
+ "step": 1600
173
+ },
174
+ {
175
+ "epoch": 4.42,
176
+ "learning_rate": 4.9817e-05,
177
+ "loss": 0.0854,
178
+ "step": 1700
179
+ },
180
+ {
181
+ "epoch": 4.68,
182
+ "learning_rate": 4.9218e-05,
183
+ "loss": 0.084,
184
+ "step": 1800
185
+ },
186
+ {
187
+ "epoch": 4.94,
188
+ "learning_rate": 4.8619e-05,
189
+ "loss": 0.0828,
190
+ "step": 1900
191
+ },
192
+ {
193
+ "epoch": 5.0,
194
+ "eval_accuracy_background": NaN,
195
+ "eval_accuracy_left": 0.0,
196
+ "eval_accuracy_right": 0.0,
197
+ "eval_iou_background": 0.0,
198
+ "eval_iou_left": 0.0,
199
+ "eval_iou_right": 0.0,
200
+ "eval_loss": 0.08227328956127167,
201
+ "eval_mean_accuracy": 0.0,
202
+ "eval_mean_iou": 0.0,
203
+ "eval_overall_accuracy": 0.0,
204
+ "eval_runtime": 142.7729,
205
+ "eval_samples_per_second": 0.904,
206
+ "eval_steps_per_second": 0.119,
207
+ "step": 1925
208
+ },
209
+ {
210
+ "epoch": 5.19,
211
+ "learning_rate": 4.8020000000000004e-05,
212
+ "loss": 0.0826,
213
+ "step": 2000
214
+ },
215
+ {
216
+ "epoch": 5.45,
217
+ "learning_rate": 4.7421000000000006e-05,
218
+ "loss": 0.0817,
219
+ "step": 2100
220
+ },
221
+ {
222
+ "epoch": 5.71,
223
+ "learning_rate": 4.6822e-05,
224
+ "loss": 0.081,
225
+ "step": 2200
226
+ },
227
+ {
228
+ "epoch": 5.97,
229
+ "learning_rate": 4.6223e-05,
230
+ "loss": 0.0807,
231
+ "step": 2300
232
+ },
233
+ {
234
+ "epoch": 6.0,
235
+ "eval_accuracy_background": NaN,
236
+ "eval_accuracy_left": 0.0,
237
+ "eval_accuracy_right": 0.0,
238
+ "eval_iou_background": 0.0,
239
+ "eval_iou_left": 0.0,
240
+ "eval_iou_right": 0.0,
241
+ "eval_loss": 0.08197005838155746,
242
+ "eval_mean_accuracy": 0.0,
243
+ "eval_mean_iou": 0.0,
244
+ "eval_overall_accuracy": 0.0,
245
+ "eval_runtime": 144.6634,
246
+ "eval_samples_per_second": 0.892,
247
+ "eval_steps_per_second": 0.118,
248
+ "step": 2310
249
+ },
250
+ {
251
+ "epoch": 6.23,
252
+ "learning_rate": 4.5624e-05,
253
+ "loss": 0.0803,
254
+ "step": 2400
255
+ },
256
+ {
257
+ "epoch": 6.49,
258
+ "learning_rate": 4.5025000000000003e-05,
259
+ "loss": 0.0798,
260
+ "step": 2500
261
+ },
262
+ {
263
+ "epoch": 6.75,
264
+ "learning_rate": 4.4426000000000005e-05,
265
+ "loss": 0.0795,
266
+ "step": 2600
267
+ },
268
+ {
269
+ "epoch": 7.0,
270
+ "eval_accuracy_background": NaN,
271
+ "eval_accuracy_left": 0.0,
272
+ "eval_accuracy_right": 0.0,
273
+ "eval_iou_background": 0.0,
274
+ "eval_iou_left": 0.0,
275
+ "eval_iou_right": 0.0,
276
+ "eval_loss": 0.08042579144239426,
277
+ "eval_mean_accuracy": 0.0,
278
+ "eval_mean_iou": 0.0,
279
+ "eval_overall_accuracy": 0.0,
280
+ "eval_runtime": 143.7993,
281
+ "eval_samples_per_second": 0.897,
282
+ "eval_steps_per_second": 0.118,
283
+ "step": 2695
284
+ },
285
+ {
286
+ "epoch": 7.01,
287
+ "learning_rate": 4.3827e-05,
288
+ "loss": 0.0792,
289
+ "step": 2700
290
+ },
291
+ {
292
+ "epoch": 7.27,
293
+ "learning_rate": 4.3228e-05,
294
+ "loss": 0.0789,
295
+ "step": 2800
296
+ },
297
+ {
298
+ "epoch": 7.53,
299
+ "learning_rate": 4.2629e-05,
300
+ "loss": 0.0788,
301
+ "step": 2900
302
+ },
303
+ {
304
+ "epoch": 7.79,
305
+ "learning_rate": 4.203e-05,
306
+ "loss": 0.0786,
307
+ "step": 3000
308
+ },
309
+ {
310
+ "epoch": 8.0,
311
+ "eval_accuracy_background": NaN,
312
+ "eval_accuracy_left": 0.0,
313
+ "eval_accuracy_right": 0.0,
314
+ "eval_iou_background": 0.0,
315
+ "eval_iou_left": 0.0,
316
+ "eval_iou_right": 0.0,
317
+ "eval_loss": 0.078447625041008,
318
+ "eval_mean_accuracy": 0.0,
319
+ "eval_mean_iou": 0.0,
320
+ "eval_overall_accuracy": 0.0,
321
+ "eval_runtime": 143.2832,
322
+ "eval_samples_per_second": 0.9,
323
+ "eval_steps_per_second": 0.119,
324
+ "step": 3080
325
+ },
326
+ {
327
+ "epoch": 8.05,
328
+ "learning_rate": 4.1431e-05,
329
+ "loss": 0.0783,
330
+ "step": 3100
331
+ },
332
+ {
333
+ "epoch": 8.31,
334
+ "learning_rate": 4.0832e-05,
335
+ "loss": 0.0783,
336
+ "step": 3200
337
+ },
338
+ {
339
+ "epoch": 8.57,
340
+ "learning_rate": 4.0233e-05,
341
+ "loss": 0.0778,
342
+ "step": 3300
343
+ },
344
+ {
345
+ "epoch": 8.83,
346
+ "learning_rate": 3.9634e-05,
347
+ "loss": 0.0777,
348
+ "step": 3400
349
+ },
350
+ {
351
+ "epoch": 9.0,
352
+ "eval_accuracy_background": NaN,
353
+ "eval_accuracy_left": 0.0,
354
+ "eval_accuracy_right": 0.0,
355
+ "eval_iou_background": 0.0,
356
+ "eval_iou_left": 0.0,
357
+ "eval_iou_right": 0.0,
358
+ "eval_loss": 0.0785832330584526,
359
+ "eval_mean_accuracy": 0.0,
360
+ "eval_mean_iou": 0.0,
361
+ "eval_overall_accuracy": 0.0,
362
+ "eval_runtime": 143.0294,
363
+ "eval_samples_per_second": 0.902,
364
+ "eval_steps_per_second": 0.119,
365
+ "step": 3465
366
+ },
367
+ {
368
+ "epoch": 9.09,
369
+ "learning_rate": 3.9035e-05,
370
+ "loss": 0.0779,
371
+ "step": 3500
372
+ },
373
+ {
374
+ "epoch": 9.35,
375
+ "learning_rate": 3.8436e-05,
376
+ "loss": 0.0774,
377
+ "step": 3600
378
+ },
379
+ {
380
+ "epoch": 9.61,
381
+ "learning_rate": 3.7837000000000004e-05,
382
+ "loss": 0.0778,
383
+ "step": 3700
384
+ },
385
+ {
386
+ "epoch": 9.87,
387
+ "learning_rate": 3.7238000000000005e-05,
388
+ "loss": 0.0771,
389
+ "step": 3800
390
+ },
391
+ {
392
+ "epoch": 10.0,
393
+ "eval_accuracy_background": NaN,
394
+ "eval_accuracy_left": 0.0,
395
+ "eval_accuracy_right": 0.0,
396
+ "eval_iou_background": 0.0,
397
+ "eval_iou_left": 0.0,
398
+ "eval_iou_right": 0.0,
399
+ "eval_loss": 0.07735682278871536,
400
+ "eval_mean_accuracy": 0.0,
401
+ "eval_mean_iou": 0.0,
402
+ "eval_overall_accuracy": 0.0,
403
+ "eval_runtime": 143.7403,
404
+ "eval_samples_per_second": 0.897,
405
+ "eval_steps_per_second": 0.118,
406
+ "step": 3850
407
+ },
408
+ {
409
+ "epoch": 10.13,
410
+ "learning_rate": 3.6639e-05,
411
+ "loss": 0.0772,
412
+ "step": 3900
413
+ },
414
+ {
415
+ "epoch": 10.39,
416
+ "learning_rate": 3.604e-05,
417
+ "loss": 0.0767,
418
+ "step": 4000
419
+ },
420
+ {
421
+ "epoch": 10.65,
422
+ "learning_rate": 3.544100000000001e-05,
423
+ "loss": 0.077,
424
+ "step": 4100
425
+ },
426
+ {
427
+ "epoch": 10.91,
428
+ "learning_rate": 3.4842e-05,
429
+ "loss": 0.0773,
430
+ "step": 4200
431
+ },
432
+ {
433
+ "epoch": 11.0,
434
+ "eval_accuracy_background": NaN,
435
+ "eval_accuracy_left": 0.0,
436
+ "eval_accuracy_right": 0.0,
437
+ "eval_iou_background": 0.0,
438
+ "eval_iou_left": 0.0,
439
+ "eval_iou_right": 0.0,
440
+ "eval_loss": 0.07747040688991547,
441
+ "eval_mean_accuracy": 0.0,
442
+ "eval_mean_iou": 0.0,
443
+ "eval_overall_accuracy": 0.0,
444
+ "eval_runtime": 143.2937,
445
+ "eval_samples_per_second": 0.9,
446
+ "eval_steps_per_second": 0.119,
447
+ "step": 4235
448
+ },
449
+ {
450
+ "epoch": 11.17,
451
+ "learning_rate": 3.4243000000000004e-05,
452
+ "loss": 0.0767,
453
+ "step": 4300
454
+ },
455
+ {
456
+ "epoch": 11.43,
457
+ "learning_rate": 3.3644000000000005e-05,
458
+ "loss": 0.0768,
459
+ "step": 4400
460
+ },
461
+ {
462
+ "epoch": 11.69,
463
+ "learning_rate": 3.3045000000000006e-05,
464
+ "loss": 0.0765,
465
+ "step": 4500
466
+ },
467
+ {
468
+ "epoch": 11.95,
469
+ "learning_rate": 3.2446e-05,
470
+ "loss": 0.0765,
471
+ "step": 4600
472
+ },
473
+ {
474
+ "epoch": 12.0,
475
+ "eval_accuracy_background": NaN,
476
+ "eval_accuracy_left": 0.0,
477
+ "eval_accuracy_right": 0.0,
478
+ "eval_iou_background": 0.0,
479
+ "eval_iou_left": 0.0,
480
+ "eval_iou_right": 0.0,
481
+ "eval_loss": 0.07821880280971527,
482
+ "eval_mean_accuracy": 0.0,
483
+ "eval_mean_iou": 0.0,
484
+ "eval_overall_accuracy": 0.0,
485
+ "eval_runtime": 143.0726,
486
+ "eval_samples_per_second": 0.902,
487
+ "eval_steps_per_second": 0.119,
488
+ "step": 4620
489
+ },
490
+ {
491
+ "epoch": 12.21,
492
+ "learning_rate": 3.1847e-05,
493
+ "loss": 0.0762,
494
+ "step": 4700
495
+ },
496
+ {
497
+ "epoch": 12.47,
498
+ "learning_rate": 3.1248e-05,
499
+ "loss": 0.0759,
500
+ "step": 4800
501
+ },
502
+ {
503
+ "epoch": 12.73,
504
+ "learning_rate": 3.0649000000000004e-05,
505
+ "loss": 0.0763,
506
+ "step": 4900
507
+ },
508
+ {
509
+ "epoch": 12.99,
510
+ "learning_rate": 3.0050000000000002e-05,
511
+ "loss": 0.0757,
512
+ "step": 5000
513
+ },
514
+ {
515
+ "epoch": 13.0,
516
+ "eval_accuracy_background": NaN,
517
+ "eval_accuracy_left": 0.0,
518
+ "eval_accuracy_right": 0.0,
519
+ "eval_iou_background": 0.0,
520
+ "eval_iou_left": 0.0,
521
+ "eval_iou_right": 0.0,
522
+ "eval_loss": 0.07746042311191559,
523
+ "eval_mean_accuracy": 0.0,
524
+ "eval_mean_iou": 0.0,
525
+ "eval_overall_accuracy": 0.0,
526
+ "eval_runtime": 142.871,
527
+ "eval_samples_per_second": 0.903,
528
+ "eval_steps_per_second": 0.119,
529
+ "step": 5005
530
+ },
531
+ {
532
+ "epoch": 13.25,
533
+ "learning_rate": 2.9451e-05,
534
+ "loss": 0.0758,
535
+ "step": 5100
536
+ },
537
+ {
538
+ "epoch": 13.51,
539
+ "learning_rate": 2.8851999999999998e-05,
540
+ "loss": 0.0756,
541
+ "step": 5200
542
+ },
543
+ {
544
+ "epoch": 13.77,
545
+ "learning_rate": 2.8253e-05,
546
+ "loss": 0.0756,
547
+ "step": 5300
548
+ },
549
+ {
550
+ "epoch": 14.0,
551
+ "eval_accuracy_background": NaN,
552
+ "eval_accuracy_left": 0.0,
553
+ "eval_accuracy_right": 0.0,
554
+ "eval_iou_background": 0.0,
555
+ "eval_iou_left": 0.0,
556
+ "eval_iou_right": 0.0,
557
+ "eval_loss": 0.07735219597816467,
558
+ "eval_mean_accuracy": 0.0,
559
+ "eval_mean_iou": 0.0,
560
+ "eval_overall_accuracy": 0.0,
561
+ "eval_runtime": 147.4271,
562
+ "eval_samples_per_second": 0.875,
563
+ "eval_steps_per_second": 0.115,
564
+ "step": 5390
565
+ },
566
+ {
567
+ "epoch": 14.03,
568
+ "learning_rate": 2.7653999999999996e-05,
569
+ "loss": 0.0756,
570
+ "step": 5400
571
+ },
572
+ {
573
+ "epoch": 14.29,
574
+ "learning_rate": 2.7054999999999998e-05,
575
+ "loss": 0.0758,
576
+ "step": 5500
577
+ },
578
+ {
579
+ "epoch": 14.55,
580
+ "learning_rate": 2.6455999999999995e-05,
581
+ "loss": 0.075,
582
+ "step": 5600
583
+ },
584
+ {
585
+ "epoch": 14.81,
586
+ "learning_rate": 2.5857e-05,
587
+ "loss": 0.0754,
588
+ "step": 5700
589
+ },
590
+ {
591
+ "epoch": 15.0,
592
+ "eval_accuracy_background": NaN,
593
+ "eval_accuracy_left": 0.0,
594
+ "eval_accuracy_right": 0.0,
595
+ "eval_iou_background": 0.0,
596
+ "eval_iou_left": 0.0,
597
+ "eval_iou_right": 0.0,
598
+ "eval_loss": 0.07753156125545502,
599
+ "eval_mean_accuracy": 0.0,
600
+ "eval_mean_iou": 0.0,
601
+ "eval_overall_accuracy": 0.0,
602
+ "eval_runtime": 147.8722,
603
+ "eval_samples_per_second": 0.872,
604
+ "eval_steps_per_second": 0.115,
605
+ "step": 5775
606
+ },
607
+ {
608
+ "epoch": 15.06,
609
+ "learning_rate": 2.5258e-05,
610
+ "loss": 0.075,
611
+ "step": 5800
612
+ },
613
+ {
614
+ "epoch": 15.32,
615
+ "learning_rate": 2.4659e-05,
616
+ "loss": 0.0749,
617
+ "step": 5900
618
+ },
619
+ {
620
+ "epoch": 15.58,
621
+ "learning_rate": 2.406e-05,
622
+ "loss": 0.0745,
623
+ "step": 6000
624
+ },
625
+ {
626
+ "epoch": 15.84,
627
+ "learning_rate": 2.3460999999999998e-05,
628
+ "loss": 0.0746,
629
+ "step": 6100
630
+ },
631
+ {
632
+ "epoch": 16.0,
633
+ "eval_accuracy_background": NaN,
634
+ "eval_accuracy_left": 0.0,
635
+ "eval_accuracy_right": 0.0,
636
+ "eval_iou_background": 0.0,
637
+ "eval_iou_left": 0.0,
638
+ "eval_iou_right": 0.0,
639
+ "eval_loss": 0.0775093138217926,
640
+ "eval_mean_accuracy": 0.0,
641
+ "eval_mean_iou": 0.0,
642
+ "eval_overall_accuracy": 0.0,
643
+ "eval_runtime": 147.9462,
644
+ "eval_samples_per_second": 0.872,
645
+ "eval_steps_per_second": 0.115,
646
+ "step": 6160
647
+ },
648
+ {
649
+ "epoch": 16.1,
650
+ "learning_rate": 2.2862e-05,
651
+ "loss": 0.0751,
652
+ "step": 6200
653
+ },
654
+ {
655
+ "epoch": 16.36,
656
+ "learning_rate": 2.2263e-05,
657
+ "loss": 0.0743,
658
+ "step": 6300
659
+ },
660
+ {
661
+ "epoch": 16.62,
662
+ "learning_rate": 2.1663999999999998e-05,
663
+ "loss": 0.0746,
664
+ "step": 6400
665
+ },
666
+ {
667
+ "epoch": 16.88,
668
+ "learning_rate": 2.1065e-05,
669
+ "loss": 0.074,
670
+ "step": 6500
671
+ },
672
+ {
673
+ "epoch": 17.0,
674
+ "eval_accuracy_background": NaN,
675
+ "eval_accuracy_left": 0.0,
676
+ "eval_accuracy_right": 0.0,
677
+ "eval_iou_background": 0.0,
678
+ "eval_iou_left": 0.0,
679
+ "eval_iou_right": 0.0,
680
+ "eval_loss": 0.0779297724366188,
681
+ "eval_mean_accuracy": 0.0,
682
+ "eval_mean_iou": 0.0,
683
+ "eval_overall_accuracy": 0.0,
684
+ "eval_runtime": 147.7299,
685
+ "eval_samples_per_second": 0.873,
686
+ "eval_steps_per_second": 0.115,
687
+ "step": 6545
688
+ },
689
+ {
690
+ "epoch": 17.14,
691
+ "learning_rate": 2.0465999999999997e-05,
692
+ "loss": 0.0736,
693
+ "step": 6600
694
+ },
695
+ {
696
+ "epoch": 17.4,
697
+ "learning_rate": 1.9866999999999998e-05,
698
+ "loss": 0.0741,
699
+ "step": 6700
700
+ },
701
+ {
702
+ "epoch": 17.66,
703
+ "learning_rate": 1.9267999999999996e-05,
704
+ "loss": 0.0737,
705
+ "step": 6800
706
+ },
707
+ {
708
+ "epoch": 17.92,
709
+ "learning_rate": 1.8669e-05,
710
+ "loss": 0.0736,
711
+ "step": 6900
712
+ },
713
+ {
714
+ "epoch": 18.0,
715
+ "eval_accuracy_background": NaN,
716
+ "eval_accuracy_left": 0.0,
717
+ "eval_accuracy_right": 0.0,
718
+ "eval_iou_background": 0.0,
719
+ "eval_iou_left": 0.0,
720
+ "eval_iou_right": 0.0,
721
+ "eval_loss": 0.07919886708259583,
722
+ "eval_mean_accuracy": 0.0,
723
+ "eval_mean_iou": 0.0,
724
+ "eval_overall_accuracy": 0.0,
725
+ "eval_runtime": 144.6419,
726
+ "eval_samples_per_second": 0.892,
727
+ "eval_steps_per_second": 0.118,
728
+ "step": 6930
729
+ },
730
+ {
731
+ "epoch": 18.18,
732
+ "learning_rate": 1.807e-05,
733
+ "loss": 0.0739,
734
+ "step": 7000
735
+ },
736
+ {
737
+ "epoch": 18.44,
738
+ "learning_rate": 1.7471e-05,
739
+ "loss": 0.0737,
740
+ "step": 7100
741
+ },
742
+ {
743
+ "epoch": 18.7,
744
+ "learning_rate": 1.6872e-05,
745
+ "loss": 0.0743,
746
+ "step": 7200
747
+ },
748
+ {
749
+ "epoch": 18.96,
750
+ "learning_rate": 1.6272999999999998e-05,
751
+ "loss": 0.0737,
752
+ "step": 7300
753
+ },
754
+ {
755
+ "epoch": 19.0,
756
+ "eval_accuracy_background": NaN,
757
+ "eval_accuracy_left": 0.0,
758
+ "eval_accuracy_right": 0.0,
759
+ "eval_iou_background": 0.0,
760
+ "eval_iou_left": 0.0,
761
+ "eval_iou_right": 0.0,
762
+ "eval_loss": 0.08009234070777893,
763
+ "eval_mean_accuracy": 0.0,
764
+ "eval_mean_iou": 0.0,
765
+ "eval_overall_accuracy": 0.0,
766
+ "eval_runtime": 144.5325,
767
+ "eval_samples_per_second": 0.893,
768
+ "eval_steps_per_second": 0.118,
769
+ "step": 7315
770
+ },
771
+ {
772
+ "epoch": 19.22,
773
+ "learning_rate": 1.5674e-05,
774
+ "loss": 0.0731,
775
+ "step": 7400
776
+ },
777
+ {
778
+ "epoch": 19.48,
779
+ "learning_rate": 1.5075000000000002e-05,
780
+ "loss": 0.0731,
781
+ "step": 7500
782
+ },
783
+ {
784
+ "epoch": 19.74,
785
+ "learning_rate": 1.4476e-05,
786
+ "loss": 0.0736,
787
+ "step": 7600
788
+ },
789
+ {
790
+ "epoch": 20.0,
791
+ "learning_rate": 1.3877e-05,
792
+ "loss": 0.073,
793
+ "step": 7700
794
+ },
795
+ {
796
+ "epoch": 20.0,
797
+ "eval_accuracy_background": NaN,
798
+ "eval_accuracy_left": 0.0,
799
+ "eval_accuracy_right": 0.0,
800
+ "eval_iou_background": 0.0,
801
+ "eval_iou_left": 0.0,
802
+ "eval_iou_right": 0.0,
803
+ "eval_loss": 0.08035800606012344,
804
+ "eval_mean_accuracy": 0.0,
805
+ "eval_mean_iou": 0.0,
806
+ "eval_overall_accuracy": 0.0,
807
+ "eval_runtime": 144.0433,
808
+ "eval_samples_per_second": 0.896,
809
+ "eval_steps_per_second": 0.118,
810
+ "step": 7700
811
+ },
812
+ {
813
+ "epoch": 20.26,
814
+ "learning_rate": 1.3277999999999999e-05,
815
+ "loss": 0.0731,
816
+ "step": 7800
817
+ },
818
+ {
819
+ "epoch": 20.52,
820
+ "learning_rate": 1.2678999999999998e-05,
821
+ "loss": 0.0729,
822
+ "step": 7900
823
+ },
824
+ {
825
+ "epoch": 20.78,
826
+ "learning_rate": 1.2079999999999998e-05,
827
+ "loss": 0.0729,
828
+ "step": 8000
829
+ },
830
+ {
831
+ "epoch": 21.0,
832
+ "eval_accuracy_background": NaN,
833
+ "eval_accuracy_left": 0.0,
834
+ "eval_accuracy_right": 0.0,
835
+ "eval_iou_background": 0.0,
836
+ "eval_iou_left": 0.0,
837
+ "eval_iou_right": 0.0,
838
+ "eval_loss": 0.08050834387540817,
839
+ "eval_mean_accuracy": 0.0,
840
+ "eval_mean_iou": 0.0,
841
+ "eval_overall_accuracy": 0.0,
842
+ "eval_runtime": 147.0065,
843
+ "eval_samples_per_second": 0.878,
844
+ "eval_steps_per_second": 0.116,
845
+ "step": 8085
846
+ },
847
+ {
848
+ "epoch": 21.04,
849
+ "learning_rate": 1.1480999999999997e-05,
850
+ "loss": 0.0724,
851
+ "step": 8100
852
+ },
853
+ {
854
+ "epoch": 21.3,
855
+ "learning_rate": 1.0882000000000004e-05,
856
+ "loss": 0.0727,
857
+ "step": 8200
858
+ },
859
+ {
860
+ "epoch": 21.56,
861
+ "learning_rate": 1.0283000000000003e-05,
862
+ "loss": 0.0731,
863
+ "step": 8300
864
+ },
865
+ {
866
+ "epoch": 21.82,
867
+ "learning_rate": 9.684000000000002e-06,
868
+ "loss": 0.0734,
869
+ "step": 8400
870
+ },
871
+ {
872
+ "epoch": 22.0,
873
+ "eval_accuracy_background": NaN,
874
+ "eval_accuracy_left": 0.0,
875
+ "eval_accuracy_right": 0.0,
876
+ "eval_iou_background": 0.0,
877
+ "eval_iou_left": 0.0,
878
+ "eval_iou_right": 0.0,
879
+ "eval_loss": 0.08037494868040085,
880
+ "eval_mean_accuracy": 0.0,
881
+ "eval_mean_iou": 0.0,
882
+ "eval_overall_accuracy": 0.0,
883
+ "eval_runtime": 144.7441,
884
+ "eval_samples_per_second": 0.891,
885
+ "eval_steps_per_second": 0.117,
886
+ "step": 8470
887
+ },
888
+ {
889
+ "epoch": 22.08,
890
+ "learning_rate": 9.085000000000002e-06,
891
+ "loss": 0.0722,
892
+ "step": 8500
893
+ },
894
+ {
895
+ "epoch": 22.34,
896
+ "learning_rate": 8.486000000000001e-06,
897
+ "loss": 0.0727,
898
+ "step": 8600
899
+ },
900
+ {
901
+ "epoch": 22.6,
902
+ "learning_rate": 7.887000000000001e-06,
903
+ "loss": 0.0729,
904
+ "step": 8700
905
+ },
906
+ {
907
+ "epoch": 22.86,
908
+ "learning_rate": 7.2879999999999995e-06,
909
+ "loss": 0.0726,
910
+ "step": 8800
911
+ },
912
+ {
913
+ "epoch": 23.0,
914
+ "eval_accuracy_background": NaN,
915
+ "eval_accuracy_left": 0.0,
916
+ "eval_accuracy_right": 0.0,
917
+ "eval_iou_background": 0.0,
918
+ "eval_iou_left": 0.0,
919
+ "eval_iou_right": 0.0,
920
+ "eval_loss": 0.08105623722076416,
921
+ "eval_mean_accuracy": 0.0,
922
+ "eval_mean_iou": 0.0,
923
+ "eval_overall_accuracy": 0.0,
924
+ "eval_runtime": 143.4472,
925
+ "eval_samples_per_second": 0.899,
926
+ "eval_steps_per_second": 0.119,
927
+ "step": 8855
928
+ },
929
+ {
930
+ "epoch": 23.12,
931
+ "learning_rate": 6.688999999999999e-06,
932
+ "loss": 0.0724,
933
+ "step": 8900
934
+ },
935
+ {
936
+ "epoch": 23.38,
937
+ "learning_rate": 6.0899999999999984e-06,
938
+ "loss": 0.0725,
939
+ "step": 9000
940
+ },
941
+ {
942
+ "epoch": 23.64,
943
+ "learning_rate": 5.490999999999998e-06,
944
+ "loss": 0.0723,
945
+ "step": 9100
946
+ },
947
+ {
948
+ "epoch": 23.9,
949
+ "learning_rate": 4.891999999999997e-06,
950
+ "loss": 0.0726,
951
+ "step": 9200
952
+ },
953
+ {
954
+ "epoch": 24.0,
955
+ "eval_accuracy_background": NaN,
956
+ "eval_accuracy_left": 0.0,
957
+ "eval_accuracy_right": 0.0,
958
+ "eval_iou_background": 0.0,
959
+ "eval_iou_left": 0.0,
960
+ "eval_iou_right": 0.0,
961
+ "eval_loss": 0.08159284293651581,
962
+ "eval_mean_accuracy": 0.0,
963
+ "eval_mean_iou": 0.0,
964
+ "eval_overall_accuracy": 0.0,
965
+ "eval_runtime": 145.0941,
966
+ "eval_samples_per_second": 0.889,
967
+ "eval_steps_per_second": 0.117,
968
+ "step": 9240
969
+ },
970
+ {
971
+ "epoch": 24.16,
972
+ "learning_rate": 4.292999999999997e-06,
973
+ "loss": 0.0723,
974
+ "step": 9300
975
+ },
976
+ {
977
+ "epoch": 24.42,
978
+ "learning_rate": 3.694000000000003e-06,
979
+ "loss": 0.0723,
980
+ "step": 9400
981
+ },
982
+ {
983
+ "epoch": 24.68,
984
+ "learning_rate": 3.0950000000000026e-06,
985
+ "loss": 0.0722,
986
+ "step": 9500
987
+ },
988
+ {
989
+ "epoch": 24.94,
990
+ "learning_rate": 2.496000000000002e-06,
991
+ "loss": 0.0721,
992
+ "step": 9600
993
+ },
994
+ {
995
+ "epoch": 25.0,
996
+ "eval_accuracy_background": NaN,
997
+ "eval_accuracy_left": 0.0,
998
+ "eval_accuracy_right": 0.0,
999
+ "eval_iou_background": 0.0,
1000
+ "eval_iou_left": 0.0,
1001
+ "eval_iou_right": 0.0,
1002
+ "eval_loss": 0.08221694082021713,
1003
+ "eval_mean_accuracy": 0.0,
1004
+ "eval_mean_iou": 0.0,
1005
+ "eval_overall_accuracy": 0.0,
1006
+ "eval_runtime": 144.3494,
1007
+ "eval_samples_per_second": 0.894,
1008
+ "eval_steps_per_second": 0.118,
1009
+ "step": 9625
1010
+ },
1011
+ {
1012
+ "epoch": 25.19,
1013
+ "learning_rate": 1.8970000000000013e-06,
1014
+ "loss": 0.072,
1015
+ "step": 9700
1016
+ },
1017
+ {
1018
+ "epoch": 25.45,
1019
+ "learning_rate": 1.298000000000001e-06,
1020
+ "loss": 0.0726,
1021
+ "step": 9800
1022
+ },
1023
+ {
1024
+ "epoch": 25.71,
1025
+ "learning_rate": 6.990000000000005e-07,
1026
+ "loss": 0.0722,
1027
+ "step": 9900
1028
+ },
1029
+ {
1030
+ "epoch": 25.97,
1031
+ "learning_rate": 1e-07,
1032
+ "loss": 0.0727,
1033
+ "step": 10000
1034
+ },
1035
+ {
1036
+ "epoch": 25.97,
1037
+ "eval_accuracy_background": NaN,
1038
+ "eval_accuracy_left": 0.0,
1039
+ "eval_accuracy_right": 0.0,
1040
+ "eval_iou_background": 0.0,
1041
+ "eval_iou_left": 0.0,
1042
+ "eval_iou_right": 0.0,
1043
+ "eval_loss": 0.08214545249938965,
1044
+ "eval_mean_accuracy": 0.0,
1045
+ "eval_mean_iou": 0.0,
1046
+ "eval_overall_accuracy": 0.0,
1047
+ "eval_runtime": 143.8508,
1048
+ "eval_samples_per_second": 0.897,
1049
+ "eval_steps_per_second": 0.118,
1050
+ "step": 10000
1051
+ },
1052
+ {
1053
+ "epoch": 25.97,
1054
+ "step": 10000,
1055
+ "total_flos": 2.70322107117696e+18,
1056
+ "train_loss": 0.10369874272346497,
1057
+ "train_runtime": 11613.3095,
1058
+ "train_samples_per_second": 6.889,
1059
+ "train_steps_per_second": 0.861
1060
+ }
1061
+ ],
1062
+ "max_steps": 10000,
1063
+ "num_train_epochs": 26,
1064
+ "total_flos": 2.70322107117696e+18,
1065
+ "trial_name": null,
1066
+ "trial_params": null
1067
+ }