Metal079 committed on
Commit
8a95184
1 Parent(s): 05a806e

New better model

Browse files
sonic/config.json CHANGED
@@ -20,7 +20,7 @@
20
  "id2label": {
21
  "0": "Tails the fox",
22
  "1": "Amy Rose",
23
- "10": "Shadow the hedgehog",
24
  "11": "Sally Acorn",
25
  "12": "Tangle the lemur",
26
  "13": "mobian",
@@ -30,7 +30,7 @@
30
  "17": "Tikal the echidna",
31
  "18": "Wave the swallow",
32
  "19": "Jet the hawk",
33
- "2": "Rogue the bat",
34
  "20": "Honey the cat",
35
  "21": "Surge the tenrec",
36
  "22": "Starline the platypus",
@@ -44,35 +44,35 @@
44
  "3": "Whisper the wolf",
45
  "30": "Storm the albatross",
46
  "31": "Maria Robotnik",
47
- "4": "Knuckles the echidna",
48
- "5": "Blaze the cat",
49
- "6": "Silver the hedgehog",
50
- "7": "Cream the rabbit",
51
- "8": "Vanilla the rabbit",
52
- "9": "Sonic the hedgehog"
53
  },
54
  "image_size": 384,
55
  "initializer_range": 0.02,
56
  "label2id": {
57
  "Amy Rose": "1",
58
  "Big the cat": "15",
59
- "Blaze the cat": "5",
60
  "Bunnie Rabbot": "28",
61
  "Charmy the bee": "25",
62
  "Cosmo the seedrian": "14",
63
- "Cream the rabbit": "7",
64
  "Espio the chameleon": "26",
65
  "Honey the cat": "20",
66
  "Jet the hawk": "19",
67
- "Knuckles the echidna": "4",
68
  "Maria Robotnik": "31",
69
  "Marine the Raccoon": "29",
70
  "Mighty the armadillo": "23",
71
- "Rogue the bat": "2",
72
  "Sally Acorn": "11",
73
- "Shadow the hedgehog": "10",
74
- "Silver the hedgehog": "6",
75
- "Sonic the hedgehog": "9",
76
  "Starline the platypus": "22",
77
  "Sticks the badger": "16",
78
  "Storm the albatross": "30",
@@ -80,7 +80,7 @@
80
  "Tails the fox": "0",
81
  "Tangle the lemur": "12",
82
  "Tikal the echidna": "17",
83
- "Vanilla the rabbit": "8",
84
  "Vector the crocodile": "24",
85
  "Wave the swallow": "18",
86
  "Whisper the wolf": "3",
 
20
  "id2label": {
21
  "0": "Tails the fox",
22
  "1": "Amy Rose",
23
+ "10": "Sonic the hedgehog",
24
  "11": "Sally Acorn",
25
  "12": "Tangle the lemur",
26
  "13": "mobian",
 
30
  "17": "Tikal the echidna",
31
  "18": "Wave the swallow",
32
  "19": "Jet the hawk",
33
+ "2": "Knuckles the echidna",
34
  "20": "Honey the cat",
35
  "21": "Surge the tenrec",
36
  "22": "Starline the platypus",
 
44
  "3": "Whisper the wolf",
45
  "30": "Storm the albatross",
46
  "31": "Maria Robotnik",
47
+ "4": "Rogue the bat",
48
+ "5": "Silver the hedgehog",
49
+ "6": "Blaze the cat",
50
+ "7": "Vanilla the rabbit",
51
+ "8": "Cream the rabbit",
52
+ "9": "Shadow the hedgehog"
53
  },
54
  "image_size": 384,
55
  "initializer_range": 0.02,
56
  "label2id": {
57
  "Amy Rose": "1",
58
  "Big the cat": "15",
59
+ "Blaze the cat": "6",
60
  "Bunnie Rabbot": "28",
61
  "Charmy the bee": "25",
62
  "Cosmo the seedrian": "14",
63
+ "Cream the rabbit": "8",
64
  "Espio the chameleon": "26",
65
  "Honey the cat": "20",
66
  "Jet the hawk": "19",
67
+ "Knuckles the echidna": "2",
68
  "Maria Robotnik": "31",
69
  "Marine the Raccoon": "29",
70
  "Mighty the armadillo": "23",
71
+ "Rogue the bat": "4",
72
  "Sally Acorn": "11",
73
+ "Shadow the hedgehog": "9",
74
+ "Silver the hedgehog": "5",
75
+ "Sonic the hedgehog": "10",
76
  "Starline the platypus": "22",
77
  "Sticks the badger": "16",
78
  "Storm the albatross": "30",
 
80
  "Tails the fox": "0",
81
  "Tangle the lemur": "12",
82
  "Tikal the echidna": "17",
83
+ "Vanilla the rabbit": "7",
84
  "Vector the crocodile": "24",
85
  "Wave the swallow": "18",
86
  "Whisper the wolf": "3",
sonic/pytorch_model.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:ec5e3d6a60bdf3f519adb879379016d6bd97bb046a8f5a18afaac0cbae52c570
3
  size 350515757
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1f52490f57b1e76d2aa86890ff44ec63cde9b7581f02c8fffac5292887bf7565
3
  size 350515757
sonic/trainer_state.json CHANGED
@@ -1,8 +1,8 @@
1
  {
2
- "best_metric": 0.08468733727931976,
3
- "best_model_checkpoint": "./SonicCharacterClassifier\\checkpoint-1600",
4
- "epoch": 6.042296072507553,
5
- "global_step": 2000,
6
  "is_hyper_param_search": false,
7
  "is_local_process_zero": true,
8
  "is_world_process_zero": true,
@@ -10,177 +10,262 @@
10
  {
11
  "epoch": 0.6,
12
  "learning_rate": 4.6978851963746225e-05,
13
- "loss": 0.2038,
14
  "step": 200
15
  },
16
  {
17
  "epoch": 0.6,
18
- "eval_accuracy": 0.9509220795568983,
19
- "eval_loss": 0.1493668258190155,
20
- "eval_precision": 0.4276334957981484,
21
- "eval_recall": 0.34057603409646653,
22
- "eval_runtime": 245.2223,
23
- "eval_samples_per_second": 8.099,
24
- "eval_steps_per_second": 1.015,
25
  "step": 200
26
  },
27
  {
28
  "epoch": 1.21,
29
  "learning_rate": 4.395770392749245e-05,
30
- "loss": 0.1299,
31
  "step": 400
32
  },
33
  {
34
  "epoch": 1.21,
35
- "eval_accuracy": 0.9626132930513596,
36
- "eval_loss": 0.11390183866024017,
37
- "eval_precision": 0.6821628829936983,
38
- "eval_recall": 0.6035811496119172,
39
- "eval_runtime": 245.5675,
40
- "eval_samples_per_second": 8.087,
41
- "eval_steps_per_second": 1.014,
42
  "step": 400
43
  },
44
  {
45
  "epoch": 1.81,
46
  "learning_rate": 4.093655589123867e-05,
47
- "loss": 0.0952,
48
  "step": 600
49
  },
50
  {
51
  "epoch": 1.81,
52
- "eval_accuracy": 0.9677901560926485,
53
- "eval_loss": 0.10017536580562592,
54
- "eval_precision": 0.7746363586620384,
55
- "eval_recall": 0.71393109788423,
56
- "eval_runtime": 246.2016,
57
- "eval_samples_per_second": 8.067,
58
- "eval_steps_per_second": 1.011,
59
  "step": 600
60
  },
61
  {
62
  "epoch": 2.42,
63
  "learning_rate": 3.79154078549849e-05,
64
- "loss": 0.0681,
65
  "step": 800
66
  },
67
  {
68
  "epoch": 2.42,
69
- "eval_accuracy": 0.9708113041289023,
70
- "eval_loss": 0.09041494876146317,
71
- "eval_precision": 0.8065139068160218,
72
- "eval_recall": 0.7231326368063123,
73
- "eval_runtime": 245.4942,
74
- "eval_samples_per_second": 8.09,
75
- "eval_steps_per_second": 1.014,
76
  "step": 800
77
  },
78
  {
79
  "epoch": 3.02,
80
  "learning_rate": 3.489425981873112e-05,
81
- "loss": 0.0608,
82
  "step": 1000
83
  },
84
  {
85
  "epoch": 3.02,
86
- "eval_accuracy": 0.972904078549849,
87
- "eval_loss": 0.08679082244634628,
88
- "eval_precision": 0.8209949551458537,
89
- "eval_recall": 0.7289373926706963,
90
- "eval_runtime": 244.3239,
91
- "eval_samples_per_second": 8.129,
92
- "eval_steps_per_second": 1.019,
93
  "step": 1000
94
  },
95
  {
96
  "epoch": 3.63,
97
  "learning_rate": 3.187311178247734e-05,
98
- "loss": 0.0393,
99
  "step": 1200
100
  },
101
  {
102
  "epoch": 3.63,
103
- "eval_accuracy": 0.9730771651560927,
104
- "eval_loss": 0.08753738552331924,
105
- "eval_precision": 0.8360383490292852,
106
- "eval_recall": 0.7486598211097333,
107
- "eval_runtime": 248.2529,
108
- "eval_samples_per_second": 8.0,
109
- "eval_steps_per_second": 1.003,
110
  "step": 1200
111
  },
112
  {
113
  "epoch": 4.23,
114
  "learning_rate": 2.8851963746223565e-05,
115
- "loss": 0.0347,
116
  "step": 1400
117
  },
118
  {
119
  "epoch": 4.23,
120
- "eval_accuracy": 0.9733761329305136,
121
- "eval_loss": 0.08492986112833023,
122
- "eval_precision": 0.8388275873170129,
123
- "eval_recall": 0.7801557843198007,
124
- "eval_runtime": 248.4693,
125
- "eval_samples_per_second": 7.993,
126
- "eval_steps_per_second": 1.002,
127
  "step": 1400
128
  },
129
  {
130
  "epoch": 4.83,
131
  "learning_rate": 2.583081570996979e-05,
132
- "loss": 0.0256,
133
  "step": 1600
134
  },
135
  {
136
  "epoch": 4.83,
137
- "eval_accuracy": 0.9739583333333334,
138
- "eval_loss": 0.08468733727931976,
139
- "eval_precision": 0.8475558611132625,
140
- "eval_recall": 0.788949676665331,
141
- "eval_runtime": 248.7261,
142
- "eval_samples_per_second": 7.985,
143
- "eval_steps_per_second": 1.001,
144
  "step": 1600
145
  },
146
  {
147
  "epoch": 5.44,
148
  "learning_rate": 2.2809667673716012e-05,
149
- "loss": 0.0191,
150
  "step": 1800
151
  },
152
  {
153
  "epoch": 5.44,
154
- "eval_accuracy": 0.9742573011077543,
155
- "eval_loss": 0.0882001668214798,
156
- "eval_precision": 0.845859505500522,
157
- "eval_recall": 0.7649921950675245,
158
- "eval_runtime": 251.833,
159
- "eval_samples_per_second": 7.886,
160
- "eval_steps_per_second": 0.989,
161
  "step": 1800
162
  },
163
  {
164
  "epoch": 6.04,
165
  "learning_rate": 1.9788519637462235e-05,
166
- "loss": 0.0154,
167
  "step": 2000
168
  },
169
  {
170
  "epoch": 6.04,
171
- "eval_accuracy": 0.9743674471299094,
172
- "eval_loss": 0.08864131569862366,
173
- "eval_precision": 0.8535254440088273,
174
- "eval_recall": 0.7735381205368478,
175
- "eval_runtime": 245.1302,
176
- "eval_samples_per_second": 8.102,
177
- "eval_steps_per_second": 1.016,
178
  "step": 2000
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
179
  }
180
  ],
181
  "max_steps": 3310,
182
  "num_train_epochs": 10,
183
- "total_flos": 1.1154739870524506e+19,
184
  "trial_name": null,
185
  "trial_params": null
186
  }
 
1
  {
2
+ "best_metric": 0.0789622887969017,
3
+ "best_model_checkpoint": "./SonicCharacterClassifier\\checkpoint-1800",
4
+ "epoch": 9.06344410876133,
5
+ "global_step": 3000,
6
  "is_hyper_param_search": false,
7
  "is_local_process_zero": true,
8
  "is_world_process_zero": true,
 
10
  {
11
  "epoch": 0.6,
12
  "learning_rate": 4.6978851963746225e-05,
13
+ "loss": 0.2032,
14
  "step": 200
15
  },
16
  {
17
  "epoch": 0.6,
18
+ "eval_accuracy": 0.9495591939546599,
19
+ "eval_loss": 0.1497950255870819,
20
+ "eval_precision": 0.38202921623576536,
21
+ "eval_recall": 0.2866420054831203,
22
+ "eval_runtime": 264.6722,
23
+ "eval_samples_per_second": 7.5,
24
+ "eval_steps_per_second": 0.941,
25
  "step": 200
26
  },
27
  {
28
  "epoch": 1.21,
29
  "learning_rate": 4.395770392749245e-05,
30
+ "loss": 0.1244,
31
  "step": 400
32
  },
33
  {
34
  "epoch": 1.21,
35
+ "eval_accuracy": 0.9624212846347607,
36
+ "eval_loss": 0.1109040230512619,
37
+ "eval_precision": 0.6335885608933468,
38
+ "eval_recall": 0.5364579884489264,
39
+ "eval_runtime": 261.6322,
40
+ "eval_samples_per_second": 7.587,
41
+ "eval_steps_per_second": 0.952,
42
  "step": 400
43
  },
44
  {
45
  "epoch": 1.81,
46
  "learning_rate": 4.093655589123867e-05,
47
+ "loss": 0.0902,
48
  "step": 600
49
  },
50
  {
51
  "epoch": 1.81,
52
+ "eval_accuracy": 0.9697890428211587,
53
+ "eval_loss": 0.09568421542644501,
54
+ "eval_precision": 0.7973267857987819,
55
+ "eval_recall": 0.7373828567737021,
56
+ "eval_runtime": 263.8635,
57
+ "eval_samples_per_second": 7.523,
58
+ "eval_steps_per_second": 0.944,
59
  "step": 600
60
  },
61
  {
62
  "epoch": 2.42,
63
  "learning_rate": 3.79154078549849e-05,
64
+ "loss": 0.0692,
65
  "step": 800
66
  },
67
  {
68
  "epoch": 2.42,
69
+ "eval_accuracy": 0.9711901763224181,
70
+ "eval_loss": 0.08928817510604858,
71
+ "eval_precision": 0.8029630032715678,
72
+ "eval_recall": 0.7031733867707225,
73
+ "eval_runtime": 256.6147,
74
+ "eval_samples_per_second": 7.735,
75
+ "eval_steps_per_second": 0.97,
76
  "step": 800
77
  },
78
  {
79
  "epoch": 3.02,
80
  "learning_rate": 3.489425981873112e-05,
81
+ "loss": 0.0536,
82
  "step": 1000
83
  },
84
  {
85
  "epoch": 3.02,
86
+ "eval_accuracy": 0.9734571788413098,
87
+ "eval_loss": 0.08212397247552872,
88
+ "eval_precision": 0.8281340329136301,
89
+ "eval_recall": 0.7454393318947714,
90
+ "eval_runtime": 262.8056,
91
+ "eval_samples_per_second": 7.553,
92
+ "eval_steps_per_second": 0.947,
93
  "step": 1000
94
  },
95
  {
96
  "epoch": 3.63,
97
  "learning_rate": 3.187311178247734e-05,
98
+ "loss": 0.0383,
99
  "step": 1200
100
  },
101
  {
102
  "epoch": 3.63,
103
+ "eval_accuracy": 0.9749685138539043,
104
+ "eval_loss": 0.07910189032554626,
105
+ "eval_precision": 0.8499502404462407,
106
+ "eval_recall": 0.7928208095506756,
107
+ "eval_runtime": 269.2715,
108
+ "eval_samples_per_second": 7.372,
109
+ "eval_steps_per_second": 0.925,
110
  "step": 1200
111
  },
112
  {
113
  "epoch": 4.23,
114
  "learning_rate": 2.8851963746223565e-05,
115
+ "loss": 0.0335,
116
  "step": 1400
117
  },
118
  {
119
  "epoch": 4.23,
120
+ "eval_accuracy": 0.9746851385390428,
121
+ "eval_loss": 0.08017772436141968,
122
+ "eval_precision": 0.8415176727834163,
123
+ "eval_recall": 0.7714390648131707,
124
+ "eval_runtime": 262.8468,
125
+ "eval_samples_per_second": 7.552,
126
+ "eval_steps_per_second": 0.947,
127
  "step": 1400
128
  },
129
  {
130
  "epoch": 4.83,
131
  "learning_rate": 2.583081570996979e-05,
132
+ "loss": 0.0245,
133
  "step": 1600
134
  },
135
  {
136
  "epoch": 4.83,
137
+ "eval_accuracy": 0.9751259445843828,
138
+ "eval_loss": 0.08046023547649384,
139
+ "eval_precision": 0.8452890204657136,
140
+ "eval_recall": 0.7795725037362784,
141
+ "eval_runtime": 292.5617,
142
+ "eval_samples_per_second": 6.785,
143
+ "eval_steps_per_second": 0.851,
144
  "step": 1600
145
  },
146
  {
147
  "epoch": 5.44,
148
  "learning_rate": 2.2809667673716012e-05,
149
+ "loss": 0.0199,
150
  "step": 1800
151
  },
152
  {
153
  "epoch": 5.44,
154
+ "eval_accuracy": 0.975787153652393,
155
+ "eval_loss": 0.0789622887969017,
156
+ "eval_precision": 0.8522677350637055,
157
+ "eval_recall": 0.7916681676884358,
158
+ "eval_runtime": 269.8991,
159
+ "eval_samples_per_second": 7.355,
160
+ "eval_steps_per_second": 0.923,
161
  "step": 1800
162
  },
163
  {
164
  "epoch": 6.04,
165
  "learning_rate": 1.9788519637462235e-05,
166
+ "loss": 0.0169,
167
  "step": 2000
168
  },
169
  {
170
  "epoch": 6.04,
171
+ "eval_accuracy": 0.9749842569269521,
172
+ "eval_loss": 0.08285234868526459,
173
+ "eval_precision": 0.8439850500744712,
174
+ "eval_recall": 0.7729562503247884,
175
+ "eval_runtime": 265.7593,
176
+ "eval_samples_per_second": 7.469,
177
+ "eval_steps_per_second": 0.937,
178
  "step": 2000
179
+ },
180
+ {
181
+ "epoch": 6.65,
182
+ "learning_rate": 1.676737160120846e-05,
183
+ "loss": 0.0132,
184
+ "step": 2200
185
+ },
186
+ {
187
+ "epoch": 6.65,
188
+ "eval_accuracy": 0.9755982367758187,
189
+ "eval_loss": 0.08093218505382538,
190
+ "eval_precision": 0.8554658866593972,
191
+ "eval_recall": 0.7986969530652608,
192
+ "eval_runtime": 261.442,
193
+ "eval_samples_per_second": 7.593,
194
+ "eval_steps_per_second": 0.952,
195
+ "step": 2200
196
+ },
197
+ {
198
+ "epoch": 7.25,
199
+ "learning_rate": 1.3746223564954682e-05,
200
+ "loss": 0.0113,
201
+ "step": 2400
202
+ },
203
+ {
204
+ "epoch": 7.25,
205
+ "eval_accuracy": 0.9752676322418136,
206
+ "eval_loss": 0.08354648947715759,
207
+ "eval_precision": 0.8497939903151792,
208
+ "eval_recall": 0.7866075777488188,
209
+ "eval_runtime": 259.2176,
210
+ "eval_samples_per_second": 7.658,
211
+ "eval_steps_per_second": 0.961,
212
+ "step": 2400
213
+ },
214
+ {
215
+ "epoch": 7.85,
216
+ "learning_rate": 1.0725075528700906e-05,
217
+ "loss": 0.0102,
218
+ "step": 2600
219
+ },
220
+ {
221
+ "epoch": 7.85,
222
+ "eval_accuracy": 0.9757241813602016,
223
+ "eval_loss": 0.08276553452014923,
224
+ "eval_precision": 0.8552711059293521,
225
+ "eval_recall": 0.7972149485255522,
226
+ "eval_runtime": 259.024,
227
+ "eval_samples_per_second": 7.663,
228
+ "eval_steps_per_second": 0.961,
229
+ "step": 2600
230
+ },
231
+ {
232
+ "epoch": 8.46,
233
+ "learning_rate": 7.70392749244713e-06,
234
+ "loss": 0.0089,
235
+ "step": 2800
236
+ },
237
+ {
238
+ "epoch": 8.46,
239
+ "eval_accuracy": 0.976227959697733,
240
+ "eval_loss": 0.08310715854167938,
241
+ "eval_precision": 0.8535510581843376,
242
+ "eval_recall": 0.7942174286631556,
243
+ "eval_runtime": 266.8436,
244
+ "eval_samples_per_second": 7.439,
245
+ "eval_steps_per_second": 0.933,
246
+ "step": 2800
247
+ },
248
+ {
249
+ "epoch": 9.06,
250
+ "learning_rate": 4.682779456193353e-06,
251
+ "loss": 0.0077,
252
+ "step": 3000
253
+ },
254
+ {
255
+ "epoch": 9.06,
256
+ "eval_accuracy": 0.9758658690176323,
257
+ "eval_loss": 0.08518018573522568,
258
+ "eval_precision": 0.8593849643219924,
259
+ "eval_recall": 0.7900506494585933,
260
+ "eval_runtime": 260.5553,
261
+ "eval_samples_per_second": 7.618,
262
+ "eval_steps_per_second": 0.956,
263
+ "step": 3000
264
  }
265
  ],
266
  "max_steps": 3310,
267
  "num_train_epochs": 10,
268
+ "total_flos": 1.6730017245781033e+19,
269
  "trial_name": null,
270
  "trial_params": null
271
  }