xzuyn commited on
Commit
3ba332e
·
verified ·
1 Parent(s): 711e591

Upload Step 160/2504

Browse files
Files changed (2) hide show
  1. adapter_model.safetensors +1 -1
  2. trainer_state.json +81 -3
adapter_model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:1b81b091dab089fa2fe32b0bec2100bb9f9c60692c1095ab9780f0d2662d6b41
3
  size 1907432232
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:fd6116f82d579a82e3164164a1945c1d5c028518d8c967b5f19b4c473791f0cd
3
  size 1907432232
trainer_state.json CHANGED
@@ -2,9 +2,9 @@
2
  "best_global_step": null,
3
  "best_metric": null,
4
  "best_model_checkpoint": null,
5
- "epoch": 0.059892194050708725,
6
  "eval_steps": 10,
7
- "global_step": 150,
8
  "is_hyper_param_search": false,
9
  "is_local_process_zero": true,
10
  "is_world_process_zero": true,
@@ -1186,6 +1186,84 @@
1186
  "eval_samples_per_second": 0.876,
1187
  "eval_steps_per_second": 0.219,
1188
  "step": 150
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1189
  }
1190
  ],
1191
  "logging_steps": 1,
@@ -1205,7 +1283,7 @@
1205
  "attributes": {}
1206
  }
1207
  },
1208
- "total_flos": 4.837675502665728e+17,
1209
  "train_batch_size": 4,
1210
  "trial_name": null,
1211
  "trial_params": null
 
2
  "best_global_step": null,
3
  "best_metric": null,
4
  "best_model_checkpoint": null,
5
+ "epoch": 0.06388500698742264,
6
  "eval_steps": 10,
7
+ "global_step": 160,
8
  "is_hyper_param_search": false,
9
  "is_local_process_zero": true,
10
  "is_world_process_zero": true,
 
1186
  "eval_samples_per_second": 0.876,
1187
  "eval_steps_per_second": 0.219,
1188
  "step": 150
1189
+ },
1190
+ {
1191
+ "epoch": 0.06029147534438012,
1192
+ "grad_norm": 0.463015079498291,
1193
+ "learning_rate": 2.4848560027025883e-07,
1194
+ "loss": 2.0948,
1195
+ "step": 151
1196
+ },
1197
+ {
1198
+ "epoch": 0.060690756638051506,
1199
+ "grad_norm": 0.4769456386566162,
1200
+ "learning_rate": 2.484749915511997e-07,
1201
+ "loss": 2.1417,
1202
+ "step": 152
1203
+ },
1204
+ {
1205
+ "epoch": 0.0610900379317229,
1206
+ "grad_norm": 0.4819183647632599,
1207
+ "learning_rate": 2.484643747622871e-07,
1208
+ "loss": 2.2244,
1209
+ "step": 153
1210
+ },
1211
+ {
1212
+ "epoch": 0.06148931922539429,
1213
+ "grad_norm": 0.4990222454071045,
1214
+ "learning_rate": 2.4845374989430964e-07,
1215
+ "loss": 2.3024,
1216
+ "step": 154
1217
+ },
1218
+ {
1219
+ "epoch": 0.06188860051906568,
1220
+ "grad_norm": 0.553051233291626,
1221
+ "learning_rate": 2.4844311693804187e-07,
1222
+ "loss": 2.1907,
1223
+ "step": 155
1224
+ },
1225
+ {
1226
+ "epoch": 0.062287881812737075,
1227
+ "grad_norm": 0.483012318611145,
1228
+ "learning_rate": 2.4843247588424436e-07,
1229
+ "loss": 2.2427,
1230
+ "step": 156
1231
+ },
1232
+ {
1233
+ "epoch": 0.06268716310640847,
1234
+ "grad_norm": 0.5101610422134399,
1235
+ "learning_rate": 2.4842182672366355e-07,
1236
+ "loss": 2.0001,
1237
+ "step": 157
1238
+ },
1239
+ {
1240
+ "epoch": 0.06308644440007985,
1241
+ "grad_norm": 0.47115758061408997,
1242
+ "learning_rate": 2.484111694470319e-07,
1243
+ "loss": 2.2248,
1244
+ "step": 158
1245
+ },
1246
+ {
1247
+ "epoch": 0.06348572569375124,
1248
+ "grad_norm": 0.46976238489151,
1249
+ "learning_rate": 2.4840050404506756e-07,
1250
+ "loss": 2.0394,
1251
+ "step": 159
1252
+ },
1253
+ {
1254
+ "epoch": 0.06388500698742264,
1255
+ "grad_norm": 0.4438592791557312,
1256
+ "learning_rate": 2.4838983050847455e-07,
1257
+ "loss": 2.0788,
1258
+ "step": 160
1259
+ },
1260
+ {
1261
+ "epoch": 0.06388500698742264,
1262
+ "eval_loss": 2.1408231258392334,
1263
+ "eval_runtime": 292.5781,
1264
+ "eval_samples_per_second": 0.875,
1265
+ "eval_steps_per_second": 0.219,
1266
+ "step": 160
1267
  }
1268
  ],
1269
  "logging_steps": 1,
 
1283
  "attributes": {}
1284
  }
1285
  },
1286
+ "total_flos": 5.160187202843443e+17,
1287
  "train_batch_size": 4,
1288
  "trial_name": null,
1289
  "trial_params": null