Training in progress, step 660, checkpoint
Browse files- last-checkpoint/adapter_model.safetensors +1 -1
- last-checkpoint/optimizer.pt +1 -1
- last-checkpoint/rng_state_0.pth +1 -1
- last-checkpoint/rng_state_1.pth +1 -1
- last-checkpoint/rng_state_2.pth +1 -1
- last-checkpoint/rng_state_3.pth +1 -1
- last-checkpoint/scheduler.pt +1 -1
- last-checkpoint/trainer_state.json +15 -7
last-checkpoint/adapter_model.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 50365768
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e07e035f586498dc8981df34e67630b046d3efe96532d54935045c70e2732a5c
|
3 |
size 50365768
|
last-checkpoint/optimizer.pt
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 25859412
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:a4391b36bfb3153386e6ba9b7fa9813c558d76ab5b72d79ffcddc8628bda27c5
|
3 |
size 25859412
|
last-checkpoint/rng_state_0.pth
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 15024
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:769f27da95e3db89c4ac50ba3b676be7452e7102a0fceebe0dba03240f9a0912
|
3 |
size 15024
|
last-checkpoint/rng_state_1.pth
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 15024
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:1b5ebb4c43b35cc5c443696fa48cabff1cc53c72b887ea3e6159a2871f0a2068
|
3 |
size 15024
|
last-checkpoint/rng_state_2.pth
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 15024
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c7ab0379217213a80cc6c5b608182019ce004207aeec4e881e08eb21bd107b24
|
3 |
size 15024
|
last-checkpoint/rng_state_3.pth
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 15024
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:86bbbbd5fa142eccd9cc0d90c2a1f214e26f81abc61d8b8108e38ba0231a465d
|
3 |
size 15024
|
last-checkpoint/scheduler.pt
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 1064
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:f9067d6a23df796f52db826028f8c78fda475923b094eba9dfa934d7463044e0
|
3 |
size 1064
|
last-checkpoint/trainer_state.json
CHANGED
@@ -1,9 +1,9 @@
|
|
1 |
{
|
2 |
-
"best_metric": 0.
|
3 |
-
"best_model_checkpoint": "miner_id_24/checkpoint-
|
4 |
-
"epoch": 4.
|
5 |
"eval_steps": 20,
|
6 |
-
"global_step":
|
7 |
"is_hyper_param_search": false,
|
8 |
"is_local_process_zero": true,
|
9 |
"is_world_process_zero": true,
|
@@ -313,6 +313,14 @@
|
|
313 |
"eval_samples_per_second": 312.336,
|
314 |
"eval_steps_per_second": 2.448,
|
315 |
"step": 640
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
316 |
}
|
317 |
],
|
318 |
"logging_steps": 100,
|
@@ -327,7 +335,7 @@
|
|
327 |
"early_stopping_threshold": 0.0
|
328 |
},
|
329 |
"attributes": {
|
330 |
-
"early_stopping_patience_counter":
|
331 |
}
|
332 |
},
|
333 |
"TrainerControl": {
|
@@ -336,12 +344,12 @@
|
|
336 |
"should_evaluate": false,
|
337 |
"should_log": false,
|
338 |
"should_save": true,
|
339 |
-
"should_training_stop":
|
340 |
},
|
341 |
"attributes": {}
|
342 |
}
|
343 |
},
|
344 |
-
"total_flos": 9.
|
345 |
"train_batch_size": 16,
|
346 |
"trial_name": null,
|
347 |
"trial_params": null
|
|
|
1 |
{
|
2 |
+
"best_metric": 0.6788897514343262,
|
3 |
+
"best_model_checkpoint": "miner_id_24/checkpoint-660",
|
4 |
+
"epoch": 4.981132075471698,
|
5 |
"eval_steps": 20,
|
6 |
+
"global_step": 660,
|
7 |
"is_hyper_param_search": false,
|
8 |
"is_local_process_zero": true,
|
9 |
"is_world_process_zero": true,
|
|
|
313 |
"eval_samples_per_second": 312.336,
|
314 |
"eval_steps_per_second": 2.448,
|
315 |
"step": 640
|
316 |
+
},
|
317 |
+
{
|
318 |
+
"epoch": 4.981132075471698,
|
319 |
+
"eval_loss": 0.6788897514343262,
|
320 |
+
"eval_runtime": 2.8412,
|
321 |
+
"eval_samples_per_second": 314.3,
|
322 |
+
"eval_steps_per_second": 2.464,
|
323 |
+
"step": 660
|
324 |
}
|
325 |
],
|
326 |
"logging_steps": 100,
|
|
|
335 |
"early_stopping_threshold": 0.0
|
336 |
},
|
337 |
"attributes": {
|
338 |
+
"early_stopping_patience_counter": 0
|
339 |
}
|
340 |
},
|
341 |
"TrainerControl": {
|
|
|
344 |
"should_evaluate": false,
|
345 |
"should_log": false,
|
346 |
"should_save": true,
|
347 |
+
"should_training_stop": true
|
348 |
},
|
349 |
"attributes": {}
|
350 |
}
|
351 |
},
|
352 |
+
"total_flos": 9.693587491667313e+17,
|
353 |
"train_batch_size": 16,
|
354 |
"trial_name": null,
|
355 |
"trial_params": null
|