End of training
Browse files
all_results.json
CHANGED
|
@@ -1,12 +1,12 @@
|
|
| 1 |
{
|
| 2 |
"epoch": 624.0,
|
| 3 |
"eval_loss": 0.9921010732650757,
|
| 4 |
-
"eval_runtime":
|
| 5 |
-
"eval_samples_per_second": 9.
|
| 6 |
-
"eval_steps_per_second": 0.
|
| 7 |
"eval_wer": 34.21715788320368,
|
| 8 |
"train_loss": 0.02765977076081908,
|
| 9 |
-
"train_runtime":
|
| 10 |
-
"train_samples_per_second": 12.
|
| 11 |
"train_steps_per_second": 0.191
|
| 12 |
}
|
|
|
|
| 1 |
{
|
| 2 |
"epoch": 624.0,
|
| 3 |
"eval_loss": 0.9921010732650757,
|
| 4 |
+
"eval_runtime": 135.7332,
|
| 5 |
+
"eval_samples_per_second": 9.113,
|
| 6 |
+
"eval_steps_per_second": 0.287,
|
| 7 |
"eval_wer": 34.21715788320368,
|
| 8 |
"train_loss": 0.02765977076081908,
|
| 9 |
+
"train_runtime": 26145.1461,
|
| 10 |
+
"train_samples_per_second": 12.239,
|
| 11 |
"train_steps_per_second": 0.191
|
| 12 |
}
|
eval_results.json
CHANGED
|
@@ -1,8 +1,8 @@
|
|
| 1 |
{
|
| 2 |
"epoch": 624.0,
|
| 3 |
"eval_loss": 0.9921010732650757,
|
| 4 |
-
"eval_runtime":
|
| 5 |
-
"eval_samples_per_second": 9.
|
| 6 |
-
"eval_steps_per_second": 0.
|
| 7 |
"eval_wer": 34.21715788320368
|
| 8 |
}
|
|
|
|
| 1 |
{
|
| 2 |
"epoch": 624.0,
|
| 3 |
"eval_loss": 0.9921010732650757,
|
| 4 |
+
"eval_runtime": 135.7332,
|
| 5 |
+
"eval_samples_per_second": 9.113,
|
| 6 |
+
"eval_steps_per_second": 0.287,
|
| 7 |
"eval_wer": 34.21715788320368
|
| 8 |
}
|
runs/Dec05_00-34-16_spartan-gpgpu111.hpc.unimelb.edu.au/events.out.tfevents.1670187201.spartan-gpgpu111.hpc.unimelb.edu.au
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:433f5889c525703f31ef1069f851311928d9ad29a52f11d06b4d80a637ac2f58
|
| 3 |
+
size 40
|
train_results.json
CHANGED
|
@@ -1,7 +1,7 @@
|
|
| 1 |
{
|
| 2 |
"epoch": 624.0,
|
| 3 |
"train_loss": 0.02765977076081908,
|
| 4 |
-
"train_runtime":
|
| 5 |
-
"train_samples_per_second": 12.
|
| 6 |
"train_steps_per_second": 0.191
|
| 7 |
}
|
|
|
|
| 1 |
{
|
| 2 |
"epoch": 624.0,
|
| 3 |
"train_loss": 0.02765977076081908,
|
| 4 |
+
"train_runtime": 26145.1461,
|
| 5 |
+
"train_samples_per_second": 12.239,
|
| 6 |
"train_steps_per_second": 0.191
|
| 7 |
}
|
trainer_state.json
CHANGED
|
@@ -250,9 +250,9 @@
|
|
| 250 |
{
|
| 251 |
"epoch": 124.0,
|
| 252 |
"eval_loss": 0.7998368740081787,
|
| 253 |
-
"eval_runtime":
|
| 254 |
-
"eval_samples_per_second": 9.
|
| 255 |
-
"eval_steps_per_second": 0.
|
| 256 |
"eval_wer": 21.770570833789854,
|
| 257 |
"step": 1000
|
| 258 |
},
|
|
@@ -499,8 +499,8 @@
|
|
| 499 |
{
|
| 500 |
"epoch": 249.0,
|
| 501 |
"eval_loss": 0.8832917213439941,
|
| 502 |
-
"eval_runtime": 131.
|
| 503 |
-
"eval_samples_per_second": 9.
|
| 504 |
"eval_steps_per_second": 0.296,
|
| 505 |
"eval_wer": 28.968993097403313,
|
| 506 |
"step": 2000
|
|
@@ -748,9 +748,9 @@
|
|
| 748 |
{
|
| 749 |
"epoch": 374.0,
|
| 750 |
"eval_loss": 0.9381842613220215,
|
| 751 |
-
"eval_runtime":
|
| 752 |
-
"eval_samples_per_second": 9.
|
| 753 |
-
"eval_steps_per_second": 0.
|
| 754 |
"eval_wer": 30.820642051057302,
|
| 755 |
"step": 3000
|
| 756 |
},
|
|
@@ -997,9 +997,9 @@
|
|
| 997 |
{
|
| 998 |
"epoch": 499.0,
|
| 999 |
"eval_loss": 0.9754325151443481,
|
| 1000 |
-
"eval_runtime": 133.
|
| 1001 |
-
"eval_samples_per_second": 9.
|
| 1002 |
-
"eval_steps_per_second": 0.
|
| 1003 |
"eval_wer": 34.436287936890544,
|
| 1004 |
"step": 4000
|
| 1005 |
},
|
|
@@ -1246,9 +1246,9 @@
|
|
| 1246 |
{
|
| 1247 |
"epoch": 624.0,
|
| 1248 |
"eval_loss": 0.9921010732650757,
|
| 1249 |
-
"eval_runtime":
|
| 1250 |
-
"eval_samples_per_second": 9.
|
| 1251 |
-
"eval_steps_per_second": 0.
|
| 1252 |
"eval_wer": 34.21715788320368,
|
| 1253 |
"step": 5000
|
| 1254 |
},
|
|
@@ -1257,8 +1257,8 @@
|
|
| 1257 |
"step": 5000,
|
| 1258 |
"total_flos": 8.94614740992e+19,
|
| 1259 |
"train_loss": 0.02765977076081908,
|
| 1260 |
-
"train_runtime":
|
| 1261 |
-
"train_samples_per_second": 12.
|
| 1262 |
"train_steps_per_second": 0.191
|
| 1263 |
}
|
| 1264 |
],
|
|
|
|
| 250 |
{
|
| 251 |
"epoch": 124.0,
|
| 252 |
"eval_loss": 0.7998368740081787,
|
| 253 |
+
"eval_runtime": 130.4981,
|
| 254 |
+
"eval_samples_per_second": 9.479,
|
| 255 |
+
"eval_steps_per_second": 0.299,
|
| 256 |
"eval_wer": 21.770570833789854,
|
| 257 |
"step": 1000
|
| 258 |
},
|
|
|
|
| 499 |
{
|
| 500 |
"epoch": 249.0,
|
| 501 |
"eval_loss": 0.8832917213439941,
|
| 502 |
+
"eval_runtime": 131.7792,
|
| 503 |
+
"eval_samples_per_second": 9.387,
|
| 504 |
"eval_steps_per_second": 0.296,
|
| 505 |
"eval_wer": 28.968993097403313,
|
| 506 |
"step": 2000
|
|
|
|
| 748 |
{
|
| 749 |
"epoch": 374.0,
|
| 750 |
"eval_loss": 0.9381842613220215,
|
| 751 |
+
"eval_runtime": 133.2813,
|
| 752 |
+
"eval_samples_per_second": 9.281,
|
| 753 |
+
"eval_steps_per_second": 0.293,
|
| 754 |
"eval_wer": 30.820642051057302,
|
| 755 |
"step": 3000
|
| 756 |
},
|
|
|
|
| 997 |
{
|
| 998 |
"epoch": 499.0,
|
| 999 |
"eval_loss": 0.9754325151443481,
|
| 1000 |
+
"eval_runtime": 133.3867,
|
| 1001 |
+
"eval_samples_per_second": 9.274,
|
| 1002 |
+
"eval_steps_per_second": 0.292,
|
| 1003 |
"eval_wer": 34.436287936890544,
|
| 1004 |
"step": 4000
|
| 1005 |
},
|
|
|
|
| 1246 |
{
|
| 1247 |
"epoch": 624.0,
|
| 1248 |
"eval_loss": 0.9921010732650757,
|
| 1249 |
+
"eval_runtime": 136.0036,
|
| 1250 |
+
"eval_samples_per_second": 9.095,
|
| 1251 |
+
"eval_steps_per_second": 0.287,
|
| 1252 |
"eval_wer": 34.21715788320368,
|
| 1253 |
"step": 5000
|
| 1254 |
},
|
|
|
|
| 1257 |
"step": 5000,
|
| 1258 |
"total_flos": 8.94614740992e+19,
|
| 1259 |
"train_loss": 0.02765977076081908,
|
| 1260 |
+
"train_runtime": 26145.1461,
|
| 1261 |
+
"train_samples_per_second": 12.239,
|
| 1262 |
"train_steps_per_second": 0.191
|
| 1263 |
}
|
| 1264 |
],
|