Anhltq
/

Qwen2.5-0.5B-Instruct-Gensyn-Swarm-soft_scavenging_clam

Text Generation

Generated from Trainer

I am soft scavenging clam

text-generation-inference

Model card Files Files and versions

Anhltq committed on Apr 6

Commit

a5032b8

·

verified ·

1 Parent(s): faadbd7

End of training

Files changed (4) hide show

all_results.json +2 -2
model.safetensors +1 -1
train_results.json +2 -2
trainer_state.json +3 -3

all_results.json CHANGED Viewed

@@ -1,8 +1,8 @@
 {
     "total_flos": 0.0,
     "train_loss": -2.7790665626525877e-07,
-    "train_runtime": 3161.8325,
     "train_samples": 160,
-    "train_samples_per_second": 0.101,
     "train_steps_per_second": 0.006
 }

 {
     "total_flos": 0.0,
     "train_loss": -2.7790665626525877e-07,
+    "train_runtime": 3143.7741,
     "train_samples": 160,
+    "train_samples_per_second": 0.102,
     "train_steps_per_second": 0.006
 }

model.safetensors CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:f56802790fcca3fcc69f9c09fbd2d62c07fab6a15110cc0d094adc7c40872245
 size 1976163472

 version https://git-lfs.github.com/spec/v1
+oid sha256:b114055c1a1b44b7027c19bc13db83e7d9e96f9ea30a41c21eded6b713c60d17
 size 1976163472

train_results.json CHANGED Viewed

@@ -1,8 +1,8 @@
 {
     "total_flos": 0.0,
     "train_loss": -2.7790665626525877e-07,
-    "train_runtime": 3161.8325,
     "train_samples": 160,
-    "train_samples_per_second": 0.101,
     "train_steps_per_second": 0.006
 }

 {
     "total_flos": 0.0,
     "train_loss": -2.7790665626525877e-07,
+    "train_runtime": 3143.7741,
     "train_samples": 160,
+    "train_samples_per_second": 0.102,
     "train_steps_per_second": 0.006
 }

trainer_state.json CHANGED Viewed

@@ -183,7 +183,7 @@
     {
       "completion_length": 89.625,
       "epoch": 1.0,
-      "grad_norm": 3.1471806494209886e-08,
       "kl": 0.0,
       "learning_rate": 0.0,
       "loss": -0.0,
@@ -204,8 +204,8 @@
       "step": 20,
       "total_flos": 0.0,
       "train_loss": -2.7790665626525877e-07,
-      "train_runtime": 3161.8325,
-      "train_samples_per_second": 0.101,
       "train_steps_per_second": 0.006
     }
   ],

     {
       "completion_length": 89.625,
       "epoch": 1.0,
+      "grad_norm": 3.0665063377455226e-08,
       "kl": 0.0,
       "learning_rate": 0.0,
       "loss": -0.0,
       "step": 20,
       "total_flos": 0.0,
       "train_loss": -2.7790665626525877e-07,
+      "train_runtime": 3143.7741,
+      "train_samples_per_second": 0.102,
       "train_steps_per_second": 0.006
     }
   ],