Training in progress, step 500, checkpoint

Files changed (6) hide show

last-checkpoint/adapter_model.safetensors CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:edfba44bd109d21a02049f79329b04cd8b750c97316da54ecf419cf7c57a316b
 size 3208536

 version https://git-lfs.github.com/spec/v1
+oid sha256:c5acdfd33b50c6d9fdef5edadc974a380da21df1f9c8134b54111f089faa3053
 size 3208536

last-checkpoint/optimizer.pt CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:bd8d04570d6fc1a61f55f224964c4eaff27bdd1e5914260d48c485c77bf70c11
 size 6477306

 version https://git-lfs.github.com/spec/v1
+oid sha256:daa0e9373454efdc4662cae9258f5af17a0a314bb53df3cd22153f2aa5f94dbd
 size 6477306

last-checkpoint/rng_state.pth CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:99b6bf2633576a5bcc6ae4d6496d485a98cae17c5f851c237cfbdbab048f4d2e
 size 14244

 version https://git-lfs.github.com/spec/v1
+oid sha256:97a06efdf9c0a3412c2213f750b599184601a81c1b554150f5baece32506b39e
 size 14244

last-checkpoint/scheduler.pt CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:40a47e8e0c728a6419cdac42f9eb7d9aab7d985a7569fc2a2246cdbf3299396f
 size 1064

 version https://git-lfs.github.com/spec/v1
+oid sha256:8cc70b99f783009e9bc521a702be6ffc66450585d22580bd0270abac6affb5ea
 size 1064

last-checkpoint/trainer_state.json CHANGED Viewed

@@ -1,26 +1,19 @@
 {
   "best_metric": null,
   "best_model_checkpoint": null,
-  "epoch": 3.0,
   "eval_steps": 500,
-  "global_step": 1083,
   "is_hyper_param_search": false,
   "is_local_process_zero": true,
   "is_world_process_zero": true,
   "log_history": [
     {
       "epoch": 1.3850415512465375,
-      "grad_norm": 3.2763009071350098,
       "learning_rate": 2.6915974145891044e-05,
-      "loss": 0.7375,
       "step": 500
-    },
-    {
-      "epoch": 2.770083102493075,
-      "grad_norm": 25.30129051208496,
-      "learning_rate": 3.831948291782087e-06,
-      "loss": 0.5462,
-      "step": 1000
     }
   ],
   "logging_steps": 500,
@@ -35,12 +28,12 @@
         "should_evaluate": false,
         "should_log": false,
         "should_save": true,
-        "should_training_stop": true
       },
       "attributes": {}
     }
   },
-  "total_flos": 1020832481829888.0,
   "train_batch_size": 1,
   "trial_name": null,
   "trial_params": null

 {
   "best_metric": null,
   "best_model_checkpoint": null,
+  "epoch": 1.3850415512465375,
   "eval_steps": 500,
+  "global_step": 500,
   "is_hyper_param_search": false,
   "is_local_process_zero": true,
   "is_world_process_zero": true,
   "log_history": [
     {
       "epoch": 1.3850415512465375,
+      "grad_norm": 2.723154067993164,
       "learning_rate": 2.6915974145891044e-05,
+      "loss": 0.7381,
       "step": 500
     }
   ],
   "logging_steps": 500,
         "should_evaluate": false,
         "should_log": false,
         "should_save": true,
+        "should_training_stop": false
       },
       "attributes": {}
     }
   },
+  "total_flos": 475746871219200.0,
   "train_batch_size": 1,
   "trial_name": null,
   "trial_params": null

last-checkpoint/training_args.bin CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:0cf827305e0121bde381d35bf22cc066c8e166490ad94bcfa0caaefd631a16bd
 size 5432

 version https://git-lfs.github.com/spec/v1
+oid sha256:137f34abacf3c97b6ea24393f8753eac25cc9695068d5a8f1e3ad9ea5584ea97
 size 5432