Upload folder using huggingface_hub

Browse files

Files changed (9)

checkpoint-3811/config.json +1 -1
checkpoint-3811/model.safetensors +1 -1
checkpoint-3811/optimizer.pt +1 -1
checkpoint-3811/rng_state.pth +1 -1
checkpoint-3811/trainer_state.json +20 -13
checkpoint-3811/training_args.bin +2 -2
config.json +1 -1
model.safetensors +1 -1
training_args.bin +2 -2

checkpoint-3811/config.json CHANGED Viewed

@@ -120,5 +120,5 @@
   "problem_type": "single_label_classification",
   "qkv_bias": true,
   "torch_dtype": "float32",
-  "transformers_version": "4.37.2"
 }

   "problem_type": "single_label_classification",
   "qkv_bias": true,
   "torch_dtype": "float32",
+  "transformers_version": "4.38.1"
 }

checkpoint-3811/model.safetensors CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:fbf5f6f1dfd2ccde0d7a7a24e1e6044f20ebc081c27c4474c0901aeeec0ac23f
 size 343365480

 version https://git-lfs.github.com/spec/v1
+oid sha256:9449fd2d1966756ea426a5eaed7016b0a2b06e90c9b93c5c152101c63e800467
 size 343365480

checkpoint-3811/optimizer.pt CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:d362186704f9c56250778b57f1ea20edfb0596a177fadcd6898a087c34ec3d94
 size 686851461

 version https://git-lfs.github.com/spec/v1
+oid sha256:6722a5f10822f8dd81119396666550fca6614bebaaf4c062fafa0e1c32ff9786
 size 686851461

checkpoint-3811/rng_state.pth CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:b668fdb5dc699008b82d229ecd74c73544a23840131a335df22bdecd69c9d0f8
 size 14575

 version https://git-lfs.github.com/spec/v1
+oid sha256:47937116bc899ee0e8d20f420e26be61bf299bdf92003f1cac432d282b42481f
 size 14575

checkpoint-3811/trainer_state.json CHANGED Viewed

@@ -1,5 +1,5 @@
 {
-  "best_metric": 2.5512685775756836,
   "best_model_checkpoint": "cat_breed_image_detection/checkpoint-3811",
   "epoch": 1.0,
   "eval_steps": 500,
@@ -10,53 +10,60 @@
   "log_history": [
     {
       "epoch": 0.13,
       "learning_rate": 2.641052911459718e-07,
-      "loss": 2.5439,
       "step": 500
     },
     {
       "epoch": 0.26,
       "learning_rate": 2.2422228130816273e-07,
-      "loss": 2.5463,
       "step": 1000
     },
     {
       "epoch": 0.39,
       "learning_rate": 1.8433927147035363e-07,
-      "loss": 2.5467,
       "step": 1500
     },
     {
       "epoch": 0.52,
       "learning_rate": 1.444562616325445e-07,
-      "loss": 2.5433,
       "step": 2000
     },
     {
       "epoch": 0.66,
       "learning_rate": 1.0457325179473543e-07,
-      "loss": 2.5426,
       "step": 2500
     },
     {
       "epoch": 0.79,
       "learning_rate": 6.469024195692635e-08,
-      "loss": 2.5382,
       "step": 3000
     },
     {
       "epoch": 0.92,
       "learning_rate": 2.4807232119117254e-08,
-      "loss": 2.5352,
       "step": 3500
     },
     {
       "epoch": 1.0,
-      "eval_accuracy": 0.4089533510481252,
-      "eval_loss": 2.5512685775756836,
-      "eval_runtime": 320.305,
-      "eval_samples_per_second": 84.594,
-      "eval_steps_per_second": 2.644,
       "step": 3811
     }
   ],

 {
+  "best_metric": 2.530700206756592,
   "best_model_checkpoint": "cat_breed_image_detection/checkpoint-3811",
   "epoch": 1.0,
   "eval_steps": 500,
   "log_history": [
     {
       "epoch": 0.13,
+      "grad_norm": 2.8601508140563965,
       "learning_rate": 2.641052911459718e-07,
+      "loss": 2.5249,
       "step": 500
     },
     {
       "epoch": 0.26,
+      "grad_norm": 2.4823763370513916,
       "learning_rate": 2.2422228130816273e-07,
+      "loss": 2.5332,
       "step": 1000
     },
     {
       "epoch": 0.39,
+      "grad_norm": 3.0686984062194824,
       "learning_rate": 1.8433927147035363e-07,
+      "loss": 2.5257,
       "step": 1500
     },
     {
       "epoch": 0.52,
+      "grad_norm": 2.4510738849639893,
       "learning_rate": 1.444562616325445e-07,
+      "loss": 2.5138,
       "step": 2000
     },
     {
       "epoch": 0.66,
+      "grad_norm": 2.1571173667907715,
       "learning_rate": 1.0457325179473543e-07,
+      "loss": 2.521,
       "step": 2500
     },
     {
       "epoch": 0.79,
+      "grad_norm": 2.9375104904174805,
       "learning_rate": 6.469024195692635e-08,
+      "loss": 2.5142,
       "step": 3000
     },
     {
       "epoch": 0.92,
+      "grad_norm": 3.093559503555298,
       "learning_rate": 2.4807232119117254e-08,
+      "loss": 2.5058,
       "step": 3500
     },
     {
       "epoch": 1.0,
+      "eval_accuracy": 0.41552258635961026,
+      "eval_loss": 2.530700206756592,
+      "eval_runtime": 299.6579,
+      "eval_samples_per_second": 90.423,
+      "eval_steps_per_second": 2.827,
       "step": 3811
     }
   ],

checkpoint-3811/training_args.bin CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:06011ad1af114029fbc190c3719d27b6d4c4854d6a202ffb9e678265e68cb0ee
-size 4219

 version https://git-lfs.github.com/spec/v1
+oid sha256:3778b54042e77bf37dd5c8d74f4432f27fcc27b31fdf7ef4e19085906e116ef3
+size 4411

config.json CHANGED Viewed

@@ -120,5 +120,5 @@
   "problem_type": "single_label_classification",
   "qkv_bias": true,
   "torch_dtype": "float32",
-  "transformers_version": "4.37.2"
 }

   "problem_type": "single_label_classification",
   "qkv_bias": true,
   "torch_dtype": "float32",
+  "transformers_version": "4.38.1"
 }

model.safetensors CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:fbf5f6f1dfd2ccde0d7a7a24e1e6044f20ebc081c27c4474c0901aeeec0ac23f
 size 343365480

 version https://git-lfs.github.com/spec/v1
+oid sha256:9449fd2d1966756ea426a5eaed7016b0a2b06e90c9b93c5c152101c63e800467
 size 343365480

training_args.bin CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:06011ad1af114029fbc190c3719d27b6d4c4854d6a202ffb9e678265e68cb0ee
-size 4219

 version https://git-lfs.github.com/spec/v1
+oid sha256:3778b54042e77bf37dd5c8d74f4432f27fcc27b31fdf7ef4e19085906e116ef3
+size 4411