lukeleeai committed on
Commit 2be678d
1 Parent(s): 0fc349c

End of training

Files changed (5):
  1. README.md +7 -4
  2. config.json +1 -1
  3. pytorch_model.bin +2 -2
  4. tokenizer.json +1 -6
  5. training_args.bin +2 -2
README.md CHANGED
@@ -22,7 +22,7 @@ model-index:
  metrics:
  - name: Accuracy
    type: accuracy
- value: 0.46153846153846156
+ value: 0.3076923076923077
  ---
 
  <!-- This model card has been generated automatically according to the information the Trainer had access to. You
@@ -32,8 +32,8 @@ should probably proofread and complete it, then remove this comment. -->
 
  This model is a fine-tuned version of [t5-base](https://huggingface.co/t5-base) on the glue dataset.
  It achieves the following results on the evaluation set:
- - Loss: 0.8579
- - Accuracy: 0.4615
+ - Loss: 0.7773
+ - Accuracy: 0.3077
 
  ## Model description
 
@@ -55,7 +55,10 @@ The following hyperparameters were used during training:
  - learning_rate: 5e-05
  - train_batch_size: 32
  - eval_batch_size: 64
- - seed: 0
+ - seed: 1
+ - distributed_type: multi-GPU
+ - gradient_accumulation_steps: 2
+ - total_train_batch_size: 64
  - optimizer: Adam with betas=(0.9,0.999) and epsilon=1e-08
  - lr_scheduler_type: linear
  - lr_scheduler_warmup_steps: 20
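
The updated hyperparameters map onto the standard `transformers.TrainingArguments` fields. A minimal sketch, assuming a Trainer-based fine-tuning script; the output directory and anything else not listed in the README are placeholders, not part of this commit:

```python
from transformers import TrainingArguments

# Sketch only: values mirror the README's hyperparameter list; names marked
# "placeholder" or "assumption" are not in the original commit.
training_args = TrainingArguments(
    output_dir="t5-base-glue",          # placeholder
    learning_rate=5e-5,
    per_device_train_batch_size=32,     # README: train_batch_size: 32
    per_device_eval_batch_size=64,      # README: eval_batch_size: 64
    gradient_accumulation_steps=2,      # 32 * 2 = 64 (total_train_batch_size)
    seed=1,
    lr_scheduler_type="linear",
    warmup_steps=20,
    bf16=True,                          # assumption, inferred from torch_dtype: bfloat16 below
    # Adam betas=(0.9, 0.999) and eps=1e-08 are the Trainer defaults.
)
```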
config.json CHANGED
@@ -54,7 +54,7 @@
    "prefix": "translate English to Romanian: "
   }
  },
- "torch_dtype": "float32",
+ "torch_dtype": "bfloat16",
  "transformers_version": "4.34.1",
  "use_cache": true,
  "vocab_size": 32128
pytorch_model.bin CHANGED
@@ -1,3 +1,3 @@
  version https://git-lfs.github.com/spec/v1
- oid sha256:710bf7ff2261326757656e1dcd2c867a5aa79e37703729e0a64e42264cfdb4e9
- size 894094241
+ oid sha256:cdeb500ba7be5f70311bd2630980f095edeb31b24a7cb27f8c3e72ec55bfe7ac
+ size 447089825
tokenizer.json CHANGED
@@ -1,11 +1,6 @@
  {
  "version": "1.0",
- "truncation": {
- "direction": "Right",
- "max_length": 512,
- "strategy": "LongestFirst",
- "stride": 0
- },
+ "truncation": null,
  "padding": null,
  "added_tokens": [
  {
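
With `"truncation": null` in the serialized tokenizer, no truncation rule is baked into tokenizer.json anymore; callers opt in per call. A small usage sketch with a placeholder repo id and input text:

```python
from transformers import AutoTokenizer

# Sketch only: repo id and input text are placeholders.
tokenizer = AutoTokenizer.from_pretrained("<user>/<model-id>")
batch = tokenizer(
    "example GLUE input",
    truncation=True,     # request truncation explicitly at call time
    max_length=512,      # the limit the previous tokenizer.json hard-coded
    return_tensors="pt",
)
```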
training_args.bin CHANGED
@@ -1,3 +1,3 @@
  version https://git-lfs.github.com/spec/v1
- oid sha256:4330e66b9a4f06ab478d5bf11a932f5efc11d5b4ad349a2ea0e4023ac73db390
- size 4091
+ oid sha256:dcab6ddc1b87a49965f15aeb6c4fcec9087a213cafb40893d389a8084b322844
+ size 5819