End of training

Browse files

Files changed (9)

README.md +33 -41
config.json +1 -1
model.safetensors +1 -1
runs/Apr06_16-27-51_df7953592bde/events.out.tfevents.1712420877.df7953592bde.34.0 +3 -0
runs/Apr06_16-28-56_df7953592bde/events.out.tfevents.1712420945.df7953592bde.34.1 +3 -0
runs/Apr06_16-41-52_df7953592bde/events.out.tfevents.1712421713.df7953592bde.168.0 +3 -0
special_tokens_map.json +3 -21
tokenizer_config.json +0 -7
training_args.bin +1 -1

README.md CHANGED Viewed

@@ -1,6 +1,6 @@
 ---
 license: apache-2.0
-base_model: SpamAcc/t5base-fine-tuned
 tags:
 - generated_from_trainer
 model-index:
@@ -13,9 +13,9 @@ should probably proofread and complete it, then remove this comment. -->
 # ingredient_prune
-This model is a fine-tuned version of [SpamAcc/t5base-fine-tuned](https://huggingface.co/SpamAcc/t5base-fine-tuned) on an unspecified dataset.
 It achieves the following results on the evaluation set:
-- Loss: 0.0371
 ## Model description
@@ -35,53 +35,45 @@ More information needed
 The following hyperparameters were used during training:
 - learning_rate: 2e-05
-- train_batch_size: 4
-- eval_batch_size: 4
 - seed: 42
 - optimizer: Adam with betas=(0.9,0.999) and epsilon=1e-08
 - lr_scheduler_type: linear
-- num_epochs: 10
 - mixed_precision_training: Native AMP
 ### Training results
 | Training Loss | Epoch | Step | Validation Loss |
 |:-------------:|:-----:|:----:|:---------------:|
-| 3.1159        | 0.29  | 10   | 0.9254          |
-| 1.8303        | 0.57  | 20   | 0.5377          |
-| 1.4456        | 0.86  | 30   | 0.4401          |
-| 1.067         | 1.14  | 40   | 0.3872          |
-| 0.9132        | 1.43  | 50   | 0.3461          |
-| 0.7107        | 1.71  | 60   | 0.3071          |
-| 0.6644        | 2.0   | 70   | 0.2702          |
-| 0.5167        | 2.29  | 80   | 0.2367          |
-| 0.4688        | 2.57  | 90   | 0.2058          |
-| 0.4094        | 2.86  | 100  | 0.1813          |
-| 0.411         | 3.14  | 110  | 0.1651          |
-| 0.359         | 3.43  | 120  | 0.1418          |
-| 0.3094        | 3.71  | 130  | 0.1290          |
-| 0.2469        | 4.0   | 140  | 0.1190          |
-| 0.2509        | 4.29  | 150  | 0.1108          |
-| 0.2023        | 4.57  | 160  | 0.1018          |
-| 0.2049        | 4.86  | 170  | 0.0947          |
-| 0.2236        | 5.14  | 180  | 0.0881          |
-| 0.1748        | 5.43  | 190  | 0.0810          |
-| 0.1428        | 5.71  | 200  | 0.0741          |
-| 0.1569        | 6.0   | 210  | 0.0679          |
-| 0.1297        | 6.29  | 220  | 0.0626          |
-| 0.1495        | 6.57  | 230  | 0.0578          |
-| 0.146         | 6.86  | 240  | 0.0544          |
-| 0.0996        | 7.14  | 250  | 0.0506          |
-| 0.1292        | 7.43  | 260  | 0.0472          |
-| 0.1003        | 7.71  | 270  | 0.0449          |
-| 0.1097        | 8.0   | 280  | 0.0433          |
-| 0.1347        | 8.29  | 290  | 0.0421          |
-| 0.0953        | 8.57  | 300  | 0.0406          |
-| 0.0967        | 8.86  | 310  | 0.0393          |
-| 0.0956        | 9.14  | 320  | 0.0383          |
-| 0.117         | 9.43  | 330  | 0.0376          |
-| 0.0974        | 9.71  | 340  | 0.0372          |
-| 0.1094        | 10.0  | 350  | 0.0371          |
 ### Framework versions

 ---
 license: apache-2.0
+base_model: t5-base
 tags:
 - generated_from_trainer
 model-index:
 # ingredient_prune
+This model is a fine-tuned version of [t5-base](https://huggingface.co/t5-base) on an unspecified dataset.
 It achieves the following results on the evaluation set:
+- Loss: 0.2021
 ## Model description
 The following hyperparameters were used during training:
 - learning_rate: 2e-05
+- train_batch_size: 8
+- eval_batch_size: 8
 - seed: 42
 - optimizer: Adam with betas=(0.9,0.999) and epsilon=1e-08
 - lr_scheduler_type: linear
+- num_epochs: 5
 - mixed_precision_training: Native AMP
 ### Training results
 | Training Loss | Epoch | Step | Validation Loss |
 |:-------------:|:-----:|:----:|:---------------:|
+| 13.8901       | 0.18  | 10   | 13.5101         |
+| 11.2216       | 0.36  | 20   | 9.6935          |
+| 8.9001        | 0.55  | 30   | 6.9317          |
+| 6.9158        | 0.73  | 40   | 4.3383          |
+| 4.5333        | 0.91  | 50   | 2.5113          |
+| 3.3307        | 1.09  | 60   | 1.5023          |
+| 2.3644        | 1.27  | 70   | 1.1537          |
+| 1.8483        | 1.45  | 80   | 0.7876          |
+| 1.5672        | 1.64  | 90   | 0.6205          |
+| 1.1184        | 1.82  | 100  | 0.4843          |
+| 0.9273        | 2.0   | 110  | 0.4324          |
+| 0.7881        | 2.18  | 120  | 0.4005          |
+| 0.7159        | 2.36  | 130  | 0.3644          |
+| 0.6495        | 2.55  | 140  | 0.3373          |
+| 0.5903        | 2.73  | 150  | 0.3155          |
+| 0.5114        | 2.91  | 160  | 0.2980          |
+| 0.5107        | 3.09  | 170  | 0.2800          |
+| 0.4718        | 3.27  | 180  | 0.2669          |
+| 0.4285        | 3.45  | 190  | 0.2542          |
+| 0.429         | 3.64  | 200  | 0.2422          |
+| 0.4065        | 3.82  | 210  | 0.2320          |
+| 0.4087        | 4.0   | 220  | 0.2244          |
+| 0.3597        | 4.18  | 230  | 0.2166          |
+| 0.3515        | 4.36  | 240  | 0.2106          |
+| 0.3453        | 4.55  | 250  | 0.2065          |
+| 0.3563        | 4.73  | 260  | 0.2036          |
+| 0.3492        | 4.91  | 270  | 0.2021          |
 ### Framework versions

config.json CHANGED Viewed

@@ -1,5 +1,5 @@
 {
-  "_name_or_path": "SpamAcc/t5base-fine-tuned",
   "architectures": [
     "T5ForConditionalGeneration"
   ],

 {
+  "_name_or_path": "t5-base",
   "architectures": [
     "T5ForConditionalGeneration"
   ],

model.safetensors CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:e2c1d0eca5a9fdd1a703b692941ae5e104219e2a5f1c49560aff935d6aeb6525
 size 891644712

 version https://git-lfs.github.com/spec/v1
+oid sha256:f4d2d2b99f6ff36ae036cde9a73fcb1bcd4b107db55e86bc9fa2bb5d54c3dc3c
 size 891644712

runs/Apr06_16-27-51_df7953592bde/events.out.tfevents.1712420877.df7953592bde.34.0 ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:d3b558f141f3fdc8942f2fd524936ae2821b0a88a7111529fee167fc7b405172
+size 5561

runs/Apr06_16-28-56_df7953592bde/events.out.tfevents.1712420945.df7953592bde.34.1 ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:204e06b7c0d8a5e5bd7f96850787da731046964cc05f876e97bb618aeae05c5b
+size 11239

runs/Apr06_16-41-52_df7953592bde/events.out.tfevents.1712421713.df7953592bde.168.0 ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:9ac52d3a63587e2a4d1af52dad8d5397f3729723bd1e6be09e56ad9ea74a07e1
+size 18820

special_tokens_map.json CHANGED Viewed

@@ -101,25 +101,7 @@
     "<extra_id_98>",
     "<extra_id_99>"
   ],
-  "eos_token": {
-    "content": "</s>",
-    "lstrip": false,
-    "normalized": false,
-    "rstrip": false,
-    "single_word": false
-  },
-  "pad_token": {
-    "content": "<pad>",
-    "lstrip": false,
-    "normalized": false,
-    "rstrip": false,
-    "single_word": false
-  },
-  "unk_token": {
-    "content": "<unk>",
-    "lstrip": false,
-    "normalized": false,
-    "rstrip": false,
-    "single_word": false
-  }
 }

     "<extra_id_98>",
     "<extra_id_99>"
   ],
+  "eos_token": "</s>",
+  "pad_token": "<pad>",
+  "unk_token": "<unk>"
 }

tokenizer_config.json CHANGED Viewed

@@ -930,15 +930,8 @@
   "clean_up_tokenization_spaces": true,
   "eos_token": "</s>",
   "extra_ids": 100,
-  "max_length": 128,
   "model_max_length": 128,
-  "pad_to_multiple_of": null,
   "pad_token": "<pad>",
-  "pad_token_type_id": 0,
-  "padding_side": "right",
-  "stride": 0,
   "tokenizer_class": "T5Tokenizer",
-  "truncation_side": "right",
-  "truncation_strategy": "longest_first",
   "unk_token": "<unk>"
 }

   "clean_up_tokenization_spaces": true,
   "eos_token": "</s>",
   "extra_ids": 100,
   "model_max_length": 128,
   "pad_token": "<pad>",
   "tokenizer_class": "T5Tokenizer",
   "unk_token": "<unk>"
 }

training_args.bin CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:ed9821bbaf0be7045aef9332c29b7944cb91606f2687c5353c3530e75dd7d461
 size 5048

 version https://git-lfs.github.com/spec/v1
+oid sha256:e24eb1200ae4c986e921750f7baeedb709068cf3e3fd0294ba5080450d869661
 size 5048