richardchiu committed on Mar 23

Commit

4141c3e

•

1 Parent(s): 71ef7a7

Training in progress, epoch 1

Browse files

Files changed (25) hide show

model.safetensors +1 -1
run-5/checkpoint-1340/config.json +25 -0
run-5/checkpoint-1340/model.safetensors +3 -0
run-5/checkpoint-1340/optimizer.pt +3 -0
run-5/checkpoint-1340/rng_state.pth +3 -0
run-5/checkpoint-1340/scheduler.pt +3 -0
run-5/checkpoint-1340/special_tokens_map.json +7 -0
run-5/checkpoint-1340/tokenizer.json +0 -0
run-5/checkpoint-1340/tokenizer_config.json +55 -0
run-5/checkpoint-1340/trainer_state.json +85 -0
run-5/checkpoint-1340/training_args.bin +3 -0
run-5/checkpoint-1340/vocab.txt +0 -0
run-6/checkpoint-134/config.json +25 -0
run-6/checkpoint-134/model.safetensors +3 -0
run-6/checkpoint-134/optimizer.pt +3 -0
run-6/checkpoint-134/rng_state.pth +3 -0
run-6/checkpoint-134/scheduler.pt +3 -0
run-6/checkpoint-134/special_tokens_map.json +7 -0
run-6/checkpoint-134/tokenizer.json +0 -0
run-6/checkpoint-134/tokenizer_config.json +55 -0
run-6/checkpoint-134/trainer_state.json +35 -0
run-6/checkpoint-134/training_args.bin +3 -0
run-6/checkpoint-134/vocab.txt +0 -0
runs/Mar23_02-14-11_d179836e26c8/events.out.tfevents.1711161215.d179836e26c8.903.10 +3 -0
training_args.bin +1 -1

model.safetensors CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:a0ec1375d7819609f06105f3870abc2a54172d9a7099016fc1da269afa7a977a
+oid sha256:5dd71b8c0b74767d522e813d7e177828bb7110f60a2e3fcde82478f0ef95e3e7
 size 267832560

run-5/checkpoint-1340/config.json ADDED Viewed

	@@ -0,0 +1,25 @@

+{
+  "_name_or_path": "distilbert-base-uncased",
+  "activation": "gelu",
+  "architectures": [
+    "DistilBertForSequenceClassification"
+  ],
+  "attention_dropout": 0.1,
+  "dim": 768,
+  "dropout": 0.1,
+  "hidden_dim": 3072,
+  "initializer_range": 0.02,
+  "max_position_embeddings": 512,
+  "model_type": "distilbert",
+  "n_heads": 12,
+  "n_layers": 6,
+  "pad_token_id": 0,
+  "problem_type": "single_label_classification",
+  "qa_dropout": 0.1,
+  "seq_classif_dropout": 0.2,
+  "sinusoidal_pos_embds": false,
+  "tie_weights_": true,
+  "torch_dtype": "float32",
+  "transformers_version": "4.39.1",
+  "vocab_size": 30522
+}

run-5/checkpoint-1340/model.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:f6924014bf59ea78b5fb2877725379b58387c390575cf05d8b2214c1e897a754
+size 267832560

run-5/checkpoint-1340/optimizer.pt ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:dc05456e26f1c50f13a49163aca978e2cf38efaf56e2405384b7983ecfd60962
+size 535727290

run-5/checkpoint-1340/rng_state.pth ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:4588875a5fbed58e929a85f3d56b0d55e9bcd483ab055f6f849f6d129245a124
+size 14244

run-5/checkpoint-1340/scheduler.pt ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:dbadd4653547d16ad332105d7db088fc9b2f85e5e30b0e89a4123fc4c3f335e4
+size 1064

run-5/checkpoint-1340/special_tokens_map.json ADDED Viewed

	@@ -0,0 +1,7 @@

+{
+  "cls_token": "[CLS]",
+  "mask_token": "[MASK]",
+  "pad_token": "[PAD]",
+  "sep_token": "[SEP]",
+  "unk_token": "[UNK]"
+}

run-5/checkpoint-1340/tokenizer.json ADDED Viewed

The diff for this file is too large to render. See raw diff

run-5/checkpoint-1340/tokenizer_config.json ADDED Viewed

	@@ -0,0 +1,55 @@

+{
+  "added_tokens_decoder": {
+    "0": {
+      "content": "[PAD]",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "100": {
+      "content": "[UNK]",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "101": {
+      "content": "[CLS]",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "102": {
+      "content": "[SEP]",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "103": {
+      "content": "[MASK]",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    }
+  },
+  "clean_up_tokenization_spaces": true,
+  "cls_token": "[CLS]",
+  "do_lower_case": true,
+  "mask_token": "[MASK]",
+  "model_max_length": 512,
+  "pad_token": "[PAD]",
+  "sep_token": "[SEP]",
+  "strip_accents": null,
+  "tokenize_chinese_chars": true,
+  "tokenizer_class": "DistilBertTokenizer",
+  "unk_token": "[UNK]"
+}

run-5/checkpoint-1340/trainer_state.json ADDED Viewed

	@@ -0,0 +1,85 @@

+{
+  "best_metric": 0.5115958993985192,
+  "best_model_checkpoint": "distilbert-base-uncased-finetuned-cola/run-5/checkpoint-1340",
+  "epoch": 5.0,
+  "eval_steps": 500,
+  "global_step": 1340,
+  "is_hyper_param_search": true,
+  "is_local_process_zero": true,
+  "is_world_process_zero": true,
+  "log_history": [
+    {
+      "epoch": 1.0,
+      "eval_loss": 0.46541309356689453,
+      "eval_matthews_correlation": 0.4611631351812362,
+      "eval_runtime": 0.7349,
+      "eval_samples_per_second": 1419.226,
+      "eval_steps_per_second": 89.807,
+      "step": 268
+    },
+    {
+      "epoch": 1.87,
+      "grad_norm": 5.322132587432861,
+      "learning_rate": 2.8926577590888014e-05,
+      "loss": 0.415,
+      "step": 500
+    },
+    {
+      "epoch": 2.0,
+      "eval_loss": 0.5235322117805481,
+      "eval_matthews_correlation": 0.48584699342231225,
+      "eval_runtime": 0.8286,
+      "eval_samples_per_second": 1258.804,
+      "eval_steps_per_second": 79.656,
+      "step": 536
+    },
+    {
+      "epoch": 3.0,
+      "eval_loss": 0.6811769604682922,
+      "eval_matthews_correlation": 0.4886634303966225,
+      "eval_runtime": 1.1682,
+      "eval_samples_per_second": 892.827,
+      "eval_steps_per_second": 56.497,
+      "step": 804
+    },
+    {
+      "epoch": 3.73,
+      "grad_norm": 5.797658920288086,
+      "learning_rate": 1.1708376643930863e-05,
+      "loss": 0.1523,
+      "step": 1000
+    },
+    {
+      "epoch": 4.0,
+      "eval_loss": 0.8018879294395447,
+      "eval_matthews_correlation": 0.5029119946692125,
+      "eval_runtime": 0.7895,
+      "eval_samples_per_second": 1321.02,
+      "eval_steps_per_second": 83.593,
+      "step": 1072
+    },
+    {
+      "epoch": 5.0,
+      "eval_loss": 0.930472731590271,
+      "eval_matthews_correlation": 0.5115958993985192,
+      "eval_runtime": 1.1184,
+      "eval_samples_per_second": 932.607,
+      "eval_steps_per_second": 59.014,
+      "step": 1340
+    }
+  ],
+  "logging_steps": 500,
+  "max_steps": 1340,
+  "num_input_tokens_seen": 0,
+  "num_train_epochs": 5,
+  "save_steps": 500,
+  "total_flos": 191380204405152.0,
+  "train_batch_size": 32,
+  "trial_name": null,
+  "trial_params": {
+    "learning_rate": 4.6144778537845165e-05,
+    "num_train_epochs": 5,
+    "per_device_train_batch_size": 32,
+    "seed": 3
+  }
+}

run-5/checkpoint-1340/training_args.bin ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:bb396c880ed21cbe5386566eb59cb1266f1baa96469ad33b08f5bdf8bfd36bd0
+size 5048

run-5/checkpoint-1340/vocab.txt ADDED Viewed

The diff for this file is too large to render. See raw diff

run-6/checkpoint-134/config.json ADDED Viewed

	@@ -0,0 +1,25 @@

+{
+  "_name_or_path": "distilbert-base-uncased",
+  "activation": "gelu",
+  "architectures": [
+    "DistilBertForSequenceClassification"
+  ],
+  "attention_dropout": 0.1,
+  "dim": 768,
+  "dropout": 0.1,
+  "hidden_dim": 3072,
+  "initializer_range": 0.02,
+  "max_position_embeddings": 512,
+  "model_type": "distilbert",
+  "n_heads": 12,
+  "n_layers": 6,
+  "pad_token_id": 0,
+  "problem_type": "single_label_classification",
+  "qa_dropout": 0.1,
+  "seq_classif_dropout": 0.2,
+  "sinusoidal_pos_embds": false,
+  "tie_weights_": true,
+  "torch_dtype": "float32",
+  "transformers_version": "4.39.1",
+  "vocab_size": 30522
+}

run-6/checkpoint-134/model.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:5dd71b8c0b74767d522e813d7e177828bb7110f60a2e3fcde82478f0ef95e3e7
+size 267832560

run-6/checkpoint-134/optimizer.pt ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:348bf351569cfd040213112990135d920b3099006c58db7e1ebe193809c3c266
+size 535727290

run-6/checkpoint-134/rng_state.pth ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:67de1495d89bad1bf433ea074faeed5cad69203839c69144ec9b9dd8e5891ce0
+size 14244

run-6/checkpoint-134/scheduler.pt ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:c228f60e941e071784831a9788fb9a8d1c897654908ed7aa836107b8a9f698d6
+size 1064

run-6/checkpoint-134/special_tokens_map.json ADDED Viewed

	@@ -0,0 +1,7 @@

+{
+  "cls_token": "[CLS]",
+  "mask_token": "[MASK]",
+  "pad_token": "[PAD]",
+  "sep_token": "[SEP]",
+  "unk_token": "[UNK]"
+}

run-6/checkpoint-134/tokenizer.json ADDED Viewed

The diff for this file is too large to render. See raw diff

run-6/checkpoint-134/tokenizer_config.json ADDED Viewed

	@@ -0,0 +1,55 @@

+{
+  "added_tokens_decoder": {
+    "0": {
+      "content": "[PAD]",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "100": {
+      "content": "[UNK]",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "101": {
+      "content": "[CLS]",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "102": {
+      "content": "[SEP]",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "103": {
+      "content": "[MASK]",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    }
+  },
+  "clean_up_tokenization_spaces": true,
+  "cls_token": "[CLS]",
+  "do_lower_case": true,
+  "mask_token": "[MASK]",
+  "model_max_length": 512,
+  "pad_token": "[PAD]",
+  "sep_token": "[SEP]",
+  "strip_accents": null,
+  "tokenize_chinese_chars": true,
+  "tokenizer_class": "DistilBertTokenizer",
+  "unk_token": "[UNK]"
+}

run-6/checkpoint-134/trainer_state.json ADDED Viewed

	@@ -0,0 +1,35 @@

+{
+  "best_metric": 0.4751366513569292,
+  "best_model_checkpoint": "distilbert-base-uncased-finetuned-cola/run-6/checkpoint-134",
+  "epoch": 1.0,
+  "eval_steps": 500,
+  "global_step": 134,
+  "is_hyper_param_search": true,
+  "is_local_process_zero": true,
+  "is_world_process_zero": true,
+  "log_history": [
+    {
+      "epoch": 1.0,
+      "eval_loss": 0.4657443165779114,
+      "eval_matthews_correlation": 0.4751366513569292,
+      "eval_runtime": 0.7348,
+      "eval_samples_per_second": 1419.5,
+      "eval_steps_per_second": 89.825,
+      "step": 134
+    }
+  ],
+  "logging_steps": 500,
+  "max_steps": 268,
+  "num_input_tokens_seen": 0,
+  "num_train_epochs": 2,
+  "save_steps": 500,
+  "total_flos": 0,
+  "train_batch_size": 64,
+  "trial_name": null,
+  "trial_params": {
+    "learning_rate": 3.3864170205221844e-05,
+    "num_train_epochs": 2,
+    "per_device_train_batch_size": 64,
+    "seed": 16
+  }
+}

run-6/checkpoint-134/training_args.bin ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:bb80389a7fc088e5844ba718e7e18b53f00364a3051c518916518ff469150fda
+size 5048

run-6/checkpoint-134/vocab.txt ADDED Viewed

The diff for this file is too large to render. See raw diff

runs/Mar23_02-14-11_d179836e26c8/events.out.tfevents.1711161215.d179836e26c8.903.10 ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:41b906996a25d9d0d72a59bbe4c225d5224638780e7c13e7c1a50bcc07d050e5
+size 5631

training_args.bin CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:bb396c880ed21cbe5386566eb59cb1266f1baa96469ad33b08f5bdf8bfd36bd0
+oid sha256:bb80389a7fc088e5844ba718e7e18b53f00364a3051c518916518ff469150fda
 size 5048