diogopaes10 committed on Jul 22, 2023

Commit

66fe6a4

•

1 Parent(s): 8eb03d2

End of training

Browse files

Files changed (26) hide show

checkpoint-3000/pytorch_model.bin +0 -3
checkpoint-3000/rng_state.pth +0 -3
checkpoint-3000/scheduler.pt +0 -3
checkpoint-3000/trainer_state.json +0 -412
checkpoint-3250/added_tokens.json +0 -3
checkpoint-3250/config.json +0 -59
checkpoint-3250/optimizer.pt +0 -3
checkpoint-3250/special_tokens_map.json +0 -9
checkpoint-3250/spm.model +0 -3
checkpoint-3250/tokenizer.json +0 -0
checkpoint-3250/tokenizer_config.json +0 -16
{checkpoint-3000 → checkpoint-3750}/added_tokens.json +0 -0
{checkpoint-3000 → checkpoint-3750}/config.json +0 -0
{checkpoint-3000 → checkpoint-3750}/optimizer.pt +1 -1
{checkpoint-3250 → checkpoint-3750}/pytorch_model.bin +1 -1
{checkpoint-3250 → checkpoint-3750}/rng_state.pth +1 -1
{checkpoint-3250 → checkpoint-3750}/scheduler.pt +1 -1
{checkpoint-3000 → checkpoint-3750}/special_tokens_map.json +0 -0
{checkpoint-3000 → checkpoint-3750}/spm.model +0 -0
{checkpoint-3000 → checkpoint-3750}/tokenizer.json +0 -0
{checkpoint-3000 → checkpoint-3750}/tokenizer_config.json +0 -0
{checkpoint-3250 → checkpoint-3750}/trainer_state.json +55 -3
{checkpoint-3000 → checkpoint-3750}/training_args.bin +0 -0
pytorch_model.bin +1 -1
runs/Jul22_21-19-20_ab4276e44fca/events.out.tfevents.1690060770.ab4276e44fca.659.0 +2 -2
checkpoint-3250/training_args.bin → runs/Jul22_21-19-20_ab4276e44fca/events.out.tfevents.1690061518.ab4276e44fca.659.1 +2 -2

checkpoint-3000/pytorch_model.bin DELETED Viewed

@@ -1,3 +0,0 @@
-version https://git-lfs.github.com/spec/v1
-oid sha256:c95f2d92d432e839ff645f87515fc248494db36dac837cae703842d2cbf775e5
-size 737788917

checkpoint-3000/rng_state.pth DELETED Viewed

@@ -1,3 +0,0 @@
-version https://git-lfs.github.com/spec/v1
-oid sha256:30675d1e37d339cae6e3dc477927b70e39062f0910613a7d90db6c1671bca5bc
-size 14575

checkpoint-3000/scheduler.pt DELETED Viewed

@@ -1,3 +0,0 @@
-version https://git-lfs.github.com/spec/v1
-oid sha256:68cbe85bad4e57d93e8caf9830d7003e889867d2bc1bdf97b16703437df161a3
-size 627

checkpoint-3000/trainer_state.json DELETED Viewed

@@ -1,412 +0,0 @@
-{
-  "best_metric": null,
-  "best_model_checkpoint": null,
-  "epoch": 12.0,
-  "global_step": 3000,
-  "is_hyper_param_search": false,
-  "is_local_process_zero": true,
-  "is_world_process_zero": true,
-  "log_history": [
-    {
-      "epoch": 0.0,
-      "learning_rate": 1.999466666666667e-05,
-      "loss": 2.308,
-      "step": 1
-    },
-    {
-      "epoch": 0.75,
-      "learning_rate": 1.8997333333333335e-05,
-      "loss": 1.6916,
-      "step": 188
-    },
-    {
-      "epoch": 0.75,
-      "eval_accuracy": 0.6755,
-      "eval_disk_space_total": 78.1898422241211,
-      "eval_disk_space_used": 24.806385040283203,
-      "eval_f1": 0.6708054417489328,
-      "eval_gpu_ram_allocated": 2.089780330657959,
-      "eval_gpu_ram_cached": 25.85546875,
-      "eval_gpu_ram_total": 39.56402587890625,
-      "eval_gpu_utilization": 50,
-      "eval_loss": 1.1062816381454468,
-      "eval_precision": 0.690043017889279,
-      "eval_recall": 0.6755,
-      "eval_runtime": 2.3912,
-      "eval_samples_per_second": 836.398,
-      "eval_steps_per_second": 26.347,
-      "eval_system_ram_total": 83.48074722290039,
-      "eval_system_ram_used": 4.019077301025391,
-      "step": 188
-    },
-    {
-      "epoch": 1.5,
-      "learning_rate": 1.8e-05,
-      "loss": 0.9694,
-      "step": 376
-    },
-    {
-      "epoch": 1.5,
-      "eval_accuracy": 0.7195,
-      "eval_disk_space_total": 78.1898422241211,
-      "eval_disk_space_used": 29.64177703857422,
-      "eval_f1": 0.7181081417115642,
-      "eval_gpu_ram_allocated": 2.0897774696350098,
-      "eval_gpu_ram_cached": 25.85546875,
-      "eval_gpu_ram_total": 39.56402587890625,
-      "eval_gpu_utilization": 50,
-      "eval_loss": 0.9585903286933899,
-      "eval_precision": 0.719758443061289,
-      "eval_recall": 0.7195,
-      "eval_runtime": 2.3693,
-      "eval_samples_per_second": 844.141,
-      "eval_steps_per_second": 26.59,
-      "eval_system_ram_total": 83.48074722290039,
-      "eval_system_ram_used": 4.2536163330078125,
-      "step": 376
-    },
-    {
-      "epoch": 2.26,
-      "learning_rate": 1.6997333333333334e-05,
-      "loss": 0.8509,
-      "step": 564
-    },
-    {
-      "epoch": 2.26,
-      "eval_accuracy": 0.712,
-      "eval_disk_space_total": 78.1898422241211,
-      "eval_disk_space_used": 29.641841888427734,
-      "eval_f1": 0.7070168337920522,
-      "eval_gpu_ram_allocated": 2.089791774749756,
-      "eval_gpu_ram_cached": 25.85546875,
-      "eval_gpu_ram_total": 39.56402587890625,
-      "eval_gpu_utilization": 46,
-      "eval_loss": 0.9747923016548157,
-      "eval_precision": 0.7160570316458433,
-      "eval_recall": 0.712,
-      "eval_runtime": 2.4432,
-      "eval_samples_per_second": 818.586,
-      "eval_steps_per_second": 25.785,
-      "eval_system_ram_total": 83.48074722290039,
-      "eval_system_ram_used": 4.160213470458984,
-      "step": 564
-    },
-    {
-      "epoch": 3.01,
-      "learning_rate": 1.5994666666666668e-05,
-      "loss": 0.7475,
-      "step": 752
-    },
-    {
-      "epoch": 3.01,
-      "eval_accuracy": 0.714,
-      "eval_disk_space_total": 78.1898422241211,
-      "eval_disk_space_used": 29.641963958740234,
-      "eval_f1": 0.7122032912823338,
-      "eval_gpu_ram_allocated": 2.089776039123535,
-      "eval_gpu_ram_cached": 25.85546875,
-      "eval_gpu_ram_total": 39.56402587890625,
-      "eval_gpu_utilization": 50,
-      "eval_loss": 0.9446640014648438,
-      "eval_precision": 0.7148157467744413,
-      "eval_recall": 0.714,
-      "eval_runtime": 2.5063,
-      "eval_samples_per_second": 798.001,
-      "eval_steps_per_second": 25.137,
-      "eval_system_ram_total": 83.48074722290039,
-      "eval_system_ram_used": 4.160709381103516,
-      "step": 752
-    },
-    {
-      "epoch": 3.76,
-      "learning_rate": 1.4997333333333335e-05,
-      "loss": 0.5841,
-      "step": 940
-    },
-    {
-      "epoch": 3.76,
-      "eval_accuracy": 0.711,
-      "eval_disk_space_total": 78.1898422241211,
-      "eval_disk_space_used": 29.642024993896484,
-      "eval_f1": 0.7076606604060025,
-      "eval_gpu_ram_allocated": 2.089787483215332,
-      "eval_gpu_ram_cached": 25.85546875,
-      "eval_gpu_ram_total": 39.56402587890625,
-      "eval_gpu_utilization": 47,
-      "eval_loss": 1.0064291954040527,
-      "eval_precision": 0.7225290812411572,
-      "eval_recall": 0.711,
-      "eval_runtime": 2.4755,
-      "eval_samples_per_second": 807.933,
-      "eval_steps_per_second": 25.45,
-      "eval_system_ram_total": 83.48074722290039,
-      "eval_system_ram_used": 4.188880920410156,
-      "step": 940
-    },
-    {
-      "epoch": 4.51,
-      "learning_rate": 1.3994666666666668e-05,
-      "loss": 0.4972,
-      "step": 1128
-    },
-    {
-      "epoch": 4.51,
-      "eval_accuracy": 0.714,
-      "eval_disk_space_total": 78.1898422241211,
-      "eval_disk_space_used": 29.642135620117188,
-      "eval_f1": 0.7109995031569997,
-      "eval_gpu_ram_allocated": 2.089801788330078,
-      "eval_gpu_ram_cached": 25.85546875,
-      "eval_gpu_ram_total": 39.56402587890625,
-      "eval_gpu_utilization": 47,
-      "eval_loss": 1.0585097074508667,
-      "eval_precision": 0.7129473752365556,
-      "eval_recall": 0.714,
-      "eval_runtime": 2.3843,
-      "eval_samples_per_second": 838.824,
-      "eval_steps_per_second": 26.423,
-      "eval_system_ram_total": 83.48074722290039,
-      "eval_system_ram_used": 4.176631927490234,
-      "step": 1128
-    },
-    {
-      "epoch": 5.26,
-      "learning_rate": 1.2992e-05,
-      "loss": 0.4555,
-      "step": 1316
-    },
-    {
-      "epoch": 5.26,
-      "eval_accuracy": 0.7075,
-      "eval_disk_space_total": 78.1898422241211,
-      "eval_disk_space_used": 33.76519775390625,
-      "eval_f1": 0.7086283787248422,
-      "eval_gpu_ram_allocated": 2.089810371398926,
-      "eval_gpu_ram_cached": 25.85546875,
-      "eval_gpu_ram_total": 39.56402587890625,
-      "eval_gpu_utilization": 46,
-      "eval_loss": 1.117536187171936,
-      "eval_precision": 0.71510102752271,
-      "eval_recall": 0.7075,
-      "eval_runtime": 2.5545,
-      "eval_samples_per_second": 782.936,
-      "eval_steps_per_second": 24.662,
-      "eval_system_ram_total": 83.48074722290039,
-      "eval_system_ram_used": 4.225734710693359,
-      "step": 1316
-    },
-    {
-      "epoch": 6.02,
-      "learning_rate": 1.1989333333333336e-05,
-      "loss": 0.3535,
-      "step": 1504
-    },
-    {
-      "epoch": 6.02,
-      "eval_accuracy": 0.708,
-      "eval_disk_space_total": 78.1898422241211,
-      "eval_disk_space_used": 33.76530456542969,
-      "eval_f1": 0.7032209621498534,
-      "eval_gpu_ram_allocated": 2.0898032188415527,
-      "eval_gpu_ram_cached": 25.85546875,
-      "eval_gpu_ram_total": 39.56402587890625,
-      "eval_gpu_utilization": 50,
-      "eval_loss": 1.1748836040496826,
-      "eval_precision": 0.7076659711678004,
-      "eval_recall": 0.708,
-      "eval_runtime": 2.3932,
-      "eval_samples_per_second": 835.715,
-      "eval_steps_per_second": 26.325,
-      "eval_system_ram_total": 83.48074722290039,
-      "eval_system_ram_used": 4.23016357421875,
-      "step": 1504
-    },
-    {
-      "epoch": 6.77,
-      "learning_rate": 1.0986666666666668e-05,
-      "loss": 0.2614,
-      "step": 1692
-    },
-    {
-      "epoch": 6.77,
-      "eval_accuracy": 0.709,
-      "eval_disk_space_total": 78.1898422241211,
-      "eval_disk_space_used": 33.76542282104492,
-      "eval_f1": 0.7056311006074188,
-      "eval_gpu_ram_allocated": 2.089783191680908,
-      "eval_gpu_ram_cached": 25.85546875,
-      "eval_gpu_ram_total": 39.56402587890625,
-      "eval_gpu_utilization": 49,
-      "eval_loss": 1.2027860879898071,
-      "eval_precision": 0.7079398723985221,
-      "eval_recall": 0.709,
-      "eval_runtime": 2.3888,
-      "eval_samples_per_second": 837.234,
-      "eval_steps_per_second": 26.373,
-      "eval_system_ram_total": 83.48074722290039,
-      "eval_system_ram_used": 4.237628936767578,
-      "step": 1692
-    },
-    {
-      "epoch": 7.52,
-      "learning_rate": 9.984e-06,
-      "loss": 0.2321,
-      "step": 1880
-    },
-    {
-      "epoch": 7.52,
-      "eval_accuracy": 0.698,
-      "eval_disk_space_total": 78.1898422241211,
-      "eval_disk_space_used": 33.7656135559082,
-      "eval_f1": 0.7018556265437493,
-      "eval_gpu_ram_allocated": 2.089846134185791,
-      "eval_gpu_ram_cached": 25.85546875,
-      "eval_gpu_ram_total": 39.56402587890625,
-      "eval_gpu_utilization": 49,
-      "eval_loss": 1.2960551977157593,
-      "eval_precision": 0.708462957552084,
-      "eval_recall": 0.698,
-      "eval_runtime": 2.391,
-      "eval_samples_per_second": 836.478,
-      "eval_steps_per_second": 26.349,
-      "eval_system_ram_total": 83.48074722290039,
-      "eval_system_ram_used": 4.224781036376953,
-      "step": 1880
-    },
-    {
-      "epoch": 8.27,
-      "learning_rate": 8.981333333333333e-06,
-      "loss": 0.197,
-      "step": 2068
-    },
-    {
-      "epoch": 8.27,
-      "eval_accuracy": 0.712,
-      "eval_disk_space_total": 78.1898422241211,
-      "eval_disk_space_used": 33.7657470703125,
-      "eval_f1": 0.7097931257647566,
-      "eval_gpu_ram_allocated": 2.0897903442382812,
-      "eval_gpu_ram_cached": 25.85546875,
-      "eval_gpu_ram_total": 39.56402587890625,
-      "eval_gpu_utilization": 45,
-      "eval_loss": 1.3960117101669312,
-      "eval_precision": 0.7137187449926237,
-      "eval_recall": 0.712,
-      "eval_runtime": 2.3878,
-      "eval_samples_per_second": 837.604,
-      "eval_steps_per_second": 26.385,
-      "eval_system_ram_total": 83.48074722290039,
-      "eval_system_ram_used": 4.219398498535156,
-      "step": 2068
-    },
-    {
-      "epoch": 9.02,
-      "learning_rate": 7.978666666666667e-06,
-      "loss": 0.1505,
-      "step": 2256
-    },
-    {
-      "epoch": 9.02,
-      "eval_accuracy": 0.7075,
-      "eval_disk_space_total": 78.1898422241211,
-      "eval_disk_space_used": 35.827659606933594,
-      "eval_f1": 0.709341703450241,
-      "eval_gpu_ram_allocated": 2.0897817611694336,
-      "eval_gpu_ram_cached": 25.85546875,
-      "eval_gpu_ram_total": 39.56402587890625,
-      "eval_gpu_utilization": 48,
-      "eval_loss": 1.4310206174850464,
-      "eval_precision": 0.7133423622104005,
-      "eval_recall": 0.7075,
-      "eval_runtime": 2.4471,
-      "eval_samples_per_second": 817.29,
-      "eval_steps_per_second": 25.745,
-      "eval_system_ram_total": 83.48074722290039,
-      "eval_system_ram_used": 4.2417755126953125,
-      "step": 2256
-    },
-    {
-      "epoch": 9.78,
-      "learning_rate": 6.976000000000001e-06,
-      "loss": 0.1132,
-      "step": 2444
-    },
-    {
-      "epoch": 9.78,
-      "eval_accuracy": 0.7045,
-      "eval_disk_space_total": 78.1898422241211,
-      "eval_disk_space_used": 35.827754974365234,
-      "eval_f1": 0.705265213679387,
-      "eval_gpu_ram_allocated": 2.089801788330078,
-      "eval_gpu_ram_cached": 25.85546875,
-      "eval_gpu_ram_total": 39.56402587890625,
-      "eval_gpu_utilization": 48,
-      "eval_loss": 1.5454399585723877,
-      "eval_precision": 0.7097494768850874,
-      "eval_recall": 0.7045,
-      "eval_runtime": 2.5035,
-      "eval_samples_per_second": 798.873,
-      "eval_steps_per_second": 25.165,
-      "eval_system_ram_total": 83.48074722290039,
-      "eval_system_ram_used": 4.293117523193359,
-      "step": 2444
-    },
-    {
-      "epoch": 10.53,
-      "learning_rate": 5.973333333333334e-06,
-      "loss": 0.0979,
-      "step": 2632
-    },
-    {
-      "epoch": 10.53,
-      "eval_accuracy": 0.708,
-      "eval_disk_space_total": 78.1898422241211,
-      "eval_disk_space_used": 35.82805252075195,
-      "eval_f1": 0.7090322597492875,
-      "eval_gpu_ram_allocated": 2.089801788330078,
-      "eval_gpu_ram_cached": 25.85546875,
-      "eval_gpu_ram_total": 39.56402587890625,
-      "eval_gpu_utilization": 45,
-      "eval_loss": 1.64204740524292,
-      "eval_precision": 0.7171054872018443,
-      "eval_recall": 0.708,
-      "eval_runtime": 2.5339,
-      "eval_samples_per_second": 789.29,
-      "eval_steps_per_second": 24.863,
-      "eval_system_ram_total": 83.48074722290039,
-      "eval_system_ram_used": 4.279300689697266,
-      "step": 2632
-    },
-    {
-      "epoch": 11.28,
-      "learning_rate": 4.976e-06,
-      "loss": 0.0818,
-      "step": 2820
-    },
-    {
-      "epoch": 11.28,
-      "eval_accuracy": 0.7065,
-      "eval_disk_space_total": 78.1898422241211,
-      "eval_disk_space_used": 35.828128814697266,
-      "eval_f1": 0.706242034421972,
-      "eval_gpu_ram_allocated": 2.0898447036743164,
-      "eval_gpu_ram_cached": 25.85546875,
-      "eval_gpu_ram_total": 39.56402587890625,
-      "eval_gpu_utilization": 49,
-      "eval_loss": 1.686875820159912,
-      "eval_precision": 0.7102028476355108,
-      "eval_recall": 0.7065,
-      "eval_runtime": 2.4408,
-      "eval_samples_per_second": 819.396,
-      "eval_steps_per_second": 25.811,
-      "eval_system_ram_total": 83.48074722290039,
-      "eval_system_ram_used": 4.2822418212890625,
-      "step": 2820
-    }
-  ],
-  "max_steps": 3750,
-  "num_train_epochs": 15,
-  "total_flos": 5780526048262272.0,
-  "trial_name": null,
-  "trial_params": null
-}

checkpoint-3250/added_tokens.json DELETED Viewed

@@ -1,3 +0,0 @@
-{
-  "[MASK]": 128000
-}

checkpoint-3250/config.json DELETED Viewed

@@ -1,59 +0,0 @@
-{
-  "_name_or_path": "microsoft/deberta-v3-base",
-  "architectures": [
-    "DebertaV2ForSequenceClassification"
-  ],
-  "attention_probs_dropout_prob": 0.1,
-  "hidden_act": "gelu",
-  "hidden_dropout_prob": 0.1,
-  "hidden_size": 768,
-  "id2label": {
-    "0": "Society & Culture",
-    "1": "Science & Mathematics",
-    "2": "Health",
-    "3": "Education & Reference",
-    "4": "Computers & Internet",
-    "5": "Sports",
-    "6": "Business & Finance",
-    "7": "Entertainment & Music",
-    "8": "Family & Relationships",
-    "9": "Politics & Government"
-  },
-  "initializer_range": 0.02,
-  "intermediate_size": 3072,
-  "label2id": {
-    "Business & Finance": 6,
-    "Computers & Internet": 4,
-    "Education & Reference": 3,
-    "Entertainment & Music": 7,
-    "Family & Relationships": 8,
-    "Health": 2,
-    "Politics & Government": 9,
-    "Science & Mathematics": 1,
-    "Society & Culture": 0,
-    "Sports": 5
-  },
-  "layer_norm_eps": 1e-07,
-  "max_position_embeddings": 512,
-  "max_relative_positions": -1,
-  "model_type": "deberta-v2",
-  "norm_rel_ebd": "layer_norm",
-  "num_attention_heads": 12,
-  "num_hidden_layers": 12,
-  "pad_token_id": 0,
-  "pooler_dropout": 0,
-  "pooler_hidden_act": "gelu",
-  "pooler_hidden_size": 768,
-  "pos_att_type": [
-    "p2c",
-    "c2p"
-  ],
-  "position_biased_input": false,
-  "position_buckets": 256,
-  "relative_attention": true,
-  "share_att_key": true,
-  "torch_dtype": "float32",
-  "transformers_version": "4.31.0",
-  "type_vocab_size": 0,
-  "vocab_size": 128100
-}

checkpoint-3250/optimizer.pt DELETED Viewed

@@ -1,3 +0,0 @@
-version https://git-lfs.github.com/spec/v1
-oid sha256:f17eacaf5376c0fabb8aeff03d05e59319e7a180e3c00d273c966e5a26d33f06
-size 1475557125

checkpoint-3250/special_tokens_map.json DELETED Viewed

@@ -1,9 +0,0 @@
-{
-  "bos_token": "[CLS]",
-  "cls_token": "[CLS]",
-  "eos_token": "[SEP]",
-  "mask_token": "[MASK]",
-  "pad_token": "[PAD]",
-  "sep_token": "[SEP]",
-  "unk_token": "[UNK]"
-}

checkpoint-3250/spm.model DELETED Viewed

@@ -1,3 +0,0 @@
-version https://git-lfs.github.com/spec/v1
-oid sha256:c679fbf93643d19aab7ee10c0b99e460bdbc02fedf34b92b05af343b4af586fd
-size 2464616

checkpoint-3250/tokenizer.json DELETED Viewed

The diff for this file is too large to render. See raw diff

checkpoint-3250/tokenizer_config.json DELETED Viewed

@@ -1,16 +0,0 @@
-{
-  "bos_token": "[CLS]",
-  "clean_up_tokenization_spaces": true,
-  "cls_token": "[CLS]",
-  "do_lower_case": false,
-  "eos_token": "[SEP]",
-  "mask_token": "[MASK]",
-  "model_max_length": 1000000000000000019884624838656,
-  "pad_token": "[PAD]",
-  "sep_token": "[SEP]",
-  "sp_model_kwargs": {},
-  "split_by_punct": false,
-  "tokenizer_class": "DebertaV2Tokenizer",
-  "unk_token": "[UNK]",
-  "vocab_type": "spm"
-}

{checkpoint-3000 → checkpoint-3750}/added_tokens.json RENAMED Viewed

File without changes

{checkpoint-3000 → checkpoint-3750}/config.json RENAMED Viewed

File without changes

{checkpoint-3000 → checkpoint-3750}/optimizer.pt RENAMED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:6a06836e74e2ee556f75e4f728cb07fd38bf7dca4688b3915aab2696b9adac99
 size 1475557125

 version https://git-lfs.github.com/spec/v1
+oid sha256:d156da8a469609a065c22691bca354b9e5e529ba5788e4c6a2fb2c05ca16bac3
 size 1475557125

{checkpoint-3250 → checkpoint-3750}/pytorch_model.bin RENAMED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:ab87f1854f930634513326e51246eb456af5e9a20373ec512925553c65de13d4
 size 737788917

 version https://git-lfs.github.com/spec/v1
+oid sha256:cb9e4b3254fdacaf6fa2e542ebcdfaf789e8bac3209c97fa9884b99c6abaf00f
 size 737788917

{checkpoint-3250 → checkpoint-3750}/rng_state.pth RENAMED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:e9318169f07f11cd9456a08a8554cc70b98429bd8764cb326d58f8d40bc05005
 size 14575

 version https://git-lfs.github.com/spec/v1
+oid sha256:6586d391e812ac443d153fe39b51387d1776691cc74a4237b33c00b1c485b263
 size 14575

{checkpoint-3250 → checkpoint-3750}/scheduler.pt RENAMED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:6b6692caff16315b18091d72ba55872cc98f8a135dd4601d0a933fafdf6b6bcd
 size 627

 version https://git-lfs.github.com/spec/v1
+oid sha256:c7c58bc37a8c98d0bf14317ace8f986ecedea9d0665ee8450abd7629af8cb1e9
 size 627

{checkpoint-3000 → checkpoint-3750}/special_tokens_map.json RENAMED Viewed

File without changes

{checkpoint-3000 → checkpoint-3750}/spm.model RENAMED Viewed

File without changes

{checkpoint-3000 → checkpoint-3750}/tokenizer.json RENAMED Viewed

File without changes

{checkpoint-3000 → checkpoint-3750}/tokenizer_config.json RENAMED Viewed

File without changes

{checkpoint-3250 → checkpoint-3750}/trainer_state.json RENAMED Viewed

@@ -1,8 +1,8 @@
 {
   "best_metric": null,
   "best_model_checkpoint": null,
-  "epoch": 13.0,
-  "global_step": 3250,
   "is_hyper_param_search": false,
   "is_local_process_zero": true,
   "is_world_process_zero": true,
@@ -454,11 +454,63 @@
       "eval_system_ram_total": 83.48074722290039,
       "eval_system_ram_used": 4.266563415527344,
       "step": 3196
     }
   ],
   "max_steps": 3750,
   "num_train_epochs": 15,
-  "total_flos": 6259743625357056.0,
   "trial_name": null,
   "trial_params": null
 }

 {
   "best_metric": null,
   "best_model_checkpoint": null,
+  "epoch": 15.0,
+  "global_step": 3750,
   "is_hyper_param_search": false,
   "is_local_process_zero": true,
   "is_world_process_zero": true,
       "eval_system_ram_total": 83.48074722290039,
       "eval_system_ram_used": 4.266563415527344,
       "step": 3196
+    },
+    {
+      "epoch": 13.54,
+      "learning_rate": 1.968e-06,
+      "loss": 0.0368,
+      "step": 3384
+    },
+    {
+      "epoch": 13.54,
+      "eval_accuracy": 0.7055,
+      "eval_disk_space_total": 78.1898422241211,
+      "eval_disk_space_used": 35.828514099121094,
+      "eval_f1": 0.7079190260942086,
+      "eval_gpu_ram_allocated": 2.0898475646972656,
+      "eval_gpu_ram_cached": 25.85546875,
+      "eval_gpu_ram_total": 39.56402587890625,
+      "eval_gpu_utilization": 47,
+      "eval_loss": 1.8403420448303223,
+      "eval_precision": 0.7131395828448935,
+      "eval_recall": 0.7055,
+      "eval_runtime": 2.4685,
+      "eval_samples_per_second": 810.214,
+      "eval_steps_per_second": 25.522,
+      "eval_system_ram_total": 83.48074722290039,
+      "eval_system_ram_used": 4.278324127197266,
+      "step": 3384
+    },
+    {
+      "epoch": 14.29,
+      "learning_rate": 9.653333333333333e-07,
+      "loss": 0.0379,
+      "step": 3572
+    },
+    {
+      "epoch": 14.29,
+      "eval_accuracy": 0.705,
+      "eval_disk_space_total": 78.1898422241211,
+      "eval_disk_space_used": 35.828582763671875,
+      "eval_f1": 0.7051869329304575,
+      "eval_gpu_ram_allocated": 2.089784622192383,
+      "eval_gpu_ram_cached": 25.85546875,
+      "eval_gpu_ram_total": 39.56402587890625,
+      "eval_gpu_utilization": 47,
+      "eval_loss": 1.8535802364349365,
+      "eval_precision": 0.7073671527926624,
+      "eval_recall": 0.705,
+      "eval_runtime": 2.4945,
+      "eval_samples_per_second": 801.76,
+      "eval_steps_per_second": 25.255,
+      "eval_system_ram_total": 83.48074722290039,
+      "eval_system_ram_used": 4.301258087158203,
+      "step": 3572
     }
   ],
   "max_steps": 3750,
   "num_train_epochs": 15,
+  "total_flos": 7220464762017408.0,
   "trial_name": null,
   "trial_params": null
 }

{checkpoint-3000 → checkpoint-3750}/training_args.bin RENAMED Viewed

File without changes

pytorch_model.bin CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:ab87f1854f930634513326e51246eb456af5e9a20373ec512925553c65de13d4
 size 737788917

 version https://git-lfs.github.com/spec/v1
+oid sha256:cb9e4b3254fdacaf6fa2e542ebcdfaf789e8bac3209c97fa9884b99c6abaf00f
 size 737788917

runs/Jul22_21-19-20_ab4276e44fca/events.out.tfevents.1690060770.ab4276e44fca.659.0 CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:a0676d7575783045c7b0b81b3dac8f9748e1362dd10f8ada9768f991e63e7691
-size 23854

 version https://git-lfs.github.com/spec/v1
+oid sha256:d7cc1c502b7afe0f436409a4e0fe91d0bca050eb10ee5cd85dbc61b0ffa714a0
+size 26412

checkpoint-3250/training_args.bin → runs/Jul22_21-19-20_ab4276e44fca/events.out.tfevents.1690061518.ab4276e44fca.659.1 RENAMED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:c483311c6e034a3b791b3aba6061603f3b239dec5f5cd88a867a5f6743909401
-size 4091

 version https://git-lfs.github.com/spec/v1
+oid sha256:8f403714063524786ff7cc8bc9849d04c002300dca210402782a59c99edb0de9
+size 1033