Model save

Browse files

Files changed (9) hide show

README.md +69 -0
config.json +129 -0
model.safetensors +3 -0
runs/Aug06_13-28-33_10db6dd1f421/events.out.tfevents.1722950924.10db6dd1f421.959.0 +3 -0
special_tokens_map.json +7 -0
tokenizer.json +0 -0
tokenizer_config.json +55 -0
training_args.bin +3 -0
vocab.txt +0 -0

README.md ADDED Viewed

	@@ -0,0 +1,69 @@

+---
+license: mit
+base_model: google-bert/bert-base-german-cased
+tags:
+- generated_from_trainer
+metrics:
+- accuracy
+model-index:
+- name: BERT_Reciever_6
+  results: []
+---
+<!-- This model card has been generated automatically according to the information the Trainer had access to. You
+should probably proofread and complete it, then remove this comment. -->
+# BERT_Reciever_6
+This model is a fine-tuned version of [google-bert/bert-base-german-cased](https://huggingface.co/google-bert/bert-base-german-cased) on an unknown dataset.
+It achieves the following results on the evaluation set:
+- Loss: 0.1356
+- Accuracy: 0.9561
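+## Model description
+A `BertForSequenceClassification` model built on `google-bert/bert-base-german-cased` for single-label text classification over 49 classes, whose labels are the strings "0" to "48". Class indices follow the lexicographic order of those label strings (for example, index 2 is label "10" and index 12 is label "2"), so translate predictions through `id2label` in `config.json` instead of reading the predicted index as the label. More information is needed on what the labels represent.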
+## Intended uses & limitations
+More information needed
+## Training and evaluation data
+More information needed
+## Training procedure
+### Training hyperparameters
+The following hyperparameters were used during training:
+- learning_rate: 0.0001
+- train_batch_size: 160
+- eval_batch_size: 160
+- seed: 2805
+- optimizer: Adam with betas=(0.9,0.999) and epsilon=1e-08
+- lr_scheduler_type: linear
+- num_epochs: 10.0
+### Training results
+| Training Loss | Epoch | Step | Validation Loss | Accuracy |
+|:-------------:|:-----:|:----:|:---------------:|:--------:|
+| No log        | 1.0   | 31   | 0.3889          | 0.9196   |
+| No log        | 2.0   | 62   | 0.2137          | 0.9342   |
+| No log        | 3.0   | 93   | 0.1763          | 0.9433   |
+| No log        | 4.0   | 124  | 0.1660          | 0.9433   |
+| No log        | 5.0   | 155  | 0.1592          | 0.9415   |
+| No log        | 6.0   | 186  | 0.1522          | 0.9470   |
+| No log        | 7.0   | 217  | 0.1454          | 0.9525   |
+| No log        | 8.0   | 248  | 0.1448          | 0.9506   |
+| No log        | 9.0   | 279  | 0.1388          | 0.9525   |
+| No log        | 10.0  | 310  | 0.1356          | 0.9561   |
+### Framework versions
+- Transformers 4.44.0.dev0
+- Pytorch 2.3.1+cu121
+- Datasets 2.20.0
+- Tokenizers 0.19.1

config.json ADDED Viewed

	@@ -0,0 +1,129 @@

+{
+  "_name_or_path": "google-bert/bert-base-german-cased",
+  "architectures": [
+    "BertForSequenceClassification"
+  ],
+  "attention_probs_dropout_prob": 0.1,
+  "classifier_dropout": null,
+  "finetuning_task": "text-classification",
+  "hidden_act": "gelu",
+  "hidden_dropout_prob": 0.1,
+  "hidden_size": 768,
+  "id2label": {
+    "0": "0",
+    "1": "1",
+    "2": "10",
+    "3": "11",
+    "4": "12",
+    "5": "13",
+    "6": "14",
+    "7": "15",
+    "8": "16",
+    "9": "17",
+    "10": "18",
+    "11": "19",
+    "12": "2",
+    "13": "20",
+    "14": "21",
+    "15": "22",
+    "16": "23",
+    "17": "24",
+    "18": "25",
+    "19": "26",
+    "20": "27",
+    "21": "28",
+    "22": "29",
+    "23": "3",
+    "24": "30",
+    "25": "31",
+    "26": "32",
+    "27": "33",
+    "28": "34",
+    "29": "35",
+    "30": "36",
+    "31": "37",
+    "32": "38",
+    "33": "39",
+    "34": "4",
+    "35": "40",
+    "36": "41",
+    "37": "42",
+    "38": "43",
+    "39": "44",
+    "40": "45",
+    "41": "46",
+    "42": "47",
+    "43": "48",
+    "44": "5",
+    "45": "6",
+    "46": "7",
+    "47": "8",
+    "48": "9"
+  },
+  "initializer_range": 0.02,
+  "intermediate_size": 3072,
+  "label2id": {
+    "0": 0,
+    "1": 1,
+    "10": 2,
+    "11": 3,
+    "12": 4,
+    "13": 5,
+    "14": 6,
+    "15": 7,
+    "16": 8,
+    "17": 9,
+    "18": 10,
+    "19": 11,
+    "2": 12,
+    "20": 13,
+    "21": 14,
+    "22": 15,
+    "23": 16,
+    "24": 17,
+    "25": 18,
+    "26": 19,
+    "27": 20,
+    "28": 21,
+    "29": 22,
+    "3": 23,
+    "30": 24,
+    "31": 25,
+    "32": 26,
+    "33": 27,
+    "34": 28,
+    "35": 29,
+    "36": 30,
+    "37": 31,
+    "38": 32,
+    "39": 33,
+    "4": 34,
+    "40": 35,
+    "41": 36,
+    "42": 37,
+    "43": 38,
+    "44": 39,
+    "45": 40,
+    "46": 41,
+    "47": 42,
+    "48": 43,
+    "5": 44,
+    "6": 45,
+    "7": 46,
+    "8": 47,
+    "9": 48
+  },
+  "layer_norm_eps": 1e-12,
+  "max_position_embeddings": 512,
+  "model_type": "bert",
+  "num_attention_heads": 12,
+  "num_hidden_layers": 12,
+  "pad_token_id": 0,
+  "position_embedding_type": "absolute",
+  "problem_type": "single_label_classification",
+  "torch_dtype": "float32",
+  "transformers_version": "4.44.0.dev0",
+  "type_vocab_size": 2,
+  "use_cache": true,
+  "vocab_size": 30000
+}

model.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:76cbdbb60327ef2490b757bde465dd28d47a9d68fde85bf31f3a66d40b268588
+size 436499628

runs/Aug06_13-28-33_10db6dd1f421/events.out.tfevents.1722950924.10db6dd1f421.959.0 ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:0062d70a4b4a20e43ecea222269addaf68179eb95f560e811fce32778188b5fb
+size 10030

special_tokens_map.json ADDED Viewed

	@@ -0,0 +1,7 @@

+{
+  "cls_token": "[CLS]",
+  "mask_token": "[MASK]",
+  "pad_token": "[PAD]",
+  "sep_token": "[SEP]",
+  "unk_token": "[UNK]"
+}

tokenizer.json ADDED Viewed

The diff for this file is too large to render. See raw diff

tokenizer_config.json ADDED Viewed

	@@ -0,0 +1,55 @@

+{
+  "added_tokens_decoder": {
+    "0": {
+      "content": "[PAD]",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "2": {
+      "content": "[UNK]",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "3": {
+      "content": "[CLS]",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "4": {
+      "content": "[SEP]",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "5": {
+      "content": "[MASK]",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    }
+  },
+  "clean_up_tokenization_spaces": true,
+  "cls_token": "[CLS]",
+  "do_lower_case": false,
+  "mask_token": "[MASK]",
+  "model_max_length": 512,
+  "pad_token": "[PAD]",
+  "sep_token": "[SEP]",
+  "strip_accents": null,
+  "tokenize_chinese_chars": true,
+  "tokenizer_class": "BertTokenizer",
+  "unk_token": "[UNK]"
+}

training_args.bin ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:e81911aff73cd24327c590422964b2e1d0f1fbc8b39abd845bbefdd204d7c63d
+size 5240

vocab.txt ADDED Viewed

The diff for this file is too large to render. See raw diff