HuggingAlex1247 committed on
Commit
37b249b
1 Parent(s): 6dc8ec0

Training in progress epoch 0

Browse files
README.md ADDED
@@ -0,0 +1,53 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ ---
2
+ license: mit
3
+ tags:
4
+ - generated_from_keras_callback
5
+ model-index:
6
+ - name: HuggingAlex1247/distilbert-base-german-europeana-cased-germeval_14
7
+ results: []
8
+ ---
9
+
10
+ <!-- This model card has been generated automatically according to the information Keras had access to. You should
11
+ probably proofread and complete it, then remove this comment. -->
12
+
13
+ # HuggingAlex1247/distilbert-base-german-europeana-cased-germeval_14
14
+
15
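+ This model is a fine-tuned version of [dbmdz/distilbert-base-german-europeana-cased](https://huggingface.co/dbmdz/distilbert-base-german-europeana-cased) on an unknown dataset (the repository name suggests GermEval 2014; this was not recorded by the training callback and should be confirmed).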
16
+ It achieves the following results on the training and evaluation sets:
17
+ - Train Loss: 0.3609
18
+ - Validation Loss: 0.2115
19
+ - Epoch: 0
20
+
21
+ ## Model description
22
+
23
+ More information needed
24
+
25
+ ## Intended uses & limitations
26
+
27
+ More information needed
28
+
29
+ ## Training and evaluation data
30
+
31
+ More information needed
32
+
33
+ ## Training procedure
34
+
35
+ ### Training hyperparameters
36
+
37
+ The following hyperparameters were used during training:
38
+ - optimizer: {'name': 'AdamWeightDecay', 'learning_rate': {'class_name': 'PolynomialDecay', 'config': {'initial_learning_rate': 1e-05, 'decay_steps': 25500, 'end_learning_rate': 0.0, 'power': 1.0, 'cycle': False, 'name': None}}, 'decay': 0.0, 'beta_1': 0.9, 'beta_2': 0.999, 'epsilon': 1e-08, 'amsgrad': False, 'weight_decay_rate': 0.01}
39
+ - training_precision: float32
40
+
41
+ ### Training results
42
+
43
+ | Train Loss | Validation Loss | Epoch |
44
+ |:----------:|:---------------:|:-----:|
45
+ | 0.3609 | 0.2115 | 0 |
46
+
47
+
48
+ ### Framework versions
49
+
50
+ - Transformers 4.17.0
51
+ - TensorFlow 2.6.2
52
+ - Datasets 1.18.0
53
+ - Tokenizers 0.11.6
config.json ADDED
@@ -0,0 +1,77 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "_name_or_path": "dbmdz/distilbert-base-german-europeana-cased",
3
+ "activation": "gelu",
4
+ "architectures": [
5
+ "DistilBertForTokenClassification"
6
+ ],
7
+ "attention_dropout": 0.1,
8
+ "dim": 768,
9
+ "dropout": 0.1,
10
+ "hidden_dim": 3072,
11
+ "id2label": {
12
+ "0": "O",
13
+ "1": "B-LOC",
14
+ "10": "I-ORGderiv",
15
+ "11": "B-ORGpart",
16
+ "12": "I-ORGpart",
17
+ "13": "B-OTH",
18
+ "14": "I-OTH",
19
+ "15": "B-OTHderiv",
20
+ "16": "I-OTHderiv",
21
+ "17": "B-OTHpart",
22
+ "18": "I-OTHpart",
23
+ "19": "B-PER",
24
+ "2": "I-LOC",
25
+ "20": "I-PER",
26
+ "21": "B-PERderiv",
27
+ "22": "I-PERderiv",
28
+ "23": "B-PERpart",
29
+ "24": "I-PERpart",
30
+ "3": "B-LOCderiv",
31
+ "4": "I-LOCderiv",
32
+ "5": "B-LOCpart",
33
+ "6": "I-LOCpart",
34
+ "7": "B-ORG",
35
+ "8": "I-ORG",
36
+ "9": "B-ORGderiv"
37
+ },
38
+ "initializer_range": 0.02,
39
+ "label2id": {
40
+ "B-LOC": "1",
41
+ "B-LOCderiv": "3",
42
+ "B-LOCpart": "5",
43
+ "B-ORG": "7",
44
+ "B-ORGderiv": "9",
45
+ "B-ORGpart": "11",
46
+ "B-OTH": "13",
47
+ "B-OTHderiv": "15",
48
+ "B-OTHpart": "17",
49
+ "B-PER": "19",
50
+ "B-PERderiv": "21",
51
+ "B-PERpart": "23",
52
+ "I-LOC": "2",
53
+ "I-LOCderiv": "4",
54
+ "I-LOCpart": "6",
55
+ "I-ORG": "8",
56
+ "I-ORGderiv": "10",
57
+ "I-ORGpart": "12",
58
+ "I-OTH": "14",
59
+ "I-OTHderiv": "16",
60
+ "I-OTHpart": "18",
61
+ "I-PER": "20",
62
+ "I-PERderiv": "22",
63
+ "I-PERpart": "24",
64
+ "O": "0"
65
+ },
66
+ "max_position_embeddings": 512,
67
+ "model_type": "distilbert",
68
+ "n_heads": 12,
69
+ "n_layers": 6,
70
+ "pad_token_id": 0,
71
+ "qa_dropout": 0.1,
72
+ "seq_classif_dropout": 0.2,
73
+ "sinusoidal_pos_embds": true,
74
+ "tie_weights_": true,
75
+ "transformers_version": "4.17.0",
76
+ "vocab_size": 32000
77
+ }
logs/train/events.out.tfevents.1646753432.8e22313e678f.72.0.v2 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:97712164d2476a40fc8b5fa9e265d3a736cc9482d8fc9b23d7322eac53126fb7
3
+ size 1625167
logs/train/events.out.tfevents.1646753440.8e22313e678f.profile-empty ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f6894201e96aa87d5e0a87cd1ba8d187c6d3f679e73f32c6e8f4e87d0627219b
3
+ size 40
logs/train/plugins/profile/2022_03_08_15_30_40/8e22313e678f.input_pipeline.pb ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2b5924ddf019cb07b3ba36da97f1926cd679d05a8a77fe99289c204586d83c01
3
+ size 3053
logs/train/plugins/profile/2022_03_08_15_30_40/8e22313e678f.kernel_stats.pb ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c18da93c72a0b20f88870ec77de96cc8c4770cbedba9bf2c711f6e558ff9396e
3
+ size 315610
logs/train/plugins/profile/2022_03_08_15_30_40/8e22313e678f.memory_profile.json.gz ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:dd71fffe4f3a877c9fd574eb626d13dab159ca31b150638b2775653926943678
3
+ size 34606
logs/train/plugins/profile/2022_03_08_15_30_40/8e22313e678f.overview_page.pb ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c020a1a9c10fb40e7ee7c8f43db12bc876dd73f320e8dec008fe55aaee2de4c4
3
+ size 5435
logs/train/plugins/profile/2022_03_08_15_30_40/8e22313e678f.tensorflow_stats.pb ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8891ccd68abc93b5ef96cb64acd197981b789824bf78e794f1c1a0e561f9bdb4
3
+ size 188411
logs/train/plugins/profile/2022_03_08_15_30_40/8e22313e678f.trace.json.gz ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:84dfcb862f25e4150ea098eb4a995192e974a7c117a5fa845b41cb4a7efbc412
3
+ size 159061
logs/train/plugins/profile/2022_03_08_15_30_40/8e22313e678f.xplane.pb ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:758e3da1a753b8e5c7978006f294455e0811f0cd5aaff1d704ea290b22ca6d78
3
+ size 1258846
logs/validation/events.out.tfevents.1646753560.8e22313e678f.72.1.v2 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:85e2155c92c02e22ca374413f92d6cf36cf3e6cf90e8bd8461737f9042c07bfe
3
+ size 194
special_tokens_map.json ADDED
@@ -0,0 +1 @@
 
 
1
+ {"unk_token": "[UNK]", "sep_token": "[SEP]", "pad_token": "[PAD]", "cls_token": "[CLS]", "mask_token": "[MASK]"}
tf_model.h5 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6082a62557711eea2d80322f781d23b7e852f023a12d0d63f744da07a613b3a7
3
+ size 270195104
tokenizer.json ADDED
The diff for this file is too large to render. See raw diff
 
tokenizer_config.json ADDED
@@ -0,0 +1 @@
 
 
1
+ {"do_lower_case": false, "unk_token": "[UNK]", "sep_token": "[SEP]", "pad_token": "[PAD]", "cls_token": "[CLS]", "mask_token": "[MASK]", "tokenize_chinese_chars": true, "strip_accents": false, "max_len": 512, "special_tokens_map_file": null, "name_or_path": "dbmdz/distilbert-base-german-europeana-cased", "do_basic_tokenize": true, "never_split": null, "tokenizer_class": "DistilBertTokenizer"}
vocab.txt ADDED
The diff for this file is too large to render. See raw diff