aleksejalex committed on
Commit
964839a
1 Parent(s): 9d49a19

End of training

Browse files
README.md CHANGED
@@ -1,13 +1,11 @@
1
  ---
2
- license: cc
3
  base_model: gpt2
4
  tags:
5
  - generated_from_trainer
6
  model-index:
7
  - name: ErbenGPT
8
  results: []
9
- language:
10
- - cs
11
  ---
12
 
13
  <!-- This model card has been generated automatically according to the information the Trainer had access to. You
@@ -40,7 +38,7 @@ The following hyperparameters were used during training:
40
  - seed: 42
41
  - optimizer: Adam with betas=(0.9,0.999) and epsilon=1e-08
42
  - lr_scheduler_type: linear
43
- - num_epochs: 28
44
 
45
  ### Training results
46
 
@@ -51,4 +49,4 @@ The following hyperparameters were used during training:
51
  - Transformers 4.35.2
52
  - Pytorch 2.1.0+cu118
53
  - Datasets 2.15.0
54
- - Tokenizers 0.15.0
 
1
  ---
2
+ license: mit
3
  base_model: gpt2
4
  tags:
5
  - generated_from_trainer
6
  model-index:
7
  - name: ErbenGPT
8
  results: []
 
 
9
  ---
10
 
11
  <!-- This model card has been generated automatically according to the information the Trainer had access to. You
 
38
  - seed: 42
39
  - optimizer: Adam with betas=(0.9,0.999) and epsilon=1e-08
40
  - lr_scheduler_type: linear
41
+ - num_epochs: 48
42
 
43
  ### Training results
44
 
 
49
  - Transformers 4.35.2
50
  - Pytorch 2.1.0+cu118
51
  - Datasets 2.15.0
52
+ - Tokenizers 0.15.0
config.json CHANGED
@@ -29,7 +29,7 @@
29
  "task_specific_params": {
30
  "text-generation": {
31
  "do_sample": true,
32
- "max_length": 150
33
  }
34
  },
35
  "torch_dtype": "float32",
 
29
  "task_specific_params": {
30
  "text-generation": {
31
  "do_sample": true,
32
+ "max_length": 50
33
  }
34
  },
35
  "torch_dtype": "float32",
model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:b3c533070f65e93dc2095e710b298ff7d7a196958dfb833da1ae14459e4e87da
3
  size 497774208
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1dac9852bcd10728824d1c376b070ac218cde6ec27e45f99fddd237c35a0213a
3
  size 497774208
runs/Dec05_22-26-49_855f7098f0b7/events.out.tfevents.1701815218.855f7098f0b7.317.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b13282cfda25be30699123805c45b92b314698f468e8e9354cd5540ecb726b7d
3
+ size 4948
training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:45887cd1943422b8caee9434e042316be93128ff8c345d25502bab1592401ba1
3
  size 4600
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ad2b823d6843f5d1c809eac45bc0cd60e829ca58ffb4718e0e9cf89be8448ac7
3
  size 4600