akahana committed on
Commit
62d84ca
1 Parent(s): f6d98fe

End of training

Browse files
README.md CHANGED
@@ -1,9 +1,24 @@
1
  ---
2
  tags:
3
  - generated_from_trainer
 
 
 
 
4
  model-index:
5
  - name: tinybert-javanese
6
- results: []
 
 
 
 
 
 
 
 
 
 
 
7
  ---
8
 
9
  <!-- This model card has been generated automatically according to the information the Trainer had access to. You
@@ -11,7 +26,10 @@ should probably proofread and complete it, then remove this comment. -->
11
 
12
  # tinybert-javanese
13
 
14
- This model is a fine-tuned version of [](https://huggingface.co/) on an unknown dataset.
 
 
 
15
 
16
  ## Model description
17
 
 
1
  ---
2
  tags:
3
  - generated_from_trainer
4
+ datasets:
5
+ - akahana/GlotCC-V1-jav-Latn-content-only
6
+ metrics:
7
+ - accuracy
8
  model-index:
9
  - name: tinybert-javanese
10
+ results:
11
+ - task:
12
+ name: Masked Language Modeling
13
+ type: fill-mask
14
+ dataset:
15
+ name: akahana/GlotCC-V1-jav-Latn-content-only default
16
+ type: akahana/GlotCC-V1-jav-Latn-content-only
17
+ args: default
18
+ metrics:
19
+ - name: Accuracy
20
+ type: accuracy
21
+ value: 0.1400072934534502
22
  ---
23
 
24
  <!-- This model card has been generated automatically according to the information the Trainer had access to. You
 
26
 
27
  # tinybert-javanese
28
 
29
+ This model is a fine-tuned version of [an unspecified base model](https://huggingface.co/) on the akahana/GlotCC-V1-jav-Latn-content-only default dataset.
30
+ It achieves the following results on the evaluation set:
31
+ - Loss: 6.2427
32
+ - Accuracy: 0.1400
33
 
34
  ## Model description
35
 
all_results.json CHANGED
@@ -1,16 +1,16 @@
1
  {
2
- "epoch": 50.0,
3
- "eval_accuracy": 0.1519208618470086,
4
- "eval_loss": 5.8251872062683105,
5
- "eval_runtime": 11.1208,
6
  "eval_samples": 3852,
7
- "eval_samples_per_second": 346.376,
8
- "eval_steps_per_second": 86.594,
9
- "perplexity": 338.7245384996336,
10
- "total_flos": 5161725447936000.0,
11
- "train_loss": 6.140905278960581,
12
- "train_runtime": 7883.0646,
13
  "train_samples": 76378,
14
- "train_samples_per_second": 484.444,
15
- "train_steps_per_second": 30.28
16
  }
 
1
  {
2
+ "epoch": 30.0,
3
+ "eval_accuracy": 0.1400072934534502,
4
+ "eval_loss": 6.242714881896973,
5
+ "eval_runtime": 11.5498,
6
  "eval_samples": 3852,
7
+ "eval_samples_per_second": 333.512,
8
+ "eval_steps_per_second": 83.378,
9
+ "perplexity": 514.2527529747575,
10
+ "total_flos": 781486986700800.0,
11
+ "train_loss": 6.528281962779993,
12
+ "train_runtime": 3948.1737,
13
  "train_samples": 76378,
14
+ "train_samples_per_second": 580.354,
15
+ "train_steps_per_second": 18.137
16
  }
eval_results.json CHANGED
@@ -1,10 +1,10 @@
1
  {
2
- "epoch": 50.0,
3
- "eval_accuracy": 0.1519208618470086,
4
- "eval_loss": 5.8251872062683105,
5
- "eval_runtime": 11.1208,
6
  "eval_samples": 3852,
7
- "eval_samples_per_second": 346.376,
8
- "eval_steps_per_second": 86.594,
9
- "perplexity": 338.7245384996336
10
  }
 
1
  {
2
+ "epoch": 30.0,
3
+ "eval_accuracy": 0.1400072934534502,
4
+ "eval_loss": 6.242714881896973,
5
+ "eval_runtime": 11.5498,
6
  "eval_samples": 3852,
7
+ "eval_samples_per_second": 333.512,
8
+ "eval_steps_per_second": 83.378,
9
+ "perplexity": 514.2527529747575
10
  }
runs/Aug03_01-12-12_9eaebf5603b2/events.out.tfevents.1722651590.9eaebf5603b2.1249.1 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:16b7c7d6c246c448a7a4bf8225ad4de66e7796d2e7beeb7940a0279e142deb5d
3
+ size 417
train_results.json CHANGED
@@ -1,9 +1,9 @@
1
  {
2
- "epoch": 50.0,
3
- "total_flos": 5161725447936000.0,
4
- "train_loss": 6.140905278960581,
5
- "train_runtime": 7883.0646,
6
  "train_samples": 76378,
7
- "train_samples_per_second": 484.444,
8
- "train_steps_per_second": 30.28
9
  }
 
1
  {
2
+ "epoch": 30.0,
3
+ "total_flos": 781486986700800.0,
4
+ "train_loss": 6.528281962779993,
5
+ "train_runtime": 3948.1737,
6
  "train_samples": 76378,
7
+ "train_samples_per_second": 580.354,
8
+ "train_steps_per_second": 18.137
9
  }
trainer_state.json CHANGED
The diff for this file is too large to render. See raw diff