learn3r committed on
Commit
e58e5db
1 Parent(s): 5aa0561

End of training

Browse files
Files changed (5) hide show
  1. README.md +20 -8
  2. all_results.json +13 -13
  3. eval_results.json +9 -9
  4. train_results.json +4 -4
  5. trainer_state.json +0 -0
README.md CHANGED
@@ -3,11 +3,23 @@ license: apache-2.0
3
  base_model: facebook/bart-large
4
  tags:
5
  - generated_from_trainer
 
 
6
  metrics:
7
  - rouge
8
  model-index:
9
  - name: bart_large_gov
10
- results: []
 
 
 
 
 
 
 
 
 
 
11
  ---
12
 
13
  <!-- This model card has been generated automatically according to the information the Trainer had access to. You
@@ -15,14 +27,14 @@ should probably proofread and complete it, then remove this comment. -->
15
 
16
  # bart_large_gov
17
 
18
- This model is a fine-tuned version of [facebook/bart-large](https://huggingface.co/facebook/bart-large) on an unknown dataset.
19
  It achieves the following results on the evaluation set:
20
- - Loss: 1.4351
21
- - Rouge1: 72.0397
22
- - Rouge2: 40.9431
23
- - Rougel: 38.4161
24
- - Rougelsum: 69.5028
25
- - Gen Len: 744.4588
26
 
27
  ## Model description
28
 
 
3
  base_model: facebook/bart-large
4
  tags:
5
  - generated_from_trainer
6
+ datasets:
7
+ - learn3r/gov_report_memsum_oracle
8
  metrics:
9
  - rouge
10
  model-index:
11
  - name: bart_large_gov
12
+ results:
13
+ - task:
14
+ name: Summarization
15
+ type: summarization
16
+ dataset:
17
+ name: learn3r/gov_report_memsum_oracle
18
+ type: learn3r/gov_report_memsum_oracle
19
+ metrics:
20
+ - name: Rouge1
21
+ type: rouge
22
+ value: 71.9948
23
  ---
24
 
25
  <!-- This model card has been generated automatically according to the information the Trainer had access to. You
 
27
 
28
  # bart_large_gov
29
 
30
+ This model is a fine-tuned version of [facebook/bart-large](https://huggingface.co/facebook/bart-large) on the learn3r/gov_report_memsum_oracle dataset.
31
  It achieves the following results on the evaluation set:
32
+ - Loss: 1.4266
33
+ - Rouge1: 71.9948
34
+ - Rouge2: 41.0084
35
+ - Rougel: 38.0938
36
+ - Rougelsum: 69.4488
37
+ - Gen Len: 751.0288
38
 
39
  ## Model description
40
 
all_results.json CHANGED
@@ -1,18 +1,18 @@
1
  {
2
  "epoch": 19.94,
3
- "eval_gen_len": 128.50617283950618,
4
- "eval_loss": 1.445023536682129,
5
- "eval_rouge1": 56.2783,
6
- "eval_rouge2": 31.1387,
7
- "eval_rougeL": 39.2121,
8
- "eval_rougeLsum": 51.8068,
9
- "eval_runtime": 214.343,
10
  "eval_samples": 972,
11
- "eval_samples_per_second": 4.535,
12
- "eval_steps_per_second": 0.569,
13
- "train_loss": 1.0796797680504182,
14
- "train_runtime": 51892.12,
15
  "train_samples": 17457,
16
- "train_samples_per_second": 6.728,
17
- "train_steps_per_second": 0.052
18
  }
 
1
  {
2
  "epoch": 19.94,
3
+ "eval_gen_len": 751.0288065843621,
4
+ "eval_loss": 1.4266291856765747,
5
+ "eval_rouge1": 71.9948,
6
+ "eval_rouge2": 41.0084,
7
+ "eval_rougeL": 38.0938,
8
+ "eval_rougeLsum": 69.4488,
9
+ "eval_runtime": 1649.8925,
10
  "eval_samples": 972,
11
+ "eval_samples_per_second": 0.589,
12
+ "eval_steps_per_second": 0.074,
13
+ "train_loss": 1.4114765528370352,
14
+ "train_runtime": 122523.8715,
15
  "train_samples": 17457,
16
+ "train_samples_per_second": 2.85,
17
+ "train_steps_per_second": 0.022
18
  }
eval_results.json CHANGED
@@ -1,13 +1,13 @@
1
  {
2
  "epoch": 19.94,
3
- "eval_gen_len": 128.50617283950618,
4
- "eval_loss": 1.445023536682129,
5
- "eval_rouge1": 56.2783,
6
- "eval_rouge2": 31.1387,
7
- "eval_rougeL": 39.2121,
8
- "eval_rougeLsum": 51.8068,
9
- "eval_runtime": 214.343,
10
  "eval_samples": 972,
11
- "eval_samples_per_second": 4.535,
12
- "eval_steps_per_second": 0.569
13
  }
 
1
  {
2
  "epoch": 19.94,
3
+ "eval_gen_len": 751.0288065843621,
4
+ "eval_loss": 1.4266291856765747,
5
+ "eval_rouge1": 71.9948,
6
+ "eval_rouge2": 41.0084,
7
+ "eval_rougeL": 38.0938,
8
+ "eval_rougeLsum": 69.4488,
9
+ "eval_runtime": 1649.8925,
10
  "eval_samples": 972,
11
+ "eval_samples_per_second": 0.589,
12
+ "eval_steps_per_second": 0.074
13
  }
train_results.json CHANGED
@@ -1,8 +1,8 @@
1
  {
2
  "epoch": 19.94,
3
- "train_loss": 1.0796797680504182,
4
- "train_runtime": 51892.12,
5
  "train_samples": 17457,
6
- "train_samples_per_second": 6.728,
7
- "train_steps_per_second": 0.052
8
  }
 
1
  {
2
  "epoch": 19.94,
3
+ "train_loss": 1.4114765528370352,
4
+ "train_runtime": 122523.8715,
5
  "train_samples": 17457,
6
+ "train_samples_per_second": 2.85,
7
+ "train_steps_per_second": 0.022
8
  }
trainer_state.json CHANGED
The diff for this file is too large to render. See raw diff