Ramendra committed on
Commit
d1ca1af
1 Parent(s): 7163f80

End of training

Browse files
README.md CHANGED
@@ -1,9 +1,9 @@
1
  ---
2
- base_model: Ramendra/dialogue_Summary
 
3
  tags:
4
  - generated_from_trainer
5
- datasets:
6
- - samsum
7
  model-index:
8
  - name: dialogue_Summary_peft
9
  results: []
@@ -14,9 +14,9 @@ should probably proofread and complete it, then remove this comment. -->
14
 
15
  # dialogue_Summary_peft
16
 
17
- This model is a fine-tuned version of [Ramendra/dialogue_Summary](https://huggingface.co/Ramendra/dialogue_Summary) on the samsum dataset.
18
  It achieves the following results on the evaluation set:
19
- - Loss: 0.1359
20
 
21
  ## Model description
22
 
@@ -47,16 +47,17 @@ The following hyperparameters were used during training:
47
 
48
  | Training Loss | Epoch | Step | Validation Loss |
49
  |:-------------:|:-----:|:----:|:---------------:|
50
- | 0.0704 | 1.0 | 74 | 0.1357 |
51
- | 0.0861 | 2.0 | 148 | 0.1358 |
52
- | 0.0637 | 3.0 | 222 | 0.1358 |
53
- | 0.0757 | 4.0 | 296 | 0.1358 |
54
- | 0.0793 | 5.0 | 370 | 0.1359 |
55
 
56
 
57
  ### Framework versions
58
 
59
- - Transformers 4.34.0
60
- - Pytorch 2.0.1+cu118
61
- - Datasets 2.14.5
62
- - Tokenizers 0.14.1
 
 
1
  ---
2
+ license: mit
3
+ library_name: peft
4
  tags:
5
  - generated_from_trainer
6
+ base_model: Ramendra/dialogue_Summary
 
7
  model-index:
8
  - name: dialogue_Summary_peft
9
  results: []
 
14
 
15
  # dialogue_Summary_peft
16
 
17
+ This model is a fine-tuned version of [Ramendra/dialogue_Summary](https://huggingface.co/Ramendra/dialogue_Summary) on an unknown dataset.
18
  It achieves the following results on the evaluation set:
19
+ - Loss: 0.1336
20
 
21
  ## Model description
22
 
 
47
 
48
  | Training Loss | Epoch | Step | Validation Loss |
49
  |:-------------:|:-----:|:----:|:---------------:|
50
+ | 0.1076 | 1.0 | 74 | 0.1337 |
51
+ | 0.0898 | 2.0 | 148 | 0.1336 |
52
+ | 0.0923 | 3.0 | 222 | 0.1336 |
53
+ | 0.0965 | 4.0 | 296 | 0.1335 |
54
+ | 0.1012 | 5.0 | 370 | 0.1336 |
55
 
56
 
57
  ### Framework versions
58
 
59
+ - PEFT 0.9.0
60
+ - Transformers 4.38.1
61
+ - Pytorch 2.1.0+cu121
62
+ - Datasets 2.18.0
63
+ - Tokenizers 0.15.2
adapter_config.json CHANGED
@@ -1,4 +1,5 @@
1
  {
 
2
  "auto_mapping": null,
3
  "base_model_name_or_path": "Ramendra/dialogue_Summary",
4
  "bias": "none",
@@ -7,15 +8,21 @@
7
  "init_lora_weights": true,
8
  "layers_pattern": null,
9
  "layers_to_transform": null,
 
10
  "lora_alpha": 32,
11
  "lora_dropout": 0.05,
 
 
12
  "modules_to_save": null,
13
  "peft_type": "LORA",
14
  "r": 32,
 
15
  "revision": null,
16
  "target_modules": [
17
- "q_proj",
18
- "v_proj"
19
  ],
20
- "task_type": "SEQ_2_SEQ_LM"
 
 
21
  }
 
1
  {
2
+ "alpha_pattern": {},
3
  "auto_mapping": null,
4
  "base_model_name_or_path": "Ramendra/dialogue_Summary",
5
  "bias": "none",
 
8
  "init_lora_weights": true,
9
  "layers_pattern": null,
10
  "layers_to_transform": null,
11
+ "loftq_config": {},
12
  "lora_alpha": 32,
13
  "lora_dropout": 0.05,
14
+ "megatron_config": null,
15
+ "megatron_core": "megatron.core",
16
  "modules_to_save": null,
17
  "peft_type": "LORA",
18
  "r": 32,
19
+ "rank_pattern": {},
20
  "revision": null,
21
  "target_modules": [
22
+ "v_proj",
23
+ "q_proj"
24
  ],
25
+ "task_type": "SEQ_2_SEQ_LM",
26
+ "use_dora": false,
27
+ "use_rslora": false
28
  }
adapter_model.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5a4b3f5f856345572f664b986c8ce8b7036f02a33ae3c0e1b5a3522e005fc62c
3
+ size 18894856
runs/Mar02_01-34-15_ddf363e378bf/events.out.tfevents.1709343266.ddf363e378bf.701.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6763687313bfc94243e58f0150e6953646c5f18df69ca1db8bb983541b6da168
3
+ size 26099
training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:a8f5b6edc6777a2a5f5db441dfbb98e0071aab6522108e674dd659f3c844493d
3
- size 4091
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e4ce98a4ab0615e8d538e73e16ca1e72f2e4e4508eb4812c33ca0c9b648282dd
3
+ size 4920