Update README.md
Browse files
README.md
CHANGED
@@ -51,7 +51,7 @@ For the MNTP Adapter, please refer to [this link](https://huggingface.co/uzabase
|
|
51 |
|
52 |
# Training Details
|
53 |
|
54 |
-
|
55 |
|
56 |
- Make a corpus for SimCSE from [Wikipedia](https://huggingface.co/datasets/wikimedia/wikipedia)
|
57 |
- Script for making SimCSE Corpus
|
@@ -94,7 +94,7 @@ if __name__ == "__main__":
|
|
94 |
|
95 |
|
96 |
|
97 |
-
|
98 |
- simcse_dropout: 0.3
|
99 |
- bidirectional: true
|
100 |
- pooling_mode: "mean"
|
@@ -112,7 +112,7 @@ if __name__ == "__main__":
|
|
112 |
- gradient_checkpointing: true
|
113 |
|
114 |
|
115 |
-
|
116 |
- deepspeed_config:
|
117 |
- gradient_accumulation_steps: 1
|
118 |
- gradient_clipping: 1.0
|
@@ -138,7 +138,7 @@ if __name__ == "__main__":
|
|
138 |
- use_cpu: false
|
139 |
|
140 |
|
141 |
-
|
142 |
|
143 |
- Python: 3.12.3
|
144 |
- PEFT: 0.11.1
|
|
|
51 |
|
52 |
# Training Details
|
53 |
|
54 |
+
## Training Data
|
55 |
|
56 |
- Make a corpus for SimCSE from [Wikipedia](https://huggingface.co/datasets/wikimedia/wikipedia)
|
57 |
- Script for making SimCSE Corpus
|
|
|
94 |
|
95 |
|
96 |
|
97 |
+
## Training Hyperparameters
|
98 |
- simcse_dropout: 0.3
|
99 |
- bidirectional: true
|
100 |
- pooling_mode: "mean"
|
|
|
112 |
- gradient_checkpointing: true
|
113 |
|
114 |
|
115 |
+
## Accelerator Settings
|
116 |
- deepspeed_config:
|
117 |
- gradient_accumulation_steps: 1
|
118 |
- gradient_clipping: 1.0
|
|
|
138 |
- use_cpu: false
|
139 |
|
140 |
|
141 |
+
## Framework versions
|
142 |
|
143 |
- Python: 3.12.3
|
144 |
- PEFT: 0.11.1
|