Add dataset_info
Browse files
README.md
CHANGED
@@ -25,7 +25,7 @@ set CUDA_VISIBLE_DEVICES=0 && llamafactory-cli train --stage sft --do_train True
|
|
25 |
|
26 |
Stage B: Continued, `orpo`
|
27 |
```
|
28 |
-
set CUDA_VISIBLE_DEVICES=0 && llamafactory-cli train --stage dpo --do_train True --model_name_or_path meta-llama/Meta-Llama-3.1-8B-Instruct --preprocessing_num_workers 1 --finetuning_type lora --template alpaca --rope_scaling linear --flash_attn fa2 --dataset_dir data --dataset
|
29 |
```
|
30 |
|
31 |
|
@@ -34,7 +34,86 @@ set CUDA_VISIBLE_DEVICES=0 && llamafactory-cli train --stage dpo --do_train True
|
|
34 |
|
35 |
`dataset_info.json`:
|
36 |
```json
|
37 |
-
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
38 |
```
|
39 |
</details>
|
40 |
|
|
|
25 |
|
26 |
Stage B: Continued, `orpo`
|
27 |
```
|
28 |
+
set CUDA_VISIBLE_DEVICES=0 && llamafactory-cli train --stage dpo --do_train True --model_name_or_path meta-llama/Meta-Llama-3.1-8B-Instruct --preprocessing_num_workers 1 --finetuning_type lora --template alpaca --rope_scaling linear --flash_attn fa2 --dataset_dir data --dataset fix_orca_dpo_de --cutoff_len 4000 --learning_rate 5e-05 --num_train_epochs 1.0 --max_samples 100000 --per_device_train_batch_size 1 --gradient_accumulation_steps 1 --lr_scheduler_type cosine --max_grad_norm 1.0 --logging_steps 10 --save_steps 1000 --warmup_steps 0 --neftune_noise_alpha 5 --optim adamw_8bit --packing True --report_to none --output_dir saves\LLaMA3.1-8B-Chat\lora\Llama-3.1-8B-German-ORPO --bf16 True --plot_loss True --ddp_timeout 180000000 --include_num_input_tokens_seen True --quantization_bit 4 --quantization_method bitsandbytes --lora_rank 32 --lora_alpha 64 --lora_dropout 0.35 --lora_target all --pref_beta 0.1 --pref_ftx 0 --pref_loss orpo --adapter_name_or_path saves\LLaMA3.1-8B-Chat\lora\Llama-3.1-8B-German
|
29 |
```
|
30 |
|
31 |
|
|
|
34 |
|
35 |
`dataset_info.json`:
|
36 |
```json
|
37 |
+
{
"oasst_de": {
|
38 |
+
"hf_hub_url": "mayflowergmbh/oasst_de"
|
39 |
+
},
|
40 |
+
"dolly_15k_de": {
|
41 |
+
"hf_hub_url": "mayflowergmbh/dolly-15k_de"
|
42 |
+
},
|
43 |
+
"alpaca-gpt4_de": {
|
44 |
+
"hf_hub_url": "mayflowergmbh/alpaca-gpt4_de"
|
45 |
+
},
|
46 |
+
"openschnabeltier_de": {
|
47 |
+
"hf_hub_url": "mayflowergmbh/openschnabeltier_de"
|
48 |
+
},
|
49 |
+
"evol_instruct_de": {
|
50 |
+
"hf_hub_url": "mayflowergmbh/evol-instruct_de"
|
51 |
+
},
|
52 |
+
"dolphin_de": {
|
53 |
+
"hf_hub_url": "mayflowergmbh/dolphin_de"
|
54 |
+
},
|
55 |
+
"booksum_de": {
|
56 |
+
"hf_hub_url": "mayflowergmbh/booksum_de"
|
57 |
+
},
|
58 |
+
"airoboros_de": {
|
59 |
+
"hf_hub_url": "mayflowergmbh/airoboros-3.0_de"
|
60 |
+
},
|
61 |
+
"ultrachat_de": {
|
62 |
+
"hf_hub_url": "mayflowergmbh/ultra-chat_de"
|
63 |
+
},
|
64 |
+
"German_Songs": {
|
65 |
+
"file_name": "German_Songs.json",
|
66 |
+
"file_sha1": "3ec36066a19debd1b138020b293e05f21264c352",
|
67 |
+
"columns": {
|
68 |
+
"prompt": "prompt",
|
69 |
+
"query": "analysis_prompt",
|
70 |
+
"response": "song",
|
71 |
+
"history": "analysis",
|
72 |
+
"system": "topic"
|
73 |
+
}
|
74 |
+
},
|
75 |
+
"German_Poems": {
|
76 |
+
"file_name": "German_Poems.json",
|
77 |
+
"file_sha1": "f0f4bbea3b8cbc378afb640f4ff4dcd11132263c",
|
78 |
+
"columns": {
|
79 |
+
"prompt": "prompt",
|
80 |
+
"query": "topic",
|
81 |
+
"response": "poem"
|
82 |
+
}
|
83 |
+
},
|
84 |
+
"bjoernp_ultrachat_de": {
|
85 |
+
"file_name": "ultrachat_de.json",
|
86 |
+
"file_sha1": "4e2b6dba1c387b3fa439c33ab35281403c39e973",
|
87 |
+
"formatting": "sharegpt",
|
88 |
+
"columns": {
|
89 |
+
"messages": "conversations"
|
90 |
+
},
|
91 |
+
"tags": {
|
92 |
+
"role_tag": "from",
|
93 |
+
"content_tag": "value",
|
94 |
+
"user_tag": "human",
|
95 |
+
"assistant_tag": "gpt",
|
96 |
+
"system_tag": "system"
|
97 |
+
}
|
98 |
+
},
|
99 |
+
"OpenSchnabeltier": {
|
100 |
+
"file_name": "OpenSchnabeltier.json",
|
101 |
+
"columns": {
|
102 |
+
"prompt": "instruction_de",
|
103 |
+
"response": "output_de"
|
104 |
+
}
|
105 |
+
},
|
106 |
+
"fix_orca_dpo_de": {
|
107 |
+
"file_name": "fix_intel_orca_dpo_pairs_de.json",
|
108 |
+
"ranking": true,
|
109 |
+
"columns": {
|
110 |
+
"prompt": "instruction",
|
111 |
+
"query": "input",
|
112 |
+
"chosen": "chosen",
|
113 |
+
"rejected": "rejected"
|
114 |
+
}
|
115 |
+
}
|
116 |
+
}
|
117 |
```
|
118 |
</details>
|
119 |
|