Nekochu committed on
Commit
c3b326b
1 Parent(s): eedce5b

Add dataset_info

Browse files
Files changed (1) hide show
  1. README.md +81 -2
README.md CHANGED
@@ -25,7 +25,7 @@ set CUDA_VISIBLE_DEVICES=0 && llamafactory-cli train --stage sft --do_train True
25
 
26
  Stage B: Continued, `orpo`
27
  ```
28
- set CUDA_VISIBLE_DEVICES=0 && llamafactory-cli train --stage dpo --do_train True --model_name_or_path meta-llama/Meta-Llama-3.1-8B-Instruct --preprocessing_num_workers 1 --finetuning_type lora --template alpaca --rope_scaling linear --flash_attn fa2 --dataset_dir data --dataset orca_dpo_de --cutoff_len 4000 --learning_rate 5e-05 --num_train_epochs 1.0 --max_samples 100000 --per_device_train_batch_size 1 --gradient_accumulation_steps 1 --lr_scheduler_type cosine --max_grad_norm 1.0 --logging_steps 10 --save_steps 1000 --warmup_steps 0 --neftune_noise_alpha 5 --optim adamw_8bit --packing True --report_to none --output_dir saves\LLaMA3.1-8B-Chat\lora\Llama-3.1-8B-German-ORPO --bf16 True --plot_loss True --ddp_timeout 180000000 --include_num_input_tokens_seen True --quantization_bit 4 --quantization_method bitsandbytes --lora_rank 32 --lora_alpha 64 --lora_dropout 0.35 --lora_target all --pref_beta 0.1 --pref_ftx 0 --pref_loss orpo --adapter_name_or_path saves\LLaMA3.1-8B-Chat\lora\Llama-3.1-8B-German
29
  ```
30
 
31
 
@@ -34,7 +34,86 @@ set CUDA_VISIBLE_DEVICES=0 && llamafactory-cli train --stage dpo --do_train True
34
 
35
  `dataset_info.json`:
36
  ```json
37
- ...
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
38
  ```
39
  </details>
40
 
 
25
 
26
  Stage B: Continued, `orpo`
27
  ```
28
+ set CUDA_VISIBLE_DEVICES=0 && llamafactory-cli train --stage dpo --do_train True --model_name_or_path meta-llama/Meta-Llama-3.1-8B-Instruct --preprocessing_num_workers 1 --finetuning_type lora --template alpaca --rope_scaling linear --flash_attn fa2 --dataset_dir data --dataset fix_orca_dpo_de --cutoff_len 4000 --learning_rate 5e-05 --num_train_epochs 1.0 --max_samples 100000 --per_device_train_batch_size 1 --gradient_accumulation_steps 1 --lr_scheduler_type cosine --max_grad_norm 1.0 --logging_steps 10 --save_steps 1000 --warmup_steps 0 --neftune_noise_alpha 5 --optim adamw_8bit --packing True --report_to none --output_dir saves\LLaMA3.1-8B-Chat\lora\Llama-3.1-8B-German-ORPO --bf16 True --plot_loss True --ddp_timeout 180000000 --include_num_input_tokens_seen True --quantization_bit 4 --quantization_method bitsandbytes --lora_rank 32 --lora_alpha 64 --lora_dropout 0.35 --lora_target all --pref_beta 0.1 --pref_ftx 0 --pref_loss orpo --adapter_name_or_path saves\LLaMA3.1-8B-Chat\lora\Llama-3.1-8B-German
29
  ```
30
 
31
 
 
34
 
35
  `dataset_info.json`:
36
  ```json
37
+ { "oasst_de": {
38
+ "hf_hub_url": "mayflowergmbh/oasst_de"
39
+ },
40
+ "dolly_15k_de": {
41
+ "hf_hub_url": "mayflowergmbh/dolly-15k_de"
42
+ },
43
+ "alpaca-gpt4_de": {
44
+ "hf_hub_url": "mayflowergmbh/alpaca-gpt4_de"
45
+ },
46
+ "openschnabeltier_de": {
47
+ "hf_hub_url": "mayflowergmbh/openschnabeltier_de"
48
+ },
49
+ "evol_instruct_de": {
50
+ "hf_hub_url": "mayflowergmbh/evol-instruct_de"
51
+ },
52
+ "dolphin_de": {
53
+ "hf_hub_url": "mayflowergmbh/dolphin_de"
54
+ },
55
+ "booksum_de": {
56
+ "hf_hub_url": "mayflowergmbh/booksum_de"
57
+ },
58
+ "airoboros_de": {
59
+ "hf_hub_url": "mayflowergmbh/airoboros-3.0_de"
60
+ },
61
+ "ultrachat_de": {
62
+ "hf_hub_url": "mayflowergmbh/ultra-chat_de"
63
+ },
64
+ "German_Songs": {
65
+ "file_name": "German_Songs.json",
66
+ "file_sha1": "3ec36066a19debd1b138020b293e05f21264c352",
67
+ "columns": {
68
+ "prompt": "prompt",
69
+ "query": "analysis_prompt",
70
+ "response": "song",
71
+ "history": "analysis",
72
+ "system": "topic"
73
+ }
74
+ },
75
+ "German_Poems": {
76
+ "file_name": "German_Poems.json",
77
+ "file_sha1": "f0f4bbea3b8cbc378afb640f4ff4dcd11132263c",
78
+ "columns": {
79
+ "prompt": "prompt",
80
+ "query": "topic",
81
+ "response": "poem"
82
+ }
83
+ },
84
+ "bjoernp_ultrachat_de": {
85
+ "file_name": "ultrachat_de.json",
86
+ "file_sha1": "4e2b6dba1c387b3fa439c33ab35281403c39e973",
87
+ "formatting": "sharegpt",
88
+ "columns": {
89
+ "messages": "conversations"
90
+ },
91
+ "tags": {
92
+ "role_tag": "from",
93
+ "content_tag": "value",
94
+ "user_tag": "human",
95
+ "assistant_tag": "gpt",
96
+ "system_tag": "system"
97
+ }
98
+ },
99
+ "OpenSchnabeltier": {
100
+ "file_name": "OpenSchnabeltier.json",
101
+ "columns": {
102
+ "prompt": "instruction_de",
103
+ "response": "output_de"
104
+ }
105
+ },
106
+ "fix_orca_dpo_de": {
107
+ "file_name": "fix_intel_orca_dpo_pairs_de.json",
108
+ "ranking": true,
109
+ "columns": {
110
+ "prompt": "instruction",
111
+ "query": "input",
112
+ "chosen": "chosen",
113
+ "rejected": "rejected"
114
+ }
115
+ }
116
+ }
117
  ```
118
  </details>
119