dsmueller commited on
Commit
694a287
1 Parent(s): 5d09bfd

Update project parameters in train_llm.py

Browse files
Files changed (1) hide show
  1. train_llm.py +10 -3
train_llm.py CHANGED
@@ -31,7 +31,7 @@ dataset['validation'].to_pandas().to_csv(validation_filename, columns=['text'],
31
  # Define project parameters
32
  username='ai-aerospace'
33
  project_name='./llms/'+'ams_data_train-100_'+str(uuid4())
34
- repo_name='ams_data_train-100_'+str(uuid4())
35
 
36
  # model_name='TinyLlama/TinyLlama-1.1B-Chat-v0.1'
37
  model_name='mistralai/Mistral-7B-v0.1'
@@ -42,16 +42,23 @@ os.environ["model_name"] = model_name
42
  os.environ["repo_id"] = username+'/'+repo_name
43
  os.environ["train_data"] = train_data
44
  os.environ["validation_data"] = validation_data
 
 
 
 
 
 
 
 
45
 
46
  # Set .venv and execute the autotrain script
47
  # To see all parameters: autotrain llm --help
48
  # !autotrain llm --train --project_name my-llm --model TinyLlama/TinyLlama-1.1B-Chat-v0.1 --data_path . --use-peft --use_int4 --learning_rate 2e-4 --train_batch_size 6 --num_train_epochs 3 --trainer sft
49
- # The training dataset to be used must be called training.csv and be located in the data_path folder.
50
  command="""
51
  autotrain llm --train \
52
  --project_name ${project_name} \
53
  --model ${model_name} \
54
- --data_path ../fine_tune_data \
55
  --train_split ${train_data} \
56
  --valid_split ${validation_data} \
57
  --use-peft \
 
31
  # Define project parameters
32
  username='ai-aerospace'
33
  project_name='./llms/'+'ams_data_train-100_'+str(uuid4())
34
+ repo_name='ams-data-train-100-'+str(uuid4())
35
 
36
  # model_name='TinyLlama/TinyLlama-1.1B-Chat-v0.1'
37
  model_name='mistralai/Mistral-7B-v0.1'
 
42
  os.environ["repo_id"] = username+'/'+repo_name
43
  os.environ["train_data"] = train_data
44
  os.environ["validation_data"] = validation_data
45
+ os.environ["data_directory"] = data_directory
46
+
47
+ print("project_name:", project_name)
48
+ print("model_name:", model_name)
49
+ print("repo_id:", username+'/'+repo_name)
50
+ print("train_data:", train_data)
51
+ print("validation_data:", validation_data)
52
+ print("data_directory:", data_directory)
53
 
54
  # Set .venv and execute the autotrain script
55
  # To see all parameters: autotrain llm --help
56
  # !autotrain llm --train --project_name my-llm --model TinyLlama/TinyLlama-1.1B-Chat-v0.1 --data_path . --use-peft --use_int4 --learning_rate 2e-4 --train_batch_size 6 --num_train_epochs 3 --trainer sft
 
57
  command="""
58
  autotrain llm --train \
59
  --project_name ${project_name} \
60
  --model ${model_name} \
61
+ --data_path ${data_directory} \
62
  --train_split ${train_data} \
63
  --valid_split ${validation_data} \
64
  --use-peft \