Spaces:
Runtime error
Runtime error
Update project parameters in train_llm.py
Browse files- train_llm.py +10 -3
train_llm.py
CHANGED
@@ -31,7 +31,7 @@ dataset['validation'].to_pandas().to_csv(validation_filename, columns=['text'],
|
|
31 |
# Define project parameters
|
32 |
username='ai-aerospace'
|
33 |
project_name='./llms/'+'ams_data_train-100_'+str(uuid4())
|
34 |
-
repo_name='
|
35 |
|
36 |
# model_name='TinyLlama/TinyLlama-1.1B-Chat-v0.1'
|
37 |
model_name='mistralai/Mistral-7B-v0.1'
|
@@ -42,16 +42,23 @@ os.environ["model_name"] = model_name
|
|
42 |
os.environ["repo_id"] = username+'/'+repo_name
|
43 |
os.environ["train_data"] = train_data
|
44 |
os.environ["validation_data"] = validation_data
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
45 |
|
46 |
# Set .venv and execute the autotrain script
|
47 |
# To see all parameters: autotrain llm --help
|
48 |
# !autotrain llm --train --project_name my-llm --model TinyLlama/TinyLlama-1.1B-Chat-v0.1 --data_path . --use-peft --use_int4 --learning_rate 2e-4 --train_batch_size 6 --num_train_epochs 3 --trainer sft
|
49 |
-
# The training dataset to be used must be called training.csv and be located in the data_path folder.
|
50 |
command="""
|
51 |
autotrain llm --train \
|
52 |
--project_name ${project_name} \
|
53 |
--model ${model_name} \
|
54 |
-
--data_path
|
55 |
--train_split ${train_data} \
|
56 |
--valid_split ${validation_data} \
|
57 |
--use-peft \
|
|
|
31 |
# Define project parameters
|
32 |
username='ai-aerospace'
|
33 |
project_name='./llms/'+'ams_data_train-100_'+str(uuid4())
|
34 |
+
repo_name='ams-data-train-100-'+str(uuid4())
|
35 |
|
36 |
# model_name='TinyLlama/TinyLlama-1.1B-Chat-v0.1'
|
37 |
model_name='mistralai/Mistral-7B-v0.1'
|
|
|
42 |
os.environ["repo_id"] = username+'/'+repo_name
|
43 |
os.environ["train_data"] = train_data
|
44 |
os.environ["validation_data"] = validation_data
|
45 |
+
os.environ["data_directory"] = data_directory
|
46 |
+
|
47 |
+
print("project_name:", project_name)
|
48 |
+
print("model_name:", model_name)
|
49 |
+
print("repo_id:", username+'/'+repo_name)
|
50 |
+
print("train_data:", train_data)
|
51 |
+
print("validation_data:", validation_data)
|
52 |
+
print("data_directory:", data_directory)
|
53 |
|
54 |
# Set .venv and execute the autotrain script
|
55 |
# To see all parameters: autotrain llm --help
|
56 |
# !autotrain llm --train --project_name my-llm --model TinyLlama/TinyLlama-1.1B-Chat-v0.1 --data_path . --use-peft --use_int4 --learning_rate 2e-4 --train_batch_size 6 --num_train_epochs 3 --trainer sft
|
|
|
57 |
command="""
|
58 |
autotrain llm --train \
|
59 |
--project_name ${project_name} \
|
60 |
--model ${model_name} \
|
61 |
+
--data_path ${data_directory} \
|
62 |
--train_split ${train_data} \
|
63 |
--valid_split ${validation_data} \
|
64 |
--use-peft \
|