ryefoxlime committed on
Commit
e0e167f
1 Parent(s): 3301578

Model Finetune Params and dependencies

Browse files
Files changed (3) hide show
  1. Gemma2_2B/hyperparams.yaml +4 -4
  2. pyproject.toml +3 -1
  3. uv.lock +0 -0
Gemma2_2B/hyperparams.yaml CHANGED
@@ -1,7 +1,7 @@
1
  model_name: "google/gemma-2-2b-it"
2
  new_model_name: "gemma-2-2b-ft"
3
 
4
- lora_r: 4
5
  lora_alpha: 16
6
  lora_dropout: 0.1
7
 
@@ -11,7 +11,7 @@ bnb_4bit_quant_type: "nf4"
11
  use_nested_quant: False
12
 
13
  output_dir: "./results"
14
- num_train_epochs: 1
15
  fp16: False
16
  bf16: False
17
  per_device_train_batch_size: 2
@@ -19,7 +19,7 @@ per_device_eval_batch_size: 2
19
  gradient_accumulation_steps: 1
20
  gradient_checkpointing: True
21
  max_grad_norm: 0.3
22
- learning_rate: 2e-4
23
  weight_decay: 0.001
24
  optimizer: "paged_adamw_32bit"
25
  lr_scheduler_type: "constant"
@@ -29,6 +29,6 @@ group_by_length: True
29
  save_steps: 25
30
  logging_steps: 25
31
 
32
- max_seq_length: 40
33
  packing: True
34
  device_map: "auto"
 
1
  model_name: "google/gemma-2-2b-it"
2
  new_model_name: "gemma-2-2b-ft"
3
 
4
+ lora_r: 64
5
  lora_alpha: 16
6
  lora_dropout: 0.1
7
 
 
11
  use_nested_quant: False
12
 
13
  output_dir: "./results"
14
+ num_train_epochs: 2
15
  fp16: False
16
  bf16: False
17
  per_device_train_batch_size: 2
 
19
  gradient_accumulation_steps: 1
20
  gradient_checkpointing: True
21
  max_grad_norm: 0.3
22
+ learning_rate: 2e-3
23
  weight_decay: 0.001
24
  optimizer: "paged_adamw_32bit"
25
  lr_scheduler_type: "constant"
 
29
  save_steps: 25
30
  logging_steps: 25
31
 
32
+ max_seq_length: 128
33
  packing: True
34
  device_map: "auto"
pyproject.toml CHANGED
@@ -1,5 +1,5 @@
1
  [project]
2
- name = "learninguv"
3
  version = "0.1.0"
4
  description = "Add your description here"
5
  readme = "README.md"
@@ -26,6 +26,8 @@ dependencies = [
26
  "ipykernel>=6.29.5",
27
  "ipywidgets>=8.1.5",
28
  "pyyaml>=6.0.2",
 
 
29
  ]
30
 
31
  [tool.uv.sources]
 
1
  [project]
2
+ name = "TADBot"
3
  version = "0.1.0"
4
  description = "Add your description here"
5
  readme = "README.md"
 
26
  "ipykernel>=6.29.5",
27
  "ipywidgets>=8.1.5",
28
  "pyyaml>=6.0.2",
29
+ "torch-tb-profiler>=0.4.3",
30
+ "tensorflow>=2.18.0",
31
  ]
32
 
33
  [tool.uv.sources]
uv.lock CHANGED
The diff for this file is too large to render. See raw diff