PEFT
code
terryyz committed on
Commit
c2de9d7
1 Parent(s): 5ccc10f

Upload 3 files

Browse files
Files changed (3) hide show
  1. README.md +31 -0
  2. adapter_config.json +17 -0
  3. adapter_model.bin +3 -0
README.md ADDED
@@ -0,0 +1,31 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ ## Training procedure
2
+
3
+
4
+ The following `bitsandbytes` quantization config was used during training:
5
+ - quant_method: bitsandbytes
6
+ - load_in_8bit: True
7
+ - load_in_4bit: False
8
+ - llm_int8_threshold: 6.0
9
+ - llm_int8_skip_modules: None
10
+ - llm_int8_enable_fp32_cpu_offload: False
11
+ - llm_int8_has_fp16_weight: False
12
+ - bnb_4bit_quant_type: fp4
13
+ - bnb_4bit_use_double_quant: False
14
+ - bnb_4bit_compute_dtype: float32
15
+
16
+ The following `bitsandbytes` quantization config was used during training:
17
+ - quant_method: bitsandbytes
18
+ - load_in_8bit: True
19
+ - load_in_4bit: False
20
+ - llm_int8_threshold: 6.0
21
+ - llm_int8_skip_modules: None
22
+ - llm_int8_enable_fp32_cpu_offload: False
23
+ - llm_int8_has_fp16_weight: False
24
+ - bnb_4bit_quant_type: fp4
25
+ - bnb_4bit_use_double_quant: False
26
+ - bnb_4bit_compute_dtype: float32
27
+ ### Framework versions
28
+
29
+ - PEFT 0.6.0.dev0
30
+
31
+ - PEFT 0.6.0.dev0
adapter_config.json ADDED
@@ -0,0 +1,17 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "auto_mapping": null,
3
+ "base_model_name_or_path": "bigcode/starcoderbase-1b",
4
+ "encoder_dropout": 0.0,
5
+ "encoder_hidden_size": 2048,
6
+ "encoder_num_layers": 2,
7
+ "encoder_reparameterization_type": "MLP",
8
+ "inference_mode": true,
9
+ "num_attention_heads": 16,
10
+ "num_layers": 24,
11
+ "num_transformer_submodules": 1,
12
+ "num_virtual_tokens": 30,
13
+ "peft_type": "P_TUNING",
14
+ "revision": null,
15
+ "task_type": "CAUSAL_LM",
16
+ "token_dim": 2048
17
+ }
adapter_model.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7db865b3446e70099b37e0afdf8f4adbf6494d0beb8a8345d27592a3de505531
3
+ size 246525