mjcarleb committed on
Commit
aee9715
1 Parent(s): 9bd2aca

Upload model

Browse files
Files changed (3) hide show
  1. README.md +36 -0
  2. adapter_config.json +2 -2
  3. adapter_model.bin +1 -1
README.md CHANGED
@@ -234,4 +234,40 @@ The following `bitsandbytes` quantization config was used during training:
234
  ### Framework versions
235
 
236
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
237
  - PEFT 0.6.2
 
234
  ### Framework versions
235
 
236
 
237
+ - PEFT 0.6.2
238
+ ## Training procedure
239
+
240
+
241
+ The following `bitsandbytes` quantization config was used during training:
242
+ - load_in_8bit: False
243
+ - load_in_4bit: True
244
+ - llm_int8_threshold: 6.0
245
+ - llm_int8_skip_modules: None
246
+ - llm_int8_enable_fp32_cpu_offload: False
247
+ - llm_int8_has_fp16_weight: False
248
+ - bnb_4bit_quant_type: nf4
249
+ - bnb_4bit_use_double_quant: True
250
+ - bnb_4bit_compute_dtype: bfloat16
251
+
252
+ ### Framework versions
253
+
254
+
255
+ - PEFT 0.6.2
256
+ ## Training procedure
257
+
258
+
259
+ The following `bitsandbytes` quantization config was used during training:
260
+ - load_in_8bit: False
261
+ - load_in_4bit: True
262
+ - llm_int8_threshold: 6.0
263
+ - llm_int8_skip_modules: None
264
+ - llm_int8_enable_fp32_cpu_offload: False
265
+ - llm_int8_has_fp16_weight: False
266
+ - bnb_4bit_quant_type: nf4
267
+ - bnb_4bit_use_double_quant: True
268
+ - bnb_4bit_compute_dtype: bfloat16
269
+
270
+ ### Framework versions
271
+
272
+
273
  - PEFT 0.6.2
adapter_config.json CHANGED
@@ -16,10 +16,10 @@
16
  "rank_pattern": {},
17
  "revision": null,
18
  "target_modules": [
 
19
  "self_attn.o_proj",
20
  "self_attn.q_proj",
21
- "self_attn.v_proj",
22
- "self_attn.k_proj"
23
  ],
24
  "task_type": "CAUSAL_LM"
25
  }
 
16
  "rank_pattern": {},
17
  "revision": null,
18
  "target_modules": [
19
+ "self_attn.k_proj",
20
  "self_attn.o_proj",
21
  "self_attn.q_proj",
22
+ "self_attn.v_proj"
 
23
  ],
24
  "task_type": "CAUSAL_LM"
25
  }
adapter_model.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:2c81f64c60c4ffdac7a697b7c2d915ad44fc6f85a5cc1e903612d6bbf2e1b4e0
3
  size 33646413
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c4f9a4514856826da46a478f21b28aa81f6cdbd61bcc40feb92ef76f8db06230
3
  size 33646413