Training in progress, step 10
Browse files- 24_10_23_config_test_5.csv +1 -1
- 24_10_23_results_real.csv +2 -1
- README.md +13 -0
- adapter_model.bin +1 -1
- adapter_model.safetensors +1 -1
- training_args.bin +1 -1
24_10_23_config_test_5.csv
CHANGED
@@ -5,7 +5,7 @@ run_number,comment,peformed_already,num_train_epochs,max_tokens,temperature,stop
|
|
5 |
4,temperature set 0.1,True,2,100,0.1,False
|
6 |
5,temperature set 0.5,True,2,100,0.5,False
|
7 |
6,temperature set 0.95,True,2,100,0.95,False
|
8 |
-
7,max_tokens set 10,
|
9 |
8,max_tokens set 30,False,2,30,0.8,False
|
10 |
9,max_tokens set 300,False,2,300,0.8,False
|
11 |
10,max_tokens set 500,False,2,500,0.8,False
|
|
|
5 |
4,temperature set 0.1,True,2,100,0.1,False
|
6 |
5,temperature set 0.5,True,2,100,0.5,False
|
7 |
6,temperature set 0.95,True,2,100,0.95,False
|
8 |
+
7,max_tokens set 10,True,2,10,0.8,False
|
9 |
8,max_tokens set 30,False,2,30,0.8,False
|
10 |
9,max_tokens set 300,False,2,300,0.8,False
|
11 |
10,max_tokens set 500,False,2,500,0.8,False
|
24_10_23_results_real.csv
CHANGED
@@ -7,4 +7,5 @@ run_number,items_per_minute,changed_settings,total_time_taken,rouge_scores_unnes
|
|
7 |
6,1527.832714984196,temperature set 0.1,17.279378652572632,0,0.1976528832961626,0.2467135274850016,0.2058575375878128,0.2409779467117316,0.2882065660284059,0.2442224680649742,0.2898388010112335,0.3293633439583997,0.286402550490794,0.0718838497030716,0.0803139894900771,0.0722726446083685,0.0995882205581848,0.1065136908080851,0.0965880380354894,0.1279108884546315,0.136023948720788,0.1229532335611118
|
8 |
7,1520.1783121784651,temperature set 0.5,17.36638379096985,0,0.2171684144819638,0.2796526632931748,0.229555721072754,0.2657758702124259,0.325561701915657,0.2741816672483476,0.3124402945667981,0.3742653583799557,0.3180416119348384,0.084309129128651,0.0950885066931036,0.0841922348430965,0.1097482578115943,0.1216660656915193,0.1094137741028614,0.1394859462287843,0.1521687324132882,0.1369193067464648
|
9 |
8,1522.6253025648766,temperature set 0.95,17.33847451210022,0,0.1358318375162381,0.2367233918316699,0.1608590624915817,0.1684281758375314,0.2753995807236896,0.1957692397202891,0.2017753107078927,0.3158922152664998,0.231842660328347,0.0348253941650094,0.053243827263793,0.0397742520737331,0.0504060301453853,0.0741161939034151,0.0569579405303325,0.0665651758039863,0.0972012308295898,0.0754698873782298
|
10 |
-
9,
|
|
|
|
7 |
6,1527.832714984196,temperature set 0.1,17.279378652572632,0,0.1976528832961626,0.2467135274850016,0.2058575375878128,0.2409779467117316,0.2882065660284059,0.2442224680649742,0.2898388010112335,0.3293633439583997,0.286402550490794,0.0718838497030716,0.0803139894900771,0.0722726446083685,0.0995882205581848,0.1065136908080851,0.0965880380354894,0.1279108884546315,0.136023948720788,0.1229532335611118
|
8 |
7,1520.1783121784651,temperature set 0.5,17.36638379096985,0,0.2171684144819638,0.2796526632931748,0.229555721072754,0.2657758702124259,0.325561701915657,0.2741816672483476,0.3124402945667981,0.3742653583799557,0.3180416119348384,0.084309129128651,0.0950885066931036,0.0841922348430965,0.1097482578115943,0.1216660656915193,0.1094137741028614,0.1394859462287843,0.1521687324132882,0.1369193067464648
|
9 |
8,1522.6253025648766,temperature set 0.95,17.33847451210022,0,0.1358318375162381,0.2367233918316699,0.1608590624915817,0.1684281758375314,0.2753995807236896,0.1957692397202891,0.2017753107078927,0.3158922152664998,0.231842660328347,0.0348253941650094,0.053243827263793,0.0397742520737331,0.0504060301453853,0.0741161939034151,0.0569579405303325,0.0665651758039863,0.0972012308295898,0.0754698873782298
|
10 |
+
9,8137.253778897434,max_tokens set 10,3.244337797164917,0,0.1297367298173749,0.0248065965409596,0.0394931695780917,0.1776028332479944,0.0319881335779764,0.0503325526395891,0.2305753968253968,0.0398045284176508,0.0623919220801066,0.021505376344086,0.0012679576629888,0.0022182435535744,0.0615292712066905,0.003434056688616,0.0059725196216856,0.1129256272401433,0.0066200549176752,0.0109573554493896
|
11 |
+
10,0.0,0,0.0,0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0
|
README.md
CHANGED
@@ -520,6 +520,18 @@ The following `bitsandbytes` quantization config was used during training:
|
|
520 |
- bnb_4bit_use_double_quant: True
|
521 |
- bnb_4bit_compute_dtype: bfloat16
|
522 |
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
523 |
The following `bitsandbytes` quantization config was used during training:
|
524 |
- quant_method: bitsandbytes
|
525 |
- load_in_8bit: False
|
@@ -576,5 +588,6 @@ The following `bitsandbytes` quantization config was used during training:
|
|
576 |
- PEFT 0.5.0
|
577 |
- PEFT 0.5.0
|
578 |
- PEFT 0.5.0
|
|
|
579 |
|
580 |
- PEFT 0.5.0
|
|
|
520 |
- bnb_4bit_use_double_quant: True
|
521 |
- bnb_4bit_compute_dtype: bfloat16
|
522 |
|
523 |
+
The following `bitsandbytes` quantization config was used during training:
|
524 |
+
- quant_method: bitsandbytes
|
525 |
+
- load_in_8bit: False
|
526 |
+
- load_in_4bit: True
|
527 |
+
- llm_int8_threshold: 6.0
|
528 |
+
- llm_int8_skip_modules: None
|
529 |
+
- llm_int8_enable_fp32_cpu_offload: False
|
530 |
+
- llm_int8_has_fp16_weight: False
|
531 |
+
- bnb_4bit_quant_type: nf4
|
532 |
+
- bnb_4bit_use_double_quant: True
|
533 |
+
- bnb_4bit_compute_dtype: bfloat16
|
534 |
+
|
535 |
The following `bitsandbytes` quantization config was used during training:
|
536 |
- quant_method: bitsandbytes
|
537 |
- load_in_8bit: False
|
|
|
588 |
- PEFT 0.5.0
|
589 |
- PEFT 0.5.0
|
590 |
- PEFT 0.5.0
|
591 |
+
- PEFT 0.5.0
|
592 |
|
593 |
- PEFT 0.5.0
|
adapter_model.bin
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 100733709
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c44debca9618a139fcec0e472329d7f2c0db2cc0811545c51152b147b6804d3b
|
3 |
size 100733709
|
adapter_model.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 100690288
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:cc124817399e701f648910c5eca91fccdc40719c08befb3a5359627e5ef35ffc
|
3 |
size 100690288
|
training_args.bin
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 4283
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:1bf83eeceb5ce1c413aa4e6fb54e48dd54db58e34101ffdcb4940d2f2fc81b67
|
3 |
size 4283
|