Anthonyg5005
committed on
Commit
•
91acde3
1
Parent(s):
a623791
update README.md
Browse files
- README.md +3 -2
- misc/Cat 8B Gen Settings.json +0 -81
- misc/Cat 8b Context.json +0 -12
- misc/Cat 8b Instruct.json +0 -24
README.md
CHANGED
@@ -24,7 +24,7 @@ Feel free to send in PRs or use this code however you'd like. External downloade
|
|
24 |
|
25 |
- [EXL2 Single Quant V3](https://colab.research.google.com/drive/1Vc7d6JU3Z35OVHmtuMuhT830THJnzNfS?usp=sharing) **(COLAB)**
|
26 |
|
27 |
-
## work in progress/not tested
|
28 |
|
29 |
- Seems I've got nothing to work on right now
|
30 |
|
@@ -32,8 +32,9 @@ Feel free to send in PRs or use this code however you'd like. External downloade
|
|
32 |
|
33 |
- [Exllama Discord server](https://discord.gg/NSFwVuCjRq) Free Exl2 quantizing bot sponsored by The Bloke and Lambda Labs, managed by Kaltcit.
|
34 |
- existing quants under the HF account [@blockblockblock](https://huggingface.co/blockblockblock)
|
|
|
35 |
|
36 |
-
- [Download models
|
37 |
|
38 |
## usage
|
39 |
|
|
|
24 |
|
25 |
- [EXL2 Single Quant V3](https://colab.research.google.com/drive/1Vc7d6JU3Z35OVHmtuMuhT830THJnzNfS?usp=sharing) **(COLAB)**
|
26 |
|
27 |
+
## work in progress/not tested
|
28 |
|
29 |
- Seems I've got nothing to work on right now
|
30 |
|
|
|
32 |
|
33 |
- [Exllama Discord server](https://discord.gg/NSFwVuCjRq) Free Exl2 quantizing bot sponsored by The Bloke and Lambda Labs, managed by Kaltcit.
|
34 |
- existing quants under the HF account [@blockblockblock](https://huggingface.co/blockblockblock)
|
35 |
+
- quant website soon
|
36 |
|
37 |
+
- [Download models](https://github.com/oobabooga/text-generation-webui/blob/main/download-model.py) (download HF Hub models) [Oobabooga]
|
38 |
|
39 |
## usage
|
40 |
|
misc/Cat 8B Gen Settings.json
DELETED
@@ -1,81 +0,0 @@
|
|
1 |
-
{
|
2 |
-
"temp": 0.6,
|
3 |
-
"temperature_last": true,
|
4 |
-
"top_p": 0.95,
|
5 |
-
"top_k": 0,
|
6 |
-
"top_a": 0,
|
7 |
-
"tfs": 1,
|
8 |
-
"epsilon_cutoff": 0,
|
9 |
-
"eta_cutoff": 0,
|
10 |
-
"typical_p": 1,
|
11 |
-
"min_p": 0.1,
|
12 |
-
"rep_pen": 1.1,
|
13 |
-
"rep_pen_range": 512,
|
14 |
-
"no_repeat_ngram_size": 0,
|
15 |
-
"penalty_alpha": 0,
|
16 |
-
"num_beams": 1,
|
17 |
-
"length_penalty": 1,
|
18 |
-
"min_length": 0,
|
19 |
-
"encoder_rep_pen": 1,
|
20 |
-
"freq_pen": 0,
|
21 |
-
"presence_pen": 0,
|
22 |
-
"do_sample": true,
|
23 |
-
"early_stopping": false,
|
24 |
-
"dynatemp": true,
|
25 |
-
"min_temp": 0.6,
|
26 |
-
"max_temp": 0.9,
|
27 |
-
"dynatemp_exponent": 1,
|
28 |
-
"smoothing_factor": 0,
|
29 |
-
"smoothing_curve": 1,
|
30 |
-
"add_bos_token": true,
|
31 |
-
"truncation_length": 2048,
|
32 |
-
"ban_eos_token": false,
|
33 |
-
"skip_special_tokens": false,
|
34 |
-
"streaming": true,
|
35 |
-
"mirostat_mode": 0,
|
36 |
-
"mirostat_tau": 5,
|
37 |
-
"mirostat_eta": 0.1,
|
38 |
-
"guidance_scale": 1,
|
39 |
-
"negative_prompt": "",
|
40 |
-
"grammar_string": "",
|
41 |
-
"json_schema": {},
|
42 |
-
"banned_tokens": "",
|
43 |
-
"sampler_priority": [
|
44 |
-
"temperature",
|
45 |
-
"dynamic_temperature",
|
46 |
-
"quadratic_sampling",
|
47 |
-
"top_k",
|
48 |
-
"top_p",
|
49 |
-
"typical_p",
|
50 |
-
"epsilon_cutoff",
|
51 |
-
"eta_cutoff",
|
52 |
-
"tfs",
|
53 |
-
"top_a",
|
54 |
-
"min_p",
|
55 |
-
"mirostat"
|
56 |
-
],
|
57 |
-
"samplers": [
|
58 |
-
"top_k",
|
59 |
-
"tfs_z",
|
60 |
-
"typical_p",
|
61 |
-
"top_p",
|
62 |
-
"min_p",
|
63 |
-
"temperature"
|
64 |
-
],
|
65 |
-
"ignore_eos_token_aphrodite": false,
|
66 |
-
"spaces_between_special_tokens_aphrodite": true,
|
67 |
-
"sampler_order": [
|
68 |
-
6,
|
69 |
-
0,
|
70 |
-
1,
|
71 |
-
2,
|
72 |
-
3,
|
73 |
-
4,
|
74 |
-
5
|
75 |
-
],
|
76 |
-
"logit_bias": [],
|
77 |
-
"n": 1,
|
78 |
-
"rep_pen_size": 0,
|
79 |
-
"genamt": 256,
|
80 |
-
"max_length": 8192
|
81 |
-
}
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
misc/Cat 8b Context.json
DELETED
@@ -1,12 +0,0 @@
|
|
1 |
-
{
|
2 |
-
"story_string": "<|start_header_id|>system<|end_header_id|>\n\n{{#if system}}{{system}}\n{{/if}}{{#if wiBefore}}{{wiBefore}}\n{{/if}}{{#if description}}{{description}}\n{{/if}}{{#if personality}}{{char}}'s personality: {{personality}}\n{{/if}}{{#if scenario}}Scenario: {{scenario}}\n{{/if}}{{#if wiAfter}}{{wiAfter}}\n{{/if}}{{#if persona}}{{persona}}\n{{/if}}{{trim}}<|eot_id|>",
|
3 |
-
"example_separator": "",
|
4 |
-
"chat_start": "",
|
5 |
-
"use_stop_strings": false,
|
6 |
-
"allow_jailbreak": false,
|
7 |
-
"always_force_name2": true,
|
8 |
-
"trim_sentences": false,
|
9 |
-
"include_newline": false,
|
10 |
-
"single_line": false,
|
11 |
-
"name": "Cat 8b"
|
12 |
-
}
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
misc/Cat 8b Instruct.json
DELETED
@@ -1,24 +0,0 @@
|
|
1 |
-
{
|
2 |
-
"system_prompt": "This is a fictional roleplay chat between {{user}} and {{char}}. The characters keep their response concise.",
|
3 |
-
"input_sequence": "<|start_header_id|>user<|end_header_id|>\n\n",
|
4 |
-
"output_sequence": "<|start_header_id|>assistant<|end_header_id|>\n\n",
|
5 |
-
"first_output_sequence": "",
|
6 |
-
"last_output_sequence": "",
|
7 |
-
"system_sequence_prefix": "",
|
8 |
-
"system_sequence_suffix": "",
|
9 |
-
"stop_sequence": "</s>",
|
10 |
-
"wrap": false,
|
11 |
-
"macro": true,
|
12 |
-
"names": true,
|
13 |
-
"names_force_groups": true,
|
14 |
-
"activation_regex": "",
|
15 |
-
"skip_examples": false,
|
16 |
-
"output_suffix": "<|eot_id|>",
|
17 |
-
"input_suffix": "<|eot_id|>",
|
18 |
-
"system_sequence": "<|start_header_id|>system<|end_header_id|>\n\n",
|
19 |
-
"system_suffix": "<|eot_id|>",
|
20 |
-
"user_alignment_message": "",
|
21 |
-
"last_system_sequence": "",
|
22 |
-
"system_same_as_user": true,
|
23 |
-
"name": "Cat 8b"
|
24 |
-
}
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|