TeeZee committed on
Commit
735bdaa
1 Parent(s): ec95227

Upload merge-config.yml

Browse files
Files changed (1) hide show
  1. merge-config.yml +142 -0
merge-config.yml ADDED
@@ -0,0 +1,142 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+
2
+ # Either "cpu" or "cuda"
3
+ # NOTE: CUDA requires enough VRAM to load 3 FP16 models (~45 GB for Mistral)
4
+ # NOTE 2: The (much slower) CPU mode still requires CUDA capability, but only enough VRAM to load a model once (~15 GB for Mistral).
5
+ device: "cpu"
6
+ random_seed: 42 # Random seed to use
7
+
8
+ directories:
9
+ model_path1: "../jondurbin_bagel-dpo-34b-v0.2" # Path to the base model. Must be a local copy.
10
+ # model_directory: "../2xNous-Capybara-34B/" # Directory of models to scan, IGNORED if models_to_merge has entries in it
11
+ output_directory: "./mm-output" # Output directory of the merged model
12
+
13
+ # A list of models to use as merge candidates - HF syntax, so can be either local directories or repos.
14
+ # Overrides model_directory if used
15
+ models_to_merge: ["../NousResearch_Nous-Capybara-34B", "../NousResearch_Nous-Hermes-2-Yi-34B", "../SUSTech_SUS-Chat-34B"]
16
+
17
+ # Merge ratios used for testing each layer's potential for improvement - Huge impact on total running time
18
+ merge_ratios: [0.2, 0.4, 0.6, 0.8]
19
+
20
+ # Choose from the following methods. Defaults to "lerp".
21
+ # "lerp" - Linear interpolation
22
+ # "slerp" - Spherical linear interpolation
23
+ # "slice" - Highly experimental. The tensor weights shift from one model to another. [Model 1 > 10% blend > Model 2]
24
+ # "cyclic" - Highly experimental. Ignores merge ratios as these are predefined. [Model 1 > 10% blend > 10% Model 2 > 10% blend > Model 1]
25
+ merge_method: "slerp"
26
+
27
+ # If set to true, the lm_head and embed_token tensors (located outside the layers) will also be optimized
28
+ # Models that have a different vocab size from model1 will skip this phase automatically as it tends to cause model stability issues
29
+ merge_headers: true
30
+
31
+ # Strategies:
32
+ # "cumulative" - Default strategy. If there's a chance of reducing the combined probability, accept the merge.
33
+ # "all_phrases" - Only accept the merge if all phrases show an improvement. (Warning: This rarely happens)
34
+ # "quantitive" - Ignores probabilities completely. Only looks at how many phrases show an improvement, as defined by the threshold below.
35
+ strategy: "cumulative"
36
+ # Threshold is currently only used by the "quantitive" strategy. If 0.6, at least 60% of the phrases must show an improvement.
37
+ strategy_threshold: 0.6
38
+
39
+ # Whether or not to automatically balance the weights so all phrases are of equal importance to the "cumulative" strategy.
40
+ # The weight value of phrases is ignored if set to true.
41
+ auto_weights: false
42
+
43
+ # Phrase = What to measure, weight = multiplication factor, contexts = preceding contexts (the text that comes before the phrase)
44
+ bad_phrases:
45
+ - phrase: "anticipation"
46
+ weight: 12
47
+ contexts: ["Her body quivers with ", "The atmosphere is thick with "]
48
+ - phrase: "unwavering"
49
+ weight: 12
50
+ contexts: ["Filled with an "]
51
+ - phrase: "determination"
52
+ weight: 12
53
+ contexts: ["Her eyes were filled with ", "Her stubbornness only fuels my "]
54
+ - phrase: "whisper"
55
+ weight: 12
56
+ contexts: ["Her voice barely above a "]
57
+ - phrase: "spine"
58
+ weight: 12
59
+ contexts: ["shivers down her "]
60
+ - phrase: "sends shivers"
61
+ weight: 12
62
+ contexts: ["The thrill of the act "]
63
+ - phrase: "ministrations"
64
+ weight: 12
65
+ contexts: ["She moans and twitches at your "]
66
+ - phrase: "legs"
67
+ weight: 12
68
+ contexts: ["wraps her "]
69
+ - phrase: "imposing figure"
70
+ weight: 12
71
+ contexts: ["He had an "]
72
+ - phrase: "shared challenges"
73
+ weight: 12
74
+ contexts: ["Their bond strengthened through "]
75
+ - phrase: "bond"
76
+ weight: 12
77
+ contexts: ["forged a ", "an unspoken "]
78
+ - phrase: "enhance our experience"
79
+ weight: 12
80
+ contexts: ["I'm excited to see how "]
81
+ - phrase: "sense of vulnerability"
82
+ weight: 12
83
+ contexts: ["create a "]
84
+ - phrase: "dimensions of intimacy"
85
+ weight: 12
86
+ contexts: ["explore new "]
87
+ - phrase: "deepening our connection"
88
+ weight: 12
89
+ contexts: ["while "]
90
+ - phrase: "shared experiences"
91
+ weight: 12
92
+ contexts: ["through "]
93
+ - phrase: "societal expectations"
94
+ weight: 12
95
+ contexts: ["that transcend "]
96
+ - phrase: "conventional boundaries"
97
+ weight: 12
98
+ contexts: ["that defy ", "and defy "]
99
+ - phrase: "open communication"
100
+ weight: 12
101
+ contexts: ["an environment "]
102
+ - phrase: "emotional vulnerability"
103
+ weight: 12
104
+ contexts: ["an environment "]
105
+ - phrase: "heightens our connection"
106
+ weight: 12
107
+ contexts: ["touch and the anticipation "]
108
+ - phrase: "sensations you're creating"
109
+ weight: 12
110
+ contexts: ["I'm enjoying "]
111
+ - phrase: "is truly arousing"
112
+ weight: 12
113
+ contexts: ["attention to detail ", "way you explore my body "]
114
+ - phrase: "challenge presented"
115
+ weight: 12
116
+ contexts: ["my resolve unwavering despite "]
117
+ - phrase: "humble vessel"
118
+ weight: 12
119
+ contexts: ["surrendering to the exquisite torment "]
120
+ - phrase: "bond"
121
+ weight: 12
122
+ contexts: ["cherishing the unique ", "special "]
123
+ - phrase: "grows stronger with each passing day"
124
+ weight: 12
125
+ contexts: ["bond "]
126
+ - phrase: "that cannot be broken by time or circumstance"
127
+ weight: 12
128
+ contexts: ["bond "]
129
+ - phrase: "becomes unbreakable, eternal"
130
+ weight: 12
131
+ contexts: ["bond "]
132
+ - phrase: "grew stronger with each passing"
133
+ weight: 12
134
+ contexts: ["bond "]
135
+
136
+
137
+ # Note - Example of a complex phrase
138
+ good_phrases:
139
+ - phrase: "The apple is in the bedroom"
140
+ weight: 1
141
+ contexts: ["Question: If I'm in the living room and pick up the apple, go to the bedroom and drop the apple, then walk to the kitchen, where is the apple? Explain your reasoning. Answer: "]
142
+