# File size: 986 Bytes
# c30b454

# Model-merge configuration: the entries under `models` are combined with
# `merge_method: dare_ties`, using deepseek-ai/deepseek-math-7b-rl as
# `base_model`.
# NOTE(review): the key names look like a mergekit config — confirm against
# the tool that actually consumes this file.
models:
  # Same model as `base_model` below; deliberately listed without a
  # `parameters` block.
  - model: deepseek-ai/deepseek-math-7b-rl
    # No parameters necessary for base model
  # The two entries below are the only ones that name a model other than
  # `base_model`; their weights sum to 0.4.
  - model: deepseek-ai/deepseek-math-7b-instruct
    parameters:
      density: 0.66
      weight: 0.2
  - model: deepseek-ai/deepseek-math-7b-base
    parameters:
      density: 0.57
      weight: 0.2
  # NOTE(review): the six entries below all repeat the `base_model` itself.
  # They differ only in `density` (0.54, 0.61, 0.65, then 0.55 three times)
  # and each carries weight 0.1. If the merge method operates on differences
  # from the base model, these would presumably contribute nothing — confirm
  # whether other checkpoints were intended here.
  # All listed weights together sum to 1.0 (0.2 + 0.2 + 6 * 0.1).
  - model: deepseek-ai/deepseek-math-7b-rl
    parameters:
      density: 0.54
      weight: 0.1
  - model: deepseek-ai/deepseek-math-7b-rl
    parameters:
      density: 0.61
      weight: 0.1
  - model: deepseek-ai/deepseek-math-7b-rl
    parameters:
      density: 0.65
      weight: 0.1
  - model: deepseek-ai/deepseek-math-7b-rl
    parameters:
      density: 0.55
      weight: 0.1
  - model: deepseek-ai/deepseek-math-7b-rl
    parameters:
      density: 0.55
      weight: 0.1
  - model: deepseek-ai/deepseek-math-7b-rl
    parameters:
      density: 0.55
      weight: 0.1
# Top-level merge settings that apply to the whole `models` list above.
merge_method: dare_ties
base_model: deepseek-ai/deepseek-math-7b-rl
dtype: bfloat16
# NOTE(review): `experts_per_token` reads like a mixture-of-experts setting;
# it is unclear whether a `dare_ties` merge uses it — confirm or remove.
experts_per_token: 3