HF-rwkv-3B-48-2048-ctx16384 / model.safetensors.index.json
something-else's picture
Upload Rwkv5ForCausalLM
2bf1417 verified
raw
history blame
84.7 kB
{
"metadata": {
"total_size": 11548262400
},
"weight_map": {
"head.weight": "model-00006-of-00006.safetensors",
"rwkv.blocks.0.attention.gate.weight": "model-00001-of-00006.safetensors",
"rwkv.blocks.0.attention.key.weight": "model-00001-of-00006.safetensors",
"rwkv.blocks.0.attention.ln_x.bias": "model-00001-of-00006.safetensors",
"rwkv.blocks.0.attention.ln_x.weight": "model-00001-of-00006.safetensors",
"rwkv.blocks.0.attention.output.weight": "model-00001-of-00006.safetensors",
"rwkv.blocks.0.attention.receptance.weight": "model-00001-of-00006.safetensors",
"rwkv.blocks.0.attention.time_decay": "model-00001-of-00006.safetensors",
"rwkv.blocks.0.attention.time_faaaa": "model-00001-of-00006.safetensors",
"rwkv.blocks.0.attention.time_mix_gate": "model-00001-of-00006.safetensors",
"rwkv.blocks.0.attention.time_mix_key": "model-00001-of-00006.safetensors",
"rwkv.blocks.0.attention.time_mix_receptance": "model-00001-of-00006.safetensors",
"rwkv.blocks.0.attention.time_mix_value": "model-00001-of-00006.safetensors",
"rwkv.blocks.0.attention.value.weight": "model-00001-of-00006.safetensors",
"rwkv.blocks.0.feed_forward.key.weight": "model-00001-of-00006.safetensors",
"rwkv.blocks.0.feed_forward.receptance.weight": "model-00001-of-00006.safetensors",
"rwkv.blocks.0.feed_forward.time_mix_key": "model-00001-of-00006.safetensors",
"rwkv.blocks.0.feed_forward.time_mix_receptance": "model-00001-of-00006.safetensors",
"rwkv.blocks.0.feed_forward.value.weight": "model-00001-of-00006.safetensors",
"rwkv.blocks.0.ln1.bias": "model-00001-of-00006.safetensors",
"rwkv.blocks.0.ln1.weight": "model-00001-of-00006.safetensors",
"rwkv.blocks.0.ln2.bias": "model-00001-of-00006.safetensors",
"rwkv.blocks.0.ln2.weight": "model-00001-of-00006.safetensors",
"rwkv.blocks.0.pre_ln.bias": "model-00001-of-00006.safetensors",
"rwkv.blocks.0.pre_ln.weight": "model-00001-of-00006.safetensors",
"rwkv.blocks.1.attention.gate.weight": "model-00001-of-00006.safetensors",
"rwkv.blocks.1.attention.key.weight": "model-00001-of-00006.safetensors",
"rwkv.blocks.1.attention.ln_x.bias": "model-00001-of-00006.safetensors",
"rwkv.blocks.1.attention.ln_x.weight": "model-00001-of-00006.safetensors",
"rwkv.blocks.1.attention.output.weight": "model-00001-of-00006.safetensors",
"rwkv.blocks.1.attention.receptance.weight": "model-00001-of-00006.safetensors",
"rwkv.blocks.1.attention.time_decay": "model-00001-of-00006.safetensors",
"rwkv.blocks.1.attention.time_faaaa": "model-00001-of-00006.safetensors",
"rwkv.blocks.1.attention.time_mix_gate": "model-00001-of-00006.safetensors",
"rwkv.blocks.1.attention.time_mix_key": "model-00001-of-00006.safetensors",
"rwkv.blocks.1.attention.time_mix_receptance": "model-00001-of-00006.safetensors",
"rwkv.blocks.1.attention.time_mix_value": "model-00001-of-00006.safetensors",
"rwkv.blocks.1.attention.value.weight": "model-00001-of-00006.safetensors",
"rwkv.blocks.1.feed_forward.key.weight": "model-00001-of-00006.safetensors",
"rwkv.blocks.1.feed_forward.receptance.weight": "model-00001-of-00006.safetensors",
"rwkv.blocks.1.feed_forward.time_mix_key": "model-00001-of-00006.safetensors",
"rwkv.blocks.1.feed_forward.time_mix_receptance": "model-00001-of-00006.safetensors",
"rwkv.blocks.1.feed_forward.value.weight": "model-00001-of-00006.safetensors",
"rwkv.blocks.1.ln1.bias": "model-00001-of-00006.safetensors",
"rwkv.blocks.1.ln1.weight": "model-00001-of-00006.safetensors",
"rwkv.blocks.1.ln2.bias": "model-00001-of-00006.safetensors",
"rwkv.blocks.1.ln2.weight": "model-00001-of-00006.safetensors",
"rwkv.blocks.10.attention.gate.weight": "model-00002-of-00006.safetensors",
"rwkv.blocks.10.attention.key.weight": "model-00002-of-00006.safetensors",
"rwkv.blocks.10.attention.ln_x.bias": "model-00002-of-00006.safetensors",
"rwkv.blocks.10.attention.ln_x.weight": "model-00002-of-00006.safetensors",
"rwkv.blocks.10.attention.output.weight": "model-00002-of-00006.safetensors",
"rwkv.blocks.10.attention.receptance.weight": "model-00002-of-00006.safetensors",
"rwkv.blocks.10.attention.time_decay": "model-00002-of-00006.safetensors",
"rwkv.blocks.10.attention.time_faaaa": "model-00002-of-00006.safetensors",
"rwkv.blocks.10.attention.time_mix_gate": "model-00002-of-00006.safetensors",
"rwkv.blocks.10.attention.time_mix_key": "model-00002-of-00006.safetensors",
"rwkv.blocks.10.attention.time_mix_receptance": "model-00002-of-00006.safetensors",
"rwkv.blocks.10.attention.time_mix_value": "model-00002-of-00006.safetensors",
"rwkv.blocks.10.attention.value.weight": "model-00002-of-00006.safetensors",
"rwkv.blocks.10.feed_forward.key.weight": "model-00002-of-00006.safetensors",
"rwkv.blocks.10.feed_forward.receptance.weight": "model-00002-of-00006.safetensors",
"rwkv.blocks.10.feed_forward.time_mix_key": "model-00002-of-00006.safetensors",
"rwkv.blocks.10.feed_forward.time_mix_receptance": "model-00002-of-00006.safetensors",
"rwkv.blocks.10.feed_forward.value.weight": "model-00002-of-00006.safetensors",
"rwkv.blocks.10.ln1.bias": "model-00002-of-00006.safetensors",
"rwkv.blocks.10.ln1.weight": "model-00002-of-00006.safetensors",
"rwkv.blocks.10.ln2.bias": "model-00002-of-00006.safetensors",
"rwkv.blocks.10.ln2.weight": "model-00002-of-00006.safetensors",
"rwkv.blocks.11.attention.gate.weight": "model-00002-of-00006.safetensors",
"rwkv.blocks.11.attention.key.weight": "model-00002-of-00006.safetensors",
"rwkv.blocks.11.attention.ln_x.bias": "model-00002-of-00006.safetensors",
"rwkv.blocks.11.attention.ln_x.weight": "model-00002-of-00006.safetensors",
"rwkv.blocks.11.attention.output.weight": "model-00002-of-00006.safetensors",
"rwkv.blocks.11.attention.receptance.weight": "model-00002-of-00006.safetensors",
"rwkv.blocks.11.attention.time_decay": "model-00002-of-00006.safetensors",
"rwkv.blocks.11.attention.time_faaaa": "model-00002-of-00006.safetensors",
"rwkv.blocks.11.attention.time_mix_gate": "model-00002-of-00006.safetensors",
"rwkv.blocks.11.attention.time_mix_key": "model-00002-of-00006.safetensors",
"rwkv.blocks.11.attention.time_mix_receptance": "model-00002-of-00006.safetensors",
"rwkv.blocks.11.attention.time_mix_value": "model-00002-of-00006.safetensors",
"rwkv.blocks.11.attention.value.weight": "model-00002-of-00006.safetensors",
"rwkv.blocks.11.feed_forward.key.weight": "model-00002-of-00006.safetensors",
"rwkv.blocks.11.feed_forward.receptance.weight": "model-00002-of-00006.safetensors",
"rwkv.blocks.11.feed_forward.time_mix_key": "model-00002-of-00006.safetensors",
"rwkv.blocks.11.feed_forward.time_mix_receptance": "model-00002-of-00006.safetensors",
"rwkv.blocks.11.feed_forward.value.weight": "model-00002-of-00006.safetensors",
"rwkv.blocks.11.ln1.bias": "model-00002-of-00006.safetensors",
"rwkv.blocks.11.ln1.weight": "model-00002-of-00006.safetensors",
"rwkv.blocks.11.ln2.bias": "model-00002-of-00006.safetensors",
"rwkv.blocks.11.ln2.weight": "model-00002-of-00006.safetensors",
"rwkv.blocks.12.attention.gate.weight": "model-00002-of-00006.safetensors",
"rwkv.blocks.12.attention.key.weight": "model-00002-of-00006.safetensors",
"rwkv.blocks.12.attention.ln_x.bias": "model-00002-of-00006.safetensors",
"rwkv.blocks.12.attention.ln_x.weight": "model-00002-of-00006.safetensors",
"rwkv.blocks.12.attention.output.weight": "model-00002-of-00006.safetensors",
"rwkv.blocks.12.attention.receptance.weight": "model-00002-of-00006.safetensors",
"rwkv.blocks.12.attention.time_decay": "model-00002-of-00006.safetensors",
"rwkv.blocks.12.attention.time_faaaa": "model-00002-of-00006.safetensors",
"rwkv.blocks.12.attention.time_mix_gate": "model-00002-of-00006.safetensors",
"rwkv.blocks.12.attention.time_mix_key": "model-00002-of-00006.safetensors",
"rwkv.blocks.12.attention.time_mix_receptance": "model-00002-of-00006.safetensors",
"rwkv.blocks.12.attention.time_mix_value": "model-00002-of-00006.safetensors",
"rwkv.blocks.12.attention.value.weight": "model-00002-of-00006.safetensors",
"rwkv.blocks.12.feed_forward.key.weight": "model-00002-of-00006.safetensors",
"rwkv.blocks.12.feed_forward.receptance.weight": "model-00002-of-00006.safetensors",
"rwkv.blocks.12.feed_forward.time_mix_key": "model-00002-of-00006.safetensors",
"rwkv.blocks.12.feed_forward.time_mix_receptance": "model-00002-of-00006.safetensors",
"rwkv.blocks.12.feed_forward.value.weight": "model-00002-of-00006.safetensors",
"rwkv.blocks.12.ln1.bias": "model-00002-of-00006.safetensors",
"rwkv.blocks.12.ln1.weight": "model-00002-of-00006.safetensors",
"rwkv.blocks.12.ln2.bias": "model-00002-of-00006.safetensors",
"rwkv.blocks.12.ln2.weight": "model-00002-of-00006.safetensors",
"rwkv.blocks.13.attention.gate.weight": "model-00002-of-00006.safetensors",
"rwkv.blocks.13.attention.key.weight": "model-00002-of-00006.safetensors",
"rwkv.blocks.13.attention.ln_x.bias": "model-00002-of-00006.safetensors",
"rwkv.blocks.13.attention.ln_x.weight": "model-00002-of-00006.safetensors",
"rwkv.blocks.13.attention.output.weight": "model-00002-of-00006.safetensors",
"rwkv.blocks.13.attention.receptance.weight": "model-00002-of-00006.safetensors",
"rwkv.blocks.13.attention.time_decay": "model-00002-of-00006.safetensors",
"rwkv.blocks.13.attention.time_faaaa": "model-00002-of-00006.safetensors",
"rwkv.blocks.13.attention.time_mix_gate": "model-00002-of-00006.safetensors",
"rwkv.blocks.13.attention.time_mix_key": "model-00002-of-00006.safetensors",
"rwkv.blocks.13.attention.time_mix_receptance": "model-00002-of-00006.safetensors",
"rwkv.blocks.13.attention.time_mix_value": "model-00002-of-00006.safetensors",
"rwkv.blocks.13.attention.value.weight": "model-00002-of-00006.safetensors",
"rwkv.blocks.13.feed_forward.key.weight": "model-00002-of-00006.safetensors",
"rwkv.blocks.13.feed_forward.receptance.weight": "model-00002-of-00006.safetensors",
"rwkv.blocks.13.feed_forward.time_mix_key": "model-00002-of-00006.safetensors",
"rwkv.blocks.13.feed_forward.time_mix_receptance": "model-00002-of-00006.safetensors",
"rwkv.blocks.13.feed_forward.value.weight": "model-00002-of-00006.safetensors",
"rwkv.blocks.13.ln1.bias": "model-00002-of-00006.safetensors",
"rwkv.blocks.13.ln1.weight": "model-00002-of-00006.safetensors",
"rwkv.blocks.13.ln2.bias": "model-00002-of-00006.safetensors",
"rwkv.blocks.13.ln2.weight": "model-00002-of-00006.safetensors",
"rwkv.blocks.14.attention.gate.weight": "model-00002-of-00006.safetensors",
"rwkv.blocks.14.attention.key.weight": "model-00002-of-00006.safetensors",
"rwkv.blocks.14.attention.ln_x.bias": "model-00002-of-00006.safetensors",
"rwkv.blocks.14.attention.ln_x.weight": "model-00002-of-00006.safetensors",
"rwkv.blocks.14.attention.output.weight": "model-00002-of-00006.safetensors",
"rwkv.blocks.14.attention.receptance.weight": "model-00002-of-00006.safetensors",
"rwkv.blocks.14.attention.time_decay": "model-00002-of-00006.safetensors",
"rwkv.blocks.14.attention.time_faaaa": "model-00002-of-00006.safetensors",
"rwkv.blocks.14.attention.time_mix_gate": "model-00002-of-00006.safetensors",
"rwkv.blocks.14.attention.time_mix_key": "model-00002-of-00006.safetensors",
"rwkv.blocks.14.attention.time_mix_receptance": "model-00002-of-00006.safetensors",
"rwkv.blocks.14.attention.time_mix_value": "model-00002-of-00006.safetensors",
"rwkv.blocks.14.attention.value.weight": "model-00002-of-00006.safetensors",
"rwkv.blocks.14.feed_forward.key.weight": "model-00002-of-00006.safetensors",
"rwkv.blocks.14.feed_forward.receptance.weight": "model-00002-of-00006.safetensors",
"rwkv.blocks.14.feed_forward.time_mix_key": "model-00002-of-00006.safetensors",
"rwkv.blocks.14.feed_forward.time_mix_receptance": "model-00002-of-00006.safetensors",
"rwkv.blocks.14.feed_forward.value.weight": "model-00002-of-00006.safetensors",
"rwkv.blocks.14.ln1.bias": "model-00002-of-00006.safetensors",
"rwkv.blocks.14.ln1.weight": "model-00002-of-00006.safetensors",
"rwkv.blocks.14.ln2.bias": "model-00002-of-00006.safetensors",
"rwkv.blocks.14.ln2.weight": "model-00002-of-00006.safetensors",
"rwkv.blocks.15.attention.gate.weight": "model-00002-of-00006.safetensors",
"rwkv.blocks.15.attention.key.weight": "model-00002-of-00006.safetensors",
"rwkv.blocks.15.attention.ln_x.bias": "model-00002-of-00006.safetensors",
"rwkv.blocks.15.attention.ln_x.weight": "model-00002-of-00006.safetensors",
"rwkv.blocks.15.attention.output.weight": "model-00002-of-00006.safetensors",
"rwkv.blocks.15.attention.receptance.weight": "model-00002-of-00006.safetensors",
"rwkv.blocks.15.attention.time_decay": "model-00002-of-00006.safetensors",
"rwkv.blocks.15.attention.time_faaaa": "model-00002-of-00006.safetensors",
"rwkv.blocks.15.attention.time_mix_gate": "model-00002-of-00006.safetensors",
"rwkv.blocks.15.attention.time_mix_key": "model-00002-of-00006.safetensors",
"rwkv.blocks.15.attention.time_mix_receptance": "model-00002-of-00006.safetensors",
"rwkv.blocks.15.attention.time_mix_value": "model-00002-of-00006.safetensors",
"rwkv.blocks.15.attention.value.weight": "model-00002-of-00006.safetensors",
"rwkv.blocks.15.feed_forward.key.weight": "model-00002-of-00006.safetensors",
"rwkv.blocks.15.feed_forward.receptance.weight": "model-00002-of-00006.safetensors",
"rwkv.blocks.15.feed_forward.time_mix_key": "model-00002-of-00006.safetensors",
"rwkv.blocks.15.feed_forward.time_mix_receptance": "model-00002-of-00006.safetensors",
"rwkv.blocks.15.feed_forward.value.weight": "model-00003-of-00006.safetensors",
"rwkv.blocks.15.ln1.bias": "model-00002-of-00006.safetensors",
"rwkv.blocks.15.ln1.weight": "model-00002-of-00006.safetensors",
"rwkv.blocks.15.ln2.bias": "model-00002-of-00006.safetensors",
"rwkv.blocks.15.ln2.weight": "model-00002-of-00006.safetensors",
"rwkv.blocks.16.attention.gate.weight": "model-00003-of-00006.safetensors",
"rwkv.blocks.16.attention.key.weight": "model-00003-of-00006.safetensors",
"rwkv.blocks.16.attention.ln_x.bias": "model-00003-of-00006.safetensors",
"rwkv.blocks.16.attention.ln_x.weight": "model-00003-of-00006.safetensors",
"rwkv.blocks.16.attention.output.weight": "model-00003-of-00006.safetensors",
"rwkv.blocks.16.attention.receptance.weight": "model-00003-of-00006.safetensors",
"rwkv.blocks.16.attention.time_decay": "model-00003-of-00006.safetensors",
"rwkv.blocks.16.attention.time_faaaa": "model-00003-of-00006.safetensors",
"rwkv.blocks.16.attention.time_mix_gate": "model-00003-of-00006.safetensors",
"rwkv.blocks.16.attention.time_mix_key": "model-00003-of-00006.safetensors",
"rwkv.blocks.16.attention.time_mix_receptance": "model-00003-of-00006.safetensors",
"rwkv.blocks.16.attention.time_mix_value": "model-00003-of-00006.safetensors",
"rwkv.blocks.16.attention.value.weight": "model-00003-of-00006.safetensors",
"rwkv.blocks.16.feed_forward.key.weight": "model-00003-of-00006.safetensors",
"rwkv.blocks.16.feed_forward.receptance.weight": "model-00003-of-00006.safetensors",
"rwkv.blocks.16.feed_forward.time_mix_key": "model-00003-of-00006.safetensors",
"rwkv.blocks.16.feed_forward.time_mix_receptance": "model-00003-of-00006.safetensors",
"rwkv.blocks.16.feed_forward.value.weight": "model-00003-of-00006.safetensors",
"rwkv.blocks.16.ln1.bias": "model-00003-of-00006.safetensors",
"rwkv.blocks.16.ln1.weight": "model-00003-of-00006.safetensors",
"rwkv.blocks.16.ln2.bias": "model-00003-of-00006.safetensors",
"rwkv.blocks.16.ln2.weight": "model-00003-of-00006.safetensors",
"rwkv.blocks.17.attention.gate.weight": "model-00003-of-00006.safetensors",
"rwkv.blocks.17.attention.key.weight": "model-00003-of-00006.safetensors",
"rwkv.blocks.17.attention.ln_x.bias": "model-00003-of-00006.safetensors",
"rwkv.blocks.17.attention.ln_x.weight": "model-00003-of-00006.safetensors",
"rwkv.blocks.17.attention.output.weight": "model-00003-of-00006.safetensors",
"rwkv.blocks.17.attention.receptance.weight": "model-00003-of-00006.safetensors",
"rwkv.blocks.17.attention.time_decay": "model-00003-of-00006.safetensors",
"rwkv.blocks.17.attention.time_faaaa": "model-00003-of-00006.safetensors",
"rwkv.blocks.17.attention.time_mix_gate": "model-00003-of-00006.safetensors",
"rwkv.blocks.17.attention.time_mix_key": "model-00003-of-00006.safetensors",
"rwkv.blocks.17.attention.time_mix_receptance": "model-00003-of-00006.safetensors",
"rwkv.blocks.17.attention.time_mix_value": "model-00003-of-00006.safetensors",
"rwkv.blocks.17.attention.value.weight": "model-00003-of-00006.safetensors",
"rwkv.blocks.17.feed_forward.key.weight": "model-00003-of-00006.safetensors",
"rwkv.blocks.17.feed_forward.receptance.weight": "model-00003-of-00006.safetensors",
"rwkv.blocks.17.feed_forward.time_mix_key": "model-00003-of-00006.safetensors",
"rwkv.blocks.17.feed_forward.time_mix_receptance": "model-00003-of-00006.safetensors",
"rwkv.blocks.17.feed_forward.value.weight": "model-00003-of-00006.safetensors",
"rwkv.blocks.17.ln1.bias": "model-00003-of-00006.safetensors",
"rwkv.blocks.17.ln1.weight": "model-00003-of-00006.safetensors",
"rwkv.blocks.17.ln2.bias": "model-00003-of-00006.safetensors",
"rwkv.blocks.17.ln2.weight": "model-00003-of-00006.safetensors",
"rwkv.blocks.18.attention.gate.weight": "model-00003-of-00006.safetensors",
"rwkv.blocks.18.attention.key.weight": "model-00003-of-00006.safetensors",
"rwkv.blocks.18.attention.ln_x.bias": "model-00003-of-00006.safetensors",
"rwkv.blocks.18.attention.ln_x.weight": "model-00003-of-00006.safetensors",
"rwkv.blocks.18.attention.output.weight": "model-00003-of-00006.safetensors",
"rwkv.blocks.18.attention.receptance.weight": "model-00003-of-00006.safetensors",
"rwkv.blocks.18.attention.time_decay": "model-00003-of-00006.safetensors",
"rwkv.blocks.18.attention.time_faaaa": "model-00003-of-00006.safetensors",
"rwkv.blocks.18.attention.time_mix_gate": "model-00003-of-00006.safetensors",
"rwkv.blocks.18.attention.time_mix_key": "model-00003-of-00006.safetensors",
"rwkv.blocks.18.attention.time_mix_receptance": "model-00003-of-00006.safetensors",
"rwkv.blocks.18.attention.time_mix_value": "model-00003-of-00006.safetensors",
"rwkv.blocks.18.attention.value.weight": "model-00003-of-00006.safetensors",
"rwkv.blocks.18.feed_forward.key.weight": "model-00003-of-00006.safetensors",
"rwkv.blocks.18.feed_forward.receptance.weight": "model-00003-of-00006.safetensors",
"rwkv.blocks.18.feed_forward.time_mix_key": "model-00003-of-00006.safetensors",
"rwkv.blocks.18.feed_forward.time_mix_receptance": "model-00003-of-00006.safetensors",
"rwkv.blocks.18.feed_forward.value.weight": "model-00003-of-00006.safetensors",
"rwkv.blocks.18.ln1.bias": "model-00003-of-00006.safetensors",
"rwkv.blocks.18.ln1.weight": "model-00003-of-00006.safetensors",
"rwkv.blocks.18.ln2.bias": "model-00003-of-00006.safetensors",
"rwkv.blocks.18.ln2.weight": "model-00003-of-00006.safetensors",
"rwkv.blocks.19.attention.gate.weight": "model-00003-of-00006.safetensors",
"rwkv.blocks.19.attention.key.weight": "model-00003-of-00006.safetensors",
"rwkv.blocks.19.attention.ln_x.bias": "model-00003-of-00006.safetensors",
"rwkv.blocks.19.attention.ln_x.weight": "model-00003-of-00006.safetensors",
"rwkv.blocks.19.attention.output.weight": "model-00003-of-00006.safetensors",
"rwkv.blocks.19.attention.receptance.weight": "model-00003-of-00006.safetensors",
"rwkv.blocks.19.attention.time_decay": "model-00003-of-00006.safetensors",
"rwkv.blocks.19.attention.time_faaaa": "model-00003-of-00006.safetensors",
"rwkv.blocks.19.attention.time_mix_gate": "model-00003-of-00006.safetensors",
"rwkv.blocks.19.attention.time_mix_key": "model-00003-of-00006.safetensors",
"rwkv.blocks.19.attention.time_mix_receptance": "model-00003-of-00006.safetensors",
"rwkv.blocks.19.attention.time_mix_value": "model-00003-of-00006.safetensors",
"rwkv.blocks.19.attention.value.weight": "model-00003-of-00006.safetensors",
"rwkv.blocks.19.feed_forward.key.weight": "model-00003-of-00006.safetensors",
"rwkv.blocks.19.feed_forward.receptance.weight": "model-00003-of-00006.safetensors",
"rwkv.blocks.19.feed_forward.time_mix_key": "model-00003-of-00006.safetensors",
"rwkv.blocks.19.feed_forward.time_mix_receptance": "model-00003-of-00006.safetensors",
"rwkv.blocks.19.feed_forward.value.weight": "model-00003-of-00006.safetensors",
"rwkv.blocks.19.ln1.bias": "model-00003-of-00006.safetensors",
"rwkv.blocks.19.ln1.weight": "model-00003-of-00006.safetensors",
"rwkv.blocks.19.ln2.bias": "model-00003-of-00006.safetensors",
"rwkv.blocks.19.ln2.weight": "model-00003-of-00006.safetensors",
"rwkv.blocks.2.attention.gate.weight": "model-00001-of-00006.safetensors",
"rwkv.blocks.2.attention.key.weight": "model-00001-of-00006.safetensors",
"rwkv.blocks.2.attention.ln_x.bias": "model-00001-of-00006.safetensors",
"rwkv.blocks.2.attention.ln_x.weight": "model-00001-of-00006.safetensors",
"rwkv.blocks.2.attention.output.weight": "model-00001-of-00006.safetensors",
"rwkv.blocks.2.attention.receptance.weight": "model-00001-of-00006.safetensors",
"rwkv.blocks.2.attention.time_decay": "model-00001-of-00006.safetensors",
"rwkv.blocks.2.attention.time_faaaa": "model-00001-of-00006.safetensors",
"rwkv.blocks.2.attention.time_mix_gate": "model-00001-of-00006.safetensors",
"rwkv.blocks.2.attention.time_mix_key": "model-00001-of-00006.safetensors",
"rwkv.blocks.2.attention.time_mix_receptance": "model-00001-of-00006.safetensors",
"rwkv.blocks.2.attention.time_mix_value": "model-00001-of-00006.safetensors",
"rwkv.blocks.2.attention.value.weight": "model-00001-of-00006.safetensors",
"rwkv.blocks.2.feed_forward.key.weight": "model-00001-of-00006.safetensors",
"rwkv.blocks.2.feed_forward.receptance.weight": "model-00001-of-00006.safetensors",
"rwkv.blocks.2.feed_forward.time_mix_key": "model-00001-of-00006.safetensors",
"rwkv.blocks.2.feed_forward.time_mix_receptance": "model-00001-of-00006.safetensors",
"rwkv.blocks.2.feed_forward.value.weight": "model-00001-of-00006.safetensors",
"rwkv.blocks.2.ln1.bias": "model-00001-of-00006.safetensors",
"rwkv.blocks.2.ln1.weight": "model-00001-of-00006.safetensors",
"rwkv.blocks.2.ln2.bias": "model-00001-of-00006.safetensors",
"rwkv.blocks.2.ln2.weight": "model-00001-of-00006.safetensors",
"rwkv.blocks.20.attention.gate.weight": "model-00003-of-00006.safetensors",
"rwkv.blocks.20.attention.key.weight": "model-00003-of-00006.safetensors",
"rwkv.blocks.20.attention.ln_x.bias": "model-00003-of-00006.safetensors",
"rwkv.blocks.20.attention.ln_x.weight": "model-00003-of-00006.safetensors",
"rwkv.blocks.20.attention.output.weight": "model-00003-of-00006.safetensors",
"rwkv.blocks.20.attention.receptance.weight": "model-00003-of-00006.safetensors",
"rwkv.blocks.20.attention.time_decay": "model-00003-of-00006.safetensors",
"rwkv.blocks.20.attention.time_faaaa": "model-00003-of-00006.safetensors",
"rwkv.blocks.20.attention.time_mix_gate": "model-00003-of-00006.safetensors",
"rwkv.blocks.20.attention.time_mix_key": "model-00003-of-00006.safetensors",
"rwkv.blocks.20.attention.time_mix_receptance": "model-00003-of-00006.safetensors",
"rwkv.blocks.20.attention.time_mix_value": "model-00003-of-00006.safetensors",
"rwkv.blocks.20.attention.value.weight": "model-00003-of-00006.safetensors",
"rwkv.blocks.20.feed_forward.key.weight": "model-00003-of-00006.safetensors",
"rwkv.blocks.20.feed_forward.receptance.weight": "model-00003-of-00006.safetensors",
"rwkv.blocks.20.feed_forward.time_mix_key": "model-00003-of-00006.safetensors",
"rwkv.blocks.20.feed_forward.time_mix_receptance": "model-00003-of-00006.safetensors",
"rwkv.blocks.20.feed_forward.value.weight": "model-00003-of-00006.safetensors",
"rwkv.blocks.20.ln1.bias": "model-00003-of-00006.safetensors",
"rwkv.blocks.20.ln1.weight": "model-00003-of-00006.safetensors",
"rwkv.blocks.20.ln2.bias": "model-00003-of-00006.safetensors",
"rwkv.blocks.20.ln2.weight": "model-00003-of-00006.safetensors",
"rwkv.blocks.21.attention.gate.weight": "model-00003-of-00006.safetensors",
"rwkv.blocks.21.attention.key.weight": "model-00003-of-00006.safetensors",
"rwkv.blocks.21.attention.ln_x.bias": "model-00003-of-00006.safetensors",
"rwkv.blocks.21.attention.ln_x.weight": "model-00003-of-00006.safetensors",
"rwkv.blocks.21.attention.output.weight": "model-00003-of-00006.safetensors",
"rwkv.blocks.21.attention.receptance.weight": "model-00003-of-00006.safetensors",
"rwkv.blocks.21.attention.time_decay": "model-00003-of-00006.safetensors",
"rwkv.blocks.21.attention.time_faaaa": "model-00003-of-00006.safetensors",
"rwkv.blocks.21.attention.time_mix_gate": "model-00003-of-00006.safetensors",
"rwkv.blocks.21.attention.time_mix_key": "model-00003-of-00006.safetensors",
"rwkv.blocks.21.attention.time_mix_receptance": "model-00003-of-00006.safetensors",
"rwkv.blocks.21.attention.time_mix_value": "model-00003-of-00006.safetensors",
"rwkv.blocks.21.attention.value.weight": "model-00003-of-00006.safetensors",
"rwkv.blocks.21.feed_forward.key.weight": "model-00003-of-00006.safetensors",
"rwkv.blocks.21.feed_forward.receptance.weight": "model-00003-of-00006.safetensors",
"rwkv.blocks.21.feed_forward.time_mix_key": "model-00003-of-00006.safetensors",
"rwkv.blocks.21.feed_forward.time_mix_receptance": "model-00003-of-00006.safetensors",
"rwkv.blocks.21.feed_forward.value.weight": "model-00003-of-00006.safetensors",
"rwkv.blocks.21.ln1.bias": "model-00003-of-00006.safetensors",
"rwkv.blocks.21.ln1.weight": "model-00003-of-00006.safetensors",
"rwkv.blocks.21.ln2.bias": "model-00003-of-00006.safetensors",
"rwkv.blocks.21.ln2.weight": "model-00003-of-00006.safetensors",
"rwkv.blocks.22.attention.gate.weight": "model-00003-of-00006.safetensors",
"rwkv.blocks.22.attention.key.weight": "model-00003-of-00006.safetensors",
"rwkv.blocks.22.attention.ln_x.bias": "model-00003-of-00006.safetensors",
"rwkv.blocks.22.attention.ln_x.weight": "model-00003-of-00006.safetensors",
"rwkv.blocks.22.attention.output.weight": "model-00003-of-00006.safetensors",
"rwkv.blocks.22.attention.receptance.weight": "model-00003-of-00006.safetensors",
"rwkv.blocks.22.attention.time_decay": "model-00003-of-00006.safetensors",
"rwkv.blocks.22.attention.time_faaaa": "model-00003-of-00006.safetensors",
"rwkv.blocks.22.attention.time_mix_gate": "model-00003-of-00006.safetensors",
"rwkv.blocks.22.attention.time_mix_key": "model-00003-of-00006.safetensors",
"rwkv.blocks.22.attention.time_mix_receptance": "model-00003-of-00006.safetensors",
"rwkv.blocks.22.attention.time_mix_value": "model-00003-of-00006.safetensors",
"rwkv.blocks.22.attention.value.weight": "model-00003-of-00006.safetensors",
"rwkv.blocks.22.feed_forward.key.weight": "model-00003-of-00006.safetensors",
"rwkv.blocks.22.feed_forward.receptance.weight": "model-00003-of-00006.safetensors",
"rwkv.blocks.22.feed_forward.time_mix_key": "model-00003-of-00006.safetensors",
"rwkv.blocks.22.feed_forward.time_mix_receptance": "model-00003-of-00006.safetensors",
"rwkv.blocks.22.feed_forward.value.weight": "model-00003-of-00006.safetensors",
"rwkv.blocks.22.ln1.bias": "model-00003-of-00006.safetensors",
"rwkv.blocks.22.ln1.weight": "model-00003-of-00006.safetensors",
"rwkv.blocks.22.ln2.bias": "model-00003-of-00006.safetensors",
"rwkv.blocks.22.ln2.weight": "model-00003-of-00006.safetensors",
"rwkv.blocks.23.attention.gate.weight": "model-00003-of-00006.safetensors",
"rwkv.blocks.23.attention.key.weight": "model-00003-of-00006.safetensors",
"rwkv.blocks.23.attention.ln_x.bias": "model-00003-of-00006.safetensors",
"rwkv.blocks.23.attention.ln_x.weight": "model-00003-of-00006.safetensors",
"rwkv.blocks.23.attention.output.weight": "model-00003-of-00006.safetensors",
"rwkv.blocks.23.attention.receptance.weight": "model-00003-of-00006.safetensors",
"rwkv.blocks.23.attention.time_decay": "model-00003-of-00006.safetensors",
"rwkv.blocks.23.attention.time_faaaa": "model-00003-of-00006.safetensors",
"rwkv.blocks.23.attention.time_mix_gate": "model-00003-of-00006.safetensors",
"rwkv.blocks.23.attention.time_mix_key": "model-00003-of-00006.safetensors",
"rwkv.blocks.23.attention.time_mix_receptance": "model-00003-of-00006.safetensors",
"rwkv.blocks.23.attention.time_mix_value": "model-00003-of-00006.safetensors",
"rwkv.blocks.23.attention.value.weight": "model-00003-of-00006.safetensors",
"rwkv.blocks.23.feed_forward.key.weight": "model-00003-of-00006.safetensors",
"rwkv.blocks.23.feed_forward.receptance.weight": "model-00003-of-00006.safetensors",
"rwkv.blocks.23.feed_forward.time_mix_key": "model-00003-of-00006.safetensors",
"rwkv.blocks.23.feed_forward.time_mix_receptance": "model-00003-of-00006.safetensors",
"rwkv.blocks.23.feed_forward.value.weight": "model-00003-of-00006.safetensors",
"rwkv.blocks.23.ln1.bias": "model-00003-of-00006.safetensors",
"rwkv.blocks.23.ln1.weight": "model-00003-of-00006.safetensors",
"rwkv.blocks.23.ln2.bias": "model-00003-of-00006.safetensors",
"rwkv.blocks.23.ln2.weight": "model-00003-of-00006.safetensors",
"rwkv.blocks.24.attention.gate.weight": "model-00003-of-00006.safetensors",
"rwkv.blocks.24.attention.key.weight": "model-00003-of-00006.safetensors",
"rwkv.blocks.24.attention.ln_x.bias": "model-00003-of-00006.safetensors",
"rwkv.blocks.24.attention.ln_x.weight": "model-00003-of-00006.safetensors",
"rwkv.blocks.24.attention.output.weight": "model-00003-of-00006.safetensors",
"rwkv.blocks.24.attention.receptance.weight": "model-00003-of-00006.safetensors",
"rwkv.blocks.24.attention.time_decay": "model-00003-of-00006.safetensors",
"rwkv.blocks.24.attention.time_faaaa": "model-00003-of-00006.safetensors",
"rwkv.blocks.24.attention.time_mix_gate": "model-00003-of-00006.safetensors",
"rwkv.blocks.24.attention.time_mix_key": "model-00003-of-00006.safetensors",
"rwkv.blocks.24.attention.time_mix_receptance": "model-00003-of-00006.safetensors",
"rwkv.blocks.24.attention.time_mix_value": "model-00003-of-00006.safetensors",
"rwkv.blocks.24.attention.value.weight": "model-00003-of-00006.safetensors",
"rwkv.blocks.24.feed_forward.key.weight": "model-00003-of-00006.safetensors",
"rwkv.blocks.24.feed_forward.receptance.weight": "model-00003-of-00006.safetensors",
"rwkv.blocks.24.feed_forward.time_mix_key": "model-00003-of-00006.safetensors",
"rwkv.blocks.24.feed_forward.time_mix_receptance": "model-00003-of-00006.safetensors",
"rwkv.blocks.24.feed_forward.value.weight": "model-00004-of-00006.safetensors",
"rwkv.blocks.24.ln1.bias": "model-00003-of-00006.safetensors",
"rwkv.blocks.24.ln1.weight": "model-00003-of-00006.safetensors",
"rwkv.blocks.24.ln2.bias": "model-00003-of-00006.safetensors",
"rwkv.blocks.24.ln2.weight": "model-00003-of-00006.safetensors",
"rwkv.blocks.25.attention.gate.weight": "model-00004-of-00006.safetensors",
"rwkv.blocks.25.attention.key.weight": "model-00004-of-00006.safetensors",
"rwkv.blocks.25.attention.ln_x.bias": "model-00004-of-00006.safetensors",
"rwkv.blocks.25.attention.ln_x.weight": "model-00004-of-00006.safetensors",
"rwkv.blocks.25.attention.output.weight": "model-00004-of-00006.safetensors",
"rwkv.blocks.25.attention.receptance.weight": "model-00004-of-00006.safetensors",
"rwkv.blocks.25.attention.time_decay": "model-00004-of-00006.safetensors",
"rwkv.blocks.25.attention.time_faaaa": "model-00004-of-00006.safetensors",
"rwkv.blocks.25.attention.time_mix_gate": "model-00004-of-00006.safetensors",
"rwkv.blocks.25.attention.time_mix_key": "model-00004-of-00006.safetensors",
"rwkv.blocks.25.attention.time_mix_receptance": "model-00004-of-00006.safetensors",
"rwkv.blocks.25.attention.time_mix_value": "model-00004-of-00006.safetensors",
"rwkv.blocks.25.attention.value.weight": "model-00004-of-00006.safetensors",
"rwkv.blocks.25.feed_forward.key.weight": "model-00004-of-00006.safetensors",
"rwkv.blocks.25.feed_forward.receptance.weight": "model-00004-of-00006.safetensors",
"rwkv.blocks.25.feed_forward.time_mix_key": "model-00004-of-00006.safetensors",
"rwkv.blocks.25.feed_forward.time_mix_receptance": "model-00004-of-00006.safetensors",
"rwkv.blocks.25.feed_forward.value.weight": "model-00004-of-00006.safetensors",
"rwkv.blocks.25.ln1.bias": "model-00004-of-00006.safetensors",
"rwkv.blocks.25.ln1.weight": "model-00004-of-00006.safetensors",
"rwkv.blocks.25.ln2.bias": "model-00004-of-00006.safetensors",
"rwkv.blocks.25.ln2.weight": "model-00004-of-00006.safetensors",
"rwkv.blocks.26.attention.gate.weight": "model-00004-of-00006.safetensors",
"rwkv.blocks.26.attention.key.weight": "model-00004-of-00006.safetensors",
"rwkv.blocks.26.attention.ln_x.bias": "model-00004-of-00006.safetensors",
"rwkv.blocks.26.attention.ln_x.weight": "model-00004-of-00006.safetensors",
"rwkv.blocks.26.attention.output.weight": "model-00004-of-00006.safetensors",
"rwkv.blocks.26.attention.receptance.weight": "model-00004-of-00006.safetensors",
"rwkv.blocks.26.attention.time_decay": "model-00004-of-00006.safetensors",
"rwkv.blocks.26.attention.time_faaaa": "model-00004-of-00006.safetensors",
"rwkv.blocks.26.attention.time_mix_gate": "model-00004-of-00006.safetensors",
"rwkv.blocks.26.attention.time_mix_key": "model-00004-of-00006.safetensors",
"rwkv.blocks.26.attention.time_mix_receptance": "model-00004-of-00006.safetensors",
"rwkv.blocks.26.attention.time_mix_value": "model-00004-of-00006.safetensors",
"rwkv.blocks.26.attention.value.weight": "model-00004-of-00006.safetensors",
"rwkv.blocks.26.feed_forward.key.weight": "model-00004-of-00006.safetensors",
"rwkv.blocks.26.feed_forward.receptance.weight": "model-00004-of-00006.safetensors",
"rwkv.blocks.26.feed_forward.time_mix_key": "model-00004-of-00006.safetensors",
"rwkv.blocks.26.feed_forward.time_mix_receptance": "model-00004-of-00006.safetensors",
"rwkv.blocks.26.feed_forward.value.weight": "model-00004-of-00006.safetensors",
"rwkv.blocks.26.ln1.bias": "model-00004-of-00006.safetensors",
"rwkv.blocks.26.ln1.weight": "model-00004-of-00006.safetensors",
"rwkv.blocks.26.ln2.bias": "model-00004-of-00006.safetensors",
"rwkv.blocks.26.ln2.weight": "model-00004-of-00006.safetensors",
"rwkv.blocks.27.attention.gate.weight": "model-00004-of-00006.safetensors",
"rwkv.blocks.27.attention.key.weight": "model-00004-of-00006.safetensors",
"rwkv.blocks.27.attention.ln_x.bias": "model-00004-of-00006.safetensors",
"rwkv.blocks.27.attention.ln_x.weight": "model-00004-of-00006.safetensors",
"rwkv.blocks.27.attention.output.weight": "model-00004-of-00006.safetensors",
"rwkv.blocks.27.attention.receptance.weight": "model-00004-of-00006.safetensors",
"rwkv.blocks.27.attention.time_decay": "model-00004-of-00006.safetensors",
"rwkv.blocks.27.attention.time_faaaa": "model-00004-of-00006.safetensors",
"rwkv.blocks.27.attention.time_mix_gate": "model-00004-of-00006.safetensors",
"rwkv.blocks.27.attention.time_mix_key": "model-00004-of-00006.safetensors",
"rwkv.blocks.27.attention.time_mix_receptance": "model-00004-of-00006.safetensors",
"rwkv.blocks.27.attention.time_mix_value": "model-00004-of-00006.safetensors",
"rwkv.blocks.27.attention.value.weight": "model-00004-of-00006.safetensors",
"rwkv.blocks.27.feed_forward.key.weight": "model-00004-of-00006.safetensors",
"rwkv.blocks.27.feed_forward.receptance.weight": "model-00004-of-00006.safetensors",
"rwkv.blocks.27.feed_forward.time_mix_key": "model-00004-of-00006.safetensors",
"rwkv.blocks.27.feed_forward.time_mix_receptance": "model-00004-of-00006.safetensors",
"rwkv.blocks.27.feed_forward.value.weight": "model-00004-of-00006.safetensors",
"rwkv.blocks.27.ln1.bias": "model-00004-of-00006.safetensors",
"rwkv.blocks.27.ln1.weight": "model-00004-of-00006.safetensors",
"rwkv.blocks.27.ln2.bias": "model-00004-of-00006.safetensors",
"rwkv.blocks.27.ln2.weight": "model-00004-of-00006.safetensors",
"rwkv.blocks.28.attention.gate.weight": "model-00004-of-00006.safetensors",
"rwkv.blocks.28.attention.key.weight": "model-00004-of-00006.safetensors",
"rwkv.blocks.28.attention.ln_x.bias": "model-00004-of-00006.safetensors",
"rwkv.blocks.28.attention.ln_x.weight": "model-00004-of-00006.safetensors",
"rwkv.blocks.28.attention.output.weight": "model-00004-of-00006.safetensors",
"rwkv.blocks.28.attention.receptance.weight": "model-00004-of-00006.safetensors",
"rwkv.blocks.28.attention.time_decay": "model-00004-of-00006.safetensors",
"rwkv.blocks.28.attention.time_faaaa": "model-00004-of-00006.safetensors",
"rwkv.blocks.28.attention.time_mix_gate": "model-00004-of-00006.safetensors",
"rwkv.blocks.28.attention.time_mix_key": "model-00004-of-00006.safetensors",
"rwkv.blocks.28.attention.time_mix_receptance": "model-00004-of-00006.safetensors",
"rwkv.blocks.28.attention.time_mix_value": "model-00004-of-00006.safetensors",
"rwkv.blocks.28.attention.value.weight": "model-00004-of-00006.safetensors",
"rwkv.blocks.28.feed_forward.key.weight": "model-00004-of-00006.safetensors",
"rwkv.blocks.28.feed_forward.receptance.weight": "model-00004-of-00006.safetensors",
"rwkv.blocks.28.feed_forward.time_mix_key": "model-00004-of-00006.safetensors",
"rwkv.blocks.28.feed_forward.time_mix_receptance": "model-00004-of-00006.safetensors",
"rwkv.blocks.28.feed_forward.value.weight": "model-00004-of-00006.safetensors",
"rwkv.blocks.28.ln1.bias": "model-00004-of-00006.safetensors",
"rwkv.blocks.28.ln1.weight": "model-00004-of-00006.safetensors",
"rwkv.blocks.28.ln2.bias": "model-00004-of-00006.safetensors",
"rwkv.blocks.28.ln2.weight": "model-00004-of-00006.safetensors",
"rwkv.blocks.29.attention.gate.weight": "model-00004-of-00006.safetensors",
"rwkv.blocks.29.attention.key.weight": "model-00004-of-00006.safetensors",
"rwkv.blocks.29.attention.ln_x.bias": "model-00004-of-00006.safetensors",
"rwkv.blocks.29.attention.ln_x.weight": "model-00004-of-00006.safetensors",
"rwkv.blocks.29.attention.output.weight": "model-00004-of-00006.safetensors",
"rwkv.blocks.29.attention.receptance.weight": "model-00004-of-00006.safetensors",
"rwkv.blocks.29.attention.time_decay": "model-00004-of-00006.safetensors",
"rwkv.blocks.29.attention.time_faaaa": "model-00004-of-00006.safetensors",
"rwkv.blocks.29.attention.time_mix_gate": "model-00004-of-00006.safetensors",
"rwkv.blocks.29.attention.time_mix_key": "model-00004-of-00006.safetensors",
"rwkv.blocks.29.attention.time_mix_receptance": "model-00004-of-00006.safetensors",
"rwkv.blocks.29.attention.time_mix_value": "model-00004-of-00006.safetensors",
"rwkv.blocks.29.attention.value.weight": "model-00004-of-00006.safetensors",
"rwkv.blocks.29.feed_forward.key.weight": "model-00004-of-00006.safetensors",
"rwkv.blocks.29.feed_forward.receptance.weight": "model-00004-of-00006.safetensors",
"rwkv.blocks.29.feed_forward.time_mix_key": "model-00004-of-00006.safetensors",
"rwkv.blocks.29.feed_forward.time_mix_receptance": "model-00004-of-00006.safetensors",
"rwkv.blocks.29.feed_forward.value.weight": "model-00004-of-00006.safetensors",
"rwkv.blocks.29.ln1.bias": "model-00004-of-00006.safetensors",
"rwkv.blocks.29.ln1.weight": "model-00004-of-00006.safetensors",
"rwkv.blocks.29.ln2.bias": "model-00004-of-00006.safetensors",
"rwkv.blocks.29.ln2.weight": "model-00004-of-00006.safetensors",
"rwkv.blocks.3.attention.gate.weight": "model-00001-of-00006.safetensors",
"rwkv.blocks.3.attention.key.weight": "model-00001-of-00006.safetensors",
"rwkv.blocks.3.attention.ln_x.bias": "model-00001-of-00006.safetensors",
"rwkv.blocks.3.attention.ln_x.weight": "model-00001-of-00006.safetensors",
"rwkv.blocks.3.attention.output.weight": "model-00001-of-00006.safetensors",
"rwkv.blocks.3.attention.receptance.weight": "model-00001-of-00006.safetensors",
"rwkv.blocks.3.attention.time_decay": "model-00001-of-00006.safetensors",
"rwkv.blocks.3.attention.time_faaaa": "model-00001-of-00006.safetensors",
"rwkv.blocks.3.attention.time_mix_gate": "model-00001-of-00006.safetensors",
"rwkv.blocks.3.attention.time_mix_key": "model-00001-of-00006.safetensors",
"rwkv.blocks.3.attention.time_mix_receptance": "model-00001-of-00006.safetensors",
"rwkv.blocks.3.attention.time_mix_value": "model-00001-of-00006.safetensors",
"rwkv.blocks.3.attention.value.weight": "model-00001-of-00006.safetensors",
"rwkv.blocks.3.feed_forward.key.weight": "model-00001-of-00006.safetensors",
"rwkv.blocks.3.feed_forward.receptance.weight": "model-00001-of-00006.safetensors",
"rwkv.blocks.3.feed_forward.time_mix_key": "model-00001-of-00006.safetensors",
"rwkv.blocks.3.feed_forward.time_mix_receptance": "model-00001-of-00006.safetensors",
"rwkv.blocks.3.feed_forward.value.weight": "model-00001-of-00006.safetensors",
"rwkv.blocks.3.ln1.bias": "model-00001-of-00006.safetensors",
"rwkv.blocks.3.ln1.weight": "model-00001-of-00006.safetensors",
"rwkv.blocks.3.ln2.bias": "model-00001-of-00006.safetensors",
"rwkv.blocks.3.ln2.weight": "model-00001-of-00006.safetensors",
"rwkv.blocks.30.attention.gate.weight": "model-00004-of-00006.safetensors",
"rwkv.blocks.30.attention.key.weight": "model-00004-of-00006.safetensors",
"rwkv.blocks.30.attention.ln_x.bias": "model-00004-of-00006.safetensors",
"rwkv.blocks.30.attention.ln_x.weight": "model-00004-of-00006.safetensors",
"rwkv.blocks.30.attention.output.weight": "model-00004-of-00006.safetensors",
"rwkv.blocks.30.attention.receptance.weight": "model-00004-of-00006.safetensors",
"rwkv.blocks.30.attention.time_decay": "model-00004-of-00006.safetensors",
"rwkv.blocks.30.attention.time_faaaa": "model-00004-of-00006.safetensors",
"rwkv.blocks.30.attention.time_mix_gate": "model-00004-of-00006.safetensors",
"rwkv.blocks.30.attention.time_mix_key": "model-00004-of-00006.safetensors",
"rwkv.blocks.30.attention.time_mix_receptance": "model-00004-of-00006.safetensors",
"rwkv.blocks.30.attention.time_mix_value": "model-00004-of-00006.safetensors",
"rwkv.blocks.30.attention.value.weight": "model-00004-of-00006.safetensors",
"rwkv.blocks.30.feed_forward.key.weight": "model-00004-of-00006.safetensors",
"rwkv.blocks.30.feed_forward.receptance.weight": "model-00004-of-00006.safetensors",
"rwkv.blocks.30.feed_forward.time_mix_key": "model-00004-of-00006.safetensors",
"rwkv.blocks.30.feed_forward.time_mix_receptance": "model-00004-of-00006.safetensors",
"rwkv.blocks.30.feed_forward.value.weight": "model-00004-of-00006.safetensors",
"rwkv.blocks.30.ln1.bias": "model-00004-of-00006.safetensors",
"rwkv.blocks.30.ln1.weight": "model-00004-of-00006.safetensors",
"rwkv.blocks.30.ln2.bias": "model-00004-of-00006.safetensors",
"rwkv.blocks.30.ln2.weight": "model-00004-of-00006.safetensors",
"rwkv.blocks.31.attention.gate.weight": "model-00004-of-00006.safetensors",
"rwkv.blocks.31.attention.key.weight": "model-00004-of-00006.safetensors",
"rwkv.blocks.31.attention.ln_x.bias": "model-00004-of-00006.safetensors",
"rwkv.blocks.31.attention.ln_x.weight": "model-00004-of-00006.safetensors",
"rwkv.blocks.31.attention.output.weight": "model-00004-of-00006.safetensors",
"rwkv.blocks.31.attention.receptance.weight": "model-00004-of-00006.safetensors",
"rwkv.blocks.31.attention.time_decay": "model-00004-of-00006.safetensors",
"rwkv.blocks.31.attention.time_faaaa": "model-00004-of-00006.safetensors",
"rwkv.blocks.31.attention.time_mix_gate": "model-00004-of-00006.safetensors",
"rwkv.blocks.31.attention.time_mix_key": "model-00004-of-00006.safetensors",
"rwkv.blocks.31.attention.time_mix_receptance": "model-00004-of-00006.safetensors",
"rwkv.blocks.31.attention.time_mix_value": "model-00004-of-00006.safetensors",
"rwkv.blocks.31.attention.value.weight": "model-00004-of-00006.safetensors",
"rwkv.blocks.31.feed_forward.key.weight": "model-00004-of-00006.safetensors",
"rwkv.blocks.31.feed_forward.receptance.weight": "model-00004-of-00006.safetensors",
"rwkv.blocks.31.feed_forward.time_mix_key": "model-00004-of-00006.safetensors",
"rwkv.blocks.31.feed_forward.time_mix_receptance": "model-00004-of-00006.safetensors",
"rwkv.blocks.31.feed_forward.value.weight": "model-00004-of-00006.safetensors",
"rwkv.blocks.31.ln1.bias": "model-00004-of-00006.safetensors",
"rwkv.blocks.31.ln1.weight": "model-00004-of-00006.safetensors",
"rwkv.blocks.31.ln2.bias": "model-00004-of-00006.safetensors",
"rwkv.blocks.31.ln2.weight": "model-00004-of-00006.safetensors",
"rwkv.blocks.32.attention.gate.weight": "model-00004-of-00006.safetensors",
"rwkv.blocks.32.attention.key.weight": "model-00004-of-00006.safetensors",
"rwkv.blocks.32.attention.ln_x.bias": "model-00004-of-00006.safetensors",
"rwkv.blocks.32.attention.ln_x.weight": "model-00004-of-00006.safetensors",
"rwkv.blocks.32.attention.output.weight": "model-00004-of-00006.safetensors",
"rwkv.blocks.32.attention.receptance.weight": "model-00004-of-00006.safetensors",
"rwkv.blocks.32.attention.time_decay": "model-00004-of-00006.safetensors",
"rwkv.blocks.32.attention.time_faaaa": "model-00004-of-00006.safetensors",
"rwkv.blocks.32.attention.time_mix_gate": "model-00004-of-00006.safetensors",
"rwkv.blocks.32.attention.time_mix_key": "model-00004-of-00006.safetensors",
"rwkv.blocks.32.attention.time_mix_receptance": "model-00004-of-00006.safetensors",
"rwkv.blocks.32.attention.time_mix_value": "model-00004-of-00006.safetensors",
"rwkv.blocks.32.attention.value.weight": "model-00004-of-00006.safetensors",
"rwkv.blocks.32.feed_forward.key.weight": "model-00004-of-00006.safetensors",
"rwkv.blocks.32.feed_forward.receptance.weight": "model-00004-of-00006.safetensors",
"rwkv.blocks.32.feed_forward.time_mix_key": "model-00004-of-00006.safetensors",
"rwkv.blocks.32.feed_forward.time_mix_receptance": "model-00004-of-00006.safetensors",
"rwkv.blocks.32.feed_forward.value.weight": "model-00004-of-00006.safetensors",
"rwkv.blocks.32.ln1.bias": "model-00004-of-00006.safetensors",
"rwkv.blocks.32.ln1.weight": "model-00004-of-00006.safetensors",
"rwkv.blocks.32.ln2.bias": "model-00004-of-00006.safetensors",
"rwkv.blocks.32.ln2.weight": "model-00004-of-00006.safetensors",
"rwkv.blocks.33.attention.gate.weight": "model-00004-of-00006.safetensors",
"rwkv.blocks.33.attention.key.weight": "model-00004-of-00006.safetensors",
"rwkv.blocks.33.attention.ln_x.bias": "model-00004-of-00006.safetensors",
"rwkv.blocks.33.attention.ln_x.weight": "model-00004-of-00006.safetensors",
"rwkv.blocks.33.attention.output.weight": "model-00004-of-00006.safetensors",
"rwkv.blocks.33.attention.receptance.weight": "model-00004-of-00006.safetensors",
"rwkv.blocks.33.attention.time_decay": "model-00004-of-00006.safetensors",
"rwkv.blocks.33.attention.time_faaaa": "model-00004-of-00006.safetensors",
"rwkv.blocks.33.attention.time_mix_gate": "model-00004-of-00006.safetensors",
"rwkv.blocks.33.attention.time_mix_key": "model-00004-of-00006.safetensors",
"rwkv.blocks.33.attention.time_mix_receptance": "model-00004-of-00006.safetensors",
"rwkv.blocks.33.attention.time_mix_value": "model-00004-of-00006.safetensors",
"rwkv.blocks.33.attention.value.weight": "model-00004-of-00006.safetensors",
"rwkv.blocks.33.feed_forward.key.weight": "model-00004-of-00006.safetensors",
"rwkv.blocks.33.feed_forward.receptance.weight": "model-00004-of-00006.safetensors",
"rwkv.blocks.33.feed_forward.time_mix_key": "model-00004-of-00006.safetensors",
"rwkv.blocks.33.feed_forward.time_mix_receptance": "model-00004-of-00006.safetensors",
"rwkv.blocks.33.feed_forward.value.weight": "model-00005-of-00006.safetensors",
"rwkv.blocks.33.ln1.bias": "model-00004-of-00006.safetensors",
"rwkv.blocks.33.ln1.weight": "model-00004-of-00006.safetensors",
"rwkv.blocks.33.ln2.bias": "model-00004-of-00006.safetensors",
"rwkv.blocks.33.ln2.weight": "model-00004-of-00006.safetensors",
"rwkv.blocks.34.attention.gate.weight": "model-00005-of-00006.safetensors",
"rwkv.blocks.34.attention.key.weight": "model-00005-of-00006.safetensors",
"rwkv.blocks.34.attention.ln_x.bias": "model-00005-of-00006.safetensors",
"rwkv.blocks.34.attention.ln_x.weight": "model-00005-of-00006.safetensors",
"rwkv.blocks.34.attention.output.weight": "model-00005-of-00006.safetensors",
"rwkv.blocks.34.attention.receptance.weight": "model-00005-of-00006.safetensors",
"rwkv.blocks.34.attention.time_decay": "model-00005-of-00006.safetensors",
"rwkv.blocks.34.attention.time_faaaa": "model-00005-of-00006.safetensors",
"rwkv.blocks.34.attention.time_mix_gate": "model-00005-of-00006.safetensors",
"rwkv.blocks.34.attention.time_mix_key": "model-00005-of-00006.safetensors",
"rwkv.blocks.34.attention.time_mix_receptance": "model-00005-of-00006.safetensors",
"rwkv.blocks.34.attention.time_mix_value": "model-00005-of-00006.safetensors",
"rwkv.blocks.34.attention.value.weight": "model-00005-of-00006.safetensors",
"rwkv.blocks.34.feed_forward.key.weight": "model-00005-of-00006.safetensors",
"rwkv.blocks.34.feed_forward.receptance.weight": "model-00005-of-00006.safetensors",
"rwkv.blocks.34.feed_forward.time_mix_key": "model-00005-of-00006.safetensors",
"rwkv.blocks.34.feed_forward.time_mix_receptance": "model-00005-of-00006.safetensors",
"rwkv.blocks.34.feed_forward.value.weight": "model-00005-of-00006.safetensors",
"rwkv.blocks.34.ln1.bias": "model-00005-of-00006.safetensors",
"rwkv.blocks.34.ln1.weight": "model-00005-of-00006.safetensors",
"rwkv.blocks.34.ln2.bias": "model-00005-of-00006.safetensors",
"rwkv.blocks.34.ln2.weight": "model-00005-of-00006.safetensors",
"rwkv.blocks.35.attention.gate.weight": "model-00005-of-00006.safetensors",
"rwkv.blocks.35.attention.key.weight": "model-00005-of-00006.safetensors",
"rwkv.blocks.35.attention.ln_x.bias": "model-00005-of-00006.safetensors",
"rwkv.blocks.35.attention.ln_x.weight": "model-00005-of-00006.safetensors",
"rwkv.blocks.35.attention.output.weight": "model-00005-of-00006.safetensors",
"rwkv.blocks.35.attention.receptance.weight": "model-00005-of-00006.safetensors",
"rwkv.blocks.35.attention.time_decay": "model-00005-of-00006.safetensors",
"rwkv.blocks.35.attention.time_faaaa": "model-00005-of-00006.safetensors",
"rwkv.blocks.35.attention.time_mix_gate": "model-00005-of-00006.safetensors",
"rwkv.blocks.35.attention.time_mix_key": "model-00005-of-00006.safetensors",
"rwkv.blocks.35.attention.time_mix_receptance": "model-00005-of-00006.safetensors",
"rwkv.blocks.35.attention.time_mix_value": "model-00005-of-00006.safetensors",
"rwkv.blocks.35.attention.value.weight": "model-00005-of-00006.safetensors",
"rwkv.blocks.35.feed_forward.key.weight": "model-00005-of-00006.safetensors",
"rwkv.blocks.35.feed_forward.receptance.weight": "model-00005-of-00006.safetensors",
"rwkv.blocks.35.feed_forward.time_mix_key": "model-00005-of-00006.safetensors",
"rwkv.blocks.35.feed_forward.time_mix_receptance": "model-00005-of-00006.safetensors",
"rwkv.blocks.35.feed_forward.value.weight": "model-00005-of-00006.safetensors",
"rwkv.blocks.35.ln1.bias": "model-00005-of-00006.safetensors",
"rwkv.blocks.35.ln1.weight": "model-00005-of-00006.safetensors",
"rwkv.blocks.35.ln2.bias": "model-00005-of-00006.safetensors",
"rwkv.blocks.35.ln2.weight": "model-00005-of-00006.safetensors",
"rwkv.blocks.36.attention.gate.weight": "model-00005-of-00006.safetensors",
"rwkv.blocks.36.attention.key.weight": "model-00005-of-00006.safetensors",
"rwkv.blocks.36.attention.ln_x.bias": "model-00005-of-00006.safetensors",
"rwkv.blocks.36.attention.ln_x.weight": "model-00005-of-00006.safetensors",
"rwkv.blocks.36.attention.output.weight": "model-00005-of-00006.safetensors",
"rwkv.blocks.36.attention.receptance.weight": "model-00005-of-00006.safetensors",
"rwkv.blocks.36.attention.time_decay": "model-00005-of-00006.safetensors",
"rwkv.blocks.36.attention.time_faaaa": "model-00005-of-00006.safetensors",
"rwkv.blocks.36.attention.time_mix_gate": "model-00005-of-00006.safetensors",
"rwkv.blocks.36.attention.time_mix_key": "model-00005-of-00006.safetensors",
"rwkv.blocks.36.attention.time_mix_receptance": "model-00005-of-00006.safetensors",
"rwkv.blocks.36.attention.time_mix_value": "model-00005-of-00006.safetensors",
"rwkv.blocks.36.attention.value.weight": "model-00005-of-00006.safetensors",
"rwkv.blocks.36.feed_forward.key.weight": "model-00005-of-00006.safetensors",
"rwkv.blocks.36.feed_forward.receptance.weight": "model-00005-of-00006.safetensors",
"rwkv.blocks.36.feed_forward.time_mix_key": "model-00005-of-00006.safetensors",
"rwkv.blocks.36.feed_forward.time_mix_receptance": "model-00005-of-00006.safetensors",
"rwkv.blocks.36.feed_forward.value.weight": "model-00005-of-00006.safetensors",
"rwkv.blocks.36.ln1.bias": "model-00005-of-00006.safetensors",
"rwkv.blocks.36.ln1.weight": "model-00005-of-00006.safetensors",
"rwkv.blocks.36.ln2.bias": "model-00005-of-00006.safetensors",
"rwkv.blocks.36.ln2.weight": "model-00005-of-00006.safetensors",
"rwkv.blocks.37.attention.gate.weight": "model-00005-of-00006.safetensors",
"rwkv.blocks.37.attention.key.weight": "model-00005-of-00006.safetensors",
"rwkv.blocks.37.attention.ln_x.bias": "model-00005-of-00006.safetensors",
"rwkv.blocks.37.attention.ln_x.weight": "model-00005-of-00006.safetensors",
"rwkv.blocks.37.attention.output.weight": "model-00005-of-00006.safetensors",
"rwkv.blocks.37.attention.receptance.weight": "model-00005-of-00006.safetensors",
"rwkv.blocks.37.attention.time_decay": "model-00005-of-00006.safetensors",
"rwkv.blocks.37.attention.time_faaaa": "model-00005-of-00006.safetensors",
"rwkv.blocks.37.attention.time_mix_gate": "model-00005-of-00006.safetensors",
"rwkv.blocks.37.attention.time_mix_key": "model-00005-of-00006.safetensors",
"rwkv.blocks.37.attention.time_mix_receptance": "model-00005-of-00006.safetensors",
"rwkv.blocks.37.attention.time_mix_value": "model-00005-of-00006.safetensors",
"rwkv.blocks.37.attention.value.weight": "model-00005-of-00006.safetensors",
"rwkv.blocks.37.feed_forward.key.weight": "model-00005-of-00006.safetensors",
"rwkv.blocks.37.feed_forward.receptance.weight": "model-00005-of-00006.safetensors",
"rwkv.blocks.37.feed_forward.time_mix_key": "model-00005-of-00006.safetensors",
"rwkv.blocks.37.feed_forward.time_mix_receptance": "model-00005-of-00006.safetensors",
"rwkv.blocks.37.feed_forward.value.weight": "model-00005-of-00006.safetensors",
"rwkv.blocks.37.ln1.bias": "model-00005-of-00006.safetensors",
"rwkv.blocks.37.ln1.weight": "model-00005-of-00006.safetensors",
"rwkv.blocks.37.ln2.bias": "model-00005-of-00006.safetensors",
"rwkv.blocks.37.ln2.weight": "model-00005-of-00006.safetensors",
"rwkv.blocks.38.attention.gate.weight": "model-00005-of-00006.safetensors",
"rwkv.blocks.38.attention.key.weight": "model-00005-of-00006.safetensors",
"rwkv.blocks.38.attention.ln_x.bias": "model-00005-of-00006.safetensors",
"rwkv.blocks.38.attention.ln_x.weight": "model-00005-of-00006.safetensors",
"rwkv.blocks.38.attention.output.weight": "model-00005-of-00006.safetensors",
"rwkv.blocks.38.attention.receptance.weight": "model-00005-of-00006.safetensors",
"rwkv.blocks.38.attention.time_decay": "model-00005-of-00006.safetensors",
"rwkv.blocks.38.attention.time_faaaa": "model-00005-of-00006.safetensors",
"rwkv.blocks.38.attention.time_mix_gate": "model-00005-of-00006.safetensors",
"rwkv.blocks.38.attention.time_mix_key": "model-00005-of-00006.safetensors",
"rwkv.blocks.38.attention.time_mix_receptance": "model-00005-of-00006.safetensors",
"rwkv.blocks.38.attention.time_mix_value": "model-00005-of-00006.safetensors",
"rwkv.blocks.38.attention.value.weight": "model-00005-of-00006.safetensors",
"rwkv.blocks.38.feed_forward.key.weight": "model-00005-of-00006.safetensors",
"rwkv.blocks.38.feed_forward.receptance.weight": "model-00005-of-00006.safetensors",
"rwkv.blocks.38.feed_forward.time_mix_key": "model-00005-of-00006.safetensors",
"rwkv.blocks.38.feed_forward.time_mix_receptance": "model-00005-of-00006.safetensors",
"rwkv.blocks.38.feed_forward.value.weight": "model-00005-of-00006.safetensors",
"rwkv.blocks.38.ln1.bias": "model-00005-of-00006.safetensors",
"rwkv.blocks.38.ln1.weight": "model-00005-of-00006.safetensors",
"rwkv.blocks.38.ln2.bias": "model-00005-of-00006.safetensors",
"rwkv.blocks.38.ln2.weight": "model-00005-of-00006.safetensors",
"rwkv.blocks.39.attention.gate.weight": "model-00005-of-00006.safetensors",
"rwkv.blocks.39.attention.key.weight": "model-00005-of-00006.safetensors",
"rwkv.blocks.39.attention.ln_x.bias": "model-00005-of-00006.safetensors",
"rwkv.blocks.39.attention.ln_x.weight": "model-00005-of-00006.safetensors",
"rwkv.blocks.39.attention.output.weight": "model-00005-of-00006.safetensors",
"rwkv.blocks.39.attention.receptance.weight": "model-00005-of-00006.safetensors",
"rwkv.blocks.39.attention.time_decay": "model-00005-of-00006.safetensors",
"rwkv.blocks.39.attention.time_faaaa": "model-00005-of-00006.safetensors",
"rwkv.blocks.39.attention.time_mix_gate": "model-00005-of-00006.safetensors",
"rwkv.blocks.39.attention.time_mix_key": "model-00005-of-00006.safetensors",
"rwkv.blocks.39.attention.time_mix_receptance": "model-00005-of-00006.safetensors",
"rwkv.blocks.39.attention.time_mix_value": "model-00005-of-00006.safetensors",
"rwkv.blocks.39.attention.value.weight": "model-00005-of-00006.safetensors",
"rwkv.blocks.39.feed_forward.key.weight": "model-00005-of-00006.safetensors",
"rwkv.blocks.39.feed_forward.receptance.weight": "model-00005-of-00006.safetensors",
"rwkv.blocks.39.feed_forward.time_mix_key": "model-00005-of-00006.safetensors",
"rwkv.blocks.39.feed_forward.time_mix_receptance": "model-00005-of-00006.safetensors",
"rwkv.blocks.39.feed_forward.value.weight": "model-00005-of-00006.safetensors",
"rwkv.blocks.39.ln1.bias": "model-00005-of-00006.safetensors",
"rwkv.blocks.39.ln1.weight": "model-00005-of-00006.safetensors",
"rwkv.blocks.39.ln2.bias": "model-00005-of-00006.safetensors",
"rwkv.blocks.39.ln2.weight": "model-00005-of-00006.safetensors",
"rwkv.blocks.4.attention.gate.weight": "model-00001-of-00006.safetensors",
"rwkv.blocks.4.attention.key.weight": "model-00001-of-00006.safetensors",
"rwkv.blocks.4.attention.ln_x.bias": "model-00001-of-00006.safetensors",
"rwkv.blocks.4.attention.ln_x.weight": "model-00001-of-00006.safetensors",
"rwkv.blocks.4.attention.output.weight": "model-00001-of-00006.safetensors",
"rwkv.blocks.4.attention.receptance.weight": "model-00001-of-00006.safetensors",
"rwkv.blocks.4.attention.time_decay": "model-00001-of-00006.safetensors",
"rwkv.blocks.4.attention.time_faaaa": "model-00001-of-00006.safetensors",
"rwkv.blocks.4.attention.time_mix_gate": "model-00001-of-00006.safetensors",
"rwkv.blocks.4.attention.time_mix_key": "model-00001-of-00006.safetensors",
"rwkv.blocks.4.attention.time_mix_receptance": "model-00001-of-00006.safetensors",
"rwkv.blocks.4.attention.time_mix_value": "model-00001-of-00006.safetensors",
"rwkv.blocks.4.attention.value.weight": "model-00001-of-00006.safetensors",
"rwkv.blocks.4.feed_forward.key.weight": "model-00001-of-00006.safetensors",
"rwkv.blocks.4.feed_forward.receptance.weight": "model-00001-of-00006.safetensors",
"rwkv.blocks.4.feed_forward.time_mix_key": "model-00001-of-00006.safetensors",
"rwkv.blocks.4.feed_forward.time_mix_receptance": "model-00001-of-00006.safetensors",
"rwkv.blocks.4.feed_forward.value.weight": "model-00001-of-00006.safetensors",
"rwkv.blocks.4.ln1.bias": "model-00001-of-00006.safetensors",
"rwkv.blocks.4.ln1.weight": "model-00001-of-00006.safetensors",
"rwkv.blocks.4.ln2.bias": "model-00001-of-00006.safetensors",
"rwkv.blocks.4.ln2.weight": "model-00001-of-00006.safetensors",
"rwkv.blocks.40.attention.gate.weight": "model-00005-of-00006.safetensors",
"rwkv.blocks.40.attention.key.weight": "model-00005-of-00006.safetensors",
"rwkv.blocks.40.attention.ln_x.bias": "model-00005-of-00006.safetensors",
"rwkv.blocks.40.attention.ln_x.weight": "model-00005-of-00006.safetensors",
"rwkv.blocks.40.attention.output.weight": "model-00005-of-00006.safetensors",
"rwkv.blocks.40.attention.receptance.weight": "model-00005-of-00006.safetensors",
"rwkv.blocks.40.attention.time_decay": "model-00005-of-00006.safetensors",
"rwkv.blocks.40.attention.time_faaaa": "model-00005-of-00006.safetensors",
"rwkv.blocks.40.attention.time_mix_gate": "model-00005-of-00006.safetensors",
"rwkv.blocks.40.attention.time_mix_key": "model-00005-of-00006.safetensors",
"rwkv.blocks.40.attention.time_mix_receptance": "model-00005-of-00006.safetensors",
"rwkv.blocks.40.attention.time_mix_value": "model-00005-of-00006.safetensors",
"rwkv.blocks.40.attention.value.weight": "model-00005-of-00006.safetensors",
"rwkv.blocks.40.feed_forward.key.weight": "model-00005-of-00006.safetensors",
"rwkv.blocks.40.feed_forward.receptance.weight": "model-00005-of-00006.safetensors",
"rwkv.blocks.40.feed_forward.time_mix_key": "model-00005-of-00006.safetensors",
"rwkv.blocks.40.feed_forward.time_mix_receptance": "model-00005-of-00006.safetensors",
"rwkv.blocks.40.feed_forward.value.weight": "model-00005-of-00006.safetensors",
"rwkv.blocks.40.ln1.bias": "model-00005-of-00006.safetensors",
"rwkv.blocks.40.ln1.weight": "model-00005-of-00006.safetensors",
"rwkv.blocks.40.ln2.bias": "model-00005-of-00006.safetensors",
"rwkv.blocks.40.ln2.weight": "model-00005-of-00006.safetensors",
"rwkv.blocks.41.attention.gate.weight": "model-00005-of-00006.safetensors",
"rwkv.blocks.41.attention.key.weight": "model-00005-of-00006.safetensors",
"rwkv.blocks.41.attention.ln_x.bias": "model-00005-of-00006.safetensors",
"rwkv.blocks.41.attention.ln_x.weight": "model-00005-of-00006.safetensors",
"rwkv.blocks.41.attention.output.weight": "model-00005-of-00006.safetensors",
"rwkv.blocks.41.attention.receptance.weight": "model-00005-of-00006.safetensors",
"rwkv.blocks.41.attention.time_decay": "model-00005-of-00006.safetensors",
"rwkv.blocks.41.attention.time_faaaa": "model-00005-of-00006.safetensors",
"rwkv.blocks.41.attention.time_mix_gate": "model-00005-of-00006.safetensors",
"rwkv.blocks.41.attention.time_mix_key": "model-00005-of-00006.safetensors",
"rwkv.blocks.41.attention.time_mix_receptance": "model-00005-of-00006.safetensors",
"rwkv.blocks.41.attention.time_mix_value": "model-00005-of-00006.safetensors",
"rwkv.blocks.41.attention.value.weight": "model-00005-of-00006.safetensors",
"rwkv.blocks.41.feed_forward.key.weight": "model-00005-of-00006.safetensors",
"rwkv.blocks.41.feed_forward.receptance.weight": "model-00005-of-00006.safetensors",
"rwkv.blocks.41.feed_forward.time_mix_key": "model-00005-of-00006.safetensors",
"rwkv.blocks.41.feed_forward.time_mix_receptance": "model-00005-of-00006.safetensors",
"rwkv.blocks.41.feed_forward.value.weight": "model-00005-of-00006.safetensors",
"rwkv.blocks.41.ln1.bias": "model-00005-of-00006.safetensors",
"rwkv.blocks.41.ln1.weight": "model-00005-of-00006.safetensors",
"rwkv.blocks.41.ln2.bias": "model-00005-of-00006.safetensors",
"rwkv.blocks.41.ln2.weight": "model-00005-of-00006.safetensors",
"rwkv.blocks.42.attention.gate.weight": "model-00005-of-00006.safetensors",
"rwkv.blocks.42.attention.key.weight": "model-00005-of-00006.safetensors",
"rwkv.blocks.42.attention.ln_x.bias": "model-00005-of-00006.safetensors",
"rwkv.blocks.42.attention.ln_x.weight": "model-00005-of-00006.safetensors",
"rwkv.blocks.42.attention.output.weight": "model-00005-of-00006.safetensors",
"rwkv.blocks.42.attention.receptance.weight": "model-00005-of-00006.safetensors",
"rwkv.blocks.42.attention.time_decay": "model-00005-of-00006.safetensors",
"rwkv.blocks.42.attention.time_faaaa": "model-00005-of-00006.safetensors",
"rwkv.blocks.42.attention.time_mix_gate": "model-00005-of-00006.safetensors",
"rwkv.blocks.42.attention.time_mix_key": "model-00005-of-00006.safetensors",
"rwkv.blocks.42.attention.time_mix_receptance": "model-00005-of-00006.safetensors",
"rwkv.blocks.42.attention.time_mix_value": "model-00005-of-00006.safetensors",
"rwkv.blocks.42.attention.value.weight": "model-00005-of-00006.safetensors",
"rwkv.blocks.42.feed_forward.key.weight": "model-00005-of-00006.safetensors",
"rwkv.blocks.42.feed_forward.receptance.weight": "model-00005-of-00006.safetensors",
"rwkv.blocks.42.feed_forward.time_mix_key": "model-00005-of-00006.safetensors",
"rwkv.blocks.42.feed_forward.time_mix_receptance": "model-00005-of-00006.safetensors",
"rwkv.blocks.42.feed_forward.value.weight": "model-00006-of-00006.safetensors",
"rwkv.blocks.42.ln1.bias": "model-00005-of-00006.safetensors",
"rwkv.blocks.42.ln1.weight": "model-00005-of-00006.safetensors",
"rwkv.blocks.42.ln2.bias": "model-00005-of-00006.safetensors",
"rwkv.blocks.42.ln2.weight": "model-00005-of-00006.safetensors",
"rwkv.blocks.43.attention.gate.weight": "model-00006-of-00006.safetensors",
"rwkv.blocks.43.attention.key.weight": "model-00006-of-00006.safetensors",
"rwkv.blocks.43.attention.ln_x.bias": "model-00006-of-00006.safetensors",
"rwkv.blocks.43.attention.ln_x.weight": "model-00006-of-00006.safetensors",
"rwkv.blocks.43.attention.output.weight": "model-00006-of-00006.safetensors",
"rwkv.blocks.43.attention.receptance.weight": "model-00006-of-00006.safetensors",
"rwkv.blocks.43.attention.time_decay": "model-00006-of-00006.safetensors",
"rwkv.blocks.43.attention.time_faaaa": "model-00006-of-00006.safetensors",
"rwkv.blocks.43.attention.time_mix_gate": "model-00006-of-00006.safetensors",
"rwkv.blocks.43.attention.time_mix_key": "model-00006-of-00006.safetensors",
"rwkv.blocks.43.attention.time_mix_receptance": "model-00006-of-00006.safetensors",
"rwkv.blocks.43.attention.time_mix_value": "model-00006-of-00006.safetensors",
"rwkv.blocks.43.attention.value.weight": "model-00006-of-00006.safetensors",
"rwkv.blocks.43.feed_forward.key.weight": "model-00006-of-00006.safetensors",
"rwkv.blocks.43.feed_forward.receptance.weight": "model-00006-of-00006.safetensors",
"rwkv.blocks.43.feed_forward.time_mix_key": "model-00006-of-00006.safetensors",
"rwkv.blocks.43.feed_forward.time_mix_receptance": "model-00006-of-00006.safetensors",
"rwkv.blocks.43.feed_forward.value.weight": "model-00006-of-00006.safetensors",
"rwkv.blocks.43.ln1.bias": "model-00006-of-00006.safetensors",
"rwkv.blocks.43.ln1.weight": "model-00006-of-00006.safetensors",
"rwkv.blocks.43.ln2.bias": "model-00006-of-00006.safetensors",
"rwkv.blocks.43.ln2.weight": "model-00006-of-00006.safetensors",
"rwkv.blocks.44.attention.gate.weight": "model-00006-of-00006.safetensors",
"rwkv.blocks.44.attention.key.weight": "model-00006-of-00006.safetensors",
"rwkv.blocks.44.attention.ln_x.bias": "model-00006-of-00006.safetensors",
"rwkv.blocks.44.attention.ln_x.weight": "model-00006-of-00006.safetensors",
"rwkv.blocks.44.attention.output.weight": "model-00006-of-00006.safetensors",
"rwkv.blocks.44.attention.receptance.weight": "model-00006-of-00006.safetensors",
"rwkv.blocks.44.attention.time_decay": "model-00006-of-00006.safetensors",
"rwkv.blocks.44.attention.time_faaaa": "model-00006-of-00006.safetensors",
"rwkv.blocks.44.attention.time_mix_gate": "model-00006-of-00006.safetensors",
"rwkv.blocks.44.attention.time_mix_key": "model-00006-of-00006.safetensors",
"rwkv.blocks.44.attention.time_mix_receptance": "model-00006-of-00006.safetensors",
"rwkv.blocks.44.attention.time_mix_value": "model-00006-of-00006.safetensors",
"rwkv.blocks.44.attention.value.weight": "model-00006-of-00006.safetensors",
"rwkv.blocks.44.feed_forward.key.weight": "model-00006-of-00006.safetensors",
"rwkv.blocks.44.feed_forward.receptance.weight": "model-00006-of-00006.safetensors",
"rwkv.blocks.44.feed_forward.time_mix_key": "model-00006-of-00006.safetensors",
"rwkv.blocks.44.feed_forward.time_mix_receptance": "model-00006-of-00006.safetensors",
"rwkv.blocks.44.feed_forward.value.weight": "model-00006-of-00006.safetensors",
"rwkv.blocks.44.ln1.bias": "model-00006-of-00006.safetensors",
"rwkv.blocks.44.ln1.weight": "model-00006-of-00006.safetensors",
"rwkv.blocks.44.ln2.bias": "model-00006-of-00006.safetensors",
"rwkv.blocks.44.ln2.weight": "model-00006-of-00006.safetensors",
"rwkv.blocks.45.attention.gate.weight": "model-00006-of-00006.safetensors",
"rwkv.blocks.45.attention.key.weight": "model-00006-of-00006.safetensors",
"rwkv.blocks.45.attention.ln_x.bias": "model-00006-of-00006.safetensors",
"rwkv.blocks.45.attention.ln_x.weight": "model-00006-of-00006.safetensors",
"rwkv.blocks.45.attention.output.weight": "model-00006-of-00006.safetensors",
"rwkv.blocks.45.attention.receptance.weight": "model-00006-of-00006.safetensors",
"rwkv.blocks.45.attention.time_decay": "model-00006-of-00006.safetensors",
"rwkv.blocks.45.attention.time_faaaa": "model-00006-of-00006.safetensors",
"rwkv.blocks.45.attention.time_mix_gate": "model-00006-of-00006.safetensors",
"rwkv.blocks.45.attention.time_mix_key": "model-00006-of-00006.safetensors",
"rwkv.blocks.45.attention.time_mix_receptance": "model-00006-of-00006.safetensors",
"rwkv.blocks.45.attention.time_mix_value": "model-00006-of-00006.safetensors",
"rwkv.blocks.45.attention.value.weight": "model-00006-of-00006.safetensors",
"rwkv.blocks.45.feed_forward.key.weight": "model-00006-of-00006.safetensors",
"rwkv.blocks.45.feed_forward.receptance.weight": "model-00006-of-00006.safetensors",
"rwkv.blocks.45.feed_forward.time_mix_key": "model-00006-of-00006.safetensors",
"rwkv.blocks.45.feed_forward.time_mix_receptance": "model-00006-of-00006.safetensors",
"rwkv.blocks.45.feed_forward.value.weight": "model-00006-of-00006.safetensors",
"rwkv.blocks.45.ln1.bias": "model-00006-of-00006.safetensors",
"rwkv.blocks.45.ln1.weight": "model-00006-of-00006.safetensors",
"rwkv.blocks.45.ln2.bias": "model-00006-of-00006.safetensors",
"rwkv.blocks.45.ln2.weight": "model-00006-of-00006.safetensors",
"rwkv.blocks.46.attention.gate.weight": "model-00006-of-00006.safetensors",
"rwkv.blocks.46.attention.key.weight": "model-00006-of-00006.safetensors",
"rwkv.blocks.46.attention.ln_x.bias": "model-00006-of-00006.safetensors",
"rwkv.blocks.46.attention.ln_x.weight": "model-00006-of-00006.safetensors",
"rwkv.blocks.46.attention.output.weight": "model-00006-of-00006.safetensors",
"rwkv.blocks.46.attention.receptance.weight": "model-00006-of-00006.safetensors",
"rwkv.blocks.46.attention.time_decay": "model-00006-of-00006.safetensors",
"rwkv.blocks.46.attention.time_faaaa": "model-00006-of-00006.safetensors",
"rwkv.blocks.46.attention.time_mix_gate": "model-00006-of-00006.safetensors",
"rwkv.blocks.46.attention.time_mix_key": "model-00006-of-00006.safetensors",
"rwkv.blocks.46.attention.time_mix_receptance": "model-00006-of-00006.safetensors",
"rwkv.blocks.46.attention.time_mix_value": "model-00006-of-00006.safetensors",
"rwkv.blocks.46.attention.value.weight": "model-00006-of-00006.safetensors",
"rwkv.blocks.46.feed_forward.key.weight": "model-00006-of-00006.safetensors",
"rwkv.blocks.46.feed_forward.receptance.weight": "model-00006-of-00006.safetensors",
"rwkv.blocks.46.feed_forward.time_mix_key": "model-00006-of-00006.safetensors",
"rwkv.blocks.46.feed_forward.time_mix_receptance": "model-00006-of-00006.safetensors",
"rwkv.blocks.46.feed_forward.value.weight": "model-00006-of-00006.safetensors",
"rwkv.blocks.46.ln1.bias": "model-00006-of-00006.safetensors",
"rwkv.blocks.46.ln1.weight": "model-00006-of-00006.safetensors",
"rwkv.blocks.46.ln2.bias": "model-00006-of-00006.safetensors",
"rwkv.blocks.46.ln2.weight": "model-00006-of-00006.safetensors",
"rwkv.blocks.47.attention.gate.weight": "model-00006-of-00006.safetensors",
"rwkv.blocks.47.attention.key.weight": "model-00006-of-00006.safetensors",
"rwkv.blocks.47.attention.ln_x.bias": "model-00006-of-00006.safetensors",
"rwkv.blocks.47.attention.ln_x.weight": "model-00006-of-00006.safetensors",
"rwkv.blocks.47.attention.output.weight": "model-00006-of-00006.safetensors",
"rwkv.blocks.47.attention.receptance.weight": "model-00006-of-00006.safetensors",
"rwkv.blocks.47.attention.time_decay": "model-00006-of-00006.safetensors",
"rwkv.blocks.47.attention.time_faaaa": "model-00006-of-00006.safetensors",
"rwkv.blocks.47.attention.time_mix_gate": "model-00006-of-00006.safetensors",
"rwkv.blocks.47.attention.time_mix_key": "model-00006-of-00006.safetensors",
"rwkv.blocks.47.attention.time_mix_receptance": "model-00006-of-00006.safetensors",
"rwkv.blocks.47.attention.time_mix_value": "model-00006-of-00006.safetensors",
"rwkv.blocks.47.attention.value.weight": "model-00006-of-00006.safetensors",
"rwkv.blocks.47.feed_forward.key.weight": "model-00006-of-00006.safetensors",
"rwkv.blocks.47.feed_forward.receptance.weight": "model-00006-of-00006.safetensors",
"rwkv.blocks.47.feed_forward.time_mix_key": "model-00006-of-00006.safetensors",
"rwkv.blocks.47.feed_forward.time_mix_receptance": "model-00006-of-00006.safetensors",
"rwkv.blocks.47.feed_forward.value.weight": "model-00006-of-00006.safetensors",
"rwkv.blocks.47.ln1.bias": "model-00006-of-00006.safetensors",
"rwkv.blocks.47.ln1.weight": "model-00006-of-00006.safetensors",
"rwkv.blocks.47.ln2.bias": "model-00006-of-00006.safetensors",
"rwkv.blocks.47.ln2.weight": "model-00006-of-00006.safetensors",
"rwkv.blocks.5.attention.gate.weight": "model-00001-of-00006.safetensors",
"rwkv.blocks.5.attention.key.weight": "model-00001-of-00006.safetensors",
"rwkv.blocks.5.attention.ln_x.bias": "model-00001-of-00006.safetensors",
"rwkv.blocks.5.attention.ln_x.weight": "model-00001-of-00006.safetensors",
"rwkv.blocks.5.attention.output.weight": "model-00001-of-00006.safetensors",
"rwkv.blocks.5.attention.receptance.weight": "model-00001-of-00006.safetensors",
"rwkv.blocks.5.attention.time_decay": "model-00001-of-00006.safetensors",
"rwkv.blocks.5.attention.time_faaaa": "model-00001-of-00006.safetensors",
"rwkv.blocks.5.attention.time_mix_gate": "model-00001-of-00006.safetensors",
"rwkv.blocks.5.attention.time_mix_key": "model-00001-of-00006.safetensors",
"rwkv.blocks.5.attention.time_mix_receptance": "model-00001-of-00006.safetensors",
"rwkv.blocks.5.attention.time_mix_value": "model-00001-of-00006.safetensors",
"rwkv.blocks.5.attention.value.weight": "model-00001-of-00006.safetensors",
"rwkv.blocks.5.feed_forward.key.weight": "model-00001-of-00006.safetensors",
"rwkv.blocks.5.feed_forward.receptance.weight": "model-00001-of-00006.safetensors",
"rwkv.blocks.5.feed_forward.time_mix_key": "model-00001-of-00006.safetensors",
"rwkv.blocks.5.feed_forward.time_mix_receptance": "model-00001-of-00006.safetensors",
"rwkv.blocks.5.feed_forward.value.weight": "model-00001-of-00006.safetensors",
"rwkv.blocks.5.ln1.bias": "model-00001-of-00006.safetensors",
"rwkv.blocks.5.ln1.weight": "model-00001-of-00006.safetensors",
"rwkv.blocks.5.ln2.bias": "model-00001-of-00006.safetensors",
"rwkv.blocks.5.ln2.weight": "model-00001-of-00006.safetensors",
"rwkv.blocks.6.attention.gate.weight": "model-00001-of-00006.safetensors",
"rwkv.blocks.6.attention.key.weight": "model-00001-of-00006.safetensors",
"rwkv.blocks.6.attention.ln_x.bias": "model-00001-of-00006.safetensors",
"rwkv.blocks.6.attention.ln_x.weight": "model-00001-of-00006.safetensors",
"rwkv.blocks.6.attention.output.weight": "model-00001-of-00006.safetensors",
"rwkv.blocks.6.attention.receptance.weight": "model-00001-of-00006.safetensors",
"rwkv.blocks.6.attention.time_decay": "model-00001-of-00006.safetensors",
"rwkv.blocks.6.attention.time_faaaa": "model-00001-of-00006.safetensors",
"rwkv.blocks.6.attention.time_mix_gate": "model-00001-of-00006.safetensors",
"rwkv.blocks.6.attention.time_mix_key": "model-00001-of-00006.safetensors",
"rwkv.blocks.6.attention.time_mix_receptance": "model-00001-of-00006.safetensors",
"rwkv.blocks.6.attention.time_mix_value": "model-00001-of-00006.safetensors",
"rwkv.blocks.6.attention.value.weight": "model-00001-of-00006.safetensors",
"rwkv.blocks.6.feed_forward.key.weight": "model-00001-of-00006.safetensors",
"rwkv.blocks.6.feed_forward.receptance.weight": "model-00002-of-00006.safetensors",
"rwkv.blocks.6.feed_forward.time_mix_key": "model-00001-of-00006.safetensors",
"rwkv.blocks.6.feed_forward.time_mix_receptance": "model-00001-of-00006.safetensors",
"rwkv.blocks.6.feed_forward.value.weight": "model-00002-of-00006.safetensors",
"rwkv.blocks.6.ln1.bias": "model-00001-of-00006.safetensors",
"rwkv.blocks.6.ln1.weight": "model-00001-of-00006.safetensors",
"rwkv.blocks.6.ln2.bias": "model-00001-of-00006.safetensors",
"rwkv.blocks.6.ln2.weight": "model-00001-of-00006.safetensors",
"rwkv.blocks.7.attention.gate.weight": "model-00002-of-00006.safetensors",
"rwkv.blocks.7.attention.key.weight": "model-00002-of-00006.safetensors",
"rwkv.blocks.7.attention.ln_x.bias": "model-00002-of-00006.safetensors",
"rwkv.blocks.7.attention.ln_x.weight": "model-00002-of-00006.safetensors",
"rwkv.blocks.7.attention.output.weight": "model-00002-of-00006.safetensors",
"rwkv.blocks.7.attention.receptance.weight": "model-00002-of-00006.safetensors",
"rwkv.blocks.7.attention.time_decay": "model-00002-of-00006.safetensors",
"rwkv.blocks.7.attention.time_faaaa": "model-00002-of-00006.safetensors",
"rwkv.blocks.7.attention.time_mix_gate": "model-00002-of-00006.safetensors",
"rwkv.blocks.7.attention.time_mix_key": "model-00002-of-00006.safetensors",
"rwkv.blocks.7.attention.time_mix_receptance": "model-00002-of-00006.safetensors",
"rwkv.blocks.7.attention.time_mix_value": "model-00002-of-00006.safetensors",
"rwkv.blocks.7.attention.value.weight": "model-00002-of-00006.safetensors",
"rwkv.blocks.7.feed_forward.key.weight": "model-00002-of-00006.safetensors",
"rwkv.blocks.7.feed_forward.receptance.weight": "model-00002-of-00006.safetensors",
"rwkv.blocks.7.feed_forward.time_mix_key": "model-00002-of-00006.safetensors",
"rwkv.blocks.7.feed_forward.time_mix_receptance": "model-00002-of-00006.safetensors",
"rwkv.blocks.7.feed_forward.value.weight": "model-00002-of-00006.safetensors",
"rwkv.blocks.7.ln1.bias": "model-00002-of-00006.safetensors",
"rwkv.blocks.7.ln1.weight": "model-00002-of-00006.safetensors",
"rwkv.blocks.7.ln2.bias": "model-00002-of-00006.safetensors",
"rwkv.blocks.7.ln2.weight": "model-00002-of-00006.safetensors",
"rwkv.blocks.8.attention.gate.weight": "model-00002-of-00006.safetensors",
"rwkv.blocks.8.attention.key.weight": "model-00002-of-00006.safetensors",
"rwkv.blocks.8.attention.ln_x.bias": "model-00002-of-00006.safetensors",
"rwkv.blocks.8.attention.ln_x.weight": "model-00002-of-00006.safetensors",
"rwkv.blocks.8.attention.output.weight": "model-00002-of-00006.safetensors",
"rwkv.blocks.8.attention.receptance.weight": "model-00002-of-00006.safetensors",
"rwkv.blocks.8.attention.time_decay": "model-00002-of-00006.safetensors",
"rwkv.blocks.8.attention.time_faaaa": "model-00002-of-00006.safetensors",
"rwkv.blocks.8.attention.time_mix_gate": "model-00002-of-00006.safetensors",
"rwkv.blocks.8.attention.time_mix_key": "model-00002-of-00006.safetensors",
"rwkv.blocks.8.attention.time_mix_receptance": "model-00002-of-00006.safetensors",
"rwkv.blocks.8.attention.time_mix_value": "model-00002-of-00006.safetensors",
"rwkv.blocks.8.attention.value.weight": "model-00002-of-00006.safetensors",
"rwkv.blocks.8.feed_forward.key.weight": "model-00002-of-00006.safetensors",
"rwkv.blocks.8.feed_forward.receptance.weight": "model-00002-of-00006.safetensors",
"rwkv.blocks.8.feed_forward.time_mix_key": "model-00002-of-00006.safetensors",
"rwkv.blocks.8.feed_forward.time_mix_receptance": "model-00002-of-00006.safetensors",
"rwkv.blocks.8.feed_forward.value.weight": "model-00002-of-00006.safetensors",
"rwkv.blocks.8.ln1.bias": "model-00002-of-00006.safetensors",
"rwkv.blocks.8.ln1.weight": "model-00002-of-00006.safetensors",
"rwkv.blocks.8.ln2.bias": "model-00002-of-00006.safetensors",
"rwkv.blocks.8.ln2.weight": "model-00002-of-00006.safetensors",
"rwkv.blocks.9.attention.gate.weight": "model-00002-of-00006.safetensors",
"rwkv.blocks.9.attention.key.weight": "model-00002-of-00006.safetensors",
"rwkv.blocks.9.attention.ln_x.bias": "model-00002-of-00006.safetensors",
"rwkv.blocks.9.attention.ln_x.weight": "model-00002-of-00006.safetensors",
"rwkv.blocks.9.attention.output.weight": "model-00002-of-00006.safetensors",
"rwkv.blocks.9.attention.receptance.weight": "model-00002-of-00006.safetensors",
"rwkv.blocks.9.attention.time_decay": "model-00002-of-00006.safetensors",
"rwkv.blocks.9.attention.time_faaaa": "model-00002-of-00006.safetensors",
"rwkv.blocks.9.attention.time_mix_gate": "model-00002-of-00006.safetensors",
"rwkv.blocks.9.attention.time_mix_key": "model-00002-of-00006.safetensors",
"rwkv.blocks.9.attention.time_mix_receptance": "model-00002-of-00006.safetensors",
"rwkv.blocks.9.attention.time_mix_value": "model-00002-of-00006.safetensors",
"rwkv.blocks.9.attention.value.weight": "model-00002-of-00006.safetensors",
"rwkv.blocks.9.feed_forward.key.weight": "model-00002-of-00006.safetensors",
"rwkv.blocks.9.feed_forward.receptance.weight": "model-00002-of-00006.safetensors",
"rwkv.blocks.9.feed_forward.time_mix_key": "model-00002-of-00006.safetensors",
"rwkv.blocks.9.feed_forward.time_mix_receptance": "model-00002-of-00006.safetensors",
"rwkv.blocks.9.feed_forward.value.weight": "model-00002-of-00006.safetensors",
"rwkv.blocks.9.ln1.bias": "model-00002-of-00006.safetensors",
"rwkv.blocks.9.ln1.weight": "model-00002-of-00006.safetensors",
"rwkv.blocks.9.ln2.bias": "model-00002-of-00006.safetensors",
"rwkv.blocks.9.ln2.weight": "model-00002-of-00006.safetensors",
"rwkv.embeddings.weight": "model-00001-of-00006.safetensors",
"rwkv.ln_out.bias": "model-00006-of-00006.safetensors",
"rwkv.ln_out.weight": "model-00006-of-00006.safetensors"
}
}