130M_Seshu / model.safetensors.index.json
yashwardhan20417's picture
Upload MambaForCausalLM
899c998 verified
{
"metadata": {
"total_size": 10763315200
},
"weight_map": {
"model.embedding.weight": "model-00001-of-00003.safetensors",
"model.layers.0.A_log": "model-00001-of-00003.safetensors",
"model.layers.0.D": "model-00001-of-00003.safetensors",
"model.layers.0.conv1d.bias": "model-00001-of-00003.safetensors",
"model.layers.0.conv1d.weight": "model-00001-of-00003.safetensors",
"model.layers.0.dt_proj.bias": "model-00001-of-00003.safetensors",
"model.layers.0.dt_proj.weight": "model-00001-of-00003.safetensors",
"model.layers.0.in_proj.weight": "model-00001-of-00003.safetensors",
"model.layers.0.norm.weight": "model-00001-of-00003.safetensors",
"model.layers.0.out_proj.weight": "model-00001-of-00003.safetensors",
"model.layers.0.x_proj.weight": "model-00001-of-00003.safetensors",
"model.layers.1.A_log": "model-00001-of-00003.safetensors",
"model.layers.1.D": "model-00001-of-00003.safetensors",
"model.layers.1.conv1d.bias": "model-00001-of-00003.safetensors",
"model.layers.1.conv1d.weight": "model-00001-of-00003.safetensors",
"model.layers.1.dt_proj.bias": "model-00001-of-00003.safetensors",
"model.layers.1.dt_proj.weight": "model-00001-of-00003.safetensors",
"model.layers.1.in_proj.weight": "model-00001-of-00003.safetensors",
"model.layers.1.norm.weight": "model-00001-of-00003.safetensors",
"model.layers.1.out_proj.weight": "model-00001-of-00003.safetensors",
"model.layers.1.x_proj.weight": "model-00001-of-00003.safetensors",
"model.layers.10.A_log": "model-00001-of-00003.safetensors",
"model.layers.10.D": "model-00001-of-00003.safetensors",
"model.layers.10.conv1d.bias": "model-00001-of-00003.safetensors",
"model.layers.10.conv1d.weight": "model-00001-of-00003.safetensors",
"model.layers.10.dt_proj.bias": "model-00001-of-00003.safetensors",
"model.layers.10.dt_proj.weight": "model-00001-of-00003.safetensors",
"model.layers.10.in_proj.weight": "model-00001-of-00003.safetensors",
"model.layers.10.norm.weight": "model-00001-of-00003.safetensors",
"model.layers.10.out_proj.weight": "model-00001-of-00003.safetensors",
"model.layers.10.x_proj.weight": "model-00001-of-00003.safetensors",
"model.layers.11.A_log": "model-00001-of-00003.safetensors",
"model.layers.11.D": "model-00001-of-00003.safetensors",
"model.layers.11.conv1d.bias": "model-00001-of-00003.safetensors",
"model.layers.11.conv1d.weight": "model-00001-of-00003.safetensors",
"model.layers.11.dt_proj.bias": "model-00001-of-00003.safetensors",
"model.layers.11.dt_proj.weight": "model-00001-of-00003.safetensors",
"model.layers.11.in_proj.weight": "model-00001-of-00003.safetensors",
"model.layers.11.norm.weight": "model-00001-of-00003.safetensors",
"model.layers.11.out_proj.weight": "model-00001-of-00003.safetensors",
"model.layers.11.x_proj.weight": "model-00001-of-00003.safetensors",
"model.layers.12.A_log": "model-00001-of-00003.safetensors",
"model.layers.12.D": "model-00001-of-00003.safetensors",
"model.layers.12.conv1d.bias": "model-00001-of-00003.safetensors",
"model.layers.12.conv1d.weight": "model-00001-of-00003.safetensors",
"model.layers.12.dt_proj.bias": "model-00001-of-00003.safetensors",
"model.layers.12.dt_proj.weight": "model-00001-of-00003.safetensors",
"model.layers.12.in_proj.weight": "model-00001-of-00003.safetensors",
"model.layers.12.norm.weight": "model-00001-of-00003.safetensors",
"model.layers.12.out_proj.weight": "model-00001-of-00003.safetensors",
"model.layers.12.x_proj.weight": "model-00001-of-00003.safetensors",
"model.layers.13.A_log": "model-00001-of-00003.safetensors",
"model.layers.13.D": "model-00001-of-00003.safetensors",
"model.layers.13.conv1d.bias": "model-00001-of-00003.safetensors",
"model.layers.13.conv1d.weight": "model-00001-of-00003.safetensors",
"model.layers.13.dt_proj.bias": "model-00001-of-00003.safetensors",
"model.layers.13.dt_proj.weight": "model-00001-of-00003.safetensors",
"model.layers.13.in_proj.weight": "model-00001-of-00003.safetensors",
"model.layers.13.norm.weight": "model-00001-of-00003.safetensors",
"model.layers.13.out_proj.weight": "model-00001-of-00003.safetensors",
"model.layers.13.x_proj.weight": "model-00001-of-00003.safetensors",
"model.layers.14.A_log": "model-00001-of-00003.safetensors",
"model.layers.14.D": "model-00001-of-00003.safetensors",
"model.layers.14.conv1d.bias": "model-00001-of-00003.safetensors",
"model.layers.14.conv1d.weight": "model-00001-of-00003.safetensors",
"model.layers.14.dt_proj.bias": "model-00001-of-00003.safetensors",
"model.layers.14.dt_proj.weight": "model-00001-of-00003.safetensors",
"model.layers.14.in_proj.weight": "model-00001-of-00003.safetensors",
"model.layers.14.norm.weight": "model-00001-of-00003.safetensors",
"model.layers.14.out_proj.weight": "model-00001-of-00003.safetensors",
"model.layers.14.x_proj.weight": "model-00001-of-00003.safetensors",
"model.layers.15.A_log": "model-00001-of-00003.safetensors",
"model.layers.15.D": "model-00001-of-00003.safetensors",
"model.layers.15.conv1d.bias": "model-00001-of-00003.safetensors",
"model.layers.15.conv1d.weight": "model-00001-of-00003.safetensors",
"model.layers.15.dt_proj.bias": "model-00001-of-00003.safetensors",
"model.layers.15.dt_proj.weight": "model-00001-of-00003.safetensors",
"model.layers.15.in_proj.weight": "model-00001-of-00003.safetensors",
"model.layers.15.norm.weight": "model-00001-of-00003.safetensors",
"model.layers.15.out_proj.weight": "model-00001-of-00003.safetensors",
"model.layers.15.x_proj.weight": "model-00001-of-00003.safetensors",
"model.layers.16.A_log": "model-00001-of-00003.safetensors",
"model.layers.16.D": "model-00001-of-00003.safetensors",
"model.layers.16.conv1d.bias": "model-00001-of-00003.safetensors",
"model.layers.16.conv1d.weight": "model-00001-of-00003.safetensors",
"model.layers.16.dt_proj.bias": "model-00001-of-00003.safetensors",
"model.layers.16.dt_proj.weight": "model-00001-of-00003.safetensors",
"model.layers.16.in_proj.weight": "model-00001-of-00003.safetensors",
"model.layers.16.norm.weight": "model-00001-of-00003.safetensors",
"model.layers.16.out_proj.weight": "model-00001-of-00003.safetensors",
"model.layers.16.x_proj.weight": "model-00001-of-00003.safetensors",
"model.layers.17.A_log": "model-00001-of-00003.safetensors",
"model.layers.17.D": "model-00001-of-00003.safetensors",
"model.layers.17.conv1d.bias": "model-00001-of-00003.safetensors",
"model.layers.17.conv1d.weight": "model-00001-of-00003.safetensors",
"model.layers.17.dt_proj.bias": "model-00001-of-00003.safetensors",
"model.layers.17.dt_proj.weight": "model-00001-of-00003.safetensors",
"model.layers.17.in_proj.weight": "model-00001-of-00003.safetensors",
"model.layers.17.norm.weight": "model-00001-of-00003.safetensors",
"model.layers.17.out_proj.weight": "model-00001-of-00003.safetensors",
"model.layers.17.x_proj.weight": "model-00001-of-00003.safetensors",
"model.layers.18.A_log": "model-00001-of-00003.safetensors",
"model.layers.18.D": "model-00001-of-00003.safetensors",
"model.layers.18.conv1d.bias": "model-00001-of-00003.safetensors",
"model.layers.18.conv1d.weight": "model-00001-of-00003.safetensors",
"model.layers.18.dt_proj.bias": "model-00001-of-00003.safetensors",
"model.layers.18.dt_proj.weight": "model-00001-of-00003.safetensors",
"model.layers.18.in_proj.weight": "model-00001-of-00003.safetensors",
"model.layers.18.norm.weight": "model-00001-of-00003.safetensors",
"model.layers.18.out_proj.weight": "model-00001-of-00003.safetensors",
"model.layers.18.x_proj.weight": "model-00001-of-00003.safetensors",
"model.layers.19.A_log": "model-00001-of-00003.safetensors",
"model.layers.19.D": "model-00001-of-00003.safetensors",
"model.layers.19.conv1d.bias": "model-00001-of-00003.safetensors",
"model.layers.19.conv1d.weight": "model-00001-of-00003.safetensors",
"model.layers.19.dt_proj.bias": "model-00001-of-00003.safetensors",
"model.layers.19.dt_proj.weight": "model-00001-of-00003.safetensors",
"model.layers.19.in_proj.weight": "model-00001-of-00003.safetensors",
"model.layers.19.norm.weight": "model-00001-of-00003.safetensors",
"model.layers.19.out_proj.weight": "model-00001-of-00003.safetensors",
"model.layers.19.x_proj.weight": "model-00001-of-00003.safetensors",
"model.layers.2.A_log": "model-00001-of-00003.safetensors",
"model.layers.2.D": "model-00001-of-00003.safetensors",
"model.layers.2.conv1d.bias": "model-00001-of-00003.safetensors",
"model.layers.2.conv1d.weight": "model-00001-of-00003.safetensors",
"model.layers.2.dt_proj.bias": "model-00001-of-00003.safetensors",
"model.layers.2.dt_proj.weight": "model-00001-of-00003.safetensors",
"model.layers.2.in_proj.weight": "model-00001-of-00003.safetensors",
"model.layers.2.norm.weight": "model-00001-of-00003.safetensors",
"model.layers.2.out_proj.weight": "model-00001-of-00003.safetensors",
"model.layers.2.x_proj.weight": "model-00001-of-00003.safetensors",
"model.layers.20.A_log": "model-00001-of-00003.safetensors",
"model.layers.20.D": "model-00001-of-00003.safetensors",
"model.layers.20.conv1d.bias": "model-00001-of-00003.safetensors",
"model.layers.20.conv1d.weight": "model-00001-of-00003.safetensors",
"model.layers.20.dt_proj.bias": "model-00001-of-00003.safetensors",
"model.layers.20.dt_proj.weight": "model-00001-of-00003.safetensors",
"model.layers.20.in_proj.weight": "model-00001-of-00003.safetensors",
"model.layers.20.norm.weight": "model-00001-of-00003.safetensors",
"model.layers.20.out_proj.weight": "model-00001-of-00003.safetensors",
"model.layers.20.x_proj.weight": "model-00001-of-00003.safetensors",
"model.layers.21.A_log": "model-00001-of-00003.safetensors",
"model.layers.21.D": "model-00001-of-00003.safetensors",
"model.layers.21.conv1d.bias": "model-00001-of-00003.safetensors",
"model.layers.21.conv1d.weight": "model-00001-of-00003.safetensors",
"model.layers.21.dt_proj.bias": "model-00001-of-00003.safetensors",
"model.layers.21.dt_proj.weight": "model-00001-of-00003.safetensors",
"model.layers.21.in_proj.weight": "model-00001-of-00003.safetensors",
"model.layers.21.norm.weight": "model-00001-of-00003.safetensors",
"model.layers.21.out_proj.weight": "model-00001-of-00003.safetensors",
"model.layers.21.x_proj.weight": "model-00001-of-00003.safetensors",
"model.layers.22.A_log": "model-00001-of-00003.safetensors",
"model.layers.22.D": "model-00001-of-00003.safetensors",
"model.layers.22.conv1d.bias": "model-00001-of-00003.safetensors",
"model.layers.22.conv1d.weight": "model-00001-of-00003.safetensors",
"model.layers.22.dt_proj.bias": "model-00001-of-00003.safetensors",
"model.layers.22.dt_proj.weight": "model-00001-of-00003.safetensors",
"model.layers.22.in_proj.weight": "model-00001-of-00003.safetensors",
"model.layers.22.norm.weight": "model-00001-of-00003.safetensors",
"model.layers.22.out_proj.weight": "model-00001-of-00003.safetensors",
"model.layers.22.x_proj.weight": "model-00001-of-00003.safetensors",
"model.layers.23.A_log": "model-00001-of-00003.safetensors",
"model.layers.23.D": "model-00001-of-00003.safetensors",
"model.layers.23.conv1d.bias": "model-00001-of-00003.safetensors",
"model.layers.23.conv1d.weight": "model-00001-of-00003.safetensors",
"model.layers.23.dt_proj.bias": "model-00001-of-00003.safetensors",
"model.layers.23.dt_proj.weight": "model-00001-of-00003.safetensors",
"model.layers.23.in_proj.weight": "model-00001-of-00003.safetensors",
"model.layers.23.norm.weight": "model-00001-of-00003.safetensors",
"model.layers.23.out_proj.weight": "model-00001-of-00003.safetensors",
"model.layers.23.x_proj.weight": "model-00001-of-00003.safetensors",
"model.layers.24.A_log": "model-00001-of-00003.safetensors",
"model.layers.24.D": "model-00001-of-00003.safetensors",
"model.layers.24.conv1d.bias": "model-00001-of-00003.safetensors",
"model.layers.24.conv1d.weight": "model-00001-of-00003.safetensors",
"model.layers.24.dt_proj.bias": "model-00001-of-00003.safetensors",
"model.layers.24.dt_proj.weight": "model-00001-of-00003.safetensors",
"model.layers.24.in_proj.weight": "model-00001-of-00003.safetensors",
"model.layers.24.norm.weight": "model-00001-of-00003.safetensors",
"model.layers.24.out_proj.weight": "model-00001-of-00003.safetensors",
"model.layers.24.x_proj.weight": "model-00001-of-00003.safetensors",
"model.layers.25.A_log": "model-00001-of-00003.safetensors",
"model.layers.25.D": "model-00001-of-00003.safetensors",
"model.layers.25.conv1d.bias": "model-00001-of-00003.safetensors",
"model.layers.25.conv1d.weight": "model-00001-of-00003.safetensors",
"model.layers.25.dt_proj.bias": "model-00001-of-00003.safetensors",
"model.layers.25.dt_proj.weight": "model-00001-of-00003.safetensors",
"model.layers.25.in_proj.weight": "model-00001-of-00003.safetensors",
"model.layers.25.norm.weight": "model-00001-of-00003.safetensors",
"model.layers.25.out_proj.weight": "model-00001-of-00003.safetensors",
"model.layers.25.x_proj.weight": "model-00001-of-00003.safetensors",
"model.layers.26.A_log": "model-00001-of-00003.safetensors",
"model.layers.26.D": "model-00001-of-00003.safetensors",
"model.layers.26.conv1d.bias": "model-00001-of-00003.safetensors",
"model.layers.26.conv1d.weight": "model-00001-of-00003.safetensors",
"model.layers.26.dt_proj.bias": "model-00001-of-00003.safetensors",
"model.layers.26.dt_proj.weight": "model-00001-of-00003.safetensors",
"model.layers.26.in_proj.weight": "model-00001-of-00003.safetensors",
"model.layers.26.norm.weight": "model-00001-of-00003.safetensors",
"model.layers.26.out_proj.weight": "model-00001-of-00003.safetensors",
"model.layers.26.x_proj.weight": "model-00001-of-00003.safetensors",
"model.layers.27.A_log": "model-00001-of-00003.safetensors",
"model.layers.27.D": "model-00001-of-00003.safetensors",
"model.layers.27.conv1d.bias": "model-00001-of-00003.safetensors",
"model.layers.27.conv1d.weight": "model-00001-of-00003.safetensors",
"model.layers.27.dt_proj.bias": "model-00001-of-00003.safetensors",
"model.layers.27.dt_proj.weight": "model-00001-of-00003.safetensors",
"model.layers.27.in_proj.weight": "model-00001-of-00003.safetensors",
"model.layers.27.norm.weight": "model-00001-of-00003.safetensors",
"model.layers.27.out_proj.weight": "model-00001-of-00003.safetensors",
"model.layers.27.x_proj.weight": "model-00001-of-00003.safetensors",
"model.layers.28.A_log": "model-00001-of-00003.safetensors",
"model.layers.28.D": "model-00001-of-00003.safetensors",
"model.layers.28.conv1d.bias": "model-00001-of-00003.safetensors",
"model.layers.28.conv1d.weight": "model-00001-of-00003.safetensors",
"model.layers.28.dt_proj.bias": "model-00001-of-00003.safetensors",
"model.layers.28.dt_proj.weight": "model-00001-of-00003.safetensors",
"model.layers.28.in_proj.weight": "model-00001-of-00003.safetensors",
"model.layers.28.norm.weight": "model-00001-of-00003.safetensors",
"model.layers.28.out_proj.weight": "model-00001-of-00003.safetensors",
"model.layers.28.x_proj.weight": "model-00001-of-00003.safetensors",
"model.layers.29.A_log": "model-00001-of-00003.safetensors",
"model.layers.29.D": "model-00001-of-00003.safetensors",
"model.layers.29.conv1d.bias": "model-00002-of-00003.safetensors",
"model.layers.29.conv1d.weight": "model-00002-of-00003.safetensors",
"model.layers.29.dt_proj.bias": "model-00002-of-00003.safetensors",
"model.layers.29.dt_proj.weight": "model-00002-of-00003.safetensors",
"model.layers.29.in_proj.weight": "model-00002-of-00003.safetensors",
"model.layers.29.norm.weight": "model-00002-of-00003.safetensors",
"model.layers.29.out_proj.weight": "model-00002-of-00003.safetensors",
"model.layers.29.x_proj.weight": "model-00002-of-00003.safetensors",
"model.layers.3.A_log": "model-00001-of-00003.safetensors",
"model.layers.3.D": "model-00001-of-00003.safetensors",
"model.layers.3.conv1d.bias": "model-00001-of-00003.safetensors",
"model.layers.3.conv1d.weight": "model-00001-of-00003.safetensors",
"model.layers.3.dt_proj.bias": "model-00001-of-00003.safetensors",
"model.layers.3.dt_proj.weight": "model-00001-of-00003.safetensors",
"model.layers.3.in_proj.weight": "model-00001-of-00003.safetensors",
"model.layers.3.norm.weight": "model-00001-of-00003.safetensors",
"model.layers.3.out_proj.weight": "model-00001-of-00003.safetensors",
"model.layers.3.x_proj.weight": "model-00001-of-00003.safetensors",
"model.layers.30.A_log": "model-00002-of-00003.safetensors",
"model.layers.30.D": "model-00002-of-00003.safetensors",
"model.layers.30.conv1d.bias": "model-00002-of-00003.safetensors",
"model.layers.30.conv1d.weight": "model-00002-of-00003.safetensors",
"model.layers.30.dt_proj.bias": "model-00002-of-00003.safetensors",
"model.layers.30.dt_proj.weight": "model-00002-of-00003.safetensors",
"model.layers.30.in_proj.weight": "model-00002-of-00003.safetensors",
"model.layers.30.norm.weight": "model-00002-of-00003.safetensors",
"model.layers.30.out_proj.weight": "model-00002-of-00003.safetensors",
"model.layers.30.x_proj.weight": "model-00002-of-00003.safetensors",
"model.layers.31.A_log": "model-00002-of-00003.safetensors",
"model.layers.31.D": "model-00002-of-00003.safetensors",
"model.layers.31.conv1d.bias": "model-00002-of-00003.safetensors",
"model.layers.31.conv1d.weight": "model-00002-of-00003.safetensors",
"model.layers.31.dt_proj.bias": "model-00002-of-00003.safetensors",
"model.layers.31.dt_proj.weight": "model-00002-of-00003.safetensors",
"model.layers.31.in_proj.weight": "model-00002-of-00003.safetensors",
"model.layers.31.norm.weight": "model-00002-of-00003.safetensors",
"model.layers.31.out_proj.weight": "model-00002-of-00003.safetensors",
"model.layers.31.x_proj.weight": "model-00002-of-00003.safetensors",
"model.layers.32.A_log": "model-00002-of-00003.safetensors",
"model.layers.32.D": "model-00002-of-00003.safetensors",
"model.layers.32.conv1d.bias": "model-00002-of-00003.safetensors",
"model.layers.32.conv1d.weight": "model-00002-of-00003.safetensors",
"model.layers.32.dt_proj.bias": "model-00002-of-00003.safetensors",
"model.layers.32.dt_proj.weight": "model-00002-of-00003.safetensors",
"model.layers.32.in_proj.weight": "model-00002-of-00003.safetensors",
"model.layers.32.norm.weight": "model-00002-of-00003.safetensors",
"model.layers.32.out_proj.weight": "model-00002-of-00003.safetensors",
"model.layers.32.x_proj.weight": "model-00002-of-00003.safetensors",
"model.layers.33.A_log": "model-00002-of-00003.safetensors",
"model.layers.33.D": "model-00002-of-00003.safetensors",
"model.layers.33.conv1d.bias": "model-00002-of-00003.safetensors",
"model.layers.33.conv1d.weight": "model-00002-of-00003.safetensors",
"model.layers.33.dt_proj.bias": "model-00002-of-00003.safetensors",
"model.layers.33.dt_proj.weight": "model-00002-of-00003.safetensors",
"model.layers.33.in_proj.weight": "model-00002-of-00003.safetensors",
"model.layers.33.norm.weight": "model-00002-of-00003.safetensors",
"model.layers.33.out_proj.weight": "model-00002-of-00003.safetensors",
"model.layers.33.x_proj.weight": "model-00002-of-00003.safetensors",
"model.layers.34.A_log": "model-00002-of-00003.safetensors",
"model.layers.34.D": "model-00002-of-00003.safetensors",
"model.layers.34.conv1d.bias": "model-00002-of-00003.safetensors",
"model.layers.34.conv1d.weight": "model-00002-of-00003.safetensors",
"model.layers.34.dt_proj.bias": "model-00002-of-00003.safetensors",
"model.layers.34.dt_proj.weight": "model-00002-of-00003.safetensors",
"model.layers.34.in_proj.weight": "model-00002-of-00003.safetensors",
"model.layers.34.norm.weight": "model-00002-of-00003.safetensors",
"model.layers.34.out_proj.weight": "model-00002-of-00003.safetensors",
"model.layers.34.x_proj.weight": "model-00002-of-00003.safetensors",
"model.layers.35.A_log": "model-00002-of-00003.safetensors",
"model.layers.35.D": "model-00002-of-00003.safetensors",
"model.layers.35.conv1d.bias": "model-00002-of-00003.safetensors",
"model.layers.35.conv1d.weight": "model-00002-of-00003.safetensors",
"model.layers.35.dt_proj.bias": "model-00002-of-00003.safetensors",
"model.layers.35.dt_proj.weight": "model-00002-of-00003.safetensors",
"model.layers.35.in_proj.weight": "model-00002-of-00003.safetensors",
"model.layers.35.norm.weight": "model-00002-of-00003.safetensors",
"model.layers.35.out_proj.weight": "model-00002-of-00003.safetensors",
"model.layers.35.x_proj.weight": "model-00002-of-00003.safetensors",
"model.layers.36.A_log": "model-00002-of-00003.safetensors",
"model.layers.36.D": "model-00002-of-00003.safetensors",
"model.layers.36.conv1d.bias": "model-00002-of-00003.safetensors",
"model.layers.36.conv1d.weight": "model-00002-of-00003.safetensors",
"model.layers.36.dt_proj.bias": "model-00002-of-00003.safetensors",
"model.layers.36.dt_proj.weight": "model-00002-of-00003.safetensors",
"model.layers.36.in_proj.weight": "model-00002-of-00003.safetensors",
"model.layers.36.norm.weight": "model-00002-of-00003.safetensors",
"model.layers.36.out_proj.weight": "model-00002-of-00003.safetensors",
"model.layers.36.x_proj.weight": "model-00002-of-00003.safetensors",
"model.layers.37.A_log": "model-00002-of-00003.safetensors",
"model.layers.37.D": "model-00002-of-00003.safetensors",
"model.layers.37.conv1d.bias": "model-00002-of-00003.safetensors",
"model.layers.37.conv1d.weight": "model-00002-of-00003.safetensors",
"model.layers.37.dt_proj.bias": "model-00002-of-00003.safetensors",
"model.layers.37.dt_proj.weight": "model-00002-of-00003.safetensors",
"model.layers.37.in_proj.weight": "model-00002-of-00003.safetensors",
"model.layers.37.norm.weight": "model-00002-of-00003.safetensors",
"model.layers.37.out_proj.weight": "model-00002-of-00003.safetensors",
"model.layers.37.x_proj.weight": "model-00002-of-00003.safetensors",
"model.layers.38.A_log": "model-00002-of-00003.safetensors",
"model.layers.38.D": "model-00002-of-00003.safetensors",
"model.layers.38.conv1d.bias": "model-00002-of-00003.safetensors",
"model.layers.38.conv1d.weight": "model-00002-of-00003.safetensors",
"model.layers.38.dt_proj.bias": "model-00002-of-00003.safetensors",
"model.layers.38.dt_proj.weight": "model-00002-of-00003.safetensors",
"model.layers.38.in_proj.weight": "model-00002-of-00003.safetensors",
"model.layers.38.norm.weight": "model-00002-of-00003.safetensors",
"model.layers.38.out_proj.weight": "model-00002-of-00003.safetensors",
"model.layers.38.x_proj.weight": "model-00002-of-00003.safetensors",
"model.layers.39.A_log": "model-00002-of-00003.safetensors",
"model.layers.39.D": "model-00002-of-00003.safetensors",
"model.layers.39.conv1d.bias": "model-00002-of-00003.safetensors",
"model.layers.39.conv1d.weight": "model-00002-of-00003.safetensors",
"model.layers.39.dt_proj.bias": "model-00002-of-00003.safetensors",
"model.layers.39.dt_proj.weight": "model-00002-of-00003.safetensors",
"model.layers.39.in_proj.weight": "model-00002-of-00003.safetensors",
"model.layers.39.norm.weight": "model-00002-of-00003.safetensors",
"model.layers.39.out_proj.weight": "model-00002-of-00003.safetensors",
"model.layers.39.x_proj.weight": "model-00002-of-00003.safetensors",
"model.layers.4.A_log": "model-00001-of-00003.safetensors",
"model.layers.4.D": "model-00001-of-00003.safetensors",
"model.layers.4.conv1d.bias": "model-00001-of-00003.safetensors",
"model.layers.4.conv1d.weight": "model-00001-of-00003.safetensors",
"model.layers.4.dt_proj.bias": "model-00001-of-00003.safetensors",
"model.layers.4.dt_proj.weight": "model-00001-of-00003.safetensors",
"model.layers.4.in_proj.weight": "model-00001-of-00003.safetensors",
"model.layers.4.norm.weight": "model-00001-of-00003.safetensors",
"model.layers.4.out_proj.weight": "model-00001-of-00003.safetensors",
"model.layers.4.x_proj.weight": "model-00001-of-00003.safetensors",
"model.layers.40.A_log": "model-00002-of-00003.safetensors",
"model.layers.40.D": "model-00002-of-00003.safetensors",
"model.layers.40.conv1d.bias": "model-00002-of-00003.safetensors",
"model.layers.40.conv1d.weight": "model-00002-of-00003.safetensors",
"model.layers.40.dt_proj.bias": "model-00002-of-00003.safetensors",
"model.layers.40.dt_proj.weight": "model-00002-of-00003.safetensors",
"model.layers.40.in_proj.weight": "model-00002-of-00003.safetensors",
"model.layers.40.norm.weight": "model-00002-of-00003.safetensors",
"model.layers.40.out_proj.weight": "model-00002-of-00003.safetensors",
"model.layers.40.x_proj.weight": "model-00002-of-00003.safetensors",
"model.layers.41.A_log": "model-00002-of-00003.safetensors",
"model.layers.41.D": "model-00002-of-00003.safetensors",
"model.layers.41.conv1d.bias": "model-00002-of-00003.safetensors",
"model.layers.41.conv1d.weight": "model-00002-of-00003.safetensors",
"model.layers.41.dt_proj.bias": "model-00002-of-00003.safetensors",
"model.layers.41.dt_proj.weight": "model-00002-of-00003.safetensors",
"model.layers.41.in_proj.weight": "model-00002-of-00003.safetensors",
"model.layers.41.norm.weight": "model-00002-of-00003.safetensors",
"model.layers.41.out_proj.weight": "model-00002-of-00003.safetensors",
"model.layers.41.x_proj.weight": "model-00002-of-00003.safetensors",
"model.layers.42.A_log": "model-00002-of-00003.safetensors",
"model.layers.42.D": "model-00002-of-00003.safetensors",
"model.layers.42.conv1d.bias": "model-00002-of-00003.safetensors",
"model.layers.42.conv1d.weight": "model-00002-of-00003.safetensors",
"model.layers.42.dt_proj.bias": "model-00002-of-00003.safetensors",
"model.layers.42.dt_proj.weight": "model-00002-of-00003.safetensors",
"model.layers.42.in_proj.weight": "model-00002-of-00003.safetensors",
"model.layers.42.norm.weight": "model-00002-of-00003.safetensors",
"model.layers.42.out_proj.weight": "model-00002-of-00003.safetensors",
"model.layers.42.x_proj.weight": "model-00002-of-00003.safetensors",
"model.layers.43.A_log": "model-00002-of-00003.safetensors",
"model.layers.43.D": "model-00002-of-00003.safetensors",
"model.layers.43.conv1d.bias": "model-00002-of-00003.safetensors",
"model.layers.43.conv1d.weight": "model-00002-of-00003.safetensors",
"model.layers.43.dt_proj.bias": "model-00002-of-00003.safetensors",
"model.layers.43.dt_proj.weight": "model-00002-of-00003.safetensors",
"model.layers.43.in_proj.weight": "model-00002-of-00003.safetensors",
"model.layers.43.norm.weight": "model-00002-of-00003.safetensors",
"model.layers.43.out_proj.weight": "model-00002-of-00003.safetensors",
"model.layers.43.x_proj.weight": "model-00002-of-00003.safetensors",
"model.layers.44.A_log": "model-00002-of-00003.safetensors",
"model.layers.44.D": "model-00002-of-00003.safetensors",
"model.layers.44.conv1d.bias": "model-00002-of-00003.safetensors",
"model.layers.44.conv1d.weight": "model-00002-of-00003.safetensors",
"model.layers.44.dt_proj.bias": "model-00002-of-00003.safetensors",
"model.layers.44.dt_proj.weight": "model-00002-of-00003.safetensors",
"model.layers.44.in_proj.weight": "model-00002-of-00003.safetensors",
"model.layers.44.norm.weight": "model-00002-of-00003.safetensors",
"model.layers.44.out_proj.weight": "model-00002-of-00003.safetensors",
"model.layers.44.x_proj.weight": "model-00002-of-00003.safetensors",
"model.layers.45.A_log": "model-00002-of-00003.safetensors",
"model.layers.45.D": "model-00002-of-00003.safetensors",
"model.layers.45.conv1d.bias": "model-00002-of-00003.safetensors",
"model.layers.45.conv1d.weight": "model-00002-of-00003.safetensors",
"model.layers.45.dt_proj.bias": "model-00002-of-00003.safetensors",
"model.layers.45.dt_proj.weight": "model-00002-of-00003.safetensors",
"model.layers.45.in_proj.weight": "model-00002-of-00003.safetensors",
"model.layers.45.norm.weight": "model-00002-of-00003.safetensors",
"model.layers.45.out_proj.weight": "model-00002-of-00003.safetensors",
"model.layers.45.x_proj.weight": "model-00002-of-00003.safetensors",
"model.layers.46.A_log": "model-00002-of-00003.safetensors",
"model.layers.46.D": "model-00002-of-00003.safetensors",
"model.layers.46.conv1d.bias": "model-00002-of-00003.safetensors",
"model.layers.46.conv1d.weight": "model-00002-of-00003.safetensors",
"model.layers.46.dt_proj.bias": "model-00002-of-00003.safetensors",
"model.layers.46.dt_proj.weight": "model-00002-of-00003.safetensors",
"model.layers.46.in_proj.weight": "model-00002-of-00003.safetensors",
"model.layers.46.norm.weight": "model-00002-of-00003.safetensors",
"model.layers.46.out_proj.weight": "model-00002-of-00003.safetensors",
"model.layers.46.x_proj.weight": "model-00002-of-00003.safetensors",
"model.layers.47.A_log": "model-00002-of-00003.safetensors",
"model.layers.47.D": "model-00002-of-00003.safetensors",
"model.layers.47.conv1d.bias": "model-00002-of-00003.safetensors",
"model.layers.47.conv1d.weight": "model-00002-of-00003.safetensors",
"model.layers.47.dt_proj.bias": "model-00002-of-00003.safetensors",
"model.layers.47.dt_proj.weight": "model-00002-of-00003.safetensors",
"model.layers.47.in_proj.weight": "model-00002-of-00003.safetensors",
"model.layers.47.norm.weight": "model-00002-of-00003.safetensors",
"model.layers.47.out_proj.weight": "model-00002-of-00003.safetensors",
"model.layers.47.x_proj.weight": "model-00002-of-00003.safetensors",
"model.layers.48.A_log": "model-00002-of-00003.safetensors",
"model.layers.48.D": "model-00002-of-00003.safetensors",
"model.layers.48.conv1d.bias": "model-00002-of-00003.safetensors",
"model.layers.48.conv1d.weight": "model-00002-of-00003.safetensors",
"model.layers.48.dt_proj.bias": "model-00002-of-00003.safetensors",
"model.layers.48.dt_proj.weight": "model-00002-of-00003.safetensors",
"model.layers.48.in_proj.weight": "model-00002-of-00003.safetensors",
"model.layers.48.norm.weight": "model-00002-of-00003.safetensors",
"model.layers.48.out_proj.weight": "model-00002-of-00003.safetensors",
"model.layers.48.x_proj.weight": "model-00002-of-00003.safetensors",
"model.layers.49.A_log": "model-00002-of-00003.safetensors",
"model.layers.49.D": "model-00002-of-00003.safetensors",
"model.layers.49.conv1d.bias": "model-00002-of-00003.safetensors",
"model.layers.49.conv1d.weight": "model-00002-of-00003.safetensors",
"model.layers.49.dt_proj.bias": "model-00002-of-00003.safetensors",
"model.layers.49.dt_proj.weight": "model-00002-of-00003.safetensors",
"model.layers.49.in_proj.weight": "model-00002-of-00003.safetensors",
"model.layers.49.norm.weight": "model-00002-of-00003.safetensors",
"model.layers.49.out_proj.weight": "model-00002-of-00003.safetensors",
"model.layers.49.x_proj.weight": "model-00002-of-00003.safetensors",
"model.layers.5.A_log": "model-00001-of-00003.safetensors",
"model.layers.5.D": "model-00001-of-00003.safetensors",
"model.layers.5.conv1d.bias": "model-00001-of-00003.safetensors",
"model.layers.5.conv1d.weight": "model-00001-of-00003.safetensors",
"model.layers.5.dt_proj.bias": "model-00001-of-00003.safetensors",
"model.layers.5.dt_proj.weight": "model-00001-of-00003.safetensors",
"model.layers.5.in_proj.weight": "model-00001-of-00003.safetensors",
"model.layers.5.norm.weight": "model-00001-of-00003.safetensors",
"model.layers.5.out_proj.weight": "model-00001-of-00003.safetensors",
"model.layers.5.x_proj.weight": "model-00001-of-00003.safetensors",
"model.layers.50.A_log": "model-00002-of-00003.safetensors",
"model.layers.50.D": "model-00002-of-00003.safetensors",
"model.layers.50.conv1d.bias": "model-00002-of-00003.safetensors",
"model.layers.50.conv1d.weight": "model-00002-of-00003.safetensors",
"model.layers.50.dt_proj.bias": "model-00002-of-00003.safetensors",
"model.layers.50.dt_proj.weight": "model-00002-of-00003.safetensors",
"model.layers.50.in_proj.weight": "model-00002-of-00003.safetensors",
"model.layers.50.norm.weight": "model-00002-of-00003.safetensors",
"model.layers.50.out_proj.weight": "model-00002-of-00003.safetensors",
"model.layers.50.x_proj.weight": "model-00002-of-00003.safetensors",
"model.layers.51.A_log": "model-00002-of-00003.safetensors",
"model.layers.51.D": "model-00002-of-00003.safetensors",
"model.layers.51.conv1d.bias": "model-00002-of-00003.safetensors",
"model.layers.51.conv1d.weight": "model-00002-of-00003.safetensors",
"model.layers.51.dt_proj.bias": "model-00002-of-00003.safetensors",
"model.layers.51.dt_proj.weight": "model-00002-of-00003.safetensors",
"model.layers.51.in_proj.weight": "model-00002-of-00003.safetensors",
"model.layers.51.norm.weight": "model-00002-of-00003.safetensors",
"model.layers.51.out_proj.weight": "model-00002-of-00003.safetensors",
"model.layers.51.x_proj.weight": "model-00002-of-00003.safetensors",
"model.layers.52.A_log": "model-00002-of-00003.safetensors",
"model.layers.52.D": "model-00002-of-00003.safetensors",
"model.layers.52.conv1d.bias": "model-00002-of-00003.safetensors",
"model.layers.52.conv1d.weight": "model-00002-of-00003.safetensors",
"model.layers.52.dt_proj.bias": "model-00002-of-00003.safetensors",
"model.layers.52.dt_proj.weight": "model-00002-of-00003.safetensors",
"model.layers.52.in_proj.weight": "model-00002-of-00003.safetensors",
"model.layers.52.norm.weight": "model-00002-of-00003.safetensors",
"model.layers.52.out_proj.weight": "model-00002-of-00003.safetensors",
"model.layers.52.x_proj.weight": "model-00002-of-00003.safetensors",
"model.layers.53.A_log": "model-00002-of-00003.safetensors",
"model.layers.53.D": "model-00002-of-00003.safetensors",
"model.layers.53.conv1d.bias": "model-00002-of-00003.safetensors",
"model.layers.53.conv1d.weight": "model-00002-of-00003.safetensors",
"model.layers.53.dt_proj.bias": "model-00002-of-00003.safetensors",
"model.layers.53.dt_proj.weight": "model-00002-of-00003.safetensors",
"model.layers.53.in_proj.weight": "model-00002-of-00003.safetensors",
"model.layers.53.norm.weight": "model-00002-of-00003.safetensors",
"model.layers.53.out_proj.weight": "model-00002-of-00003.safetensors",
"model.layers.53.x_proj.weight": "model-00002-of-00003.safetensors",
"model.layers.54.A_log": "model-00002-of-00003.safetensors",
"model.layers.54.D": "model-00002-of-00003.safetensors",
"model.layers.54.conv1d.bias": "model-00002-of-00003.safetensors",
"model.layers.54.conv1d.weight": "model-00002-of-00003.safetensors",
"model.layers.54.dt_proj.bias": "model-00002-of-00003.safetensors",
"model.layers.54.dt_proj.weight": "model-00002-of-00003.safetensors",
"model.layers.54.in_proj.weight": "model-00002-of-00003.safetensors",
"model.layers.54.norm.weight": "model-00002-of-00003.safetensors",
"model.layers.54.out_proj.weight": "model-00002-of-00003.safetensors",
"model.layers.54.x_proj.weight": "model-00002-of-00003.safetensors",
"model.layers.55.A_log": "model-00002-of-00003.safetensors",
"model.layers.55.D": "model-00002-of-00003.safetensors",
"model.layers.55.conv1d.bias": "model-00002-of-00003.safetensors",
"model.layers.55.conv1d.weight": "model-00002-of-00003.safetensors",
"model.layers.55.dt_proj.bias": "model-00002-of-00003.safetensors",
"model.layers.55.dt_proj.weight": "model-00002-of-00003.safetensors",
"model.layers.55.in_proj.weight": "model-00002-of-00003.safetensors",
"model.layers.55.norm.weight": "model-00002-of-00003.safetensors",
"model.layers.55.out_proj.weight": "model-00002-of-00003.safetensors",
"model.layers.55.x_proj.weight": "model-00002-of-00003.safetensors",
"model.layers.56.A_log": "model-00002-of-00003.safetensors",
"model.layers.56.D": "model-00002-of-00003.safetensors",
"model.layers.56.conv1d.bias": "model-00002-of-00003.safetensors",
"model.layers.56.conv1d.weight": "model-00002-of-00003.safetensors",
"model.layers.56.dt_proj.bias": "model-00002-of-00003.safetensors",
"model.layers.56.dt_proj.weight": "model-00002-of-00003.safetensors",
"model.layers.56.in_proj.weight": "model-00002-of-00003.safetensors",
"model.layers.56.norm.weight": "model-00002-of-00003.safetensors",
"model.layers.56.out_proj.weight": "model-00002-of-00003.safetensors",
"model.layers.56.x_proj.weight": "model-00002-of-00003.safetensors",
"model.layers.57.A_log": "model-00002-of-00003.safetensors",
"model.layers.57.D": "model-00002-of-00003.safetensors",
"model.layers.57.conv1d.bias": "model-00002-of-00003.safetensors",
"model.layers.57.conv1d.weight": "model-00002-of-00003.safetensors",
"model.layers.57.dt_proj.bias": "model-00002-of-00003.safetensors",
"model.layers.57.dt_proj.weight": "model-00002-of-00003.safetensors",
"model.layers.57.in_proj.weight": "model-00002-of-00003.safetensors",
"model.layers.57.norm.weight": "model-00002-of-00003.safetensors",
"model.layers.57.out_proj.weight": "model-00002-of-00003.safetensors",
"model.layers.57.x_proj.weight": "model-00002-of-00003.safetensors",
"model.layers.58.A_log": "model-00002-of-00003.safetensors",
"model.layers.58.D": "model-00002-of-00003.safetensors",
"model.layers.58.conv1d.bias": "model-00002-of-00003.safetensors",
"model.layers.58.conv1d.weight": "model-00002-of-00003.safetensors",
"model.layers.58.dt_proj.bias": "model-00002-of-00003.safetensors",
"model.layers.58.dt_proj.weight": "model-00002-of-00003.safetensors",
"model.layers.58.in_proj.weight": "model-00002-of-00003.safetensors",
"model.layers.58.norm.weight": "model-00002-of-00003.safetensors",
"model.layers.58.out_proj.weight": "model-00002-of-00003.safetensors",
"model.layers.58.x_proj.weight": "model-00002-of-00003.safetensors",
"model.layers.59.A_log": "model-00002-of-00003.safetensors",
"model.layers.59.D": "model-00002-of-00003.safetensors",
"model.layers.59.conv1d.bias": "model-00003-of-00003.safetensors",
"model.layers.59.conv1d.weight": "model-00003-of-00003.safetensors",
"model.layers.59.dt_proj.bias": "model-00003-of-00003.safetensors",
"model.layers.59.dt_proj.weight": "model-00003-of-00003.safetensors",
"model.layers.59.in_proj.weight": "model-00003-of-00003.safetensors",
"model.layers.59.norm.weight": "model-00003-of-00003.safetensors",
"model.layers.59.out_proj.weight": "model-00003-of-00003.safetensors",
"model.layers.59.x_proj.weight": "model-00003-of-00003.safetensors",
"model.layers.6.A_log": "model-00001-of-00003.safetensors",
"model.layers.6.D": "model-00001-of-00003.safetensors",
"model.layers.6.conv1d.bias": "model-00001-of-00003.safetensors",
"model.layers.6.conv1d.weight": "model-00001-of-00003.safetensors",
"model.layers.6.dt_proj.bias": "model-00001-of-00003.safetensors",
"model.layers.6.dt_proj.weight": "model-00001-of-00003.safetensors",
"model.layers.6.in_proj.weight": "model-00001-of-00003.safetensors",
"model.layers.6.norm.weight": "model-00001-of-00003.safetensors",
"model.layers.6.out_proj.weight": "model-00001-of-00003.safetensors",
"model.layers.6.x_proj.weight": "model-00001-of-00003.safetensors",
"model.layers.60.A_log": "model-00003-of-00003.safetensors",
"model.layers.60.D": "model-00003-of-00003.safetensors",
"model.layers.60.conv1d.bias": "model-00003-of-00003.safetensors",
"model.layers.60.conv1d.weight": "model-00003-of-00003.safetensors",
"model.layers.60.dt_proj.bias": "model-00003-of-00003.safetensors",
"model.layers.60.dt_proj.weight": "model-00003-of-00003.safetensors",
"model.layers.60.in_proj.weight": "model-00003-of-00003.safetensors",
"model.layers.60.norm.weight": "model-00003-of-00003.safetensors",
"model.layers.60.out_proj.weight": "model-00003-of-00003.safetensors",
"model.layers.60.x_proj.weight": "model-00003-of-00003.safetensors",
"model.layers.61.A_log": "model-00003-of-00003.safetensors",
"model.layers.61.D": "model-00003-of-00003.safetensors",
"model.layers.61.conv1d.bias": "model-00003-of-00003.safetensors",
"model.layers.61.conv1d.weight": "model-00003-of-00003.safetensors",
"model.layers.61.dt_proj.bias": "model-00003-of-00003.safetensors",
"model.layers.61.dt_proj.weight": "model-00003-of-00003.safetensors",
"model.layers.61.in_proj.weight": "model-00003-of-00003.safetensors",
"model.layers.61.norm.weight": "model-00003-of-00003.safetensors",
"model.layers.61.out_proj.weight": "model-00003-of-00003.safetensors",
"model.layers.61.x_proj.weight": "model-00003-of-00003.safetensors",
"model.layers.62.A_log": "model-00003-of-00003.safetensors",
"model.layers.62.D": "model-00003-of-00003.safetensors",
"model.layers.62.conv1d.bias": "model-00003-of-00003.safetensors",
"model.layers.62.conv1d.weight": "model-00003-of-00003.safetensors",
"model.layers.62.dt_proj.bias": "model-00003-of-00003.safetensors",
"model.layers.62.dt_proj.weight": "model-00003-of-00003.safetensors",
"model.layers.62.in_proj.weight": "model-00003-of-00003.safetensors",
"model.layers.62.norm.weight": "model-00003-of-00003.safetensors",
"model.layers.62.out_proj.weight": "model-00003-of-00003.safetensors",
"model.layers.62.x_proj.weight": "model-00003-of-00003.safetensors",
"model.layers.63.A_log": "model-00003-of-00003.safetensors",
"model.layers.63.D": "model-00003-of-00003.safetensors",
"model.layers.63.conv1d.bias": "model-00003-of-00003.safetensors",
"model.layers.63.conv1d.weight": "model-00003-of-00003.safetensors",
"model.layers.63.dt_proj.bias": "model-00003-of-00003.safetensors",
"model.layers.63.dt_proj.weight": "model-00003-of-00003.safetensors",
"model.layers.63.in_proj.weight": "model-00003-of-00003.safetensors",
"model.layers.63.norm.weight": "model-00003-of-00003.safetensors",
"model.layers.63.out_proj.weight": "model-00003-of-00003.safetensors",
"model.layers.63.x_proj.weight": "model-00003-of-00003.safetensors",
"model.layers.7.A_log": "model-00001-of-00003.safetensors",
"model.layers.7.D": "model-00001-of-00003.safetensors",
"model.layers.7.conv1d.bias": "model-00001-of-00003.safetensors",
"model.layers.7.conv1d.weight": "model-00001-of-00003.safetensors",
"model.layers.7.dt_proj.bias": "model-00001-of-00003.safetensors",
"model.layers.7.dt_proj.weight": "model-00001-of-00003.safetensors",
"model.layers.7.in_proj.weight": "model-00001-of-00003.safetensors",
"model.layers.7.norm.weight": "model-00001-of-00003.safetensors",
"model.layers.7.out_proj.weight": "model-00001-of-00003.safetensors",
"model.layers.7.x_proj.weight": "model-00001-of-00003.safetensors",
"model.layers.8.A_log": "model-00001-of-00003.safetensors",
"model.layers.8.D": "model-00001-of-00003.safetensors",
"model.layers.8.conv1d.bias": "model-00001-of-00003.safetensors",
"model.layers.8.conv1d.weight": "model-00001-of-00003.safetensors",
"model.layers.8.dt_proj.bias": "model-00001-of-00003.safetensors",
"model.layers.8.dt_proj.weight": "model-00001-of-00003.safetensors",
"model.layers.8.in_proj.weight": "model-00001-of-00003.safetensors",
"model.layers.8.norm.weight": "model-00001-of-00003.safetensors",
"model.layers.8.out_proj.weight": "model-00001-of-00003.safetensors",
"model.layers.8.x_proj.weight": "model-00001-of-00003.safetensors",
"model.layers.9.A_log": "model-00001-of-00003.safetensors",
"model.layers.9.D": "model-00001-of-00003.safetensors",
"model.layers.9.conv1d.bias": "model-00001-of-00003.safetensors",
"model.layers.9.conv1d.weight": "model-00001-of-00003.safetensors",
"model.layers.9.dt_proj.bias": "model-00001-of-00003.safetensors",
"model.layers.9.dt_proj.weight": "model-00001-of-00003.safetensors",
"model.layers.9.in_proj.weight": "model-00001-of-00003.safetensors",
"model.layers.9.norm.weight": "model-00001-of-00003.safetensors",
"model.layers.9.out_proj.weight": "model-00001-of-00003.safetensors",
"model.layers.9.x_proj.weight": "model-00001-of-00003.safetensors",
"model.norm_f.weight": "model-00003-of-00003.safetensors"
}
}