{ "metadata": { "total_size": 13393466368 }, "weight_map": { "embedding.weight": "model-00001-of-00003.safetensors", "lm_head.bias": "model-00003-of-00003.safetensors", "lm_head.weight": "model-00003-of-00003.safetensors", "mamba.layers.0.0.A": "model-00001-of-00003.safetensors", "mamba.layers.0.0.D": "model-00001-of-00003.safetensors", "mamba.layers.0.0.conv.bias": "model-00001-of-00003.safetensors", "mamba.layers.0.0.conv.weight": "model-00001-of-00003.safetensors", "mamba.layers.0.0.in_proj.weight": "model-00001-of-00003.safetensors", "mamba.layers.0.0.out_proj.weight": "model-00001-of-00003.safetensors", "mamba.layers.0.0.s_B.weight": "model-00001-of-00003.safetensors", "mamba.layers.0.0.s_C.weight": "model-00001-of-00003.safetensors", "mamba.layers.0.0.s_D.0.weight": "model-00001-of-00003.safetensors", "mamba.layers.0.0.s_D.1.weight": "model-00001-of-00003.safetensors", "mamba.layers.0.1.weight": "model-00001-of-00003.safetensors", "mamba.layers.1.0.A": "model-00001-of-00003.safetensors", "mamba.layers.1.0.D": "model-00001-of-00003.safetensors", "mamba.layers.1.0.conv.bias": "model-00001-of-00003.safetensors", "mamba.layers.1.0.conv.weight": "model-00001-of-00003.safetensors", "mamba.layers.1.0.in_proj.weight": "model-00001-of-00003.safetensors", "mamba.layers.1.0.out_proj.weight": "model-00001-of-00003.safetensors", "mamba.layers.1.0.s_B.weight": "model-00001-of-00003.safetensors", "mamba.layers.1.0.s_C.weight": "model-00001-of-00003.safetensors", "mamba.layers.1.0.s_D.0.weight": "model-00001-of-00003.safetensors", "mamba.layers.1.0.s_D.1.weight": "model-00001-of-00003.safetensors", "mamba.layers.1.1.weight": "model-00001-of-00003.safetensors", "mamba.layers.10.0.A": "model-00001-of-00003.safetensors", "mamba.layers.10.0.D": "model-00001-of-00003.safetensors", "mamba.layers.10.0.conv.bias": "model-00001-of-00003.safetensors", "mamba.layers.10.0.conv.weight": "model-00001-of-00003.safetensors", "mamba.layers.10.0.in_proj.weight": "model-00001-of-00003.safetensors", "mamba.layers.10.0.out_proj.weight": "model-00001-of-00003.safetensors", "mamba.layers.10.0.s_B.weight": "model-00001-of-00003.safetensors", "mamba.layers.10.0.s_C.weight": "model-00001-of-00003.safetensors", "mamba.layers.10.0.s_D.0.weight": "model-00001-of-00003.safetensors", "mamba.layers.10.0.s_D.1.weight": "model-00001-of-00003.safetensors", "mamba.layers.10.1.weight": "model-00001-of-00003.safetensors", "mamba.layers.11.0.A": "model-00001-of-00003.safetensors", "mamba.layers.11.0.D": "model-00001-of-00003.safetensors", "mamba.layers.11.0.conv.bias": "model-00001-of-00003.safetensors", "mamba.layers.11.0.conv.weight": "model-00001-of-00003.safetensors", "mamba.layers.11.0.in_proj.weight": "model-00001-of-00003.safetensors", "mamba.layers.11.0.out_proj.weight": "model-00001-of-00003.safetensors", "mamba.layers.11.0.s_B.weight": "model-00001-of-00003.safetensors", "mamba.layers.11.0.s_C.weight": "model-00001-of-00003.safetensors", "mamba.layers.11.0.s_D.0.weight": "model-00001-of-00003.safetensors", "mamba.layers.11.0.s_D.1.weight": "model-00001-of-00003.safetensors", "mamba.layers.11.1.weight": "model-00001-of-00003.safetensors", "mamba.layers.12.0.A": "model-00001-of-00003.safetensors", "mamba.layers.12.0.D": "model-00001-of-00003.safetensors", "mamba.layers.12.0.conv.bias": "model-00001-of-00003.safetensors", "mamba.layers.12.0.conv.weight": "model-00001-of-00003.safetensors", "mamba.layers.12.0.in_proj.weight": "model-00001-of-00003.safetensors", "mamba.layers.12.0.out_proj.weight": "model-00001-of-00003.safetensors", "mamba.layers.12.0.s_B.weight": "model-00001-of-00003.safetensors", "mamba.layers.12.0.s_C.weight": "model-00001-of-00003.safetensors", "mamba.layers.12.0.s_D.0.weight": "model-00001-of-00003.safetensors", "mamba.layers.12.0.s_D.1.weight": "model-00001-of-00003.safetensors", "mamba.layers.12.1.weight": "model-00001-of-00003.safetensors", "mamba.layers.13.0.A": "model-00001-of-00003.safetensors", "mamba.layers.13.0.D": "model-00001-of-00003.safetensors", "mamba.layers.13.0.conv.bias": "model-00001-of-00003.safetensors", "mamba.layers.13.0.conv.weight": "model-00001-of-00003.safetensors", "mamba.layers.13.0.in_proj.weight": "model-00001-of-00003.safetensors", "mamba.layers.13.0.out_proj.weight": "model-00001-of-00003.safetensors", "mamba.layers.13.0.s_B.weight": "model-00001-of-00003.safetensors", "mamba.layers.13.0.s_C.weight": "model-00001-of-00003.safetensors", "mamba.layers.13.0.s_D.0.weight": "model-00001-of-00003.safetensors", "mamba.layers.13.0.s_D.1.weight": "model-00001-of-00003.safetensors", "mamba.layers.13.1.weight": "model-00001-of-00003.safetensors", "mamba.layers.14.0.A": "model-00001-of-00003.safetensors", "mamba.layers.14.0.D": "model-00001-of-00003.safetensors", "mamba.layers.14.0.conv.bias": "model-00001-of-00003.safetensors", "mamba.layers.14.0.conv.weight": "model-00001-of-00003.safetensors", "mamba.layers.14.0.in_proj.weight": "model-00001-of-00003.safetensors", "mamba.layers.14.0.out_proj.weight": "model-00001-of-00003.safetensors", "mamba.layers.14.0.s_B.weight": "model-00001-of-00003.safetensors", "mamba.layers.14.0.s_C.weight": "model-00001-of-00003.safetensors", "mamba.layers.14.0.s_D.0.weight": "model-00001-of-00003.safetensors", "mamba.layers.14.0.s_D.1.weight": "model-00001-of-00003.safetensors", "mamba.layers.14.1.weight": "model-00001-of-00003.safetensors", "mamba.layers.15.0.A": "model-00001-of-00003.safetensors", "mamba.layers.15.0.D": "model-00001-of-00003.safetensors", "mamba.layers.15.0.conv.bias": "model-00001-of-00003.safetensors", "mamba.layers.15.0.conv.weight": "model-00001-of-00003.safetensors", "mamba.layers.15.0.in_proj.weight": "model-00001-of-00003.safetensors", "mamba.layers.15.0.out_proj.weight": "model-00001-of-00003.safetensors", "mamba.layers.15.0.s_B.weight": "model-00001-of-00003.safetensors", "mamba.layers.15.0.s_C.weight": "model-00001-of-00003.safetensors", "mamba.layers.15.0.s_D.0.weight": "model-00001-of-00003.safetensors", "mamba.layers.15.0.s_D.1.weight": "model-00001-of-00003.safetensors", "mamba.layers.15.1.weight": "model-00001-of-00003.safetensors", "mamba.layers.16.0.A": "model-00001-of-00003.safetensors", "mamba.layers.16.0.D": "model-00001-of-00003.safetensors", "mamba.layers.16.0.conv.bias": "model-00001-of-00003.safetensors", "mamba.layers.16.0.conv.weight": "model-00001-of-00003.safetensors", "mamba.layers.16.0.in_proj.weight": "model-00001-of-00003.safetensors", "mamba.layers.16.0.out_proj.weight": "model-00001-of-00003.safetensors", "mamba.layers.16.0.s_B.weight": "model-00001-of-00003.safetensors", "mamba.layers.16.0.s_C.weight": "model-00001-of-00003.safetensors", "mamba.layers.16.0.s_D.0.weight": "model-00001-of-00003.safetensors", "mamba.layers.16.0.s_D.1.weight": "model-00001-of-00003.safetensors", "mamba.layers.16.1.weight": "model-00001-of-00003.safetensors", "mamba.layers.17.0.A": "model-00001-of-00003.safetensors", "mamba.layers.17.0.D": "model-00001-of-00003.safetensors", "mamba.layers.17.0.conv.bias": "model-00001-of-00003.safetensors", "mamba.layers.17.0.conv.weight": "model-00001-of-00003.safetensors", "mamba.layers.17.0.in_proj.weight": "model-00001-of-00003.safetensors", "mamba.layers.17.0.out_proj.weight": "model-00001-of-00003.safetensors", "mamba.layers.17.0.s_B.weight": "model-00001-of-00003.safetensors", "mamba.layers.17.0.s_C.weight": "model-00001-of-00003.safetensors", "mamba.layers.17.0.s_D.0.weight": "model-00001-of-00003.safetensors", "mamba.layers.17.0.s_D.1.weight": "model-00001-of-00003.safetensors", "mamba.layers.17.1.weight": "model-00001-of-00003.safetensors", "mamba.layers.18.0.A": "model-00001-of-00003.safetensors", "mamba.layers.18.0.D": "model-00001-of-00003.safetensors", "mamba.layers.18.0.conv.bias": "model-00001-of-00003.safetensors", "mamba.layers.18.0.conv.weight": "model-00001-of-00003.safetensors", "mamba.layers.18.0.in_proj.weight": "model-00001-of-00003.safetensors", "mamba.layers.18.0.out_proj.weight": "model-00001-of-00003.safetensors", "mamba.layers.18.0.s_B.weight": "model-00001-of-00003.safetensors", "mamba.layers.18.0.s_C.weight": "model-00001-of-00003.safetensors", "mamba.layers.18.0.s_D.0.weight": "model-00001-of-00003.safetensors", "mamba.layers.18.0.s_D.1.weight": "model-00001-of-00003.safetensors", "mamba.layers.18.1.weight": "model-00001-of-00003.safetensors", "mamba.layers.19.0.A": "model-00001-of-00003.safetensors", "mamba.layers.19.0.D": "model-00001-of-00003.safetensors", "mamba.layers.19.0.conv.bias": "model-00001-of-00003.safetensors", "mamba.layers.19.0.conv.weight": "model-00001-of-00003.safetensors", "mamba.layers.19.0.in_proj.weight": "model-00001-of-00003.safetensors", "mamba.layers.19.0.out_proj.weight": "model-00001-of-00003.safetensors", "mamba.layers.19.0.s_B.weight": "model-00001-of-00003.safetensors", "mamba.layers.19.0.s_C.weight": "model-00001-of-00003.safetensors", "mamba.layers.19.0.s_D.0.weight": "model-00001-of-00003.safetensors", "mamba.layers.19.0.s_D.1.weight": "model-00001-of-00003.safetensors", "mamba.layers.19.1.weight": "model-00001-of-00003.safetensors", "mamba.layers.2.0.A": "model-00001-of-00003.safetensors", "mamba.layers.2.0.D": "model-00001-of-00003.safetensors", "mamba.layers.2.0.conv.bias": "model-00001-of-00003.safetensors", "mamba.layers.2.0.conv.weight": "model-00001-of-00003.safetensors", "mamba.layers.2.0.in_proj.weight": "model-00001-of-00003.safetensors", "mamba.layers.2.0.out_proj.weight": "model-00001-of-00003.safetensors", "mamba.layers.2.0.s_B.weight": "model-00001-of-00003.safetensors", "mamba.layers.2.0.s_C.weight": "model-00001-of-00003.safetensors", "mamba.layers.2.0.s_D.0.weight": "model-00001-of-00003.safetensors", "mamba.layers.2.0.s_D.1.weight": "model-00001-of-00003.safetensors", "mamba.layers.2.1.weight": "model-00001-of-00003.safetensors", "mamba.layers.20.0.A": "model-00001-of-00003.safetensors", "mamba.layers.20.0.D": "model-00001-of-00003.safetensors", "mamba.layers.20.0.conv.bias": "model-00001-of-00003.safetensors", "mamba.layers.20.0.conv.weight": "model-00001-of-00003.safetensors", "mamba.layers.20.0.in_proj.weight": "model-00001-of-00003.safetensors", "mamba.layers.20.0.out_proj.weight": "model-00001-of-00003.safetensors", "mamba.layers.20.0.s_B.weight": "model-00001-of-00003.safetensors", "mamba.layers.20.0.s_C.weight": "model-00001-of-00003.safetensors", "mamba.layers.20.0.s_D.0.weight": "model-00001-of-00003.safetensors", "mamba.layers.20.0.s_D.1.weight": "model-00001-of-00003.safetensors", "mamba.layers.20.1.weight": "model-00001-of-00003.safetensors", "mamba.layers.21.0.A": "model-00001-of-00003.safetensors", "mamba.layers.21.0.D": "model-00001-of-00003.safetensors", "mamba.layers.21.0.conv.bias": "model-00001-of-00003.safetensors", "mamba.layers.21.0.conv.weight": "model-00001-of-00003.safetensors", "mamba.layers.21.0.in_proj.weight": "model-00001-of-00003.safetensors", "mamba.layers.21.0.out_proj.weight": "model-00001-of-00003.safetensors", "mamba.layers.21.0.s_B.weight": "model-00001-of-00003.safetensors", "mamba.layers.21.0.s_C.weight": "model-00001-of-00003.safetensors", "mamba.layers.21.0.s_D.0.weight": "model-00001-of-00003.safetensors", "mamba.layers.21.0.s_D.1.weight": "model-00001-of-00003.safetensors", "mamba.layers.21.1.weight": "model-00001-of-00003.safetensors", "mamba.layers.22.0.A": "model-00001-of-00003.safetensors", "mamba.layers.22.0.D": "model-00001-of-00003.safetensors", "mamba.layers.22.0.conv.bias": "model-00001-of-00003.safetensors", "mamba.layers.22.0.conv.weight": "model-00001-of-00003.safetensors", "mamba.layers.22.0.in_proj.weight": "model-00001-of-00003.safetensors", "mamba.layers.22.0.out_proj.weight": "model-00001-of-00003.safetensors", "mamba.layers.22.0.s_B.weight": "model-00001-of-00003.safetensors", "mamba.layers.22.0.s_C.weight": "model-00001-of-00003.safetensors", "mamba.layers.22.0.s_D.0.weight": "model-00001-of-00003.safetensors", "mamba.layers.22.0.s_D.1.weight": "model-00001-of-00003.safetensors", "mamba.layers.22.1.weight": "model-00001-of-00003.safetensors", "mamba.layers.23.0.A": "model-00001-of-00003.safetensors", "mamba.layers.23.0.D": "model-00001-of-00003.safetensors", "mamba.layers.23.0.conv.bias": "model-00001-of-00003.safetensors", "mamba.layers.23.0.conv.weight": "model-00001-of-00003.safetensors", "mamba.layers.23.0.in_proj.weight": "model-00001-of-00003.safetensors", "mamba.layers.23.0.out_proj.weight": "model-00001-of-00003.safetensors", "mamba.layers.23.0.s_B.weight": "model-00001-of-00003.safetensors", "mamba.layers.23.0.s_C.weight": "model-00001-of-00003.safetensors", "mamba.layers.23.0.s_D.0.weight": "model-00001-of-00003.safetensors", "mamba.layers.23.0.s_D.1.weight": "model-00001-of-00003.safetensors", "mamba.layers.23.1.weight": "model-00001-of-00003.safetensors", "mamba.layers.24.0.A": "model-00001-of-00003.safetensors", "mamba.layers.24.0.D": "model-00001-of-00003.safetensors", "mamba.layers.24.0.conv.bias": "model-00002-of-00003.safetensors", "mamba.layers.24.0.conv.weight": "model-00002-of-00003.safetensors", "mamba.layers.24.0.in_proj.weight": "model-00001-of-00003.safetensors", "mamba.layers.24.0.out_proj.weight": "model-00001-of-00003.safetensors", "mamba.layers.24.0.s_B.weight": "model-00002-of-00003.safetensors", "mamba.layers.24.0.s_C.weight": "model-00002-of-00003.safetensors", "mamba.layers.24.0.s_D.0.weight": "model-00002-of-00003.safetensors", "mamba.layers.24.0.s_D.1.weight": "model-00002-of-00003.safetensors", "mamba.layers.24.1.weight": "model-00002-of-00003.safetensors", "mamba.layers.25.0.A": "model-00002-of-00003.safetensors", "mamba.layers.25.0.D": "model-00002-of-00003.safetensors", "mamba.layers.25.0.conv.bias": "model-00002-of-00003.safetensors", "mamba.layers.25.0.conv.weight": "model-00002-of-00003.safetensors", "mamba.layers.25.0.in_proj.weight": "model-00002-of-00003.safetensors", "mamba.layers.25.0.out_proj.weight": "model-00002-of-00003.safetensors", "mamba.layers.25.0.s_B.weight": "model-00002-of-00003.safetensors", "mamba.layers.25.0.s_C.weight": "model-00002-of-00003.safetensors", "mamba.layers.25.0.s_D.0.weight": "model-00002-of-00003.safetensors", "mamba.layers.25.0.s_D.1.weight": "model-00002-of-00003.safetensors", "mamba.layers.25.1.weight": "model-00002-of-00003.safetensors", "mamba.layers.26.0.A": "model-00002-of-00003.safetensors", "mamba.layers.26.0.D": "model-00002-of-00003.safetensors", "mamba.layers.26.0.conv.bias": "model-00002-of-00003.safetensors", "mamba.layers.26.0.conv.weight": "model-00002-of-00003.safetensors", "mamba.layers.26.0.in_proj.weight": "model-00002-of-00003.safetensors", "mamba.layers.26.0.out_proj.weight": "model-00002-of-00003.safetensors", "mamba.layers.26.0.s_B.weight": "model-00002-of-00003.safetensors", "mamba.layers.26.0.s_C.weight": "model-00002-of-00003.safetensors", "mamba.layers.26.0.s_D.0.weight": "model-00002-of-00003.safetensors", "mamba.layers.26.0.s_D.1.weight": "model-00002-of-00003.safetensors", "mamba.layers.26.1.weight": "model-00002-of-00003.safetensors", "mamba.layers.27.0.A": "model-00002-of-00003.safetensors", "mamba.layers.27.0.D": "model-00002-of-00003.safetensors", "mamba.layers.27.0.conv.bias": "model-00002-of-00003.safetensors", "mamba.layers.27.0.conv.weight": "model-00002-of-00003.safetensors", "mamba.layers.27.0.in_proj.weight": "model-00002-of-00003.safetensors", "mamba.layers.27.0.out_proj.weight": "model-00002-of-00003.safetensors", "mamba.layers.27.0.s_B.weight": "model-00002-of-00003.safetensors", "mamba.layers.27.0.s_C.weight": "model-00002-of-00003.safetensors", "mamba.layers.27.0.s_D.0.weight": "model-00002-of-00003.safetensors", "mamba.layers.27.0.s_D.1.weight": "model-00002-of-00003.safetensors", "mamba.layers.27.1.weight": "model-00002-of-00003.safetensors", "mamba.layers.28.0.A": "model-00002-of-00003.safetensors", "mamba.layers.28.0.D": "model-00002-of-00003.safetensors", "mamba.layers.28.0.conv.bias": "model-00002-of-00003.safetensors", "mamba.layers.28.0.conv.weight": "model-00002-of-00003.safetensors", "mamba.layers.28.0.in_proj.weight": "model-00002-of-00003.safetensors", "mamba.layers.28.0.out_proj.weight": "model-00002-of-00003.safetensors", "mamba.layers.28.0.s_B.weight": "model-00002-of-00003.safetensors", "mamba.layers.28.0.s_C.weight": "model-00002-of-00003.safetensors", "mamba.layers.28.0.s_D.0.weight": "model-00002-of-00003.safetensors", "mamba.layers.28.0.s_D.1.weight": "model-00002-of-00003.safetensors", "mamba.layers.28.1.weight": "model-00002-of-00003.safetensors", "mamba.layers.29.0.A": "model-00002-of-00003.safetensors", "mamba.layers.29.0.D": "model-00002-of-00003.safetensors", "mamba.layers.29.0.conv.bias": "model-00002-of-00003.safetensors", "mamba.layers.29.0.conv.weight": "model-00002-of-00003.safetensors", "mamba.layers.29.0.in_proj.weight": "model-00002-of-00003.safetensors", "mamba.layers.29.0.out_proj.weight": "model-00002-of-00003.safetensors", "mamba.layers.29.0.s_B.weight": "model-00002-of-00003.safetensors", "mamba.layers.29.0.s_C.weight": "model-00002-of-00003.safetensors", "mamba.layers.29.0.s_D.0.weight": "model-00002-of-00003.safetensors", "mamba.layers.29.0.s_D.1.weight": "model-00002-of-00003.safetensors", "mamba.layers.29.1.weight": "model-00002-of-00003.safetensors", "mamba.layers.3.0.A": "model-00001-of-00003.safetensors", "mamba.layers.3.0.D": "model-00001-of-00003.safetensors", "mamba.layers.3.0.conv.bias": "model-00001-of-00003.safetensors", "mamba.layers.3.0.conv.weight": "model-00001-of-00003.safetensors", "mamba.layers.3.0.in_proj.weight": "model-00001-of-00003.safetensors", "mamba.layers.3.0.out_proj.weight": "model-00001-of-00003.safetensors", "mamba.layers.3.0.s_B.weight": "model-00001-of-00003.safetensors", "mamba.layers.3.0.s_C.weight": "model-00001-of-00003.safetensors", "mamba.layers.3.0.s_D.0.weight": "model-00001-of-00003.safetensors", "mamba.layers.3.0.s_D.1.weight": "model-00001-of-00003.safetensors", "mamba.layers.3.1.weight": "model-00001-of-00003.safetensors", "mamba.layers.30.0.A": "model-00002-of-00003.safetensors", "mamba.layers.30.0.D": "model-00002-of-00003.safetensors", "mamba.layers.30.0.conv.bias": "model-00002-of-00003.safetensors", "mamba.layers.30.0.conv.weight": "model-00002-of-00003.safetensors", "mamba.layers.30.0.in_proj.weight": "model-00002-of-00003.safetensors", "mamba.layers.30.0.out_proj.weight": "model-00002-of-00003.safetensors", "mamba.layers.30.0.s_B.weight": "model-00002-of-00003.safetensors", "mamba.layers.30.0.s_C.weight": "model-00002-of-00003.safetensors", "mamba.layers.30.0.s_D.0.weight": "model-00002-of-00003.safetensors", "mamba.layers.30.0.s_D.1.weight": "model-00002-of-00003.safetensors", "mamba.layers.30.1.weight": "model-00002-of-00003.safetensors", "mamba.layers.31.0.A": "model-00002-of-00003.safetensors", "mamba.layers.31.0.D": "model-00002-of-00003.safetensors", "mamba.layers.31.0.conv.bias": "model-00002-of-00003.safetensors", "mamba.layers.31.0.conv.weight": "model-00002-of-00003.safetensors", "mamba.layers.31.0.in_proj.weight": "model-00002-of-00003.safetensors", "mamba.layers.31.0.out_proj.weight": "model-00002-of-00003.safetensors", "mamba.layers.31.0.s_B.weight": "model-00002-of-00003.safetensors", "mamba.layers.31.0.s_C.weight": "model-00002-of-00003.safetensors", "mamba.layers.31.0.s_D.0.weight": "model-00002-of-00003.safetensors", "mamba.layers.31.0.s_D.1.weight": "model-00002-of-00003.safetensors", "mamba.layers.31.1.weight": "model-00002-of-00003.safetensors", "mamba.layers.32.0.A": "model-00002-of-00003.safetensors", "mamba.layers.32.0.D": "model-00002-of-00003.safetensors", "mamba.layers.32.0.conv.bias": "model-00002-of-00003.safetensors", "mamba.layers.32.0.conv.weight": "model-00002-of-00003.safetensors", "mamba.layers.32.0.in_proj.weight": "model-00002-of-00003.safetensors", "mamba.layers.32.0.out_proj.weight": "model-00002-of-00003.safetensors", "mamba.layers.32.0.s_B.weight": "model-00002-of-00003.safetensors", "mamba.layers.32.0.s_C.weight": "model-00002-of-00003.safetensors", "mamba.layers.32.0.s_D.0.weight": "model-00002-of-00003.safetensors", "mamba.layers.32.0.s_D.1.weight": "model-00002-of-00003.safetensors", "mamba.layers.32.1.weight": "model-00002-of-00003.safetensors", "mamba.layers.33.0.A": "model-00002-of-00003.safetensors", "mamba.layers.33.0.D": "model-00002-of-00003.safetensors", "mamba.layers.33.0.conv.bias": "model-00002-of-00003.safetensors", "mamba.layers.33.0.conv.weight": "model-00002-of-00003.safetensors", "mamba.layers.33.0.in_proj.weight": "model-00002-of-00003.safetensors", "mamba.layers.33.0.out_proj.weight": "model-00002-of-00003.safetensors", "mamba.layers.33.0.s_B.weight": "model-00002-of-00003.safetensors", "mamba.layers.33.0.s_C.weight": "model-00002-of-00003.safetensors", "mamba.layers.33.0.s_D.0.weight": "model-00002-of-00003.safetensors", "mamba.layers.33.0.s_D.1.weight": "model-00002-of-00003.safetensors", "mamba.layers.33.1.weight": "model-00002-of-00003.safetensors", "mamba.layers.34.0.A": "model-00002-of-00003.safetensors", "mamba.layers.34.0.D": "model-00002-of-00003.safetensors", "mamba.layers.34.0.conv.bias": "model-00002-of-00003.safetensors", "mamba.layers.34.0.conv.weight": "model-00002-of-00003.safetensors", "mamba.layers.34.0.in_proj.weight": "model-00002-of-00003.safetensors", "mamba.layers.34.0.out_proj.weight": "model-00002-of-00003.safetensors", "mamba.layers.34.0.s_B.weight": "model-00002-of-00003.safetensors", "mamba.layers.34.0.s_C.weight": "model-00002-of-00003.safetensors", "mamba.layers.34.0.s_D.0.weight": "model-00002-of-00003.safetensors", "mamba.layers.34.0.s_D.1.weight": "model-00002-of-00003.safetensors", "mamba.layers.34.1.weight": "model-00002-of-00003.safetensors", "mamba.layers.35.0.A": "model-00002-of-00003.safetensors", "mamba.layers.35.0.D": "model-00002-of-00003.safetensors", "mamba.layers.35.0.conv.bias": "model-00002-of-00003.safetensors", "mamba.layers.35.0.conv.weight": "model-00002-of-00003.safetensors", "mamba.layers.35.0.in_proj.weight": "model-00002-of-00003.safetensors", "mamba.layers.35.0.out_proj.weight": "model-00002-of-00003.safetensors", "mamba.layers.35.0.s_B.weight": "model-00002-of-00003.safetensors", "mamba.layers.35.0.s_C.weight": "model-00002-of-00003.safetensors", "mamba.layers.35.0.s_D.0.weight": "model-00002-of-00003.safetensors", "mamba.layers.35.0.s_D.1.weight": "model-00002-of-00003.safetensors", "mamba.layers.35.1.weight": "model-00002-of-00003.safetensors", "mamba.layers.36.0.A": "model-00002-of-00003.safetensors", "mamba.layers.36.0.D": "model-00002-of-00003.safetensors", "mamba.layers.36.0.conv.bias": "model-00002-of-00003.safetensors", "mamba.layers.36.0.conv.weight": "model-00002-of-00003.safetensors", "mamba.layers.36.0.in_proj.weight": "model-00002-of-00003.safetensors", "mamba.layers.36.0.out_proj.weight": "model-00002-of-00003.safetensors", "mamba.layers.36.0.s_B.weight": "model-00002-of-00003.safetensors", "mamba.layers.36.0.s_C.weight": "model-00002-of-00003.safetensors", "mamba.layers.36.0.s_D.0.weight": "model-00002-of-00003.safetensors", "mamba.layers.36.0.s_D.1.weight": "model-00002-of-00003.safetensors", "mamba.layers.36.1.weight": "model-00002-of-00003.safetensors", "mamba.layers.37.0.A": "model-00002-of-00003.safetensors", "mamba.layers.37.0.D": "model-00002-of-00003.safetensors", "mamba.layers.37.0.conv.bias": "model-00002-of-00003.safetensors", "mamba.layers.37.0.conv.weight": "model-00002-of-00003.safetensors", "mamba.layers.37.0.in_proj.weight": "model-00002-of-00003.safetensors", "mamba.layers.37.0.out_proj.weight": "model-00002-of-00003.safetensors", "mamba.layers.37.0.s_B.weight": "model-00002-of-00003.safetensors", "mamba.layers.37.0.s_C.weight": "model-00002-of-00003.safetensors", "mamba.layers.37.0.s_D.0.weight": "model-00002-of-00003.safetensors", "mamba.layers.37.0.s_D.1.weight": "model-00002-of-00003.safetensors", "mamba.layers.37.1.weight": "model-00002-of-00003.safetensors", "mamba.layers.38.0.A": "model-00002-of-00003.safetensors", "mamba.layers.38.0.D": "model-00002-of-00003.safetensors", "mamba.layers.38.0.conv.bias": "model-00002-of-00003.safetensors", "mamba.layers.38.0.conv.weight": "model-00002-of-00003.safetensors", "mamba.layers.38.0.in_proj.weight": "model-00002-of-00003.safetensors", "mamba.layers.38.0.out_proj.weight": "model-00002-of-00003.safetensors", "mamba.layers.38.0.s_B.weight": "model-00002-of-00003.safetensors", "mamba.layers.38.0.s_C.weight": "model-00002-of-00003.safetensors", "mamba.layers.38.0.s_D.0.weight": "model-00002-of-00003.safetensors", "mamba.layers.38.0.s_D.1.weight": "model-00002-of-00003.safetensors", "mamba.layers.38.1.weight": "model-00002-of-00003.safetensors", "mamba.layers.39.0.A": "model-00002-of-00003.safetensors", "mamba.layers.39.0.D": "model-00002-of-00003.safetensors", "mamba.layers.39.0.conv.bias": "model-00002-of-00003.safetensors", "mamba.layers.39.0.conv.weight": "model-00002-of-00003.safetensors", "mamba.layers.39.0.in_proj.weight": "model-00002-of-00003.safetensors", "mamba.layers.39.0.out_proj.weight": "model-00002-of-00003.safetensors", "mamba.layers.39.0.s_B.weight": "model-00002-of-00003.safetensors", "mamba.layers.39.0.s_C.weight": "model-00002-of-00003.safetensors", "mamba.layers.39.0.s_D.0.weight": "model-00002-of-00003.safetensors", "mamba.layers.39.0.s_D.1.weight": "model-00002-of-00003.safetensors", "mamba.layers.39.1.weight": "model-00002-of-00003.safetensors", "mamba.layers.4.0.A": "model-00001-of-00003.safetensors", "mamba.layers.4.0.D": "model-00001-of-00003.safetensors", "mamba.layers.4.0.conv.bias": "model-00001-of-00003.safetensors", "mamba.layers.4.0.conv.weight": "model-00001-of-00003.safetensors", "mamba.layers.4.0.in_proj.weight": "model-00001-of-00003.safetensors", "mamba.layers.4.0.out_proj.weight": "model-00001-of-00003.safetensors", "mamba.layers.4.0.s_B.weight": "model-00001-of-00003.safetensors", "mamba.layers.4.0.s_C.weight": "model-00001-of-00003.safetensors", "mamba.layers.4.0.s_D.0.weight": "model-00001-of-00003.safetensors", "mamba.layers.4.0.s_D.1.weight": "model-00001-of-00003.safetensors", "mamba.layers.4.1.weight": "model-00001-of-00003.safetensors", "mamba.layers.40.0.A": "model-00002-of-00003.safetensors", "mamba.layers.40.0.D": "model-00002-of-00003.safetensors", "mamba.layers.40.0.conv.bias": "model-00002-of-00003.safetensors", "mamba.layers.40.0.conv.weight": "model-00002-of-00003.safetensors", "mamba.layers.40.0.in_proj.weight": "model-00002-of-00003.safetensors", "mamba.layers.40.0.out_proj.weight": "model-00002-of-00003.safetensors", "mamba.layers.40.0.s_B.weight": "model-00002-of-00003.safetensors", "mamba.layers.40.0.s_C.weight": "model-00002-of-00003.safetensors", "mamba.layers.40.0.s_D.0.weight": "model-00002-of-00003.safetensors", "mamba.layers.40.0.s_D.1.weight": "model-00002-of-00003.safetensors", "mamba.layers.40.1.weight": "model-00002-of-00003.safetensors", "mamba.layers.41.0.A": "model-00002-of-00003.safetensors", "mamba.layers.41.0.D": "model-00002-of-00003.safetensors", "mamba.layers.41.0.conv.bias": "model-00002-of-00003.safetensors", "mamba.layers.41.0.conv.weight": "model-00002-of-00003.safetensors", "mamba.layers.41.0.in_proj.weight": "model-00002-of-00003.safetensors", "mamba.layers.41.0.out_proj.weight": "model-00002-of-00003.safetensors", "mamba.layers.41.0.s_B.weight": "model-00002-of-00003.safetensors", "mamba.layers.41.0.s_C.weight": "model-00002-of-00003.safetensors", "mamba.layers.41.0.s_D.0.weight": "model-00002-of-00003.safetensors", "mamba.layers.41.0.s_D.1.weight": "model-00002-of-00003.safetensors", "mamba.layers.41.1.weight": "model-00002-of-00003.safetensors", "mamba.layers.42.0.A": "model-00002-of-00003.safetensors", "mamba.layers.42.0.D": "model-00002-of-00003.safetensors", "mamba.layers.42.0.conv.bias": "model-00002-of-00003.safetensors", "mamba.layers.42.0.conv.weight": "model-00002-of-00003.safetensors", "mamba.layers.42.0.in_proj.weight": "model-00002-of-00003.safetensors", "mamba.layers.42.0.out_proj.weight": "model-00002-of-00003.safetensors", "mamba.layers.42.0.s_B.weight": "model-00002-of-00003.safetensors", "mamba.layers.42.0.s_C.weight": "model-00002-of-00003.safetensors", "mamba.layers.42.0.s_D.0.weight": "model-00002-of-00003.safetensors", "mamba.layers.42.0.s_D.1.weight": "model-00002-of-00003.safetensors", "mamba.layers.42.1.weight": "model-00002-of-00003.safetensors", "mamba.layers.43.0.A": "model-00002-of-00003.safetensors", "mamba.layers.43.0.D": "model-00002-of-00003.safetensors", "mamba.layers.43.0.conv.bias": "model-00002-of-00003.safetensors", "mamba.layers.43.0.conv.weight": "model-00002-of-00003.safetensors", "mamba.layers.43.0.in_proj.weight": "model-00002-of-00003.safetensors", "mamba.layers.43.0.out_proj.weight": "model-00002-of-00003.safetensors", "mamba.layers.43.0.s_B.weight": "model-00002-of-00003.safetensors", "mamba.layers.43.0.s_C.weight": "model-00002-of-00003.safetensors", "mamba.layers.43.0.s_D.0.weight": "model-00002-of-00003.safetensors", "mamba.layers.43.0.s_D.1.weight": "model-00002-of-00003.safetensors", "mamba.layers.43.1.weight": "model-00002-of-00003.safetensors", "mamba.layers.44.0.A": "model-00002-of-00003.safetensors", "mamba.layers.44.0.D": "model-00002-of-00003.safetensors", "mamba.layers.44.0.conv.bias": "model-00002-of-00003.safetensors", "mamba.layers.44.0.conv.weight": "model-00002-of-00003.safetensors", "mamba.layers.44.0.in_proj.weight": "model-00002-of-00003.safetensors", "mamba.layers.44.0.out_proj.weight": "model-00002-of-00003.safetensors", "mamba.layers.44.0.s_B.weight": "model-00002-of-00003.safetensors", "mamba.layers.44.0.s_C.weight": "model-00002-of-00003.safetensors", "mamba.layers.44.0.s_D.0.weight": "model-00002-of-00003.safetensors", "mamba.layers.44.0.s_D.1.weight": "model-00002-of-00003.safetensors", "mamba.layers.44.1.weight": "model-00002-of-00003.safetensors", "mamba.layers.45.0.A": "model-00002-of-00003.safetensors", "mamba.layers.45.0.D": "model-00002-of-00003.safetensors", "mamba.layers.45.0.conv.bias": "model-00002-of-00003.safetensors", "mamba.layers.45.0.conv.weight": "model-00002-of-00003.safetensors", "mamba.layers.45.0.in_proj.weight": "model-00002-of-00003.safetensors", "mamba.layers.45.0.out_proj.weight": "model-00002-of-00003.safetensors", "mamba.layers.45.0.s_B.weight": "model-00002-of-00003.safetensors", "mamba.layers.45.0.s_C.weight": "model-00002-of-00003.safetensors", "mamba.layers.45.0.s_D.0.weight": "model-00002-of-00003.safetensors", "mamba.layers.45.0.s_D.1.weight": "model-00002-of-00003.safetensors", "mamba.layers.45.1.weight": "model-00002-of-00003.safetensors", "mamba.layers.46.0.A": "model-00002-of-00003.safetensors", "mamba.layers.46.0.D": "model-00002-of-00003.safetensors", "mamba.layers.46.0.conv.bias": "model-00002-of-00003.safetensors", "mamba.layers.46.0.conv.weight": "model-00002-of-00003.safetensors", "mamba.layers.46.0.in_proj.weight": "model-00002-of-00003.safetensors", "mamba.layers.46.0.out_proj.weight": "model-00002-of-00003.safetensors", "mamba.layers.46.0.s_B.weight": "model-00002-of-00003.safetensors", "mamba.layers.46.0.s_C.weight": "model-00002-of-00003.safetensors", "mamba.layers.46.0.s_D.0.weight": "model-00002-of-00003.safetensors", "mamba.layers.46.0.s_D.1.weight": "model-00002-of-00003.safetensors", "mamba.layers.46.1.weight": "model-00002-of-00003.safetensors", "mamba.layers.47.0.A": "model-00002-of-00003.safetensors", "mamba.layers.47.0.D": "model-00002-of-00003.safetensors", "mamba.layers.47.0.conv.bias": "model-00002-of-00003.safetensors", "mamba.layers.47.0.conv.weight": "model-00002-of-00003.safetensors", "mamba.layers.47.0.in_proj.weight": "model-00002-of-00003.safetensors", "mamba.layers.47.0.out_proj.weight": "model-00002-of-00003.safetensors", "mamba.layers.47.0.s_B.weight": "model-00002-of-00003.safetensors", "mamba.layers.47.0.s_C.weight": "model-00002-of-00003.safetensors", "mamba.layers.47.0.s_D.0.weight": "model-00002-of-00003.safetensors", "mamba.layers.47.0.s_D.1.weight": "model-00002-of-00003.safetensors", "mamba.layers.47.1.weight": "model-00002-of-00003.safetensors", "mamba.layers.48.0.A": "model-00002-of-00003.safetensors", "mamba.layers.48.0.D": "model-00002-of-00003.safetensors", "mamba.layers.48.0.conv.bias": "model-00002-of-00003.safetensors", "mamba.layers.48.0.conv.weight": "model-00002-of-00003.safetensors", "mamba.layers.48.0.in_proj.weight": "model-00002-of-00003.safetensors", "mamba.layers.48.0.out_proj.weight": "model-00002-of-00003.safetensors", "mamba.layers.48.0.s_B.weight": "model-00002-of-00003.safetensors", "mamba.layers.48.0.s_C.weight": "model-00002-of-00003.safetensors", "mamba.layers.48.0.s_D.0.weight": "model-00002-of-00003.safetensors", "mamba.layers.48.0.s_D.1.weight": "model-00002-of-00003.safetensors", "mamba.layers.48.1.weight": "model-00002-of-00003.safetensors", "mamba.layers.49.0.A": "model-00002-of-00003.safetensors", "mamba.layers.49.0.D": "model-00002-of-00003.safetensors", "mamba.layers.49.0.conv.bias": "model-00002-of-00003.safetensors", "mamba.layers.49.0.conv.weight": "model-00002-of-00003.safetensors", "mamba.layers.49.0.in_proj.weight": "model-00002-of-00003.safetensors", "mamba.layers.49.0.out_proj.weight": "model-00002-of-00003.safetensors", "mamba.layers.49.0.s_B.weight": "model-00002-of-00003.safetensors", "mamba.layers.49.0.s_C.weight": "model-00002-of-00003.safetensors", "mamba.layers.49.0.s_D.0.weight": "model-00002-of-00003.safetensors", "mamba.layers.49.0.s_D.1.weight": "model-00002-of-00003.safetensors", "mamba.layers.49.1.weight": "model-00002-of-00003.safetensors", "mamba.layers.5.0.A": "model-00001-of-00003.safetensors", "mamba.layers.5.0.D": "model-00001-of-00003.safetensors", "mamba.layers.5.0.conv.bias": "model-00001-of-00003.safetensors", "mamba.layers.5.0.conv.weight": "model-00001-of-00003.safetensors", "mamba.layers.5.0.in_proj.weight": "model-00001-of-00003.safetensors", "mamba.layers.5.0.out_proj.weight": "model-00001-of-00003.safetensors", "mamba.layers.5.0.s_B.weight": "model-00001-of-00003.safetensors", "mamba.layers.5.0.s_C.weight": "model-00001-of-00003.safetensors", "mamba.layers.5.0.s_D.0.weight": "model-00001-of-00003.safetensors", "mamba.layers.5.0.s_D.1.weight": "model-00001-of-00003.safetensors", "mamba.layers.5.1.weight": "model-00001-of-00003.safetensors", "mamba.layers.50.0.A": "model-00002-of-00003.safetensors", "mamba.layers.50.0.D": "model-00002-of-00003.safetensors", "mamba.layers.50.0.conv.bias": "model-00002-of-00003.safetensors", "mamba.layers.50.0.conv.weight": "model-00002-of-00003.safetensors", "mamba.layers.50.0.in_proj.weight": "model-00002-of-00003.safetensors", "mamba.layers.50.0.out_proj.weight": "model-00002-of-00003.safetensors", "mamba.layers.50.0.s_B.weight": "model-00002-of-00003.safetensors", "mamba.layers.50.0.s_C.weight": "model-00002-of-00003.safetensors", "mamba.layers.50.0.s_D.0.weight": "model-00002-of-00003.safetensors", "mamba.layers.50.0.s_D.1.weight": "model-00002-of-00003.safetensors", "mamba.layers.50.1.weight": "model-00002-of-00003.safetensors", "mamba.layers.51.0.A": "model-00002-of-00003.safetensors", "mamba.layers.51.0.D": "model-00002-of-00003.safetensors", "mamba.layers.51.0.conv.bias": "model-00002-of-00003.safetensors", "mamba.layers.51.0.conv.weight": "model-00002-of-00003.safetensors", "mamba.layers.51.0.in_proj.weight": "model-00002-of-00003.safetensors", "mamba.layers.51.0.out_proj.weight": "model-00002-of-00003.safetensors", "mamba.layers.51.0.s_B.weight": "model-00002-of-00003.safetensors", "mamba.layers.51.0.s_C.weight": "model-00002-of-00003.safetensors", "mamba.layers.51.0.s_D.0.weight": "model-00002-of-00003.safetensors", "mamba.layers.51.0.s_D.1.weight": "model-00002-of-00003.safetensors", "mamba.layers.51.1.weight": "model-00002-of-00003.safetensors", "mamba.layers.52.0.A": "model-00002-of-00003.safetensors", "mamba.layers.52.0.D": "model-00002-of-00003.safetensors", "mamba.layers.52.0.conv.bias": "model-00002-of-00003.safetensors", "mamba.layers.52.0.conv.weight": "model-00002-of-00003.safetensors", "mamba.layers.52.0.in_proj.weight": "model-00002-of-00003.safetensors", "mamba.layers.52.0.out_proj.weight": "model-00002-of-00003.safetensors", "mamba.layers.52.0.s_B.weight": "model-00002-of-00003.safetensors", "mamba.layers.52.0.s_C.weight": "model-00002-of-00003.safetensors", "mamba.layers.52.0.s_D.0.weight": "model-00002-of-00003.safetensors", "mamba.layers.52.0.s_D.1.weight": "model-00002-of-00003.safetensors", "mamba.layers.52.1.weight": "model-00002-of-00003.safetensors", "mamba.layers.53.0.A": "model-00002-of-00003.safetensors", "mamba.layers.53.0.D": "model-00002-of-00003.safetensors", "mamba.layers.53.0.conv.bias": "model-00002-of-00003.safetensors", "mamba.layers.53.0.conv.weight": "model-00002-of-00003.safetensors", "mamba.layers.53.0.in_proj.weight": "model-00002-of-00003.safetensors", "mamba.layers.53.0.out_proj.weight": "model-00002-of-00003.safetensors", "mamba.layers.53.0.s_B.weight": "model-00002-of-00003.safetensors", "mamba.layers.53.0.s_C.weight": "model-00002-of-00003.safetensors", "mamba.layers.53.0.s_D.0.weight": "model-00002-of-00003.safetensors", "mamba.layers.53.0.s_D.1.weight": "model-00002-of-00003.safetensors", "mamba.layers.53.1.weight": "model-00002-of-00003.safetensors", "mamba.layers.54.0.A": "model-00002-of-00003.safetensors", "mamba.layers.54.0.D": "model-00002-of-00003.safetensors", "mamba.layers.54.0.conv.bias": "model-00002-of-00003.safetensors", "mamba.layers.54.0.conv.weight": "model-00002-of-00003.safetensors", "mamba.layers.54.0.in_proj.weight": "model-00002-of-00003.safetensors", "mamba.layers.54.0.out_proj.weight": "model-00002-of-00003.safetensors", "mamba.layers.54.0.s_B.weight": "model-00002-of-00003.safetensors", "mamba.layers.54.0.s_C.weight": "model-00002-of-00003.safetensors", "mamba.layers.54.0.s_D.0.weight": "model-00002-of-00003.safetensors", "mamba.layers.54.0.s_D.1.weight": "model-00002-of-00003.safetensors", "mamba.layers.54.1.weight": "model-00002-of-00003.safetensors", "mamba.layers.55.0.A": "model-00002-of-00003.safetensors", "mamba.layers.55.0.D": "model-00002-of-00003.safetensors", "mamba.layers.55.0.conv.bias": "model-00002-of-00003.safetensors", "mamba.layers.55.0.conv.weight": "model-00002-of-00003.safetensors", "mamba.layers.55.0.in_proj.weight": "model-00002-of-00003.safetensors", "mamba.layers.55.0.out_proj.weight": "model-00002-of-00003.safetensors", "mamba.layers.55.0.s_B.weight": "model-00002-of-00003.safetensors", "mamba.layers.55.0.s_C.weight": "model-00002-of-00003.safetensors", "mamba.layers.55.0.s_D.0.weight": "model-00002-of-00003.safetensors", "mamba.layers.55.0.s_D.1.weight": "model-00002-of-00003.safetensors", "mamba.layers.55.1.weight": "model-00002-of-00003.safetensors", "mamba.layers.56.0.A": "model-00003-of-00003.safetensors", "mamba.layers.56.0.D": "model-00003-of-00003.safetensors", "mamba.layers.56.0.conv.bias": "model-00003-of-00003.safetensors", "mamba.layers.56.0.conv.weight": "model-00003-of-00003.safetensors", "mamba.layers.56.0.in_proj.weight": "model-00003-of-00003.safetensors", "mamba.layers.56.0.out_proj.weight": "model-00003-of-00003.safetensors", "mamba.layers.56.0.s_B.weight": "model-00003-of-00003.safetensors", "mamba.layers.56.0.s_C.weight": "model-00003-of-00003.safetensors", "mamba.layers.56.0.s_D.0.weight": "model-00003-of-00003.safetensors", "mamba.layers.56.0.s_D.1.weight": "model-00003-of-00003.safetensors", "mamba.layers.56.1.weight": "model-00003-of-00003.safetensors", "mamba.layers.57.0.A": "model-00003-of-00003.safetensors", "mamba.layers.57.0.D": "model-00003-of-00003.safetensors", "mamba.layers.57.0.conv.bias": "model-00003-of-00003.safetensors", "mamba.layers.57.0.conv.weight": "model-00003-of-00003.safetensors", "mamba.layers.57.0.in_proj.weight": "model-00003-of-00003.safetensors", "mamba.layers.57.0.out_proj.weight": "model-00003-of-00003.safetensors", "mamba.layers.57.0.s_B.weight": "model-00003-of-00003.safetensors", "mamba.layers.57.0.s_C.weight": "model-00003-of-00003.safetensors", "mamba.layers.57.0.s_D.0.weight": "model-00003-of-00003.safetensors", "mamba.layers.57.0.s_D.1.weight": "model-00003-of-00003.safetensors", "mamba.layers.57.1.weight": "model-00003-of-00003.safetensors", "mamba.layers.58.0.A": "model-00003-of-00003.safetensors", "mamba.layers.58.0.D": "model-00003-of-00003.safetensors", "mamba.layers.58.0.conv.bias": "model-00003-of-00003.safetensors", "mamba.layers.58.0.conv.weight": "model-00003-of-00003.safetensors", "mamba.layers.58.0.in_proj.weight": "model-00003-of-00003.safetensors", "mamba.layers.58.0.out_proj.weight": "model-00003-of-00003.safetensors", "mamba.layers.58.0.s_B.weight": "model-00003-of-00003.safetensors", "mamba.layers.58.0.s_C.weight": "model-00003-of-00003.safetensors", "mamba.layers.58.0.s_D.0.weight": "model-00003-of-00003.safetensors", "mamba.layers.58.0.s_D.1.weight": "model-00003-of-00003.safetensors", "mamba.layers.58.1.weight": "model-00003-of-00003.safetensors", "mamba.layers.59.0.A": "model-00003-of-00003.safetensors", "mamba.layers.59.0.D": "model-00003-of-00003.safetensors", "mamba.layers.59.0.conv.bias": "model-00003-of-00003.safetensors", "mamba.layers.59.0.conv.weight": "model-00003-of-00003.safetensors", "mamba.layers.59.0.in_proj.weight": "model-00003-of-00003.safetensors", "mamba.layers.59.0.out_proj.weight": "model-00003-of-00003.safetensors", "mamba.layers.59.0.s_B.weight": "model-00003-of-00003.safetensors", "mamba.layers.59.0.s_C.weight": "model-00003-of-00003.safetensors", "mamba.layers.59.0.s_D.0.weight": "model-00003-of-00003.safetensors", "mamba.layers.59.0.s_D.1.weight": "model-00003-of-00003.safetensors", "mamba.layers.59.1.weight": "model-00003-of-00003.safetensors", "mamba.layers.6.0.A": "model-00001-of-00003.safetensors", "mamba.layers.6.0.D": "model-00001-of-00003.safetensors", "mamba.layers.6.0.conv.bias": "model-00001-of-00003.safetensors", "mamba.layers.6.0.conv.weight": "model-00001-of-00003.safetensors", "mamba.layers.6.0.in_proj.weight": "model-00001-of-00003.safetensors", "mamba.layers.6.0.out_proj.weight": "model-00001-of-00003.safetensors", "mamba.layers.6.0.s_B.weight": "model-00001-of-00003.safetensors", "mamba.layers.6.0.s_C.weight": "model-00001-of-00003.safetensors", "mamba.layers.6.0.s_D.0.weight": "model-00001-of-00003.safetensors", "mamba.layers.6.0.s_D.1.weight": "model-00001-of-00003.safetensors", "mamba.layers.6.1.weight": "model-00001-of-00003.safetensors", "mamba.layers.60.0.A": "model-00003-of-00003.safetensors", "mamba.layers.60.0.D": "model-00003-of-00003.safetensors", "mamba.layers.60.0.conv.bias": "model-00003-of-00003.safetensors", "mamba.layers.60.0.conv.weight": "model-00003-of-00003.safetensors", "mamba.layers.60.0.in_proj.weight": "model-00003-of-00003.safetensors", "mamba.layers.60.0.out_proj.weight": "model-00003-of-00003.safetensors", "mamba.layers.60.0.s_B.weight": "model-00003-of-00003.safetensors", "mamba.layers.60.0.s_C.weight": "model-00003-of-00003.safetensors", "mamba.layers.60.0.s_D.0.weight": "model-00003-of-00003.safetensors", "mamba.layers.60.0.s_D.1.weight": "model-00003-of-00003.safetensors", "mamba.layers.60.1.weight": "model-00003-of-00003.safetensors", "mamba.layers.61.0.A": "model-00003-of-00003.safetensors", "mamba.layers.61.0.D": "model-00003-of-00003.safetensors", "mamba.layers.61.0.conv.bias": "model-00003-of-00003.safetensors", "mamba.layers.61.0.conv.weight": "model-00003-of-00003.safetensors", "mamba.layers.61.0.in_proj.weight": "model-00003-of-00003.safetensors", "mamba.layers.61.0.out_proj.weight": "model-00003-of-00003.safetensors", "mamba.layers.61.0.s_B.weight": "model-00003-of-00003.safetensors", "mamba.layers.61.0.s_C.weight": "model-00003-of-00003.safetensors", "mamba.layers.61.0.s_D.0.weight": "model-00003-of-00003.safetensors", "mamba.layers.61.0.s_D.1.weight": "model-00003-of-00003.safetensors", "mamba.layers.61.1.weight": "model-00003-of-00003.safetensors", "mamba.layers.62.0.A": "model-00003-of-00003.safetensors", "mamba.layers.62.0.D": "model-00003-of-00003.safetensors", "mamba.layers.62.0.conv.bias": "model-00003-of-00003.safetensors", "mamba.layers.62.0.conv.weight": "model-00003-of-00003.safetensors", "mamba.layers.62.0.in_proj.weight": "model-00003-of-00003.safetensors", "mamba.layers.62.0.out_proj.weight": "model-00003-of-00003.safetensors", "mamba.layers.62.0.s_B.weight": "model-00003-of-00003.safetensors", "mamba.layers.62.0.s_C.weight": "model-00003-of-00003.safetensors", "mamba.layers.62.0.s_D.0.weight": "model-00003-of-00003.safetensors", "mamba.layers.62.0.s_D.1.weight": "model-00003-of-00003.safetensors", "mamba.layers.62.1.weight": "model-00003-of-00003.safetensors", "mamba.layers.63.0.A": "model-00003-of-00003.safetensors", "mamba.layers.63.0.D": "model-00003-of-00003.safetensors", "mamba.layers.63.0.conv.bias": "model-00003-of-00003.safetensors", "mamba.layers.63.0.conv.weight": "model-00003-of-00003.safetensors", "mamba.layers.63.0.in_proj.weight": "model-00003-of-00003.safetensors", "mamba.layers.63.0.out_proj.weight": "model-00003-of-00003.safetensors", "mamba.layers.63.0.s_B.weight": "model-00003-of-00003.safetensors", "mamba.layers.63.0.s_C.weight": "model-00003-of-00003.safetensors", "mamba.layers.63.0.s_D.0.weight": "model-00003-of-00003.safetensors", "mamba.layers.63.0.s_D.1.weight": "model-00003-of-00003.safetensors", "mamba.layers.63.1.weight": "model-00003-of-00003.safetensors", "mamba.layers.7.0.A": "model-00001-of-00003.safetensors", "mamba.layers.7.0.D": "model-00001-of-00003.safetensors", "mamba.layers.7.0.conv.bias": "model-00001-of-00003.safetensors", "mamba.layers.7.0.conv.weight": "model-00001-of-00003.safetensors", "mamba.layers.7.0.in_proj.weight": "model-00001-of-00003.safetensors", "mamba.layers.7.0.out_proj.weight": "model-00001-of-00003.safetensors", "mamba.layers.7.0.s_B.weight": "model-00001-of-00003.safetensors", "mamba.layers.7.0.s_C.weight": "model-00001-of-00003.safetensors", "mamba.layers.7.0.s_D.0.weight": "model-00001-of-00003.safetensors", "mamba.layers.7.0.s_D.1.weight": "model-00001-of-00003.safetensors", "mamba.layers.7.1.weight": "model-00001-of-00003.safetensors", "mamba.layers.8.0.A": "model-00001-of-00003.safetensors", "mamba.layers.8.0.D": "model-00001-of-00003.safetensors", "mamba.layers.8.0.conv.bias": "model-00001-of-00003.safetensors", "mamba.layers.8.0.conv.weight": "model-00001-of-00003.safetensors", "mamba.layers.8.0.in_proj.weight": "model-00001-of-00003.safetensors", "mamba.layers.8.0.out_proj.weight": "model-00001-of-00003.safetensors", "mamba.layers.8.0.s_B.weight": "model-00001-of-00003.safetensors", "mamba.layers.8.0.s_C.weight": "model-00001-of-00003.safetensors", "mamba.layers.8.0.s_D.0.weight": "model-00001-of-00003.safetensors", "mamba.layers.8.0.s_D.1.weight": "model-00001-of-00003.safetensors", "mamba.layers.8.1.weight": "model-00001-of-00003.safetensors", "mamba.layers.9.0.A": "model-00001-of-00003.safetensors", "mamba.layers.9.0.D": "model-00001-of-00003.safetensors", "mamba.layers.9.0.conv.bias": "model-00001-of-00003.safetensors", "mamba.layers.9.0.conv.weight": "model-00001-of-00003.safetensors", "mamba.layers.9.0.in_proj.weight": "model-00001-of-00003.safetensors", "mamba.layers.9.0.out_proj.weight": "model-00001-of-00003.safetensors", "mamba.layers.9.0.s_B.weight": "model-00001-of-00003.safetensors", "mamba.layers.9.0.s_C.weight": "model-00001-of-00003.safetensors", "mamba.layers.9.0.s_D.0.weight": "model-00001-of-00003.safetensors", "mamba.layers.9.0.s_D.1.weight": "model-00001-of-00003.safetensors", "mamba.layers.9.1.weight": "model-00001-of-00003.safetensors", "proj.bias": "model-00003-of-00003.safetensors", "proj.weight": "model-00003-of-00003.safetensors" } }