WizardMath-7B-V1.1-q4f16_1-MLC / ndarray-cache.json
CharlieFRuan's picture
Initial commit
7af377a
raw
history blame contribute delete
No virus
146 kB
{
"metadata": {
"ParamSize": 325,
"ParamBytes": 4073857024.0,
"BitsPerParam": 4.50042279387851
},
"records": [
{
"dataPath": "params_shard_0.bin",
"format": "raw-shard",
"nbytes": 65536000,
"records": [
{
"name": "lm_head.q_weight",
"shape": [
32000,
512
],
"dtype": "uint32",
"format": "raw",
"nbytes": 65536000,
"byteOffset": 0
}
],
"md5sum": "ace7eb94df55d610d5eeef237303115a"
},
{
"dataPath": "params_shard_1.bin",
"format": "raw-shard",
"nbytes": 29360128,
"records": [
{
"name": "model.layers.22.mlp.down_proj.q_weight",
"shape": [
4096,
1792
],
"dtype": "uint32",
"format": "raw",
"nbytes": 29360128,
"byteOffset": 0
}
],
"md5sum": "0bb2e7e43b2fcfb95ac13026d50fa329"
},
{
"dataPath": "params_shard_2.bin",
"format": "raw-shard",
"nbytes": 58720256,
"records": [
{
"name": "model.layers.22.mlp.gate_up_proj.q_weight",
"shape": [
28672,
512
],
"dtype": "uint32",
"format": "raw",
"nbytes": 58720256,
"byteOffset": 0
}
],
"md5sum": "6415c76f6b49e7ae20bf0145b4b0a7d0"
},
{
"dataPath": "params_shard_3.bin",
"format": "raw-shard",
"nbytes": 29360128,
"records": [
{
"name": "model.layers.23.mlp.down_proj.q_weight",
"shape": [
4096,
1792
],
"dtype": "uint32",
"format": "raw",
"nbytes": 29360128,
"byteOffset": 0
}
],
"md5sum": "8db8bce75cc9fc39276b4c64b6919341"
},
{
"dataPath": "params_shard_4.bin",
"format": "raw-shard",
"nbytes": 58720256,
"records": [
{
"name": "model.layers.23.mlp.gate_up_proj.q_weight",
"shape": [
28672,
512
],
"dtype": "uint32",
"format": "raw",
"nbytes": 58720256,
"byteOffset": 0
}
],
"md5sum": "a0a39e3d000ea1ff6de6ddf67c9cf8ec"
},
{
"dataPath": "params_shard_5.bin",
"format": "raw-shard",
"nbytes": 30244864,
"records": [
{
"name": "lm_head.q_scale",
"shape": [
32000,
128
],
"dtype": "float16",
"format": "raw",
"nbytes": 8192000,
"byteOffset": 0
},
{
"name": "model.layers.22.input_layernorm.weight",
"shape": [
4096
],
"dtype": "float16",
"format": "raw",
"nbytes": 8192,
"byteOffset": 8192000
},
{
"name": "model.layers.22.mlp.down_proj.q_scale",
"shape": [
4096,
448
],
"dtype": "float16",
"format": "raw",
"nbytes": 3670016,
"byteOffset": 8200192
},
{
"name": "model.layers.22.mlp.gate_up_proj.q_scale",
"shape": [
28672,
128
],
"dtype": "float16",
"format": "raw",
"nbytes": 7340032,
"byteOffset": 11870208
},
{
"name": "model.layers.22.post_attention_layernorm.weight",
"shape": [
4096
],
"dtype": "float16",
"format": "raw",
"nbytes": 8192,
"byteOffset": 19210240
},
{
"name": "model.layers.23.input_layernorm.weight",
"shape": [
4096
],
"dtype": "float16",
"format": "raw",
"nbytes": 8192,
"byteOffset": 19218432
},
{
"name": "model.layers.23.mlp.down_proj.q_scale",
"shape": [
4096,
448
],
"dtype": "float16",
"format": "raw",
"nbytes": 3670016,
"byteOffset": 19226624
},
{
"name": "model.layers.23.mlp.gate_up_proj.q_scale",
"shape": [
28672,
128
],
"dtype": "float16",
"format": "raw",
"nbytes": 7340032,
"byteOffset": 22896640
},
{
"name": "model.layers.23.post_attention_layernorm.weight",
"shape": [
4096
],
"dtype": "float16",
"format": "raw",
"nbytes": 8192,
"byteOffset": 30236672
}
],
"md5sum": "6d318e1a0773fa9a388b45f7224b47e3"
},
{
"dataPath": "params_shard_6.bin",
"format": "raw-shard",
"nbytes": 29360128,
"records": [
{
"name": "model.layers.24.mlp.down_proj.q_weight",
"shape": [
4096,
1792
],
"dtype": "uint32",
"format": "raw",
"nbytes": 29360128,
"byteOffset": 0
}
],
"md5sum": "06d388fab3f753bacc831083fe51c50d"
},
{
"dataPath": "params_shard_7.bin",
"format": "raw-shard",
"nbytes": 58720256,
"records": [
{
"name": "model.layers.24.mlp.gate_up_proj.q_weight",
"shape": [
28672,
512
],
"dtype": "uint32",
"format": "raw",
"nbytes": 58720256,
"byteOffset": 0
}
],
"md5sum": "0206d6098244154ecd0b9a5b4d302c51"
},
{
"dataPath": "params_shard_8.bin",
"format": "raw-shard",
"nbytes": 27271168,
"records": [
{
"name": "model.layers.23.self_attn.qkv_proj.q_weight",
"shape": [
6144,
512
],
"dtype": "uint32",
"format": "raw",
"nbytes": 12582912,
"byteOffset": 0
},
{
"name": "model.layers.23.self_attn.qkv_proj.q_scale",
"shape": [
6144,
128
],
"dtype": "float16",
"format": "raw",
"nbytes": 1572864,
"byteOffset": 12582912
},
{
"name": "model.layers.23.self_attn.o_proj.q_weight",
"shape": [
4096,
512
],
"dtype": "uint32",
"format": "raw",
"nbytes": 8388608,
"byteOffset": 14155776
},
{
"name": "model.layers.23.self_attn.o_proj.q_scale",
"shape": [
4096,
128
],
"dtype": "float16",
"format": "raw",
"nbytes": 1048576,
"byteOffset": 22544384
},
{
"name": "model.layers.24.input_layernorm.weight",
"shape": [
4096
],
"dtype": "float16",
"format": "raw",
"nbytes": 8192,
"byteOffset": 23592960
},
{
"name": "model.layers.24.mlp.down_proj.q_scale",
"shape": [
4096,
448
],
"dtype": "float16",
"format": "raw",
"nbytes": 3670016,
"byteOffset": 23601152
}
],
"md5sum": "09fa45f6a4d81b1131046a4d36738177"
},
{
"dataPath": "params_shard_9.bin",
"format": "raw-shard",
"nbytes": 29360128,
"records": [
{
"name": "model.layers.25.mlp.down_proj.q_weight",
"shape": [
4096,
1792
],
"dtype": "uint32",
"format": "raw",
"nbytes": 29360128,
"byteOffset": 0
}
],
"md5sum": "f3834f2af378857b169e78cee45a4ead"
},
{
"dataPath": "params_shard_10.bin",
"format": "raw-shard",
"nbytes": 30949376,
"records": [
{
"name": "model.layers.24.mlp.gate_up_proj.q_scale",
"shape": [
28672,
128
],
"dtype": "float16",
"format": "raw",
"nbytes": 7340032,
"byteOffset": 0
},
{
"name": "model.layers.24.post_attention_layernorm.weight",
"shape": [
4096
],
"dtype": "float16",
"format": "raw",
"nbytes": 8192,
"byteOffset": 7340032
},
{
"name": "model.layers.24.self_attn.qkv_proj.q_weight",
"shape": [
6144,
512
],
"dtype": "uint32",
"format": "raw",
"nbytes": 12582912,
"byteOffset": 7348224
},
{
"name": "model.layers.24.self_attn.qkv_proj.q_scale",
"shape": [
6144,
128
],
"dtype": "float16",
"format": "raw",
"nbytes": 1572864,
"byteOffset": 19931136
},
{
"name": "model.layers.24.self_attn.o_proj.q_weight",
"shape": [
4096,
512
],
"dtype": "uint32",
"format": "raw",
"nbytes": 8388608,
"byteOffset": 21504000
},
{
"name": "model.layers.24.self_attn.o_proj.q_scale",
"shape": [
4096,
128
],
"dtype": "float16",
"format": "raw",
"nbytes": 1048576,
"byteOffset": 29892608
},
{
"name": "model.layers.25.input_layernorm.weight",
"shape": [
4096
],
"dtype": "float16",
"format": "raw",
"nbytes": 8192,
"byteOffset": 30941184
}
],
"md5sum": "37e4349ddbea383c04498a9a0b8c6e41"
},
{
"dataPath": "params_shard_11.bin",
"format": "raw-shard",
"nbytes": 58720256,
"records": [
{
"name": "model.layers.25.mlp.gate_up_proj.q_weight",
"shape": [
28672,
512
],
"dtype": "uint32",
"format": "raw",
"nbytes": 58720256,
"byteOffset": 0
}
],
"md5sum": "451fec3d24a7e7feea5623ae7c6c336f"
},
{
"dataPath": "params_shard_12.bin",
"format": "raw-shard",
"nbytes": 25174016,
"records": [
{
"name": "model.layers.25.mlp.down_proj.q_scale",
"shape": [
4096,
448
],
"dtype": "float16",
"format": "raw",
"nbytes": 3670016,
"byteOffset": 0
},
{
"name": "model.layers.25.mlp.gate_up_proj.q_scale",
"shape": [
28672,
128
],
"dtype": "float16",
"format": "raw",
"nbytes": 7340032,
"byteOffset": 3670016
},
{
"name": "model.layers.25.post_attention_layernorm.weight",
"shape": [
4096
],
"dtype": "float16",
"format": "raw",
"nbytes": 8192,
"byteOffset": 11010048
},
{
"name": "model.layers.25.self_attn.qkv_proj.q_weight",
"shape": [
6144,
512
],
"dtype": "uint32",
"format": "raw",
"nbytes": 12582912,
"byteOffset": 11018240
},
{
"name": "model.layers.25.self_attn.qkv_proj.q_scale",
"shape": [
6144,
128
],
"dtype": "float16",
"format": "raw",
"nbytes": 1572864,
"byteOffset": 23601152
}
],
"md5sum": "903395edbf9f287c2046017f2fe1b3b2"
},
{
"dataPath": "params_shard_13.bin",
"format": "raw-shard",
"nbytes": 29360128,
"records": [
{
"name": "model.layers.26.mlp.down_proj.q_weight",
"shape": [
4096,
1792
],
"dtype": "uint32",
"format": "raw",
"nbytes": 29360128,
"byteOffset": 0
}
],
"md5sum": "c3996d9e250c6c2092c845be082a288f"
},
{
"dataPath": "params_shard_14.bin",
"format": "raw-shard",
"nbytes": 58720256,
"records": [
{
"name": "model.layers.26.mlp.gate_up_proj.q_weight",
"shape": [
28672,
512
],
"dtype": "uint32",
"format": "raw",
"nbytes": 58720256,
"byteOffset": 0
}
],
"md5sum": "4fc716d73db81f587b2615262e14a6ba"
},
{
"dataPath": "params_shard_15.bin",
"format": "raw-shard",
"nbytes": 33046528,
"records": [
{
"name": "model.layers.25.self_attn.o_proj.q_weight",
"shape": [
4096,
512
],
"dtype": "uint32",
"format": "raw",
"nbytes": 8388608,
"byteOffset": 0
},
{
"name": "model.layers.25.self_attn.o_proj.q_scale",
"shape": [
4096,
128
],
"dtype": "float16",
"format": "raw",
"nbytes": 1048576,
"byteOffset": 8388608
},
{
"name": "model.layers.26.input_layernorm.weight",
"shape": [
4096
],
"dtype": "float16",
"format": "raw",
"nbytes": 8192,
"byteOffset": 9437184
},
{
"name": "model.layers.26.mlp.down_proj.q_scale",
"shape": [
4096,
448
],
"dtype": "float16",
"format": "raw",
"nbytes": 3670016,
"byteOffset": 9445376
},
{
"name": "model.layers.26.mlp.gate_up_proj.q_scale",
"shape": [
28672,
128
],
"dtype": "float16",
"format": "raw",
"nbytes": 7340032,
"byteOffset": 13115392
},
{
"name": "model.layers.26.post_attention_layernorm.weight",
"shape": [
4096
],
"dtype": "float16",
"format": "raw",
"nbytes": 8192,
"byteOffset": 20455424
},
{
"name": "model.layers.26.self_attn.qkv_proj.q_weight",
"shape": [
6144,
512
],
"dtype": "uint32",
"format": "raw",
"nbytes": 12582912,
"byteOffset": 20463616
}
],
"md5sum": "7a927fc60034d08b298576bbc344523b"
},
{
"dataPath": "params_shard_16.bin",
"format": "raw-shard",
"nbytes": 29360128,
"records": [
{
"name": "model.layers.27.mlp.down_proj.q_weight",
"shape": [
4096,
1792
],
"dtype": "uint32",
"format": "raw",
"nbytes": 29360128,
"byteOffset": 0
}
],
"md5sum": "ca43eb3a661bba620a0319130f52d14a"
},
{
"dataPath": "params_shard_17.bin",
"format": "raw-shard",
"nbytes": 58720256,
"records": [
{
"name": "model.layers.27.mlp.gate_up_proj.q_weight",
"shape": [
28672,
512
],
"dtype": "uint32",
"format": "raw",
"nbytes": 58720256,
"byteOffset": 0
}
],
"md5sum": "7700c5d925154bdf3c43c5d9ed8c6ba4"
},
{
"dataPath": "params_shard_18.bin",
"format": "raw-shard",
"nbytes": 22036480,
"records": [
{
"name": "model.layers.26.self_attn.qkv_proj.q_scale",
"shape": [
6144,
128
],
"dtype": "float16",
"format": "raw",
"nbytes": 1572864,
"byteOffset": 0
},
{
"name": "model.layers.26.self_attn.o_proj.q_weight",
"shape": [
4096,
512
],
"dtype": "uint32",
"format": "raw",
"nbytes": 8388608,
"byteOffset": 1572864
},
{
"name": "model.layers.26.self_attn.o_proj.q_scale",
"shape": [
4096,
128
],
"dtype": "float16",
"format": "raw",
"nbytes": 1048576,
"byteOffset": 9961472
},
{
"name": "model.layers.27.input_layernorm.weight",
"shape": [
4096
],
"dtype": "float16",
"format": "raw",
"nbytes": 8192,
"byteOffset": 11010048
},
{
"name": "model.layers.27.mlp.down_proj.q_scale",
"shape": [
4096,
448
],
"dtype": "float16",
"format": "raw",
"nbytes": 3670016,
"byteOffset": 11018240
},
{
"name": "model.layers.27.mlp.gate_up_proj.q_scale",
"shape": [
28672,
128
],
"dtype": "float16",
"format": "raw",
"nbytes": 7340032,
"byteOffset": 14688256
},
{
"name": "model.layers.27.post_attention_layernorm.weight",
"shape": [
4096
],
"dtype": "float16",
"format": "raw",
"nbytes": 8192,
"byteOffset": 22028288
}
],
"md5sum": "e92e497528c41ff16600319f8dbe275a"
},
{
"dataPath": "params_shard_19.bin",
"format": "raw-shard",
"nbytes": 29360128,
"records": [
{
"name": "model.layers.28.mlp.down_proj.q_weight",
"shape": [
4096,
1792
],
"dtype": "uint32",
"format": "raw",
"nbytes": 29360128,
"byteOffset": 0
}
],
"md5sum": "00ce42fadb12ea1feb127e4a6bc74efb"
},
{
"dataPath": "params_shard_20.bin",
"format": "raw-shard",
"nbytes": 58720256,
"records": [
{
"name": "model.layers.28.mlp.gate_up_proj.q_weight",
"shape": [
28672,
512
],
"dtype": "uint32",
"format": "raw",
"nbytes": 58720256,
"byteOffset": 0
}
],
"md5sum": "2378d20ee0b37fc9d7fce6a4c865b30b"
},
{
"dataPath": "params_shard_21.bin",
"format": "raw-shard",
"nbytes": 27271168,
"records": [
{
"name": "model.layers.27.self_attn.qkv_proj.q_weight",
"shape": [
6144,
512
],
"dtype": "uint32",
"format": "raw",
"nbytes": 12582912,
"byteOffset": 0
},
{
"name": "model.layers.27.self_attn.qkv_proj.q_scale",
"shape": [
6144,
128
],
"dtype": "float16",
"format": "raw",
"nbytes": 1572864,
"byteOffset": 12582912
},
{
"name": "model.layers.27.self_attn.o_proj.q_weight",
"shape": [
4096,
512
],
"dtype": "uint32",
"format": "raw",
"nbytes": 8388608,
"byteOffset": 14155776
},
{
"name": "model.layers.27.self_attn.o_proj.q_scale",
"shape": [
4096,
128
],
"dtype": "float16",
"format": "raw",
"nbytes": 1048576,
"byteOffset": 22544384
},
{
"name": "model.layers.28.input_layernorm.weight",
"shape": [
4096
],
"dtype": "float16",
"format": "raw",
"nbytes": 8192,
"byteOffset": 23592960
},
{
"name": "model.layers.28.mlp.down_proj.q_scale",
"shape": [
4096,
448
],
"dtype": "float16",
"format": "raw",
"nbytes": 3670016,
"byteOffset": 23601152
}
],
"md5sum": "25592bf791dde896bc485158a6b394f4"
},
{
"dataPath": "params_shard_22.bin",
"format": "raw-shard",
"nbytes": 29360128,
"records": [
{
"name": "model.layers.29.mlp.down_proj.q_weight",
"shape": [
4096,
1792
],
"dtype": "uint32",
"format": "raw",
"nbytes": 29360128,
"byteOffset": 0
}
],
"md5sum": "41d676d45493d878c17f2b8b49734cd1"
},
{
"dataPath": "params_shard_23.bin",
"format": "raw-shard",
"nbytes": 30949376,
"records": [
{
"name": "model.layers.28.mlp.gate_up_proj.q_scale",
"shape": [
28672,
128
],
"dtype": "float16",
"format": "raw",
"nbytes": 7340032,
"byteOffset": 0
},
{
"name": "model.layers.28.post_attention_layernorm.weight",
"shape": [
4096
],
"dtype": "float16",
"format": "raw",
"nbytes": 8192,
"byteOffset": 7340032
},
{
"name": "model.layers.28.self_attn.qkv_proj.q_weight",
"shape": [
6144,
512
],
"dtype": "uint32",
"format": "raw",
"nbytes": 12582912,
"byteOffset": 7348224
},
{
"name": "model.layers.28.self_attn.qkv_proj.q_scale",
"shape": [
6144,
128
],
"dtype": "float16",
"format": "raw",
"nbytes": 1572864,
"byteOffset": 19931136
},
{
"name": "model.layers.28.self_attn.o_proj.q_weight",
"shape": [
4096,
512
],
"dtype": "uint32",
"format": "raw",
"nbytes": 8388608,
"byteOffset": 21504000
},
{
"name": "model.layers.28.self_attn.o_proj.q_scale",
"shape": [
4096,
128
],
"dtype": "float16",
"format": "raw",
"nbytes": 1048576,
"byteOffset": 29892608
},
{
"name": "model.layers.29.input_layernorm.weight",
"shape": [
4096
],
"dtype": "float16",
"format": "raw",
"nbytes": 8192,
"byteOffset": 30941184
}
],
"md5sum": "460b7d33e582462c02d5a940c9e6a74c"
},
{
"dataPath": "params_shard_24.bin",
"format": "raw-shard",
"nbytes": 58720256,
"records": [
{
"name": "model.layers.29.mlp.gate_up_proj.q_weight",
"shape": [
28672,
512
],
"dtype": "uint32",
"format": "raw",
"nbytes": 58720256,
"byteOffset": 0
}
],
"md5sum": "9c558b961fcfef45eadb2101550725b2"
},
{
"dataPath": "params_shard_25.bin",
"format": "raw-shard",
"nbytes": 25174016,
"records": [
{
"name": "model.layers.29.mlp.down_proj.q_scale",
"shape": [
4096,
448
],
"dtype": "float16",
"format": "raw",
"nbytes": 3670016,
"byteOffset": 0
},
{
"name": "model.layers.29.mlp.gate_up_proj.q_scale",
"shape": [
28672,
128
],
"dtype": "float16",
"format": "raw",
"nbytes": 7340032,
"byteOffset": 3670016
},
{
"name": "model.layers.29.post_attention_layernorm.weight",
"shape": [
4096
],
"dtype": "float16",
"format": "raw",
"nbytes": 8192,
"byteOffset": 11010048
},
{
"name": "model.layers.29.self_attn.qkv_proj.q_weight",
"shape": [
6144,
512
],
"dtype": "uint32",
"format": "raw",
"nbytes": 12582912,
"byteOffset": 11018240
},
{
"name": "model.layers.29.self_attn.qkv_proj.q_scale",
"shape": [
6144,
128
],
"dtype": "float16",
"format": "raw",
"nbytes": 1572864,
"byteOffset": 23601152
}
],
"md5sum": "c37edf353eef4e73f29c01cb816b4656"
},
{
"dataPath": "params_shard_26.bin",
"format": "raw-shard",
"nbytes": 29360128,
"records": [
{
"name": "model.layers.30.mlp.down_proj.q_weight",
"shape": [
4096,
1792
],
"dtype": "uint32",
"format": "raw",
"nbytes": 29360128,
"byteOffset": 0
}
],
"md5sum": "4c65f1edfc67b938a3e918d9a23100cd"
},
{
"dataPath": "params_shard_27.bin",
"format": "raw-shard",
"nbytes": 58720256,
"records": [
{
"name": "model.layers.30.mlp.gate_up_proj.q_weight",
"shape": [
28672,
512
],
"dtype": "uint32",
"format": "raw",
"nbytes": 58720256,
"byteOffset": 0
}
],
"md5sum": "5683a94b049c30714893c2e6ec3cb06f"
},
{
"dataPath": "params_shard_28.bin",
"format": "raw-shard",
"nbytes": 33046528,
"records": [
{
"name": "model.layers.29.self_attn.o_proj.q_weight",
"shape": [
4096,
512
],
"dtype": "uint32",
"format": "raw",
"nbytes": 8388608,
"byteOffset": 0
},
{
"name": "model.layers.29.self_attn.o_proj.q_scale",
"shape": [
4096,
128
],
"dtype": "float16",
"format": "raw",
"nbytes": 1048576,
"byteOffset": 8388608
},
{
"name": "model.layers.30.input_layernorm.weight",
"shape": [
4096
],
"dtype": "float16",
"format": "raw",
"nbytes": 8192,
"byteOffset": 9437184
},
{
"name": "model.layers.30.mlp.down_proj.q_scale",
"shape": [
4096,
448
],
"dtype": "float16",
"format": "raw",
"nbytes": 3670016,
"byteOffset": 9445376
},
{
"name": "model.layers.30.mlp.gate_up_proj.q_scale",
"shape": [
28672,
128
],
"dtype": "float16",
"format": "raw",
"nbytes": 7340032,
"byteOffset": 13115392
},
{
"name": "model.layers.30.post_attention_layernorm.weight",
"shape": [
4096
],
"dtype": "float16",
"format": "raw",
"nbytes": 8192,
"byteOffset": 20455424
},
{
"name": "model.layers.30.self_attn.qkv_proj.q_weight",
"shape": [
6144,
512
],
"dtype": "uint32",
"format": "raw",
"nbytes": 12582912,
"byteOffset": 20463616
}
],
"md5sum": "22c2149f5102a9927b388654502c5978"
},
{
"dataPath": "params_shard_29.bin",
"format": "raw-shard",
"nbytes": 29360128,
"records": [
{
"name": "model.layers.31.mlp.down_proj.q_weight",
"shape": [
4096,
1792
],
"dtype": "uint32",
"format": "raw",
"nbytes": 29360128,
"byteOffset": 0
}
],
"md5sum": "ccce7d99674d64efa59a1b2e2a7efc3c"
},
{
"dataPath": "params_shard_30.bin",
"format": "raw-shard",
"nbytes": 58720256,
"records": [
{
"name": "model.layers.31.mlp.gate_up_proj.q_weight",
"shape": [
28672,
512
],
"dtype": "uint32",
"format": "raw",
"nbytes": 58720256,
"byteOffset": 0
}
],
"md5sum": "a00dc9891bacb214ac708cba32887363"
},
{
"dataPath": "params_shard_31.bin",
"format": "raw-shard",
"nbytes": 22036480,
"records": [
{
"name": "model.layers.30.self_attn.qkv_proj.q_scale",
"shape": [
6144,
128
],
"dtype": "float16",
"format": "raw",
"nbytes": 1572864,
"byteOffset": 0
},
{
"name": "model.layers.30.self_attn.o_proj.q_weight",
"shape": [
4096,
512
],
"dtype": "uint32",
"format": "raw",
"nbytes": 8388608,
"byteOffset": 1572864
},
{
"name": "model.layers.30.self_attn.o_proj.q_scale",
"shape": [
4096,
128
],
"dtype": "float16",
"format": "raw",
"nbytes": 1048576,
"byteOffset": 9961472
},
{
"name": "model.layers.31.input_layernorm.weight",
"shape": [
4096
],
"dtype": "float16",
"format": "raw",
"nbytes": 8192,
"byteOffset": 11010048
},
{
"name": "model.layers.31.mlp.down_proj.q_scale",
"shape": [
4096,
448
],
"dtype": "float16",
"format": "raw",
"nbytes": 3670016,
"byteOffset": 11018240
},
{
"name": "model.layers.31.mlp.gate_up_proj.q_scale",
"shape": [
28672,
128
],
"dtype": "float16",
"format": "raw",
"nbytes": 7340032,
"byteOffset": 14688256
},
{
"name": "model.layers.31.post_attention_layernorm.weight",
"shape": [
4096
],
"dtype": "float16",
"format": "raw",
"nbytes": 8192,
"byteOffset": 22028288
}
],
"md5sum": "6f418c569389305d68e7536fc875cacb"
},
{
"dataPath": "params_shard_32.bin",
"format": "raw-shard",
"nbytes": 65536000,
"records": [
{
"name": "model.embed_tokens.q_weight",
"shape": [
32000,
512
],
"dtype": "uint32",
"format": "raw",
"nbytes": 65536000,
"byteOffset": 0
}
],
"md5sum": "969ae7ded2094e6a5a41c1707085f5b5"
},
{
"dataPath": "params_shard_33.bin",
"format": "raw-shard",
"nbytes": 29360128,
"records": [
{
"name": "model.layers.0.mlp.down_proj.q_weight",
"shape": [
4096,
1792
],
"dtype": "uint32",
"format": "raw",
"nbytes": 29360128,
"byteOffset": 0
}
],
"md5sum": "056efa21bc1c48d0bd9bce3c598fb93f"
},
{
"dataPath": "params_shard_34.bin",
"format": "raw-shard",
"nbytes": 31801344,
"records": [
{
"name": "model.layers.31.self_attn.qkv_proj.q_weight",
"shape": [
6144,
512
],
"dtype": "uint32",
"format": "raw",
"nbytes": 12582912,
"byteOffset": 0
},
{
"name": "model.layers.31.self_attn.qkv_proj.q_scale",
"shape": [
6144,
128
],
"dtype": "float16",
"format": "raw",
"nbytes": 1572864,
"byteOffset": 12582912
},
{
"name": "model.layers.31.self_attn.o_proj.q_weight",
"shape": [
4096,
512
],
"dtype": "uint32",
"format": "raw",
"nbytes": 8388608,
"byteOffset": 14155776
},
{
"name": "model.layers.31.self_attn.o_proj.q_scale",
"shape": [
4096,
128
],
"dtype": "float16",
"format": "raw",
"nbytes": 1048576,
"byteOffset": 22544384
},
{
"name": "model.norm.weight",
"shape": [
4096
],
"dtype": "float16",
"format": "raw",
"nbytes": 8192,
"byteOffset": 23592960
},
{
"name": "model.embed_tokens.q_scale",
"shape": [
32000,
128
],
"dtype": "float16",
"format": "raw",
"nbytes": 8192000,
"byteOffset": 23601152
},
{
"name": "model.layers.0.input_layernorm.weight",
"shape": [
4096
],
"dtype": "float16",
"format": "raw",
"nbytes": 8192,
"byteOffset": 31793152
}
],
"md5sum": "7d068c4a3114f58217434da65d0f1ca7"
},
{
"dataPath": "params_shard_35.bin",
"format": "raw-shard",
"nbytes": 58720256,
"records": [
{
"name": "model.layers.0.mlp.gate_up_proj.q_weight",
"shape": [
28672,
512
],
"dtype": "uint32",
"format": "raw",
"nbytes": 58720256,
"byteOffset": 0
}
],
"md5sum": "9c3c2abbe090da38e040aad13cb9e468"
},
{
"dataPath": "params_shard_36.bin",
"format": "raw-shard",
"nbytes": 25174016,
"records": [
{
"name": "model.layers.0.mlp.down_proj.q_scale",
"shape": [
4096,
448
],
"dtype": "float16",
"format": "raw",
"nbytes": 3670016,
"byteOffset": 0
},
{
"name": "model.layers.0.mlp.gate_up_proj.q_scale",
"shape": [
28672,
128
],
"dtype": "float16",
"format": "raw",
"nbytes": 7340032,
"byteOffset": 3670016
},
{
"name": "model.layers.0.post_attention_layernorm.weight",
"shape": [
4096
],
"dtype": "float16",
"format": "raw",
"nbytes": 8192,
"byteOffset": 11010048
},
{
"name": "model.layers.0.self_attn.qkv_proj.q_weight",
"shape": [
6144,
512
],
"dtype": "uint32",
"format": "raw",
"nbytes": 12582912,
"byteOffset": 11018240
},
{
"name": "model.layers.0.self_attn.qkv_proj.q_scale",
"shape": [
6144,
128
],
"dtype": "float16",
"format": "raw",
"nbytes": 1572864,
"byteOffset": 23601152
}
],
"md5sum": "6f156809a0828bb2f74e7fed1d0ceed5"
},
{
"dataPath": "params_shard_37.bin",
"format": "raw-shard",
"nbytes": 29360128,
"records": [
{
"name": "model.layers.1.mlp.down_proj.q_weight",
"shape": [
4096,
1792
],
"dtype": "uint32",
"format": "raw",
"nbytes": 29360128,
"byteOffset": 0
}
],
"md5sum": "27ad122e3a4a167205e6409f6923c2bf"
},
{
"dataPath": "params_shard_38.bin",
"format": "raw-shard",
"nbytes": 58720256,
"records": [
{
"name": "model.layers.1.mlp.gate_up_proj.q_weight",
"shape": [
28672,
512
],
"dtype": "uint32",
"format": "raw",
"nbytes": 58720256,
"byteOffset": 0
}
],
"md5sum": "d1aa72ca765b05e356be967eb55da5b2"
},
{
"dataPath": "params_shard_39.bin",
"format": "raw-shard",
"nbytes": 33046528,
"records": [
{
"name": "model.layers.0.self_attn.o_proj.q_weight",
"shape": [
4096,
512
],
"dtype": "uint32",
"format": "raw",
"nbytes": 8388608,
"byteOffset": 0
},
{
"name": "model.layers.0.self_attn.o_proj.q_scale",
"shape": [
4096,
128
],
"dtype": "float16",
"format": "raw",
"nbytes": 1048576,
"byteOffset": 8388608
},
{
"name": "model.layers.1.input_layernorm.weight",
"shape": [
4096
],
"dtype": "float16",
"format": "raw",
"nbytes": 8192,
"byteOffset": 9437184
},
{
"name": "model.layers.1.mlp.down_proj.q_scale",
"shape": [
4096,
448
],
"dtype": "float16",
"format": "raw",
"nbytes": 3670016,
"byteOffset": 9445376
},
{
"name": "model.layers.1.mlp.gate_up_proj.q_scale",
"shape": [
28672,
128
],
"dtype": "float16",
"format": "raw",
"nbytes": 7340032,
"byteOffset": 13115392
},
{
"name": "model.layers.1.post_attention_layernorm.weight",
"shape": [
4096
],
"dtype": "float16",
"format": "raw",
"nbytes": 8192,
"byteOffset": 20455424
},
{
"name": "model.layers.1.self_attn.qkv_proj.q_weight",
"shape": [
6144,
512
],
"dtype": "uint32",
"format": "raw",
"nbytes": 12582912,
"byteOffset": 20463616
}
],
"md5sum": "cb62e4b23ab736f889f243e26fc43f97"
},
{
"dataPath": "params_shard_40.bin",
"format": "raw-shard",
"nbytes": 29360128,
"records": [
{
"name": "model.layers.10.mlp.down_proj.q_weight",
"shape": [
4096,
1792
],
"dtype": "uint32",
"format": "raw",
"nbytes": 29360128,
"byteOffset": 0
}
],
"md5sum": "f609f54e01cc072a5862a6ed78ceaf27"
},
{
"dataPath": "params_shard_41.bin",
"format": "raw-shard",
"nbytes": 58720256,
"records": [
{
"name": "model.layers.10.mlp.gate_up_proj.q_weight",
"shape": [
28672,
512
],
"dtype": "uint32",
"format": "raw",
"nbytes": 58720256,
"byteOffset": 0
}
],
"md5sum": "40bb367132b9c9ef2d74a951ff89a30d"
},
{
"dataPath": "params_shard_42.bin",
"format": "raw-shard",
"nbytes": 22036480,
"records": [
{
"name": "model.layers.1.self_attn.qkv_proj.q_scale",
"shape": [
6144,
128
],
"dtype": "float16",
"format": "raw",
"nbytes": 1572864,
"byteOffset": 0
},
{
"name": "model.layers.1.self_attn.o_proj.q_weight",
"shape": [
4096,
512
],
"dtype": "uint32",
"format": "raw",
"nbytes": 8388608,
"byteOffset": 1572864
},
{
"name": "model.layers.1.self_attn.o_proj.q_scale",
"shape": [
4096,
128
],
"dtype": "float16",
"format": "raw",
"nbytes": 1048576,
"byteOffset": 9961472
},
{
"name": "model.layers.10.input_layernorm.weight",
"shape": [
4096
],
"dtype": "float16",
"format": "raw",
"nbytes": 8192,
"byteOffset": 11010048
},
{
"name": "model.layers.10.mlp.down_proj.q_scale",
"shape": [
4096,
448
],
"dtype": "float16",
"format": "raw",
"nbytes": 3670016,
"byteOffset": 11018240
},
{
"name": "model.layers.10.mlp.gate_up_proj.q_scale",
"shape": [
28672,
128
],
"dtype": "float16",
"format": "raw",
"nbytes": 7340032,
"byteOffset": 14688256
},
{
"name": "model.layers.10.post_attention_layernorm.weight",
"shape": [
4096
],
"dtype": "float16",
"format": "raw",
"nbytes": 8192,
"byteOffset": 22028288
}
],
"md5sum": "9942c01314cde45577415df5745a368d"
},
{
"dataPath": "params_shard_43.bin",
"format": "raw-shard",
"nbytes": 29360128,
"records": [
{
"name": "model.layers.11.mlp.down_proj.q_weight",
"shape": [
4096,
1792
],
"dtype": "uint32",
"format": "raw",
"nbytes": 29360128,
"byteOffset": 0
}
],
"md5sum": "e693bb0769fe1b3533b8db781be16b5d"
},
{
"dataPath": "params_shard_44.bin",
"format": "raw-shard",
"nbytes": 58720256,
"records": [
{
"name": "model.layers.11.mlp.gate_up_proj.q_weight",
"shape": [
28672,
512
],
"dtype": "uint32",
"format": "raw",
"nbytes": 58720256,
"byteOffset": 0
}
],
"md5sum": "260c9c2fc293e3eedbff2bd181a9df89"
},
{
"dataPath": "params_shard_45.bin",
"format": "raw-shard",
"nbytes": 27271168,
"records": [
{
"name": "model.layers.10.self_attn.qkv_proj.q_weight",
"shape": [
6144,
512
],
"dtype": "uint32",
"format": "raw",
"nbytes": 12582912,
"byteOffset": 0
},
{
"name": "model.layers.10.self_attn.qkv_proj.q_scale",
"shape": [
6144,
128
],
"dtype": "float16",
"format": "raw",
"nbytes": 1572864,
"byteOffset": 12582912
},
{
"name": "model.layers.10.self_attn.o_proj.q_weight",
"shape": [
4096,
512
],
"dtype": "uint32",
"format": "raw",
"nbytes": 8388608,
"byteOffset": 14155776
},
{
"name": "model.layers.10.self_attn.o_proj.q_scale",
"shape": [
4096,
128
],
"dtype": "float16",
"format": "raw",
"nbytes": 1048576,
"byteOffset": 22544384
},
{
"name": "model.layers.11.input_layernorm.weight",
"shape": [
4096
],
"dtype": "float16",
"format": "raw",
"nbytes": 8192,
"byteOffset": 23592960
},
{
"name": "model.layers.11.mlp.down_proj.q_scale",
"shape": [
4096,
448
],
"dtype": "float16",
"format": "raw",
"nbytes": 3670016,
"byteOffset": 23601152
}
],
"md5sum": "23c8c598a862152573aabc7e005f243d"
},
{
"dataPath": "params_shard_46.bin",
"format": "raw-shard",
"nbytes": 29360128,
"records": [
{
"name": "model.layers.12.mlp.down_proj.q_weight",
"shape": [
4096,
1792
],
"dtype": "uint32",
"format": "raw",
"nbytes": 29360128,
"byteOffset": 0
}
],
"md5sum": "89407d45a332deed6dd19cbe0e5a1d2a"
},
{
"dataPath": "params_shard_47.bin",
"format": "raw-shard",
"nbytes": 30949376,
"records": [
{
"name": "model.layers.11.mlp.gate_up_proj.q_scale",
"shape": [
28672,
128
],
"dtype": "float16",
"format": "raw",
"nbytes": 7340032,
"byteOffset": 0
},
{
"name": "model.layers.11.post_attention_layernorm.weight",
"shape": [
4096
],
"dtype": "float16",
"format": "raw",
"nbytes": 8192,
"byteOffset": 7340032
},
{
"name": "model.layers.11.self_attn.qkv_proj.q_weight",
"shape": [
6144,
512
],
"dtype": "uint32",
"format": "raw",
"nbytes": 12582912,
"byteOffset": 7348224
},
{
"name": "model.layers.11.self_attn.qkv_proj.q_scale",
"shape": [
6144,
128
],
"dtype": "float16",
"format": "raw",
"nbytes": 1572864,
"byteOffset": 19931136
},
{
"name": "model.layers.11.self_attn.o_proj.q_weight",
"shape": [
4096,
512
],
"dtype": "uint32",
"format": "raw",
"nbytes": 8388608,
"byteOffset": 21504000
},
{
"name": "model.layers.11.self_attn.o_proj.q_scale",
"shape": [
4096,
128
],
"dtype": "float16",
"format": "raw",
"nbytes": 1048576,
"byteOffset": 29892608
},
{
"name": "model.layers.12.input_layernorm.weight",
"shape": [
4096
],
"dtype": "float16",
"format": "raw",
"nbytes": 8192,
"byteOffset": 30941184
}
],
"md5sum": "a7316951de7f780d9b1775c5e70ea072"
},
{
"dataPath": "params_shard_48.bin",
"format": "raw-shard",
"nbytes": 58720256,
"records": [
{
"name": "model.layers.12.mlp.gate_up_proj.q_weight",
"shape": [
28672,
512
],
"dtype": "uint32",
"format": "raw",
"nbytes": 58720256,
"byteOffset": 0
}
],
"md5sum": "4427080eaf9643b685a3b19b0e37498b"
},
{
"dataPath": "params_shard_49.bin",
"format": "raw-shard",
"nbytes": 25174016,
"records": [
{
"name": "model.layers.12.mlp.down_proj.q_scale",
"shape": [
4096,
448
],
"dtype": "float16",
"format": "raw",
"nbytes": 3670016,
"byteOffset": 0
},
{
"name": "model.layers.12.mlp.gate_up_proj.q_scale",
"shape": [
28672,
128
],
"dtype": "float16",
"format": "raw",
"nbytes": 7340032,
"byteOffset": 3670016
},
{
"name": "model.layers.12.post_attention_layernorm.weight",
"shape": [
4096
],
"dtype": "float16",
"format": "raw",
"nbytes": 8192,
"byteOffset": 11010048
},
{
"name": "model.layers.12.self_attn.qkv_proj.q_weight",
"shape": [
6144,
512
],
"dtype": "uint32",
"format": "raw",
"nbytes": 12582912,
"byteOffset": 11018240
},
{
"name": "model.layers.12.self_attn.qkv_proj.q_scale",
"shape": [
6144,
128
],
"dtype": "float16",
"format": "raw",
"nbytes": 1572864,
"byteOffset": 23601152
}
],
"md5sum": "27ba72e3db245abeef0c5b4137b3e6c6"
},
{
"dataPath": "params_shard_50.bin",
"format": "raw-shard",
"nbytes": 29360128,
"records": [
{
"name": "model.layers.13.mlp.down_proj.q_weight",
"shape": [
4096,
1792
],
"dtype": "uint32",
"format": "raw",
"nbytes": 29360128,
"byteOffset": 0
}
],
"md5sum": "ed03b3545dceb7ad00a9f02d7c309171"
},
{
"dataPath": "params_shard_51.bin",
"format": "raw-shard",
"nbytes": 58720256,
"records": [
{
"name": "model.layers.13.mlp.gate_up_proj.q_weight",
"shape": [
28672,
512
],
"dtype": "uint32",
"format": "raw",
"nbytes": 58720256,
"byteOffset": 0
}
],
"md5sum": "d2ca46460aac82842091e590f792b55e"
},
{
"dataPath": "params_shard_52.bin",
"format": "raw-shard",
"nbytes": 33046528,
"records": [
{
"name": "model.layers.12.self_attn.o_proj.q_weight",
"shape": [
4096,
512
],
"dtype": "uint32",
"format": "raw",
"nbytes": 8388608,
"byteOffset": 0
},
{
"name": "model.layers.12.self_attn.o_proj.q_scale",
"shape": [
4096,
128
],
"dtype": "float16",
"format": "raw",
"nbytes": 1048576,
"byteOffset": 8388608
},
{
"name": "model.layers.13.input_layernorm.weight",
"shape": [
4096
],
"dtype": "float16",
"format": "raw",
"nbytes": 8192,
"byteOffset": 9437184
},
{
"name": "model.layers.13.mlp.down_proj.q_scale",
"shape": [
4096,
448
],
"dtype": "float16",
"format": "raw",
"nbytes": 3670016,
"byteOffset": 9445376
},
{
"name": "model.layers.13.mlp.gate_up_proj.q_scale",
"shape": [
28672,
128
],
"dtype": "float16",
"format": "raw",
"nbytes": 7340032,
"byteOffset": 13115392
},
{
"name": "model.layers.13.post_attention_layernorm.weight",
"shape": [
4096
],
"dtype": "float16",
"format": "raw",
"nbytes": 8192,
"byteOffset": 20455424
},
{
"name": "model.layers.13.self_attn.qkv_proj.q_weight",
"shape": [
6144,
512
],
"dtype": "uint32",
"format": "raw",
"nbytes": 12582912,
"byteOffset": 20463616
}
],
"md5sum": "80d24d34a5ba89ef986d961d55393a71"
},
{
"dataPath": "params_shard_53.bin",
"format": "raw-shard",
"nbytes": 29360128,
"records": [
{
"name": "model.layers.14.mlp.down_proj.q_weight",
"shape": [
4096,
1792
],
"dtype": "uint32",
"format": "raw",
"nbytes": 29360128,
"byteOffset": 0
}
],
"md5sum": "869b1de05b330ec4322c921a321a1146"
},
{
"dataPath": "params_shard_54.bin",
"format": "raw-shard",
"nbytes": 58720256,
"records": [
{
"name": "model.layers.14.mlp.gate_up_proj.q_weight",
"shape": [
28672,
512
],
"dtype": "uint32",
"format": "raw",
"nbytes": 58720256,
"byteOffset": 0
}
],
"md5sum": "586be56b53483778bb27e9df8c7cf0e7"
},
{
"dataPath": "params_shard_55.bin",
"format": "raw-shard",
"nbytes": 22036480,
"records": [
{
"name": "model.layers.13.self_attn.qkv_proj.q_scale",
"shape": [
6144,
128
],
"dtype": "float16",
"format": "raw",
"nbytes": 1572864,
"byteOffset": 0
},
{
"name": "model.layers.13.self_attn.o_proj.q_weight",
"shape": [
4096,
512
],
"dtype": "uint32",
"format": "raw",
"nbytes": 8388608,
"byteOffset": 1572864
},
{
"name": "model.layers.13.self_attn.o_proj.q_scale",
"shape": [
4096,
128
],
"dtype": "float16",
"format": "raw",
"nbytes": 1048576,
"byteOffset": 9961472
},
{
"name": "model.layers.14.input_layernorm.weight",
"shape": [
4096
],
"dtype": "float16",
"format": "raw",
"nbytes": 8192,
"byteOffset": 11010048
},
{
"name": "model.layers.14.mlp.down_proj.q_scale",
"shape": [
4096,
448
],
"dtype": "float16",
"format": "raw",
"nbytes": 3670016,
"byteOffset": 11018240
},
{
"name": "model.layers.14.mlp.gate_up_proj.q_scale",
"shape": [
28672,
128
],
"dtype": "float16",
"format": "raw",
"nbytes": 7340032,
"byteOffset": 14688256
},
{
"name": "model.layers.14.post_attention_layernorm.weight",
"shape": [
4096
],
"dtype": "float16",
"format": "raw",
"nbytes": 8192,
"byteOffset": 22028288
}
],
"md5sum": "a36f2d501aa67d5046111d41f3c4b78e"
},
{
"dataPath": "params_shard_56.bin",
"format": "raw-shard",
"nbytes": 29360128,
"records": [
{
"name": "model.layers.15.mlp.down_proj.q_weight",
"shape": [
4096,
1792
],
"dtype": "uint32",
"format": "raw",
"nbytes": 29360128,
"byteOffset": 0
}
],
"md5sum": "1e8103031daf94c11666d092e7aa2a4a"
},
{
"dataPath": "params_shard_57.bin",
"format": "raw-shard",
"nbytes": 58720256,
"records": [
{
"name": "model.layers.15.mlp.gate_up_proj.q_weight",
"shape": [
28672,
512
],
"dtype": "uint32",
"format": "raw",
"nbytes": 58720256,
"byteOffset": 0
}
],
"md5sum": "57dea35b819ddd507b792c9e940fa8b9"
},
{
"dataPath": "params_shard_58.bin",
"format": "raw-shard",
"nbytes": 27271168,
"records": [
{
"name": "model.layers.14.self_attn.qkv_proj.q_weight",
"shape": [
6144,
512
],
"dtype": "uint32",
"format": "raw",
"nbytes": 12582912,
"byteOffset": 0
},
{
"name": "model.layers.14.self_attn.qkv_proj.q_scale",
"shape": [
6144,
128
],
"dtype": "float16",
"format": "raw",
"nbytes": 1572864,
"byteOffset": 12582912
},
{
"name": "model.layers.14.self_attn.o_proj.q_weight",
"shape": [
4096,
512
],
"dtype": "uint32",
"format": "raw",
"nbytes": 8388608,
"byteOffset": 14155776
},
{
"name": "model.layers.14.self_attn.o_proj.q_scale",
"shape": [
4096,
128
],
"dtype": "float16",
"format": "raw",
"nbytes": 1048576,
"byteOffset": 22544384
},
{
"name": "model.layers.15.input_layernorm.weight",
"shape": [
4096
],
"dtype": "float16",
"format": "raw",
"nbytes": 8192,
"byteOffset": 23592960
},
{
"name": "model.layers.15.mlp.down_proj.q_scale",
"shape": [
4096,
448
],
"dtype": "float16",
"format": "raw",
"nbytes": 3670016,
"byteOffset": 23601152
}
],
"md5sum": "1b9b02b031402af5c09db16cc762e190"
},
{
"dataPath": "params_shard_59.bin",
"format": "raw-shard",
"nbytes": 29360128,
"records": [
{
"name": "model.layers.16.mlp.down_proj.q_weight",
"shape": [
4096,
1792
],
"dtype": "uint32",
"format": "raw",
"nbytes": 29360128,
"byteOffset": 0
}
],
"md5sum": "e8b1d6b16d31e524781fbe595a9e3689"
},
{
"dataPath": "params_shard_60.bin",
"format": "raw-shard",
"nbytes": 30949376,
"records": [
{
"name": "model.layers.15.mlp.gate_up_proj.q_scale",
"shape": [
28672,
128
],
"dtype": "float16",
"format": "raw",
"nbytes": 7340032,
"byteOffset": 0
},
{
"name": "model.layers.15.post_attention_layernorm.weight",
"shape": [
4096
],
"dtype": "float16",
"format": "raw",
"nbytes": 8192,
"byteOffset": 7340032
},
{
"name": "model.layers.15.self_attn.qkv_proj.q_weight",
"shape": [
6144,
512
],
"dtype": "uint32",
"format": "raw",
"nbytes": 12582912,
"byteOffset": 7348224
},
{
"name": "model.layers.15.self_attn.qkv_proj.q_scale",
"shape": [
6144,
128
],
"dtype": "float16",
"format": "raw",
"nbytes": 1572864,
"byteOffset": 19931136
},
{
"name": "model.layers.15.self_attn.o_proj.q_weight",
"shape": [
4096,
512
],
"dtype": "uint32",
"format": "raw",
"nbytes": 8388608,
"byteOffset": 21504000
},
{
"name": "model.layers.15.self_attn.o_proj.q_scale",
"shape": [
4096,
128
],
"dtype": "float16",
"format": "raw",
"nbytes": 1048576,
"byteOffset": 29892608
},
{
"name": "model.layers.16.input_layernorm.weight",
"shape": [
4096
],
"dtype": "float16",
"format": "raw",
"nbytes": 8192,
"byteOffset": 30941184
}
],
"md5sum": "63ae96d6331a33db476e8c87eea2d289"
},
{
"dataPath": "params_shard_61.bin",
"format": "raw-shard",
"nbytes": 58720256,
"records": [
{
"name": "model.layers.16.mlp.gate_up_proj.q_weight",
"shape": [
28672,
512
],
"dtype": "uint32",
"format": "raw",
"nbytes": 58720256,
"byteOffset": 0
}
],
"md5sum": "b23e49a578f8bcf3f178c755d14cee61"
},
{
"dataPath": "params_shard_62.bin",
"format": "raw-shard",
"nbytes": 25174016,
"records": [
{
"name": "model.layers.16.mlp.down_proj.q_scale",
"shape": [
4096,
448
],
"dtype": "float16",
"format": "raw",
"nbytes": 3670016,
"byteOffset": 0
},
{
"name": "model.layers.16.mlp.gate_up_proj.q_scale",
"shape": [
28672,
128
],
"dtype": "float16",
"format": "raw",
"nbytes": 7340032,
"byteOffset": 3670016
},
{
"name": "model.layers.16.post_attention_layernorm.weight",
"shape": [
4096
],
"dtype": "float16",
"format": "raw",
"nbytes": 8192,
"byteOffset": 11010048
},
{
"name": "model.layers.16.self_attn.qkv_proj.q_weight",
"shape": [
6144,
512
],
"dtype": "uint32",
"format": "raw",
"nbytes": 12582912,
"byteOffset": 11018240
},
{
"name": "model.layers.16.self_attn.qkv_proj.q_scale",
"shape": [
6144,
128
],
"dtype": "float16",
"format": "raw",
"nbytes": 1572864,
"byteOffset": 23601152
}
],
"md5sum": "79bef92f4688d86e53154072c3056bbf"
},
{
"dataPath": "params_shard_63.bin",
"format": "raw-shard",
"nbytes": 29360128,
"records": [
{
"name": "model.layers.17.mlp.down_proj.q_weight",
"shape": [
4096,
1792
],
"dtype": "uint32",
"format": "raw",
"nbytes": 29360128,
"byteOffset": 0
}
],
"md5sum": "12475d183dae409a480f6c29015e8a88"
},
{
"dataPath": "params_shard_64.bin",
"format": "raw-shard",
"nbytes": 58720256,
"records": [
{
"name": "model.layers.17.mlp.gate_up_proj.q_weight",
"shape": [
28672,
512
],
"dtype": "uint32",
"format": "raw",
"nbytes": 58720256,
"byteOffset": 0
}
],
"md5sum": "98176052672ad4d3a27a26621dd23222"
},
{
"dataPath": "params_shard_65.bin",
"format": "raw-shard",
"nbytes": 33046528,
"records": [
{
"name": "model.layers.16.self_attn.o_proj.q_weight",
"shape": [
4096,
512
],
"dtype": "uint32",
"format": "raw",
"nbytes": 8388608,
"byteOffset": 0
},
{
"name": "model.layers.16.self_attn.o_proj.q_scale",
"shape": [
4096,
128
],
"dtype": "float16",
"format": "raw",
"nbytes": 1048576,
"byteOffset": 8388608
},
{
"name": "model.layers.17.input_layernorm.weight",
"shape": [
4096
],
"dtype": "float16",
"format": "raw",
"nbytes": 8192,
"byteOffset": 9437184
},
{
"name": "model.layers.17.mlp.down_proj.q_scale",
"shape": [
4096,
448
],
"dtype": "float16",
"format": "raw",
"nbytes": 3670016,
"byteOffset": 9445376
},
{
"name": "model.layers.17.mlp.gate_up_proj.q_scale",
"shape": [
28672,
128
],
"dtype": "float16",
"format": "raw",
"nbytes": 7340032,
"byteOffset": 13115392
},
{
"name": "model.layers.17.post_attention_layernorm.weight",
"shape": [
4096
],
"dtype": "float16",
"format": "raw",
"nbytes": 8192,
"byteOffset": 20455424
},
{
"name": "model.layers.17.self_attn.qkv_proj.q_weight",
"shape": [
6144,
512
],
"dtype": "uint32",
"format": "raw",
"nbytes": 12582912,
"byteOffset": 20463616
}
],
"md5sum": "0c8d32771a94131dd499d5e4472613b9"
},
{
"dataPath": "params_shard_66.bin",
"format": "raw-shard",
"nbytes": 29360128,
"records": [
{
"name": "model.layers.18.mlp.down_proj.q_weight",
"shape": [
4096,
1792
],
"dtype": "uint32",
"format": "raw",
"nbytes": 29360128,
"byteOffset": 0
}
],
"md5sum": "df9e6d812cfe930f294375db6f63b5d0"
},
{
"dataPath": "params_shard_67.bin",
"format": "raw-shard",
"nbytes": 58720256,
"records": [
{
"name": "model.layers.18.mlp.gate_up_proj.q_weight",
"shape": [
28672,
512
],
"dtype": "uint32",
"format": "raw",
"nbytes": 58720256,
"byteOffset": 0
}
],
"md5sum": "e7781265c1e475fc8fcdfceffc2148d2"
},
{
"dataPath": "params_shard_68.bin",
"format": "raw-shard",
"nbytes": 22036480,
"records": [
{
"name": "model.layers.17.self_attn.qkv_proj.q_scale",
"shape": [
6144,
128
],
"dtype": "float16",
"format": "raw",
"nbytes": 1572864,
"byteOffset": 0
},
{
"name": "model.layers.17.self_attn.o_proj.q_weight",
"shape": [
4096,
512
],
"dtype": "uint32",
"format": "raw",
"nbytes": 8388608,
"byteOffset": 1572864
},
{
"name": "model.layers.17.self_attn.o_proj.q_scale",
"shape": [
4096,
128
],
"dtype": "float16",
"format": "raw",
"nbytes": 1048576,
"byteOffset": 9961472
},
{
"name": "model.layers.18.input_layernorm.weight",
"shape": [
4096
],
"dtype": "float16",
"format": "raw",
"nbytes": 8192,
"byteOffset": 11010048
},
{
"name": "model.layers.18.mlp.down_proj.q_scale",
"shape": [
4096,
448
],
"dtype": "float16",
"format": "raw",
"nbytes": 3670016,
"byteOffset": 11018240
},
{
"name": "model.layers.18.mlp.gate_up_proj.q_scale",
"shape": [
28672,
128
],
"dtype": "float16",
"format": "raw",
"nbytes": 7340032,
"byteOffset": 14688256
},
{
"name": "model.layers.18.post_attention_layernorm.weight",
"shape": [
4096
],
"dtype": "float16",
"format": "raw",
"nbytes": 8192,
"byteOffset": 22028288
}
],
"md5sum": "b50b7e10cb3fb60429ce8b21282f0bc7"
},
{
"dataPath": "params_shard_69.bin",
"format": "raw-shard",
"nbytes": 29360128,
"records": [
{
"name": "model.layers.19.mlp.down_proj.q_weight",
"shape": [
4096,
1792
],
"dtype": "uint32",
"format": "raw",
"nbytes": 29360128,
"byteOffset": 0
}
],
"md5sum": "cabf37daa7505182eedd36c4377980c3"
},
{
"dataPath": "params_shard_70.bin",
"format": "raw-shard",
"nbytes": 58720256,
"records": [
{
"name": "model.layers.19.mlp.gate_up_proj.q_weight",
"shape": [
28672,
512
],
"dtype": "uint32",
"format": "raw",
"nbytes": 58720256,
"byteOffset": 0
}
],
"md5sum": "8256baaab092d1ecda43d30a0a35e66f"
},
{
"dataPath": "params_shard_71.bin",
"format": "raw-shard",
"nbytes": 27271168,
"records": [
{
"name": "model.layers.18.self_attn.qkv_proj.q_weight",
"shape": [
6144,
512
],
"dtype": "uint32",
"format": "raw",
"nbytes": 12582912,
"byteOffset": 0
},
{
"name": "model.layers.18.self_attn.qkv_proj.q_scale",
"shape": [
6144,
128
],
"dtype": "float16",
"format": "raw",
"nbytes": 1572864,
"byteOffset": 12582912
},
{
"name": "model.layers.18.self_attn.o_proj.q_weight",
"shape": [
4096,
512
],
"dtype": "uint32",
"format": "raw",
"nbytes": 8388608,
"byteOffset": 14155776
},
{
"name": "model.layers.18.self_attn.o_proj.q_scale",
"shape": [
4096,
128
],
"dtype": "float16",
"format": "raw",
"nbytes": 1048576,
"byteOffset": 22544384
},
{
"name": "model.layers.19.input_layernorm.weight",
"shape": [
4096
],
"dtype": "float16",
"format": "raw",
"nbytes": 8192,
"byteOffset": 23592960
},
{
"name": "model.layers.19.mlp.down_proj.q_scale",
"shape": [
4096,
448
],
"dtype": "float16",
"format": "raw",
"nbytes": 3670016,
"byteOffset": 23601152
}
],
"md5sum": "f89d6a3c40fc57471ae7b0617c54b7df"
},
{
"dataPath": "params_shard_72.bin",
"format": "raw-shard",
"nbytes": 29360128,
"records": [
{
"name": "model.layers.2.mlp.down_proj.q_weight",
"shape": [
4096,
1792
],
"dtype": "uint32",
"format": "raw",
"nbytes": 29360128,
"byteOffset": 0
}
],
"md5sum": "5f9cd36aa91338caf602ca6a89602eb0"
},
{
"dataPath": "params_shard_73.bin",
"format": "raw-shard",
"nbytes": 30949376,
"records": [
{
"name": "model.layers.19.mlp.gate_up_proj.q_scale",
"shape": [
28672,
128
],
"dtype": "float16",
"format": "raw",
"nbytes": 7340032,
"byteOffset": 0
},
{
"name": "model.layers.19.post_attention_layernorm.weight",
"shape": [
4096
],
"dtype": "float16",
"format": "raw",
"nbytes": 8192,
"byteOffset": 7340032
},
{
"name": "model.layers.19.self_attn.qkv_proj.q_weight",
"shape": [
6144,
512
],
"dtype": "uint32",
"format": "raw",
"nbytes": 12582912,
"byteOffset": 7348224
},
{
"name": "model.layers.19.self_attn.qkv_proj.q_scale",
"shape": [
6144,
128
],
"dtype": "float16",
"format": "raw",
"nbytes": 1572864,
"byteOffset": 19931136
},
{
"name": "model.layers.19.self_attn.o_proj.q_weight",
"shape": [
4096,
512
],
"dtype": "uint32",
"format": "raw",
"nbytes": 8388608,
"byteOffset": 21504000
},
{
"name": "model.layers.19.self_attn.o_proj.q_scale",
"shape": [
4096,
128
],
"dtype": "float16",
"format": "raw",
"nbytes": 1048576,
"byteOffset": 29892608
},
{
"name": "model.layers.2.input_layernorm.weight",
"shape": [
4096
],
"dtype": "float16",
"format": "raw",
"nbytes": 8192,
"byteOffset": 30941184
}
],
"md5sum": "526454df422c4c142965c262fd1c596a"
},
{
"dataPath": "params_shard_74.bin",
"format": "raw-shard",
"nbytes": 58720256,
"records": [
{
"name": "model.layers.2.mlp.gate_up_proj.q_weight",
"shape": [
28672,
512
],
"dtype": "uint32",
"format": "raw",
"nbytes": 58720256,
"byteOffset": 0
}
],
"md5sum": "97a73edde1ec4e6a31c786d6ae2e0fc3"
},
{
"dataPath": "params_shard_75.bin",
"format": "raw-shard",
"nbytes": 25174016,
"records": [
{
"name": "model.layers.2.mlp.down_proj.q_scale",
"shape": [
4096,
448
],
"dtype": "float16",
"format": "raw",
"nbytes": 3670016,
"byteOffset": 0
},
{
"name": "model.layers.2.mlp.gate_up_proj.q_scale",
"shape": [
28672,
128
],
"dtype": "float16",
"format": "raw",
"nbytes": 7340032,
"byteOffset": 3670016
},
{
"name": "model.layers.2.post_attention_layernorm.weight",
"shape": [
4096
],
"dtype": "float16",
"format": "raw",
"nbytes": 8192,
"byteOffset": 11010048
},
{
"name": "model.layers.2.self_attn.qkv_proj.q_weight",
"shape": [
6144,
512
],
"dtype": "uint32",
"format": "raw",
"nbytes": 12582912,
"byteOffset": 11018240
},
{
"name": "model.layers.2.self_attn.qkv_proj.q_scale",
"shape": [
6144,
128
],
"dtype": "float16",
"format": "raw",
"nbytes": 1572864,
"byteOffset": 23601152
}
],
"md5sum": "4328a16926ff2389086fece3daebbf15"
},
{
"dataPath": "params_shard_76.bin",
"format": "raw-shard",
"nbytes": 29360128,
"records": [
{
"name": "model.layers.20.mlp.down_proj.q_weight",
"shape": [
4096,
1792
],
"dtype": "uint32",
"format": "raw",
"nbytes": 29360128,
"byteOffset": 0
}
],
"md5sum": "8b5027968fa9324a7789c83490527f1e"
},
{
"dataPath": "params_shard_77.bin",
"format": "raw-shard",
"nbytes": 58720256,
"records": [
{
"name": "model.layers.20.mlp.gate_up_proj.q_weight",
"shape": [
28672,
512
],
"dtype": "uint32",
"format": "raw",
"nbytes": 58720256,
"byteOffset": 0
}
],
"md5sum": "029c00fe3c5082036b0ada4e3bddb7de"
},
{
"dataPath": "params_shard_78.bin",
"format": "raw-shard",
"nbytes": 33046528,
"records": [
{
"name": "model.layers.2.self_attn.o_proj.q_weight",
"shape": [
4096,
512
],
"dtype": "uint32",
"format": "raw",
"nbytes": 8388608,
"byteOffset": 0
},
{
"name": "model.layers.2.self_attn.o_proj.q_scale",
"shape": [
4096,
128
],
"dtype": "float16",
"format": "raw",
"nbytes": 1048576,
"byteOffset": 8388608
},
{
"name": "model.layers.20.input_layernorm.weight",
"shape": [
4096
],
"dtype": "float16",
"format": "raw",
"nbytes": 8192,
"byteOffset": 9437184
},
{
"name": "model.layers.20.mlp.down_proj.q_scale",
"shape": [
4096,
448
],
"dtype": "float16",
"format": "raw",
"nbytes": 3670016,
"byteOffset": 9445376
},
{
"name": "model.layers.20.mlp.gate_up_proj.q_scale",
"shape": [
28672,
128
],
"dtype": "float16",
"format": "raw",
"nbytes": 7340032,
"byteOffset": 13115392
},
{
"name": "model.layers.20.post_attention_layernorm.weight",
"shape": [
4096
],
"dtype": "float16",
"format": "raw",
"nbytes": 8192,
"byteOffset": 20455424
},
{
"name": "model.layers.20.self_attn.qkv_proj.q_weight",
"shape": [
6144,
512
],
"dtype": "uint32",
"format": "raw",
"nbytes": 12582912,
"byteOffset": 20463616
}
],
"md5sum": "9239fad122fdd50bbd508c2821b58332"
},
{
"dataPath": "params_shard_79.bin",
"format": "raw-shard",
"nbytes": 29360128,
"records": [
{
"name": "model.layers.21.mlp.down_proj.q_weight",
"shape": [
4096,
1792
],
"dtype": "uint32",
"format": "raw",
"nbytes": 29360128,
"byteOffset": 0
}
],
"md5sum": "6cc39882ca9724c12522daf6ddc68c24"
},
{
"dataPath": "params_shard_80.bin",
"format": "raw-shard",
"nbytes": 58720256,
"records": [
{
"name": "model.layers.21.mlp.gate_up_proj.q_weight",
"shape": [
28672,
512
],
"dtype": "uint32",
"format": "raw",
"nbytes": 58720256,
"byteOffset": 0
}
],
"md5sum": "1498a9bff0d2107d5fe7dc6705fc603d"
},
{
"dataPath": "params_shard_81.bin",
"format": "raw-shard",
"nbytes": 22036480,
"records": [
{
"name": "model.layers.20.self_attn.qkv_proj.q_scale",
"shape": [
6144,
128
],
"dtype": "float16",
"format": "raw",
"nbytes": 1572864,
"byteOffset": 0
},
{
"name": "model.layers.20.self_attn.o_proj.q_weight",
"shape": [
4096,
512
],
"dtype": "uint32",
"format": "raw",
"nbytes": 8388608,
"byteOffset": 1572864
},
{
"name": "model.layers.20.self_attn.o_proj.q_scale",
"shape": [
4096,
128
],
"dtype": "float16",
"format": "raw",
"nbytes": 1048576,
"byteOffset": 9961472
},
{
"name": "model.layers.21.input_layernorm.weight",
"shape": [
4096
],
"dtype": "float16",
"format": "raw",
"nbytes": 8192,
"byteOffset": 11010048
},
{
"name": "model.layers.21.mlp.down_proj.q_scale",
"shape": [
4096,
448
],
"dtype": "float16",
"format": "raw",
"nbytes": 3670016,
"byteOffset": 11018240
},
{
"name": "model.layers.21.mlp.gate_up_proj.q_scale",
"shape": [
28672,
128
],
"dtype": "float16",
"format": "raw",
"nbytes": 7340032,
"byteOffset": 14688256
},
{
"name": "model.layers.21.post_attention_layernorm.weight",
"shape": [
4096
],
"dtype": "float16",
"format": "raw",
"nbytes": 8192,
"byteOffset": 22028288
}
],
"md5sum": "c7abda69e082db14bac06ffc3396e84a"
},
{
"dataPath": "params_shard_82.bin",
"format": "raw-shard",
"nbytes": 23592960,
"records": [
{
"name": "model.layers.21.self_attn.qkv_proj.q_weight",
"shape": [
6144,
512
],
"dtype": "uint32",
"format": "raw",
"nbytes": 12582912,
"byteOffset": 0
},
{
"name": "model.layers.21.self_attn.qkv_proj.q_scale",
"shape": [
6144,
128
],
"dtype": "float16",
"format": "raw",
"nbytes": 1572864,
"byteOffset": 12582912
},
{
"name": "model.layers.21.self_attn.o_proj.q_weight",
"shape": [
4096,
512
],
"dtype": "uint32",
"format": "raw",
"nbytes": 8388608,
"byteOffset": 14155776
},
{
"name": "model.layers.21.self_attn.o_proj.q_scale",
"shape": [
4096,
128
],
"dtype": "float16",
"format": "raw",
"nbytes": 1048576,
"byteOffset": 22544384
}
],
"md5sum": "f0e27322bf508bc903276b5426ed8566"
},
{
"dataPath": "params_shard_83.bin",
"format": "raw-shard",
"nbytes": 29360128,
"records": [
{
"name": "model.layers.3.mlp.down_proj.q_weight",
"shape": [
4096,
1792
],
"dtype": "uint32",
"format": "raw",
"nbytes": 29360128,
"byteOffset": 0
}
],
"md5sum": "4a62184b2a582ffe5550f93ef224ccf7"
},
{
"dataPath": "params_shard_84.bin",
"format": "raw-shard",
"nbytes": 58720256,
"records": [
{
"name": "model.layers.3.mlp.gate_up_proj.q_weight",
"shape": [
28672,
512
],
"dtype": "uint32",
"format": "raw",
"nbytes": 58720256,
"byteOffset": 0
}
],
"md5sum": "72030d604350d66187afd0c78ceb0c66"
},
{
"dataPath": "params_shard_85.bin",
"format": "raw-shard",
"nbytes": 27271168,
"records": [
{
"name": "model.layers.22.self_attn.qkv_proj.q_weight",
"shape": [
6144,
512
],
"dtype": "uint32",
"format": "raw",
"nbytes": 12582912,
"byteOffset": 0
},
{
"name": "model.layers.22.self_attn.qkv_proj.q_scale",
"shape": [
6144,
128
],
"dtype": "float16",
"format": "raw",
"nbytes": 1572864,
"byteOffset": 12582912
},
{
"name": "model.layers.22.self_attn.o_proj.q_weight",
"shape": [
4096,
512
],
"dtype": "uint32",
"format": "raw",
"nbytes": 8388608,
"byteOffset": 14155776
},
{
"name": "model.layers.22.self_attn.o_proj.q_scale",
"shape": [
4096,
128
],
"dtype": "float16",
"format": "raw",
"nbytes": 1048576,
"byteOffset": 22544384
},
{
"name": "model.layers.3.input_layernorm.weight",
"shape": [
4096
],
"dtype": "float16",
"format": "raw",
"nbytes": 8192,
"byteOffset": 23592960
},
{
"name": "model.layers.3.mlp.down_proj.q_scale",
"shape": [
4096,
448
],
"dtype": "float16",
"format": "raw",
"nbytes": 3670016,
"byteOffset": 23601152
}
],
"md5sum": "6919a3c3b0044d09a42d145f48048d00"
},
{
"dataPath": "params_shard_86.bin",
"format": "raw-shard",
"nbytes": 29360128,
"records": [
{
"name": "model.layers.4.mlp.down_proj.q_weight",
"shape": [
4096,
1792
],
"dtype": "uint32",
"format": "raw",
"nbytes": 29360128,
"byteOffset": 0
}
],
"md5sum": "a6da7de15cce6bf116a0c020a8e34aee"
},
{
"dataPath": "params_shard_87.bin",
"format": "raw-shard",
"nbytes": 30949376,
"records": [
{
"name": "model.layers.3.mlp.gate_up_proj.q_scale",
"shape": [
28672,
128
],
"dtype": "float16",
"format": "raw",
"nbytes": 7340032,
"byteOffset": 0
},
{
"name": "model.layers.3.post_attention_layernorm.weight",
"shape": [
4096
],
"dtype": "float16",
"format": "raw",
"nbytes": 8192,
"byteOffset": 7340032
},
{
"name": "model.layers.3.self_attn.qkv_proj.q_weight",
"shape": [
6144,
512
],
"dtype": "uint32",
"format": "raw",
"nbytes": 12582912,
"byteOffset": 7348224
},
{
"name": "model.layers.3.self_attn.qkv_proj.q_scale",
"shape": [
6144,
128
],
"dtype": "float16",
"format": "raw",
"nbytes": 1572864,
"byteOffset": 19931136
},
{
"name": "model.layers.3.self_attn.o_proj.q_weight",
"shape": [
4096,
512
],
"dtype": "uint32",
"format": "raw",
"nbytes": 8388608,
"byteOffset": 21504000
},
{
"name": "model.layers.3.self_attn.o_proj.q_scale",
"shape": [
4096,
128
],
"dtype": "float16",
"format": "raw",
"nbytes": 1048576,
"byteOffset": 29892608
},
{
"name": "model.layers.4.input_layernorm.weight",
"shape": [
4096
],
"dtype": "float16",
"format": "raw",
"nbytes": 8192,
"byteOffset": 30941184
}
],
"md5sum": "2b9541bbdcdd65783b47db17f41bc778"
},
{
"dataPath": "params_shard_88.bin",
"format": "raw-shard",
"nbytes": 58720256,
"records": [
{
"name": "model.layers.4.mlp.gate_up_proj.q_weight",
"shape": [
28672,
512
],
"dtype": "uint32",
"format": "raw",
"nbytes": 58720256,
"byteOffset": 0
}
],
"md5sum": "92da920e2090dc542dd6a2174d249ad7"
},
{
"dataPath": "params_shard_89.bin",
"format": "raw-shard",
"nbytes": 25174016,
"records": [
{
"name": "model.layers.4.mlp.down_proj.q_scale",
"shape": [
4096,
448
],
"dtype": "float16",
"format": "raw",
"nbytes": 3670016,
"byteOffset": 0
},
{
"name": "model.layers.4.mlp.gate_up_proj.q_scale",
"shape": [
28672,
128
],
"dtype": "float16",
"format": "raw",
"nbytes": 7340032,
"byteOffset": 3670016
},
{
"name": "model.layers.4.post_attention_layernorm.weight",
"shape": [
4096
],
"dtype": "float16",
"format": "raw",
"nbytes": 8192,
"byteOffset": 11010048
},
{
"name": "model.layers.4.self_attn.qkv_proj.q_weight",
"shape": [
6144,
512
],
"dtype": "uint32",
"format": "raw",
"nbytes": 12582912,
"byteOffset": 11018240
},
{
"name": "model.layers.4.self_attn.qkv_proj.q_scale",
"shape": [
6144,
128
],
"dtype": "float16",
"format": "raw",
"nbytes": 1572864,
"byteOffset": 23601152
}
],
"md5sum": "c324013a37bc7f161ae10b1757bf1fc2"
},
{
"dataPath": "params_shard_90.bin",
"format": "raw-shard",
"nbytes": 29360128,
"records": [
{
"name": "model.layers.5.mlp.down_proj.q_weight",
"shape": [
4096,
1792
],
"dtype": "uint32",
"format": "raw",
"nbytes": 29360128,
"byteOffset": 0
}
],
"md5sum": "b4066cf4673ec6511465ae6176973aac"
},
{
"dataPath": "params_shard_91.bin",
"format": "raw-shard",
"nbytes": 58720256,
"records": [
{
"name": "model.layers.5.mlp.gate_up_proj.q_weight",
"shape": [
28672,
512
],
"dtype": "uint32",
"format": "raw",
"nbytes": 58720256,
"byteOffset": 0
}
],
"md5sum": "cc558b4e5b9795954cc900dbda5a358d"
},
{
"dataPath": "params_shard_92.bin",
"format": "raw-shard",
"nbytes": 33046528,
"records": [
{
"name": "model.layers.4.self_attn.o_proj.q_weight",
"shape": [
4096,
512
],
"dtype": "uint32",
"format": "raw",
"nbytes": 8388608,
"byteOffset": 0
},
{
"name": "model.layers.4.self_attn.o_proj.q_scale",
"shape": [
4096,
128
],
"dtype": "float16",
"format": "raw",
"nbytes": 1048576,
"byteOffset": 8388608
},
{
"name": "model.layers.5.input_layernorm.weight",
"shape": [
4096
],
"dtype": "float16",
"format": "raw",
"nbytes": 8192,
"byteOffset": 9437184
},
{
"name": "model.layers.5.mlp.down_proj.q_scale",
"shape": [
4096,
448
],
"dtype": "float16",
"format": "raw",
"nbytes": 3670016,
"byteOffset": 9445376
},
{
"name": "model.layers.5.mlp.gate_up_proj.q_scale",
"shape": [
28672,
128
],
"dtype": "float16",
"format": "raw",
"nbytes": 7340032,
"byteOffset": 13115392
},
{
"name": "model.layers.5.post_attention_layernorm.weight",
"shape": [
4096
],
"dtype": "float16",
"format": "raw",
"nbytes": 8192,
"byteOffset": 20455424
},
{
"name": "model.layers.5.self_attn.qkv_proj.q_weight",
"shape": [
6144,
512
],
"dtype": "uint32",
"format": "raw",
"nbytes": 12582912,
"byteOffset": 20463616
}
],
"md5sum": "bb2b703fb7ac16fb197dfb67c50e78b6"
},
{
"dataPath": "params_shard_93.bin",
"format": "raw-shard",
"nbytes": 29360128,
"records": [
{
"name": "model.layers.6.mlp.down_proj.q_weight",
"shape": [
4096,
1792
],
"dtype": "uint32",
"format": "raw",
"nbytes": 29360128,
"byteOffset": 0
}
],
"md5sum": "280140ad523e015cb5fc35506073cf0b"
},
{
"dataPath": "params_shard_94.bin",
"format": "raw-shard",
"nbytes": 58720256,
"records": [
{
"name": "model.layers.6.mlp.gate_up_proj.q_weight",
"shape": [
28672,
512
],
"dtype": "uint32",
"format": "raw",
"nbytes": 58720256,
"byteOffset": 0
}
],
"md5sum": "3bac232cd08b566134e1b4ab6fd70d67"
},
{
"dataPath": "params_shard_95.bin",
"format": "raw-shard",
"nbytes": 22036480,
"records": [
{
"name": "model.layers.5.self_attn.qkv_proj.q_scale",
"shape": [
6144,
128
],
"dtype": "float16",
"format": "raw",
"nbytes": 1572864,
"byteOffset": 0
},
{
"name": "model.layers.5.self_attn.o_proj.q_weight",
"shape": [
4096,
512
],
"dtype": "uint32",
"format": "raw",
"nbytes": 8388608,
"byteOffset": 1572864
},
{
"name": "model.layers.5.self_attn.o_proj.q_scale",
"shape": [
4096,
128
],
"dtype": "float16",
"format": "raw",
"nbytes": 1048576,
"byteOffset": 9961472
},
{
"name": "model.layers.6.input_layernorm.weight",
"shape": [
4096
],
"dtype": "float16",
"format": "raw",
"nbytes": 8192,
"byteOffset": 11010048
},
{
"name": "model.layers.6.mlp.down_proj.q_scale",
"shape": [
4096,
448
],
"dtype": "float16",
"format": "raw",
"nbytes": 3670016,
"byteOffset": 11018240
},
{
"name": "model.layers.6.mlp.gate_up_proj.q_scale",
"shape": [
28672,
128
],
"dtype": "float16",
"format": "raw",
"nbytes": 7340032,
"byteOffset": 14688256
},
{
"name": "model.layers.6.post_attention_layernorm.weight",
"shape": [
4096
],
"dtype": "float16",
"format": "raw",
"nbytes": 8192,
"byteOffset": 22028288
}
],
"md5sum": "e2e0db0d12573c4c3b863aada1b78e86"
},
{
"dataPath": "params_shard_96.bin",
"format": "raw-shard",
"nbytes": 29360128,
"records": [
{
"name": "model.layers.7.mlp.down_proj.q_weight",
"shape": [
4096,
1792
],
"dtype": "uint32",
"format": "raw",
"nbytes": 29360128,
"byteOffset": 0
}
],
"md5sum": "48e42c122ebaf64491d4ac806007fe3a"
},
{
"dataPath": "params_shard_97.bin",
"format": "raw-shard",
"nbytes": 58720256,
"records": [
{
"name": "model.layers.7.mlp.gate_up_proj.q_weight",
"shape": [
28672,
512
],
"dtype": "uint32",
"format": "raw",
"nbytes": 58720256,
"byteOffset": 0
}
],
"md5sum": "963d79b16e5c087b9ebed963ab80b76b"
},
{
"dataPath": "params_shard_98.bin",
"format": "raw-shard",
"nbytes": 27271168,
"records": [
{
"name": "model.layers.6.self_attn.qkv_proj.q_weight",
"shape": [
6144,
512
],
"dtype": "uint32",
"format": "raw",
"nbytes": 12582912,
"byteOffset": 0
},
{
"name": "model.layers.6.self_attn.qkv_proj.q_scale",
"shape": [
6144,
128
],
"dtype": "float16",
"format": "raw",
"nbytes": 1572864,
"byteOffset": 12582912
},
{
"name": "model.layers.6.self_attn.o_proj.q_weight",
"shape": [
4096,
512
],
"dtype": "uint32",
"format": "raw",
"nbytes": 8388608,
"byteOffset": 14155776
},
{
"name": "model.layers.6.self_attn.o_proj.q_scale",
"shape": [
4096,
128
],
"dtype": "float16",
"format": "raw",
"nbytes": 1048576,
"byteOffset": 22544384
},
{
"name": "model.layers.7.input_layernorm.weight",
"shape": [
4096
],
"dtype": "float16",
"format": "raw",
"nbytes": 8192,
"byteOffset": 23592960
},
{
"name": "model.layers.7.mlp.down_proj.q_scale",
"shape": [
4096,
448
],
"dtype": "float16",
"format": "raw",
"nbytes": 3670016,
"byteOffset": 23601152
}
],
"md5sum": "fc3004251cc2f1f52f94a8bd748a00ff"
},
{
"dataPath": "params_shard_99.bin",
"format": "raw-shard",
"nbytes": 29360128,
"records": [
{
"name": "model.layers.8.mlp.down_proj.q_weight",
"shape": [
4096,
1792
],
"dtype": "uint32",
"format": "raw",
"nbytes": 29360128,
"byteOffset": 0
}
],
"md5sum": "6adb4794ac087dc040cd16aa6ba352ef"
},
{
"dataPath": "params_shard_100.bin",
"format": "raw-shard",
"nbytes": 30949376,
"records": [
{
"name": "model.layers.7.mlp.gate_up_proj.q_scale",
"shape": [
28672,
128
],
"dtype": "float16",
"format": "raw",
"nbytes": 7340032,
"byteOffset": 0
},
{
"name": "model.layers.7.post_attention_layernorm.weight",
"shape": [
4096
],
"dtype": "float16",
"format": "raw",
"nbytes": 8192,
"byteOffset": 7340032
},
{
"name": "model.layers.7.self_attn.qkv_proj.q_weight",
"shape": [
6144,
512
],
"dtype": "uint32",
"format": "raw",
"nbytes": 12582912,
"byteOffset": 7348224
},
{
"name": "model.layers.7.self_attn.qkv_proj.q_scale",
"shape": [
6144,
128
],
"dtype": "float16",
"format": "raw",
"nbytes": 1572864,
"byteOffset": 19931136
},
{
"name": "model.layers.7.self_attn.o_proj.q_weight",
"shape": [
4096,
512
],
"dtype": "uint32",
"format": "raw",
"nbytes": 8388608,
"byteOffset": 21504000
},
{
"name": "model.layers.7.self_attn.o_proj.q_scale",
"shape": [
4096,
128
],
"dtype": "float16",
"format": "raw",
"nbytes": 1048576,
"byteOffset": 29892608
},
{
"name": "model.layers.8.input_layernorm.weight",
"shape": [
4096
],
"dtype": "float16",
"format": "raw",
"nbytes": 8192,
"byteOffset": 30941184
}
],
"md5sum": "4dbbf02a2c533967bc6b2e48a497807f"
},
{
"dataPath": "params_shard_101.bin",
"format": "raw-shard",
"nbytes": 58720256,
"records": [
{
"name": "model.layers.8.mlp.gate_up_proj.q_weight",
"shape": [
28672,
512
],
"dtype": "uint32",
"format": "raw",
"nbytes": 58720256,
"byteOffset": 0
}
],
"md5sum": "458e7bf75184ed1fafa3650186f63243"
},
{
"dataPath": "params_shard_102.bin",
"format": "raw-shard",
"nbytes": 25174016,
"records": [
{
"name": "model.layers.8.mlp.down_proj.q_scale",
"shape": [
4096,
448
],
"dtype": "float16",
"format": "raw",
"nbytes": 3670016,
"byteOffset": 0
},
{
"name": "model.layers.8.mlp.gate_up_proj.q_scale",
"shape": [
28672,
128
],
"dtype": "float16",
"format": "raw",
"nbytes": 7340032,
"byteOffset": 3670016
},
{
"name": "model.layers.8.post_attention_layernorm.weight",
"shape": [
4096
],
"dtype": "float16",
"format": "raw",
"nbytes": 8192,
"byteOffset": 11010048
},
{
"name": "model.layers.8.self_attn.qkv_proj.q_weight",
"shape": [
6144,
512
],
"dtype": "uint32",
"format": "raw",
"nbytes": 12582912,
"byteOffset": 11018240
},
{
"name": "model.layers.8.self_attn.qkv_proj.q_scale",
"shape": [
6144,
128
],
"dtype": "float16",
"format": "raw",
"nbytes": 1572864,
"byteOffset": 23601152
}
],
"md5sum": "dfe9f25118e34b41873deeb53aec790a"
},
{
"dataPath": "params_shard_103.bin",
"format": "raw-shard",
"nbytes": 29360128,
"records": [
{
"name": "model.layers.9.mlp.down_proj.q_weight",
"shape": [
4096,
1792
],
"dtype": "uint32",
"format": "raw",
"nbytes": 29360128,
"byteOffset": 0
}
],
"md5sum": "4fc9eecf9cc1ca061ace45225d24d540"
},
{
"dataPath": "params_shard_104.bin",
"format": "raw-shard",
"nbytes": 58720256,
"records": [
{
"name": "model.layers.9.mlp.gate_up_proj.q_weight",
"shape": [
28672,
512
],
"dtype": "uint32",
"format": "raw",
"nbytes": 58720256,
"byteOffset": 0
}
],
"md5sum": "eb4d88ddadf12ddd9edd6fcec65fd28d"
},
{
"dataPath": "params_shard_105.bin",
"format": "raw-shard",
"nbytes": 33046528,
"records": [
{
"name": "model.layers.8.self_attn.o_proj.q_weight",
"shape": [
4096,
512
],
"dtype": "uint32",
"format": "raw",
"nbytes": 8388608,
"byteOffset": 0
},
{
"name": "model.layers.8.self_attn.o_proj.q_scale",
"shape": [
4096,
128
],
"dtype": "float16",
"format": "raw",
"nbytes": 1048576,
"byteOffset": 8388608
},
{
"name": "model.layers.9.input_layernorm.weight",
"shape": [
4096
],
"dtype": "float16",
"format": "raw",
"nbytes": 8192,
"byteOffset": 9437184
},
{
"name": "model.layers.9.mlp.down_proj.q_scale",
"shape": [
4096,
448
],
"dtype": "float16",
"format": "raw",
"nbytes": 3670016,
"byteOffset": 9445376
},
{
"name": "model.layers.9.mlp.gate_up_proj.q_scale",
"shape": [
28672,
128
],
"dtype": "float16",
"format": "raw",
"nbytes": 7340032,
"byteOffset": 13115392
},
{
"name": "model.layers.9.post_attention_layernorm.weight",
"shape": [
4096
],
"dtype": "float16",
"format": "raw",
"nbytes": 8192,
"byteOffset": 20455424
},
{
"name": "model.layers.9.self_attn.qkv_proj.q_weight",
"shape": [
6144,
512
],
"dtype": "uint32",
"format": "raw",
"nbytes": 12582912,
"byteOffset": 20463616
}
],
"md5sum": "fa119b02defa9ba64894df6418be175c"
},
{
"dataPath": "params_shard_106.bin",
"format": "raw-shard",
"nbytes": 11010048,
"records": [
{
"name": "model.layers.9.self_attn.qkv_proj.q_scale",
"shape": [
6144,
128
],
"dtype": "float16",
"format": "raw",
"nbytes": 1572864,
"byteOffset": 0
},
{
"name": "model.layers.9.self_attn.o_proj.q_weight",
"shape": [
4096,
512
],
"dtype": "uint32",
"format": "raw",
"nbytes": 8388608,
"byteOffset": 1572864
},
{
"name": "model.layers.9.self_attn.o_proj.q_scale",
"shape": [
4096,
128
],
"dtype": "float16",
"format": "raw",
"nbytes": 1048576,
"byteOffset": 9961472
}
],
"md5sum": "9b3cd6b535aa1254db8cd7cb9caf4993"
}
]
}