Qwen3.6-27B-PrismaQuant-5.5bit-vllm / mixed_native_manifest.json
rdtand's picture
v5: max-not-sum sibling aggregation, kernel shape mask, joint input_global — validator: ppl=4.16, mean_NLL=1.43, MTP P0=89.5%
09de726 verified
{
"source_model": "/hfcache/hub/models--Qwen--Qwen3.6-27B/snapshots/5d316fa25c3a0b6251198e9e7a94e863a435536a",
"source_recipe": "/work/artifacts/layer_config.json",
"format_histogram": {
"head_passthrough/BF16": 3,
"linear/BF16": 118,
"linear/NVFP4": 354,
"layer_passthrough/BF16": 352,
"linear/MXFP8": 24,
"mtp_linear/NVFP4": 7,
"mtp_passthrough/BF16": 8
},
"n_assignment_entries": 614,
"ignore": [
"lm_head"
]
}