{
  "quantization": {
    "method": "jang-importance",
    "profile": "JANG_3M",
    "target_bits": 3,
    "actual_bits": 3.09,
    "block_size": 128,
    "calibration_method": "activations",
    "quantization_method": "mse-all",
    "scoring_method": "awq+hessian",
    "bit_widths_used": [
      3,
      8
    ],
    "quantization_scheme": "asymmetric",
    "quantization_backend": "mx.quantize",
    "hadamard_rotation": false
  },
  "source_model": {
    "name": "Qwen3.5-122B-A10B",
    "dtype": "bfloat16",
    "parameters": "122B"
  },
  "architecture": {
    "type": "hybrid_moe_ssm",
    "attention": "gqa",
    "has_vision": true,
    "has_ssm": true,
    "has_moe": true
  },
  "runtime": {
    "total_weight_bytes": 48127822848,
    "total_weight_gb": 44.82
  },
  "format": "jang",
  "format_version": "2.0"
}