{
  "quantization": {
    "method": "jang-importance",
    "profile": "JANG_3S",
    "target_bits": 3,
    "actual_bits": 3.83,
    "block_size": 64,
    "calibration_method": "activations",
    "quantization_method": "mse-all",
    "scoring_method": "awq+hessian",
    "bit_widths_used": [
      3,
      6
    ],
    "quantization_scheme": "asymmetric",
    "quantization_backend": "mx.quantize",
    "hadamard_rotation": false
  },
  "source_model": {
    "name": "gemma-4-31B-it",
    "dtype": "bfloat16",
    "parameters": "29.2B"
  },
  "architecture": {
    "type": "transformer",
    "attention": "gqa",
    "has_vision": true,
    "has_ssm": false,
    "has_moe": false
  },
  "runtime": {
    "total_weight_bytes": 14690156544,
    "total_weight_gb": 13.68
  },
  "format": "jang",
  "format_version": "2.0"
}