| { | |
| "timestamp": "2025-08-25T11:04:12.307382", | |
| "models": { | |
| "distilbert": { | |
| "model_name": "DistilBERT-base", | |
| "total_parameters": 66362880, | |
| "fp32_size_mb": 253.1896457672119, | |
| "int8_size_mb": 131.71621131896973, | |
| "compression_ratio": 1.9222360196352506, | |
| "quality_preserved_percent": 62.2927248998829, | |
| "fp32_inference_time": 0.4803179340015049, | |
| "int8_inference_time": 0.40977579800528474, | |
| "inference_speedup": 1.1721481267063762, | |
| "passed": false | |
| }, | |
| "bert_tiny": { | |
| "error": "Due to a serious vulnerability issue in `torch.load`, even with `weights_only=True`, we now require users to upgrade torch to at least v2.6 in order to use the function. This version restriction does not apply when loading files with safetensors.\nSee the vulnerability report here https://nvd.nist.gov/vuln/detail/CVE-2025-32434" | |
| }, | |
| "distilgpt2": { | |
| "model_name": "DistilGPT2", | |
| "total_parameters": 81912576, | |
| "fp32_size_mb": 312.4962635040283, | |
| "int8_size_mb": 312.4962635040283, | |
| "compression_ratio": 1.0, | |
| "quality_preserved_percent": 100.0, | |
| "fp32_inference_time": 0.48100979599985294, | |
| "int8_inference_time": 0.3830824960023165, | |
| "inference_speedup": 1.2556297951993722, | |
| "passed": false | |
| } | |
| } | |
| } |