File size: 526 Bytes
7320ff5
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
{
  "timestamp_utc": "2026-02-09T20:38:09.856840+00:00",
  "source_model_dir": "artifacts/medasr-mlx-fp16",
  "output_model_dir": "artifacts/medasr-mlx-int8",
  "quantization": {
    "bits": 8,
    "group_size": 64,
    "mode": "affine",
    "target_modules": "mlx.nn.quantize default predicate (Linear/Embedding layers)"
  },
  "timing": {
    "quantization_time_s": 0.0034
  },
  "size_mb": {
    "source_weights": 200.9,
    "output_weights": 121.108,
    "compression_ratio_x": 1.659,
    "reduction_percent": 39.72
  }
}