Estimate model weight size in bytes.
Signature: `estimate_weight_bytes(model: ModelInfo, variant: GGUFVariant | None) -> int`
| 66 | |
| 67 | |
def estimate_weight_bytes(model: ModelInfo, variant: GGUFVariant | None) -> int:
    """Estimate model weight size in bytes.

    Args:
        model: Model whose ``id`` and ``parameter_count`` are used when no
            variant is supplied.
        variant: Specific GGUF variant, or ``None``. When given, its
            ``file_size_bytes`` is returned unchanged and ``model`` is not
            consulted.

    Returns:
        ``variant.file_size_bytes`` if a variant is supplied; otherwise
        ``model.parameter_count`` multiplied by a per-weight byte cost looked
        up from the quantization type inferred from ``model.id``, truncated
        to an integer.
    """
    # Compare against None explicitly: a variant object that happens to
    # evaluate falsy must still take precedence over the heuristic below.
    if variant is not None:
        return variant.file_size_bytes

    quant_type = infer_non_gguf_quant_type(model.id)
    # Unknown quantization types fall back to 2.0 bytes per weight
    # (presumably 16-bit weights -- confirm against the lookup table).
    bytes_per_weight = _NON_GGUF_BYTES_PER_WEIGHT.get(quant_type, 2.0)
    return int(model.parameter_count * bytes_per_weight)
| 75 | |
| 76 | |
| 77 | def quant_quality_penalty(model: ModelInfo, variant: GGUFVariant | None) -> float: |