Useful for running inference with quantized models by setting `device_map=get_kbit_device_map()`
()
| 36 | |
| 37 | |
| 38 | def get_kbit_device_map() -> Dict[str, int] | None: |
| 39 | """Useful for running inference with quantized models by setting `device_map=get_kbit_device_map()`. Returns a dict mapping the empty-string key to `get_current_device()` when `torch.cuda.is_available()` is true, otherwise `None`.""" |
| 40 | return {"": get_current_device()} if torch.cuda.is_available() else None |
| 41 | |
| 42 | |
| 43 | def get_quantization_config(model_args: ModelArguments) -> BitsAndBytesConfig | None: |
no test coverage detected