(model, backend)
| 272 | |
| 273 | |
def get_max_cache_entry(model, backend):
    """Look up the max-cache-entry value for a model/backend pair.

    NOTE(review): the returned floats look like cache ratios in (0, 1],
    but their unit and meaning are not visible here -- confirm with caller.

    Args:
        model: Model name; substring and exact-match rules are applied to
            it. It is not inspected when ``backend`` is ``'pytorch'``.
        backend: Backend name; ``'pytorch'`` short-circuits every
            model-specific rule.

    Returns:
        ``0.8`` for the ``'pytorch'`` backend; otherwise the value of the
        first matching model rule, or ``None`` when no rule matches.
    """
    # The backend check takes precedence over all model-specific rules.
    if backend == 'pytorch':
        return 0.8

    # Substring rules, evaluated in order: the first marker found wins.
    substring_rules = (
        ('Llama-2', 0.95),
        ('internlm2', 0.9),
    )
    for marker, value in substring_rules:
        if marker in model:
            return value

    # These models must match by their full name, not by substring.
    exact_names = ('Qwen/Qwen3-235B-A22B', 'internlm/Intern-S1')
    if model in exact_names:
        return 0.7

    return None
no outgoing calls
no test coverage detected