MCPcopy
hub / github.com/InternLM/lmdeploy / from_config

Method from_config

lmdeploy/pytorch/config.py:578–625  ·  view source on GitHub ↗
(
        cls,
        method: str,
        num_speculative_tokens: int,
        model: str,
        target_cache_cfg: CacheConfig,
        target_model: str = None,
        dtype: str = 'auto',
        trust_remote_code: bool = False,
        model_format: str = None,
        hf_overrides: dict[str, Any] = None,
        dist_config: DistConfig = None,
    )

Source from the content-addressed store, hash-verified

576
@classmethod
def from_config(
    cls,
    method: str,
    num_speculative_tokens: int,
    model: str,
    target_cache_cfg: CacheConfig,
    target_model: str = None,
    dtype: str = 'auto',
    trust_remote_code: bool = False,
    model_format: str = None,
    hf_overrides: dict[str, Any] = None,
    dist_config: DistConfig = None,
):
    """Create an instance from a speculative method and the target's cache settings.

    Args:
        method: Speculative method name; forwarded to
            ``ModelConfig.from_pretrained`` as ``spec_method`` and stored
            on the returned object.
        num_speculative_tokens: Stored on the returned object unchanged.
        model: Model to load the config from. When falsy, ``target_model``
            is used instead.
        target_cache_cfg: Cache config whose ``block_size`` is passed to
            the model config and whose fields are copied into the new
            cache config.
        target_model: Fallback used when ``model`` is falsy.
        dtype: Forwarded to ``ModelConfig.from_pretrained``.
        trust_remote_code: Forwarded to ``ModelConfig.from_pretrained``.
        model_format: Forwarded to ``ModelConfig.from_pretrained``.
        hf_overrides: Forwarded to ``ModelConfig.from_pretrained``.
        dist_config: Distributed config; a default ``DistConfig()`` is
            created when this is falsy.

    Returns:
        A ``cls`` instance holding the resolved model, the method, the
        model config, the dist config, the token count, and a cache config
        (``None`` when ``method`` is ``'medusa'``).
    """
    if not model:
        model = target_model
    if not dist_config:
        dist_config = DistConfig()

    pretrained_kwargs = dict(
        trust_remote_code=trust_remote_code,
        dtype=dtype,
        dist_config=dist_config,
        is_draft_model=True,
        spec_method=method,
        block_size=target_cache_cfg.block_size,
        model_format=model_format,
        hf_overrides=hf_overrides,
    )
    model_config = ModelConfig.from_pretrained(model, **pretrained_kwargs)

    # Methods listed here are built without a cache config of their own.
    cacheless_methods = ('medusa', )
    if method in cacheless_methods:
        cache_config = None
    else:
        # Copy these settings one-for-one from the target's cache config.
        mirrored_fields = (
            'max_batches',
            'block_size',
            'kernel_block_size',
            'num_cpu_blocks',
            'num_gpu_blocks',
            'cache_max_entry_count',
            'max_prefill_token_num',
            'device_type',
            'quant_policy',
            'migration_backend',
        )
        cache_config = CacheConfig(**{name: getattr(target_cache_cfg, name) for name in mirrored_fields})

    return cls(
        model=model,
        method=method,
        cache_config=cache_config,
        model_config=model_config,
        dist_config=dist_config,
        num_speculative_tokens=num_speculative_tokens,
    )
626
627
628@dataclass

Callers 11

build_modelMethod · 0.45
build_modelMethod · 0.45
build_modelMethod · 0.45
build_modelMethod · 0.45
build_modelMethod · 0.45
build_modelMethod · 0.45
build_modelMethod · 0.45
build_modelMethod · 0.45
build_modelMethod · 0.45
from_pretrainedMethod · 0.45

Calls 3

DistConfigClass · 0.85
CacheConfigClass · 0.85
from_pretrainedMethod · 0.45

Tested by

no test coverage detected