MCPcopy
hub / github.com/HIT-SCIR/ltp / load_dataset

Function load_dataset

python/core/ltp_core/datamodules/utils/datasets.py:6–38  ·  view source on GitHub ↗
(
    builder_cls: type,
    config_name: Optional[str] = None,
    data_dir: Optional[str] = None,
    data_files: Optional[
        Union[str, Sequence[str], Mapping[str, Union[str, Sequence[str]]]]
    ] = None,
    split: Optional[Union[str, Split]] = None,
    cache_dir: Optional[str] = None,
    features: Optional[Features] = None,
    save_infos: bool = False,
    **config_kwargs
)

Source from the content-addressed store, hash-verified

4
5
def load_dataset(
    builder_cls: type,
    config_name: Optional[str] = None,
    data_dir: Optional[str] = None,
    data_files: Optional[
        Union[str, Sequence[str], Mapping[str, Union[str, Sequence[str]]]]
    ] = None,
    split: Optional[Union[str, Split]] = None,
    cache_dir: Optional[str] = None,
    features: Optional[Features] = None,
    save_infos: bool = False,
    **config_kwargs
) -> Union[DatasetDict, Dataset]:
    """Instantiate ``builder_cls``, prepare its data and return the dataset.

    Args:
        builder_cls: Class to instantiate as the dataset builder. It is called
            with keyword arguments only and must provide
            ``download_and_prepare()``, ``as_dataset(split=...)`` and, when
            ``save_infos`` is true, ``_save_infos()``.
        config_name: Forwarded to the builder as ``config_name``.
        data_dir: Forwarded to the builder as ``data_dir``.
        data_files: Forwarded to the builder as ``data_files``.
        split: Forwarded to ``as_dataset``.
        cache_dir: Forwarded to the builder as ``cache_dir``.
        features: Forwarded to the builder as ``features``.
        save_infos: When true, ``_save_infos()`` is called on the builder after
            the dataset has been built.
        **config_kwargs: Extra keyword arguments forwarded to the builder. An
            optional ``hash`` entry is forwarded as the builder's ``hash``
            argument; when absent, ``None`` is passed.

    Returns:
        Whatever ``builder_cls(...).as_dataset(split=split)`` returns.
    """
    # No local named ``hash`` exists in this function, so a bare ``hash=hash``
    # would hand the builder Python's built-in ``hash`` function. Take the
    # value from the caller's keyword arguments instead, defaulting to None.
    builder_hash = config_kwargs.pop("hash", None)

    # Instantiate the dataset builder
    builder_instance: DatasetBuilder = builder_cls(
        cache_dir=cache_dir,
        config_name=config_name,
        data_dir=data_dir,
        data_files=data_files,
        hash=builder_hash,
        features=features,
        **config_kwargs,
    )

    # Download and prepare data
    builder_instance.download_and_prepare()

    # Build dataset for splits
    ds = builder_instance.as_dataset(split=split)
    if save_infos:
        builder_instance._save_infos()

    return ds

Callers 10

main · Function · 0.90
main · Function · 0.90
main · Function · 0.90
build_dataset · Function · 0.90
build_dataset · Function · 0.90
build_dataset · Function · 0.90
build_dataset · Function · 0.90
build_dataset · Function · 0.90
build_dataset · Function · 0.90
build_dataset · Function · 0.90

Calls

no outgoing calls

Tested by

no test coverage detected