(updates=None)
| 337 | |
@staticmethod
def get_default_config(updates=None):
    """Build the default configuration, optionally overlaid with overrides.

    Args:
        updates: Optional overrides, in any form the ``ConfigDict``
            constructor accepts. When ``None``, the defaults are returned
            unchanged.

    Returns:
        A ``ConfigDict`` populated with the default values below, with
        ``updates`` merged on top when provided.
    """
    defaults = ConfigDict()

    # Input location and batch geometry.
    defaults.path = ''
    defaults.seq_length = 1024
    defaults.batch_size = 8
    defaults.always_start_with_bos = False

    # Starting position / counters.
    defaults.start_seek_loc = 0
    defaults.example_index_at_start = 0
    defaults.tokens_count_at_start = 0

    # Tokenizer parallelism settings.
    defaults.tokenizer_processes = 1
    defaults.tokenizer_parallel_chunk_size = 32
    defaults.tokenizer_parallel_batch_size = 1024

    # Remaining loader options.
    defaults.throughput_average_window_size = 200
    defaults.pad = False
    defaults.use_data_sharded_loader = True
    defaults.return_local_batch = False

    # Nothing to overlay: hand back the plain defaults.
    if updates is None:
        return defaults

    # Resolve references inside the overrides before merging them in.
    overrides = ConfigDict(updates).copy_and_resolve_references()
    defaults.update(overrides)
    return defaults
| 359 | |
| 360 | def __init__(self, config, tokenizer, text_processor, node_info): |
| 361 | self.config = self.get_default_config(config) |
no outgoing calls
no test coverage detected