(self)
| 38 | self.assertEqual(len(datasets["test"]), 300) |
| 39 | |
def test_loading_data_dict(self):
    """Check split sizes when the dataset mixer uses fractional weights.

    Calls ``get_datasets`` with a mapping of three dataset names to the
    fractions 0.5, 0.3 and 0.2, passing ``columns_to_keep`` as
    ``["prompt", "completion"]``, then asserts that the "train" split has
    100 entries and the "test" split has 300.
    """
    # NOTE(review): presumably the fractions subsample only the train split,
    # which would explain the larger expected test size -- confirm against
    # get_datasets.
    mixer = {
        "HuggingFaceH4/testing_alpaca_small": 0.5,
        "HuggingFaceH4/testing_self_instruct_small": 0.3,
        "HuggingFaceH4/testing_codealpaca_small": 0.2,
    }
    kept_columns = ["prompt", "completion"]
    splits = get_datasets(mixer, columns_to_keep=kept_columns)

    # Checked in the same order as before: "train" first, then "test".
    expected_sizes = (("train", 100), ("test", 300))
    for split_name, size in expected_sizes:
        self.assertEqual(len(splits[split_name]), size)
| 49 | |
| 50 | def test_loading_with_unit_fractions(self): |
| 51 | dataset_mixer = { |
nothing calls this directly
no test coverage detected