(model_name, models_dir)
| 112 | |
| 113 | |
def get_encoder(model_name, models_dir):
    """Build an ``Encoder`` from a model's vocabulary and BPE merge files.

    Reads ``encoder.json`` and ``vocab.bpe`` from the directory
    ``<models_dir>/<model_name>/``.

    Args:
        model_name: Name of the model sub-directory inside ``models_dir``.
        models_dir: Directory that contains the model sub-directory.

    Returns:
        An ``Encoder`` constructed with the parsed JSON object as ``encoder``
        and the list of merge tuples as ``bpe_merges``.

    Raises:
        OSError: If either file cannot be opened.
        json.JSONDecodeError: If ``encoder.json`` is not valid JSON.
    """
    model_dir = os.path.join(models_dir, model_name)

    # Decode both files explicitly as UTF-8 so the result does not depend on
    # the platform's locale encoding (previously only vocab.bpe did this).
    with open(os.path.join(model_dir, "encoder.json"), "r", encoding="utf-8") as f:
        encoder = json.load(f)
    with open(os.path.join(model_dir, "vocab.bpe"), "r", encoding="utf-8") as f:
        bpe_lines = f.read().split("\n")

    # The first line is skipped, as before (presumably a version header --
    # confirm against the file format). Blank lines are filtered instead of
    # unconditionally dropping the last line, so the final merge rule is kept
    # even when the file has no trailing newline, and stray empty lines do not
    # produce empty tuples.
    bpe_merges = [tuple(line.split()) for line in bpe_lines[1:] if line.strip()]
    return Encoder(encoder=encoder, bpe_merges=bpe_merges)
no test coverage detected