(
self, filename="train.csv", text_col="text", label_col="label", size=-1
)
| 224 | self.labels = None |
| 225 | |
def get_train_examples(
    self, filename="train.csv", text_col="text", label_col="label", size=-1
):
    """Load the training CSV and convert its rows into examples.

    The file is read from ``os.path.join(self.data_dir, filename)`` with
    ``pandas.read_csv`` and handed to ``self._create_examples`` tagged
    with the set type ``"train"``.

    Args:
        filename: Name of the CSV file inside ``self.data_dir``.
        text_col: Column name forwarded to ``_create_examples`` as
            ``text_col``.
        label_col: Column name forwarded to ``_create_examples`` as
            ``label_col``.
        size: ``-1`` (the default) uses every row of the file. Any other
            value is passed to ``DataFrame.sample`` to draw a random
            subset of that many rows; pandas rejects values it cannot
            satisfy (e.g. more rows than the file has).

    Returns:
        Whatever ``self._create_examples`` returns for the selected rows.
    """
    # Read once; the two code paths differ only in whether we subsample.
    data_df = pd.read_csv(os.path.join(self.data_dir, filename))

    if size != -1:
        data_df = data_df.sample(size)

    return self._create_examples(
        data_df, "train", text_col=text_col, label_col=label_col
    )
| 242 | |
| 243 | def get_dev_examples( |
| 244 | self, filename="val.csv", text_col="text", label_col="label", size=-1 |
no test coverage detected