| 88 | self.page_url = f"{self.root}/gallery/{self.gallery_id}/" |
| 89 | |
def metadata(self, page):
    """Build the metadata dict for a gallery from its HTML page.

    The result always holds "gallery_id", "title", "title_alt",
    "parody", "character", "tags", "artist", "group", "language"
    and "type". A "lang" entry is added only when the "language"
    value is non-empty.
    """
    extr = text.extract_from(page)

    # NOTE(review): 'extr' presumably consumes the page sequentially,
    # so the lookups below are kept in their original order -- confirm
    # against text.extract_from before reordering anything.
    heading = extr("<h1>", "<")
    subtitle = extr('class="subtitle">', "<")

    # The closing marker of each info section depends on whether the
    # '<ul class="galleries_info' lookup yields a non-empty result.
    if extr('<ul class="galleries_info', ">"):
        end = "</li>"
    else:
        end = "</ul>"

    data = {
        "gallery_id": text.parse_int(self.gallery_id),
        "title": text.unescape(heading),
        "title_alt": text.unescape(subtitle),
    }

    # (metadata key, section label) pairs, in the order they are looked up.
    sections = (
        ("parody", ">Parodies"),
        ("character", ">Characters"),
        ("tags", ">Tags"),
        ("artist", ">Artists"),
        ("group", ">Groups"),
        ("language", ">Languages"),
    )
    for key, label in sections:
        data[key] = self._split(extr(label, end))

    data["type"] = extr("href='/category/", "/")

    languages = data["language"]
    if languages:
        # Only the first listed language is converted to a code.
        data["lang"] = util.language_to_code(languages[0])

    return data
| 113 | |
| 114 | def _split(self, html): |
| 115 | results = [] |