Append a character to the n-gram buffer.
(self, ch)
| 29 | self.capitalword = False |
| 30 | |
def add_char(self, ch):
    '''Push one character onto the end of the n-gram buffer.

    The character is first passed through ``self.normalize``.  The buffer
    (``self.grams``) is then updated as follows:

    * If the buffer currently ends with a space, it is reset to a single
      space and ``self.capitalword`` is cleared.  When the incoming
      character is also a space, nothing more happens.
    * Otherwise, if the buffer already holds ``self.N_GRAM`` or more
      characters, its first character is dropped.
    * The normalized character is appended.

    Finally ``self.capitalword`` is set to True when both the new
    character and the character that ended the buffer before this call
    are uppercase, set to False when the new character is not uppercase,
    and left untouched in the remaining case.

    Args:
        ch: The character to add (before normalization).
    '''
    ch = self.normalize(ch)
    # Remember what ended the buffer *before* it is modified below.
    previous = self.grams[-1]

    if previous == ' ':
        # Buffer ends with a space: start again from a lone space.
        self.grams = ' '
        self.capitalword = False
        if ch == ' ':
            # A space following a space adds nothing to the buffer.
            return
    elif len(self.grams) >= self.N_GRAM:
        # Buffer is at capacity: discard its oldest character.
        self.grams = self.grams[1:]
    self.grams += ch

    if not ch.isupper():
        self.capitalword = False
    elif previous.isupper():
        # Two uppercase characters in a row.
        self.capitalword = True
| 49 | |
| 50 | def get(self, n): |
| 51 | '''Get n-gram.''' |