Skip to content

Commit

Permalink
emojis
Browse files: browse the repository at this point in the history
  • Loading branch information
mgraffg committed Aug 24, 2024
1 parent 356f73b commit acaec43
Showing 1 changed file with 4 additions and 0 deletions.
4 changes: 4 additions & 0 deletions dialectid/text_repr.py
Original file line number Diff line number Diff line change
Expand Up @@ -97,6 +97,7 @@ def bow(self):
self._bow = bow
return bow


class SeqTM(TextModel):
"""TextModel where the utterance is segmented in a sequence."""

Expand Down Expand Up @@ -151,6 +152,9 @@ def __vocabulary(self, counter):
for k, v in emojis.items():
self._map[k] = v
tokens[k] = v
for x in [f'~{k}~', f'~{k}', f'{k}~']:
self._map[x] = v
tokens[x] = v

@property
def language(self):
Expand Down

0 comments on commit acaec43

Please sign in to comment.