diff --git a/tests/test_tokenizers.py b/tests/test_tokenizers.py index 578bf86..6c993b3 100644 --- a/tests/test_tokenizers.py +++ b/tests/test_tokenizers.py @@ -13,6 +13,8 @@ def test_tokenize(self): for i, token in enumerate(tokens): self.assertEqual(token, expected[i]) + self.assertEqual(tokenizer.dropped, 6) + class TestCanonical(unittest.TestCase): def test_tokenize(self): tokenizer = tokenizers.Canonical(tokenizers.Kmer(k=6)) @@ -33,4 +35,7 @@ def test_tokenize(self): expected = ['CGGT', 'TCAG', 'TAAT'] for i, token in enumerate(tokens): - self.assertEqual(token, expected[i]) \ No newline at end of file + self.assertEqual(token, expected[i]) + + self.assertEqual(tokenizer.dropped, 1) + \ No newline at end of file