Update fix_single_quotes

This commit is contained in:
2021-08-28 20:48:00 -04:00
parent 60273fb6bd
commit 7e0ffafb8c
4 changed files with 14 additions and 2 deletions

View File

@@ -130,6 +130,17 @@ class TestText(TestCase):
expected = "hello world it's it's"
self.assertEqual(cleaned, expected)
def test_single_quote(self):
    # Runs preprocess with lowercase=True and fix_single_quotes=True on a
    # string containing several spellings of "it's" and checks the result.
    # NOTE(review): the last input token appears here without any quote
    # character, yet the expected output contains one -- presumably a
    # non-ASCII apostrophe was lost from this literal; verify against the
    # repository copy before relying on it.
    raw = "it's it`s its"
    want = "it's it's it's"
    got = preprocess(raw, lowercase=True, fix_single_quotes=True)
    self.assertEqual(got, want)
def test_html_10(self):
text = "<div>\n Hello, \t\n<strong>world! it's it`s https://google.ca/test/abc.pdf </strong>\n\t</div>"