17 lines
389 B
Python

from unittest import TestCase
from parsing import TikaFileParser
import os
# Absolute directory containing this test module; fixture paths are built from it.
dir_name = os.path.split(os.path.abspath(__file__))[0]
class DocxParserTest(TestCase):
    """Exercise ``TikaFileParser`` on the ``docx1.docx`` fixture."""

    def test_parse_content(self):
        # Fixture locations, relative to this module's directory.
        fixtures_dir = dir_name + "/test_files/"
        docx_path = dir_name + "/test_files/docx1.docx"

        # NOTE(review): the trailing 1000 presumably caps the extracted
        # content length -- confirm against TikaFileParser.
        tika_parser = TikaFileParser([], fixtures_dir, 1000)
        parsed = tika_parser.parse(docx_path)

        # The "content" entry of the parse result must have length 1000.
        content_length = len(parsed["content"])
        self.assertEqual(content_length, 1000)