Added pdf & epub parsing

This commit is contained in:
simon987
2018-04-16 19:42:40 -04:00
parent 6d3cceb1b1
commit 17c682a5ef
11 changed files with 264 additions and 57 deletions

13
spec/EbookParserTest.py Normal file
View File

@@ -0,0 +1,13 @@
from unittest import TestCase
from parsing import EbookParser
class EbookParserTest(TestCase):
    """Unit tests for ``EbookParser`` using the epub fixture in ``test_files``."""

    def test_parse_content(self):
        """Parsing ``epub1.epub`` must yield a ``content`` entry of length 1000."""
        # NOTE(review): the second constructor argument is presumably the
        # maximum content length, since the same number is asserted on below
        # -- confirm against EbookParser.
        size = 1000
        ebook_parser = EbookParser([], size)

        parsed = ebook_parser.parse("test_files/epub1.epub")
        content = parsed["content"]

        self.assertEqual(len(content), size)