mirror of
https://github.com/simon987/libscan.git
synced 2025-04-05 12:23:00 +00:00
text tests
This commit is contained in:
parent
a0c9d21863
commit
f6cd9c42e3
@ -11,33 +11,63 @@ static scan_arc_ctx_t arc_list_ctx;
|
|||||||
static scan_text_ctx_t text_500_ctx;
|
static scan_text_ctx_t text_500_ctx;
|
||||||
|
|
||||||
|
|
||||||
TEST(TextTest, BookCsvContentLen) {
|
TEST(Text, BookCsvContentLen) {
|
||||||
const char *filepath = "libscan-test-files/test_files/text/books.csv";
|
|
||||||
|
|
||||||
vfile_t f;
|
vfile_t f;
|
||||||
document_t doc;
|
document_t doc;
|
||||||
doc.meta_head = nullptr;
|
load_doc_file("libscan-test-files/test_files/text/books.csv", &f, &doc);
|
||||||
doc.meta_tail = nullptr;
|
|
||||||
load_file(filepath, &f);
|
|
||||||
parse_text(&text_500_ctx, &f, &doc);
|
parse_text(&text_500_ctx, &f, &doc);
|
||||||
|
|
||||||
ASSERT_NEAR(strlen(get_meta(&doc, MetaContent)->str_val), 500, 1);
|
ASSERT_NEAR(strlen(get_meta(&doc, MetaContent)->str_val), 500, 1);
|
||||||
CLOSE_FILE(f)
|
cleanup(&doc, &f);
|
||||||
destroy_doc(&doc);
|
|
||||||
}
|
}
|
||||||
|
|
||||||
TEST(TextTest, MemUtf8_1) {
|
TEST(Text, MemUtf8_1) {
|
||||||
const char *content = "a"; //todo
|
const char *content = "a";
|
||||||
|
|
||||||
vfile_t f;
|
vfile_t f;
|
||||||
document_t doc;
|
document_t doc;
|
||||||
doc.meta_head = nullptr;
|
load_doc_mem((void *) content, strlen(content), &f, &doc);
|
||||||
doc.meta_tail = nullptr;
|
|
||||||
load_mem((void *) content, strlen(content), &f);
|
|
||||||
parse_text(&text_500_ctx, &f, &doc);
|
parse_text(&text_500_ctx, &f, &doc);
|
||||||
|
|
||||||
ASSERT_EQ(strlen(get_meta(&doc, MetaContent)->str_val), 1);
|
ASSERT_EQ(strlen(get_meta(&doc, MetaContent)->str_val), 1);
|
||||||
destroy_doc(&doc);
|
cleanup(&doc, &f);
|
||||||
|
}
|
||||||
|
|
||||||
|
TEST(Text, MemUtf8_Invalid1) {
|
||||||
|
const char *content = "12345\xE0";
|
||||||
|
vfile_t f;
|
||||||
|
document_t doc;
|
||||||
|
load_doc_mem((void *) content, strlen(content), &f, &doc);
|
||||||
|
|
||||||
|
parse_text(&text_500_ctx, &f, &doc);
|
||||||
|
|
||||||
|
ASSERT_STREQ(get_meta(&doc, MetaContent)->str_val, "12345");
|
||||||
|
cleanup(&doc, &f);
|
||||||
|
}
|
||||||
|
|
||||||
|
TEST(Text, MemUtf8_2) {
|
||||||
|
const char *content = "最後測試";
|
||||||
|
vfile_t f;
|
||||||
|
document_t doc;
|
||||||
|
load_doc_mem((void *) content, strlen(content), &f, &doc);
|
||||||
|
|
||||||
|
parse_text(&text_500_ctx, &f, &doc);
|
||||||
|
|
||||||
|
ASSERT_STREQ(get_meta(&doc, MetaContent)->str_val, "最後測試");
|
||||||
|
cleanup(&doc, &f);
|
||||||
|
}
|
||||||
|
|
||||||
|
TEST(Text, MemUtf8_Invalid2) {
|
||||||
|
const char *content = "最後測\xe8\xa9";
|
||||||
|
vfile_t f;
|
||||||
|
document_t doc;
|
||||||
|
load_doc_mem((void *) content, strlen(content), &f, &doc);
|
||||||
|
|
||||||
|
parse_text(&text_500_ctx, &f, &doc);
|
||||||
|
|
||||||
|
ASSERT_STREQ(get_meta(&doc, MetaContent)->str_val, "最後測");
|
||||||
|
cleanup(&doc, &f);
|
||||||
}
|
}
|
||||||
|
|
||||||
|
|
||||||
|
@ -32,6 +32,23 @@ void fs_close(vfile_t *f) {
|
|||||||
}
|
}
|
||||||
}
|
}
|
||||||
|
|
||||||
|
void load_doc_file(const char *filepath, vfile_t *f, document_t *doc) {
|
||||||
|
doc->meta_head = nullptr;
|
||||||
|
doc->meta_tail = nullptr;
|
||||||
|
load_file(filepath, f);
|
||||||
|
}
|
||||||
|
|
||||||
|
void load_doc_mem(void *mem, size_t mem_len, vfile_t *f, document_t *doc) {
|
||||||
|
doc->meta_head = nullptr;
|
||||||
|
doc->meta_tail = nullptr;
|
||||||
|
load_mem(mem, mem_len, f);
|
||||||
|
}
|
||||||
|
|
||||||
|
void cleanup(document_t *doc, vfile_t *f) {
|
||||||
|
destroy_doc(doc);
|
||||||
|
CLOSE_FILE((*f))
|
||||||
|
}
|
||||||
|
|
||||||
void load_file(const char *filepath, vfile_t *f) {
|
void load_file(const char *filepath, vfile_t *f) {
|
||||||
stat(filepath, &f->info);
|
stat(filepath, &f->info);
|
||||||
f->fd = open(filepath, O_RDONLY);
|
f->fd = open(filepath, O_RDONLY);
|
||||||
|
@ -5,6 +5,9 @@
|
|||||||
|
|
||||||
void load_file(const char *filepath, vfile_t *f);
|
void load_file(const char *filepath, vfile_t *f);
|
||||||
void load_mem(void *mem, size_t size, vfile_t *f);
|
void load_mem(void *mem, size_t size, vfile_t *f);
|
||||||
|
void load_doc_mem(void *mem, size_t mem_len, vfile_t *f, document_t *doc);
|
||||||
|
void load_doc_file(const char *filepath, vfile_t *f, document_t *doc);
|
||||||
|
void cleanup(document_t *doc, vfile_t *f);
|
||||||
|
|
||||||
static void noop_logf(char *filepath, int level, char *format, ...) {
|
static void noop_logf(char *filepath, int level, char *format, ...) {
|
||||||
// noop
|
// noop
|
||||||
|
Loading…
x
Reference in New Issue
Block a user