diff --git a/libscan/arc/arc.c b/libscan/arc/arc.c index eeb0d07..b4993d0 100644 --- a/libscan/arc/arc.c +++ b/libscan/arc/arc.c @@ -5,8 +5,6 @@ #include #include -#define MAX_SUBFILE_SIZE (long)(10000000000) - int should_parse_filtered_file(const char *filepath, int ext) { char tmp[PATH_MAX * 2]; @@ -110,7 +108,7 @@ scan_code_t parse_archive(scan_arc_ctx_t *ctx, vfile_t *f, document_t *doc) { meta_line_t *meta_list = malloc(sizeof(meta_line_t) + buf.cur); meta_list->key = MetaContent; strcpy(meta_list->str_val, buf.buf); - APPEND_META(doc, meta_list); + APPEND_META(doc, meta_list) dyn_buffer_destroy(&buf); } else { diff --git a/libscan/ebook/ebook.c b/libscan/ebook/ebook.c index 6d062c3..63f28a4 100644 --- a/libscan/ebook/ebook.c +++ b/libscan/ebook/ebook.c @@ -157,7 +157,7 @@ int render_cover(scan_ebook_ctx_t *ctx, fz_context *fzctx, document_t *doc, fz_d avcodec_receive_packet(jpeg_encoder, &jpeg_packet); APPEND_TN_META(doc, pixmap->w, pixmap->h) - ctx->store((char *) doc->uuid, sizeof(doc->uuid), (char *) jpeg_packet.data, jpeg_packet.size); + ctx->store((char *) doc->path_md5, sizeof(doc->path_md5), (char *) jpeg_packet.data, jpeg_packet.size); av_packet_unref(&jpeg_packet); av_free(*scaled_frame->data); @@ -174,14 +174,14 @@ void fz_err_callback(void *user, const char *message) { document_t *doc = (document_t *) user; const scan_ebook_ctx_t *ctx = &thread_ctx; - CTX_LOG_WARNINGF(doc->filepath, "FZ: %s", message); + CTX_LOG_WARNINGF(doc->filepath, "FZ: %s", message) } void fz_warn_callback(void *user, const char *message) { document_t *doc = (document_t *) user; const scan_ebook_ctx_t *ctx = &thread_ctx; - CTX_LOG_DEBUGF(doc->filepath, "FZ: %s", message); + CTX_LOG_DEBUGF(doc->filepath, "FZ: %s", message) } static void init_fzctx(fz_context *fzctx, document_t *doc) { diff --git a/libscan/font/font.c b/libscan/font/font.c index ce2203f..ab38385 100644 --- a/libscan/font/font.c +++ b/libscan/font/font.c @@ -229,7 +229,7 @@ void parse_font(scan_font_ctx_t *ctx, vfile_t *f, document_t *doc) { bmp_format(&bmp_data, dimensions, bitmap); APPEND_TN_META(doc, dimensions.width, dimensions.height) - ctx->store((char *) doc->uuid, sizeof(doc->uuid), (char *) bmp_data.buf, bmp_data.cur); + ctx->store((char *) doc->path_md5, sizeof(doc->path_md5), (char *) bmp_data.buf, bmp_data.cur); dyn_buffer_destroy(&bmp_data); free(bitmap); diff --git a/libscan/media/media.c b/libscan/media/media.c index 65bd5e4..14bd98c 100644 --- a/libscan/media/media.c +++ b/libscan/media/media.c @@ -1,8 +1,4 @@ #include "media.h" - -#include "../util.h" - - #include #define MIN_SIZE 32 @@ -323,7 +319,7 @@ void parse_media_format_ctx(scan_media_ctx_t *ctx, AVFormatContext *pFormatCtx, //Seek if (stream->nb_frames > 1 && stream->codecpar->codec_id != AV_CODEC_ID_GIF) { - int seek_ret = 0; + int seek_ret; for (int i = 20; i >= 0; i--) { seek_ret = av_seek_frame(pFormatCtx, video_stream, stream->duration * 0.10, 0); @@ -356,7 +352,7 @@ void parse_media_format_ctx(scan_media_ctx_t *ctx, AVFormatContext *pFormatCtx, if (scaled_frame == STORE_AS_IS) { APPEND_TN_META(doc, frame_and_packet->frame->width, frame_and_packet->frame->height) - ctx->store((char *) doc->uuid, sizeof(doc->uuid), (char *) frame_and_packet->packet->data, frame_and_packet->packet->size); + ctx->store((char *) doc->path_md5, sizeof(doc->path_md5), (char *) frame_and_packet->packet->data, frame_and_packet->packet->size); } else { // Encode frame to jpeg AVCodecContext *jpeg_encoder = alloc_jpeg_encoder(scaled_frame->width, scaled_frame->height, @@ -369,7 +365,7 @@ void parse_media_format_ctx(scan_media_ctx_t *ctx, AVFormatContext *pFormatCtx, // Save thumbnail APPEND_TN_META(doc, scaled_frame->width, scaled_frame->height) - ctx->store((char *) doc->uuid, sizeof(doc->uuid), (char *) jpeg_packet.data, jpeg_packet.size); + ctx->store((char *) doc->path_md5, sizeof(doc->path_md5), (char *) jpeg_packet.data, jpeg_packet.size); avcodec_free_context(&jpeg_encoder); av_packet_unref(&jpeg_packet); @@ -608,7 +604,7 @@ int store_image_thumbnail(scan_media_ctx_t *ctx, void* buf, size_t buf_len, docu if (scaled_frame == STORE_AS_IS) { APPEND_TN_META(doc, frame_and_packet->frame->width, frame_and_packet->frame->height) - ctx->store((char *) doc->uuid, sizeof(doc->uuid), (char *) frame_and_packet->packet->data, frame_and_packet->packet->size); + ctx->store((char *) doc->path_md5, sizeof(doc->path_md5), (char *) frame_and_packet->packet->data, frame_and_packet->packet->size); } else { // Encode frame to jpeg AVCodecContext *jpeg_encoder = alloc_jpeg_encoder(scaled_frame->width, scaled_frame->height, @@ -621,7 +617,7 @@ int store_image_thumbnail(scan_media_ctx_t *ctx, void* buf, size_t buf_len, docu // Save thumbnail APPEND_TN_META(doc, scaled_frame->width, scaled_frame->height) - ctx->store((char *) doc->uuid, sizeof(doc->uuid), (char *) jpeg_packet.data, jpeg_packet.size); + ctx->store((char *) doc->path_md5, sizeof(doc->path_md5), (char *) jpeg_packet.data, jpeg_packet.size); av_packet_unref(&jpeg_packet); avcodec_free_context(&jpeg_encoder); diff --git a/libscan/msdoc/msdoc.c b/libscan/msdoc/msdoc.c index 033a63a..e9a2728 100644 --- a/libscan/msdoc/msdoc.c +++ b/libscan/msdoc/msdoc.c @@ -6,7 +6,7 @@ #include "../ebook/ebook.h" -void parse_msdoc_text(scan_msdoc_ctx_t *ctx, vfile_t *f, document_t *doc, FILE *file_in, void* buf, size_t buf_len) { +void parse_msdoc_text(scan_msdoc_ctx_t *ctx, document_t *doc, FILE *file_in, void* buf, size_t buf_len) { // Open word doc options_type *opts = direct_vGetOptions(); @@ -73,7 +73,7 @@ void parse_msdoc_text(scan_msdoc_ctx_t *ctx, vfile_t *f, document_t *doc, FILE * free(out_buf); } -void parse_msdoc_pdf(scan_msdoc_ctx_t *ctx, vfile_t *f, document_t *doc, FILE *file, void* buf, size_t buf_len) { +void parse_msdoc_pdf(scan_msdoc_ctx_t *ctx, document_t *doc, FILE *file, void* buf, size_t buf_len) { scan_ebook_ctx_t ebook_ctx = { .content_size = ctx->content_size, @@ -115,7 +115,7 @@ void parse_msdoc_pdf(scan_msdoc_ctx_t *ctx, vfile_t *f, document_t *doc, FILE *f return; } - int ret = bWordDecryptor(file, buf_len, diag); + bWordDecryptor(file, buf_len, diag); vDestroyDiagram(diag); fclose(file_out); @@ -144,8 +144,8 @@ void parse_msdoc(scan_msdoc_ctx_t *ctx, vfile_t *f, document_t *doc) { } if (ctx->tn_size > 0) { - parse_msdoc_pdf(ctx, f, doc, file, buf, buf_len); + parse_msdoc_pdf(ctx, doc, file, buf, buf_len); } else { - parse_msdoc_text(ctx, f, doc, file, buf, buf_len); + parse_msdoc_text(ctx, doc, file, buf, buf_len); } } diff --git a/libscan/msdoc/msdoc.h b/libscan/msdoc/msdoc.h index aac8f6d..30cba6a 100644 --- a/libscan/msdoc/msdoc.h +++ b/libscan/msdoc/msdoc.h @@ -19,6 +19,6 @@ static int is_msdoc(scan_msdoc_ctx_t *ctx, unsigned int mime) { void parse_msdoc(scan_msdoc_ctx_t *ctx, vfile_t *f, document_t *doc); -void parse_msdoc_text(scan_msdoc_ctx_t *ctx, vfile_t *f, document_t *doc, FILE *file_in, void* buf, size_t buf_len); +void parse_msdoc_text(scan_msdoc_ctx_t *ctx, document_t *doc, FILE *file_in, void* buf, size_t buf_len); #endif diff --git a/libscan/ooxml/ooxml.c b/libscan/ooxml/ooxml.c index f35673c..1b77ce9 100644 --- a/libscan/ooxml/ooxml.c +++ b/libscan/ooxml/ooxml.c @@ -1,6 +1,5 @@ #include "ooxml.h" -#include "../util.h" #include #include #include @@ -106,7 +105,7 @@ static int read_part(scan_ooxml_ctx_t *ctx, struct archive *a, text_buffer_t *bu } __always_inline -static int read_doc_props(scan_ooxml_ctx_t *ctx, struct archive *a, text_buffer_t *buf, document_t *doc) { +static int read_doc_props(scan_ooxml_ctx_t *ctx, struct archive *a, document_t *doc) { xmlDoc *xml = xmlReadIO(xml_io_read, xml_io_close, a, "/", NULL, XML_PARSE_RECOVER | XML_PARSE_NOWARNING | XML_PARSE_NOERROR | XML_PARSE_NONET); @@ -158,7 +157,7 @@ void read_thumbnail(scan_ooxml_ctx_t *ctx, document_t *doc, struct archive *a, s archive_read_data(a, buf, entry_size); APPEND_TN_META(doc, 1, 1) // Size unknown - ctx->store((char *) doc->uuid, sizeof(doc->uuid), buf, entry_size); + ctx->store((char *) doc->path_md5, sizeof(doc->path_md5), buf, entry_size); free(buf); } @@ -198,7 +197,7 @@ void parse_ooxml(scan_ooxml_ctx_t *ctx, vfile_t *f, document_t *doc) { buffer_full = TRUE; } } else if (strcmp(path, "docProps/core.xml") == 0) { - if (read_doc_props(ctx, a, &tex, doc) != 0) { + if (read_doc_props(ctx, a, doc) != 0) { break; } } else if (strcmp(path, "docProps/thumbnail.jpeg") == 0) { diff --git a/libscan/raw/raw.c b/libscan/raw/raw.c index dd775a5..3d40c35 100644 --- a/libscan/raw/raw.c +++ b/libscan/raw/raw.c @@ -2,7 +2,6 @@ #include #include "../media/media.h" -#include #include @@ -71,7 +70,7 @@ int store_thumbnail_rgb24(scan_raw_ctx_t *ctx, libraw_processed_image_t *img, do avcodec_receive_packet(jpeg_encoder, &jpeg_packet); APPEND_TN_META(doc, scaled_frame->width, scaled_frame->height) - ctx->store((char *) doc->uuid, sizeof(doc->uuid), (char *) jpeg_packet.data, jpeg_packet.size); + ctx->store((char *) doc->path_md5, sizeof(doc->path_md5), (char *) jpeg_packet.data, jpeg_packet.size); av_packet_unref(&jpeg_packet); av_free(*scaled_frame->data); diff --git a/libscan/scan.h b/libscan/scan.h index 6341d78..5f68fc2 100644 --- a/libscan/scan.h +++ b/libscan/scan.h @@ -8,6 +8,7 @@ #include #include #include +#include #include "macros.h" @@ -106,6 +107,7 @@ typedef struct document { int mtime; short base; short ext; + unsigned char path_md5[MD5_DIGEST_LENGTH]; meta_line_t *meta_head; meta_line_t *meta_tail; char *filepath;