mirror of
https://github.com/simon987/sist2.git
synced 2025-04-21 19:26:45 +00:00
Compare commits
No commits in common. "410283f14a41c1b034135bfc10d850b0f0f6e8ee" and "af5059f366e858994e172cd09f9261827cc7682c" have entirely different histories.
410283f14a
...
af5059f366
10
third-party/libscan/libscan/ocr/ocr.h
vendored
10
third-party/libscan/libscan/ocr/ocr.h
vendored
@ -5,7 +5,7 @@
|
|||||||
#include <tesseract/capi.h>
|
#include <tesseract/capi.h>
|
||||||
|
|
||||||
#define MIN_OCR_WIDTH 350
|
#define MIN_OCR_WIDTH 350
|
||||||
#define MIN_OCR_HEIGHT 33
|
#define MIN_OCR_HEIGHT 100
|
||||||
#define MIN_OCR_LEN 10
|
#define MIN_OCR_LEN 10
|
||||||
|
|
||||||
#define OCR_IS_VALID_BPP(d) \
|
#define OCR_IS_VALID_BPP(d) \
|
||||||
@ -28,13 +28,7 @@ ocr_extract_text(const char *tesseract_path, const char *tesseract_lang,
|
|||||||
TessBaseAPI *api = TessBaseAPICreate();
|
TessBaseAPI *api = TessBaseAPICreate();
|
||||||
TessBaseAPIInit3(api, tesseract_path, tesseract_lang);
|
TessBaseAPIInit3(api, tesseract_path, tesseract_lang);
|
||||||
|
|
||||||
// https://github.com/simon987/sist2/issues/443
|
TessBaseAPISetPageSegMode(api, PSM_AUTO_OSD);
|
||||||
if (strstr(tesseract_lang, "chi") != NULL) {
|
|
||||||
TessBaseAPISetVariable(api, "preserve_interword_spaces", "1");
|
|
||||||
}
|
|
||||||
|
|
||||||
// TODO: add this as param?
|
|
||||||
// TessBaseAPISetPageSegMode(api, PSM_AUTO_OSD);
|
|
||||||
|
|
||||||
TessBaseAPISetImage(api, img_buf, img_w, img_h, img_bpp, img_stride);
|
TessBaseAPISetImage(api, img_buf, img_w, img_h, img_bpp, img_stride);
|
||||||
TessBaseAPISetSourceResolution(api, img_xres);
|
TessBaseAPISetSourceResolution(api, img_xres);
|
||||||
|
Loading…
x
Reference in New Issue
Block a user