X-Git-Url: https://www.chiark.greenend.org.uk/ucgi/~yarrgweb/git?a=blobdiff_plain;f=pctb%2Focr.h;h=5b5f697dbd88603a37dd8f518f91308c39192dfb;hb=451e1b1ed16a7a53395c030598a83031e266f973;hp=8e1263d94495bf365cc97748d2b2e839234c0dc6;hpb=cd124e1675276f26b594f23367da63637673698f;p=ypp-sc-tools.web-live.git diff --git a/pctb/ocr.h b/pctb/ocr.h index 8e1263d..5b5f697 100644 --- a/pctb/ocr.h +++ b/pctb/ocr.h @@ -1,28 +1,26 @@ +/* + * ocr.c forms a mostly-self-contained bit + * so we put its declarations in this separate file + */ + #ifndef OCR_H #define OCR_H -#define DEBUG_RECTANGLES -// #define DEBUG_OCR - - - #define _GNU_SOURCE -#include -#include -#include -#include #include -#include #include +#include +#include +#include +#include +#include #include -#include -#include +#include #include #include -#include typedef struct { @@ -30,7 +28,6 @@ typedef struct { char d[]; } CanonImage; - typedef uint32_t Pixcol; #define PSPIXCOL(priscan) priscan##32 @@ -40,10 +37,12 @@ typedef struct { unsigned ctxmap; /* match context index */ } OcrResultGlyph; + typedef const struct OcrCellTypeInfo *OcrCellType; extern const struct OcrCellTypeInfo ocr_celltype_text; extern const struct OcrCellTypeInfo ocr_celltype_number; + typedef struct OcrReader OcrReader; OcrReader *ocr_init(int h); @@ -52,68 +51,47 @@ OcrResultGlyph *ocr(OcrReader *rd, OcrCellType, int w, Pixcol cols[]); * array is valid until next call to ocr() */ -void debug_flush(void); -void find_structure(CanonImage *im); +/*----- debugging arrangements, rather contingent -----*/ -#define eassert assert -#define debug stdout +#define DEBUG_FLAG_LIST \ + DF(findypp) \ + DF(pages) \ + DF(rect) \ + DF(ocr) \ + DF(callout) -const char *get_vardir(void); +enum { +#define DF(f) dbg__shift_##f, + DEBUG_FLAG_LIST +#undef DF +}; +enum { +#define DF(f) dbg_##f = 1 << dbg__shift_##f, + DEBUG_FLAG_LIST +#undef DF +}; -CanonImage *file_read_image(FILE *f); -int main_test(void); +unsigned debug_flags; -#define MAX_PAGES 100 -extern CanonImage *page_images[MAX_PAGES]; -extern int npages; +#define DEBUGP(f) (!!(debug_flags & dbg_##f)) +void debug_flush(void); -typedef struct { - unsigned long rgb; /* on screen */ - char c; /* canonical */ -} CanonColourInfo; - -extern const CanonColourInfo canoncolourinfos[]; - -CanonImage *alloc_canon_image(int w, int h); - -#ifdef DEBUG_RECTANGLES -# define CANIMG_DEBUG_RECTANGLE_1LINE(im,w,h) \ - fprintf(debug, "%4d ",y); \ - r= fwrite(im->d + y*w, 1,w, debug); \ - eassert(r==w); \ - fputc('\n',debug); -#else -# define CANIMG_DEBUG_RECTANGLE_1LINE(im,y,h) /* nothing */ -#endif - -#define CANONICALISE_IMAGE(im,w,h, COMPUTE_RGB) do{ \ - /* compute_rgb should be a number of statements, or \ - * a block, which assigns to \ - * unsigned long rgb; \ - * given the values of \ - * int x,y; \ - * all of which are anamorphic. Result is stored in im. \ - */ \ - (im)= alloc_canon_image((w), (h)); \ - \ - int x,y,r; \ - for (y=0; y<(h); y++) { \ - for (x=0; x<(w); x++) { \ - const CanonColourInfo *cci; \ - unsigned long rgb; \ - COMPUTE_RGB; \ - for (cci=canoncolourinfos; cci->c; cci++) \ - if (cci->rgb == rgb) { \ - (im)->d[y*(w) + x]= cci->c; \ - break; \ - } \ - } \ - CANIMG_DEBUG_RECTANGLE_1LINE((im),(w),(h)) \ - } \ - debug_flush(); \ - }while(0) +#define eassert assert +#define debug stderr + +const char *get_vardir(void); + +#define DEBUG_DEFINE_SOME_DEBUGF(fl,funcf) \ + static void v##funcf(const char *fmt, va_list al) { \ + if (DEBUGP(fl)) \ + vfprintf(debug,fmt,al); \ + } \ + static void funcf(const char *fmt, ...) { \ + va_list al; va_start(al,fmt); v##funcf(fmt,al); va_end(al); \ + } +#define DEBUG_DEFINE_DEBUGF(fl) DEBUG_DEFINE_SOME_DEBUGF(fl,debugf) #endif /*OCR_H*/