2 * Parsing of the structure of the YPP client's displayed image
5 * This is part of ypp-sc-tools, a set of third-party tools for assisting
6 * players of Yohoho Puzzle Pirates.
8 * Copyright (C) 2009 Ian Jackson <ijackson@chiark.greenend.org.uk>
10 * This program is free software: you can redistribute it and/or modify
11 * it under the terms of the GNU General Public License as published by
12 * the Free Software Foundation, either version 3 of the License, or
13 * (at your option) any later version.
15 * This program is distributed in the hope that it will be useful,
16 * but WITHOUT ANY WARRANTY; without even the implied warranty of
17 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
18 * GNU General Public License for more details.
20 * You should have received a copy of the GNU General Public License
21 * along with this program. If not, see <http://www.gnu.org/licenses/>.
23 * Yohoho and Puzzle Pirates are probably trademarks of Three Rings and
24 * are used without permission. This program is not endorsed or
25 * sponsored by Three Rings.
28 #include "structure.h"
30 DEBUG_DEFINE_DEBUGF(struct)
/* Seed pixel for locating the main table rectangle: find_structure
 * initialises both `mainr_tl' and the `updown' probe rectangle from it. */
32 #define START_MAIN {200,200}
/* Dimension of the colrightx[] array; find_structure records a column's
 * right-hand x coordinate only while the column number is below this. */
34 #define INTERESTING_COLUMNS 7
/* NOTE(review): no use of this is visible in this part of the file;
 * presumably the number of leading text (non-numeric) columns - confirm. */
35 #define TEXT_COLUMNS 2
40 int commbasey, comminty;
41 int colrightx[INTERESTING_COLUMNS];
44 const CanonImage *page_images[MAX_PAGES];
45 static PageStruct page_structs[MAX_PAGES];
46 const RgbImage *page0_rgbimage;
49 static int text_h=-1, columns=-1;
53 static const CanonImage *cim;
56 char *archipelago, *island;
/* Map a coordinate name to the name of the perpendicular one.  ADJUST_BOX
 * pastes its XY argument onto `OTHERCOORD_' so that it can scan along the
 * axis at right angles to the edge it is moving. */
58 #define OTHERCOORD_x y
59 #define OTHERCOORD_y x
/* Makes `page' the current page: points the file-level `cim' at its
 * canonical image and copies its stored PageStruct into `s'.
 * `page' is used as an array index without any range check here. */
62 void select_page(int page) {
63 cim= page_images[page];
64 s= page_structs[page];
70 Rgb rgbx; /* on screen, REVERSED BYTES ie r||g||b */
71 char c; /* canonical */
74 const CanonColourInfo canoncolourinfo_table[]= {
75 { 0x475A5E, '*' }, /* edge */
76 { 0x2C5F7A, '*' }, /* edge just under box heading shadow */
77 { 0xC5C7AE, '*' }, /* blank area of partial commodities list */
78 { 0x6B828C, '*' }, /* background of ship status meter area */
79 { 0x934405, '*' }, /* border of ship meter area */
80 { 0x7D9094, '+' }, /* interbox */
81 { 0x022158, 'O' }, /* ahoy /w output foreground */
82 { 0xB5B686, 'H' }, /* ahoy /w output heading background */
84 { 0xBDC5BF, ' ' }, /* background - pale Sugar cane, etc. */
85 { 0xADB5AF, ' ' }, /* background - dark */
86 { 0xC7E1C3, ' ' }, /* background - pale Swill, etc. */
87 { 0xB5CFB1, ' ' }, /* background - dark */
88 { 0xD6CEB0, ' ' }, /* background - pale Madder, etc. */
89 { 0xC8C0A2, ' ' }, /* background - dark */
90 { 0xE0E1D3, ' ' }, /* background - pale Lorandite, etc. */
91 { 0xD0D1C3, ' ' }, /* background - dark */
92 { 0xE5E6C1, ' ' }, /* background - pale Cloth */
93 { 0xD7D8B3, ' ' }, /* background - dark */
94 { 0xEDDED9, ' ' }, /* background - pale Dye */
95 { 0xDACBC6, ' ' }, /* background - dark */
96 { 0xD3DEDF, ' ' }, /* background - pale Paint */
97 { 0xC5D0D1, ' ' }, /* background - dark */
98 { 0xDCD1CF, ' ' }, /* background - pale Enamel */
99 { 0xCEC3C1, ' ' }, /* background - dark */
100 { 0xF3F6F5, ' ' }, /* background - pale fruit */
101 { 0xE2E7E5, ' ' }, /* background - dark */
103 { 0x000000, 'o' }, /* foreground */
104 { 0xD4B356, ' ' }, /* background (cursor) */
105 { 0xFFFFFF, 'o' }, /* foreground (cursor) */
107 { 0x5B93BF, '_' }, /* selector dropdown background */
108 { 0xD7C94F, 'X' }, /* selector dropdown foreground */
112 CanonColourInfoReds canoncolourinfo_tree;
/* Builds the lookup tree canoncolourinfo_tree from canoncolourinfo_table.
 * Each table colour is split into three bytes which index successive
 * levels of the tree (red2[] -> green2[] -> blue2[]); the leaf holds the
 * entry's canonical character.  Levels are allocated with mmalloc; the
 * conditions guarding those allocations are on lines not visible here. */
114 void canon_colour_prepare(void) {
115 const CanonColourInfo *cci;
/* The walk ends at the first table entry whose canonical char is 0. */
116 for (cci=canoncolourinfo_table; cci->c; cci++) {
/* r is bits 16..23 of rgbx, g bits 8..15, b bits 0..7. */
117 unsigned char r= cci->rgbx >> 16;
118 unsigned char g= cci->rgbx >> 8;
119 unsigned char b= cci->rgbx;
121 CanonColourInfoGreens *greens= canoncolourinfo_tree.red2[r];
123 greens= canoncolourinfo_tree.red2[r]= mmalloc(sizeof(*greens));
127 CanonColourInfoBlues *blues= greens->green2[g];
129 blues= greens->green2[g]= mmalloc(sizeof(*blues));
/* A freshly allocated leaf array is filled with '?' bytes. */
130 memset(blues, '?', sizeof(*blues));
133 blues->blue2[b]= cci->c;
137 static inline char get(int x, int y) { return cim->d[y * cim->w + x]; }
138 static inline char get_p(Point p) { return get(p.x,p.y); }
/* First half of a failed-MUST report.  MUST calls this with __FILE__,
 * __LINE__ and the stringified condition; the message text below
 * explains what to check and ends with a "%s:%d: requirement failed"
 * line for that source position.  The statement which actually emits
 * the text is on lines not visible here. */
141 static void mustfail1(const char *file, int line, const char *what) {
144 "Unable to figure out contents of YPP client display.\n"
145 "Please check the following:\n"
146 " * YPP client is showing commodity listing screen\n"
147 " * YPP client window is on top (we try to raise it but your window\n"
148 " manager might have prevented that from succeeding)\n"
150 "If all of these are true, please report this as a fault.\n\n"
152 " %s:%d: requirement failed:\n"
/* Second half of a failed-MUST report: prints "Giving up." to stderr.
 * Declared NORET (presumably a no-return attribute - confirm); the call
 * which ends the program is on a line not visible here. */
156 static void mustfail2(void) NORET;
157 static void mustfail2(void) {
158 fprintf(stderr, "\n\nGiving up.\n");
/* MUST(x, ifnot): if condition x is false (hinted to the compiler as the
 * unlikely case), start a failure report with mustfail1, passing the
 * source position and the text of x.  How `ifnot' is used and how the
 * report is completed are on lines of the macro not visible here;
 * callers in this file pass M*() diagnostic printers as `ifnot'. */
162 #define MUST(x, ifnot) do{ \
163 if (__builtin_expect(!(x), 0)) { \
164 mustfail1(__FILE__,__LINE__,#x); \
/* Diagnostic printers, used in the `ifnot' argument of MUST.  Each writes
 * " name=value" to stderr, where name is the stringified argument:
 *   MP   a Point, as x,y             MI   an int
 *   MIL  a long                      MRGB a colour, 6 hex digits (PRIx32)
 *   MC   a char in single quotes     MS   a string in double quotes
 *   MF   a double (%f)               MR   a Rect, as tlx,tly..brx,bry
 * MSB is the exception: it prints just the given string after a space,
 * with no name. */
170 #define MP(v) fprintf(stderr," %s=%d,%d",#v,(v).x,(v).y)
171 #define MI(v) fprintf(stderr," %s=%d", #v,(v))
172 #define MIL(v) fprintf(stderr," %s=%ld", #v,(v))
173 #define MRGB(v) fprintf(stderr," %s=%06"PRIx32, #v,(v))
174 #define MC(v) fprintf(stderr," %s='%c'", #v,(v))
175 #define MS(v) fprintf(stderr," %s=\"%s\"", #v,(v))
176 #define MF(v) fprintf(stderr," %s=%f", #v,(v))
177 #define MSB(v) fprintf(stderr," %s", (v))
178 #define MR(v) fprintf(stderr," %s=%d,%d..%d,%d",\
179 #v,(v).tl.x,(v).tl.y,(v).br.x,(v).br.y)
/* Requires every pixel of the rectangle (tlx,tly)..(brx,bry), corners
 * inclusive, to have a canonical character listed in the string `ok';
 * the caller's line number is passed along for the failure report.
 *
 * The expansion is a single expression with no trailing semicolon: the
 * caller writes the `;', so the macro behaves like a function call and is
 * safe as the body of an if/else.  Arguments are parenthesised. */
#define REQUIRE_RECTANGLE(tlx,tly,brx,bry,ok)				\
  require_rectangle((tlx), (tly), (brx), (bry), (ok), __LINE__)
/* Loop header visiting every pixel of rectangle `rect' (both corners
 * inclusive) with the Point lvalue `pt': columns left to right and,
 * within each column, rows top to bottom.  The statement following the
 * macro is the body.  It expands to two nested for loops, so `break' in
 * the body leaves only the inner (row) loop.  Both arguments are
 * evaluated repeatedly. */
#define FOR_P_RECT(pt,rect)					\
  for ((pt).x= (rect).tl.x; (pt).x <= (rect).br.x; ++(pt).x)	\
    for ((pt).y= (rect).tl.y; (pt).y <= (rect).br.y; ++(pt).y)
/* Requires a canonical character `c' to occur in the string `ok'; on
 * failure the MUST report shows lineno, rr, the point p and ok.
 * The lines which declare p and c are not visible here; presumably c is
 * the character at each point p of rr in turn - confirm. */
189 static void require_rectangle_r(Rect rr, const char *ok, int lineno) {
193 MUST( strchr(ok,c), ({
194 MI(lineno),MR(rr);MP(p);MS(ok);
/* Convenience form of require_rectangle_r: builds the Rect from its
 * top-left (tlx,tly) and bottom-right (brx,bry) corners and passes ok and
 * lineno through unchanged. */
198 static void require_rectangle(int tlx, int tly, int brx, int bry,
199 const char *ok, int lineno) {
200 Rect rr= {{tlx,tly},{brx,bry}};
201 require_rectangle_r(rr, ok, lineno);
/* Debugging dump of rectangle rr of the current image `cim' to the
 * `debug' stream.  Does nothing unless DEBUGP(rect) is true.  Output is a
 * heading line with `what', `whati' and the corner coordinates, then for
 * each row its y value, rr.tl.x columns of padding, a '|' and that row's
 * canonical characters from rr.tl.x to rr.br.x. */
204 static void debug_rect(const char *what, int whati, Rect rr) {
205 if (!DEBUGP(rect)) return;
207 fprintf(debug, "%s %d: %d,%d..%d,%d:\n", what, whati,
208 rr.tl.x,rr.tl.y, rr.br.x,rr.br.y);
/* w is the rectangle's width in pixels, both edge columns included. */
209 w= rr.br.x - rr.tl.x + 1;
210 for (y=rr.tl.y; y<=rr.br.y; y++) {
211 fprintf(debug, "%4d%*s|", y, rr.tl.x,"");
212 fwrite(cim->d + y*cim->w + rr.tl.x, 1, w, debug);
/* Tries the template `all' (allh rows, each allw characters) at a range
 * of positions in the current image.  Vertical offsets run from 0 up to
 * but not including search.br.y, skipping those where the template's
 * last row would lie above search.tl.y; horizontal offsets keep the
 * whole template between search.tl.x and search.br.x.  Template cells
 * which are ' ' are ignored; the others are compared with the image via
 * get().  The good/bad tallies are logged with debugf.  How the tallies
 * decide the return value is on lines not visible here. */
219 static int commod_selector_matches(Rect search, const char *const *all,
220 int allh, int allw) {
221 int alloffy, alloffx;
222 for (alloffy=0; alloffy < search.br.y; alloffy++) {
223 if (alloffy+allh-1 < search.tl.y) continue;
224 for (alloffx=search.tl.x; alloffx+allw-1 <= search.br.x; alloffx++) {
227 for (x=0; x<allw; x++)
228 for (y=0; y<allh; y++) {
230 if (want==' ') continue;
231 if (get(alloffx+x, alloffy+y) == want)
236 debugf("CHECKCOMMOD alloff=%d,%d good=%d bad=%d\n",
237 alloffx,alloffy, good,bad);
/* WALK_UNTIL(point,coord,increm,last,edge): moves (point).coord in steps
 * of increm.  The walk ends either when the pixel at point has canonical
 * character `edge' - point is then stepped back once, so it is left on
 * the last pixel before the edge - or when coord has gone one step past
 * `last', ie equals last+increm.  The enclosing loop construct is on
 * lines of the macro not visible here. */
245 #define WALK_UNTIL(point,coord,increm,last,edge) \
247 if ((point).coord == (last)+(increm)) break; \
248 if (get_p((point)) == (edge)) { (point).coord -= (increm); break; } \
249 (point).coord += (increm); \
/* As WALK_UNTIL, but afterwards insists (with MUST) that the walk did
 * not run off the end, ie that coord is not last+increm; the failure
 * report shows point, increm, last and edge. */
252 #define WALK_UNTIL_MUST(point,coord,increm,last,edge) \
254 WALK_UNTIL(point,coord,increm,last,edge); \
255 MUST( (point).coord != (last)+(increm), \
256 MP(point); MI(increm); MI(last); MC(edge); \
/* ADJUST_BOX(search,insidechrs,OP,want, lim,LIMIT_MUST, TLBR,XY,increm):
 * moves one edge of the Rect `search' - TLBR selects the corner (tl or
 * br), XY the coordinate (x or y) - by increm at a time.  Each step:
 *  - LIMIT_MUST(cond, diagnostics) is applied to the condition that the
 *    box is not degenerate along XY and the moving edge has not reached
 *    `lim' (callers pass MUST, or a macro which breaks out quietly);
 *  - the pixels along the moving edge line are scanned across the
 *    perpendicular axis, counting in `got' those whose canonical
 *    character is in insidechrs;
 *  - `got OP want' is tested; the action taken when it holds is on a line
 *    not visible here (presumably the adjustment stops - confirm);
 *  - the edge is moved by increm. */
260 #define ADJUST_BOX(search,insidechrs,OP,want, lim,LIMIT_MUST, TLBR,XY,increm) \
262 LIMIT_MUST( (search).tl.XY != (search).br.XY && \
263 (search).TLBR.XY != (lim), \
264 MR((search));MSB(#TLBR);MSB(#XY) ); \
266 Point p=(search).tl; \
267 for (p.XY=(search).TLBR.XY; \
268 p.OTHERCOORD_##XY <= (search).br.OTHERCOORD_##XY; \
269 p.OTHERCOORD_##XY++) \
270 got += !!strchr(insidechrs, get_p(p)); \
271 if ((got) OP (want)) \
273 (search).TLBR.XY += increm; \
/*
 * Works out the layout of the commodity table in the current canonical
 * image and records it in the file-level PageStruct `s'.
 *
 * Steps visible here:
 *  - (debug output) a ruler of x coordinates across the image width;
 *  - the main rectangle s.mr is found by walking outwards to '*' edge
 *    pixels, and must be bordered by '*' on all four sides;
 *  - CHECK_STRIP_BORDER moves each side of s.mr inwards by one pixel
 *    where a '+' strip is found there;
 *  - the `updown' probe yields the row geometry s.commbasey and
 *    s.comminty;
 *  - the `across' probe finds the column boundaries; right-hand edges of
 *    the first INTERESTING_COLUMNS columns go into s.colrightx[], and
 *    the column count must be at least MIN_COLUMNS and stay below
 *    MAX_COLUMNS;
 *  - the `pager' probe locates the pager to the right of s.mr;
 *  - SET_ONCE requires `columns' and `text_h' to come out the same on
 *    every call.
 *
 * Outputs:
 *  *pagestruct_r             newly mmalloc'd PageStruct
 *  *max_relevant_y_r         s.mr.br.y + 10; via SET_ONCE, so a value
 *                            other than -1 already there must agree
 *  *commod_focus_point_r     s.mr.tl moved right 10 and down comminty/3
 *  *commod_focuslast_point_r s.mr.br moved left 10 and up comminty/3
 *  *commod_page_point_r      horizontally central in the pager box, one
 *                            pixel above its top
 * The last four are written only if the pointer is non-null.
 *
 * Finally text_h must not exceed OCR_MAX_H.
 *
 * NOTE(review): `im' is not used on any visible line; presumably it is
 * assigned to `cim' on a line not shown - confirm.
 */
276 void find_structure(const CanonImage *im,
277 PageStruct **pagestruct_r,
278 int *max_relevant_y_r,
279 Point *commod_focus_point_r,
280 Point *commod_page_point_r,
281 Point *commod_focuslast_point_r) {
285 Rect whole = { {0,0}, {cim->w-1,cim->h-1} };
289 for (y=0, xscaleunit=1; y<4; y++, xscaleunit*=10) {
291 for (x=0; x<=cim->w; x++) {
292 if (x % xscaleunit) fputc(' ',debug);
293 else fprintf(debug,"%d",(x / xscaleunit)%10);
299 Point mainr_tl= START_MAIN;
301 WALK_UNTIL_MUST(s.mr.tl, y,-1, whole.tl.y, ' ');
304 WALK_UNTIL_MUST(s.mr.tl, x,-1, whole.tl.x, '*');
305 WALK_UNTIL_MUST(s.mr.tl, y,-1, whole.tl.y, '*');
306 WALK_UNTIL_MUST(s.mr.br, x,+1, whole.br.x, '*');
307 WALK_UNTIL_MUST(s.mr.br, y,+1, whole.br.y, '*');
309 REQUIRE_RECTANGLE(s.mr.tl.x-1, s.mr.tl.y, s.mr.tl.x-1, s.mr.br.y, "*");
310 REQUIRE_RECTANGLE(s.mr.br.x+1, s.mr.tl.y, s.mr.br.x+1, s.mr.br.y, "*");
311 REQUIRE_RECTANGLE(s.mr.tl.x, s.mr.tl.y-1, s.mr.br.x, s.mr.tl.y-1, "*");
312 REQUIRE_RECTANGLE(s.mr.tl.x, s.mr.br.y+1, s.mr.br.x, s.mr.br.y+1, "*");
314 #define CHECK_STRIP_BORDER(tlbr,xy,increm) \
319 csb_p.x++; csb_p.y++; \
320 csb_p.xy= s.mr.tlbr.xy; \
321 if (get_p(csb_p)=='+') { \
323 csb_r.tl.xy= csb_p.xy; \
324 csb_r.br.xy= csb_p.xy; \
325 require_rectangle_r(csb_r, "+", __LINE__); \
326 s.mr.tlbr.xy += increm; \
330 debug_rect("s.mr",0, s.mr);
332 CHECK_STRIP_BORDER(tl,x,+1);
333 CHECK_STRIP_BORDER(tl,y,+1);
334 CHECK_STRIP_BORDER(br,x,-1);
335 CHECK_STRIP_BORDER(br,y,-1);
337 debug_rect("s.mr",1, s.mr);
339 Rect updown= {START_MAIN,START_MAIN};
341 updown.br.x += chkw-1;
343 debug_rect("updown",__LINE__,updown);
345 ADJUST_BOX(updown, "+", >=,chkw, s.mr.tl.y, MUST, tl,y,-1);
346 debug_rect("updown",__LINE__,updown);
347 updown.br.y= updown.tl.y;
348 updown.tl.y= updown.tl.y-1;
350 ADJUST_BOX(updown, "+*",>=,chkw, s.mr.tl.y-1, MUST, tl,y,-1);
351 debug_rect("updown",__LINE__,updown);
353 s.commbasey= updown.tl.y + 1;
354 s.comminty= updown.br.y - updown.tl.y;
356 Rect across= {{ s.mr.tl.x - 1, s.commbasey },
357 { s.mr.tl.x, s.commbasey + s.comminty-2 }};
361 #define LIMIT_QUITEQ(cond,mp) { if (!(cond)) break; }
362 debug_rect("across",colno*1000000+__LINE__, across);
363 ADJUST_BOX(across, "+",>=,s.comminty-1,s.mr.br.x,LIMIT_QUITEQ,br,x,+1);
364 debug_rect("across",colno*1000000+__LINE__, across);
366 MUST( colno < MAX_COLUMNS,
367 MI(colno);MR(across);MR(s.mr);MI(s.commbasey); );
368 int colrx= across.br.x-1;
369 if (colrx >= s.mr.br.x) colrx= s.mr.br.x;
370 if (colno < INTERESTING_COLUMNS)
371 s.colrightx[colno]= colrx;
375 if (across.br.x >= s.mr.br.x)
378 REQUIRE_RECTANGLE(across.br.x,s.mr.tl.y, across.br.x,s.mr.br.y, "+");
381 MUST( colno >= MIN_COLUMNS, MI(colno);MR(s.mr);MR(across); );
384 Rect pager= {{ s.mr.br.x, s.mr.br.y - (pagerh-1) },
385 { s.mr.br.x + 1, s.mr.br.y }};
387 debug_rect("pager",__LINE__,pager);
388 ADJUST_BOX(pager, "o",>=,pagerh-2, whole.br.x,MUST, br,x,+1);
389 debug_rect("pager",__LINE__,pager);
391 pager.tl.x= pager.br.x;
392 pager.br.x= pager.br.x + 1;
393 debug_rect("pager",__LINE__,pager);
394 ADJUST_BOX(pager, "o",>=,pagerh-2, whole.br.x,MUST, br,x,+1);
395 debug_rect("pager",__LINE__,pager);
397 ADJUST_BOX(pager, "o",>=,RECT_W(pager)-2, s.mr.tl.y,LIMIT_QUITEQ, tl,y,-1);
398 debug_rect("pager",__LINE__,pager);
400 #define SET_ONCE(var,val) do{ \
402 if ((var)==-1) (var)= v; \
403 else MUST( (var) == v, MSB(#var);MI((var));MI(v);MR(s.mr); ); \
406 SET_ONCE(columns, colno);
407 SET_ONCE(text_h, s.comminty - 1);
410 *pagestruct_r= mmalloc(sizeof(s));
414 if (max_relevant_y_r)
415 SET_ONCE(*max_relevant_y_r, s.mr.br.y + 10);
417 if (commod_focus_point_r) {
418 *commod_focus_point_r= s.mr.tl;
419 commod_focus_point_r->x += 10;
420 commod_focus_point_r->y += s.comminty/3;
422 if (commod_focuslast_point_r) {
423 *commod_focuslast_point_r= s.mr.br;
424 commod_focuslast_point_r->x -= 10;
425 commod_focuslast_point_r->y -= s.comminty/3;
427 if (commod_page_point_r) {
428 commod_page_point_r->x= (pager.tl.x + pager.br.x) / 2;
429 commod_page_point_r->y= pager.tl.y - 1;
432 MUST( text_h <= OCR_MAX_H, MI(text_h) );
/* Checks that the commodity selector of the current page is set to
 * `All'.  A search box, initially 50,39..130,59, has its top and bottom
 * edges adjusted with ADJUST_BOX using '_' (selector dropdown
 * background) pixels and a threshold of 10.  The result is then matched
 * against two pixel templates of the selector, all_small and all_big;
 * if neither matches, the program stops with a fatal error.
 * In the templates, ' ' cells are ignored by commod_selector_matches. */
435 void check_correct_commodities(void) {
436 Rect search= { { 50,39 }, { 130,59 } };
438 ADJUST_BOX(search,"_",>=,10, cim->h, MUST, tl,y,+1);
439 ADJUST_BOX(search,"_",>=,10, 0, MUST, br,y,-1);
441 debug_rect("commodselr",1, search);
443 static const char *all_small[]= {
444 " ___________________________________ ",
445 " ________X____X__X____________________ ",
446 " ________ X___ X_ X_____XXXXXXXXXXX_____ ",
447 "_________X_X__ X_ X______XXXXXXXXX_______",
448 "________ X X__ X_ X_______XXXXXXX________",
449 "________X_ _X_ X_ X________XXXXX_________",
450 "_______ X__ X_ X_ X_________XXX__________",
451 "_______XXXXXXX X_ X__________X___________",
452 " _____ X X X_ X______________________",
453 " ____X_____ _XX_ X______________________",
454 " __ _______ __ ______________________ ",
456 static const char *all_big[]= {
457 "???_______________________________________???",
458 "??_________________________________________??",
459 "?_________X______X___X______________________?",
460 "_________?X_____?X__?X______XXXXXXXXXXX______",
461 "_________X_X____?X__?X_______XXXXXXXXX_______",
462 "________?X?X____?X__?X________XXXXXXX________",
463 "________X_?_X___?X__?X_________XXXXX_________",
464 "_______?X__?X___?X__?X__________XXX__________",
465 "_______?XXXXX___?X__?X___________X___________",
466 "_______X????_X__?X__?X_______________________",
467 "?_____?X____?X__?X__?X_______________________",
468 "??____X_____?_X_?X__?X_______________________",
469 "???__?_______?__?___?_______________________?",
472 #define COMMOD_SELECTOR_MATCHES(all) \
473 commod_selector_matches(search, all, \
474 sizeof((all))/sizeof((all)[0]), \
477 if (!(COMMOD_SELECTOR_MATCHES(all_small) ||
478 COMMOD_SELECTOR_MATCHES(all_big)))
479 fatal("Commodities selector not set to `All'.");
/* Allocates a CanonImage with room for w*h canonical characters after
 * the header, and fills all of those characters with '?'.
 * NOTE(review): w*h is computed in int with no overflow or sign check;
 * confirm that callers only pass sane image dimensions. */
482 CanonImage *alloc_canon_image(int w, int h) {
483 CanonImage *im= mmalloc(sizeof(CanonImage) + w*h);
486 memset(im->d,'?',w*h);
/* Reads one screenshot from f and stores it as the next page.
 * The image header is read with pnm_readpaminit and must describe raw
 * PPM with maxval 255 and one byte per sample.  Pixels are read three
 * bytes at a time inside CANONICALISE_IMAGE and packed as
 * byte0 | byte1<<8 | byte2<<16.  After checking that there is still room
 * (npages < MAX_PAGES) the page is analysed with find_structure and
 * handed to store_current_page.  Any failure is fatal.
 * NOTE(review): the stream error check after the pixel loop tests the
 * global screenshot_file rather than the parameter f; the visible
 * callers pass screenshot_file, so the two coincide there - confirm
 * whether f was intended. */
490 static void file_read_image_ppm(FILE *f) {
492 unsigned char rgb_buf[3];
497 progress("page %d reading ...",npages);
499 pnm_readpaminit(f, &inpam, sizeof(inpam));
500 if (!(inpam.maxval == 255 &&
501 inpam.bytes_per_sample == 1 &&
502 inpam.format == RPPM_FORMAT))
503 fatal("PNM screenshot(s) file must be 8bpp 1 byte-per-sample RGB raw");
505 CANONICALISE_IMAGE(im, inpam.width, inpam.height, ri, {
506 errno=0; int rr= fread_unlocked(&rgb_buf,1,3,f);
508 if (rr!=3) fatal("PNM screenshot(s) file ends unexpectedly");
510 rgb= rgb_buf[0] | (rgb_buf[1] << 8) | (rgb_buf[2] << 16);
513 sysassert(!ferror(screenshot_file));
515 if (!(npages < MAX_PAGES))
516 fatal("Too many images in screenshots file; max is %d.\n", MAX_PAGES);
518 find_structure(im,&pstruct, 0,0,0,0);
519 store_current_page(im,pstruct,ri);
/* Finishes processing of a newly read page and files it as page number
 * npages: runs adjust_colours on it, remembers the RGB image of the
 * first page in page0_rgbimage, and saves the canonical image pointer
 * and a copy of *pstruct in the per-page arrays.
 * Note that the image pointer stored is the file-level `cim', not the
 * parameter `ci'; lines not visible here presumably relate the two
 * (and advance npages) - confirm. */
523 void store_current_page(CanonImage *ci, PageStruct *pstruct, RgbImage *rgb) {
525 progress("page %d unantialiasing...",npages);
526 adjust_colours(ci, rgb);
527 progress("page %d storing ...",npages);
528 if (!npages) page0_rgbimage= rgb;
530 page_images[npages]= cim;
531 page_structs[npages]= *pstruct;
/* Reads a single screenshot image from screenshot_file, with progress
 * messages before and after. */
535 void read_one_screenshot(void) {
536 progress("reading screenshot...");
537 file_read_image_ppm(screenshot_file);
538 progress_log("read screenshot.");
/* Reads screenshot images from screenshot_file one after another with
 * file_read_image_ppm, then logs how many were read.
 * End of input is detected in two ways: for a regular file, by the file
 * position having reached the size reported by fstat; otherwise by
 * reading one character ahead, which is pushed back with ungetc if
 * there is more data (the test between fgetc and ungetc is on a line
 * not visible here). */
541 void read_screenshots(void) {
544 sysassert(! fstat(fileno(screenshot_file), &stab) );
547 if (S_ISREG(stab.st_mode)) {
548 long pos= ftell(screenshot_file);
549 if (pos == stab.st_size) break;
551 int c= fgetc(screenshot_file);
553 ungetc(c, screenshot_file);
555 file_read_image_ppm(screenshot_file);
557 sysassert(!ferror(screenshot_file));
558 progress_log("read %d screenshots.",npages);
561 static double aa_bg_chan[3], aa_scale_chan[3], aa_alpha_mean_max;
562 static Rgb aa_background, aa_foreground;
/* Prepares the file-level aa_* state used by find_aa_density.
 * For each of the three colour channels (byte i of the packed colour)
 * it stores the background level in aa_bg_chan[i] and, in
 * aa_scale_chan[i], the reciprocal of the distance from the background
 * level to the foreground level plus fg_extra.  The largest acceptable
 * mean alpha is 0.999 when fg_extra is nonzero and 1.0 otherwise.
 * The assignments of bg and fg to aa_background and aa_foreground are
 * presumably on lines not visible here.
 * NOTE(review): if a channel's foreground level plus fg_extra equals
 * its background level the divisor is zero; confirm callers never pass
 * such a colour pair. */
564 static void find_aa_density_prep(Rgb bg, Rgb fg, int fg_extra) {
566 unsigned char fg_chan[3];
570 aa_alpha_mean_max= fg_extra ? 0.999 : 1.0;
572 for (i=0; i<3; i++) {
573 aa_bg_chan[i]= (aa_background >> (i*8)) & 0xff;
574 fg_chan[i]= aa_foreground >> (i*8);
575 aa_scale_chan[i]= 1.0 / (fg_chan[i] + fg_extra - aa_bg_chan[i]);
/* Estimates how far the pixel at p in ri lies between the background
 * and foreground colours set up by find_aa_density_prep.
 * Each channel gives its own estimate, (level - background) * scale;
 * the mean of the three is rounded to five decimal places.  Two things
 * are then required (MUST): every channel's estimate is within
 * 1.5/AAMAXVAL of the mean, and the mean lies between 0 and
 * aa_alpha_mean_max.
 * The return statement is not visible here; presumably the mean is
 * returned - confirm. */
579 static inline double find_aa_density(const RgbImage *ri, Point p) {
580 Rgb here= ri_rgb(ri, p.x, p.y);
582 double alpha[3], alpha_total=0;
584 for (i=0; i<3; i++) {
585 unsigned char here_chan= here >> (i*8);
587 double alpha_chan= (here_chan - aa_bg_chan[i]) * aa_scale_chan[i];
588 alpha[i]= alpha_chan;
589 alpha_total += alpha_chan;
592 double alpha_mean= round(alpha_total * (1e5/3.0)) * 1e-5;
594 double thresh= 1.5/AAMAXVAL;
595 double alpha_min= alpha_mean - thresh;
596 double alpha_max= alpha_mean + thresh;
599 MUST( alpha_min <= alpha[i] && alpha[i] <= alpha_max,
601 MRGB(here);MRGB(aa_background);MRGB(aa_foreground);
602 MF(aa_alpha_mean_max);
603 MF(alpha_min); MI(i);MF(alpha[i]);MF(alpha_max) );
605 MUST( 0 <= alpha_mean && alpha_mean <= aa_alpha_mean_max,
607 MRGB(here);MRGB(aa_background);MRGB(aa_foreground);
608 MF(aa_alpha_mean_max);
609 MF(alpha_mean); MF(alpha[0]);MF(alpha[1]);MF(alpha[2]); );
/* Computes the rectangle of the table row `offset' rows above
 * s.commbasey (negative offsets are rows below it); rows are s.comminty
 * pixels apart and comminty-1 pixels high.  If the row does not fit
 * vertically inside s.mr, rr->tl.x is set to -1 and nothing else is
 * done.  Otherwise the pixel line just above the row must be all '+'
 * unless the row is at the very top of s.mr. */
614 static void find_commodity(int offset, Rect *rr) {
615 /* rr->tl.x==-1 if offset out of range */
616 rr->tl.y= s.commbasey - offset*s.comminty;
617 rr->br.y= rr->tl.y + s.comminty-2;
618 if (rr->tl.y < s.mr.tl.y || rr->br.y > s.mr.br.y) { rr->tl.x=-1; return; }
623 if (rr->tl.y > s.mr.tl.y)
624 REQUIRE_RECTANGLE(rr->tl.x,rr->tl.y-1, rr->br.x,rr->tl.y-1, "+");
/* NOTE(review): this tests against s.mr.tl.y.  After the range check
 * above rr->br.y cannot be less than s.mr.tl.y (for positive comminty),
 * so the check of the line below the row looks unreachable; by symmetry
 * with the test above, s.mr.br.y was probably intended - confirm. */
625 if (rr->br.y < s.mr.tl.y)
626 REQUIRE_RECTANGLE(rr->tl.x,rr->br.y+1, rr->br.x,rr->br.y+1, "+");
/* Computes the rectangle of the cell in column colno of the table row
 * `commod'.  The cell has the row's vertical extent.  Its left edge is
 * the row's left edge for column 0, and otherwise two pixels to the
 * right of the previous column's recorded right edge; its right edge is
 * s.colrightx[colno].  The result is also dumped via debug_rect.
 * NOTE(review): s.colrightx has INTERESTING_COLUMNS entries and colno is
 * not checked here; confirm that callers never pass a larger colno. */
629 static void compute_table_location(Rect commod, int colno, Rect *cell) {
630 cell->tl.y= commod.tl.y;
631 cell->br.y= commod.br.y;
632 cell->tl.x= !colno ? commod.tl.x : s.colrightx[colno-1]+2;
633 cell->br.x= s.colrightx[colno];
634 debug_rect("cell", colno, *cell);
/* Runs OCR on the cell r of the current image and writes the recognised
 * text to tsv_output.
 * Each pixel column of the cell, text_h rows deep, is converted to pixel
 * values: a canonical ' ' counts as '0', and every pixel must then be a
 * character from '0' to '0'+AAMAXVAL, whose numeric value is added to
 * that column with pixcol_p_add.  The columns are passed to ocr() with
 * the cell type ct, and the strings of the resulting glyphs are written
 * out in order, up to the entry whose string pointer is null. */
637 static void ocr_rectangle(Rect r, const OcrCellType ct, FILE *tsv_output) {
638 OcrResultGlyph *results, *res;
640 int w= r.br.x - r.tl.x + 1;
643 for (x=0; x<w; x++) {
645 for (y=0; y<text_h; y++) {
646 Point here= { x+r.tl.x, y+r.tl.y };
647 int pixel= get_p(here);
648 if (pixel==' ') pixel= '0';
649 MUST( pixel >= '0' && pixel <= '0'+AAMAXVAL,
650 MC(pixel);MP(here);MSB(ocr_celltype_name(ct));MR(r); );
651 pixcol_p_add(&cols[x], y, pixel-'0');
656 results= ocr(rd,ct,w,cols);
657 for (res=results; res->s; res++)
658 fputs(res->s,tsv_output);
/* FOR_COMMODITY_CELL(ROW_START, CELL, ROW_END): loops over candidate row
 * offsets from +cim->h down to -cim->h, locating each row with
 * find_commodity, and within a row over column numbers 0..columns-1,
 * computing each cell rectangle into `cell' with compute_table_location.
 * `rowr', `cell', `tryrect' and `colno' are the macro's own variables
 * and are available to the argument code.  Where the three arguments
 * are expanded is on lines of the macro not visible here. */
661 #define FOR_COMMODITY_CELL(ROW_START, CELL, ROW_END) do{ \
663 int tryrect, colno; \
665 for (tryrect= +cim->h; tryrect >= -cim->h; tryrect--) { \
666 find_commodity(tryrect, &rowr); \
669 debug_rect("commod",tryrect, rowr); \
673 for (colno=0; colno<columns; colno++) { \
674 compute_table_location(rowr,colno,&cell); \
/* Re-canonicalises one table cell from the RGB image ri into ci so that
 * each pixel becomes a digit character expressing how much foreground
 * it contains (antialiasing density).
 *
 * The background colour is taken from the cell's bottom-right pixel.
 * Channel samples in the cell are then tallied: bg_count for samples
 * equal to the background level, and dark_count / light_count weighted
 * by (difference/4 + 1) for darker / lighter ones.  More than half of
 * all samples must be background.  Foreground is taken to be light
 * (0xffffff) if light_count/16 exceeds dark_count, dark in the converse
 * case, and otherwise the cell is rejected via MUST.  Each pixel's
 * density from find_aa_density is scaled to an integer 0..AAMAXVAL and
 * stored as '0' plus that value.  Finally every pixel of the cell must
 * be a digit.
 *
 * Several branches (an all-background cell, the dark foreground value,
 * fg_extra, the use of `monochrome') are on lines not visible here. */
683 static void adjust_colours_cell(CanonImage *ci, const RgbImage *ri,
684 int colno, Rect cell) {
686 unsigned char chanbg[3];
687 long bg_count=0, light_count=0, dark_count=0;
691 background= ri_rgb(ri, cell.br.x, cell.br.y);
693 chanbg[i]= background >> (i*8);
696 Rgb herergb= ri_rgb(ri, p.x, p.y);
697 if (herergb==background) {
700 for (i=0; i<3; i++) {
701 unsigned char here= herergb >> (i*8);
702 if (here == chanbg[i]) bg_count++;
703 else if (here < chanbg[i]) dark_count += (chanbg[i] - here)/4 + 1;
704 else if (here > chanbg[i]) light_count += (here - chanbg[i])/4 + 1;
708 long total_count= RECT_W(cell) * RECT_H(cell) * 3;
710 MUST( bg_count > total_count / 2,
711 MR(cell);MIL(total_count);MIL(bg_count);
712 MIL(light_count);MIL(dark_count) );
714 if (bg_count == total_count)
720 if (light_count/16 > dark_count) {
721 foreground= 0xffffffU;
723 } else if (dark_count/16 > light_count) {
727 MUST( !"tell light from dark",
728 MR(cell);MIL(total_count);MIL(bg_count);
729 MIL(light_count);MIL(dark_count);MRGB(background); );
732 debugf("TABLEENTRY col=%d %d,%d..%d,%d bg=%ld light=%ld dark=%ld\n",
733 colno, cell.tl.x,cell.tl.y, cell.br.x,cell.br.y,
734 bg_count, light_count, dark_count);
738 find_aa_density_prep(background, foreground, fg_extra);
741 double alpha= find_aa_density(ri,p);
743 int here_int= floor((AAMAXVAL+1)*alpha);
744 assert(here_int <= AAMAXVAL);
745 if (!(here_int==0 || here_int==AAMAXVAL)) monochrome=0;
746 ci->d[p.y * ci->w + p.x]= '0' + here_int;
749 debug_rect("cell0M", colno, cell);
751 require_rectangle_r(cell, "0123456789", __LINE__);
/* Applies adjust_colours_cell to every commodity table cell of the page,
 * using FOR_COMMODITY_CELL to enumerate the cells.  The mf_analyse bit
 * of o_mode is tested first; what happens when it is clear is on a line
 * not visible here (presumably an early return - confirm). */
754 void adjust_colours(CanonImage *ci, const RgbImage *ri) {
755 if (!(o_mode & mf_analyse))
760 FOR_COMMODITY_CELL({},({
761 adjust_colours_cell(ci,ri,colno,cell);
/* Processes each stored page in turn and writes the commodity table to
 * tsv_output.  For each page, check_correct_commodities is called, the
 * OCR reader is set up for the text height text_h, and progress is
 * reported.  The visible output calls write the string `tab' and a
 * newline, and each checks the stream for errors and flushes it; the
 * per-cell loop that drives them (presumably tab-separated cells, one
 * row per line) is on lines not visible here. */
765 void analyse(FILE *tsv_output) {
768 for (page=0; page<npages; page++) {
772 check_correct_commodities();
775 rd= ocr_init(text_h);
777 progress("Processing page %d...",page);
784 fputs(tab, tsv_output);
788 : &ocr_celltype_number,
792 fputs("\n", tsv_output);
793 sysassert(!ferror(tsv_output));
794 sysassert(!fflush(tsv_output));
797 progress("Commodity table scan complete.");
800 //static Rect islandnamer;
802 DEBUG_DEFINE_SOME_DEBUGF(structcolon,colondebugf)
/* Locates the `sunshine' widget in the current image and returns its
 * rectangle.  The horizontal starting extent is fixed relative to the
 * right-hand side of the image (x positions 885..1020 of a 1034-wide
 * layout); the vertical starting extent is set on lines not visible
 * here.  The top and bottom edges are adjusted first using 'o' and '*'
 * pixels, the result must be more than 20 pixels tall, and then the
 * left and right edges are adjusted using 'o' pixels. */
804 Rect find_sunshine_widget(void) {
807 sunshiner.tl.x= cim->w - 1034 + 885;
808 sunshiner.br.x= cim->w - 1034 + 1020;
812 ADJUST_BOX(sunshiner,"o*",>=,30, 100,MUST, tl,y,-1);
813 ADJUST_BOX(sunshiner,"o*",>=,30, 100,MUST, br,y,+1);
814 debug_rect("sunshiner",0, sunshiner);
816 MUST(sunshiner.br.y - sunshiner.tl.y > 20, MR(sunshiner));
819 ADJUST_BOX(sunshiner,"o",>=,20, (cim->w - 1034 + 700), MUST, tl,x,-1);
820 ADJUST_BOX(sunshiner,"o",>=,20, cim->w, MUST, br,x,+1);
821 debug_rect("sunshiner",1, sunshiner);
/*
 * Works out the current archipelago and island names from the first
 * page's RGB image and stores them in the globals `archipelago' and
 * `island'.
 *
 * A working copy `ri' of page0_rgbimage is made, in which each pixel has
 * the low four bits of every channel replaced by a copy of the high
 * four.  The sunshine widget is located and identified with
 * identify_rgbimage; what happens next depends on the text identified:
 *
 *  - a vessel: the island name is sought in a box at fixed position
 *    under the widget, which is shrunk onto the 'o' pixels; pixels of ri
 *    inside it whose lowest byte is below 0x40 are set to 0, and the box
 *    is identified as "island".
 *
 *  - "Land - Ahoy!": the box holding the ahoy output is found by walking
 *    from a point 100 pixels below the top of the widget and then
 *    adjusting its edges.  The text is then scanned column by column
 *    from the right looking for a colon, recognised by a pattern of
 *    pixel runs (debug output from colondebugf); the box is cut off at
 *    the colon's column and identified as "island".
 *
 *  - anything else is a MUST failure.
 *
 * The identified string is expected to have the form
 * "<archipelago> - <island>" and is split at the first " - ".
 */
825 void find_islandname(void) {
826 const RgbImage *rgbsrc= page0_rgbimage;
829 RgbImage *ri= alloc_rgb_image(rgbsrc->w, rgbsrc->h);
830 memcpy(ri->data, rgbsrc->data, ri->w * ri->h * 3);
832 Rect sunshiner= find_sunshine_widget();
833 char sunshine[MAXIMGIDENT], archisland[MAXIMGIDENT];
837 for (srcp= rgbsrc->data, destp=ri->data,
838 endp= ri->data + ri->w * ri->h;
841 Rgb new= *srcp & 0xf0f0f0;
842 *destp= new | (new>>4);
845 identify_rgbimage(ri, sunshiner, sunshine, "sunshine widget");
/* NOTE(review): only the first 5 bytes are compared, so this matches any
 * identification starting "Vesse", although the literal is the 7
 * characters "Vessel " - confirm that the length is intended. */
847 if (!memcmp(sunshine,"Vessel ",5)) {
850 islandnamer.tl.x= cim->w - 1034 + 885;
851 islandnamer.br.x= cim->w - 1034 + 1020;
852 islandnamer.tl.y= 128;
853 islandnamer.br.y= 156;
855 ADJUST_BOX(islandnamer,"o",>=,5, 0, MUST, tl,y,+1);
856 ADJUST_BOX(islandnamer,"o",>=,5, cim->h, MUST, br,y,-1);
858 ADJUST_BOX(islandnamer,"o",>=,1, 0, MUST, tl,x,+1);
859 ADJUST_BOX(islandnamer,"o",>=,1, cim->w, MUST, br,x,-1);
861 debug_rect("islandnamer",0, islandnamer);
862 // int larger_islandnamebry= islandnamer.tl.y + 25;
863 // MUST(islandnamer.br.y < larger_islandnamebry,
864 // MR(islandnamer);MI(larger_islandnamebry));
865 // islandnamer.br.y = larger_islandnamebry;
866 debug_rect("islandnamer",1, islandnamer);
869 for (x=islandnamer.tl.x; x<=islandnamer.br.x; x++)
870 for (y=islandnamer.tl.y; y<=islandnamer.br.y; y++) {
871 if ((ri_rgb(ri,x,y) & 0xff) < 0x40) {
872 *RI_PIXEL32(ri,x,y)= 0;
876 identify_rgbimage(ri, islandnamer, archisland, "island");
877 } else if (!strcmp(sunshine,"Land - Ahoy!")) {
880 islandnamer.tl.x= (sunshiner.tl.x + sunshiner.br.x) / 2;
881 islandnamer.tl.y= sunshiner.tl.y + 100;
882 islandnamer.br= islandnamer.tl;
883 debug_rect("islandnamer",__LINE__, islandnamer);
885 WALK_UNTIL_MUST(islandnamer.tl,y, -1, sunshiner.br.y, 'H');
886 WALK_UNTIL_MUST(islandnamer.tl,x, -1, 0, 'o');
887 WALK_UNTIL_MUST(islandnamer.br,x, +1, cim->w, 'o');
888 debug_rect("islandnamer",__LINE__, islandnamer);
890 #define RW (RECT_W(islandnamer))
891 #define RH (RECT_H(islandnamer))
893 ADJUST_BOX(islandnamer,"O",>=,RW-4, cim->h, MUST,br,y,+1);
894 debug_rect("islandnamer",__LINE__, islandnamer);
896 islandnamer.br.y += 2;
898 ADJUST_BOX(islandnamer,"*",<,RW, cim->h, MUST,br,y,+1);
899 debug_rect("islandnamer",__LINE__, islandnamer);
901 islandnamer.tl.y= islandnamer.br.y-1;
902 islandnamer.br.y= islandnamer.br.y+1;
903 debug_rect("islandnamer",__LINE__, islandnamer);
905 ADJUST_BOX(islandnamer,"*",>=,RW, cim->h, MUST,br,y,+1);
906 debug_rect("islandnamer",__LINE__, islandnamer);
908 ADJUST_BOX(islandnamer,"*",<, RH, cim->w, MUST,tl,x,+1);
909 debug_rect("islandnamer",__LINE__, islandnamer);
911 MUST( RECT_H(islandnamer) <= 30, MR(islandnamer));
914 int nspaces=1, might_be_colon=0;
915 uint32_t colon_pattern= 0;
918 for (p.x=islandnamer.br.x; p.x>islandnamer.tl.x; p.x--) {
919 colondebugf("structcolon: x=%4d nsp=%2d mbc=%d cp=%08"PRIx32" ",
920 p.x, nspaces, might_be_colon, colon_pattern);
923 int runs[32], nruns=0;
924 runs[0]=0; runs[1]=0;
926 find_aa_density_prep(0xCCCCAA,0x002255,0);
928 for (p.y=islandnamer.tl.y; p.y<=islandnamer.br.y; p.y++) {
930 double alpha= find_aa_density(ri,p);
942 colondebugf(" pat=%08"PRIx32" nruns=%d runs[]={%d,%d..} ",
943 pattern, nruns, runs[0],runs[1]);
947 /* omg it _is_ a colon */
952 if (nruns==2 && runs[1]==runs[0]) {
954 if (pattern==colon_pattern)
955 goto ok_might_be_colon;
956 } else if (nspaces>=2) {
957 colon_pattern= pattern;
959 goto ok_might_be_colon;
961 } else if (nruns==1 && runs[0]==1 && might_be_colon) {
968 colondebugf(" nsp=%2d mbc=%d\n", nspaces, might_be_colon);
970 MUST(!"colon found", MP(p);MR(islandnamer) );
973 colondebugf(" found\n");
974 islandnamer.br.x= p.x;
976 identify_rgbimage(ri, islandnamer, archisland, "island");
979 MUST(!"sunshine shows ship or ahoy", MS(sunshine) );
983 char *delim= strstr(archisland," - ");
985 archipelago= masprintf("%.*s", (int)(delim-archisland), archisland);
986 island= masprintf("%s", delim+3);