2 * Parsing of the structure of the YPP client's displayed image
5 * This is part of ypp-sc-tools, a set of third-party tools for assisting
6 * players of Yohoho Puzzle Pirates.
8 * Copyright (C) 2009 Ian Jackson <ijackson@chiark.greenend.org.uk>
10 * This program is free software: you can redistribute it and/or modify
11 * it under the terms of the GNU General Public License as published by
12 * the Free Software Foundation, either version 3 of the License, or
13 * (at your option) any later version.
15 * This program is distributed in the hope that it will be useful,
16 * but WITHOUT ANY WARRANTY; without even the implied warranty of
17 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
18 * GNU General Public License for more details.
20 * You should have received a copy of the GNU General Public License
21 * along with this program. If not, see <http://www.gnu.org/licenses/>.
23 * Yohoho and Puzzle Pirates are probably trademarks of Three Rings and
24 * are used without permission. This program is not endorsed or
25 * sponsored by Three Rings.
28 #include "structure.h"
30 DEBUG_DEFINE_DEBUGF(struct)
/* Seed pixel for find_structure(): used there to initialise mainr_tl and
 * both corners of the `updown' probe rectangle. */
32 #define START_MAIN {200,200}
/* Length of the colrightx[] array; find_structure() records a column's
 * right-hand x only for column indices below this value. */
34 #define INTERESTING_COLUMNS 7
/* NOTE(review): no use of TEXT_COLUMNS is visible in this part of the
 * file; presumably the number of leading text columns - confirm. */
35 #define TEXT_COLUMNS 2
40 int commbasey, comminty;
41 int colrightx[INTERESTING_COLUMNS];
44 const CanonImage *page_images[MAX_PAGES];
45 static PageStruct page_structs[MAX_PAGES];
46 const RgbImage *page0_rgbimage;
49 static int text_h=-1, columns=-1;
53 static const CanonImage *cim;
56 char *archipelago, *island;
58 #define OTHERCOORD_x y
59 #define OTHERCOORD_y x
/* Makes `page' the current page: cim is pointed at page_images[page] and
 * page_structs[page] is copied into s.  `page' is not range-checked in
 * the lines visible here. */
62 void select_page(int page) {
63 cim= page_images[page];
64 s= page_structs[page];
70 Rgb rgbx; /* on screen, REVERSED BYTES ie r||g||b */
71 char c; /* canonical */
74 const CanonColourInfo canoncolourinfo_table[]= {
75 { 0x475A5E, '*' }, /* edge */
76 { 0x2C5F7A, '*' }, /* edge just under box heading shadow */
77 { 0xC5C7AE, '*' }, /* blank area of partial commodities list */
78 { 0x6B828C, '*' }, /* background of ship status meter area */
79 { 0x934405, '*' }, /* border of ship meter area */
80 { 0x7D9094, '+' }, /* interbox */
81 { 0x022158, 'O' }, /* ahoy /w output foreground */
82 { 0xB5B686, 'H' }, /* ahoy /w output heading background */
84 { 0xBDC5BF, ' ' }, /* background - pale Sugar cane, etc. */
85 { 0xADB5AF, ' ' }, /* background - dark */
86 { 0xC7E1C3, ' ' }, /* background - pale Swill, etc. */
87 { 0xB5CFB1, ' ' }, /* background - dark */
88 { 0xD6CEB0, ' ' }, /* background - pale Madder, etc. */
89 { 0xC8C0A2, ' ' }, /* background - dark */
90 { 0xE0E1D3, ' ' }, /* background - pale Lorandite, etc. */
91 { 0xD0D1C3, ' ' }, /* background - dark */
92 { 0xE5E6C1, ' ' }, /* background - pale Cloth */
93 { 0xD7D8B3, ' ' }, /* background - dark */
94 { 0xEDDED9, ' ' }, /* background - pale Dye */
95 { 0xDACBC6, ' ' }, /* background - dark */
96 { 0xD3DEDF, ' ' }, /* background - pale Paint */
97 { 0xC5D0D1, ' ' }, /* background - dark */
98 { 0xDCD1CF, ' ' }, /* background - pale Enamel */
99 { 0xCEC3C1, ' ' }, /* background - dark */
100 { 0xF3F6F5, ' ' }, /* background - pale fruit */
101 { 0xE2E7E5, ' ' }, /* background - dark */
103 { 0x000000, 'o' }, /* foreground */
104 { 0xD4B356, ' ' }, /* background (cursor) */
105 { 0xFFFFFF, 'o' }, /* foreground (cursor) */
107 { 0x5B93BF, '_' }, /* selector dropdown background */
108 { 0xD7C94F, 'X' }, /* selector dropdown foreground */
112 CanonColourInfoReds canoncolourinfo_tree;
/* Loads canoncolourinfo_table into canoncolourinfo_tree, a lookup indexed
 * first by the r byte, then the g byte, then the b byte of a colour; the
 * leaf holds that colour's canonical character.  The table walk stops at
 * the first entry whose c is 0. */
114 void canon_colour_prepare(void) {
115 const CanonColourInfo *cci;
116 for (cci=canoncolourinfo_table; cci->c; cci++) {
/* Unpack rgbx: bits 16..23, 8..15 and 0..7 respectively. */
117 unsigned char r= cci->rgbx >> 16;
118 unsigned char g= cci->rgbx >> 8;
119 unsigned char b= cci->rgbx;
121 CanonColourInfoGreens *greens= canoncolourinfo_tree.red2[r];
/* NOTE(review): presumably allocated only when no table exists yet for
 * this r value - the guarding test is not visible here. */
123 greens= canoncolourinfo_tree.red2[r]= mmalloc(sizeof(*greens));
127 CanonColourInfoBlues *blues= greens->green2[g];
129 blues= greens->green2[g]= mmalloc(sizeof(*blues));
/* A new blue table starts out filled with '?' bytes. */
130 memset(blues, '?', sizeof(*blues));
133 blues->blue2[b]= cci->c;
/* Returns the character stored for pixel (x,y) of the current image cim;
 * cim->d is indexed as y*cim->w + x.  No bounds checking is done. */
137 static inline char get(int x, int y) { return cim->d[y * cim->w + x]; }
/* As get(), taking the coordinates as a Point. */
138 static inline char get_p(Point p) { return get(p.x,p.y); }
/* First part of a MUST() failure report.  MUST() calls this with __FILE__,
 * __LINE__ and the stringified condition; the message text visible here
 * tells the user what to check and identifies the failed requirement by
 * file and line. */
141 static void mustfail1(const char *file, int line, const char *what) {
144 "Unable to figure out contents of YPP client display.\n"
145 "Please check the following:\n"
146 " * YPP client is showing commodity listing screen\n"
147 " * YPP client window is on top (we try to raise it but your window\n"
148 " manager might have prevented that from succeeding)\n"
150 "If all of these are true, please report this as a fault.\n\n"
152 " %s:%d: requirement failed:\n"
/* Final part of a failure report: prints "Giving up." to stderr.  Declared
 * NORET; NOTE(review): the call that actually terminates the program is
 * not visible in this excerpt. */
156 static void mustfail2(void) NORET;
157 static void mustfail2(void) {
158 fprintf(stderr, "\n\nGiving up.\n");
/* MUST(x, ifnot): requirement check.  When x is false, mustfail1() is
 * called with the source file, line and the text of x.  __builtin_expect
 * marks the failure branch as unlikely.  NOTE(review): the rest of the
 * expansion, including how `ifnot' is used, is not visible here; callers
 * pass M*() diagnostic printers as `ifnot'. */
162 #define MUST(x, ifnot) do{ \
163 if (__builtin_expect(!(x), 0)) { \
164 mustfail1(__FILE__,__LINE__,#x); \
/* Diagnostic printers, used as the `ifnot' argument of MUST().  Each
 * writes " name=value" to stderr, where name is the text of the argument
 * expression (MSB prints only the value, as a string).
 *   MP   Point (x,y)          MI   int
 *   MIL  long                 MRGB 32-bit value as 6 hex digits
 *   MC   char                 MS   string, in double quotes
 *   MF   double               MSB  bare string, no name
 *   MR   Rect as tl.x,tl.y..br.x,br.y */
170 #define MP(v) fprintf(stderr," %s=%d,%d",#v,(v).x,(v).y)
171 #define MI(v) fprintf(stderr," %s=%d", #v,(v))
172 #define MIL(v) fprintf(stderr," %s=%ld", #v,(v))
173 #define MRGB(v) fprintf(stderr," %s=%06"PRIx32, #v,(v))
174 #define MC(v) fprintf(stderr," %s='%c'", #v,(v))
175 #define MS(v) fprintf(stderr," %s=\"%s\"", #v,(v))
176 #define MF(v) fprintf(stderr," %s=%f", #v,(v))
177 #define MSB(v) fprintf(stderr," %s", (v))
178 #define MR(v) fprintf(stderr," %s=%d,%d..%d,%d",\
179 #v,(v).tl.x,(v).tl.y,(v).br.x,(v).br.y)
/* Calls require_rectangle() with the caller's line number appended.
 * NOTE(review): the expansion already ends in `;', so the usual
 * `REQUIRE_RECTANGLE(...);' yields an extra empty statement; that would
 * break an `if (...) REQUIRE_RECTANGLE(...); else ...' construct. */
182 #define REQUIRE_RECTANGLE(tlx,tly,brx,bry,ok) \
183 require_rectangle(tlx, tly, brx, bry, ok, __LINE__);
/* Loop header visiting every point p of rectangle rr, both corners
 * inclusive: x in the outer loop, y in the inner loop.  The statement
 * following the macro is the loop body. */
185 #define FOR_P_RECT(p,rr) \
186 for ((p).x=(rr).tl.x; (p).x<=(rr).br.x; (p).x++) \
187 for ((p).y=(rr).tl.y; (p).y<=(rr).br.y; (p).y++)
/* Requires (via MUST) that the character c occurs in the string `ok'; on
 * failure the report includes lineno, rr, the point p and ok.
 * NOTE(review): the declarations of p and c and the loop around the check
 * are not visible here; presumably c is the pixel at each point p of rr. */
189 static void require_rectangle_r(Rect rr, const char *ok, int lineno) {
193 MUST( strchr(ok,c), ({
194 MI(lineno),MR(rr);MP(p);MS(ok);
/* Convenience form of require_rectangle_r(): builds the Rect from its
 * top-left (tlx,tly) and bottom-right (brx,bry) corners and passes ok and
 * lineno through unchanged. */
198 static void require_rectangle(int tlx, int tly, int brx, int bry,
199 const char *ok, int lineno) {
200 Rect rr= {{tlx,tly},{brx,bry}};
201 require_rectangle_r(rr, ok, lineno);
/* Dumps the part of the current image cim covered by rr to the `debug'
 * stream; does nothing unless DEBUGP(rect) is true.  `what' and `whati'
 * label the dump. */
204 static void debug_rect(const char *what, int whati, Rect rr) {
205 if (!DEBUGP(rect)) return;
/* Heading: label, number and the rectangle's corners. */
207 fprintf(debug, "%s %d: %d,%d..%d,%d:\n", what, whati,
208 rr.tl.x,rr.tl.y, rr.br.x,rr.br.y);
209 w= rr.br.x - rr.tl.x + 1;
210 for (y=rr.tl.y; y<=rr.br.y; y++) {
/* Row prefix: y in a 4-wide field, then rr.tl.x spaces of padding, so the
 * row's characters are indented by their x position; then '|'. */
211 fprintf(debug, "%4d%*s|", y, rr.tl.x,"");
/* The w characters of row y, starting at column rr.tl.x. */
212 fwrite(cim->d + y*cim->w + rr.tl.x, 1, w, debug);
/* Slides the pattern `all' (allh rows of allw characters) over candidate
 * offsets and compares it with the current image.  Pattern characters
 * that are ' ' are ignored.  NOTE(review): the good/bad accounting and the
 * return value are not visible in this excerpt; the caller treats a
 * nonzero result as "pattern found". */
219 static int commod_selector_matches(Rect search, const char *const *all,
220 int allh, int allw) {
221 int alloffy, alloffx;
/* Vertical offsets start at 0, not search.tl.y; offsets whose last
 * pattern row would lie above search.tl.y are skipped. */
222 for (alloffy=0; alloffy < search.br.y; alloffy++) {
223 if (alloffy+allh-1 < search.tl.y) continue;
/* Horizontal offsets keep the whole pattern width within search. */
224 for (alloffx=search.tl.x; alloffx+allw-1 <= search.br.x; alloffx++) {
227 for (x=0; x<allw; x++)
228 for (y=0; y<allh; y++) {
230 if (want==' ') continue;
231 if (get(alloffx+x, alloffy+y) == want)
236 debugf("CHECKCOMMOD alloff=%d,%d good=%d bad=%d\n",
237 alloffx,alloffy, good,bad);
/* WALK_UNTIL(point,coord,increm,last,edge): step point.coord by increm
 * until the pixel at point equals `edge', then step back once so that
 * point is the last pixel before the edge.  If coord reaches last+increm
 * first, the walk stops there instead.  NOTE(review): the enclosing loop
 * construct is not visible in this excerpt. */
245 #define WALK_UNTIL(point,coord,increm,last,edge) \
247 if ((point).coord == (last)+(increm)) break; \
248 if (get_p((point)) == (edge)) { (point).coord -= (increm); break; } \
249 (point).coord += (increm); \
/* As WALK_UNTIL, but running off the end (coord == last+increm) is a
 * MUST() failure; the report prints point, increm, last and edge. */
252 #define WALK_UNTIL_MUST(point,coord,increm,last,edge) \
254 WALK_UNTIL(point,coord,increm,last,edge); \
255 MUST( (point).coord != (last)+(increm), \
256 MP(point); MI(increm); MI(last); MC(edge); \
/* ADJUST_BOX(search,insidechrs,OP,want, lim,LIMIT_MUST, TLBR,XY,increm):
 * moves one edge of `search' (the TLBR corner's XY coordinate) in steps of
 * increm.  At each step it counts, along the line XY == search.TLBR.XY
 * from search.tl to search.br in the other coordinate, how many pixels are
 * characters in insidechrs, and tests `got OP want'; otherwise the edge
 * moves on by increm.  NOTE(review): what happens when the test succeeds
 * is not visible here - presumably the loop ends.
 * Before each step LIMIT_MUST (MUST, or a quiet variant) checks that the
 * box has not collapsed (tl.XY != br.XY) and that the edge has not reached
 * `lim'.  OTHERCOORD_x / OTHERCOORD_y select the other coordinate. */
260 #define ADJUST_BOX(search,insidechrs,OP,want, lim,LIMIT_MUST, TLBR,XY,increm) \
262 LIMIT_MUST( (search).tl.XY != (search).br.XY && \
263 (search).TLBR.XY != (lim), \
264 MR((search));MSB(#TLBR);MSB(#XY) ); \
266 Point p=(search).tl; \
267 for (p.XY=(search).TLBR.XY; \
268 p.OTHERCOORD_##XY <= (search).br.OTHERCOORD_##XY; \
269 p.OTHERCOORD_##XY++) \
270 got += !!strchr(insidechrs, get_p(p)); \
271 if ((got) OP (want)) \
273 (search).TLBR.XY += increm; \
/* Locates the commodity table in the canonicalised screenshot and records
 * its geometry in s: the main rectangle s.mr, the row baseline/pitch
 * (s.commbasey, s.comminty) and the right edge of each column
 * (s.colrightx[]).  Any layout that does not match is a MUST() failure.
 *
 * Outputs:
 *   *pagestruct_r             receives a buffer of sizeof(s) from mmalloc
 *   *max_relevant_y_r         if non-null: s.mr.br.y + 10, via SET_ONCE
 *   *commod_focus_point_r     if non-null: s.mr.tl moved 10 right and
 *                             comminty/3 down
 *   *commod_focuslast_point_r if non-null: s.mr.br moved 10 left and
 *                             comminty/3 up
 *   *commod_page_point_r      if non-null: horizontal middle of the pager
 *                             box, one pixel above its top
 * NOTE(review): how `im' becomes the current image cim, and how s is
 * copied into *pagestruct_r, is not visible in this excerpt. */
276 void find_structure(const CanonImage *im,
277 PageStruct **pagestruct_r,
278 int *max_relevant_y_r,
279 Point *commod_focus_point_r,
280 Point *commod_page_point_r,
281 Point *commod_focuslast_point_r) {
285 Rect whole = { {0,0}, {cim->w-1,cim->h-1} };
/* Debug ruler: for units 1, 10, 100, 1000 prints, at each x that is a
 * multiple of the unit, the corresponding decimal digit of x. */
289 for (y=0, xscaleunit=1; y<4; y++, xscaleunit*=10) {
291 for (x=0; x<=cim->w; x++) {
292 if (x % xscaleunit) fputc(' ',debug);
293 else fprintf(debug,"%d",(x / xscaleunit)%10);
299 Point mainr_tl= START_MAIN;
/* Walk outwards to the edges of the main rectangle; running into the
 * edge of the image first is fatal. */
301 WALK_UNTIL_MUST(s.mr.tl, y,-1, whole.tl.y, ' ');
304 WALK_UNTIL_MUST(s.mr.tl, x,-1, whole.tl.x, '*');
305 WALK_UNTIL_MUST(s.mr.tl, y,-1, whole.tl.y, '*');
306 WALK_UNTIL_MUST(s.mr.br, x,+1, whole.br.x, '*');
307 WALK_UNTIL_MUST(s.mr.br, y,+1, whole.br.y, '*');
/* The one-pixel frame just outside s.mr must consist entirely of '*'. */
309 REQUIRE_RECTANGLE(s.mr.tl.x-1, s.mr.tl.y, s.mr.tl.x-1, s.mr.br.y, "*");
310 REQUIRE_RECTANGLE(s.mr.br.x+1, s.mr.tl.y, s.mr.br.x+1, s.mr.br.y, "*");
311 REQUIRE_RECTANGLE(s.mr.tl.x, s.mr.tl.y-1, s.mr.br.x, s.mr.tl.y-1, "*");
312 REQUIRE_RECTANGLE(s.mr.tl.x, s.mr.br.y+1, s.mr.br.x, s.mr.br.y+1, "*");
314 #define CHECK_STRIP_BORDER(tlbr,xy,increm) \
319 csb_p.x++; csb_p.y++; \
320 csb_p.xy= s.mr.tlbr.xy; \
321 if (get_p(csb_p)=='+') { \
323 csb_r.tl.xy= csb_p.xy; \
324 csb_r.br.xy= csb_p.xy; \
325 require_rectangle_r(csb_r, "+", __LINE__); \
326 s.mr.tlbr.xy += increm; \
330 debug_rect("s.mr",0, s.mr);
/* For each side: if the outermost line of s.mr is '+', require the whole
 * line to be '+' and shrink s.mr by one pixel on that side. */
332 CHECK_STRIP_BORDER(tl,x,+1);
333 CHECK_STRIP_BORDER(tl,y,+1);
334 CHECK_STRIP_BORDER(br,x,-1);
335 CHECK_STRIP_BORDER(br,y,-1);
337 debug_rect("s.mr",1, s.mr);
/* `updown' probe, chkw pixels wide, starting at START_MAIN: its top edge
 * is moved upwards twice to find two successive horizontal lines. */
339 Rect updown= {START_MAIN,START_MAIN};
341 updown.br.x += chkw-1;
343 debug_rect("updown",__LINE__,updown);
345 ADJUST_BOX(updown, "+", >=,chkw, s.mr.tl.y, MUST, tl,y,-1);
346 debug_rect("updown",__LINE__,updown);
347 updown.br.y= updown.tl.y;
348 updown.tl.y= updown.tl.y-1;
350 ADJUST_BOX(updown, "+*",>=,chkw, s.mr.tl.y-1, MUST, tl,y,-1);
351 debug_rect("updown",__LINE__,updown);
/* Row geometry: comminty is the distance between the two lines found,
 * commbasey the first pixel row below the upper one. */
353 s.commbasey= updown.tl.y + 1;
354 s.comminty= updown.br.y - updown.tl.y;
/* `across' probe, one row interior high: its right edge is moved
 * rightwards to find the vertical '+' lines separating columns. */
356 Rect across= {{ s.mr.tl.x - 1, s.commbasey },
357 { s.mr.tl.x, s.commbasey + s.comminty-2 }};
361 #define LIMIT_QUITEQ(cond,mp) { if (!(cond)) break; }
362 debug_rect("across",colno*1000000+__LINE__, across);
363 ADJUST_BOX(across, "+",>=,s.comminty-1,s.mr.br.x,LIMIT_QUITEQ,br,x,+1);
364 debug_rect("across",colno*1000000+__LINE__, across);
366 MUST( colno < MAX_COLUMNS,
367 MI(colno);MR(across);MR(s.mr);MI(s.commbasey); );
/* The column's right edge is the pixel left of the separator, clamped to
 * s.mr.br.x; it is recorded only for the first INTERESTING_COLUMNS. */
368 int colrx= across.br.x-1;
369 if (colrx >= s.mr.br.x) colrx= s.mr.br.x;
370 if (colno < INTERESTING_COLUMNS)
371 s.colrightx[colno]= colrx;
375 if (across.br.x >= s.mr.br.x)
378 REQUIRE_RECTANGLE(across.br.x,s.mr.tl.y, across.br.x,s.mr.br.y, "+");
381 MUST( colno >= MIN_COLUMNS, MI(colno);MR(s.mr);MR(across); );
/* `pager' probe: starts at the bottom-right corner of s.mr, pagerh pixels
 * high, and is moved right and then up using 'o' pixels. */
384 Rect pager= {{ s.mr.br.x, s.mr.br.y - (pagerh-1) },
385 { s.mr.br.x + 1, s.mr.br.y }};
387 debug_rect("pager",__LINE__,pager);
388 ADJUST_BOX(pager, "o",>=,pagerh-2, whole.br.x,MUST, br,x,+1);
389 debug_rect("pager",__LINE__,pager);
391 pager.tl.x= pager.br.x;
392 pager.br.x= pager.br.x + 1;
393 debug_rect("pager",__LINE__,pager);
394 ADJUST_BOX(pager, "o",>=,pagerh-2, whole.br.x,MUST, br,x,+1);
395 debug_rect("pager",__LINE__,pager);
397 ADJUST_BOX(pager, "o",>=,RECT_W(pager)-2, s.mr.tl.y,LIMIT_QUITEQ, tl,y,-1);
398 debug_rect("pager",__LINE__,pager);
400 #define SET_ONCE(var,val) do{ \
402 if ((var)==-1) (var)= v; \
403 else MUST( (var) == v, MSB(#var);MI((var));MI(v);MR(s.mr); ); \
/* columns and text_h are file-wide: set on first use (while still -1) and
 * required to have the same value on every later call. */
406 SET_ONCE(columns, colno);
407 SET_ONCE(text_h, s.comminty - 1);
410 *pagestruct_r= mmalloc(sizeof(s));
414 if (max_relevant_y_r)
415 SET_ONCE(*max_relevant_y_r, s.mr.br.y + 10);
417 if (commod_focus_point_r) {
418 *commod_focus_point_r= s.mr.tl;
419 commod_focus_point_r->x += 10;
420 commod_focus_point_r->y += s.comminty/3;
422 if (commod_focuslast_point_r) {
423 *commod_focuslast_point_r= s.mr.br;
424 commod_focuslast_point_r->x -= 10;
425 commod_focuslast_point_r->y -= s.comminty/3;
427 if (commod_page_point_r) {
428 commod_page_point_r->x= (pager.tl.x + pager.br.x) / 2;
429 commod_page_point_r->y= pager.tl.y - 1;
432 MUST( text_h <= OCR_MAX_H, MI(text_h) );
/* Checks that the commodity selector dropdown on the current page shows
 * `All': one of two reference bitmaps (all_small, all_big) must be found
 * in the search area by commod_selector_matches(); otherwise fatal() is
 * called. */
435 void check_correct_commodities(void) {
436 Rect search= { { 50,39 }, { 130,59 } };
/* Move the top edge down and the bottom edge up until each lies on a row
 * containing at least 10 '_' pixels. */
438 ADJUST_BOX(search,"_",>=,10, cim->h, MUST, tl,y,+1);
439 ADJUST_BOX(search,"_",>=,10, 0, MUST, br,y,-1);
441 debug_rect("commodselr",1, search);
/* Reference bitmaps, one string per pixel row.  Pattern characters that
 * are ' ' are ignored by commod_selector_matches(). */
443 static const char *all_small[]= {
444 " ___________________________________ ",
445 " ________X____X__X____________________ ",
446 " ________ X___ X_ X_____XXXXXXXXXXX_____ ",
447 "_________X_X__ X_ X______XXXXXXXXX_______",
448 "________ X X__ X_ X_______XXXXXXX________",
449 "________X_ _X_ X_ X________XXXXX_________",
450 "_______ X__ X_ X_ X_________XXX__________",
451 "_______XXXXXXX X_ X__________X___________",
452 " _____ X X X_ X______________________",
453 " ____X_____ _XX_ X______________________",
454 " __ _______ __ ______________________ ",
456 static const char *all_big[]= {
457 "???_______________________________________???",
458 "??_________________________________________??",
459 "?_________X______X___X______________________?",
460 "_________?X_____?X__?X______XXXXXXXXXXX______",
461 "_________X_X____?X__?X_______XXXXXXXXX_______",
462 "________?X?X____?X__?X________XXXXXXX________",
463 "________X_?_X___?X__?X_________XXXXX_________",
464 "_______?X__?X___?X__?X__________XXX__________",
465 "_______?XXXXX___?X__?X___________X___________",
466 "_______X????_X__?X__?X_______________________",
467 "?_____?X____?X__?X__?X_______________________",
468 "??____X_____?_X_?X__?X_______________________",
469 "???__?_______?__?___?_______________________?",
472 #define COMMOD_SELECTOR_MATCHES(all) \
473 commod_selector_matches(search, all, \
474 sizeof((all))/sizeof((all)[0]), \
477 if (!(COMMOD_SELECTOR_MATCHES(all_small) ||
478 COMMOD_SELECTOR_MATCHES(all_big)))
479 fatal("Commodities selector not set to `All'.");
/* Allocates a CanonImage with room for w*h pixel characters after the
 * header and fills the pixel area d with '?'.
 * NOTE(review): w*h is computed in int, with no overflow check visible;
 * the initialisation of the other fields is not visible here. */
482 CanonImage *alloc_canon_image(int w, int h) {
483 CanonImage *im= mmalloc(sizeof(CanonImage) + w*h);
486 memset(im->d,'?',w*h);
/* Reads one raw PPM image from f, canonicalises it, runs find_structure()
 * on the result and stores it as the next page via store_current_page().
 * Only 8-bit, one-byte-per-sample raw RGB input is accepted; anything
 * else, a short read, or more than MAX_PAGES images is fatal. */
490 static void file_read_image_ppm(FILE *f) {
492 unsigned char rgb_buf[3];
497 progress("page %d reading ...",npages);
499 pnm_readpaminit(f, &inpam, sizeof(inpam));
500 if (!(inpam.maxval == 255 &&
501 inpam.bytes_per_sample == 1 &&
502 inpam.format == RPPM_FORMAT))
503 fatal("PNM screenshot(s) file must be 8bpp 1 byte-per-sample RGB raw");
505 CANONICALISE_IMAGE(im, inpam.width, inpam.height, ri, {
/* One pixel = three bytes read from f. */
506 errno=0; int rr= fread_unlocked(&rgb_buf,1,3,f);
508 if (rr!=3) fatal("PNM screenshot(s) file ends unexpectedly");
/* Pack with the first byte read in the low-order bits. */
510 rgb= rgb_buf[0] | (rgb_buf[1] << 8) | (rgb_buf[2] << 16);
/* NOTE(review): checks the global screenshot_file, not the parameter f;
 * both callers visible in this file pass screenshot_file. */
513 sysassert(!ferror(screenshot_file));
515 if (!(npages < MAX_PAGES))
516 fatal("Too many images in screenshots file; max is %d.\n", MAX_PAGES);
518 find_structure(im,&pstruct, 0,0,0,0);
519 store_current_page(im,pstruct,ri);
/* Post-processes the page just read with adjust_colours() and records it
 * in slot npages of page_images[] / page_structs[].  The RGB image of the
 * first page (npages==0) is kept in page0_rgbimage. */
523 void store_current_page(CanonImage *ci, PageStruct *pstruct, RgbImage *rgb) {
525 progress("page %d unantialiasing...",npages);
526 adjust_colours(ci, rgb);
527 progress("page %d storing ...",npages);
528 if (!npages) page0_rgbimage= rgb;
/* NOTE(review): stores the file-level cim, not the parameter ci; this
 * relies on the two being the same image - confirm. */
530 page_images[npages]= cim;
531 page_structs[npages]= *pstruct;
/* Reads a single image from screenshot_file with file_read_image_ppm(),
 * reporting progress before and after. */
535 void read_one_screenshot(void) {
536 progress("reading screenshot...");
537 file_read_image_ppm(screenshot_file);
538 progress_log("read screenshot.");
/* Reads images from screenshot_file, one file_read_image_ppm() call per
 * image, then logs how many were read.  NOTE(review): the loop construct
 * and the handling of the peeked character are not visible here. */
541 void read_screenshots(void) {
544 sysassert(! fstat(fileno(screenshot_file), &stab) );
/* Regular file: finished once the read position equals the file size. */
547 if (S_ISREG(stab.st_mode)) {
548 long pos= ftell(screenshot_file);
549 if (pos == stab.st_size) break;
/* Otherwise one character is read and pushed back before the next image
 * is parsed. */
551 int c= fgetc(screenshot_file);
553 ungetc(c, screenshot_file);
555 file_read_image_ppm(screenshot_file);
557 sysassert(!ferror(screenshot_file));
558 progress_log("read %d screenshots.",npages);
/* Fixed-point arithmetic with FIXPT_SHIFT fractional bits, so 1.0 is
 * int2fixpt(1) == 1<<15.  NOTE(review): the Fixpt typedef is not visible
 * here; MFP below formats it with %lx, which assumes a long-sized type. */
561 #define FIXPT_SHIFT 15
/* Integer -> fixed point. */
564 static inline Fixpt int2fixpt(int x) { return x<<FIXPT_SHIFT; }
/* Double -> fixed point (conversion truncates). */
565 static inline Fixpt dbl2fixpt(double x) { return x * int2fixpt(1); }
/* Fixed point -> double. */
566 static inline double fixpt2dbl(Fixpt x) { return x / (1.0*int2fixpt(1)); }
/* Fixed-point product: one half is added before dividing by 1.0 so that
 * the result is rounded rather than truncated. */
567 static inline Fixpt fixpt_mul(Fixpt a, Fixpt b) {
568 return (a*b + dbl2fixpt(0.5)) / int2fixpt(1);
/* Diagnostic printer for a Fixpt, for use with MUST(): prints
 * " name=<hex>=<value as double>" to stderr. */
570 #define MFP(v) fprintf(stderr," %s=%lx=%f", #v,(v),fixpt2dbl((v)))
572 static Fixpt aa_bg_chan[3], aa_scale_chan[3], aa_alpha_mean_max;
573 static Rgb aa_background, aa_foreground;
/* Precomputes the per-channel constants used by find_aa_density() for a
 * given background/foreground colour pair.  NOTE(review): the assignment
 * of bg/fg to aa_background/aa_foreground is not visible here. */
575 static void find_aa_density_prep(Rgb bg, Rgb fg, int fg_extra) {
577 unsigned char fg_chan[3];
/* Largest permitted mean alpha: exactly 1.0, or one fixed-point unit less
 * when fg_extra is nonzero. */
581 aa_alpha_mean_max= fg_extra ? int2fixpt(1)-1 : int2fixpt(1);
583 for (i=0; i<3; i++) {
584 aa_bg_chan[i]= int2fixpt( (aa_background >> (i*8)) & 0xff );
585 fg_chan[i]= aa_foreground >> (i*8);
/* Scale = fixed-point reciprocal of (foreground + fg_extra - background)
 * for this channel.  NOTE(review): if that difference is zero this
 * divides by zero in floating point - confirm callers never pass equal
 * channels with fg_extra==0. */
587 aa_scale_chan[i]= 1.0 / (int2fixpt(fg_chan[i]) + fg_extra - aa_bg_chan[i])
588 * dbl2fixpt(1) * dbl2fixpt(1);
/* Estimates how much foreground the pixel p of ri contains, as a Fixpt in
 * the range 0 .. aa_alpha_mean_max, using the colours set up by
 * find_aa_density_prep().  A pixel exactly equal to the background gives
 * 0.  Pixels that are not a consistent blend of the two colours are a
 * MUST() failure.  NOTE(review): the return statement is not visible
 * here; presumably the clamped alpha_mean is returned. */
592 static inline Fixpt find_aa_density(const RgbImage *ri, Point p) {
593 Rgb here= ri_rgb(ri, p.x, p.y);
595 if (here==aa_background) return 0;
597 Fixpt alpha[3], alpha_total=0;
/* Per-channel alpha from the channel's distance above the background. */
599 for (i=0; i<3; i++) {
600 unsigned char here_chan= here >> (i*8);
602 Fixpt alpha_chan= fixpt_mul(int2fixpt(here_chan) - aa_bg_chan[i],
604 alpha[i]= alpha_chan;
605 alpha_total += alpha_chan;
608 Fixpt one_third= dbl2fixpt(1/3.0);
609 Fixpt alpha_mean= fixpt_mul(alpha_total, one_third);
/* Tolerance: each channel must lie within 2*thresh of the mean, and the
 * mean within thresh of the range [0, aa_alpha_mean_max]. */
611 Fixpt thresh= dbl2fixpt(1.5/AAMAXVAL);
612 Fixpt alpha_min= alpha_mean - thresh*2;
613 Fixpt alpha_max= alpha_mean + thresh*2;
616 MUST( alpha_min <= alpha[i] && alpha[i] <= alpha_max,
618 MRGB(here);MRGB(aa_background);MRGB(aa_foreground);
619 MFP(aa_alpha_mean_max);MFP(thresh);MFP(alpha_mean);
620 MFP(alpha_min);MI(i);MFP(alpha[i]);MFP(alpha_max) );
622 MUST( -thresh <= alpha_mean && alpha_mean <= aa_alpha_mean_max + thresh,
624 MRGB(here);MRGB(aa_background);MRGB(aa_foreground);
625 MFP(aa_alpha_mean_max);MFP(thresh);
626 MFP(alpha_mean); MFP(alpha[0]);MFP(alpha[1]);MFP(alpha[2]); );
/* Clamp small excursions allowed by the tolerance. */
628 if (alpha_mean < 0) alpha_mean= 0;
629 if (alpha_mean > aa_alpha_mean_max) alpha_mean= aa_alpha_mean_max;
/* Computes the vertical extent of the commodity row number `offset':
 * tl.y = s.commbasey - offset*s.comminty, and the row is s.comminty-1
 * pixels high.  If the row does not lie wholly within s.mr, rr->tl.x is
 * set to -1 and nothing else is done. */
634 static void find_commodity(int offset, Rect *rr) {
635 /* rr->tl.x==-1 if offset out of range */
636 rr->tl.y= s.commbasey - offset*s.comminty;
637 rr->br.y= rr->tl.y + s.comminty-2;
638 if (rr->tl.y < s.mr.tl.y || rr->br.y > s.mr.br.y) { rr->tl.x=-1; return; }
/* A row that does not start on the top line of s.mr must have a full line
 * of '+' directly above it. */
643 if (rr->tl.y > s.mr.tl.y)
644 REQUIRE_RECTANGLE(rr->tl.x,rr->tl.y-1, rr->br.x,rr->tl.y-1, "+");
/* NOTE(review): this compares against s.mr.tl.y.  After the range check
 * above rr->tl.y >= s.mr.tl.y, so the test can only be true when
 * rr->br.y < rr->tl.y, and the check below the row is effectively never
 * made.  By symmetry with the test above, s.mr.br.y looks intended.
 * Confirm before changing: a fix would enable a check that does not run
 * today. */
645 if (rr->br.y < s.mr.tl.y)
646 REQUIRE_RECTANGLE(rr->tl.x,rr->br.y+1, rr->br.x,rr->br.y+1, "+");
/* Computes the rectangle of column `colno' within the row `commod'.  The
 * cell has the row's vertical extent.  Horizontally it runs from the
 * row's left edge (column 0) or from two pixels right of the previous
 * column's recorded right edge, up to s.colrightx[colno]. */
649 static void compute_table_location(Rect commod, int colno, Rect *cell) {
650 cell->tl.y= commod.tl.y;
651 cell->br.y= commod.br.y;
652 cell->tl.x= !colno ? commod.tl.x : s.colrightx[colno-1]+2;
653 cell->br.x= s.colrightx[colno];
654 debug_rect("cell", colno, *cell);
/* Runs OCR on the cell r and writes the recognised strings to tsv_output.
 * The cell is handed to ocr() as w pixel columns, each built from text_h
 * rows starting at r.tl.y.  ct selects the cell type passed to ocr(). */
657 static void ocr_rectangle(Rect r, const OcrCellType ct, FILE *tsv_output) {
658 OcrResultGlyph *results, *res;
660 int w= r.br.x - r.tl.x + 1;
663 for (x=0; x<w; x++) {
665 for (y=0; y<text_h; y++) {
666 Point here= { x+r.tl.x, y+r.tl.y };
667 int pixel= get_p(here);
/* Background ' ' counts as density 0; every pixel must then be a density
 * character '0' .. '0'+AAMAXVAL. */
668 if (pixel==' ') pixel= '0';
669 MUST( pixel >= '0' && pixel <= '0'+AAMAXVAL,
670 MC(pixel);MP(here);MSB(ocr_celltype_name(ct));MR(r); );
671 pixcol_p_add(&cols[x], y, pixel-'0');
676 results= ocr(rd,ct,w,cols);
/* The result array ends at the first entry whose s is null. */
677 for (res=results; res->s; res++)
678 fputs(res->s,tsv_output);
/* FOR_COMMODITY_CELL(ROW_START, CELL, ROW_END): iterates over commodity
 * rows and, within each row, over columns 0..columns-1, with rowr set by
 * find_commodity() and cell by compute_table_location().  Row offsets are
 * tried from +cim->h down to -cim->h.  NOTE(review): where the three code
 * arguments are expanded, and the skipping of out-of-range offsets, are
 * not visible in this excerpt. */
681 #define FOR_COMMODITY_CELL(ROW_START, CELL, ROW_END) do{ \
683 int tryrect, colno; \
685 for (tryrect= +cim->h; tryrect >= -cim->h; tryrect--) { \
686 find_commodity(tryrect, &rowr); \
689 debug_rect("commod",tryrect, rowr); \
693 for (colno=0; colno<columns; colno++) { \
694 compute_table_location(rowr,colno,&cell); \
/* Replaces the canonical characters of one table cell in ci with
 * anti-aliasing density digits ('0' + density) computed from the RGB
 * image ri.  The background colour is taken from the cell's bottom-right
 * pixel, and whether the text is light or dark is decided by counting
 * channel samples lighter and darker than the background. */
703 static void adjust_colours_cell(CanonImage *ci, const RgbImage *ri,
704 int colno, Rect cell) {
706 unsigned char chanbg[3];
707 long bg_count=0, light_count=0, dark_count=0;
711 background= ri_rgb(ri, cell.br.x, cell.br.y);
713 chanbg[i]= background >> (i*8);
716 Rgb herergb= ri_rgb(ri, p.x, p.y);
717 if (herergb==background) {
/* Per channel: count background matches, and weight darker/lighter
 * samples by distance/4 + 1. */
720 for (i=0; i<3; i++) {
721 unsigned char here= herergb >> (i*8);
722 if (here == chanbg[i]) bg_count++;
723 else if (here < chanbg[i]) dark_count += (chanbg[i] - here)/4 + 1;
724 else if (here > chanbg[i]) light_count += (here - chanbg[i])/4 + 1;
728 long total_count= RECT_W(cell) * RECT_H(cell) * 3;
/* More than half of all channel samples must be background. */
730 MUST( bg_count > total_count / 2,
731 MR(cell);MIL(total_count);MIL(bg_count);
732 MIL(light_count);MIL(dark_count) );
734 if (bg_count == total_count)
/* One kind must outweigh the other by more than 16:1, else fatal. */
740 if (light_count/16 > dark_count) {
741 foreground= 0xffffffU;
743 } else if (dark_count/16 > light_count) {
747 MUST( !"tell light from dark",
748 MR(cell);MIL(total_count);MIL(bg_count);
749 MIL(light_count);MIL(dark_count);MRGB(background); );
752 debugf("TABLEENTRY col=%d %d,%d..%d,%d bg=%ld light=%ld dark=%ld\n",
753 colno, cell.tl.x,cell.tl.y, cell.br.x,cell.br.y,
754 bg_count, light_count, dark_count);
758 find_aa_density_prep(background, foreground, fg_extra);
761 Fixpt alpha= find_aa_density(ri,p);
/* Reduce the fixed-point alpha to AADEPTH bits and store it as a digit. */
763 int here_int= alpha >> (FIXPT_SHIFT - AADEPTH);
764 assert(here_int <= AAMAXVAL);
765 if (!(here_int==0 || here_int==AAMAXVAL)) monochrome=0;
766 ci->d[p.y * ci->w + p.x]= '0' + here_int;
769 debug_rect("cell0M", colno, cell);
/* Afterwards every character in the cell must be a decimal digit. */
771 require_rectangle_r(cell, "0123456789", __LINE__);
/* Applies adjust_colours_cell() to every commodity table cell of ci,
 * using ri as the RGB source.  NOTE(review): the action taken when
 * mf_analyse is not set in o_mode is not visible here. */
774 void adjust_colours(CanonImage *ci, const RgbImage *ri) {
775 if (!(o_mode & mf_analyse))
780 FOR_COMMODITY_CELL({},({
781 adjust_colours_cell(ci,ri,colno,cell);
/* Processes every stored page (0 .. npages-1) and writes the commodity
 * table to tsv_output, checking the stream for errors and flushing it.
 * NOTE(review): most of the per-cell logic is not visible in this
 * excerpt. */
785 void analyse(FILE *tsv_output) {
788 for (page=0; page<npages; page++) {
792 check_correct_commodities();
795 rd= ocr_init(text_h);
797 progress("Processing page %d...",page);
804 fputs(tab, tsv_output);
808 : &ocr_celltype_number,
812 fputs("\n", tsv_output);
813 sysassert(!ferror(tsv_output));
814 sysassert(!fflush(tsv_output));
817 progress("Commodity table scan complete.");
820 //static Rect islandnamer;
822 DEBUG_DEFINE_SOME_DEBUGF(structcolon,colondebugf)
/* Locates the "sunshine" widget in the current image and returns its
 * rectangle.  The starting x range is fixed relative to the image's right
 * edge (offsets relative to a width of 1034).  NOTE(review): the initial
 * y values and the return statement are not visible in this excerpt. */
824 Rect find_sunshine_widget(void) {
827 sunshiner.tl.x= cim->w - 1034 + 885;
828 sunshiner.br.x= cim->w - 1034 + 1020;
/* Move the top edge up and the bottom edge down until each lies on a row
 * with at least 30 'o' or '*' pixels. */
832 ADJUST_BOX(sunshiner,"o*",>=,30, 100,MUST, tl,y,-1);
833 ADJUST_BOX(sunshiner,"o*",>=,30, 100,MUST, br,y,+1);
834 debug_rect("sunshiner",0, sunshiner);
836 MUST(sunshiner.br.y - sunshiner.tl.y > 20, MR(sunshiner));
/* Then widen left and right until each side lies on a column with at
 * least 20 'o' pixels. */
839 ADJUST_BOX(sunshiner,"o",>=,20, (cim->w - 1034 + 700), MUST, tl,x,-1);
840 ADJUST_BOX(sunshiner,"o",>=,20, cim->w, MUST, br,x,+1);
841 debug_rect("sunshiner",1, sunshiner);
/* Determines the current archipelago and island names and stores them in
 * the globals `archipelago' and `island'.  Works on a copy of page 0's
 * RGB image.  The sunshine widget is identified first; depending on its
 * identity the name is read either from a fixed area (widget identity
 * starting "Vesse...") or from the output below an ahoy heading
 * ("Land - Ahoy!").  Any other widget identity is a MUST() failure.  The
 * identified string is split at " - " into archipelago and island. */
845 void find_islandname(void) {
846 const RgbImage *rgbsrc= page0_rgbimage;
849 RgbImage *ri= alloc_rgb_image(rgbsrc->w, rgbsrc->h);
850 memcpy(ri->data, rgbsrc->data, ri->w * ri->h * 3);
852 Rect sunshiner= find_sunshine_widget();
853 char sunshine[MAXIMGIDENT], archisland[MAXIMGIDENT];
/* Reduce colour depth: keep the top 4 bits of each channel and copy them
 * into the low 4 bits. */
857 for (srcp= rgbsrc->data, destp=ri->data,
858 endp= ri->data + ri->w * ri->h;
861 Rgb new= *srcp & 0xf0f0f0;
862 *destp= new | (new>>4);
865 identify_rgbimage(ri, sunshiner, sunshine, "sunshine widget");
/* NOTE(review): only the first 5 bytes ("Vesse") are compared although
 * the literal is the 7-character "Vessel " - confirm the intended
 * length. */
867 if (!memcmp(sunshine,"Vessel ",5)) {
870 islandnamer.tl.x= cim->w - 1034 + 885;
871 islandnamer.br.x= cim->w - 1034 + 1020;
872 islandnamer.tl.y= 128;
873 islandnamer.br.y= 156;
/* Shrink the fixed box onto the text: rows need at least 5 'o' pixels,
 * columns at least 1. */
875 ADJUST_BOX(islandnamer,"o",>=,5, 0, MUST, tl,y,+1);
876 ADJUST_BOX(islandnamer,"o",>=,5, cim->h, MUST, br,y,-1);
878 ADJUST_BOX(islandnamer,"o",>=,1, 0, MUST, tl,x,+1);
879 ADJUST_BOX(islandnamer,"o",>=,1, cim->w, MUST, br,x,-1);
881 debug_rect("islandnamer",0, islandnamer);
882 // int larger_islandnamebry= islandnamer.tl.y + 25;
883 // MUST(islandnamer.br.y < larger_islandnamebry,
884 // MR(islandnamer);MI(larger_islandnamebry));
885 // islandnamer.br.y = larger_islandnamebry;
886 debug_rect("islandnamer",1, islandnamer);
/* Pixels whose low byte is below 0x40 are set to 0 before identifying. */
889 for (x=islandnamer.tl.x; x<=islandnamer.br.x; x++)
890 for (y=islandnamer.tl.y; y<=islandnamer.br.y; y++) {
891 if ((ri_rgb(ri,x,y) & 0xff) < 0x40) {
892 *RI_PIXEL32(ri,x,y)= 0;
896 identify_rgbimage(ri, islandnamer, archisland, "island");
897 } else if (!strcmp(sunshine,"Land - Ahoy!")) {
/* Start 100 pixels below the top of the sunshine widget, at its
 * horizontal centre, and walk to the ahoy heading and its edges. */
900 islandnamer.tl.x= (sunshiner.tl.x + sunshiner.br.x) / 2;
901 islandnamer.tl.y= sunshiner.tl.y + 100;
902 islandnamer.br= islandnamer.tl;
903 debug_rect("islandnamer",__LINE__, islandnamer);
905 WALK_UNTIL_MUST(islandnamer.tl,y, -1, sunshiner.br.y, 'H');
906 WALK_UNTIL_MUST(islandnamer.tl,x, -1, 0, 'o');
907 WALK_UNTIL_MUST(islandnamer.br,x, +1, cim->w, 'o');
908 debug_rect("islandnamer",__LINE__, islandnamer);
910 #define RW (RECT_W(islandnamer))
911 #define RH (RECT_H(islandnamer))
913 ADJUST_BOX(islandnamer,"O",>=,RW-4, cim->h, MUST,br,y,+1);
914 debug_rect("islandnamer",__LINE__, islandnamer);
916 islandnamer.br.y += 2;
918 ADJUST_BOX(islandnamer,"*",<,RW, cim->h, MUST,br,y,+1);
919 debug_rect("islandnamer",__LINE__, islandnamer);
921 islandnamer.tl.y= islandnamer.br.y-1;
922 islandnamer.br.y= islandnamer.br.y+1;
923 debug_rect("islandnamer",__LINE__, islandnamer);
925 ADJUST_BOX(islandnamer,"*",>=,RW, cim->h, MUST,br,y,+1);
926 debug_rect("islandnamer",__LINE__, islandnamer);
928 ADJUST_BOX(islandnamer,"*",<, RH, cim->w, MUST,tl,x,+1);
929 debug_rect("islandnamer",__LINE__, islandnamer);
931 MUST( RECT_H(islandnamer) <= 30, MR(islandnamer));
/* Scan columns from right to left looking for a colon; not finding one is
 * fatal.  On success the box's right edge is moved to the column found. */
934 int nspaces=1, might_be_colon=0;
935 uint32_t colon_pattern= 0;
938 for (p.x=islandnamer.br.x; p.x>islandnamer.tl.x; p.x--) {
939 colondebugf("structcolon: x=%4d nsp=%2d mbc=%d cp=%08"PRIx32" ",
940 p.x, nspaces, might_be_colon, colon_pattern);
943 int runs[32], nruns=0;
944 runs[0]=0; runs[1]=0;
946 find_aa_density_prep(0xCCCCAA,0x002255,0);
948 for (p.y=islandnamer.tl.y; p.y<=islandnamer.br.y; p.y++) {
/* A pixel counts as set when its foreground density is at least 0.49. */
950 Fixpt alpha= find_aa_density(ri,p);
951 if (alpha >= dbl2fixpt(0.49)) {
962 colondebugf(" pat=%08"PRIx32" nruns=%d runs[]={%d,%d..} ",
963 pattern, nruns, runs[0],runs[1]);
967 /* omg it _is_ a colon */
972 if (nruns==2 && runs[1]==runs[0]) {
974 if (pattern==colon_pattern)
975 goto ok_might_be_colon;
976 } else if (nspaces>=2) {
977 colon_pattern= pattern;
979 goto ok_might_be_colon;
981 } else if (nruns==1 && runs[0]==1 && might_be_colon) {
988 colondebugf(" nsp=%2d mbc=%d\n", nspaces, might_be_colon);
990 MUST(!"colon found", MP(p);MR(islandnamer) );
993 colondebugf(" found\n");
994 islandnamer.br.x= p.x;
996 identify_rgbimage(ri, islandnamer, archisland, "island");
999 MUST(!"sunshine shows ship or ahoy", MS(sunshine) );
/* NOTE(review): strstr() returns NULL when " - " is absent; no check is
 * visible in this excerpt before delim is used below - confirm. */
1003 char *delim= strstr(archisland," - ");
1005 archipelago= masprintf("%.*s", (int)(delim-archisland), archisland);
1006 island= masprintf("%s", delim+3);