3 # helper program for OCR in PCTB upload client
5 # This is part of ypp-sc-tools, a set of third-party tools for assisting
6 # players of Yohoho Puzzle Pirates.
8 # Copyright (C) 2009 Ian Jackson <ijackson@chiark.greenend.org.uk>
10 # This program is free software: you can redistribute it and/or modify
11 # it under the terms of the GNU General Public License as published by
12 # the Free Software Foundation, either version 3 of the License, or
13 # (at your option) any later version.
15 # This program is distributed in the hope that it will be useful,
16 # but WITHOUT ANY WARRANTY; without even the implied warranty of
17 # MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
18 # GNU General Public License for more details.
20 # You should have received a copy of the GNU General Public License
21 # along with this program. If not, see <http://www.gnu.org/licenses/>.
23 # Yohoho and Puzzle Pirates are probably trademarks of Three Rings and
24 # are used without permission. This program is not endorsed or
25 # sponsored by Three Rings.
29 # run this without args
31 # one line which is a Tcl list for unk_{l,r} unk_contexts glyphsdone etc.
32 # the xpm in the format expected
33 # then expect child to exit 0, or write a single 0 byte to fd 4
34 # if it wrote a byte to fd 4, it can take another question
# manyset LIST VARNAME...
# Walks the values of LIST and the names in ARGS in lock-step, one value per
# name.  Callers in this file use it to unpack a list into several variables
# at once (for example the XPM values line into cols, rows, colours, cpp).
# NOTE(review): foreach pads the shorter of the two lists with empty strings,
# so a LIST longer than ARGS produces an iteration with an empty variable
# name - check that callers pass matching lengths.
37 proc manyset {list args} {
38 foreach val $list var $args {
45 #---------- display core ----------
# init_widgets
# Creates the display widgets under .d: the main picture label (.d.mi), the
# black strips .d.csr, .d.got and .d.ctx, the cursor label and entry inside
# .d.csr.csr, and two one-pixel-wide white marker frames inside .d.mi.
# Takes no arguments; the strip heights come from the globals csrh and gotsh.
54 proc init_widgets {} {
56 global csrh gotsh ctxh
# Skip everything if .d already exists.
58 if {[winfo exists .d]} return
# Main picture label, shown without a border.
62 image create bitmap image/main
63 label .d.mi -image image/main -borderwidth 0
# Three black strips; they are packed around the picture at the end.
65 frame .d.csr -bg black -height $csrh
66 frame .d.got -bg black -height $gotsh
67 frame .d.ctx -bg black
# Cursor glyph, supplied inline as bitmap data.
69 image create bitmap image/cursor -data \
72 static unsigned char csr_bits[] = {
73 0x20, 0x00, 0x20, 0x00, 0x20, 0x00, 0x21, 0x04, 0x22, 0x02, 0x25, 0x05,
74 0xaa, 0x02, 0x74, 0x01, 0xa8, 0x00, 0x70, 0x00, 0x20, 0x00};
78 label .d.csr.csr.l -image image/cursor -compound left
79 entry .d.csr.csr.e -bd 0
80 pack .d.csr.csr.l -side left
# White marker frames csr_0 and csr_1, children of the picture label.
82 frame .d.mi.csr_0 -bg white -width 1
83 frame .d.mi.csr_1 -bg white -width 1
85 pack .d.csr .d.mi .d.got .d.ctx -side top
# show_context MAXHV X CTXS
# Creates a black label listing the contexts in CTXS (joined with "/" and a
# newline, left-justified) and places it at x = (X-1)*mul, y = 0.
# The text is blue when CTXS has exactly one element and yellow otherwise.
# The label's requested height is folded into the running maximum maxh.
# NOTE(review): MAXHV looks like the name of the caller's maximum-height
# variable (callers pass the literal word maxh) - confirm how it is linked
# to maxh in this proc.
92 proc show_context {maxhv x ctxs} {
96 if {[llength $ctxs]==1} { set fg blue } { set fg yellow }
97 label $w -bg black -fg $fg -text [join $ctxs "/\n"] -justify left
98 place $w -x [expr {($x-1)*$mul}] -y 0
99 set wh [winfo reqheight $w]
100 if {$wh > $maxh} { set maxh $wh }
# resize_widgets
# Resizes the display to the current magnified picture: sets the width of
# .d.csr, .d.got and .d.ctx to mulcols and the height of a .d.mi.csr_<w>
# marker frame to mulrows, then destroys the children of .d.ctx, calls
# show_context for every glyphsdone entry and for the unknown region at
# unk_l, and finally sets the height of .d.ctx to maxh.
103 proc resize_widgets {} {
104 global mulcols mulrows csrh gotsh ctxh glyphsdone
105 global unk_l unk_contexts
107 foreach w {.d.csr .d.got .d.ctx} {
108 $w configure -width $mulcols
110 #.d configure -height [expr {$csrh+$mulrows+$gotsh+$ctxh}]
112 .d.mi.csr_$w configure -height $mulrows
115 eval destroy [winfo children .d.ctx]
118 foreach {min max contexts got} $glyphsdone {
119 show_context maxh $min $contexts
121 show_context maxh $unk_l $unk_contexts
122 .d.ctx configure -height $maxh
126 #---------- xpm input processor ----------
# Shared state: unk_l, unk_r and cols are rebased to the cropped picture
# below; mulcols, mulrows and wordmap are set here as well.
129 global glyphsdone mul inter rhsmost_max unk_l unk_r mulcols mulrows
130 global cols rows wordmap
# Read the next input line from channel f; running out of input is an error.
135 if {[gets $f l] < 0} { error "huh? "}
136 if {![regexp {^"(.*)",$} $l dummy l]} {
138 if {[regexp {^\}\;$} $l]} break
# XPM values line: width, height, number of colours, characters per pixel.
# Only two-colour, one-character-per-pixel input is accepted.
142 manyset $l cols rows colours cpp
143 if {$colours!=2 || $cpp!=1} { error "$l ?" }
# Crop margins: chop_l columns come off the left (never negative) and chop_r
# off the right.  chop_r can be negative, in which case the row is padded
# with spaces further down instead of being cut.
# NOTE(review): chop_r is computed from unk_l rather than unk_r - confirm
# that this is intended.
145 set chop_l [expr {$unk_l - 80}]
146 set chop_r [expr {$cols - $unk_l - 100}]
147 if {$chop_l<0} { set chop_l 0 }
# Rebase the unknown-region bounds onto the cropped picture.
149 set unk_l [expr {$unk_l - $chop_l}]
150 set unk_r [expr {$unk_r - $chop_l}]
152 foreach {min max contexts got} $glyphsdone {
154 [expr {$min-$chop_l}] \
155 [expr {$max-$chop_l}] \
161 set cols [expr {$cols - $chop_l - $chop_r}]
162 debug "NOW cols=$cols chop_l,r=$chop_l,$chop_r rows=$rows\
165 set mulcols [expr {$cols*$mul+$inter}]
166 set mulrows [expr {$rows*$mul+$inter}]
# Values line of the generated XPM: magnified size, 9 colours, 1 char/pixel.
167 append o "\"$mulcols $mulrows 9 1\",\n"
# Start every column's wordmap value at zero.
168 for {set x 0} {$x<$cols} {incr x} { set wordmap($x) 0 }
169 } elseif {$y==-2} { # first pixel
180 } elseif {$y==-1} { # 2nd pixel but we've already printed ours
# Bit representing row y in the per-column wordmap values.
182 set ybit [expr {1<<$y}]
187 set l [string range $l $chop_l end-$chop_r]
189 set l [string range $l $chop_l end]
190 append l [string repeat " " [expr -$chop_r]]
192 foreach c [split $l ""] {
194 if {$x >= $unk_l && $x <= $unk_r} {
198 foreach {min max contexts got} $glyphsdone {
200 if {$x >= $min && $x <= $max} {
201 set how [lindex {a b} $ab]
210 set p [string toupper $how]
211 incr wordmap($x) $ybit
213 default { error "$c ?" }
215 append ol "[string repeat $p [expr {$mul-$inter}]][
216 string repeat + $inter]"
217 append olh [string repeat + $mul]
223 set olhn [string repeat $olh $inter]
224 if {!$y} { append o $olhn }
225 append o [string repeat $ol [expr {$mul-1}]]
# Convert the generated XPM text with the external xpmtoppm program and load
# the result as the photo image image/main.
230 set data [exec xpmtoppm << $o]
231 image create photo image/main -data $data
235 #---------- per-invocation display ----------
# draw_glyphsdone
# Rebuilds the contents of the .d.got strip from the global glyphsdone list,
# which is read four elements at a time as (min max contexts got).
237 proc draw_glyphsdone {} {
238 global glyphsdone mul inter
# Remove whatever was drawn previously.
239 eval destroy [winfo children .d.got]
240 foreach {min max contexts got} $glyphsdone {
# A #888 frame holding a white-on-black label with the text GOT; the one
# pixel of padding leaves the frame colour visible around the label.
241 frame .d.got.m$min -bd 0 -background \#888
242 label .d.got.m$min.l -text "$got" -fg white -bg black -bd 0
243 pack .d.got.m$min.l -padx 1 -pady 1
# Position the box at the glyph's left column in magnified coordinates.
244 place .d.got.m$min -x [expr {$min*$mul+$inter}] -y 0
# startup_cursor
# Sets the initial cursor state: cur_already becomes the index of the last
# glyphsdone entry (four list elements per entry, so -1 when the list is
# empty), cur_mode starts as 1, and cur_1 starts one column past unk_r.
248 proc startup_cursor {} {
249 global cur_already cur_mode cur_0 cur_1 last_ht
250 global glyphsdone unk_l unk_r
252 set cur_already [expr {[llength $glyphsdone]/4-1}]
253 set cur_mode 1 ;# one of: 0 1 already text
256 set cur_1 [expr {$unk_r+1}]
263 #---------- runtime display and keystroke handling ----------
# Nothing to redraw when the requested table t equals the one recorded in
# last_ht.
267 if {![string compare $t $last_ht]} return
# Drop the old cells, then lay t out as a grid: each element of t is a row
# (index y) and each element of a row is a cell (index x).
268 eval destroy [grid slaves .help]
269 set y 0; foreach l $t {
270 set x 0; foreach c $l {
271 set w .help.at${x}x${y}
273 grid $w -row $y -column $x -padx 5
# Handlers for cursor modes 0 and 1: both delegate to recursor//01, passing
# the index (0 or 1) of the cursor that the keys should move.
281 proc recursor/0 {} { recursor//01 0 }
282 proc recursor/1 {} { recursor//01 1 }
# recursor//01 Z1
# Sets up the display and key bindings for adjusting cursor Z1 (0 or 1):
# labels the cursor widget "adjust" and places it at x = cur*mul-7, binds
# Space to othercursor, binds Left/Right through bind_leftright_q so that
# cur_Z1 moves within 0..cols-1, and, when glyphsdone is not empty, binds
# Tab to switch cur_mode to "already".
# The rows at the end list the keys available in this mode.
# NOTE(review): those rows are presumably the argument of a helptext call -
# confirm.
283 proc recursor//01 {z1} {
284 global mul rhsmost_max cols glyphsdone
286 .d.csr.csr.l configure -text {adjust}
287 place .d.csr.csr -x [expr {$cur*$mul - 7}]
288 bind_key space { othercursor }
289 bind_leftright_q cur_$z1 0 [expr {$cols-1}]
290 if {[llength $glyphsdone]} {
291 bind_key Tab { set cur_mode already; recursor }
296 if {$cur_0 != $cur_1} {
297 .d.csr.csr.e delete 0 end
303 {{<- ->} {move cursor, adjusting area to define}}
304 {Space {switch to moving other cursor}}
305 {Return {confirm location, enter letter(s)}}
306 {Tab {switch to correcting earlier ocr}}
307 {Q {quit and abandon OCR run}}
# othercursor
# Flips cur_mode between 0 and 1 by logical negation, which selects the
# other of the two cursors for moving (this is the Space key action).
310 proc othercursor {} {
312 set cur_mode [expr {!$cur_mode}]
# recursor/text
# Text-entry mode: labels the cursor widget "define:" and shows the entry
# .d.csr.csr.e beside it.  Per the help rows, Return confirms the entry and
# Escape abandons it.  The entry contents are checked against a pattern that
# accepts printable ASCII other than space and backslash, a doubled
# backslash, or a backslash-x escape with two lower-case hex digits; when
# the check passes the result is handed to RETURN_RESULT DEFINE together
# with cur_0 and cur_1.  The entry is hidden again with pack forget.
# NOTE(review): the pattern is anchored only at the start, so a string that
# merely begins with acceptable characters also passes - confirm whether an
# end anchor was intended.
316 proc recursor/text {} {
318 {Return {confirm entry of new glyph}}
319 {Escape {abandon entry}}
322 .d.csr.csr.l configure -text {define:}
323 pack .d.csr.csr.e -side left
326 set strq [.d.csr.csr.e get]
327 if {[regexp {^(?:[!-[]|[]-~]|\\\\|\\x[0-9a-f]{2})+} $strq]} {
328 RETURN_RESULT DEFINE "$cur_0 $cur_1 $strq"
333 pack forget .d.csr.csr.e
# recursor/already
# Correction mode: labels the cursor widget "correct" and places it at
# x = rmax*mul-3, where rmax is element 0 of the glyphsdone entry selected
# by cur_already (the element other procs call min).  Left/Right move
# cur_already over the entries, Tab clears the Delete binding and returns to
# cursor mode 1, and RETURN_RESULT DELETE is called with the first three
# elements of the selected entry.
# NOTE(review): the RETURN_RESULT DELETE call is presumably the Delete key
# action described in the help rows - confirm.
# NOTE(review): cur_already and mul are declared global on two adjacent
# lines; the first declaration is redundant.
339 proc recursor/already {} {
342 global cur_already mul
343 global glyphsdone cur_already mul
344 .d.csr.csr.l configure -text {correct}
345 set rmax [lindex $glyphsdone [expr {$cur_already*4}]]
346 place .d.csr.csr -x [expr {$rmax*$mul-3}]
349 bind_leftright_q cur_already 0 [expr {[llength $glyphsdone]/4-1}]
350 bind_key Tab { bind_key Delete {}; set cur_mode 1; recursor }
352 RETURN_RESULT DELETE [lrange $glyphsdone \
353 [expr $cur_already*4] \
354 [expr $cur_already*4+2]]
357 {{<- ->} {move cursor, selecting glyph to correct}}
358 {Del {clear this glyph from the recognition database}}
359 {Tab {switch to selecting area to define as new glyph}}
360 {Q {quit and abandon OCR run}}
# bind_key K PROC
# Binds the script PROC to <Key-K> on the toplevel "." and records in
# keybindings(K) whether a binding is now active: 1 when PROC is non-empty,
# 0 when PROC is the empty string (which removes the binding).
364 proc bind_key {k proc} {
366 bind . <Key-$k> $proc
367 set keybindings($k) [expr {!![string length $proc]}]
# unbind_all_keys
# Clears every key recorded in the keybindings array by rebinding it to an
# empty script through bind_key.
369 proc unbind_all_keys {} {
371 foreach k [array names keybindings] { bind_key $k {} }
# bind_leftright_q VAR MIN MAX
# Binds Left and Right to leftright so that they step the variable named VAR
# by -1 and +1 within MIN..MAX.
# NOTE(review): the stderr message appears to belong to a quit binding (the
# help tables list Q as the quit key) - confirm.
374 proc bind_leftright_q {var min max} {
375 bind_key Left [list leftright $var $min $max -1]
376 bind_key Right [list leftright $var $min $max +1]
378 puts stderr "\nCharacter resolver quitting as you requested."
# leftright VAR MIN MAX INC
# Key handler installed by bind_leftright_q with INC of -1 or +1.  It returns
# without further action when the candidate value vnew lies outside MIN..MAX.
# NOTE(review): vnew is presumably the current value of the variable named
# VAR plus INC - confirm.
382 proc leftright {var min max inc} {
386 if {$vnew < $min || $vnew > $max} return
392 global csrh cur_mode cur_0 cur_1 mul
# Move marker frame z1 to the column held in cur_<z1>, scaled by mul.
394 place .d.mi.csr_$z1 -y 0 -x [expr {[set cur_$z1] * $mul}]
400 #---------- database read and write ----------
404 # <context> <ncharacters> <hex>...
408 # $database($context 0x<bits> 0x<bits>...) = $hex
# First line of the charset database file: read_database requires it and
# write_database emits it.
410 set database_header {# ypp-sc-tools pctb font v1}
# Running out of input while another database line is expected is fatal.
413 if {[gets $f l] < 0} { error "unexpected db eof" }
# read_database
# Loads the glyph database for the current picture height from
# ./charset-<rows>.txt into the global array database, discarding any
# previous contents first.  If the file does not exist the proc returns with
# the array unset.
# The file must start with database_header followed by a line numerically
# equal to rows.  Entries follow: a context line (empty lines and lines
# starting with # are skipped; a lone "." stops reading), a line kept as the
# entry's value strq, then lines up to an empty one, each reformatted with
# format %x and appended to the key list bm.  The value is stored as
# database(bm).
# NOTE(review): the header-mismatch error message reads $l, which is not set
# in this proc at that point, so Tcl would raise an unset-variable error
# instead of the intended message.
417 proc read_database {} {
418 global database database_header rows database_fn
419 catch { unset database }
420 set database_fn ./charset-$rows.txt
421 if {![file exists $database_fn]} return
422 set f [open $database_fn r]
423 if {[string compare [db_getsl $f] $database_header]} { error "$l ?" }
424 if {([db_getsl $f])+0 != $rows} { error "wrong h ?" }
426 set context [db_getsl $f]
427 if {![string length $context]} continue
428 if {[regexp {^\#} $context]} continue
429 if {![string compare . $context]} break
432 set strq [db_getsl $f]
435 if {![string length $l]} break
436 lappend bm [format %x 0x$l]
438 set database($bm) $strq
# write_database
# Writes the global array database back to database_fn.  The text goes to
# database_fn.new first and that file is then renamed over database_fn with
# -force, so the old file is only replaced after the new one is written.
# Each entry is rendered as the first element of its key (the context), the
# value strq, then one line per remaining key element.  The file starts with
# database_header and rows, and the rendered entries follow in lsort order.
443 proc write_database {} {
444 global database rows database_fn database_header
446 foreach bm [array names database] {
447 set strq $database($bm)
448 set o "[lindex $bm 0]\n$strq\n"
449 foreach x [lrange $bm 1 end] { append o "$x\n" }
453 set f [open $database_fn.new w]
454 puts $f "$database_header\n$rows\n"
455 foreach o [lsort $ol] {
460 file rename -force $database_fn.new $database_fn
# dbkey CTX L R
# Builds a database key list bm: for each column x from L to R inclusive the
# value wordmap(x) is appended, formatted as lower-case hex without a prefix.
# NOTE(review): CTX is presumably the first element of the key, since
# write_database treats element 0 of a key as the context - confirm.
463 proc dbkey {ctx l r} {
466 for {set x $l} {$x <= $r} {incr x} {
467 lappend bm [format %x $wordmap($x)]
# update_database/DEFINE C0 C1 STRQ
# Records STRQ as the database value for columns C0..C1; the two bounds are
# swapped first when C0 is greater than C1.
# The contexts to store under (ncontexts) come either from unk_contexts or
# from the glyphsdone entry whose left column equals C0.  When ncontexts was
# never set, "must start at letter LHS!" is printed on stderr.
# One entry is stored per context, keyed by dbkey of that context and the
# column range.
# NOTE(review): the condition under which unk_contexts is chosen is
# presumably that C0 equals unk_l - confirm.
472 proc update_database/DEFINE {c0 c1 strq} {
473 global glyphsdone unk_l unk_contexts wordmap database
474 if {$c0 > $c1} { manyset [list $c0 $c1] c1 c0 }
476 set ncontexts $unk_contexts
478 foreach {l r contexts got} $glyphsdone {
479 if {$l==$c0} { set ncontexts $contexts; break }
481 if {![info exists ncontexts]} {
482 puts stderr "must start at letter LHS!"
487 foreach c $ncontexts {
488 set bm [dbkey $c $c0 $c1]
489 set database($bm) $strq
# update_database/DELETE L R CTXS
# Removes the database entry keyed by dbkey of a context ctx and columns
# L..R.  The unset is wrapped in catch, so a missing entry is ignored.
# NOTE(review): ctx presumably iterates over the elements of CTXS - confirm.
494 proc update_database/DELETE {l r ctxs} {
497 set bm [dbkey $ctx $l $r]
498 catch { unset database($bm) }
# RETURN_RESULT HOW WHAT
# Finishes the current interaction: hides the cursor widget and its entry,
# replaces the help table with a " Processing " notice, and applies the
# result by calling update_database/HOW with the words of WHAT as separate
# arguments (WHAT is expanded by eval).
504 proc RETURN_RESULT {how what} {
506 place forget .d.csr.csr
507 pack forget .d.csr.csr.e
508 helptext {{{ Processing }}}
512 eval update_database/$how $what
516 #---------- main program ----------
# main/default
# Main proc for the "default" kind: tells the user on stderr that the
# program is not meant to be run directly.
518 proc main/default {} {
519 puts stderr "Do not run this program directly."
# NOTE(review): the fixed context "Test" and the local file text.xpm suggest
# this is a manual test entry point - confirm.
522 global glyphsdone unk_l unk_r unk_contexts
531 set unk_contexts Test
533 set f [open text.xpm]
# done/default
# Counterpart of done/automatic for the "default" main kind.
# NOTE(review): presumably selected by name from the main kind - confirm.
542 proc done/default {} {
546 global glyphsdone unk_l unk_r unk_contexts
# A negative count from gets means no complete line was read.  At real end
# of input, restore blocking mode and exit with status 0.
548 if {[gets stdin l]<0} {
549 if {[eof stdin]} { fconfigure stdin -blocking yes; exit 0 }
# The line is a Tcl list: unk_l, unk_r, unk_contexts, then the glyphsdone
# elements.
# NOTE(review): lrange 0 3 selects four elements for three variables, and
# element 3 is also the first element of glyphsdone - 0 2 may have been
# intended.
553 manyset [lrange $l 0 3] unk_l unk_r unk_contexts
554 set glyphsdone [lrange $l 3 end]
# Stop watching stdin for readability and switch it back to blocking mode.
557 fileevent stdin readable {}
558 fconfigure stdin -blocking yes
# main/automatic
# Main proc for the "automatic" kind: puts stdin into non-blocking mode and
# arranges for the command "required" to run whenever stdin is readable.
567 proc main/automatic {} {
568 fconfigure stdin -blocking no
569 fileevent stdin readable required
# done/automatic
# Runs a shell command that writes a single zero byte to file descriptor 4.
# The file header describes that byte as the sign that another question can
# be taken.
571 proc done/automatic {} {
572 exec sh -c {printf \\0 >&4}
# Command-line option handling for one argument, arg: --debug defines the
# debug proc (messages go to stderr with a SHOW-THING prefix), --automatic-1
# sets mainkind to automatic, and anything unrecognised is an error.
# NOTE(review): with -exact, the --automatic* arm matches only that literal
# string and not other --automatic-N spellings; glob matching may have been
# intended.
580 switch -exact -- $arg {
581 {--debug} { proc debug {m} { puts stderr "SHOW-THING $m" } }
583 {--automatic-1} { set mainkind automatic }
584 {--automatic*} { error "incompatible versions - install problem" }
585 default { error "huh $argv ?" }