From: kramm Date: Tue, 13 Jan 2009 22:28:00 +0000 (+0000) Subject: (patched) gocr-0.44 X-Git-Tag: release-0-9-0~293 X-Git-Url: http://git.asbjorn.biz/?p=swftools.git;a=commitdiff_plain;h=538278e28e3e9739cee7b9b9d39f5dad828e6b87 (patched) gocr-0.44 --- diff --git a/lib/gocr/database.c b/lib/gocr/database.c new file mode 100644 index 0000000..21a4f02 --- /dev/null +++ b/lib/gocr/database.c @@ -0,0 +1,451 @@ +/* +This is a Optical-Character-Recognition program +Copyright (C) 2000-2006 Joerg Schulenburg + +This program is free software; you can redistribute it and/or +modify it under the terms of the GNU General Public License +as published by the Free Software Foundation; either version 2 +of the License, or (at your option) any later version. + +This program is distributed in the hope that it will be useful, +but WITHOUT ANY WARRANTY; without even the implied warranty of +MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the +GNU General Public License for more details. + +You should have received a copy of the GNU General Public License +along with this program; if not, write to the Free Software +Foundation, Inc., 59 Temple Place - Suite 330, Boston, MA 02111-1307, USA. + + see README for EMAIL address + */ + +#include +#include +#include "gocr.h" +#include "pnm.h" +#include "pgm2asc.h" +#include +#include + +#define Blen 256 + +// load boxes from database into boxlist (for faster access) +// used as alternate engine, comparing chars with database +int load_db(void) { + FILE *f1; + char s1[Blen+1], + s2[Blen+1] = "./db/", /* ToDo: replace by constant! by configure */ + *s3; + int i, j, ii, i2, line; + struct box *box1; + pix *pp; + + if( JOB->cfg.db_path ) strncpy(s2,JOB->cfg.db_path,Blen-1); + i2=strlen(s2); + if (JOB->cfg.verbose) + fprintf(stderr, "# load database %s %s ... ",s2,JOB->cfg.db_path); + + strncpy(s2+i2,"db.lst",Blen-i2);s2[Blen]=0; + f1 = fopen(s2, "r"); + if (!f1) { + fprintf(stderr, " DB %s not found\n",s2); + return 1; + } + + line = 0; /* line counter for better error report */ + for (ii = 0; !feof(f1); ii++) { +/* bbg: should write a better input routine */ + if (!fgets(s1, Blen, f1)) break; line++; + j = strlen(s1); + /* remove carriage return sequences from line */ + while (j > 0 && (s1[j - 1] == '\r' || s1[j - 1] == '\n')) + s1[--j] = 0; + if (!j) continue; /* skip empty line */ + if (s1[0]=='#') continue; /* skip comments (v0.44) */ + /* copy file name */ + for (i = 0; i < j && i+i2 < Blen && strchr(" \t,;",s1[i]) == 0; i++) + s2[i2 + i] = s1[i]; + s2[i2+i]=0; + /* skip spaces */ + for (; i < j && strchr(" \t",s1[i]) != 0; i++); + /* by now: read pix, fill box, goto next ??? */ + pp = (pix *)malloc(sizeof(pix)); + if( !pp ) fprintf(stderr,"malloc error in load_db pix\n"); + + //readpgm(s2, pp, 0 * JOB->cfg.verbose); + fprintf(stderr, "Can't call readpgm()\n"); + + box1 = (struct box *)malloc_box(NULL); + if(!box1) fprintf(stderr,"malloc error in load_db box1\n"); + box1->x0 = 0; + box1->x1 = pp->x-1; // white border 1 pixel width + box1->y0 = 0; + box1->y1 = pp->y-1; + box1->x = 1; + box1->y = 1; + box1->dots = 0; + box1->c = 0; + box1->modifier = 0; /* ToDo: obsolete */ + box1->tas[0]=NULL; + box1->tac[0]=0; + box1->wac[0]=100; /* really 100% sure? */ + box1->num_ac=1; + if (s1[i]=='"'){ /* parse a string */ + j=strrchr(s1+i+1,'"')-(s1+i+1); /* we only look for first and last "" */ + if (j>=1) { + s3=(char *)malloc(j+1); + if (!s3) fprintf (stderr, "malloc error in load_db s3\n"); + if (s3) { + memcpy(s3,s1+i+1,j); + s3[j]=0; + box1->tas[0]=s3; + // fprintf(stderr,"\nstring=%s",s3); + } + } else { fprintf(stderr,"load_db: string parse error L%d\n",line); } + } else { + box1->tac[0] = box1->c = s1[i]; /* try to interpret as ASCII */ + /* we can live without hexcode in future if we use UTF8-strings */ + s3=s1+i; + j=strtol( s1+i, &s3, 16); /* try to read 4 to 8 digit hex unicode */ + /* if its an hexcode, ASCII interpretation is overwritten */ + if( j && i+3<=Blen && s3-s1-i>3 ) box1->tac[0] = box1->c = j; + // fprintf(stderr,"\nhexcode=%04x=%04x %d",(int)j,(int)box1->c,s3-s1-i); + } + box1->num = 0; + box1->line = -1; + box1->m1 = 0; /* ToDo: should be given too in the database! */ + box1->m2 = 0; + box1->m3 = 0; + box1->m4 = 0; + box1->p = pp; + list_app(&JOB->tmp.dblist, box1); // append to list +#if 0 + out_x(box1); +#endif + } + fclose(f1); + if (JOB->cfg.verbose) + fprintf(stderr, " %d chars loaded\n", ii); + return 0; +} + +// expand database from box/boxlist name=db_$utime.pbm +// this is added in version v0.3.3 +int store_db(struct box *box1) { + FILE *f1; + char s2[Blen+1] = "./db/", s3[Blen+1]; + int i2, dx, dy; + pix b; /* temporary mini page */ + + if( JOB->cfg.db_path ) strncpy(s2,JOB->cfg.db_path,Blen-1); + i2=strlen(s2); + + /* name generation can cause problems, if called twice within a second */ + if (box1->num_ac && box1->tas[0]) + sprintf(s3,"db_%04x_%lu.pbm", (unsigned int)box1->tas[0][0], + (unsigned long)time(NULL)); + else + sprintf(s3,"db_%04x_%lu.pbm", (unsigned int)box1->c, + (unsigned long)time(NULL)); + /* ToDo: the file name may be not unique */ + strncpy(s2+i2,"db.lst",Blen-i2);s2[Blen]=0; + f1 = fopen(s2, "a"); + if (!f1) { + fprintf(stderr, " could not access %s\n",s2); + return 1; + } + strncpy(s2+i2,s3,strlen(s3)); s2[i2+strlen(s3)]=0; + /* store image and infos about the char */ + /* ToDo: store the vector list instead of the pixelarray */ + + if (JOB->cfg.verbose) + fprintf(stderr, "store_db: add file %s to database\n#",s3); + dx=box1->x1-box1->x0+1; + dy=box1->y1-box1->y0+1; + b.p = (unsigned char *) malloc( dx * dy ); + if( !b.p ){ + fprintf( stderr, "\nFATAL: malloc failed, skip store_db" ); + return 2; + } + if (copybox(box1->p, box1->x0, box1->y0, dx, dy, &b, dx * dy)) + return -1; + + //writepbm(s2,&b); /* What is to do on error? */ + + free(b.p); + + /* store the database line */ + /* some infos about box1->m1,..,m4 should added (base line, high etc.) */ + if (box1->num_ac && box1->tas[0]) { + fprintf(f1, "%s \"%s\"\n",s3,box1->tas[0]); + /* ToDo: what if tas contains '"'? */ + } else { + if( (box1->c >= '0' && box1->c <= '9') + || (box1->c >= 'A' && box1->c <= 'Z') + || (box1->c >= 'a' && box1->c <= 'z') ) + fprintf(f1, "%s %c\n",s3,(char)box1->c); + else { + if (((box1->c)>>16)>>16) + fprintf(f1, "%s %08x\n",s3,(unsigned int)box1->c); + else + fprintf(f1, "%s %04x\n",s3,(unsigned int)box1->c); + } + } + fclose(f1); + return 0; +} + +/* function is only for user prompt on console to identify chars + it prints out a part of pixmap b at point x0,y0 to stderr + using dots .,; if no pixel, and @xoO for pixels + */ +void out_env(struct box *px ){ + int x0,y0,x1,y1,dx,dy,x,y,x2,y2,yy0,tx,ty,i,cs; + char c1, c2; pix *b; + cs=JOB->cfg.cs; + yy0=px->y0; + { /* overwrite rest of arguments */ + b=px->p; + x0=px->x0; x1=px->x1; dx=x1-x0+1; + y0=px->y0; y1=px->y1; dy=y1-y0+1; + y0-=2; y1+=2; + if (px->m4 && y0>px->m1) y0=px->m1; + if (px->m4 && y1m4) y1=px->m4; + if (x1-x0+1<52) { x0-=10; x1+=10; } /* fragment? expand frame */ + if (x1-x0+1<52) { x0-=10; x1+=10; } /* fragment? expand frame */ + if (x1-x0+1<62) { x0-=5; x1+=5; } + if (y1-y0+1<10) { y0-= 4; y1+= 4; } /* fragment? */ + if (x0<0) x0=0; if (x1>=b->x) x1=b->x-1; + if (y0<0) y0=0; if (y1>=b->y) y1=b->y-1; + dx=x1-x0+1; + dy=y1-y0+1; yy0=y0; + fprintf(stderr,"\n# show box + environment"); + fprintf(stderr,"\n# show box x= %4d %4d d= %3d %3d r= %d %d", + px->x0, px->y0, px->x1 - px->x0 + 1, px->y1 - px->y0 + 1, + px->x - px->x0, px->y - px->y0); + if (px->num_ac){ /* output table of chars and its probabilities */ + fprintf(stderr,"\n# list box char: "); + for(i=0;inum_ac && itas[i]) + fprintf(stderr," %s(%d)", px->tas[i] ,px->wac[i]); + else + fprintf(stderr," %s(%d)",decode(px->tac[i],ASCII),px->wac[i]); + } + fprintf(stderr,"\n"); + if (px->dots && px->m2 && px->m1m1; dy=px->y1-yy0+1; } + } + tx=dx/80+1; + ty=dy/40+1; // step, usually 1, but greater on large maps + fprintf(stderr,"# show pattern x= %4d %4d d= %3d %3d t= %d %d\n", + x0,y0,dx,dy,tx,ty); + if (dx>0) + for(y=yy0;yx0 || x > px->x1 + || y+ty-1 < px->y0 || y > px->y1) c1=((c1=='#')?'O':','); + fprintf(stderr,"%c", c1 ); + } + + c1=c2=' '; + /* mark lines with < */ + if (px) if (y==px->m1 || y==px->m2 || y==px->m3 || y==px->m4) c1='<'; + if (y==px->y0 || y==px->y1) c2='-'; /* boxmarks */ + fprintf(stderr,"%c%c\n",c1,c2); + } +} + + +/* +// second variant, for database (with slightly other behaviour) +// new variant +// look at the environment of the pixel too (contrast etc.) +// detailed analysis only of diff pixels! +// +// 100% * distance, 0 is best fit +// = similarity of 2 chars for recognition of noisy chars +// weigth of pixels with only one same neighbour set to 0 +// look at contours too! + ToDo: especially on small boxes distance should only be 0 if + characters are 100% identical! +*/ +// #define DEBUG 2 +int distance2( pix *p1, struct box *box1, + pix *p2, struct box *box2, int cs){ + int rc=0,x,y,v1,v2,i1,i2,rgood=0,rbad=0, + x1,y1,x2,y2,dx,dy,dx1,dy1,dx2,dy2,tx,ty; +#if DEBUG == 2 + if(JOB->cfg.verbose) + fprintf(stderr," DEBUG: distance2\n"); +#endif + x1=box1->x0;y1=box1->y0;x2=box2->x0;y2=box2->y0; + dx1=box1->x1-box1->x0+1; dx2=box2->x1-box2->x0+1; dx=((dx1>dx2)?dx1:dx2);dx=dx1; + dy1=box1->y1-box1->y0+1; dy2=box2->y1-box2->y0+1; dy=((dy1>dy2)?dy1:dy2);dy=dy1; + if(abs(dx1-dx2)>1+dx/16 || abs(dy1-dy2)>1+dy/16) rbad++; // how to weight? + // compare relations to baseline and upper line + if(box1->m4>0 && box2->m4>0){ // used ??? + if(2*box1->y1>box1->m3+box1->m4 && 2*box2->y1m3+box2->m4) rbad+=128; + if(2*box1->y0>box1->m1+box1->m2 && 2*box2->y0m1+box2->m2) rbad+=128; + } + tx=dx/16; if(dx<17)tx=1; // raster + ty=dy/32; if(dy<33)ty=1; + // compare pixels + for( y=0;y0) + rbad+=16*v1; + } + if(rgood+rbad) rc= 100*rbad/(rgood+rbad); else rc=99; + /* if width/high is not correct add badness */ + rc += ( abs(dx1*dy2-dx2*dy1) * 10 ) / (dy1*dy2); + if (rc>100) rc=100; + if(/* rc<10 && */ JOB->cfg.verbose /* &1024 */){ +#if DEBUG == 2 + fprintf(stderr," distance2 rc=%d rgood=%d rbad=%d\n",rc,rgood,rbad); +// out_b(NULL,p1,box1->x0,box1->y0,box1->x1-box1->x0+1, +// box1->y1-box1->y0+1,cs); +// out_b(NULL,p2,box2->x0,box2->y0,box2->x1-box2->x0+1, +// box2->y1-box2->y0+1,cs); + out_x(box1); + out_x(box2); +#endif + } + return rc; +} + +wchar_t ocr_db(struct box *box1) { + int dd = 1000, dist = 1000; + wchar_t c = UNKNOWN; + char buf[200]; + Box *box2, *box3; + + if (!list_empty(&JOB->tmp.dblist)){ + box3 = (Box *)list_get_header(&JOB->tmp.dblist); + if(JOB->cfg.verbose) + fprintf(stderr,"\n#DEBUG: ocr_db (%d,%d) ",box1->x0, box1->y0); + + for_each_data(&JOB->tmp.dblist) { + box2 = (Box *)list_get_current(&JOB->tmp.dblist); + /* do preselect!!! distance() slowly */ + dd = distance2( box2->p, box2, box1->p, box1, JOB->cfg.cs); + if (dd <= dist) { /* new best fit */ + dist = dd; + box3 = box2; /* box3 is a pointer and not copied box2 */ + + if (dist<100 && 100-dist > JOB->cfg.certainty) { + /* some deviation of the pattern is tolerated */ + int i, wa; + for (i=0;inum_ac;i++) { + wa = (100-dist)*box3->wac[i]/100; /* weight *= (100-dist) */ + if (box3->tas[i]) setas(box1,box3->tas[i],wa); + else setac(box1,box3->tac[i],wa); + } + if (box3->num_ac) c=box3->tac[0]; /* 0 for strings (!UNKNOWN) */ + if (JOB->cfg.verbose) + fprintf(stderr, " dist=%4d c= %c 0x%02x %s wc= %3d", dist, + ((box3->c>32 && box3->c<127) ? (char) box3->c : '.'), + (int)box3->c, ((box3->tas[0])?box3->tas[0]:""), box3->wac[0]); + } + if (dd<=0 && ((box3->num_ac && box3->tas[0]) || box3->c >= 128 + || !strchr ("l1|I0O", box3->c))) + break; /* speedup if found */ + } + } end_for_each(&JOB->tmp.dblist); + + } + + if( (JOB->cfg.mode&128) != 0 && c == UNKNOWN ) { /* prompt the user */ + /* should the output go to stderr or special pipe??? */ + int utf8_ok=0; /* trigger this flag if input is ok */ + int i, endchar; /* index */ + out_env(box1); /* old: out_x(box1); */ + fprintf(stderr,"The above pattern was not recognized.\n" + "Enter UTF8 char or string for above pattern. Leave empty if unsure.\n" + "Press RET at the end (ALT+RET to store into RAM only) : " + ); /* ToDo: empty + alt-return (0x1b 0x0a) for help? ^a for skip all */ + /* UTF-8 (man 7 utf-8): + * 7bit = 0xxxxxxx (0000-007F) + * 11bit = 110xxxxx 10xxxxxx (0080-07FF) + * 16bit = 1110xxxx 10xxxxxx 10xxxxxx (0800-FFFF) + * 21bit = 11110xxx 10xxxxxx 10xxxxxx 10xxxxxx + * 26bit = 111110xx 10xxxxxx 10xxxxxx 10xxxxxx 10xxxxxx + * 31bit = 1111110x 10xxxxxx 10xxxxxx 10xxxxxx 10xxxxxx 10xxxxxx + */ + buf[0]=0; + /* shift/ctrl/altgr-enter acts like enter or ^j or ^m, + * alt-enter returns 0x1b 0x0a and returns from fgets() + * ^d (EOF) returns (nil) from fgets() + * x+(2*)ctrl-d returns from fgets() without returning a 0x0a + * if not UTF-input-mode, we are in trouble? + * ^a=0x01, ^b=0x02, ^e=05, ..., ToDo: meaning of no-input or <=space + */ + fgets(buf,200,stdin); /* including \n=0x0a */ + dd=strlen(buf); + /* output hexcode if verbose set */ + if (JOB->cfg.verbose) { + fprintf(stderr, "\n# fgets [%d]:", dd); + for(i=0; icfg.mode&=~128; } /* skip all */ + buf[dd=i]=0; /* replace final 0x0a or other special codes */ + if (dd==1 && !(buf[0]&128)) { c=buf[0]; utf8_ok=1; } /* single char */ + if (dd>1 && dd<7) { /* try to decode single wide char (utf8) */ + int u0, u1; /* define UTF8-start sequences, u0=0bits u1=1bits */ + u0= 1<<(7-dd); /* compute start byte from UTF8-length */ + u1=255&~((1<<(8-dd))-1); + for (i=1;i0){ /* ToDo: skip space and tab too? */ + if (utf8_ok==1) { setac(box1, c, 100); } /* store single wchar */ + if (utf8_ok==0) { /* store a string of chars (UTF8-string) */ + c='_'; /* what should we do with c? probably a bad idea? */ + setas(box1, buf, 100); + } + /* decide between + * 0) just help gocr to find the results and (dont remember, 0x01) + * 1) help and remember in the same run (store to memory, 0x1b) + * 2) expand the database (dont store ugly chars to the database!) + */ + if (endchar!=0x01){ /* ^a before hit return */ + /* is there a reason to dont store to memory? */ + list_app(&JOB->tmp.dblist, box1); /* append to list for 1+2 */ + } + if (endchar!=0x01 && endchar!=0x1b){ + store_db(box1); /* store to disk for 2 */ + } + if (JOB->cfg.verbose) + fprintf(stderr, " got char= %c 16bit= 0x%04x string= \"%s\"\n", + ((c>32 && c<127)?(char)c:'.'), (int)c, buf); + } + } + + return c; +} diff --git a/lib/gocr/detect.c b/lib/gocr/detect.c new file mode 100644 index 0000000..bfd3ec9 --- /dev/null +++ b/lib/gocr/detect.c @@ -0,0 +1,943 @@ +/* +This is a Optical-Character-Recognition program +Copyright (C) 2000-2007 Joerg Schulenburg + +This program is free software; you can redistribute it and/or +modify it under the terms of the GNU General Public License +as published by the Free Software Foundation; either version 2 +of the License, or (at your option) any later version. + +This program is distributed in the hope that it will be useful, +but WITHOUT ANY WARRANTY; without even the implied warranty of +MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the +GNU General Public License for more details. + +You should have received a copy of the GNU General Public License +along with this program; if not, write to the Free Software +Foundation, Inc., 59 Temple Place - Suite 330, Boston, MA 02111-1307, USA. + + check README for my email address +*/ + +#include +#include +#include +#include // toupper, tolower +#include "pgm2asc.h" +#include "gocr.h" + +// ----- detect lines --------------- +/* suggestion: Fourier transform and set line frequency where the + amplitude has a maximum (JS: slow and not smarty enough). + + option: range for line numbers 1..1000 or similar + todo: look for thickest line, and divide if thickness=2*mean_thickness + Set these elements of the box structs: + + m1 <-- top of upper case letters and (bdfhkl) (can differ) + m2 <-- top of letters (acegmnopqrsuvwxyz) + m3 <-- baseline + m4 <-- bottom of hanging letters (gqpy) + + performance can be improved by working with a temporary + list of boxes of the special text line + + - Jun23,00 more robustness of m3 (test liebfrau1) + - Feb01,02 more robustness of m4 (test s46_084.pgm) + - Dec03,12 fix problems with footnotes + ToDo: + - generate lists of boxes per line (faster access) + - use statistics + - for each box look at it neighbours and set box-m1..m4 + - m[1..4].max .min if m4.min-m3.max<1 probability lower + */ +int detect_lines1(pix * p, int x0, int y0, int dx, int dy) +{ + int i, jj, j2, y, yy, my, mi, mc, i1, i2, i3, i4, + m1, m2, m3, m4, ma1, ma2, ma3, ma4, m3pre, m4pre; + struct box *box2, *box3; /* box3 is for verbose / debugging */ + struct tlines *lines = &JOB->res.lines; + + /* ToDo: optional read line-data from external source??? */ + if (lines->num == 0) { // initialize one dummy-line for pictures etc. + lines->m4[0] = 0; + lines->m3[0] = 0; + lines->m2[0] = 0; + lines->m1[0] = 0; + lines->x0[0] = p->x; /* expand to left end during detection */ + lines->x1[0] = 0; /* expand to right end */ + lines->pitch[0] = JOB->cfg.spc; /* default word pitch */ + lines->mono[0] = 0; /* default spacing = prop */ + lines->num++; + } + i = lines->num; + if (dy < 4) + return 0; /* image is to low for latin chars */ + my = jj = 0; + // get the mean height of all hollow chars + // (better than mean value of everything including bg-pattern or dust?) + for_each_data(&(JOB->res.boxlist)) { + box2 = (struct box *)list_get_current(&(JOB->res.boxlist)); + if ( box2->c != PICTURE + && box2->num_frames>1 && box2->num_frames<3 /* 1 or 2 holes */ + && box2->y0 >= y0 && box2->y1 <= y0 + dy + && box2->x0 >= x0 && box2->x1 <= x0 + dx + && box2->frame_vol[0]>0 + && box2->frame_vol[1]<0 + ) { + jj++; + my += box2->y1 - box2->y0 + 1; + } + } end_for_each(&(JOB->res.boxlist)); + if (jj==0) { + // get the mean height of all chars + for_each_data(&(JOB->res.boxlist)) { + box2 = (struct box *)list_get_current(&(JOB->res.boxlist)); + if ( box2->c != PICTURE + && box2->y1 - box2->y0 + 1 >= 4 /* 4x6 font */ + && box2->y0 >= y0 && box2->y1 <= y0 + dy + && box2->x0 >= x0 && box2->x1 <= x0 + dx ) { + jj++; + my += box2->y1 - box2->y0 + 1; + } + } end_for_each(&(JOB->res.boxlist)); + } + if (jj == 0) + return 0; /* no chars detected */ + + + /* ToDo: a better way could be to mark good boxes (of typical high a-zA-Z0-9) + * first and handle only marked boxes for line scan, exclude ?!,.:;etc + * but without setect the chars itself (using good statistics) + * see adjust_text_lines() + */ + my /= jj; /* we only care about chars with high arround my */ + if (JOB->cfg.verbose & 16) + fprintf(stderr,"\n# detect_lines1(%d %d %d %d) vvv&16 chars=%d my=%d\n# ", + x0, y0, dx, dy, jj, my); + // "my" is the average over the whole image (bad, if different fontsizes) + + if (my < 4) + return 0; /* mean high is to small => error */ + + m4pre=m3pre=y0; /* lower bond of upper line */ + // better function for scanning line around a letter ??? + // or define lines around known chars "eaTmM" + for (j2 = y = y0; y < y0 + dy; y++) { + // look for max. of upper and lower bound of next line + m1 = y0 + dy; + jj = 0; +#if 1 + /* this is only for test runs */ + if (JOB->cfg.verbose & 16) + fprintf(stderr,"searching new line %d\n# ",i /* lines->num */); +#endif + + box3 = NULL; /* mark the most upper box starting next line */ + // find highest point of next line => store to m1-min (m1>=y) + // only objects greater 2/3*my and smaller 3*my are allowed + // a higher "!" at end of line can result in a to low m1 + for_each_data(&(JOB->res.boxlist)) { + box2 = (struct box *)list_get_current(&(JOB->res.boxlist)); + if (box2->line>0 || box2->c == PICTURE) continue; + if (lines->dx) + yy = lines->dy * box2->x0 / (lines->dx); /* correct crooked lines */ + else yy=0; + if ( box2->y0 >= y + yy && box2->y1 < y0 + dy // lower than y + && box2->x0 >= x0 && box2->x1 < x0 + dx // within box ? + && box2->c != PICTURE // no picture + && box2->num_boxes <= 1 // ignore 2 for "!?i" 3 for "ä" + && 3 * (box2->y1 - box2->y0) > 2 * my // not to small + && (box2->y1 - box2->y0) < 3 * my // not to big + && (box2->y1 - box2->y0) > 4) // minimum absolute size + { + if (box2->y0 < m1 + yy) { + m1 = box2->y0 - yy; /* highest upper boundary */ + box3 = box2; + } + // fprintf(stderr,"\n %3d %3d %+3d %d m1= %3d", + // box2->x0, box2->y0, box2->y1 - box2->y0 + 1, box2->num_boxes, m1); + } + } end_for_each(&(JOB->res.boxlist)); + if (!box3 || m1 >= y0+dy) break; /* no further line found */ + if (JOB->cfg.verbose & 16) + fprintf(stderr," most upper box at new line xy= %4d %4d %+4d %+4d\n# ", + box3->x0, box3->y0, box3->x1-box3->x0, box3->y1-box3->y0); + + // at the moment values depend from single chars, which can + // result in bad values (ex: 4x6 /\=) + // ToDo: 2) mean size of next line (store list of y0,y1) + // ToDo: 3) count num0[(y0-m1)*16/my], num1[(y1-m1)*16/my] + // ToDo: or down-top search horizontal nerarest neighbours + lines->x0[i] = x0 + dx - 1; /* expand during operation to left end */ + lines->x1[i] = x0; /* expand to the right end of line */ + m4=m2=m1; mi=m1+my; m3=m1+2*my; jj=0; + // find limits for upper bound, base line and ground line + // m2-max m3-min m4-max + for_each_data(&(JOB->res.boxlist)) { + box2 = (struct box *)list_get_current(&(JOB->res.boxlist)); + if (box2->line>0 || box2->c == PICTURE) continue; + if ( box2->y0 < y0 || box2->y1 >= y0 + dy + || box2->x0 < x0 || box2->x1 >= x0 + dx ) continue; // out of image + if (lines->dx) yy = lines->dy * box2->x0 / (lines->dx); + else yy=0; + /* check for ij-dots, used if chars of same high */ + if ( box2->y0 >= y + yy + && box2->y0 >= y + && (box2->y1 - box2->y0) < my + && box2->y1 < m1 + yy + my/4 + && box2->y0 < mi + yy ) { + mi = box2->y0 - yy; /* highest upper boundary i-dot */ + } + // fprintf(stderr,"\n check %3d %3d-%3d y=%d yy=%d m1=%d", box2->x0, box2->y0, box2->y1, y, yy, m1); + /* get m2-max m3-min m4-max */ + if ( box2->y0 >= y + yy // lower than y + && 3 * (box2->y1 - box2->y0 + 1) > 2 * my // right size ? + && (box2->y1 - box2->y0 + 1) < 3 * my // font mix, size = 2.6*my + && (box2->y1 - box2->y0 + 1) > 3 // 4x6 lowercase=4 + && box2->y0 >= m1 // in m1 range? + && box2->y0 <= m1 + yy + 9 * my / 8 // my can be to small if mixed + // ToDo: we need a better (local?) algorithm for big headlines > 2*my + && box2->y1 <= m1 + yy + 3 * my + && box2->y1 >= m1 + yy + my / 2 + // lines can differ in high, my may be to small (smaller headlines) + && box2->y0+box2->y1 <= 2*box3->y1 + ) + { + jj++; // count chars for debugging purpose + if (box2->y0 > m2 + yy) { + m2 = box2->y0 - yy; /* highest upper boundary */ + if (JOB->cfg.verbose & 16) + fprintf(stderr," set m2= %d yy= %d\n# ",m2, yy); + } + if (box2->y1 > m4 + yy && (my>6 || box2->y1 < m3+my)) { + m4 = box2->y1 - yy; /* lowest lower boundary, small font lines can touch */ + } + if ( box2->y1 < m3 + yy + && ( ( 2*box2->y1 > m2+ m4+yy && m2>m1) + || ( 4*box2->y1 > m1+3*m4+yy) ) ) // care for TeX: \(^1\)Footnote 2003 + /* "'!?" could cause trouble here, therefore this lines */ + /* ToDo: get_bw costs time, check pre and next */ + if( get_bw(box2->x0,box2->x1,box2->y1+1 ,box2->y1+my/2,box2->p,JOB->cfg.cs,1) == 0 + || get_bw(box2->x0,box2->x1,box2->y1+my/2,box2->y1+my/2,box2->p,JOB->cfg.cs,1) == 1 + || num_cross(box2->x0,box2->x1,(box2->y0+box2->y1)/2,(box2->y0+box2->y1)/2,box2->p,JOB->cfg.cs)>2 ) + { + m3 = box2->y1 - yy; /* highest lower boundary */ + // printf("\n# set1 m3 m=%3d %+2d %+2d %+2d",m1,m2-m1,m3-m1,m4-m1); + // out_x(box2); + } + if (box2->y0 + box2->y1 > 2*(m3 + yy) + && box2->y1 < m4 + yy - my/4 -1 + && box2->y1 >= (m2 + m4)/2 // care for TeX: \(^1\)Footnote 2003 + && m2 > m1 ) // be sure to not use ', m2 must be ok + { + m3 = box2->y1 - yy; /* highest lower boundary */ + // printf("\n# set2 m3 m=%3d %+2d %+2d %+2d",m1,m2-m1,m3-m1,m4-m1); + // out_x(box2); + } + if (box2->x1>lines->x1[i]) lines->x1[i] = box2->x1; /* right end */ + if (box2->x0x0[i]) lines->x0[i] = box2->x0; /* left end */ + // printf(" m=%3d %+2d %+2d %+2d yy=%3d\n",m1,m2-m1,m3-m1,m4-m1,yy); + } + } end_for_each(&(JOB->res.boxlist)); + +#if 1 + /* this is only for test runs */ + if (JOB->cfg.verbose & 16) + fprintf(stderr," step 1 y=%4d m= %4d %+3d %+3d %+3d" + " my=%2d chars=%3d\n# ", + y, m1, m2-m1, m3-m1, m4-m1, my, jj); +#endif + + if (m3 == m1) + break; +#if 1 /* make averages about the line */ + // same again better estimation + mc = (3 * m3 + m1) / 4; /* lower center ? */ + ma1 = ma2 = ma3 = ma4 = i1 = i2 = i3 = i4 = jj = 0; + for_each_data(&(JOB->res.boxlist)) { + box2 = (struct box *)list_get_current(&(JOB->res.boxlist)); + if (box2->line>0 || box2->c == PICTURE) continue; + if (lines->dx) yy = lines->dy * box2->x0 / (lines->dx); else yy=0; + if (box2->y0 >= y + yy && box2->y1 < y0 + dy // lower than y + && box2->x0 >= x0 && box2->x1 < x0 + dx // in box ? + && box2->c != PICTURE // no picture + && 2 * (box2->y1 - box2->y0) > my // right size ? + && (box2->y1 - box2->y0) < 4 * my) { + if ( box2->y0 - yy >= m1-my/4 + && box2->y0 - yy <= m2+my/4 + && box2->y1 - yy >= m3-my/4 + && box2->y1 - yy <= m4+my/4 ) { /* its within allowed range! */ + // jj++; // not used + if (abs(box2->y0 - yy - m1) <= abs(box2->y0 - yy - m2)) + { i1++; ma1 += box2->y0 - yy; } + else { i2++; ma2 += box2->y0 - yy; } + if (abs(box2->y1 - yy - m3) < abs(box2->y1 - yy - m4)) + { i3++; ma3 += box2->y1 - yy; } + else { i4++; ma4 += box2->y1 - yy; } + if (box2->x1>lines->x1[i]) lines->x1[i] = box2->x1; /* right end */ + if (box2->x0x0[i]) lines->x0[i] = box2->x0; /* left end */ + } + } + } end_for_each(&(JOB->res.boxlist)); + + if (i1) m1 = (ma1+i1/2) / i1; /* best rounded */ + if (i2) m2 = (ma2+i2/2) / i2; + if (i3) m3 = (ma3+i3-1) / i3; /* round up */ + if (i4) m4 = (ma4+i4-1) / i4; + // printf("\n# .. set3 m3 m=%3d %+2d %+2d %+2d",m1,m2-m1,m3-m1,m4-m1); + +#endif + + /* expand right and left end of line */ + for_each_data(&(JOB->res.boxlist)) { + box2 = (struct box *)list_get_current(&(JOB->res.boxlist)); + if (box2->line>0 || box2->c == PICTURE) continue; + if (lines->dx) yy = lines->dy * box2->x0 / (lines->dx); else yy=0; + if ( box2->y0 >= y0 && box2->y1 < y0 + dy + && box2->x0 >= x0 && box2->x1 < x0 + dx // in box ? + && box2->c != PICTURE // no picture + && box2->y0 >= m1-1 + && box2->y0 <= m4 + && box2->y1 >= m1 + && box2->y1 <= m4+1 ) { /* its within line */ + if (box2->x1>lines->x1[i]) lines->x1[i] = box2->x1; /* right end */ + if (box2->x0x0[i]) lines->x0[i] = box2->x0; /* left end */ + } + } end_for_each(&(JOB->res.boxlist)); + +#if 1 + /* this is only for test runs */ + if (JOB->cfg.verbose & 16) + fprintf(stderr," step 2 y=%4d m= %4d %+3d %+3d %+3d\n# ", + y,m1,m2-m1,m3-m1,m4-m1); +#endif + + if (m4 == m1) { + if(m3+m4>2*y) y = (m4+m3)/2; /* lower end may overlap the next line */ + continue; + } + jj=0; + lines->wt[i] = 100; + if (5 * (m2 - m1 +1) < m3 - m2 || (m2 - m1) < 2) jj|=1; /* same high */ + if (5 * (m4 - m3 +1) < m3 - m2 || (m4 - m3) < 1) jj|=2; /* same base */ + if (jj&1) lines->wt[i] = 75*lines->wt[i]/100; + if (jj&2) lines->wt[i] = 75*lines->wt[i]/100; + if (jj>0 && JOB->cfg.verbose) { + fprintf(stderr," trouble on line %d, wt*100= %d\n",i,lines->wt[i]); + fprintf(stderr,"# m= %4d %+3d %+3d %+3d\n",m1,m2-m1,m3-m1,m4-m1); + fprintf(stderr,"# i= %3d %3d %3d %3d (counts)\n",i1,i2,i3,i4); + if (jj==3) fprintf(stderr,"# all boxes of same high!\n# "); + if (jj==1) fprintf(stderr,"# all boxes of same upper bound!\n# "); + if (jj==2) fprintf(stderr,"# all boxes of same lower bound!\n# "); + } + /* ToDo: check for dots ij,. to get the missing information */ +#if 1 + /* jj=3: ABCDEF123456 or mnmno or gqpy or lkhfdtb => we are in trouble */ + if (jj==3 && (m4-m1)>my) { jj=0; m2=m1+my/8+1; m4=m3+my/8+1; } /* ABC123 */ + /* using idots, may fail on "ABCDEFGÄÜÖ" */ + if (jj==3 && mi>0 && mim4pre) { jj=2; m1=mi; } /* use ij dots */ + if (jj==1 && m2-(m3-m2)/4>m3pre ) { /* expect: acegmnopqrsuvwxyz */ + if (m1-m4pre0 && JOB->cfg.verbose & 16) { + fprintf(stderr," m= %4d %+2d %+2d %+2d my= %4d\n# ", + m1, m2-m1, m3-m1, m4-m1, my); + } +#endif + + + { // empty space between lines + lines->m4[i] = m4; + lines->m3[i] = m3; + lines->m2[i] = m2; + lines->m1[i] = m1; + lines->pitch[i] = JOB->cfg.spc; /* default word pitch */ + lines->pitch[i] = 0; /* default spacing */ + if (JOB->cfg.verbose & 16) + fprintf(stderr, " m= %4d %+3d %+3d %+3d w= %d (line=%d)\n# ", + m1, m2 - m1, m3 - m1, m4 - m1, lines->wt[i], i); + if (i < MAXlines && m4 - m1 > 4) + i++; + if (i >= MAXlines) { + fprintf(stderr, "Warning: lines>MAXlines\n"); + break; + } + } + if (m3+m4>2*y) y = (m3+m4)/2; /* lower end may overlap the next line */ + if (m3>m3pre) m3pre = m3; else m3=y0; /* set for next-line scan */ + if (m4>m4pre) m4pre = m4; else m4=y0; /* set for next-line scan */ + } + lines->num = i; + if (JOB->cfg.verbose) + fprintf(stderr, " num_lines= %d", lines->num-1); + return 0; +} + +// ----- layout analyzis of dx*dy region at x0,y0 ----- +// ----- detect lines via recursive division (new version) --------------- +// what about text in frames??? +// ToDo: change to bottom-top analyse or/and take rotation into account +int detect_lines2(pix *p,int x0,int y0,int dx,int dy,int r){ + int i,x2,y2,x3,y3,x4,y4,x5,y5,y6,mx,my,x30,x31,y30,y31; + struct box *box2,*box3; + // shrink box + if(dx<=0 || dy<=0) return 0; + if(y0+dy< p->y/128 && y0==0) return 0; /* looks like dust */ + if(y0>p->y-p->y/128 && y0+dy==p->y) return 0; /* looks like dust */ + + if(r>1000){ return -1;} // something is wrong + if(JOB->cfg.verbose)fprintf(stderr,"\n# r=%2d ",r); + + mx=my=i=0; // mean thickness + // remove border, shrink size + x2=x0+dx-1; // min x + y2=y0+dy-1; // min y + x3=x0; // max x + y3=y0; // max y + for_each_data(&(JOB->res.boxlist)) { + box3 = (struct box *)list_get_current(&(JOB->res.boxlist)); + if(box3->y0>=y0 && box3->y1x0>=x0 && box3->x1x1 > x3 ) x3=box3->x1; // max x + if( box3->x0 < x2 ) x2=box3->x0; // min x + if( box3->y1 > y3 ) y3=box3->y1; // max y + if( box3->y0 < y2 ) y2=box3->y0; // min y + if(box3->c!=PICTURE) + if( box3->y1 - box3->y0 > 4 ) + { + i++; + mx+=box3->x1-box3->x0+1; // mean x + my+=box3->y1-box3->y0+1; // mean y + } + } + } end_for_each(&(JOB->res.boxlist)); + x0=x2; dx=x3-x2+1; + y0=y2; dy=y3-y2+1; + + if(i==0 || dx<=0 || dy<=0) return 0; + mx/=i;my/=i; + // better look for widest h/v-gap, ToDo: vertical lines? + if(r<8){ // max. depth + + // detect widest horizontal gap + y2=y3=y4=y5=y6=0; + x2=x3=x4=x5=y5=0;// min. 3 lines + // position and thickness of gap, y6=num_gaps, nbox^2 ops + for_each_data(&(JOB->res.boxlist)) { // not very efficient, sorry + box2 = (struct box *)list_get_current(&(JOB->res.boxlist)); + if( box2->c!=PICTURE ) /* ToDo: not sure, that this is a good idea */ + if( box2->y0>=y0 && box2->y1x0>=x0 && box2->x1y1-box2->y0>my/2 ){ // no pictures & dust??? + + y4=y0+dy-1; // nearest vert. box + x4=x0+dx-1; + // ToDo: rotate back box2->x1,y1 to x21,y21 + // look for nearest lowest (y4) and right (x4) neighbour + // of every box (box2) + for_each_data(&(JOB->res.boxlist)) { + box3 = (struct box *)list_get_current(&(JOB->res.boxlist)); + if(box3!=box2) + if(box3->y0>=y0 && box3->y1x0>=x0 && box3->x1c!=PICTURE) /* ToDo: not sure, that this is a good idea */ + if(box3->y1-box3->y0>my/2 ){ + // ToDo: here we need the rotation around box2 + x30=box3->x0; + x31=box3->x1; + y30=box3->y0; + y31=box3->y1; + // get min. distances to lower and to right direction + if( y31 > box2->y1 && y30 < y4 ) y4=y30-1; + if( x31 > box2->x1 && x30 < x4 ) x4=x30-1; + } + } end_for_each(&(JOB->res.boxlist)); + // set the witdht and position of largest hor./vert. gap + // largest gap: width position + if( y4-box2->y1 > y3 ) { y3=y4-box2->y1; y2=(y4+box2->y1)/2; } + if( x4-box2->x1 > x3 ) { x3=x4-box2->x1; x2=(x4+box2->x1)/2; } + } + } end_for_each(&(JOB->res.boxlist)); + // fprintf(stderr,"\n widest y-gap= %4d %4d",y2,y3); + // fprintf(stderr,"\n widest x-gap= %4d %4d",x2,x3); + + i=0; // i=1 at x, i=2 at y + // this is the critical point + // is this a good decision or not??? + if(x3>0 || y3>0){ + if(x3>mx && x3>2*y3 && (dy>5*x3 || (x3>10*y3 && y3>0))) i=1; else + if(dx>5*y3 && y3>my) i=2; + } + + // compare with largest box??? + for_each_data(&(JOB->res.boxlist)) { // not very efficient, sorry + box2 = (struct box *)list_get_current(&(JOB->res.boxlist)); + if( box2->c == PICTURE ) + if( box2->y0>=y0 && box2->y1x0>=x0 && box2->x1x1-box2->x0+4 > dx && box2->y1+4y1+1; i=2; break; } + if( box2->x1-box2->x0+4 > dx && box2->y0-4>y0 ) { y3=1; y2=box2->y0-1; i=2; break; } + if( box2->y1-box2->y0+4 > dy && box2->x1+4x1+1; i=1; break; } + if( box2->y1-box2->y0+4 > dy && box2->x0-4>x0 ) { x3=1; x2=box2->x0-1; i=1; break; } + } + } end_for_each(&(JOB->res.boxlist)); + if(JOB->cfg.verbose)fprintf(stderr," i=%d",i); + + if(JOB->cfg.verbose && i) fprintf(stderr," divide at %s x=%4d y=%4d dx=%4d dy=%4d", + ((i)?( (i==1)?"x":"y" ):"?"),x2,y2,x3,y3); + // divide horizontally if v-gap is thicker than h-gap + // and length is larger 5*width + if(i==1){ detect_lines2(p,x0,y0,x2-x0+1,dy,r+1); + return detect_lines2(p,x2,y0,x0+dx-x2+1,dy,r+1); } + // divide vertically + if(i==2){ detect_lines2(p,x0,y0,dx,y2-y0+1,r+1); + return detect_lines2(p,x0,y2,dx,y0+dy-y2+1,r+1); + } + } + + + if(JOB->cfg.verbose) if(dx<5 || dy<7)fprintf(stderr," empty box"); + if(dx<5 || dy<7) return 0; // do not care about dust + if(JOB->cfg.verbose)fprintf(stderr, " box detected at %4d %4d %4d %4d",x0,y0,dx,dy); + if(JOB->tmp.ppo.p){ + for(i=0;itmp.ppo,x0+i ,y0 ,255,16); + for(i=0;itmp.ppo,x0+i ,y0+dy-1,255,16); + for(i=0;itmp.ppo,x0 ,y0+i ,255,16); + for(i=0;itmp.ppo,x0+dx-1,y0+i ,255,16); + // writebmp("out10.bmp",p2,JOB->cfg.verbose); // colored should be better + } + return detect_lines1(p,x0-0*1,y0-0*2,dx+0*2,dy+0*3); + +/* + struct tlines *lines = &JOB->res.lines; + i=lines->num; lines->num++; + lines->m1[i]=y0; lines->m2[i]=y0+5*dy/16; + lines->m3[i]=y0+12*dy/16; lines->m4[i]=y0+dy-1; + lines->x0[i]=x0; lines->x1[i]=x0+dx-1; + if(JOB->cfg.verbose)fprintf(stderr," - line= %d",lines->num); + return 0; + */ +} + +/* ToDo: herons algorithm for square root x=(x+y/x)/2 is more efficient + * than interval subdivision (?) (germ.: Intervallschachtelung) + * without using matlib + * see http://www.math.vt.edu/people/brown/doc/sqrts.pdf + */ +int my_sqrt(int x){ + int y0=0,y1=x,ym; + for (;y0res.lines.{dx,dy} + * pass 1: get mean vector to nearest char + * pass 2: get mean vector to nearest char without outriders to pass 1 + * extimate direction as (dx,dy,num)[pass] + * ToDo: estimate an error, boxes only work fine for zero-rotation + * for 45 degree use vectors, not boxes to get base line + */ +#define INorm 1024 /* integer unit 1.0 */ +int detect_rotation_angle(job_t *job){ + struct box *box2, *box3, + *box_nn; /* nearest neighbour box */ + int x2, y2, x3, y3, dist, mindist, pass, + rx=0, ry=0, re=0, // final result + /* to avoid 2nd run, wie store pairs in 2 different categories */ + nn[4]={0,0,0,0}, /* num_pairs used for estimation [(pass-1)%2,pass%2] */ + dx[4]={0,0,0,0}, /* x-component of rotation vector per pass */ + dy[4]={0,0,0,0}, /* y-component of rotation vector per pass */ + er[4]={INorm/4,0,0,0}; /* mean angle deviation to pass-1 (radius^2) */ + // de; /* ToDo: absolute maximum error (dx^2+dy^2) */ + // ToDo: next pass: go to bigger distances and reduce max error + // error is diff between passes? or diff of bottoms and top borders (?) + + rx=1024; ry=0; // default + for (pass=0;pass<4;pass++) { + for_each_data(&(job->res.boxlist)) { + box2 = (struct box *)list_get_current(&(job->res.boxlist)); + if (box2->c==PICTURE) continue; + /* subfunction probability of char */ + // i? + // if (box2->x1 - box2->x0 < 3) continue; /* smallest font is 4x6 */ + if (box2->y1 - box2->y0 < 4) continue; + /* set maximum possible distance */ + box_nn=box2; // initial box to compare with + + // ToDo: clustering or majority + // the algorithm is far from being perfect, pitfalls are likely + // but its better than the old algorithm, ToDo: database-rotated-images + mindist = job->src.p.x * job->src.p.x + job->src.p.y * job->src.p.y; + /* get middle point of the box */ + x2 = (box2->x0 + box2->x1)/2; + y2 = (box2->y0 + box2->y1)/2; + re=0; + /* search for nearest neighbour box_nn[pass+1] of box_nn[pass] */ + for_each_data(&(job->res.boxlist)) { + box3 = (struct box *)list_get_current(&(job->res.boxlist)); + /* try to select only potential neighbouring chars */ + /* select out all senseless combinations */ + if (box3->c==PICTURE || box3==box2) continue; + x3 = (box3->x0 + box3->x1)/2; + y3 = (box3->y0 + box3->y1)/2; /* get middle point of the box */ + if (x3 pass-1? + // scalprod max in direction, cross prod min in direction + // a,b (vectors): ^2/(|a|*|b|)^2 = 0(90deg)..0.5(45deg).. 1(0deg) + // * 1024 ?? + if (pass>0) { // new variant = scalar product + // danger of int overflow, ToDo: use int fraction + re =(int) ((1.*(x3-x2)*dx[pass-1]+(y3-y2)*dy[pass-1]) + *(1.*(x3-x2)*dx[pass-1]+(y3-y2)*dy[pass-1])*INorm + /(1.*((x3-x2)*(x3-x2)+(y3-y2)*(y3-y2)) + *(1.*dx[pass-1]*dx[pass-1]+dy[pass-1]*dy[pass-1]))); + if (INorm-re>er[pass-1]) continue; // hits mean deviation + } + /* neighbours should have same order of size (?) */ + if (3*(box3->y1-box3->y0+4) < 2*(box2->y1-box2->y0+1)) continue; + if (2*(box3->y1-box3->y0+1) > 3*(box2->y1-box2->y0+4)) continue; + if (2*(box3->x1-box3->x0+1) > 5*(box2->x1-box2->x0+4)) continue; + if (5*(box3->x1-box3->x0+4) < 2*(box2->x1-box2->x0+1)) continue; + /* should be in right range, Idea: center3 outside box2? noholes */ + if ((x3x1-1) && (x3>box2->x0+1) + && (y3y1-1) && (y3>box2->y0+1)) continue; + // if chars are of different size, connect careful + if ( abs(x3-x2) > 2*(box2->x1 - box2->x0 + box3->x1 - box3 ->x0 + 2)) continue; + if ( abs(y3-y2) > (box2->x1 - box2->x0 + box3->x1 - box3 ->x0 + 2)) continue; + dist = (y3-y2)*(y3-y2) + (x3-x2)*(x3-x2); + // make distances in pass-1 directions shorter or continue if not in pass-1 range? + if (dist<9) continue; /* minimum distance^2 is 3^2 */ + if (distres.boxlist)); + + if (box_nn==box2) continue; /* has no neighbour, next box */ + + box3=box_nn; dist=mindist; + x3 = (box3->x0 + box3->x1)/2; + y3 = (box3->y0 + box3->y1)/2; /* get middle point of the box */ + // dist = my_sqrt(1024*((x3-x2)*(x3-x2)+(y3-y2)*(y3-y2))); + // compare with first box + x2 = (box2->x0 + box2->x1)/2; + y2 = (box2->y0 + box2->y1)/2; + // if the high of neighbouring boxes differ, use min diff (y0,y1) + if (pass>0 && 16*abs(dy[pass-1]) < dx[pass-1]) // dont work for strong rot. + if (abs(box2->y1-box2->y0-box3->y1+box3->y0)>(box2->y1-box2->y0)/8) { + // ad eh ck ... + if (abs(box2->y1-box3->y1)y1; y3=box3->y1; } + // ag ep qu ... + if (abs(box2->y0-box3->y0)y0; y3=box3->y0; } + } + if (abs(x3-x2)<4) continue; + dx[pass]+=(x3-x2)*1024; /* normalized before averaging */ + dy[pass]+=(y3-y2)*1024; /* 1024 is for the precision */ + nn[pass]++; + if (pass>0) { // set error = mean deviation from pass -1 + re = INorm-(int)((1.*(x3-x2)*dx[pass-1]+(y3-y2)*dy[pass-1]) + *(1.*(x3-x2)*dx[pass-1]+(y3-y2)*dy[pass-1])*INorm + /((1.*(x3-x2)*(x3-x2)+(y3-y2)*(y3-y2)) + *(1.*dx[pass-1]*dx[pass-1]+dy[pass-1]*dy[pass-1])) + ); + er[pass]+=re; + } +#if 0 + if(JOB->cfg.verbose) + fprintf(stderr,"# next nb (x,y,dx,dy,re) %6d %6d %5d %5d %5d pass %d\n", + x2, y2, x3-x2, y3-y2, re, pass+1); +#endif + } end_for_each(&(job->res.boxlist)); + if (!nn[pass]) break; + if (nn[pass]) { + /* meanvalues */ + rx=dx[pass]/=nn[pass]; + ry=dy[pass]/=nn[pass]; + if (pass>0) er[pass]/=nn[pass]; + } + if(JOB->cfg.verbose) + fprintf(stderr,"# rotation angle (x,y,maxr,num)" + " %6d %6d %6d %4d pass %d\n", + rx, ry, er[pass], nn[pass], pass+1); + } + if (abs(ry*100)>abs(rx*50)) + fprintf(stderr,"\n"); + /* ToDo: normalize to 2^10 bit (square fits to 32 it) */ + JOB->res.lines.dx=rx; + JOB->res.lines.dy=ry; + return 0; +} + +/* ----- detect lines --------------- */ +int detect_text_lines(pix * pp, int mo) { + + if (JOB->cfg.verbose) + fprintf(stderr, "# detect.c detect_text_lines (vvv=16 for more info) "); + if (mo & 4){ + if (JOB->cfg.verbose) fprintf(stderr, "# zoning\n# ... "); + detect_lines2(pp, 0, 0, pp->x, pp->y, 0); // later replaced by better algo + } else + detect_lines1(pp, 0, 0, pp->x, pp->y); // old algo + + if(JOB->cfg.verbose) fprintf(stderr,"\n"); + return 0; +} + + +/* ----- adjust lines --------------- */ +// rotation angle? JOB->res.lines.dy, .x0 removed later +// this is for cases, where m1..m4 is not very sure detected before +// chars are recognized +int adjust_text_lines(pix * pp, int mo) { + struct box *box2; + int *m, /* summ m1..m4, num_chars for m1..m4, min m1..m4, max. m1..m4 */ + l, i, dy, dx, diff=0, y0, y1; + + if ((l=JOB->res.lines.num)<2) return 0; // ??? + if (JOB->cfg.verbose) + fprintf(stderr, "# adjust text lines "); + m=(int *)malloc(l*16*sizeof(int)); + if (!m) { fprintf(stderr," malloc failed\n"); return 0;} + for (i=0;i<16*l;i++) m[i]=0; /* initialize */ + dy=JOB->res.lines.dy; /* tan(alpha) of skewing */ + dx=JOB->res.lines.dx; /* old: width of image */ + // js: later skewing is replaced by one transformation of vectorized image + + if (dx) + for_each_data(&(JOB->res.boxlist)) { + box2 = (struct box *)list_get_current(&(JOB->res.boxlist)); + if (box2->line<=0) continue; + if (box2->num_ac<1) continue; + if (box2->wac[0]<95) continue; + if (box2->m2==0 || box2->y1m2) continue; // char outside line + if (box2->m3==4 || box2->y0>box2->m3) continue; // char outside line + y0=box2->y0-((box2->x1)*dy/dx); /* corrected by page skewing */ + y1=box2->y1-((box2->x1)*dy/dx); + if (strchr("aemnr",(char)box2->tac[0])) { // cC vV sS oO ... is unsure! + m[box2->line*16+1]+=y0; m[box2->line*16+5]++; // num m2 + m[box2->line*16+2]+=y1; m[box2->line*16+6]++; // num m3 + if (m[box2->line*16+ 9]>y0) m[box2->line*16+ 9]=y0; /* min m2 */ + if (m[box2->line*16+13]line*16+13]=y0; /* max m2 */ + if (m[box2->line*16+10]>y1) m[box2->line*16+10]=y1; /* min m3 */ + if (m[box2->line*16+14]line*16+14]=y1; /* max m3 */ + } + if (strchr("bdhklABDEFGHIKLMNRT123456789",(char)box2->tac[0])) { + m[box2->line*16+0]+=y0; m[box2->line*16+4]++; // num m1 + m[box2->line*16+2]+=y1; m[box2->line*16+6]++; // num m3 + if (m[box2->line*16+ 8]>y0) m[box2->line*16+ 8]=y0; /* min m1 */ + if (m[box2->line*16+12]line*16+12]=y0; /* max m1 */ + if (m[box2->line*16+10]>y1) m[box2->line*16+10]=y1; /* min m3 */ + if (m[box2->line*16+14]line*16+14]=y1; /* max m3 */ + } + if (strchr("gq",(char)box2->tac[0])) { + m[box2->line*16+1]+=y0; m[box2->line*16+5]++; // num m2 + m[box2->line*16+3]+=y1; m[box2->line*16+7]++; // num m4 + if (m[box2->line*16+ 9]>y0) m[box2->line*16+ 9]=y0; /* min m2 */ + if (m[box2->line*16+13]line*16+13]=y0; /* max m2 */ + if (m[box2->line*16+11]>y1) m[box2->line*16+11]=y1; /* min m4 */ + if (m[box2->line*16+15]line*16+15]=y1; /* max m4 */ + } + } end_for_each(&(JOB->res.boxlist)); + + for (i=1;ires.lines.m1[i]-m[i*16+0]/m[i*16+4]); + if (m[i*16+5]) diff+=abs(JOB->res.lines.m2[i]-m[i*16+1]/m[i*16+5]); + if (m[i*16+6]) diff+=abs(JOB->res.lines.m3[i]-m[i*16+2]/m[i*16+6]); + if (m[i*16+7]) diff+=abs(JOB->res.lines.m4[i]-m[i*16+3]/m[i*16+7]); + /* recalculate sureness, empirically */ + if (m[i*16+4]*m[i*16+5]*m[i*16+6]*m[i*16+7] > 0) + JOB->res.lines.wt[i]=(JOB->res.lines.wt[i]+100)/2; + else + JOB->res.lines.wt[i]=(JOB->res.lines.wt[i]*90)/100; + // set mean values of sure detected bounds (rounded precisely) + if ( m[i*16+4]) JOB->res.lines.m1[i]=(m[i*16+0]+m[i*16+4]/2)/m[i*16+4]; + if ( m[i*16+5]) JOB->res.lines.m2[i]=(m[i*16+1]+m[i*16+5]/2)/m[i*16+5]; + if ( m[i*16+6]) JOB->res.lines.m3[i]=(m[i*16+2]+m[i*16+6]/2)/m[i*16+6]; + if ( m[i*16+7]) JOB->res.lines.m4[i]=(m[i*16+3]+m[i*16+7]/2)/m[i*16+7]; + // care about very small fonts + if (JOB->res.lines.m2[i]-JOB->res.lines.m1[i]<=1 && m[i*16+5]==0 && m[i*16+4]) + JOB->res.lines.m2[i]=JOB->res.lines.m1[i]+2; + if (JOB->res.lines.m2[i]-JOB->res.lines.m1[i]<=1 && m[i*16+4]==0 && m[i*16+5]) + JOB->res.lines.m1[i]=JOB->res.lines.m2[i]-2; + if (JOB->res.lines.m4[i]-JOB->res.lines.m3[i]<=1 && m[i*16+7]==0 && m[i*16+6]) + JOB->res.lines.m4[i]=JOB->res.lines.m3[i]+2; + if (JOB->res.lines.m4[i]-JOB->res.lines.m3[i]<=1 && m[i*16+6]==0 && m[i*16+7]) + JOB->res.lines.m3[i]=JOB->res.lines.m4[i]-2; + if ( m[i*16+7]<1 && + JOB->res.lines.m4[i] + <=JOB->res.lines.m3[i]+(JOB->res.lines.m3[i]-JOB->res.lines.m2[i])/4 ) + JOB->res.lines.m4[i]= + JOB->res.lines.m3[i]+(JOB->res.lines.m3[i]-JOB->res.lines.m2[i])/4; + if ( m[i*16+7]<1 && m[i*16+12+2]>0 && // m4 < max.m3+.. + JOB->res.lines.m4[i] < 2*m[i*16+12+2]-JOB->res.lines.m3[i]+2 ) + JOB->res.lines.m4[i] = 2*m[i*16+12+2]-JOB->res.lines.m3[i]+2; + if (JOB->res.lines.m4[i]<=JOB->res.lines.m3[i]) + JOB->res.lines.m4[i]= JOB->res.lines.m3[i]+1; /* 4x6 */ + + if (JOB->cfg.verbose & 17) + fprintf(stderr, "\n# line= %3d m= %4d %+3d %+3d %+3d " + " n= %2d %2d %2d %2d w= %3d diff= %d", + i, JOB->res.lines.m1[i], + JOB->res.lines.m2[i] - JOB->res.lines.m1[i], + JOB->res.lines.m3[i] - JOB->res.lines.m1[i], + JOB->res.lines.m4[i] - JOB->res.lines.m1[i], + m[i*16+4],m[i*16+5],m[i*16+6],m[i*16+7], + JOB->res.lines.wt[i], diff); + } + diff=0; // count adjusted chars +#if 1 + if (dx) + for_each_data(&(JOB->res.boxlist)) { + box2 = (struct box *)list_get_current(&(JOB->res.boxlist)); + if (box2->line<=0) continue; + /* check if box was on the wrong line, ToDo: search a better line */ + if (2*box2->y0<2*JOB->res.lines.m1[box2->line] + -JOB->res.lines.m4[box2->line] + +JOB->res.lines.m1[box2->line]) box2->line=0; + if (2*box2->y1>2*JOB->res.lines.m4[box2->line] + +JOB->res.lines.m4[box2->line] + -JOB->res.lines.m1[box2->line]) box2->line=0; + /* do adjustments */ + if (box2->num_ac>0 + && box2->num_ac > 31 && box2->tac[0] < 127 /* islower(>256) may SIGSEGV */ + && strchr("cCoOpPsSuUvVwWxXyYzZ",(char)box2->tac[0])) { // no_wchar + if (box2->y0-((box2->x1)*dy/dx) + < (JOB->res.lines.m1[box2->line]+JOB->res.lines.m2[box2->line])/2 + && islower(box2->tac[0]) + ) { setac(box2,toupper((char)box2->tac[0]),(box2->wac[0]+101)/2); diff++; } + if (box2->y0-((box2->x1)*dy/dx) + > (JOB->res.lines.m1[box2->line]+JOB->res.lines.m2[box2->line]+1)/2 + && isupper(box2->tac[0]) + ){ setac(box2,tolower((char)box2->tac[0]),(box2->wac[0]+101)/2); diff++; } + } + box2->m1=JOB->res.lines.m1[box2->line]+((box2->x1)*dy/dx); + box2->m2=JOB->res.lines.m2[box2->line]+((box2->x1)*dy/dx); + box2->m3=JOB->res.lines.m3[box2->line]+((box2->x1)*dy/dx); + box2->m4=JOB->res.lines.m4[box2->line]+((box2->x1)*dy/dx); + } end_for_each(&(JOB->res.boxlist)); +#endif + + free(m); + if(JOB->cfg.verbose) fprintf(stderr,"\n# changed_chars= %d\n",diff); + return(diff); +} + +/* ---- measure mean character + * recalculate mean width and high after changes in boxlist + * ToDo: only within a Range? + */ +int calc_average() { + int i = 0, x0, y0, x1, y1; + struct box *box4; + + JOB->res.numC = 0; + JOB->res.sumY = 0; + JOB->res.sumX = 0; + for_each_data(&(JOB->res.boxlist)) { + box4 = (struct box *)list_get_current(&(JOB->res.boxlist)); + if( box4->c != PICTURE ){ + x0 = box4->x0; x1 = box4->x1; + y0 = box4->y0; y1 = box4->y1; + i++; + if (JOB->res.avX * JOB->res.avY > 0) { + if (x1 - x0 + 1 > 4 * JOB->res.avX + && y1 - y0 + 1 > 4 * JOB->res.avY) continue; /* small picture */ + if (4 * (y1 - y0 + 1) < JOB->res.avY || y1 - y0 < 2) + continue; // dots .,-_ etc. + } + if (x1 - x0 + 1 < 4 + && y1 - y0 + 1 < 6 ) continue; /* dots etc */ + JOB->res.sumX += x1 - x0 + 1; + JOB->res.sumY += y1 - y0 + 1; + JOB->res.numC++; + } + } end_for_each(&(JOB->res.boxlist)); + if ( JOB->res.numC ) { /* avoid div 0 */ + JOB->res.avY = (JOB->res.sumY+JOB->res.numC/2) / JOB->res.numC; + JOB->res.avX = (JOB->res.sumX+JOB->res.numC/2) / JOB->res.numC; + } + if (JOB->cfg.verbose){ + fprintf(stderr, "# averages: mXmY= %d %d nC= %d n= %d\n", + JOB->res.avX, JOB->res.avY, JOB->res.numC, i); + } + return 0; +} + + +/* ---- analyse boxes, find pictures and mark (do this first!!!) + */ +int detect_pictures(job_t *job) { + int i = 0, x0, y0, x1, y1, num_h; + struct box *box2, *box4; + + if ( job->res.numC == 0 ) { + if (job->cfg.verbose) fprintf(stderr, + "# detect.C L%d Warning: numC=0\n", __LINE__); + return -1; + } + /* ToDo: set Y to uppercase mean value? */ + job->res.avY = (job->res.sumY+job->res.numC/2) / job->res.numC; + job->res.avX = (job->res.sumX+job->res.numC/2) / job->res.numC; + /* ToDo: two highest volumes? crosses, on extreme volume + on border */ + if (job->cfg.verbose) + fprintf(stderr, "# detect.C L%d pictures, frames, mXmY= %d %d ... ", + __LINE__, job->res.avX, job->res.avY); + for_each_data(&(job->res.boxlist)) { + box2 = (struct box *)list_get_current(&(job->res.boxlist)); + if (box2->c == PICTURE) continue; + x0 = box2->x0; x1 = box2->x1; + y0 = box2->y0; y1 = box2->y1; + + /* pictures could be of unusual size */ + if (x1 - x0 + 1 > 4 * job->res.avX || y1 - y0 + 1 > 4 * job->res.avY) { + /* count objects on same baseline which could be chars */ + /* else: big headlines could be misinterpreted as pictures */ + num_h=0; + for_each_data(&(job->res.boxlist)) { + box4 = (struct box *)list_get_current(&(job->res.boxlist)); + if (box4->c == PICTURE) continue; + if (box4->y1-box4->y0 > 2*(y1-y0)) continue; + if (2*(box4->y1-box4->y0) < y1-y0) continue; + if (box4->y0 > y0 + (y1-y0+1)/2 + || box4->y0 < y0 - (y1-y0+1)/2 + || box4->y1 > y1 + (y1-y0+1)/2 + || box4->y1 < y1 - (y1-y0+1)/2) continue; + // ToDo: continue if numcross() only 1, example: |||IIIll||| + num_h++; + } end_for_each(&(job->res.boxlist)); + if (num_h>4) continue; + box2->c = PICTURE; + i++; + } + /* ToDo: pictures could have low contrast=Sum((pixel(p,x,y)-160)^2) */ + } end_for_each(&(job->res.boxlist)); + // start second iteration + if (job->cfg.verbose) { + fprintf(stderr, " %d - boxes %d\n", i, job->res.numC-i); + } + calc_average(); + return 0; +} diff --git a/lib/gocr/job.c b/lib/gocr/job.c new file mode 100644 index 0000000..eacb505 --- /dev/null +++ b/lib/gocr/job.c @@ -0,0 +1,83 @@ +/* +This is a Optical-Character-Recognition program +Copyright (C) 2000-2006 Joerg Schulenburg + +This program is free software; you can redistribute it and/or +modify it under the terms of the GNU General Public License +as published by the Free Software Foundation; either version 2 +of the License, or (at your option) any later version. + +This program is distributed in the hope that it will be useful, +but WITHOUT ANY WARRANTY; without even the implied warranty of +MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the +GNU General Public License for more details. + +You should have received a copy of the GNU General Public License +along with this program; if not, write to the Free Software +Foundation, Inc., 59 Temple Place - Suite 330, Boston, MA 02111-1307, USA. + + see README for email address */ + +#include "pgm2asc.h" +#include "gocr.h" + +/* initialize job structure */ +void job_init(job_t *job) { + /* init source */ + job->src.fname = "-"; + /* FIXME jb: init pix */ + job->src.p.p = NULL; + + /* init results */ + list_init( &job->res.boxlist ); + list_init( &job->res.linelist ); + job->res.avX = 5; + job->res.avY = 8; + job->res.sumX = 0; + job->res.sumY = 0; + job->res.numC = 0; + job->res.lines.dy=0; + job->res.lines.num=0; + + /* init temporaries */ + list_init( &job->tmp.dblist ); + job->tmp.n_run = 0; + /* FIXME jb: init ppo */ + job->tmp.ppo.p = NULL; + job->tmp.ppo.x = 0; + job->tmp.ppo.y = 0; + + /* init cfg */ + job->cfg.cs = 0; + job->cfg.spc = 0; + job->cfg.mode = 0; + job->cfg.dust_size = -1; /* auto detect */ + job->cfg.only_numbers = 0; + job->cfg.verbose = 0; + job->cfg.out_format = UTF8; /* old: ISO8859_1; */ + job->cfg.lc = "_"; + job->cfg.db_path = (char*)NULL; + job->cfg.cfilter = (char*)NULL; + job->cfg.certainty = 95; +} + +/* free job structure */ +void job_free(job_t *job) { + + /* if tmp is just a copy of the pointer to the original image */ + if (job->tmp.ppo.p==job->src.p.p) job->tmp.ppo.p=NULL; + + /* FIMXE jb: free lists + * list_free( &job->res.linelist ); + * list_free( &job->tmp.dblist ); + */ + + list_and_data_free(&(job->res.boxlist), (void (*)(void *))free_box); + + /* FIXME jb: free pix */ + if (job->src.p.p) { free(job->src.p.p); job->src.p.p=NULL; } + + /* FIXME jb: free pix */ + if (job->tmp.ppo.p) { free(job->tmp.ppo.p); job->tmp.ppo.p=NULL; } + +}