/*
** Reflow one source bitmap, keeping the k2pdfopt settings and the master
** output structure in static storage so they persist across calls.
**
** kctx  Context the settings are derived from (only read when init==1).
** src   Source page bitmap to process.
** init  1    -> first call / new document: (re)initialize the settings and
**               the master output structure before processing.
**       -999 -> final call: the master output structure is freed after the
**               page has been processed.
**       Any non-zero value also resets the internal source page counter.
**
** Output pages are pulled from the master bitmap one at a time; the loop
** body is a placeholder, so the pages are currently discarded.
*/
void k2pdfopt_reflow_bmp(KOPTContext *kctx,WILLUSBITMAP *src,int init)
{
    static K2PDFOPT_SETTINGS _k2settings, *k2settings;
    static MASTERINFO _masterinfo, *masterinfo;
    static int pages_done=0;
    WILLUSBITMAP _srcgrey, *srcgrey;
    BMPREGION region;

    srcgrey=&_srcgrey;
    bmp_init(srcgrey);
    k2settings=&_k2settings;
    masterinfo=&_masterinfo;

    /* First call or new document call should use init = 1 */
    if (init==1) {
        /* Initialize settings */
        k2pdfopt_settings_init_from_koptcontext(k2settings,kctx);
        k2pdfopt_settings_sanity_check(k2settings);
        /* Init master output structure */
        masterinfo_init(masterinfo,k2settings);
        /* Init for new source doc */
        k2pdfopt_settings_new_source_document_init(k2settings);
    }

    /* Init new source bitmap */
    bmpregion_init(&region);
    masterinfo_new_source_page_init(masterinfo,k2settings,src,srcgrey,NULL,&region,
                                    0.,NULL,NULL,1,NULL);

    /* Process single source page */
    if (init)
        pages_done=0;
    bmpregion_source_page_add(&region,k2settings,masterinfo,1,pages_done++);
    /* Release the region once it has been added (same pattern as k2pdfopt_proc_one) */
    bmpregion_free(&region);
    bmp_free(srcgrey);

    /*
    ** Get output pages
    */
    {
        WILLUSBITMAP *bmp,_bmp;
        int rows,size_reduction;
        double bmpdpi;

        bmp=&_bmp;
        bmp_init(bmp);
        while ((rows=masterinfo_get_next_output_page(masterinfo,k2settings,1,bmp,
                                                     &bmpdpi,&size_reduction,NULL))>0) {
            /* Process output page stored in "bmp" */
        }
        bmp_free(bmp);
    }

    /* Final call should use init = -999 */
    if (init == -999)
        masterinfo_free(masterinfo,k2settings);
}
/*
** k2pdfopt_proc_one() is the main source file processing function in k2pdfopt.
**
** Depending on the value of rot_deg, it either determines the correct rotation of
** the passed file, or it processes it and converts it.
**
** The basic idea is to parse the source document into rectangular regions
** (held in the BMPREGION structures) and then to place these regions into
** the master destination bitmap (kept track of in MASTERINFO structure).
** You can think of this bitmap as a sort of "infinitely scrolling" output
** bitmap which is then cut into output pages.
**
** The bmpregion_source_page_add() function parses the source file.
**
** The masterinfo_publish() cuts the output bitmap into destination pages.
**
** If rot_deg == SRCROT_AUTO, then the rotation correction of the source
** file is computed and returned, but no other processing is done.
**
** Otherwise, the source file is processed.
**
** Parameters:
**     k2settings0  Caller's settings; copied into a static working copy which
**                  this function is free to modify.
**     filename     Source file, or a folder of bitmaps.
**     rot_deg      Rotation to apply, or a value for which OR_DETECT() is true
**                  to request orientation detection only.
**     k2out        Receives the result:
**                      status 0 = completed, 1 = set on entry, 2 = no bitmaps
**                      found in folder, 3 = DjVu support not compiled in,
**                      4 = output file could not be (over)written,
**                      5 = page selection is empty.
**                  outname is set to an allocated copy of the output file name
**                  when an output file is produced; bmp is used for previews.
**
** Returns 270. when orientation detection decides the document should be
** rotated, otherwise 0.
*/
static double k2pdfopt_proc_one(K2PDFOPT_SETTINGS *k2settings0,char *filename,double rot_deg,
                                K2PDFOPT_OUTPUT *k2out)
{
    static K2PDFOPT_SETTINGS _k2settings,*k2settings;
    static MASTERINFO _masterinfo,*masterinfo;
    static PDFFILE _mpdf,*mpdf;
    char dstfile[MAXFILENAMELEN];
    char markedfile[MAXFILENAMELEN];
    char rotstr[128];
    WILLUSBITMAP _src,*src;
    WILLUSBITMAP _srcgrey,*srcgrey;
    WILLUSBITMAP _marked,*marked;
    WILLUSBITMAP preview_internal;
    int i,status,pw,np,src_type,second_time_through,or_detect,orep_detect,preview;
    int pagecount,pagestep,pages_done,local_tocwrites;
    int errcnt,pixwarn;
    FILELIST *fl,_fl;
    int folder,dpi;
    double size,bormean;
    char *mupdffilename;
    extern int k2mark_page_count;
    static char *funcname="k2pdfopt_proc_one";
    static char *readerr=TTEXT_WARN "\a\n ** ERROR reading page %d from " TTEXT_BOLD2 "%s" TTEXT_WARN ".\n\n" TTEXT_NORMAL;
    static char *readlimit=TTEXT_WARN "\a\n ** (No more read errors will be echoed for file %s.)\n\n" TTEXT_NORMAL;

#if (WILLUSDEBUGX & 1)
    printf("@k2pdfopt_proc_one(%s)\n",filename);
#endif

    /*
    ** Check to see if we're only echoing page info
    */
    if (k2settings0->info) {
#ifdef HAVE_MUPDF_LIB
        char *buf=NULL;
        int *pagelist=NULL;

        pagelist_get_array(&pagelist,k2settings0->pagelist);
        wmupdfinfo_get(filename,pagelist,&buf);
        /* Only print when info was actually returned (printf("%s",NULL) is undefined) */
        if (buf!=NULL) {
            printf("%s",buf);
            free(buf);
        }
        if (pagelist!=NULL)
            free(pagelist);
#else
        printf("FILE: %s\n",filename);
        printf("Cannot print file info.  MuPDF not compiled into application.\n");
#endif
        return(0.);
    }

    local_tocwrites=0;
    k2out->status = 1;
    k2settings=&_k2settings;
    k2pdfopt_settings_copy(k2settings,k2settings0);
#ifdef HAVE_K2GUI
    if (k2gui_active())
        k2gui_cbox_set_filename(filename);
#endif
    mpdf=&_mpdf;
    /* Must be called once per conversion to init margins / devsize / output size */
    k2pdfopt_settings_sanity_check(k2settings);
    k2pdfopt_settings_new_source_document_init(k2settings);
    errcnt=0;
    pixwarn=0;
    /* The source file name is kept in the static master structure's buffer */
    mupdffilename=_masterinfo.srcfilename;
    strncpy(mupdffilename,filename,MAXFILENAMELEN-1);
    mupdffilename[MAXFILENAMELEN-1]='\0';
    or_detect=OR_DETECT(rot_deg);
    orep_detect=OREP_DETECT(k2settings);
    if ((fabs(k2settings->src_rot-SRCROT_AUTO)<.5 || orep_detect) && !or_detect)
        second_time_through=1;
    else
        second_time_through=0;
    /* Don't care about rotation if just echoing page count */
    if (k2settings->echo_source_page_count && second_time_through==0)
        return(0.);
    /* Orientation detection never renders above 300 dpi */
    if (or_detect && k2settings->src_dpi>300)
        dpi=300;
    else
        dpi=k2settings->src_dpi;
    folder=(wfile_status(filename)==2);

    fl=&_fl;
    filelist_init(fl);
    if (folder) {
        char basename[MAXFILENAMELEN];
        static char *iolist[]={"*.png","*.jpg",""};
        static char *eolist[]={""};

        wfile_basespec(basename,filename);
        if (!second_time_through)
            k2printf("Searching folder " TTEXT_BOLD2 "%s" TTEXT_NORMAL " ... ",basename);
        fflush(stdout);
        filelist_fill_from_disk(fl,filename,iolist,eolist,0,0);
        if (fl->n<=0) {
            if (!second_time_through)
                k2printf(TTEXT_WARN "\n** No bitmaps found in folder %s.\n\n" TTEXT_NORMAL,filename);
            k2out->status=2;
            return(0.);
        }
        if (!second_time_through)
            k2printf("%d bitmaps found in %s.\n",(int)fl->n,filename);
        filelist_sort_by_name(fl);
    }

    src=&_src;
    srcgrey=&_srcgrey;
    marked=&_marked;
    bmp_init(src);
    bmp_init(srcgrey);
    bmp_init(marked);
    pw=0;
    src_type = get_source_type(filename);
#ifndef HAVE_DJVU_LIB
    if (src_type==SRC_TYPE_DJVU) {
        if (!or_detect)
            k2printf(TTEXT_WARN
                     "\a\n\n** DjVuLibre not compiled into this version of k2pdfopt. **\n\n"
                     "** Cannot process file %s. **\n\n" TTEXT_NORMAL,filename);
        k2out->status=3;
        return(0.);
    }
#endif
    if (src_type==SRC_TYPE_PS)
        k2settings->usegs=1;

    /*
    ** Turn off native PDF output if source is not PDF
    */
    if (src_type!=SRC_TYPE_PDF) {
        if (k2settings->use_crop_boxes && !or_detect)
            k2printf(TTEXT_WARN "\n** Native PDF output mode turned off on file %s. **\n"
                     "** (It is not a PDF file.) **\n\n",filename);
        k2settings->use_crop_boxes=0;
#ifdef HAVE_OCR_LIB
        if (k2settings->dst_ocr=='m')
            k2settings->dst_ocr=0;
#endif
    }

    masterinfo=&_masterinfo;
    masterinfo_init(masterinfo,k2settings);
    if (k2settings->preview_page!=0 && !or_detect) {
        preview=1;
        if (k2out->bmp!=NULL)
            masterinfo->preview_bitmap=k2out->bmp;
        else {
            masterinfo->preview_bitmap=&preview_internal;
            bmp_init(masterinfo->preview_bitmap);
        }
    }
    else
        preview=0;

    /*
    ** Set up the output file(s).  Skipped for orientation detection and previews.
    */
    if (!or_detect && !preview) {
        static int dstfilecount=0;
        int can_write;

        wfile_newext(dstfile,filename,"");
        dstfilecount++;
        filename_substitute(dstfile,k2settings->dst_opname_format,filename,dstfilecount,"pdf");
#ifdef HAVE_OCR_LIB
        if (k2settings->ocrout[0]!='\0' && k2settings->dst_ocr)
            filename_substitute(masterinfo->ocrfilename,k2settings->ocrout,filename,dstfilecount,"txt");
        else
#endif
            masterinfo->ocrfilename[0]='\0';
        if (!filename_comp(dstfile,filename)) {
            k2printf(TTEXT_WARN "\n\aSource file and ouput file have the same name!" TTEXT_NORMAL "\n\n");
            k2printf(" Source file = '%s'\n",filename);
            k2printf(" Output file = '%s'\n",dstfile);
            k2printf(" Output file name format string = '%s'\n",k2settings->dst_opname_format);
            k2printf("\nOperation aborted.\n");
            k2sys_exit(k2settings,50);
        }
        if ((status=overwrite_fail(dstfile,k2settings->overwrite_minsize_mb))!=0) {
            masterinfo_free(masterinfo,k2settings);
            if (folder)
                filelist_free(fl);
            if (status<0)
                k2sys_exit(k2settings,20);
            k2out->status=4;
            return(0.);
        }

        if (!k2settings->use_crop_boxes)
            can_write = (pdffile_init(&masterinfo->outfile,dstfile,1)!=NULL);
        else {
            /* Native (crop box) mode writes the file at the end; just probe writability */
            FILE *f1;

            f1 = wfile_fopen_utf8(dstfile,"w");
            can_write = (f1!=NULL);
            if (f1!=NULL) {
                fclose(f1);
                wfile_remove_utf8(dstfile);
            }
        }
        /* The failure check must cover BOTH branches above, not only the crop-box one */
        if (!can_write) {
            k2printf(TTEXT_WARN "\n\aCannot open PDF file %s for output!" TTEXT_NORMAL "\n\n",dstfile);
#ifdef HAVE_K2GUI
            if (k2gui_active()) {
                k2gui_okay("Failed to open output file",
                           "Cannot open PDF file %s for output!\n"
                           "Maybe another application has it open already?\n"
                           "Conversion failed!",dstfile);
                /* Same cleanup as the overwrite-refused path above */
                masterinfo_free(masterinfo,k2settings);
                if (folder)
                    filelist_free(fl);
                k2out->status=4;
                return(0.);
            }
#endif
            k2sys_exit(k2settings,30);
        }

        k2out->outname=NULL;
        /* Return output file name in k2out for GUI */
        willus_mem_alloc((double **)&k2out->outname,(long)(strlen(dstfile)+1),funcname);
        if (k2out->outname!=NULL)
            strcpy(k2out->outname,dstfile);
        if (k2settings->use_crop_boxes)
            pdffile_close(&masterinfo->outfile);
        if (k2settings->show_marked_source) {
            filename_substitute(markedfile,"%s_marked",filename,0,"pdf");
            if (pdffile_init(mpdf,markedfile,1)==NULL) {
                k2printf(TTEXT_WARN "\n\aCannot open PDF file %s for marked output!" TTEXT_NORMAL "\n\n",markedfile);
                k2sys_exit(k2settings,40);
            }
        }
    }

    /*
    ** Determine the number of source pages (np = -1 if unknown)
    */
    if (src_type==SRC_TYPE_PDF || src_type==SRC_TYPE_DJVU) {
        np=file_numpages(filename,mupdffilename,src_type,&k2settings->usegs);
#ifdef HAVE_MUPDF_LIB
        if (src_type==SRC_TYPE_PDF) {
            /* Get bookmarks / outline from PDF file */
            if (!or_detect && k2settings->use_toc!=0 && !toclist_valid(k2settings->toclist,NULL)) {
                masterinfo->outline=wpdfoutline_read_from_pdf_file(mupdffilename);
                /* Save TOC if requested */
                if (k2settings->tocsavefile[0]!='\0') {
                    FILE *f;

                    /* First write truncates the file, later writes append to it */
                    f=fopen(k2settings->tocsavefile,tocwrites==0?"w":"a");
                    if (f!=NULL) {
                        int k;

                        fprintf(f,"%sFILE: %s\n",tocwrites==0?"":"\n\n",mupdffilename);
                        /* Underline the "FILE: <name>" header */
                        for (k=strlen(mupdffilename)+6;k>0;k--)
                            fputc('-',f);
                        fprintf(f,"\n");
                        if (masterinfo->outline!=NULL)
                            wpdfoutline_echo2(masterinfo->outline,0,f);
                        else
                            fprintf(f,"(No outline info in file.)\n");
                        fclose(f);
                        tocwrites++;
                        local_tocwrites++;
                    }
                }
            }
        }
#endif
    }
    else if (src_type==SRC_TYPE_BITMAPFOLDER)
        np=fl->n;
    else
        np=-1;

    if (k2settings->echo_source_page_count) {
        printf("\"%s\" page count = %d\n",mupdffilename,np);
        masterinfo_free(masterinfo,k2settings);
        if (folder)
            filelist_free(fl);
        return(0.);
    }
    masterinfo->srcpages = np;
    if (!or_detect && toclist_valid(k2settings->toclist,stdout)) {
        if (pagelist_valid_page_range(k2settings->toclist))
            masterinfo->outline=wpdfoutline_from_pagelist(k2settings->toclist,masterinfo->srcpages);
        else
            masterinfo->outline=wpdfoutline_read_from_text_file(k2settings->toclist);
    }
    pagecount = np<0 ? -1 : double_pagelist_count(k2settings->pagelist,k2settings->pagexlist,np);
#ifdef HAVE_K2GUI
    if (k2gui_active()) {
        k2gui_cbox_set_num_pages(pagecount<0 ? 1 : pagecount);
        k2gui_cbox_set_pages_completed(0,NULL);
    }
#endif
    /* Orientation detection samples roughly ten pages spread through the document */
    if (pagecount<0 || !or_detect)
        pagestep=1;
    else {
        pagestep=pagecount/10;
        if (pagestep<1)
            pagestep=1;
    }
    pages_done=0;
    if (np>0 && pagecount==0) {
        if (!second_time_through)
            k2printf("\a\n" TTEXT_WARN "No %ss to convert (-p %s -px %s)!" TTEXT_NORMAL "\n\n",
                     folder?"file":"page",k2settings->pagelist,k2settings->pagexlist);
        masterinfo_free(masterinfo,k2settings);
        if (folder)
            filelist_free(fl);
        k2out->status=5;
        return(0.);
    }
    if (!second_time_through) {
        k2printf("Reading ");
        if (pagecount>0) {
            if (pagecount<np)
                k2printf("%d out of %d %s%s",pagecount,np,folder?"file":"page",np>1?"s":"");
            else
                k2printf("%d %s%s",np,folder?"file":"page",np>1?"s":"");
        }
        else
            k2printf("%ss",folder?"file":"page");
        k2printf(" from " TTEXT_BOLD2 "%s" TTEXT_NORMAL " ...\n",filename);
    }
    if (or_detect)
        k2printf("\nDetecting document orientation ... ");
    bormean=1.0;

    /*
    ** Main source page loop
    */
    for (i=0;1;i+=pagestep) {
        char bmpfile[MAXFILENAMELEN];
        int pageno,nextpage;

        if (pagecount>0 && i+1>pagecount)
            break;
        pageno = double_pagelist_page_by_index(k2settings->pagelist,k2settings->pagexlist,i,np);
        nextpage = (i+2>pagecount) ? -1
                 : double_pagelist_page_by_index(k2settings->pagelist,k2settings->pagexlist,i+1,np);
        if (folder) {
            if (pageno-1>=fl->n)
                continue;
            wfile_fullname(bmpfile,fl->dir,fl->entry[pageno-1].name);
            status=bmp_read(src,bmpfile,stdout);
            if (status<0) {
                if (!second_time_through)
                    k2printf(TTEXT_WARN "\n\aCould not read file %s.\n" TTEXT_NORMAL,bmpfile);
                continue;
            }
        }
        else {
            double npix;
            int bpp;

            /* If not a PDF/DJVU/PS file, only read it once. */
            if (i>0 && src_type!=SRC_TYPE_PDF && src_type!=SRC_TYPE_DJVU && src_type!=SRC_TYPE_PS)
                break;
            /* Pre-read at low dpi to check bitmap size */
            wsys_set_decimal_period(1);
            status=bmp_get_one_document_page(src,k2settings,src_type,mupdffilename,pageno,10.,8,stdout);
            wsys_set_decimal_period(1);
            if (status<0) {
                errcnt++;
                if (errcnt<=10) {
                    k2printf(readerr,pageno,filename);
                    if (errcnt==10)
                        k2printf(readlimit,filename);
                }
                /* Error reading PS probably means we've run out of pages. */
                if (src_type==SRC_TYPE_PS)
                    break;
                continue;
            }
            /* Sanity check the bitmap size (pre-read was at 10 dpi, so scale by dpi/10) */
            npix = (double)(dpi/10.)*(dpi/10.)*src->width*src->height;
            if (npix > 2.5e8 && !pixwarn) {
                int ww,hh;

                ww=(int)((double)(dpi/10.)*src->width+.5);
                hh=(int)((double)(dpi/10.)*src->height+.5);
                k2printf("\a\n" TTEXT_WARN "\n\a ** Source resolution is very high (%d x %d pixels)!\n"
                         " You may want to reduce the -odpi or -idpi setting!\n"
                         " k2pdfopt may crash when reading the source file..."
                         TTEXT_NORMAL "\n\n",ww,hh);
                pixwarn=1;
            }
            /* Read again at nominal source dpi */
            bpp = k2settings_need_color_initially(k2settings) ? 24 : 8;
            wsys_set_decimal_period(1);
            status=bmp_get_one_document_page(src,k2settings,src_type,mupdffilename,pageno,dpi,bpp,stdout);
            wsys_set_decimal_period(1);
            if (status<0) {
                errcnt++;
                if (errcnt<=10) {
                    k2printf(readerr,pageno,filename);
                    if (errcnt==10)
                        k2printf(readlimit,filename);
                }
                /* Error reading PS probably means we've run out of pages. */
                if (src_type==SRC_TYPE_PS)
                    break;
                continue;
            }
        }
        k2mark_page_count = i+1;

        {
            BMPREGION region;
            int mstatus;

            /* Got Good Page Render */
            bmpregion_init(&region);
            bmpregion_k2pagebreakmarks_allocate(&region);
            mstatus=masterinfo_new_source_page_init(masterinfo,k2settings,src,srcgrey,marked,
                                                    &region,rot_deg,&bormean,rotstr,pageno,
                                                    nextpage,stdout);
            if (mstatus==0) {
                /* v2.15 -- memory leak fix */
                bmpregion_free(&region);
                pages_done++;
                continue;
            }
            if (!preview) {
                k2printf("\n" TTEXT_HEADER "SOURCE PAGE %d",pageno);
                if (pagecount>0) {
                    if (k2settings->pagelist[0]!='\0')
                        k2printf(" (%d of %d)",pages_done+1,pagecount);
                    else
                        k2printf(" of %d",pagecount);
                }
                k2printf(TTEXT_NORMAL " (%.1f x %.1f in) ... %s",
                         (double)srcgrey->width/k2settings->src_dpi,
                         (double)srcgrey->height/k2settings->src_dpi,rotstr);
                fflush(stdout);
            }
            /* Parse the source bitmap for viewable regions */
            bmpregion_source_page_add(&region,k2settings,masterinfo,1,pages_done++);
            /* v2.15 memory leak fix */
            bmpregion_free(&region);
        }

#ifdef HAVE_K2GUI
        if (k2gui_active())
            k2gui_cbox_set_pages_completed(pages_done,NULL);
#endif
        if (k2settings->verbose) {
            k2printf(" master->rows=%d\n",masterinfo->rows);
            k2printf("Publishing...\n");
        }
        /* Reset the display order for this source page */
        if (k2settings->show_marked_source)
            mark_source_page(k2settings,masterinfo,NULL,0,0xf);
        /*
        ** v2.10 Call masterinfo_publish() no matter what.  If we've just kicked out a
        ** page, it doesn't matter.  It will do nothing.
        */
        masterinfo_publish(masterinfo,k2settings,masterinfo_should_flush(masterinfo,k2settings));
        if (preview && k2_handle_preview(k2settings,masterinfo,k2mark_page_count,
                                         k2settings->dst_color?marked:src,k2out)) {
            bmp_free(marked);
            bmp_free(srcgrey);
            bmp_free(src);
            masterinfo_free(masterinfo,k2settings);
            if (folder)
                filelist_free(fl);
            k2out->status=0;
            return(0.);
        }
        if (k2settings->show_marked_source && !preview)
            publish_marked_page(mpdf,k2settings->dst_color ? marked : src,k2settings->src_dpi);
        if (!preview) {
            int newpages;

            newpages=masterinfo->published_pages-pw;
            k2printf("%d new page%s saved.\n",newpages,newpages==1?"":"s");
        }
        pw=masterinfo->published_pages;
    }

    /* Didn't find the preview page yet--push out final page. */
    if (preview) {
        masterinfo_flush(masterinfo,k2settings);
        if (!k2_handle_preview(k2settings,masterinfo,k2mark_page_count,
                               k2settings->dst_color?marked:src,k2out)) {
            /* No preview bitmap--return zero-width bitmap */
            if (k2out->bmp==NULL)
                bmp_free(masterinfo->preview_bitmap);
            else
                k2out->bmp->width=0;
        }
        bmp_free(marked);
        bmp_free(srcgrey);
        bmp_free(src);
        masterinfo_free(masterinfo,k2settings);
        if (folder)
            filelist_free(fl);
        k2out->status=0;
        return(0.);
    }
    bmp_free(marked);
    bmp_free(srcgrey);
    bmp_free(src);

    /* Determine orientation of document */
    if (or_detect) {
        if (pages_done>0) {
            double thresh;

            /*
            ** bormean = 1.0 means neutral
            ** bormean >> 1.0 means document is likely portrait (no rotation necessary)
            ** bormean << 1.0 means document is likely landscape (need to rotate it)
            */
            bormean = pow(bormean,1./pages_done);
            thresh=10.-(double)pages_done/2.;
            if (thresh<5.)
                thresh=5.;
            if (bormean < 1./thresh) {
                k2printf("Rotating clockwise.\n");
                masterinfo_free(masterinfo,k2settings);
                if (folder)
                    filelist_free(fl);
                k2out->status=0;
                return(270.);
            }
        }
        k2printf("No rotation necessary.\n");
        masterinfo_free(masterinfo,k2settings);
        if (folder)
            filelist_free(fl);
        k2out->status=0;
        return(0.);
    }

    /*
    ** v2.10 -- Calling masterinfo_flush() without checking if a page has just been
    **          been flushed is fine at the end.  If there is nothing left
    **          in the master output bitmap, it won't do anything.
    */
    masterinfo_flush(masterinfo,k2settings);

    /*
    ** Finish the output file(s), carrying over document metadata
    */
    {
        char cdate[128],author[256],title[256];

#ifdef HAVE_MUPDF_LIB
        if (src_type==SRC_TYPE_PDF) {
            if (wmupdf_info_field(mupdffilename,"Author",author,255)<0)
                author[0]='\0';
            if (wmupdf_info_field(mupdffilename,"CreationDate",cdate,127)<0)
                cdate[0]='\0';
            if (wmupdf_info_field(mupdffilename,"Title",title,255)<0)
                title[0]='\0';
        }
        else
#endif
            author[0]=title[0]=cdate[0]='\0';
        /* User-specified author / title override the source document's (bounded copy) */
        if (k2settings->dst_author[0]!='\0') {
            strncpy(author,k2settings->dst_author,sizeof(author)-1);
            author[sizeof(author)-1]='\0';
        }
        if (k2settings->dst_title[0]!='\0') {
            strncpy(title,k2settings->dst_title,sizeof(title)-1);
            title[sizeof(title)-1]='\0';
        }
        if (!k2settings->use_crop_boxes) {
            if (masterinfo->outline!=NULL) {
                if (k2settings->debug)
                    wpdfoutline_echo(masterinfo->outline,1,1,stdout);
                pdffile_add_outline(&masterinfo->outfile,masterinfo->outline);
            }
            pdffile_finish(&masterinfo->outfile,title,author,masterinfo->pageinfo.producer,cdate);
            pdffile_close(&masterinfo->outfile);
        }
        else {
            /* Re-write PDF file using crop boxes */
#if (WILLUSDEBUGX & 64)
            wpdfboxes_echo(&masterinfo->pageinfo.boxes,stdout);
#endif
#ifdef HAVE_MUPDF_LIB
#if (WILLUSDEBUGX & 64)
            printf("Calling wpdfpageinfo_scale_source_boxes()...\n");
#endif
            if (k2settings->dst_author[0]!='\0')
                strcpy(masterinfo->pageinfo.author,k2settings->dst_author);
            if (k2settings->dst_title[0]!='\0')
                strcpy(masterinfo->pageinfo.title,k2settings->dst_title);
            /* v2.20 bug fix -- need to compensate for document_scale_factor if its not 1.0 */
            wpdfpageinfo_scale_source_boxes(&masterinfo->pageinfo,1./k2settings->document_scale_factor);
#if (WILLUSDEBUGX & 64)
            printf("Calling wmupdf_remake_pdf()...\n");
#endif
            wmupdf_remake_pdf(mupdffilename,dstfile,&masterinfo->pageinfo,1,masterinfo->outline,stdout);
#endif
        }
        if (k2settings->show_marked_source) {
            pdffile_finish(mpdf,title,author,masterinfo->pageinfo.producer,cdate);
            pdffile_close(mpdf);
        }
    } /* cdate, author, title selection */

    if (k2settings->debug || k2settings->verbose)
        k2printf("Cleaning up ...\n\n");

    /*
    ** Report what was written
    */
    size=wfile_size(dstfile);
    k2printf("\n" TTEXT_BOLD "%d pages" TTEXT_NORMAL,masterinfo->published_pages);
    if (masterinfo->wordcount>0)
        k2printf(" (%d words)",masterinfo->wordcount);
    k2printf(" written to " TTEXT_MAGENTA "%s" TTEXT_NORMAL " (%.1f MB).\n\n",
             dstfile,size/1024./1024.);
#ifdef HAVE_GHOSTSCRIPT
    if (k2settings->ppgs)
        gs_postprocess(dstfile);
#endif
    if (k2settings->show_marked_source) {
        size=wfile_size(markedfile);
        k2printf(TTEXT_BOLD "%d pages" TTEXT_NORMAL " written to " TTEXT_MAGENTA "%s"
                 TTEXT_NORMAL " (%.1f MB).\n\n",pages_done,markedfile,size/1024./1024.);
    }
#ifdef HAVE_OCR_LIB
    if (k2settings->dst_ocr && masterinfo->ocrfilename[0]!='\0'
                            && wfile_status(masterinfo->ocrfilename)==1) {
        size=wfile_size(masterinfo->ocrfilename);
        k2printf(TTEXT_BOLD "%d words" TTEXT_NORMAL " written to " TTEXT_MAGENTA "%s"
                 TTEXT_NORMAL " (%.1f MB).\n\n",masterinfo->wordcount,masterinfo->ocrfilename,size/1024./1024.);
    }
#endif
    if (local_tocwrites>0)
        k2printf(TTEXT_BOLD "%d bytes" TTEXT_NORMAL " written to " TTEXT_MAGENTA "%s"
                 TTEXT_NORMAL ".\n\n",(int)(wfile_size(k2settings->tocsavefile)+.5),k2settings->tocsavefile);
    masterinfo_free(masterinfo,k2settings);
    if (folder)
        filelist_free(fl);
    k2out->status=0;
    return(0.);
}
int main(int argc,char *argv[]) { static K2PDFOPT_SETTINGS _k2settings, *k2settings; static MASTERINFO _masterinfo, *masterinfo; WILLUSBITMAP _srcgrey, *srcgrey; WILLUSBITMAP _src, *src; BMPREGION region; int status; if (argc<2) { printf("usage: kview <infile.bmp>\n"); return(0); } src=&_src; bmp_init(src); srcgrey=&_srcgrey; bmp_init(srcgrey); if ((status=bmp_read(src,argv[1],NULL))<0) { printf("Error %d reading bitmap file %s.\n",status,argv[1]); return(10); } printf("Bitmap %s is %d x %d x %d\n",argv[1],src->width,src->height,src->bpp); /* Initialize settings */ k2settings=&_k2settings; k2pdfopt_settings_init(k2settings); k2settings->use_crop_boxes=0; k2settings->src_rot=0; k2settings->erase_vertical_lines=0; k2settings->src_autostraighten=0; k2pdfopt_settings_sanity_check(k2settings); /* Init master output structure */ masterinfo=&_masterinfo; masterinfo_init(masterinfo,k2settings); /* Init for new source doc */ k2pdfopt_settings_new_source_document_init(k2settings); /* Init new source bitmap */ masterinfo_new_source_page_init(masterinfo,k2settings,src,srcgrey,NULL,®ion,0.,NULL,NULL,1,NULL); /* Process single source page */ bmpregion_source_page_add(®ion,k2settings,masterinfo,1, (int)(0.25 * k2settings->src_dpi + .5)); bmp_free(srcgrey); bmp_free(src); /* ** Get output pages */ { WILLUSBITMAP *bmp,_bmp; int pn,rows,size_reduction; double bmpdpi; bmp=&_bmp; bmp_init(bmp); pn=0; while ((rows=masterinfo_get_next_output_page(masterinfo,k2settings,1,bmp, &bmpdpi,&size_reduction,NULL))>0) { char filename[256]; pn++; sprintf(filename,"outpage%02d.bmp",pn); bmp_write(bmp,filename,stdout,0); } bmp_free(bmp); } masterinfo_free(masterinfo,k2settings); return(0); }
/*
** Reflow the bitmap in kctx->src and store the result in kctx->dst.
**
** Steps:
**   1. Build settings from the context and initialize a local master
**      output structure.
**   2. Parse the source page into regions and flush the wrapped text into
**      the master bitmap; apply gamma correction if dst_gamma differs from 1.
**   3. Allocate kctx->dst (white-filled) and copy the master bitmap rows
**      into it.  The destination is at least kctx->page_height tall.
**   4. For every rectangle map produced by the reflow, record one box built
**      from the output-side coordinates (rboxa) and one built from the
**      coordinates rescaled by src_dpi / srcdpi / zoom and offset by
**      kctx->bbox (nboxa), and append the map to kctx->rectmaps.
**   5. 2D-sort both box sets and store the flattened results, with their
**      row index arrays, in kctx->rboxa/rnai and kctx->nboxa/nnai.
**
** Side effects: updates kctx->page_width, kctx->page_height, clears
** kctx->precache, and frees kctx->src.
*/
void k2pdfopt_reflow_bmp(KOPTContext *kctx)
{
    K2PDFOPT_SETTINGS _k2settings, *k2settings;
    MASTERINFO _masterinfo, *masterinfo;
    WILLUSBITMAP _srcgrey, *srcgrey;
    WILLUSBITMAP *src, *dst;
    BMPREGION region;
    BOXA *rboxa, *nboxa;
    BOXAA *rbaa, *nbaa;
    int i, j, bw, marbot, marleft;

    src = &kctx->src;
    srcgrey = &_srcgrey;
    bmp_init(srcgrey);

    k2settings = &_k2settings;
    masterinfo = &_masterinfo;

    /* Initialize settings */
    k2pdfopt_settings_init_from_koptcontext(k2settings, kctx);
    k2pdfopt_settings_quick_sanity_check(k2settings);
    /* Init for new source doc */
    k2pdfopt_settings_new_source_document_init(k2settings);
    /* Init master output structure */
    masterinfo_init(masterinfo, k2settings);
    wrapbmp_init(&masterinfo->wrapbmp, k2settings->dst_color);

    /* Init new source bitmap */
    bmpregion_init(&region);
    masterinfo_new_source_page_init(masterinfo, k2settings, src, srcgrey, NULL,
                                    &region, k2settings->src_rot, NULL, NULL, 1, -1, NULL);
    /* Set output size */
    k2pdfopt_settings_set_margins_and_devsize(k2settings, &region, masterinfo, -1., 0);

    /* Process single source page */
    bmpregion_source_page_add(&region, k2settings, masterinfo, 1, 0);
    wrapbmp_flush(masterinfo, k2settings, 0);

    if (fabs(k2settings->dst_gamma - 1.0) > .001)
        bmp_gamma_correct(&masterinfo->bmp, &masterinfo->bmp, k2settings->dst_gamma);

    /* copy master bitmap to context dst bitmap */
    dst = &kctx->dst;
    marbot = (int) (k2settings->dst_dpi * k2settings->dstmargins.box[1] + .5);
    marleft = (int) (k2settings->dst_dpi * k2settings->dstmargins.box[0] + .5);
    dst->bpp = masterinfo->bmp.bpp;
    dst->width = masterinfo->bmp.width;
    /* Output taller than the requested page gets a bottom margin appended */
    dst->height = masterinfo->rows > kctx->page_height
                      ? masterinfo->rows + marbot
                      : kctx->page_height;
    bmp_alloc(dst);
    bmp_fill(dst, 255, 255, 255);
    bw = bmp_bytewidth(&masterinfo->bmp);
    for (i = 0; i < masterinfo->rows; i++)
        memcpy(bmp_rowptr_from_top(dst, i), bmp_rowptr_from_top(&masterinfo->bmp, i), bw);

    kctx->page_width = kctx->dst.width;
    kctx->page_height = kctx->dst.height;
    kctx->precache = 0;

    /* Collect one box per rectangle map in each coordinate system */
    rboxa = boxaCreate(masterinfo->rectmaps.n);
    nboxa = boxaCreate(masterinfo->rectmaps.n);
    for (j = 0; j < masterinfo->rectmaps.n; j++) {
        WRECTMAP *rectmap = &masterinfo->rectmaps.wrectmap[j];
        BOX *rlbox, *nlbox;

        /* Shift the output-side x coordinate by the left margin (stored back into the map) */
        rectmap->coords[1].x += marleft;
        /* coords[2] supplies the width/height arguments of both boxes */
        rlbox = boxCreate(rectmap->coords[1].x,
                          rectmap->coords[1].y,
                          rectmap->coords[2].x,
                          rectmap->coords[2].y);
        nlbox = boxCreate(rectmap->coords[0].x*k2settings->src_dpi/rectmap->srcdpiw/kctx->zoom + kctx->bbox.x0,
                          rectmap->coords[0].y*k2settings->src_dpi/rectmap->srcdpih/kctx->zoom + kctx->bbox.y0,
                          rectmap->coords[2].x*k2settings->src_dpi/rectmap->srcdpiw/kctx->zoom,
                          rectmap->coords[2].y*k2settings->src_dpi/rectmap->srcdpih/kctx->zoom);
        boxaAddBox(rboxa, rlbox, L_INSERT);
        boxaAddBox(nboxa, nlbox, L_INSERT);
        wrectmaps_add_wrectmap(&kctx->rectmaps, rectmap);
    }

    /* 2D sort the bounding boxes of these words. */
    rbaa = boxaSort2d(rboxa, NULL, 3, -5, 5);
    nbaa = boxaSort2d(nboxa, NULL, 3, -5, 5);

    /* Flatten the boxaa, saving the boxa index for each box */
    kctx->rboxa = boxaaFlattenToBoxa(rbaa, &kctx->rnai, L_CLONE);
    kctx->nboxa = boxaaFlattenToBoxa(nbaa, &kctx->nnai, L_CLONE);

    boxaDestroy(&rboxa);
    boxaaDestroy(&rbaa);
    boxaDestroy(&nboxa);
    boxaaDestroy(&nbaa);

    bmp_free(src);
    bmp_free(srcgrey);
    bmpregion_free(&region);
    masterinfo_free(masterinfo, k2settings);
}