new parameter addspacechars
[swftools.git] / lib / pdf / pdf.cc
index 3f72d59..68fa711 100644 (file)
@@ -1,25 +1,27 @@
+#include <stdio.h>
+#include <string.h>
 #include "../gfxdevice.h"
 #include "../gfxsource.h"
+#include "../devices/rescale.h"
 #include "../log.h"
 #include "config.h"
 #include "GlobalParams.h"
 #include "InfoOutputDev.h"
 #include "GFXOutputDev.h"
+#include "FullBitmapOutputDev.h"
+#include "BitmapOutputDev.h"
 #include "../mem.h"
 #include "pdf.h"
 #define NO_ARGPARSER
 #include "../args.h"
 
-static parameter_t* device_config = 0;
-static parameter_t* device_config_next = 0;
-
-int jpeg_dpi = 0;
-int ppm_dpi = 0;
-
 static double zoom = 72; /* xpdf: 86 */
-
+static int zoomtowidth = 0;
+static int multiply = 1;
 static char* global_page_range = 0;
 
+static int globalparams_count=0;
+
 typedef struct _pdf_page_info
 {
     int xMin, yMin, xMax, yMax;
@@ -32,12 +34,28 @@ typedef struct _pdf_page_info
 
 typedef struct _pdf_doc_internal
 {
+    char config_bitmap_optimizing;      /* "poly2bitmap": render2 renders through BitmapOutputDev */
+    char config_full_bitmap_optimizing; /* "bitmap"/"bitmapfonts": render2 renders through FullBitmapOutputDev (checked first) */
+    char config_print;                  /* "asprint": handed to displayPage as its last argument */
+    gfxparams_t* parameters;            /* per-document settings not handled above; replayed onto the output device in render2 */
+
     int protect;
+    int nocopy;                         /* set in pdf_open when an encrypted PDF fails okToCopy() */
+    int noprint;                        /* set in pdf_open when an encrypted PDF fails okToPrint() */
+    
     PDFDoc*doc;
     Object docinfo;
     InfoOutputDev*info;
-    GFXOutputDev*outputDev;
+
     pdf_page_info_t*pages;
+    char*filename;                      /* strdup'ed copy of the path given to pdf_open; freed in pdf_doc_destroy */
+
+    /* page map: pagemap[pdfpage] = outputpage, newly added slots are filled with -1 */
+    int*pagemap;
+    int pagemap_size;                   /* number of allocated entries */
+    int pagemap_pos;                    /* highest pdfpage index stored so far */
+
+    gfxsource_t*parent;                 /* the gfxsource passed to pdf_open when this document was created */
 } pdf_doc_internal_t;
 
 typedef struct _pdf_page_internal
@@ -46,11 +64,17 @@ typedef struct _pdf_page_internal
 
 typedef struct _dev_output_internal
 {
-    GFXOutputDev*outputDev;
+    CommonOutputDev*outputDev; /* same type render2 uses to hold GFXOutputDev, BitmapOutputDev and FullBitmapOutputDev objects */
 } dev_output_internal_t;
 
 
-static char* dirseparator()
+typedef struct _gfxsource_internal
+{
+    gfxparams_t* parameters; /* every name/value pair given to pdf_setparameter; created in gfxsource_pdf_create, freed in pdf_destroy */
+} gfxsource_internal_t;
+
+
+static const char* dirseparator()
 {
 #ifdef WIN32
     return "\\";
@@ -59,7 +83,6 @@ static char* dirseparator()
 #endif
 }
 
-
 void pdfpage_destroy(gfxpage_t*pdf_page)
 {
     pdf_page_internal_t*i= (pdf_page_internal_t*)pdf_page->internal;
@@ -67,10 +90,50 @@ void pdfpage_destroy(gfxpage_t*pdf_page)
     free(pdf_page);pdf_page=0;
 }
 
-void render2(gfxpage_t*page, gfxdevice_t*output)
+static void render2(gfxpage_t*page, gfxdevice_t*dev, int x,int y, int x1,int y1,int x2,int y2)
 {
     pdf_doc_internal_t*pi = (pdf_doc_internal_t*)page->parent->internal;
+    gfxsource_internal_t*i = (gfxsource_internal_t*)pi->parent->internal;
+
+    if(!pi->config_print && pi->nocopy) {msg("<fatal> PDF disallows copying");exit(0);}
+    if(pi->config_print && pi->noprint) {msg("<fatal> PDF disallows printing");exit(0);}
+
+    CommonOutputDev*outputDev = 0;
+    if(pi->config_full_bitmap_optimizing) {
+       FullBitmapOutputDev*d = new FullBitmapOutputDev(pi->info, pi->doc);
+       outputDev = (CommonOutputDev*)d;
+    } else if(pi->config_bitmap_optimizing) {
+       BitmapOutputDev*d = new BitmapOutputDev(pi->info, pi->doc);
+       outputDev = (CommonOutputDev*)d;
+    } else {
+       GFXOutputDev*d = new GFXOutputDev(pi->info, pi->doc);
+       outputDev = (CommonOutputDev*)d;
+    }
+    /* pass global parameters to PDF driver*/
+    gfxparam_t*p = i->parameters->params;
+    while(p) {
+       outputDev->setParameter(p->key, p->value);
+       p = p->next;
+    }
+    p = pi->parameters->params;
+    while(p) {
+       outputDev->setParameter(p->key, p->value);
+       p = p->next;
+    }
 
+    outputDev->setPageMap(pi->pagemap, pi->pagemap_pos);
+    outputDev->setMove(x,y);
+    outputDev->setClip(x1,y1,x2,y2);
+
+    gfxdevice_t* middev=0;
+    if(multiply>1) {
+       middev = (gfxdevice_t*)malloc(sizeof(gfxdevice_t));
+       gfxdevice_rescale_init(middev, 0x00000000, 0, 0, 1.0 / multiply);
+        gfxdevice_rescale_setdevice(middev, dev);
+       middev->setparameter(middev, "protect", "1");
+       dev = middev;
+    } 
+       
     if(!pi) {
        msg("<fatal> pdf_page_render: Parent PDF this page belongs to doesn't exist yet/anymore");
        return;
@@ -82,37 +145,39 @@ void render2(gfxpage_t*page, gfxdevice_t*output)
     }
 
     if(pi->protect) {
-       gfxdevice_t*dev = pi->outputDev->device;
         dev->setparameter(dev, "protect", "1");
     }
-    pi->outputDev->setInfo(pi->info);
-    pi->outputDev->setXRef(pi->doc, pi->doc->getXRef());
-    pi->doc->displayPage((OutputDev*)pi->outputDev, page->nr, zoom, zoom, /*rotate*/0, true, true, /*doLinks*/(int)1);
-    pi->doc->processLinks((OutputDev*)pi->outputDev, page->nr);
-    pi->outputDev->endframe();
+
+    outputDev->setDevice(dev);
+    pi->doc->displayPage((OutputDev*)outputDev, page->nr, zoom*multiply, zoom*multiply, /*rotate*/0, true, true, pi->config_print);
+    pi->doc->processLinks((OutputDev*)outputDev, page->nr);
+    outputDev->finishPage();
+    outputDev->setDevice(0);
+    delete outputDev;
+
+    if(middev) {
+       gfxdevice_rescale_setdevice(middev, 0x00000000);
+       middev->finish(middev);
+    }
+
 }
 
     
 void pdfpage_render(gfxpage_t*page, gfxdevice_t*output)
 {
     pdf_doc_internal_t*pi = (pdf_doc_internal_t*)page->parent->internal;
-    pi->outputDev->setDevice(output);
-    pi->outputDev->setMove(0,0);
-    pi->outputDev->setClip(0,0,0,0);
-    render2(page, output);
-    pi->outputDev->setDevice(0);
+    render2(page, output, 0,0, 0,0,0,0); /* same move (0,0) and clip (0,0,0,0) the removed setMove/setClip calls used */
 }
 
 void pdfpage_rendersection(gfxpage_t*page, gfxdevice_t*output, gfxcoord_t x, gfxcoord_t y, gfxcoord_t _x1, gfxcoord_t _y1, gfxcoord_t _x2, gfxcoord_t _y2)
 {
-    int x1=(int)_x1,y1=(int)_y1,x2=(int)_x2,y2=(int)_y2;
     pdf_doc_internal_t*pi = (pdf_doc_internal_t*)page->parent->internal;
-    pi->outputDev->setDevice(output);
-    pi->outputDev->setMove((int)x,(int)y);
+    /* clip coordinates are truncated to int; an all-zero rectangle gets x2 bumped to 1 (presumably because 0,0,0,0 means "no clip" as in pdfpage_render -- confirm in setClip) */
+    int x1=(int)_x1,y1=(int)_y1,x2=(int)_x2,y2=(int)_y2;
     if((x1|y1|x2|y2)==0) x2++;
-    pi->outputDev->setClip((int)x1,(int)y1,(int)x2,(int)y2);
-    render2(page, output);
-    pi->outputDev->setDevice(0);
+    /* offset and clip are multiplied by the global "multiply" factor, like the zoom*multiply used in render2 */
+    render2(page, output, (int)x*multiply,(int)y*multiply,
+                          (int)x1*multiply,(int)y1*multiply,(int)x2*multiply,(int)y2*multiply);
 }
 
 void pdf_doc_destroy(gfxdocument_t*gfx)
@@ -123,6 +188,10 @@ void pdf_doc_destroy(gfxdocument_t*gfx)
     free(i->pages); i->pages = 0;
 
     i->docinfo.free();
+
+    if(i->filename) {
+       free(i->filename);i->filename=0;
+    }
     
     if(i->info) {
        delete i->info;i->info=0;
@@ -135,18 +204,53 @@ void pdf_doc_destroy(gfxdocument_t*gfx)
        free(global_page_range);
        global_page_range = 0;
     }
+    
+    /*globalparams_count--;
+    if(!globalparams_count) {
+       delete globalParams;
+       globalParams = 0;
+       globalparams_count = 0;
+    }*/
+}
+
+static void add_page_to_map(gfxdocument_t*gfx, int pdfpage, int outputpage)
+{
+    pdf_doc_internal_t*i= (pdf_doc_internal_t*)gfx->internal;
+    if(pdfpage < 0)
+       return;
+    if(pdfpage >= i->pagemap_size) {
+       int oldlen = i->pagemap_size;
+       i->pagemap_size = oldlen + 1024;
+       if(pdfpage > i->pagemap_size)
+           i->pagemap_size = pdfpage+1;
+
+        if(i->pages) {
+            i->pagemap = (int*)malloc(i->pagemap_size*sizeof(int));
+        } else {
+           i->pagemap = (int*)realloc(i->pages, i->pagemap_size*sizeof(int));
+        }
+       memset(&i->pagemap[oldlen], -1, (i->pagemap_size-oldlen)*sizeof(int));
+    }
+    i->pagemap[pdfpage] = outputpage;
+    if(pdfpage > i->pagemap_pos)
+       i->pagemap_pos = pdfpage;
 }
 
-void pdf_doc_set_parameter(gfxdocument_t*gfx, char*name, char*value)
+void pdf_doc_setparameter(gfxdocument_t*gfx, const char*name, const char*value)
 {
     pdf_doc_internal_t*i= (pdf_doc_internal_t*)gfx->internal;
     if(!strcmp(name, "pagemap")) {
-       GFXOutputDev*o = i->outputDev;
        int pdfpage=0, outputpage=0;
        sscanf(value,"%d:%d", &pdfpage, &outputpage);
-       o->preparePage(pdfpage, outputpage);
+        add_page_to_map(gfx, pdfpage, outputpage); /* value has the form "<pdfpage>:<outputpage>" */
+    } else if(!strcmp(name, "poly2bitmap")) {
+        i->config_bitmap_optimizing = atoi(value);
+    } else if(!strcmp(name, "bitmapfonts") || !strcmp(name, "bitmap")) {
+        i->config_full_bitmap_optimizing = atoi(value);
+    } else if(!strcmp(name, "asprint")) {
+        i->config_print = 1; /* NOTE(review): value is ignored, so "asprint=0" also switches this on */
     } else {
-       msg("<warning> Ignored parameter: %s=%s", name, value);
+        gfxparams_store(i->parameters, name, value); /* anything else is kept and passed to the output device in render2 */
     }
 }
 
@@ -173,13 +277,13 @@ gfxpage_t* pdf_doc_getpage(gfxdocument_t*doc, int page)
     return pdf_page;
 }
 
-static char*getInfoString(Dict *infoDict, char *key)
+static char*getInfoString(Dict *infoDict, const char *key)
 {
     Object obj;
     GString *s1, *s2;
     int i;
 
-    if (infoDict->lookup(key, &obj)->isString()) {
+    if (infoDict && infoDict->lookup((char*)key, &obj)->isString()) {
        s1 = obj.getString();
        if ((s1->getChar(0) & 0xff) == 0xfe &&
            (s1->getChar(1) & 0xff) == 0xff) {
@@ -206,12 +310,12 @@ static char*getInfoString(Dict *infoDict, char *key)
     return strdup("");
 }
 
-static char*getInfoDate(Dict *infoDict, char *key) 
+static char*getInfoDate(Dict *infoDict, const char *key) 
 {
     Object obj;
     char *s;
 
-    if (infoDict->lookup(key, &obj)->isString()) {
+    if (infoDict && infoDict->lookup((char*)key, &obj)->isString()) {
        s = obj.getString()->getCString();
        if (s[0] == 'D' && s[1] == ':') {
          s += 2;
@@ -223,7 +327,7 @@ static char*getInfoDate(Dict *infoDict, char *key)
     return strdup("");
 }
 
-char* pdf_doc_getinfo(gfxdocument_t*doc, char*name)
+char* pdf_doc_getinfo(gfxdocument_t*doc, const char*name)
 {
     pdf_doc_internal_t*i= (pdf_doc_internal_t*)doc->internal;
     if(!strcmp(name, "title")) return getInfoString(i->docinfo.getDict(), "Title");
@@ -246,71 +350,83 @@ char* pdf_doc_getinfo(gfxdocument_t*doc, char*name)
         sprintf(buf, "%.1f", i->doc->getPDFVersion());
         return strdup(buf);
     }
-    return 0;
+    return strdup("");
 }
 
 
-void storeDeviceParameter(char*name, char*value)
-{
-    parameter_t*p = new parameter_t();
-    p->name = strdup(name);
-    p->value = strdup(value);
-    p->next = 0;
-    if(device_config_next) {
-       device_config_next->next = p;
-       device_config_next = p;
-    } else {
-       device_config = p;
-       device_config_next = p;
-    }
-}
+/* shortcut to InfoOutputDev.cc */
+extern int config_addspace;
+extern int config_fontquality;
+extern int config_bigchar;
 
-void pdf_set_parameter(char*name, char*value)
+static void pdf_setparameter(gfxsource_t*src, const char*name, const char*value)
 {
+    gfxsource_internal_t*i = (gfxsource_internal_t*)src->internal;
+        
+    gfxparams_store(i->parameters, name, value);
+
     msg("<verbose> setting parameter %s to \"%s\"", name, value);
     if(!strncmp(name, "fontdir", strlen("fontdir"))) {
         addGlobalFontDir(value);
+    } else if(!strcmp(name, "addspacechars")) {
+       config_addspace = atoi(value);
+       gfxparams_store(i->parameters, "detectspaces", 0);
+    } else if(!strcmp(name, "detectspaces")) {
+       config_addspace = atoi(value);
+    } else if(!strcmp(name, "fontquality")) {
+       config_fontquality = atoi(value);
+    } else if(!strcmp(name, "bigchar")) {
+       config_bigchar = atoi(value);
     } else if(!strcmp(name, "pages")) {
        global_page_range = strdup(value);
-    } else if(!strncmp(name, "font", strlen("font"))) {
+    } else if(!strncmp(name, "font", strlen("font")) && name[4]!='q') {
        addGlobalFont(value);
     } else if(!strncmp(name, "languagedir", strlen("languagedir"))) {
         addGlobalLanguageDir(value);
+    } else if(!strcmp(name, "zoomtowidth")) {
+       zoomtowidth = atoi(value);
     } else if(!strcmp(name, "zoom")) {
        char buf[80];
        zoom = atof(value);
-       sprintf(buf, "%f", (double)jpeg_dpi/(double)zoom);
-       storeDeviceParameter("jpegsubpixels", buf);
-       sprintf(buf, "%f", (double)ppm_dpi/(double)zoom);
-       storeDeviceParameter("ppmsubpixels", buf);
-    } else if(!strcmp(name, "jpegdpi")) {
-       char buf[80];
-       jpeg_dpi = atoi(value);
-       sprintf(buf, "%f", (double)jpeg_dpi/(double)zoom);
-       storeDeviceParameter("jpegsubpixels", buf);
-    } else if(!strcmp(name, "ppmdpi")) {
-       char buf[80];
-       ppm_dpi = atoi(value);
-       sprintf(buf, "%f", (double)ppm_dpi/(double)zoom);
-       storeDeviceParameter("ppmsubpixels", buf);
-    } else {
-       storeDeviceParameter(name,value);
-    }
+    } else if(!strcmp(name, "jpegdpi") || !strcmp(name, "ppmdpi")) {
+       msg("<error> %s not supported anymore. Please use jpegsubpixels/ppmsubpixels");
+    } else if(!strcmp(name, "multiply")) {
+        multiply = atoi(value);
+    } else if(!strcmp(name, "help")) {
+       printf("\nPDF device global parameters:\n");
+       printf("fontdir=<dir>     a directory with additional fonts\n");
+       printf("font=<filename>   an additional font filename\n");
+       printf("pages=<range>     the range of pages to convert (example: pages=1-100,210-)\n");
+       printf("zoom=<dpi>        the resultion (default: 72)\n");
+       printf("languagedir=<dir> Add an xpdf language directory\n");
+       printf("multiply=<times>  Render everything at <times> the resolution\n");
+       printf("poly2bitmap       Convert graphics to bitmaps\n");
+       printf("bitmap            Convert everything to bitmaps\n");
+    }  
 }
 
-gfxdocument_t*pdf_open(char*filename)
+void pdf_doc_prepare(gfxdocument_t*doc, gfxdevice_t*dev)
 {
+    pdf_doc_internal_t*i= (pdf_doc_internal_t*)doc->internal;
+    i->info->dumpfonts(dev); /* i->info is the InfoOutputDev that pdf_open ran the selected pages through */
+}
+
+static gfxdocument_t*pdf_open(gfxsource_t*src, const char*filename)
+{
+    gfxsource_internal_t*isrc = (gfxsource_internal_t*)src->internal;
     gfxdocument_t*pdf_doc = (gfxdocument_t*)malloc(sizeof(gfxdocument_t));
     memset(pdf_doc, 0, sizeof(gfxdocument_t));
     pdf_doc_internal_t*i= (pdf_doc_internal_t*)malloc(sizeof(pdf_doc_internal_t));
     memset(i, 0, sizeof(pdf_doc_internal_t));
+    i->parent = src;
+    i->parameters = gfxparams_new();
     pdf_doc->internal = i;
     char*userPassword=0;
     
-    filename = strdup(filename);
+    i->filename = strdup(filename);
 
     char*x = 0;
-    if((x = strchr(filename, '|'))) {
+    if((x = strchr((char*)filename, '|'))) {
        *x = 0;
        userPassword = x+1;
     }
@@ -318,10 +434,6 @@ gfxdocument_t*pdf_open(char*filename)
     GString *fileName = new GString(filename);
     GString *userPW;
 
-    // read config file
-    if(!globalParams)
-        globalParams = new GlobalParams("");
-
     // open PDF file
     if (userPassword && userPassword[0]) {
       userPW = new GString(userPassword);
@@ -333,7 +445,6 @@ gfxdocument_t*pdf_open(char*filename)
       delete userPW;
     }
     if (!i->doc->isOk()) {
-        printf("xpdf reports document as broken.\n");
         return 0;
     }
 
@@ -344,52 +455,92 @@ gfxdocument_t*pdf_open(char*filename)
     i->protect = 0;
     if (i->doc->isEncrypted()) {
           if(!i->doc->okToCopy()) {
-              printf("PDF disallows copying.\n");
-              return 0;
+              i->nocopy = 1;
+          }
+          if(!i->doc->okToPrint()) {
+              i->noprint = 1;
           }
           if(!i->doc->okToChange() || !i->doc->okToAddNotes())
               i->protect = 1;
     }
+       
+    if(zoomtowidth && i->doc->getNumPages()) {
+       Page*page = i->doc->getCatalog()->getPage(1);
+       PDFRectangle *r = page->getCropBox();
+       double width_before = r->x2 - r->x1;
+       zoom = 72.0 * zoomtowidth / width_before;
+       msg("<notice> Rendering at %f DPI. (Page width at 72 DPI: %f, target width: %d)", zoom, width_before, zoomtowidth);
+    }
 
-    InfoOutputDev*io = new InfoOutputDev();
+    i->info = new InfoOutputDev(i->doc->getXRef());
     int t;
     i->pages = (pdf_page_info_t*)malloc(sizeof(pdf_page_info_t)*pdf_doc->num_pages);
     memset(i->pages,0,sizeof(pdf_page_info_t)*pdf_doc->num_pages);
     for(t=1;t<=pdf_doc->num_pages;t++) {
        if(!global_page_range || is_in_range(t, global_page_range)) {
-           i->doc->displayPage((OutputDev*)io, t, zoom, zoom, /*rotate*/0, /*usemediabox*/true, /*crop*/true, /*doLinks*/(int)1);
-           i->doc->processLinks((OutputDev*)io, t);
-           i->pages[t-1].xMin = io->x1;
-           i->pages[t-1].yMin = io->y1;
-           i->pages[t-1].xMax = io->x2;
-           i->pages[t-1].yMax = io->y2;
-           i->pages[t-1].width = io->x2 - io->x1;
-           i->pages[t-1].height = io->y2 - io->y1;
-           i->pages[t-1].number_of_images = io->num_images;
-           i->pages[t-1].number_of_links = io->num_links;
-           i->pages[t-1].number_of_fonts = io->num_fonts;
+           i->doc->displayPage((OutputDev*)i->info, t, zoom, zoom, /*rotate*/0, /*usemediabox*/true, /*crop*/true, i->config_print);
+           i->doc->processLinks((OutputDev*)i->info, t);
+           i->pages[t-1].xMin = i->info->x1;
+           i->pages[t-1].yMin = i->info->y1;
+           i->pages[t-1].xMax = i->info->x2;
+           i->pages[t-1].yMax = i->info->y2;
+           i->pages[t-1].width = i->info->x2 - i->info->x1;
+           i->pages[t-1].height = i->info->y2 - i->info->y1;
+           i->pages[t-1].number_of_images = i->info->num_ppm_images + i->info->num_jpeg_images;
+           i->pages[t-1].number_of_links = i->info->num_links;
+           i->pages[t-1].number_of_fonts = i->info->num_fonts;
            i->pages[t-1].has_info = 1;
        }
     }
-    i->info = io;
-    i->outputDev = new GFXOutputDev(device_config);
 
     pdf_doc->get = 0;
     pdf_doc->destroy = pdf_doc_destroy;
-    pdf_doc->set_parameter = pdf_doc_set_parameter;
+    pdf_doc->setparameter = pdf_doc_setparameter;
     pdf_doc->getinfo = pdf_doc_getinfo;
     pdf_doc->getpage = pdf_doc_getpage;
+    pdf_doc->prepare = pdf_doc_prepare;
 
-
+    /* pass global parameters to PDF driver*/
+    gfxparam_t*p = isrc->parameters->params;
+    while(p) {
+       pdf_doc->setparameter(pdf_doc, p->key, p->value);
+       p = p->next;
+    }
+    
     return pdf_doc;
+}
+    
+void pdf_destroy(gfxsource_t*src)
+{
+    if(!src->internal)
+       return;
+    gfxsource_internal_t*i = (gfxsource_internal_t*)src->internal;
+    /* release the parameter list that pdf_setparameter filled */
+    gfxparams_free(i->parameters);
+    i->parameters=0;
+    /* NOTE(review): globalParams is deleted below even if another gfxsource still exists; the globalparams_count bookkeeping in this file is commented out */
+    free(src->internal);src->internal=0;
 
+    delete globalParams;globalParams = 0;
+    free(src);
 }
 
 gfxsource_t*gfxsource_pdf_create()
 {
     gfxsource_t*src = (gfxsource_t*)malloc(sizeof(gfxsource_t));
     memset(src, 0, sizeof(gfxsource_t));
-    src->set_parameter = pdf_set_parameter;
+    src->setparameter = pdf_setparameter;
     src->open = pdf_open;
+    src->destroy = pdf_destroy;
+    gfxsource_internal_t*i = (gfxsource_internal_t*)rfx_calloc(sizeof(gfxsource_internal_t));
+    src->internal = (void*)i;
+    i->parameters = gfxparams_new(); /* filled by pdf_setparameter */
+    /* create globalParams only if it is not set yet; pdf_destroy deletes it again */
+    if(!globalParams) {
+        globalParams = new GFXGlobalParams();
+       //globalparams_count++;
+    }
+    
+
     return src;
 }