2011-10-25 10:13:12 +09:00
|
|
|
/* -*- Mode: Java; tab-width: 2; indent-tabs-mode: nil; c-basic-offset: 2 -*- */
|
|
|
|
/* vim: set shiftwidth=2 tabstop=2 autoindent cindent expandtab: */
|
|
|
|
|
2011-10-26 10:18:22 +09:00
|
|
|
'use strict';
|
|
|
|
|
|
|
|
var globalScope = (typeof window === 'undefined') ? this : window;
|
|
|
|
|
2011-12-03 17:16:40 +09:00
|
|
|
var isWorker = (typeof window == 'undefined');
|
|
|
|
|
2011-10-25 10:13:12 +09:00
|
|
|
var ERRORS = 0, WARNINGS = 1, TODOS = 5;
|
|
|
|
var verbosity = WARNINGS;
|
2011-10-26 07:43:41 +09:00
|
|
|
|
2011-10-27 03:46:57 +09:00
|
|
|
// The global PDFJS object exposes the API
|
2011-10-26 07:43:41 +09:00
|
|
|
// In production, it will be declared outside a global wrapper
|
|
|
|
// In development, it will be declared here
|
2011-10-27 03:46:57 +09:00
|
|
|
if (!globalScope.PDFJS) {
|
|
|
|
globalScope.PDFJS = {};
|
2011-10-26 07:43:41 +09:00
|
|
|
}
|
|
|
|
|
2011-10-25 10:13:12 +09:00
|
|
|
// getPdf()
|
|
|
|
// Convenience function to perform binary Ajax GET
|
|
|
|
// Usage: getPdf('http://...', callback)
|
|
|
|
// getPdf({
|
|
|
|
// url:String ,
|
|
|
|
// [,progress:Function, error:Function]
|
|
|
|
// },
|
|
|
|
// callback)
|
|
|
|
function getPdf(arg, callback) {
|
|
|
|
var params = arg;
|
|
|
|
if (typeof arg === 'string')
|
|
|
|
params = { url: arg };
|
|
|
|
|
|
|
|
var xhr = new XMLHttpRequest();
|
|
|
|
xhr.open('GET', params.url);
|
|
|
|
xhr.mozResponseType = xhr.responseType = 'arraybuffer';
|
2011-12-06 08:48:21 +09:00
|
|
|
xhr.expected = (params.url.indexOf('file:') === 0) ? 0 : 200;
|
2011-10-25 10:13:12 +09:00
|
|
|
|
|
|
|
if ('progress' in params)
|
|
|
|
xhr.onprogress = params.progress || undefined;
|
|
|
|
|
|
|
|
if ('error' in params)
|
|
|
|
xhr.onerror = params.error || undefined;
|
|
|
|
|
2011-11-30 04:28:05 +09:00
|
|
|
xhr.onreadystatechange = function getPdfOnreadystatechange(e) {
|
|
|
|
if (xhr.readyState === 4) {
|
|
|
|
if (xhr.status === xhr.expected) {
|
|
|
|
var data = (xhr.mozResponseArrayBuffer || xhr.mozResponse ||
|
|
|
|
xhr.responseArrayBuffer || xhr.response);
|
|
|
|
callback(data);
|
2011-12-02 02:11:33 +09:00
|
|
|
} else if (params.error) {
|
2011-11-30 04:28:05 +09:00
|
|
|
params.error(e);
|
|
|
|
}
|
2011-10-25 10:13:12 +09:00
|
|
|
}
|
|
|
|
};
|
|
|
|
xhr.send(null);
|
|
|
|
}
|
2011-10-27 03:46:57 +09:00
|
|
|
globalScope.PDFJS.getPdf = getPdf;
|
2011-10-25 10:13:12 +09:00
|
|
|
|
2011-12-09 07:18:43 +09:00
|
|
|
var Page = (function PageClosure() {
|
|
|
|
function Page(xref, pageNumber, pageDict, ref) {
|
2011-10-25 10:13:12 +09:00
|
|
|
this.pageNumber = pageNumber;
|
|
|
|
this.pageDict = pageDict;
|
|
|
|
this.stats = {
|
|
|
|
create: Date.now(),
|
|
|
|
compile: 0.0,
|
|
|
|
fonts: 0.0,
|
|
|
|
images: 0.0,
|
|
|
|
render: 0.0
|
|
|
|
};
|
|
|
|
this.xref = xref;
|
|
|
|
this.ref = ref;
|
2011-11-29 09:55:09 +09:00
|
|
|
|
2011-12-23 03:04:53 +09:00
|
|
|
this.displayReadyPromise = null;
|
2011-10-25 10:13:12 +09:00
|
|
|
}
|
|
|
|
|
2011-12-09 07:18:43 +09:00
|
|
|
Page.prototype = {
|
2011-10-25 10:13:12 +09:00
|
|
|
getPageProp: function pageGetPageProp(key) {
|
|
|
|
return this.xref.fetchIfRef(this.pageDict.get(key));
|
|
|
|
},
|
|
|
|
inheritPageProp: function pageInheritPageProp(key) {
|
|
|
|
var dict = this.pageDict;
|
|
|
|
var obj = dict.get(key);
|
|
|
|
while (obj === undefined) {
|
|
|
|
dict = this.xref.fetchIfRef(dict.get('Parent'));
|
|
|
|
if (!dict)
|
|
|
|
break;
|
|
|
|
obj = dict.get(key);
|
|
|
|
}
|
|
|
|
return obj;
|
|
|
|
},
|
|
|
|
get content() {
|
|
|
|
return shadow(this, 'content', this.getPageProp('Contents'));
|
|
|
|
},
|
|
|
|
get resources() {
|
|
|
|
return shadow(this, 'resources', this.inheritPageProp('Resources'));
|
|
|
|
},
|
|
|
|
get mediaBox() {
|
|
|
|
var obj = this.inheritPageProp('MediaBox');
|
|
|
|
// Reset invalid media box to letter size.
|
|
|
|
if (!isArray(obj) || obj.length !== 4)
|
|
|
|
obj = [0, 0, 612, 792];
|
|
|
|
return shadow(this, 'mediaBox', obj);
|
|
|
|
},
|
|
|
|
get view() {
|
|
|
|
var obj = this.inheritPageProp('CropBox');
|
|
|
|
var view = {
|
|
|
|
x: 0,
|
|
|
|
y: 0,
|
|
|
|
width: this.width,
|
|
|
|
height: this.height
|
|
|
|
};
|
2011-12-31 09:52:15 +09:00
|
|
|
var mediaBox = this.mediaBox;
|
|
|
|
var offsetX = mediaBox[0], offsetY = mediaBox[1];
|
2011-10-25 10:13:12 +09:00
|
|
|
if (isArray(obj) && obj.length == 4) {
|
2011-12-31 09:52:15 +09:00
|
|
|
var tl = this.rotatePoint(obj[0] - offsetX, obj[1] - offsetY);
|
|
|
|
var br = this.rotatePoint(obj[2] - offsetX, obj[3] - offsetY);
|
2011-10-25 10:13:12 +09:00
|
|
|
view.x = Math.min(tl.x, br.x);
|
|
|
|
view.y = Math.min(tl.y, br.y);
|
|
|
|
view.width = Math.abs(tl.x - br.x);
|
|
|
|
view.height = Math.abs(tl.y - br.y);
|
|
|
|
}
|
|
|
|
|
|
|
|
return shadow(this, 'cropBox', view);
|
|
|
|
},
|
|
|
|
get annotations() {
|
|
|
|
return shadow(this, 'annotations', this.inheritPageProp('Annots'));
|
|
|
|
},
|
|
|
|
get width() {
|
|
|
|
var mediaBox = this.mediaBox;
|
|
|
|
var rotate = this.rotate;
|
|
|
|
var width;
|
|
|
|
if (rotate == 0 || rotate == 180) {
|
|
|
|
width = (mediaBox[2] - mediaBox[0]);
|
|
|
|
} else {
|
|
|
|
width = (mediaBox[3] - mediaBox[1]);
|
|
|
|
}
|
|
|
|
return shadow(this, 'width', width);
|
|
|
|
},
|
|
|
|
get height() {
|
|
|
|
var mediaBox = this.mediaBox;
|
|
|
|
var rotate = this.rotate;
|
|
|
|
var height;
|
|
|
|
if (rotate == 0 || rotate == 180) {
|
|
|
|
height = (mediaBox[3] - mediaBox[1]);
|
|
|
|
} else {
|
|
|
|
height = (mediaBox[2] - mediaBox[0]);
|
|
|
|
}
|
|
|
|
return shadow(this, 'height', height);
|
|
|
|
},
|
|
|
|
get rotate() {
|
|
|
|
var rotate = this.inheritPageProp('Rotate') || 0;
|
|
|
|
// Normalize rotation so it's a multiple of 90 and between 0 and 270
|
|
|
|
if (rotate % 90 != 0) {
|
|
|
|
rotate = 0;
|
|
|
|
} else if (rotate >= 360) {
|
|
|
|
rotate = rotate % 360;
|
|
|
|
} else if (rotate < 0) {
|
|
|
|
// The spec doesn't cover negatives, assume its counterclockwise
|
|
|
|
// rotation. The following is the other implementation of modulo.
|
|
|
|
rotate = ((rotate % 360) + 360) % 360;
|
|
|
|
}
|
|
|
|
return shadow(this, 'rotate', rotate);
|
|
|
|
},
|
|
|
|
|
2011-10-30 19:41:55 +09:00
|
|
|
startRenderingFromIRQueue: function pageStartRenderingFromIRQueue(
|
2011-10-25 10:13:12 +09:00
|
|
|
IRQueue, fonts) {
|
|
|
|
var self = this;
|
|
|
|
this.IRQueue = IRQueue;
|
|
|
|
|
|
|
|
var displayContinuation = function pageDisplayContinuation() {
|
|
|
|
// Always defer call to display() to work around bug in
|
|
|
|
// Firefox error reporting from XHR callbacks.
|
|
|
|
setTimeout(function pageSetTimeout() {
|
2011-12-23 03:04:53 +09:00
|
|
|
self.displayReadyPromise.resolve();
|
2011-10-25 10:13:12 +09:00
|
|
|
});
|
|
|
|
};
|
|
|
|
|
2011-10-30 19:41:55 +09:00
|
|
|
this.ensureFonts(fonts,
|
|
|
|
function pageStartRenderingFromIRQueueEnsureFonts() {
|
2011-10-25 10:13:12 +09:00
|
|
|
displayContinuation();
|
|
|
|
});
|
|
|
|
},
|
|
|
|
|
2011-10-30 19:41:55 +09:00
|
|
|
getIRQueue: function pageGetIRQueue(handler, dependency) {
|
2011-10-25 10:13:12 +09:00
|
|
|
if (this.IRQueue) {
|
|
|
|
// content was compiled
|
|
|
|
return this.IRQueue;
|
|
|
|
}
|
|
|
|
|
|
|
|
var xref = this.xref;
|
|
|
|
var content = xref.fetchIfRef(this.content);
|
|
|
|
var resources = xref.fetchIfRef(this.resources);
|
|
|
|
if (isArray(content)) {
|
|
|
|
// fetching items
|
|
|
|
var i, n = content.length;
|
|
|
|
for (i = 0; i < n; ++i)
|
|
|
|
content[i] = xref.fetchIfRef(content[i]);
|
|
|
|
content = new StreamsSequenceStream(content);
|
|
|
|
}
|
|
|
|
|
|
|
|
var pe = this.pe = new PartialEvaluator(
|
|
|
|
xref, handler, 'p' + this.pageNumber + '_');
|
|
|
|
var IRQueue = {};
|
2011-11-04 06:26:58 +09:00
|
|
|
return (this.IRQueue = pe.getIRQueue(content, resources, IRQueue,
|
|
|
|
dependency));
|
2011-10-25 10:13:12 +09:00
|
|
|
},
|
|
|
|
|
2011-10-30 19:41:55 +09:00
|
|
|
ensureFonts: function pageEnsureFonts(fonts, callback) {
|
2011-10-25 10:13:12 +09:00
|
|
|
// Convert the font names to the corresponding font obj.
|
2011-11-03 04:21:45 +09:00
|
|
|
for (var i = 0, ii = fonts.length; i < ii; i++) {
|
2011-10-25 10:13:12 +09:00
|
|
|
fonts[i] = this.objs.objs[fonts[i]].data;
|
|
|
|
}
|
|
|
|
|
|
|
|
// Load all the fonts
|
|
|
|
var fontObjs = FontLoader.bind(
|
|
|
|
fonts,
|
2011-10-30 19:41:55 +09:00
|
|
|
function pageEnsureFontsFontObjs(fontObjs) {
|
2011-10-25 10:13:12 +09:00
|
|
|
this.stats.fonts = Date.now();
|
|
|
|
|
|
|
|
callback.call(this);
|
|
|
|
}.bind(this),
|
|
|
|
this.objs
|
|
|
|
);
|
|
|
|
},
|
|
|
|
|
2011-10-30 19:41:55 +09:00
|
|
|
display: function pageDisplay(gfx, callback) {
|
2011-10-25 10:13:12 +09:00
|
|
|
var xref = this.xref;
|
|
|
|
var resources = xref.fetchIfRef(this.resources);
|
|
|
|
var mediaBox = xref.fetchIfRef(this.mediaBox);
|
|
|
|
assertWellFormed(isDict(resources), 'invalid page resources');
|
|
|
|
|
|
|
|
gfx.xref = xref;
|
|
|
|
gfx.res = resources;
|
|
|
|
gfx.beginDrawing({ x: mediaBox[0], y: mediaBox[1],
|
|
|
|
width: this.width,
|
|
|
|
height: this.height,
|
|
|
|
rotate: this.rotate });
|
|
|
|
|
|
|
|
var startIdx = 0;
|
|
|
|
var length = this.IRQueue.fnArray.length;
|
|
|
|
var IRQueue = this.IRQueue;
|
|
|
|
|
|
|
|
var self = this;
|
|
|
|
function next() {
|
|
|
|
startIdx = gfx.executeIRQueue(IRQueue, startIdx, next);
|
|
|
|
if (startIdx == length) {
|
|
|
|
self.stats.render = Date.now();
|
2011-10-29 06:37:55 +09:00
|
|
|
gfx.endDrawing();
|
2011-10-25 10:13:12 +09:00
|
|
|
if (callback) callback();
|
|
|
|
}
|
|
|
|
}
|
|
|
|
next();
|
|
|
|
},
|
|
|
|
rotatePoint: function pageRotatePoint(x, y, reverse) {
|
|
|
|
var rotate = reverse ? (360 - this.rotate) : this.rotate;
|
|
|
|
switch (rotate) {
|
|
|
|
case 180:
|
|
|
|
return {x: this.width - x, y: y};
|
|
|
|
case 90:
|
|
|
|
return {x: this.width - y, y: this.height - x};
|
|
|
|
case 270:
|
|
|
|
return {x: y, y: x};
|
|
|
|
case 360:
|
|
|
|
case 0:
|
|
|
|
default:
|
|
|
|
return {x: x, y: this.height - y};
|
|
|
|
}
|
|
|
|
},
|
|
|
|
getLinks: function pageGetLinks() {
|
2011-11-03 10:46:39 +09:00
|
|
|
var links = [];
|
|
|
|
var annotations = pageGetAnnotations();
|
|
|
|
var i, n = annotations.length;
|
|
|
|
for (i = 0; i < n; ++i) {
|
|
|
|
if (annotations[i].type != 'Link')
|
|
|
|
continue;
|
|
|
|
links.push(annotations[i]);
|
|
|
|
}
|
|
|
|
return links;
|
|
|
|
},
|
|
|
|
getAnnotations: function pageGetAnnotations() {
|
2011-10-25 10:13:12 +09:00
|
|
|
var xref = this.xref;
|
2011-11-13 06:39:23 +09:00
|
|
|
function getInheritableProperty(annotation, name) {
|
|
|
|
var item = annotation;
|
|
|
|
while (item && !item.has(name)) {
|
|
|
|
item = xref.fetchIfRef(item.get('Parent'));
|
|
|
|
}
|
|
|
|
if (!item)
|
|
|
|
return null;
|
|
|
|
return item.get(name);
|
|
|
|
}
|
|
|
|
|
2011-10-25 10:13:12 +09:00
|
|
|
var annotations = xref.fetchIfRef(this.annotations) || [];
|
|
|
|
var i, n = annotations.length;
|
2011-11-03 10:46:39 +09:00
|
|
|
var items = [];
|
2011-10-25 10:13:12 +09:00
|
|
|
for (i = 0; i < n; ++i) {
|
2011-11-13 06:39:23 +09:00
|
|
|
var annotationRef = annotations[i];
|
|
|
|
var annotation = xref.fetch(annotationRef);
|
2011-10-25 10:13:12 +09:00
|
|
|
if (!isDict(annotation))
|
|
|
|
continue;
|
|
|
|
var subtype = annotation.get('Subtype');
|
2011-11-03 10:46:39 +09:00
|
|
|
if (!isName(subtype))
|
2011-10-25 10:13:12 +09:00
|
|
|
continue;
|
|
|
|
var rect = annotation.get('Rect');
|
|
|
|
var topLeftCorner = this.rotatePoint(rect[0], rect[1]);
|
|
|
|
var bottomRightCorner = this.rotatePoint(rect[2], rect[3]);
|
|
|
|
|
2011-11-03 10:46:39 +09:00
|
|
|
var item = {};
|
|
|
|
item.type = subtype.name;
|
|
|
|
item.x = Math.min(topLeftCorner.x, bottomRightCorner.x);
|
|
|
|
item.y = Math.min(topLeftCorner.y, bottomRightCorner.y);
|
|
|
|
item.width = Math.abs(topLeftCorner.x - bottomRightCorner.x);
|
|
|
|
item.height = Math.abs(topLeftCorner.y - bottomRightCorner.y);
|
|
|
|
switch (subtype.name) {
|
|
|
|
case 'Link':
|
|
|
|
var a = this.xref.fetchIfRef(annotation.get('A'));
|
|
|
|
if (a) {
|
|
|
|
switch (a.get('S').name) {
|
|
|
|
case 'URI':
|
2011-12-22 07:22:07 +09:00
|
|
|
item.url = a.get('URI');
|
2011-11-03 10:46:39 +09:00
|
|
|
break;
|
|
|
|
case 'GoTo':
|
2011-12-22 07:22:07 +09:00
|
|
|
item.dest = a.get('D');
|
2011-11-03 10:46:39 +09:00
|
|
|
break;
|
|
|
|
default:
|
|
|
|
TODO('other link types');
|
|
|
|
}
|
|
|
|
} else if (annotation.has('Dest')) {
|
|
|
|
// simple destination link
|
|
|
|
var dest = annotation.get('Dest');
|
2011-12-22 07:22:07 +09:00
|
|
|
item.dest = isName(dest) ? dest.name : dest;
|
2011-11-03 10:46:39 +09:00
|
|
|
}
|
|
|
|
break;
|
|
|
|
case 'Widget':
|
2011-11-13 06:39:23 +09:00
|
|
|
var fieldType = getInheritableProperty(annotation, 'FT');
|
2011-11-03 10:46:39 +09:00
|
|
|
if (!isName(fieldType))
|
2011-10-25 10:13:12 +09:00
|
|
|
break;
|
2011-11-03 10:46:39 +09:00
|
|
|
item.fieldType = fieldType.name;
|
2011-11-13 06:39:23 +09:00
|
|
|
// Building the full field name by collecting the field and
|
|
|
|
// its ancestors 'T' properties and joining them using '.'.
|
2011-11-03 10:46:39 +09:00
|
|
|
var fieldName = [];
|
2011-11-13 06:39:23 +09:00
|
|
|
var namedItem = annotation, ref = annotationRef;
|
|
|
|
while (namedItem) {
|
|
|
|
var parentRef = namedItem.get('Parent');
|
|
|
|
var parent = xref.fetchIfRef(parentRef);
|
|
|
|
var name = namedItem.get('T');
|
2011-11-03 10:46:39 +09:00
|
|
|
if (name)
|
2011-11-13 06:39:23 +09:00
|
|
|
fieldName.unshift(stringToPDFString(name));
|
|
|
|
else {
|
|
|
|
// The field name is absent, that means more than one field
|
|
|
|
// with the same name may exist. Replacing the empty name
|
|
|
|
// with the '`' plus index in the parent's 'Kids' array.
|
|
|
|
// This is not in the PDF spec but necessary to id the
|
|
|
|
// the input controls.
|
|
|
|
var kids = xref.fetchIfRef(parent.get('Kids'));
|
|
|
|
var j, jj;
|
|
|
|
for (j = 0, jj = kids.length; j < jj; j++) {
|
|
|
|
if (kids[j].num == ref.num && kids[j].gen == ref.gen)
|
|
|
|
break;
|
|
|
|
}
|
|
|
|
fieldName.unshift('`' + j);
|
|
|
|
}
|
|
|
|
namedItem = parent;
|
|
|
|
ref = parentRef;
|
2011-11-03 10:46:39 +09:00
|
|
|
}
|
|
|
|
item.fullName = fieldName.join('.');
|
|
|
|
var alternativeText = stringToPDFString(annotation.get('TU') || '');
|
|
|
|
item.alternativeText = alternativeText;
|
2011-11-13 06:39:23 +09:00
|
|
|
var da = getInheritableProperty(annotation, 'DA') || '';
|
2011-11-03 10:46:39 +09:00
|
|
|
var m = /([\d\.]+)\sTf/.exec(da);
|
|
|
|
if (m)
|
|
|
|
item.fontSize = parseFloat(m[1]);
|
2011-11-13 06:39:23 +09:00
|
|
|
item.textAlignment = getInheritableProperty(annotation, 'Q');
|
|
|
|
item.flags = getInheritableProperty(annotation, 'Ff') || 0;
|
2011-11-03 10:46:39 +09:00
|
|
|
break;
|
2011-12-22 07:22:07 +09:00
|
|
|
case 'Text':
|
|
|
|
var content = annotation.get('Contents');
|
|
|
|
var title = annotation.get('T');
|
2011-12-22 07:37:52 +09:00
|
|
|
item.content = stringToPDFString(content || '');
|
|
|
|
item.title = stringToPDFString(title || '');
|
2011-12-22 07:22:07 +09:00
|
|
|
item.name = annotation.get('Name').name;
|
|
|
|
break;
|
2011-12-22 07:37:52 +09:00
|
|
|
default:
|
2011-12-22 07:22:07 +09:00
|
|
|
TODO('unimplemented annotation type: ' + subtype.name);
|
|
|
|
break;
|
2011-10-25 10:13:12 +09:00
|
|
|
}
|
2011-11-03 10:46:39 +09:00
|
|
|
items.push(item);
|
2011-10-25 10:13:12 +09:00
|
|
|
}
|
2011-11-03 10:46:39 +09:00
|
|
|
return items;
|
2011-10-25 10:13:12 +09:00
|
|
|
},
|
2011-11-03 00:23:42 +09:00
|
|
|
startRendering: function pageStartRendering(ctx, callback, textLayer) {
|
2011-10-25 10:13:12 +09:00
|
|
|
this.startRenderingTime = Date.now();
|
2011-12-23 03:04:53 +09:00
|
|
|
|
|
|
|
// If there is no displayReadyPromise yet, then the IRQueue was never
|
|
|
|
// requested before. Make the request and create the promise.
|
|
|
|
if (!this.displayReadyPromise) {
|
|
|
|
this.pdf.startRendering(this);
|
|
|
|
this.displayReadyPromise = new Promise();
|
|
|
|
}
|
|
|
|
|
|
|
|
// Once the IRQueue and fonts are loaded, perform the actual rendering.
|
|
|
|
this.displayReadyPromise.then(function pageDisplayReadyPromise() {
|
|
|
|
var gfx = new CanvasGraphics(ctx, this.objs, textLayer);
|
|
|
|
try {
|
|
|
|
this.display(gfx, callback);
|
|
|
|
} catch (e) {
|
|
|
|
if (self.callback)
|
|
|
|
self.callback(e);
|
|
|
|
else
|
|
|
|
throw e;
|
|
|
|
}
|
|
|
|
}.bind(this));
|
2011-10-25 10:13:12 +09:00
|
|
|
}
|
|
|
|
};
|
|
|
|
|
2011-12-09 07:18:43 +09:00
|
|
|
return Page;
|
2011-10-25 10:13:12 +09:00
|
|
|
})();
|
|
|
|
|
|
|
|
/**
|
|
|
|
* The `PDFDocModel` holds all the data of the PDF file. Compared to the
|
|
|
|
* `PDFDoc`, this one doesn't have any job management code.
|
|
|
|
* Right now there exists one PDFDocModel on the main thread + one object
|
|
|
|
* for each worker. If there is no worker support enabled, there are two
|
|
|
|
* `PDFDocModel` objects on the main thread created.
|
|
|
|
* TODO: Refactor the internal object structure, such that there is no
|
|
|
|
* need for the `PDFDocModel` anymore and there is only one object on the
|
|
|
|
* main thread and not one entire copy on each worker instance.
|
|
|
|
*/
|
2011-12-09 07:18:43 +09:00
|
|
|
var PDFDocModel = (function PDFDocModelClosure() {
|
|
|
|
function PDFDocModel(arg, callback) {
|
2011-10-25 10:13:12 +09:00
|
|
|
if (isStream(arg))
|
|
|
|
init.call(this, arg);
|
|
|
|
else if (isArrayBuffer(arg))
|
|
|
|
init.call(this, new Stream(arg));
|
|
|
|
else
|
|
|
|
error('PDFDocModel: Unknown argument type');
|
|
|
|
}
|
|
|
|
|
|
|
|
function init(stream) {
|
|
|
|
assertWellFormed(stream.length > 0, 'stream must have data');
|
|
|
|
this.stream = stream;
|
|
|
|
this.setup();
|
2011-11-03 10:46:39 +09:00
|
|
|
this.acroForm = this.xref.fetchIfRef(this.catalog.catDict.get('AcroForm'));
|
2011-10-25 10:13:12 +09:00
|
|
|
}
|
|
|
|
|
|
|
|
function find(stream, needle, limit, backwards) {
|
|
|
|
var pos = stream.pos;
|
|
|
|
var end = stream.end;
|
|
|
|
var str = '';
|
|
|
|
if (pos + limit > end)
|
|
|
|
limit = end - pos;
|
|
|
|
for (var n = 0; n < limit; ++n)
|
|
|
|
str += stream.getChar();
|
|
|
|
stream.pos = pos;
|
|
|
|
var index = backwards ? str.lastIndexOf(needle) : str.indexOf(needle);
|
|
|
|
if (index == -1)
|
|
|
|
return false; /* not found */
|
|
|
|
stream.pos += index;
|
|
|
|
return true; /* found */
|
|
|
|
}
|
|
|
|
|
2011-12-09 07:18:43 +09:00
|
|
|
PDFDocModel.prototype = {
|
2011-10-25 10:13:12 +09:00
|
|
|
get linearization() {
|
|
|
|
var length = this.stream.length;
|
|
|
|
var linearization = false;
|
|
|
|
if (length) {
|
|
|
|
linearization = new Linearization(this.stream);
|
|
|
|
if (linearization.length != length)
|
|
|
|
linearization = false;
|
|
|
|
}
|
|
|
|
// shadow the prototype getter with a data property
|
|
|
|
return shadow(this, 'linearization', linearization);
|
|
|
|
},
|
|
|
|
get startXRef() {
|
|
|
|
var stream = this.stream;
|
|
|
|
var startXRef = 0;
|
|
|
|
var linearization = this.linearization;
|
|
|
|
if (linearization) {
|
|
|
|
// Find end of first obj.
|
|
|
|
stream.reset();
|
|
|
|
if (find(stream, 'endobj', 1024))
|
|
|
|
startXRef = stream.pos + 6;
|
|
|
|
} else {
|
2011-12-05 07:00:22 +09:00
|
|
|
// Find startxref by jumping backward from the end of the file.
|
|
|
|
var step = 1024;
|
2011-12-03 07:33:00 +09:00
|
|
|
var found = false, pos = stream.end;
|
2011-12-05 07:00:22 +09:00
|
|
|
while (!found && pos > 0) {
|
|
|
|
pos -= step - 'startxref'.length;
|
2011-12-03 07:33:00 +09:00
|
|
|
if (pos < 0)
|
|
|
|
pos = 0;
|
|
|
|
stream.pos = pos;
|
2011-12-05 07:00:22 +09:00
|
|
|
found = find(stream, 'startxref', step, true);
|
2011-12-03 07:33:00 +09:00
|
|
|
}
|
|
|
|
if (found) {
|
2011-10-25 10:13:12 +09:00
|
|
|
stream.skip(9);
|
|
|
|
var ch;
|
|
|
|
do {
|
|
|
|
ch = stream.getChar();
|
|
|
|
} while (Lexer.isSpace(ch));
|
|
|
|
var str = '';
|
|
|
|
while ((ch - '0') <= 9) {
|
|
|
|
str += ch;
|
|
|
|
ch = stream.getChar();
|
|
|
|
}
|
|
|
|
startXRef = parseInt(str, 10);
|
|
|
|
if (isNaN(startXRef))
|
|
|
|
startXRef = 0;
|
|
|
|
}
|
|
|
|
}
|
|
|
|
// shadow the prototype getter with a data property
|
|
|
|
return shadow(this, 'startXRef', startXRef);
|
|
|
|
},
|
|
|
|
get mainXRefEntriesOffset() {
|
|
|
|
var mainXRefEntriesOffset = 0;
|
|
|
|
var linearization = this.linearization;
|
|
|
|
if (linearization)
|
|
|
|
mainXRefEntriesOffset = linearization.mainXRefEntriesOffset;
|
|
|
|
// shadow the prototype getter with a data property
|
|
|
|
return shadow(this, 'mainXRefEntriesOffset', mainXRefEntriesOffset);
|
|
|
|
},
|
|
|
|
// Find the header, remove leading garbage and setup the stream
|
|
|
|
// starting from the header.
|
|
|
|
checkHeader: function pdfDocCheckHeader() {
|
|
|
|
var stream = this.stream;
|
|
|
|
stream.reset();
|
|
|
|
if (find(stream, '%PDF-', 1024)) {
|
|
|
|
// Found the header, trim off any garbage before it.
|
|
|
|
stream.moveStart();
|
|
|
|
return;
|
|
|
|
}
|
|
|
|
// May not be a PDF file, continue anyway.
|
|
|
|
},
|
|
|
|
setup: function pdfDocSetup(ownerPassword, userPassword) {
|
|
|
|
this.checkHeader();
|
|
|
|
this.xref = new XRef(this.stream,
|
|
|
|
this.startXRef,
|
|
|
|
this.mainXRefEntriesOffset);
|
|
|
|
this.catalog = new Catalog(this.xref);
|
2011-12-26 23:07:24 +09:00
|
|
|
if (this.xref.trailer && this.xref.trailer.has('ID')) {
|
2011-12-23 06:29:01 +09:00
|
|
|
var fileID = '';
|
|
|
|
this.xref.trailer.get('ID')[0].split('').forEach(function(el) {
|
|
|
|
fileID += Number(el.charCodeAt(0)).toString(16);
|
|
|
|
});
|
|
|
|
this.fileID = fileID;
|
|
|
|
}
|
2011-10-25 10:13:12 +09:00
|
|
|
},
|
|
|
|
get numPages() {
|
|
|
|
var linearization = this.linearization;
|
|
|
|
var num = linearization ? linearization.numPages : this.catalog.numPages;
|
|
|
|
// shadow the prototype getter
|
|
|
|
return shadow(this, 'numPages', num);
|
|
|
|
},
|
2011-12-23 07:44:42 +09:00
|
|
|
getFingerprint: function pdfDocGetFingerprint() {
|
2011-12-26 23:07:24 +09:00
|
|
|
if (this.fileID) {
|
2011-12-23 07:44:42 +09:00
|
|
|
return this.fileID;
|
|
|
|
} else {
|
2011-12-26 23:07:24 +09:00
|
|
|
// If we got no fileID, then we generate one,
|
|
|
|
// from the first 100 bytes of PDF
|
2011-12-23 07:44:42 +09:00
|
|
|
var data = this.stream.bytes.subarray(0, 100);
|
|
|
|
var hash = calculateMD5(data, 0, data.length);
|
|
|
|
var strHash = '';
|
2011-12-26 23:07:24 +09:00
|
|
|
for (var i = 0, length = hash.length; i < length; i++) {
|
2011-12-23 07:44:42 +09:00
|
|
|
strHash += Number(hash[i]).toString(16);
|
|
|
|
}
|
|
|
|
|
|
|
|
return strHash;
|
|
|
|
}
|
|
|
|
},
|
2011-10-25 10:13:12 +09:00
|
|
|
getPage: function pdfDocGetPage(n) {
|
|
|
|
return this.catalog.getPage(n);
|
|
|
|
}
|
|
|
|
};
|
|
|
|
|
2011-12-09 07:18:43 +09:00
|
|
|
return PDFDocModel;
|
2011-10-25 10:13:12 +09:00
|
|
|
})();
|
|
|
|
|
2011-12-09 07:18:43 +09:00
|
|
|
var PDFDoc = (function PDFDocClosure() {
|
|
|
|
function PDFDoc(arg, callback) {
|
2011-10-25 10:13:12 +09:00
|
|
|
var stream = null;
|
|
|
|
var data = null;
|
|
|
|
|
|
|
|
if (isStream(arg)) {
|
|
|
|
stream = arg;
|
|
|
|
data = arg.bytes;
|
|
|
|
} else if (isArrayBuffer(arg)) {
|
|
|
|
stream = new Stream(arg);
|
|
|
|
data = arg;
|
|
|
|
} else {
|
|
|
|
error('PDFDoc: Unknown argument type');
|
|
|
|
}
|
|
|
|
|
|
|
|
this.data = data;
|
|
|
|
this.stream = stream;
|
|
|
|
this.pdf = new PDFDocModel(stream);
|
2011-12-23 07:44:42 +09:00
|
|
|
this.fingerprint = this.pdf.getFingerprint();
|
2011-10-25 10:13:12 +09:00
|
|
|
this.catalog = this.pdf.catalog;
|
|
|
|
this.objs = new PDFObjects();
|
|
|
|
|
|
|
|
this.pageCache = [];
|
2011-11-11 02:33:45 +09:00
|
|
|
this.fontsLoading = {};
|
2011-11-02 04:23:48 +09:00
|
|
|
this.workerReadyPromise = new Promise('workerReady');
|
2011-10-25 10:13:12 +09:00
|
|
|
|
2011-11-02 04:23:48 +09:00
|
|
|
// If worker support isn't disabled explicit and the browser has worker
|
|
|
|
// support, create a new web worker and test if it/the browser fullfills
|
|
|
|
// all requirements to run parts of pdf.js in a web worker.
|
|
|
|
// Right now, the requirement is, that an Uint8Array is still an Uint8Array
|
|
|
|
// as it arrives on the worker. Chrome added this with version 15.
|
|
|
|
if (!globalScope.PDFJS.disableWorker && typeof Worker !== 'undefined') {
|
2011-11-02 03:32:20 +09:00
|
|
|
var workerSrc = PDFJS.workerSrc;
|
|
|
|
if (typeof workerSrc === 'undefined') {
|
|
|
|
throw 'No PDFJS.workerSrc specified';
|
2011-10-28 21:32:36 +09:00
|
|
|
}
|
2011-11-02 03:32:20 +09:00
|
|
|
|
2011-11-11 02:33:45 +09:00
|
|
|
try {
|
|
|
|
// Some versions of FF can't create a worker on localhost, see:
|
|
|
|
// https://bugzilla.mozilla.org/show_bug.cgi?id=683280
|
2011-12-28 23:21:32 +09:00
|
|
|
var worker = new Worker(workerSrc);
|
2011-12-29 01:32:54 +09:00
|
|
|
|
2011-12-28 23:21:32 +09:00
|
|
|
var messageHandler = new MessageHandler('main', worker);
|
|
|
|
// Tell the worker the file it was created from.
|
|
|
|
messageHandler.send('workerSrc', workerSrc);
|
|
|
|
messageHandler.on('test', function pdfDocTest(supportTypedArray) {
|
|
|
|
if (supportTypedArray) {
|
|
|
|
this.worker = worker;
|
|
|
|
this.setupMessageHandler(messageHandler);
|
|
|
|
} else {
|
|
|
|
globalScope.PDFJS.disableWorker = true;
|
|
|
|
this.setupFakeWorker();
|
|
|
|
}
|
|
|
|
}.bind(this));
|
2011-10-25 10:13:12 +09:00
|
|
|
|
2011-12-28 23:21:32 +09:00
|
|
|
var testObj = new Uint8Array(1);
|
2011-12-29 03:57:12 +09:00
|
|
|
// Some versions of Opera throw a DATA_CLONE_ERR on
|
2011-12-29 01:32:54 +09:00
|
|
|
// serializing the typed array.
|
2011-12-28 17:10:06 +09:00
|
|
|
messageHandler.send('test', testObj);
|
2011-12-28 23:21:32 +09:00
|
|
|
return;
|
|
|
|
} catch (e) {}
|
2011-11-02 04:23:48 +09:00
|
|
|
}
|
2011-12-28 23:23:39 +09:00
|
|
|
// Either workers are disabled, not supported or have thrown an exception.
|
2011-12-28 23:21:32 +09:00
|
|
|
// Thus, we fallback to a faked worker.
|
|
|
|
globalScope.PDFJS.disableWorker = true;
|
|
|
|
this.setupFakeWorker();
|
2011-11-02 04:23:48 +09:00
|
|
|
}
|
|
|
|
|
2011-12-09 07:18:43 +09:00
|
|
|
PDFDoc.prototype = {
|
2011-11-02 04:23:48 +09:00
|
|
|
setupFakeWorker: function() {
|
2011-10-25 10:13:12 +09:00
|
|
|
// If we don't use a worker, just post/sendMessage to the main thread.
|
2011-11-02 04:23:48 +09:00
|
|
|
var fakeWorker = {
|
2011-10-30 19:41:55 +09:00
|
|
|
postMessage: function pdfDocPostMessage(obj) {
|
2011-11-02 04:23:48 +09:00
|
|
|
fakeWorker.onmessage({data: obj});
|
2011-10-25 10:13:12 +09:00
|
|
|
},
|
2011-10-30 19:41:55 +09:00
|
|
|
terminate: function pdfDocTerminate() {}
|
2011-10-25 10:13:12 +09:00
|
|
|
};
|
|
|
|
|
2011-11-03 23:30:53 +09:00
|
|
|
var messageHandler = new MessageHandler('main', fakeWorker);
|
|
|
|
this.setupMessageHandler(messageHandler);
|
2011-10-25 10:13:12 +09:00
|
|
|
|
2011-11-02 04:23:48 +09:00
|
|
|
// If the main thread is our worker, setup the handling for the messages
|
|
|
|
// the main thread sends to it self.
|
2011-11-03 23:30:53 +09:00
|
|
|
WorkerMessageHandler.setup(messageHandler);
|
2011-11-02 04:23:48 +09:00
|
|
|
},
|
2011-10-25 10:13:12 +09:00
|
|
|
|
|
|
|
|
2011-11-03 23:30:53 +09:00
|
|
|
setupMessageHandler: function(messageHandler) {
|
|
|
|
this.messageHandler = messageHandler;
|
2011-10-25 10:13:12 +09:00
|
|
|
|
2011-11-03 23:30:53 +09:00
|
|
|
messageHandler.on('page', function pdfDocPage(data) {
|
2011-11-02 04:23:48 +09:00
|
|
|
var pageNum = data.pageNum;
|
|
|
|
var page = this.pageCache[pageNum];
|
|
|
|
var depFonts = data.depFonts;
|
2011-10-25 10:13:12 +09:00
|
|
|
|
2011-11-02 04:23:48 +09:00
|
|
|
page.startRenderingFromIRQueue(data.IRQueue, depFonts);
|
|
|
|
}, this);
|
2011-10-25 10:13:12 +09:00
|
|
|
|
2011-11-03 23:30:53 +09:00
|
|
|
messageHandler.on('obj', function pdfDocObj(data) {
|
2011-11-02 04:23:48 +09:00
|
|
|
var id = data[0];
|
|
|
|
var type = data[1];
|
|
|
|
|
|
|
|
switch (type) {
|
|
|
|
case 'JpegStream':
|
2011-12-09 14:18:04 +09:00
|
|
|
var imageData = data[2];
|
|
|
|
loadJpegStream(id, imageData, this.objs);
|
|
|
|
break;
|
2011-12-09 05:50:34 +09:00
|
|
|
case 'Image':
|
2011-12-08 08:36:27 +09:00
|
|
|
var imageData = data[2];
|
|
|
|
this.objs.resolve(id, imageData);
|
2011-11-02 04:27:19 +09:00
|
|
|
break;
|
2011-11-02 04:23:48 +09:00
|
|
|
case 'Font':
|
|
|
|
var name = data[2];
|
|
|
|
var file = data[3];
|
|
|
|
var properties = data[4];
|
|
|
|
|
|
|
|
if (file) {
|
2011-11-30 07:50:19 +09:00
|
|
|
// Rewrap the ArrayBuffer in a stream.
|
2011-11-02 04:23:48 +09:00
|
|
|
var fontFileDict = new Dict();
|
2011-11-30 07:50:19 +09:00
|
|
|
file = new Stream(file, 0, file.length, fontFileDict);
|
2011-11-02 04:23:48 +09:00
|
|
|
}
|
2011-10-25 10:13:12 +09:00
|
|
|
|
2011-11-02 04:23:48 +09:00
|
|
|
// For now, resolve the font object here direclty. The real font
|
|
|
|
// object is then created in FontLoader.bind().
|
|
|
|
this.objs.resolve(id, {
|
|
|
|
name: name,
|
|
|
|
file: file,
|
|
|
|
properties: properties
|
|
|
|
});
|
2011-11-02 04:27:19 +09:00
|
|
|
break;
|
2011-11-02 04:23:48 +09:00
|
|
|
default:
|
|
|
|
throw 'Got unkown object type ' + type;
|
|
|
|
}
|
|
|
|
}, this);
|
2011-10-25 10:13:12 +09:00
|
|
|
|
2011-11-03 23:30:53 +09:00
|
|
|
messageHandler.on('font_ready', function pdfDocFontReady(data) {
|
2011-11-02 04:23:48 +09:00
|
|
|
var id = data[0];
|
|
|
|
var font = new FontShape(data[1]);
|
2011-10-25 10:13:12 +09:00
|
|
|
|
2011-11-02 04:23:48 +09:00
|
|
|
// If there is no string, then there is nothing to attach to the DOM.
|
|
|
|
if (!font.str) {
|
|
|
|
this.objs.resolve(id, font);
|
|
|
|
} else {
|
|
|
|
this.objs.setData(id, font);
|
|
|
|
}
|
|
|
|
}.bind(this));
|
|
|
|
|
2011-11-29 09:55:09 +09:00
|
|
|
messageHandler.on('page_error', function pdfDocError(data) {
|
|
|
|
var page = this.pageCache[data.pageNum];
|
2011-12-03 03:19:43 +09:00
|
|
|
if (page.callback)
|
|
|
|
page.callback(data.error);
|
2011-11-29 09:55:09 +09:00
|
|
|
else
|
|
|
|
throw data.error;
|
|
|
|
}, this);
|
|
|
|
|
2011-12-15 07:02:00 +09:00
|
|
|
messageHandler.on('jpeg_decode', function(data, promise) {
|
|
|
|
var imageData = data[0];
|
|
|
|
var components = data[1];
|
2011-12-09 05:50:34 +09:00
|
|
|
if (components != 3 && components != 1)
|
|
|
|
error('Only 3 component or 1 component can be returned');
|
|
|
|
|
2011-12-08 08:36:27 +09:00
|
|
|
var img = new Image();
|
|
|
|
img.onload = (function jpegImageLoaderOnload() {
|
|
|
|
var width = img.width;
|
|
|
|
var height = img.height;
|
2011-12-09 05:50:34 +09:00
|
|
|
var size = width * height;
|
|
|
|
var rgbaLength = size * 4;
|
|
|
|
var buf = new Uint8Array(size * components);
|
2011-12-13 08:09:05 +09:00
|
|
|
var tmpCanvas = new ScratchCanvas(width, height);
|
|
|
|
var tmpCtx = tmpCanvas.getContext('2d');
|
|
|
|
tmpCtx.drawImage(img, 0, 0);
|
|
|
|
var data = tmpCtx.getImageData(0, 0, width, height).data;
|
2011-12-09 05:50:34 +09:00
|
|
|
|
|
|
|
if (components == 3) {
|
|
|
|
for (var i = 0, j = 0; i < rgbaLength; i += 4, j += 3) {
|
|
|
|
buf[j] = data[i];
|
|
|
|
buf[j + 1] = data[i + 1];
|
|
|
|
buf[j + 2] = data[i + 2];
|
|
|
|
}
|
2011-12-13 02:26:24 +09:00
|
|
|
} else if (components == 1) {
|
2011-12-09 05:50:34 +09:00
|
|
|
for (var i = 0, j = 0; i < rgbaLength; i += 4, j++) {
|
|
|
|
buf[j] = data[i];
|
|
|
|
}
|
2011-12-08 08:36:27 +09:00
|
|
|
}
|
2011-12-15 07:02:00 +09:00
|
|
|
promise.resolve({ data: buf, width: width, height: height});
|
2011-12-08 08:36:27 +09:00
|
|
|
}).bind(this);
|
|
|
|
var src = 'data:image/jpeg;base64,' + window.btoa(imageData);
|
|
|
|
img.src = src;
|
|
|
|
});
|
|
|
|
|
2011-11-02 04:23:48 +09:00
|
|
|
setTimeout(function pdfDocFontReadySetTimeout() {
|
2011-11-03 23:30:53 +09:00
|
|
|
messageHandler.send('doc', this.data);
|
2011-11-02 04:23:48 +09:00
|
|
|
this.workerReadyPromise.resolve(true);
|
|
|
|
}.bind(this));
|
|
|
|
},
|
2011-10-25 10:13:12 +09:00
|
|
|
|
|
|
|
get numPages() {
|
|
|
|
return this.pdf.numPages;
|
|
|
|
},
|
|
|
|
|
2011-10-30 19:41:55 +09:00
|
|
|
startRendering: function pdfDocStartRendering(page) {
|
2011-10-25 10:13:12 +09:00
|
|
|
// The worker might not be ready to receive the page request yet.
|
2011-10-30 19:41:55 +09:00
|
|
|
this.workerReadyPromise.then(function pdfDocStartRenderingThen() {
|
2011-11-03 23:30:53 +09:00
|
|
|
this.messageHandler.send('page_request', page.pageNumber + 1);
|
2011-10-25 10:13:12 +09:00
|
|
|
}.bind(this));
|
|
|
|
},
|
|
|
|
|
2011-10-30 19:41:55 +09:00
|
|
|
getPage: function pdfDocGetPage(n) {
|
2011-10-25 10:13:12 +09:00
|
|
|
if (this.pageCache[n])
|
|
|
|
return this.pageCache[n];
|
|
|
|
|
|
|
|
var page = this.pdf.getPage(n);
|
|
|
|
// Add a reference to the objects such that Page can forward the reference
|
|
|
|
// to the CanvasGraphics and so on.
|
|
|
|
page.objs = this.objs;
|
|
|
|
page.pdf = this;
|
2011-11-04 06:26:58 +09:00
|
|
|
return (this.pageCache[n] = page);
|
2011-10-25 10:13:12 +09:00
|
|
|
},
|
|
|
|
|
2011-10-30 19:41:55 +09:00
|
|
|
destroy: function pdfDocDestroy() {
|
2011-10-25 10:13:12 +09:00
|
|
|
if (this.worker)
|
|
|
|
this.worker.terminate();
|
|
|
|
|
|
|
|
if (this.fontWorker)
|
|
|
|
this.fontWorker.terminate();
|
|
|
|
|
|
|
|
for (var n in this.pageCache)
|
|
|
|
delete this.pageCache[n];
|
|
|
|
|
|
|
|
delete this.data;
|
|
|
|
delete this.stream;
|
|
|
|
delete this.pdf;
|
|
|
|
delete this.catalog;
|
|
|
|
}
|
|
|
|
};
|
|
|
|
|
2011-12-09 07:18:43 +09:00
|
|
|
return PDFDoc;
|
2011-10-25 10:13:12 +09:00
|
|
|
})();
|
2011-10-28 03:51:10 +09:00
|
|
|
|
2011-10-27 03:46:57 +09:00
|
|
|
globalScope.PDFJS.PDFDoc = PDFDoc;
|
2011-10-28 03:51:10 +09:00
|
|
|
|