pdf.js/src/core/worker.js

605 lines
19 KiB
JavaScript
Raw Normal View History

2012-09-01 07:48:21 +09:00
/* Copyright 2012 Mozilla Foundation
*
* Licensed under the Apache License, Version 2.0 (the "License");
* you may not use this file except in compliance with the License.
* You may obtain a copy of the License at
*
* http://www.apache.org/licenses/LICENSE-2.0
*
* Unless required by applicable law or agreed to in writing, software
* distributed under the License is distributed on an "AS IS" BASIS,
* WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
* See the License for the specific language governing permissions and
* limitations under the License.
*/
/* globals PDFJS, createPromiseCapability, LocalPdfManager, NetworkPdfManager,
NetworkManager, isInt, MissingPDFException,
UnexpectedResponseException, PasswordException, Promise, warn,
PasswordResponses, InvalidPDFException, UnknownErrorException,
XRefParseException, Ref, info, globalScope, error, MessageHandler */
2011-10-26 10:18:22 +09:00
'use strict';
2015-10-21 10:50:32 +09:00
var WorkerTask = (function WorkerTaskClosure() {
  /**
   * Bookkeeping object for one asynchronous piece of worker activity. It
   * carries a terminated flag and a promise that settles once the activity
   * reports that it has finished.
   *
   * @param {string} name - Label stored unchanged on the `name` property.
   */
  function WorkerTask(name) {
    this.name = name;
    this.terminated = false;
    this._capability = createPromiseCapability();
  }

  WorkerTask.prototype = {
    /** Promise that is resolved when `finish()` is called. */
    get finished() {
      var capability = this._capability;
      return capability.promise;
    },

    /** Resolves the `finished` promise (with no value). */
    finish: function () {
      var capability = this._capability;
      capability.resolve();
    },

    /** Sets the `terminated` flag; nothing else is changed. */
    terminate: function () {
      this.terminated = true;
    },

    /**
     * Guard to be called from inside the task's work.
     * @throws {Error} If `terminate()` has been called on this task.
     */
    ensureNotTerminated: function () {
      if (!this.terminated) {
        return;
      }
      throw new Error('Worker task was terminated');
    }
  };

  return WorkerTask;
})();
var WorkerMessageHandler = PDFJS.WorkerMessageHandler = {
2011-10-29 03:23:30 +09:00
setup: function wphSetup(handler) {
2013-02-07 08:19:29 +09:00
var pdfManager;
var terminated = false;
var cancelXHRs = null;
2015-10-21 10:50:32 +09:00
var WorkerTasks = [];
/**
 * Stops the calling code path once the enclosing `terminated` flag is set.
 * @throws {Error} If `terminated` is truthy.
 */
function ensureNotTerminated() {
  if (!terminated) {
    return;
  }
  throw new Error('Worker was terminated');
}
2011-10-09 17:37:53 +09:00
2015-10-21 10:50:32 +09:00
/**
 * Appends a task to the `WorkerTasks` list of in-flight tasks.
 * @param {WorkerTask} task - The task to track.
 */
function startWorkerTask(task) {
  WorkerTasks[WorkerTasks.length] = task;
}
/**
 * Marks a task as finished and stops tracking it in `WorkerTasks`.
 *
 * `task.finish()` is always called. The task is removed from the list only
 * when it is actually present: `indexOf` returns -1 for an unknown task, and
 * `splice(-1, 1)` would otherwise drop the last (unrelated) tracked task.
 *
 * @param {WorkerTask} task - The task that has completed.
 */
function finishWorkerTask(task) {
  task.finish();
  var i = WorkerTasks.indexOf(task);
  if (i >= 0) {
    WorkerTasks.splice(i, 1);
  }
}
2013-02-07 08:19:29 +09:00
/**
 * Runs the document parsing stages on the enclosing `pdfManager` and
 * collects the basic document information.
 *
 * The stages `checkHeader`, `parseStartXRef` and `parse` are requested one
 * after another through `pdfManager.ensureDoc`. The chain is flat so that a
 * failure in any stage, including a synchronous throw while starting the
 * next one, rejects the returned promise rather than leaving it pending.
 *
 * @param {boolean} recoveryMode - Passed through as the only argument of the
 *   `parse` stage.
 * @returns {Promise} Resolved with `{ numPages, fingerprint, encrypted }`,
 *   or rejected with the reason of the failing stage.
 */
function loadDocument(recoveryMode) {
  var loadDocumentCapability = createPromiseCapability();

  function parseFailure(e) {
    loadDocumentCapability.reject(e);
  }

  function parseSuccess() {
    var numPagesPromise = pdfManager.ensureDoc('numPages');
    var fingerprintPromise = pdfManager.ensureDoc('fingerprint');
    var encryptedPromise = pdfManager.ensureXRef('encrypt');
    Promise.all([numPagesPromise, fingerprintPromise,
                 encryptedPromise]).then(function onDocReady(results) {
      var doc = {
        numPages: results[0],
        fingerprint: results[1],
        // Only the presence of the xref `encrypt` value is reported.
        encrypted: !!results[2],
      };
      loadDocumentCapability.resolve(doc);
    }, parseFailure);
  }

  pdfManager.ensureDoc('checkHeader', []).then(function () {
    return pdfManager.ensureDoc('parseStartXRef', []);
  }).then(function () {
    return pdfManager.ensureDoc('parse', [recoveryMode]);
  }).then(parseSuccess, parseFailure);

  return loadDocumentCapability.promise;
}
/**
 * Creates the PDF manager that matches how the document is supplied.
 *
 * - `source.data` set: a LocalPdfManager over that data.
 * - `source.chunkedViewerLoading` set: a NetworkPdfManager driven through
 *   `handler`.
 * - otherwise: `source.url` is requested in full through a NetworkManager.
 *   Depending on the response headers this either switches to a
 *   NetworkPdfManager, or waits for the complete file and wraps it in a
 *   LocalPdfManager.
 *
 * While the full request is pending, the enclosing `cancelXHRs` is set to a
 * function aborting it; it is reset to null once the request has been dealt
 * with.
 *
 * @param {Object} data - Request payload; `data.source` and
 *   `data.disableRange` are read. `source.length` and
 *   `source.disableAutoFetch` may be written.
 * @returns {Promise} Resolved with the created manager, rejected with
 *   whatever the manager constructor throws.
 */
function getPdfManager(data) {
  var pdfManagerCapability = createPromiseCapability();
  var pdfManager;

  var source = data.source;
  var disableRange = data.disableRange;

  // Builds the manager through `create` and settles the capability with the
  // outcome. `pdfManager` stays unset when the constructor throws.
  function settleWith(create) {
    try {
      pdfManager = create();
      pdfManagerCapability.resolve(pdfManager);
    } catch (ex) {
      pdfManagerCapability.reject(ex);
    }
  }

  function createNetworkManager() {
    return new NetworkPdfManager(source, handler);
  }

  if (source.data) {
    settleWith(function () {
      return new LocalPdfManager(source.data, source.password);
    });
    return pdfManagerCapability.promise;
  } else if (source.chunkedViewerLoading) {
    settleWith(createNetworkManager);
    return pdfManagerCapability.promise;
  }

  var networkManager = new NetworkManager(source.url, {
    httpHeaders: source.httpHeaders,
    withCredentials: source.withCredentials
  });
  // Chunks that arrive before any manager exists; joined in `onDone`.
  var cachedChunks = [];
  var fullRequestXhrId = networkManager.requestFull({
    onHeadersReceived: function onHeadersReceived() {
      if (disableRange) {
        return;
      }

      var fullRequestXhr = networkManager.getRequestXhr(fullRequestXhrId);
      if (fullRequestXhr.getResponseHeader('Accept-Ranges') !== 'bytes') {
        return;
      }

      var contentEncoding =
        fullRequestXhr.getResponseHeader('Content-Encoding') || 'identity';
      if (contentEncoding !== 'identity') {
        return;
      }

      var length = fullRequestXhr.getResponseHeader('Content-Length');
      length = parseInt(length, 10);
      if (!isInt(length)) {
        return;
      }
      source.length = length;
      if (length <= 2 * source.rangeChunkSize) {
        // The file size is smaller than the size of two chunks, so it does
        // not make any sense to abort the request and retry with a range
        // request.
        return;
      }

      if (networkManager.isStreamingRequest(fullRequestXhrId)) {
        // We can continue fetching when progressive loading is enabled,
        // and we don't need the autoFetch feature.
        source.disableAutoFetch = true;
      } else {
        // NOTE: by cancelling the full request, and then issuing range
        // requests, there will be an issue for sites where you can only
        // request the pdf once. However, if this is the case, then the
        // server should not be returning that it can support range
        // requests.
        networkManager.abortRequest(fullRequestXhrId);
      }

      settleWith(createNetworkManager);
      cancelXHRs = null;
    },

    onProgressiveData: source.disableStream ? null :
        function onProgressiveData(chunk) {
      if (!pdfManager) {
        cachedChunks.push(chunk);
        return;
      }
      pdfManager.sendProgressiveData(chunk);
    },

    onDone: function onDone(args) {
      if (pdfManager) {
        return; // already processed
      }

      var pdfFile;
      if (args === null) {
        // TODO add some streaming manager, e.g. for unknown length files.
        // The data was returned in the onProgressiveData, combining...
        var pdfFileLength = 0, pos = 0;
        cachedChunks.forEach(function (chunk) {
          pdfFileLength += chunk.byteLength;
        });
        if (source.length && pdfFileLength !== source.length) {
          warn('reported HTTP length is different from actual');
        }
        var pdfFileArray = new Uint8Array(pdfFileLength);
        cachedChunks.forEach(function (chunk) {
          pdfFileArray.set(new Uint8Array(chunk), pos);
          pos += chunk.byteLength;
        });
        pdfFile = pdfFileArray.buffer;
      } else {
        pdfFile = args.chunk;
      }

      // the data is array, instantiating directly from it
      settleWith(function () {
        return new LocalPdfManager(pdfFile, source.password);
      });
      cancelXHRs = null;
    },

    // NOTE(review): this path reports the failure through `handler` only;
    // the returned promise is neither resolved nor rejected here.
    onError: function onError(status) {
      var exception;
      if (status === 404 || (status === 0 && /^file:/.test(source.url))) {
        exception = new MissingPDFException('Missing PDF "' +
                                            source.url + '".');
        handler.send('MissingPDF', exception);
      } else {
        exception = new UnexpectedResponseException(
          'Unexpected server response (' + status +
          ') while retrieving PDF "' + source.url + '".', status);
        handler.send('UnexpectedResponse', exception);
      }
      cancelXHRs = null;
    },

    onProgress: function onProgress(evt) {
      handler.send('DocProgress', {
        loaded: evt.loaded,
        total: evt.lengthComputable ? evt.total : source.length
      });
    }
  });

  cancelXHRs = function () {
    networkManager.abortRequest(fullRequestXhrId);
  };

  return pdfManagerCapability.promise;
}
// Capability probe: answers a 'test' message with either `false` or an
// object describing typed-array and transfer support.
handler.on('test', function wphSetupTest(data) {
  // check if Uint8Array can be sent to worker
  if (!(data instanceof Uint8Array)) {
    handler.send('test', false);
    return;
  }
  // making sure postMessage transfers are working
  var supportTransfers = data[0] === 255;
  handler.postMessageTransfers = supportTransfers;
  // check if the response property is supported by xhr
  var xhr = new XMLHttpRequest();
  var responseExists = 'response' in xhr;
  // check if the property is actually implemented
  try {
    // Only the property read matters here; the value itself is unused.
    var dummy = xhr.responseType;
  } catch (e) {
    responseExists = false;
  }
  if (!responseExists) {
    handler.send('test', false);
    return;
  }
  handler.send('test', {
    supportTypedArray: true,
    supportTransfers: supportTransfers
  });
});
// Handles 'GetDocRequest': copies the per-document settings onto PDFJS,
// creates the PDF manager, loads the document and reports the outcome to the
// main thread ('GetDoc' on success, a specific error message otherwise).
handler.on('GetDocRequest', function wphSetupDoc(data) {
  var onSuccess = function(doc) {
    ensureNotTerminated();
    handler.send('GetDoc', { pdfInfo: doc });
  };

  // Maps a failure reason onto the message name that is sent back.
  var onFailure = function(e) {
    if (e instanceof PasswordException) {
      if (e.code === PasswordResponses.NEED_PASSWORD) {
        handler.send('NeedPassword', e);
      } else if (e.code === PasswordResponses.INCORRECT_PASSWORD) {
        handler.send('IncorrectPassword', e);
      }
    } else if (e instanceof InvalidPDFException) {
      handler.send('InvalidPDF', e);
    } else if (e instanceof MissingPDFException) {
      handler.send('MissingPDF', e);
    } else if (e instanceof UnexpectedResponseException) {
      handler.send('UnexpectedResponse', e);
    } else {
      handler.send('UnknownError',
                   new UnknownErrorException(e.message, e.toString()));
    }
  };

  ensureNotTerminated();

  PDFJS.maxImageSize = data.maxImageSize === undefined ?
    -1 : data.maxImageSize;
  PDFJS.disableFontFace = data.disableFontFace;
  PDFJS.disableCreateObjectURL = data.disableCreateObjectURL;
  PDFJS.verbosity = data.verbosity;
  PDFJS.cMapUrl = data.cMapUrl === undefined ?
    null : data.cMapUrl;
  PDFJS.cMapPacked = data.cMapPacked === true;

  getPdfManager(data).then(function (newPdfManager) {
    if (terminated) {
      // We were in a process of setting up the manager, but it got
      // terminated in the middle.
      newPdfManager.terminate();
      throw new Error('Worker was terminated');
    }

    pdfManager = newPdfManager;
    handler.send('PDFManagerReady', null);
    pdfManager.onLoadedStream().then(function(stream) {
      handler.send('DataLoaded', { length: stream.bytes.byteLength });
    });
  }).then(function pdfManagerReady() {
    ensureNotTerminated();

    // `then` takes two callbacks only; a former third argument was ignored
    // and has been dropped.
    loadDocument(false).then(onSuccess, function loadFailure(ex) {
      ensureNotTerminated();

      // Try again with recoveryMode == true
      if (!(ex instanceof XRefParseException)) {
        if (ex instanceof PasswordException) {
          // after password exception prepare to receive a new password
          // to repeat loading
          pdfManager.passwordChanged().then(pdfManagerReady);
        }

        onFailure(ex);
        return;
      }

      pdfManager.requestLoadedStream();
      pdfManager.onLoadedStream().then(function() {
        ensureNotTerminated();

        loadDocument(true).then(onSuccess, onFailure);
      });
    });
  }, onFailure);
});
// Handles 'GetPage': fetches the page at `data.pageIndex` and returns a
// promise for its `rotate`, `ref` and `view` values.
handler.on('GetPage', function wphSetupGetPage(data) {
  return pdfManager.getPage(data.pageIndex).then(function(page) {
    var rotatePromise = pdfManager.ensure(page, 'rotate');
    var refPromise = pdfManager.ensure(page, 'ref');
    var viewPromise = pdfManager.ensure(page, 'view');

    return Promise.all([rotatePromise, refPromise, viewPromise]).then(
        function(results) {
      return {
        rotate: results[0],
        ref: results[1],
        view: results[2]
      };
    });
  });
});
2011-10-09 17:37:53 +09:00
// Handles 'GetPageIndex': rebuilds a Ref from the num/gen pair in `data.ref`
// and asks the document catalog for the matching page index.
handler.on('GetPageIndex', function wphSetupGetPageIndex(data) {
  var pageRef = new Ref(data.ref.num, data.ref.gen);
  return pdfManager.pdfDocument.catalog.getPageIndex(pageRef);
});
2013-02-07 08:19:29 +09:00
// Handles 'GetDestinations': returns the catalog's `destinations` value as
// obtained through `pdfManager.ensureCatalog`.
handler.on('GetDestinations',
  function wphSetupGetDestinations(data) {
    return pdfManager.ensureCatalog('destinations');
  }
);
// Handles 'GetDestination': calls the catalog's `getDestination` with
// `data.id` as its single argument.
handler.on('GetDestination', function wphSetupGetDestination(data) {
  return pdfManager.ensureCatalog('getDestination', [ data.id ]);
});
// Handles 'GetAttachments': returns the catalog's `attachments` value as
// obtained through `pdfManager.ensureCatalog`.
handler.on('GetAttachments', function wphSetupGetAttachments(data) {
  return pdfManager.ensureCatalog('attachments');
});
2014-05-08 04:15:34 +09:00
// Handles 'GetJavaScript': returns the catalog's `javaScript` value as
// obtained through `pdfManager.ensureCatalog`.
handler.on('GetJavaScript',
  function wphSetupGetJavaScript(data) {
    return pdfManager.ensureCatalog('javaScript');
  }
);
2014-05-08 04:06:44 +09:00
// Handles 'GetOutline': returns the catalog's `documentOutline` value as
// obtained through `pdfManager.ensureCatalog`.
handler.on('GetOutline',
  function wphSetupGetOutline(data) {
    return pdfManager.ensureCatalog('documentOutline');
  }
);
// Handles 'GetMetadata': returns a promise for a two-element array holding
// the document's `documentInfo` and the catalog's `metadata`, in that order.
handler.on('GetMetadata', function wphSetupGetMetadata(data) {
  var infoPromise = pdfManager.ensureDoc('documentInfo');
  var metadataPromise = pdfManager.ensureCatalog('metadata');
  return Promise.all([infoPromise, metadataPromise]);
});
// Handles 'GetData': requests the fully loaded stream and returns a promise
// for its `bytes`.
handler.on('GetData', function wphSetupGetData(data) {
  pdfManager.requestLoadedStream();
  return pdfManager.onLoadedStream().then(function(stream) {
    return stream.bytes;
  });
});
// Handles 'GetStats': returns the `stats` object of the document's xref.
handler.on('GetStats', function wphSetupGetStats(data) {
  var xref = pdfManager.pdfDocument.xref;
  return xref.stats;
});
// Handles 'UpdatePassword': forwards the message payload unchanged to
// `pdfManager.updatePassword`. Nothing is returned.
handler.on(
  'UpdatePassword',
  function wphSetupUpdatePassword(data) {
    pdfManager.updatePassword(data);
  }
);
// Handles 'GetAnnotations': fetches the page at `data.pageIndex` and returns
// a promise for the result of calling its `getAnnotationsData` with no
// arguments.
handler.on('GetAnnotations', function wphSetupGetAnnotations(data) {
  var pagePromise = pdfManager.getPage(data.pageIndex);
  return pagePromise.then(function (page) {
    return pdfManager.ensure(page, 'getAnnotationsData', []);
  });
});
// Handles 'RenderPageRequest': builds the operator list for the page at
// `data.pageIndex` as a tracked WorkerTask. A failure is reported to the main
// thread as a 'PageError' message unless the task was terminated.
handler.on('RenderPageRequest', function wphSetupRenderPage(data) {
  var pageIndex = data.pageIndex;
  pdfManager.getPage(pageIndex).then(function(page) {
    var task = new WorkerTask('RenderPageRequest: page ' + pageIndex);
    startWorkerTask(task);

    var pageNum = pageIndex + 1;
    var start = Date.now();
    // Pre compile the pdf page and fetch the fonts/images.
    page.getOperatorList(handler, task, data.intent).then(
        function(operatorList) {
      finishWorkerTask(task);

      info('page=' + pageNum + ' - getOperatorList: time=' +
           (Date.now() - start) + 'ms, len=' + operatorList.totalLength);
    }, function(e) {
      finishWorkerTask(task);
      if (task.terminated) {
        return; // ignoring errors from the terminated thread
      }

      var minimumStackMessage =
        'worker.js: while trying to getPage() and getOperatorList()';

      var wrappedException;

      // Turn the error into an obj that can be serialized
      if (typeof e === 'string') {
        wrappedException = {
          message: e,
          stack: minimumStackMessage
        };
      } else if (e !== null && typeof e === 'object') {
        // `typeof null` is also 'object'; null must not reach this branch
        // because reading `e.message` from it would throw.
        wrappedException = {
          message: e.message || e.toString(),
          stack: e.stack || minimumStackMessage
        };
      } else {
        wrappedException = {
          message: 'Unknown exception type: ' + (typeof e),
          stack: minimumStackMessage
        };
      }

      handler.send('PageError', {
        pageNum: pageNum,
        error: wrappedException,
        intent: data.intent
      });
    });
  });
}, this);
2011-10-09 17:37:53 +09:00
// Handles 'GetTextContent': extracts the text content of the page at
// `data.pageIndex` as a tracked WorkerTask and returns a promise for it.
// A failure of a terminated task is swallowed; any other failure is rethrown.
handler.on('GetTextContent', function wphExtractText(data) {
  var pageIndex = data.pageIndex;
  return pdfManager.getPage(pageIndex).then(function(page) {
    var task = new WorkerTask('GetTextContent: page ' + pageIndex);
    startWorkerTask(task);
    var pageNum = pageIndex + 1;
    var start = Date.now();
    return page.extractTextContent(task).then(function(textContent) {
      finishWorkerTask(task);
      info('text indexing: page=' + pageNum + ' - time=' +
           (Date.now() - start) + 'ms');
      return textContent;
    }, function (reason) {
      finishWorkerTask(task);
      if (task.terminated) {
        return; // ignoring errors from the terminated thread
      }
      throw reason;
    });
  });
});
// Handles 'Cleanup': returns the result of `pdfManager.cleanup()`.
handler.on('Cleanup', function wphCleanup(data) {
  return pdfManager.cleanup();
});
// Handles 'Terminate': sets the `terminated` flag, terminates and drops the
// PDF manager, aborts a pending full request, and flags every tracked task
// as terminated. The returned promise resolves (with no value) once all of
// those tasks have finished.
handler.on('Terminate', function wphTerminate(data) {
  terminated = true;
  if (pdfManager) {
    pdfManager.terminate();
    pdfManager = null;
  }
  if (cancelXHRs) {
    cancelXHRs();
  }

  var waitOn = [];
  WorkerTasks.forEach(function (task) {
    // Collect the promise first, then flag the task.
    waitOn.push(task.finished);
    task.terminate();
  });

  return Promise.all(waitOn).then(function () {});
});
}
2011-10-09 17:37:53 +09:00
};
2011-10-26 07:43:41 +09:00
// Start times of running timers, keyed by timer name. The map has no
// prototype, so names such as 'constructor' or 'toString' are not mistaken
// for existing timers.
var consoleTimer = Object.create(null);

// Minimal console replacement that forwards its output via
// `globalScope.postMessage`.
var workerConsole = {
  // Posts all arguments as a 'console_log' message.
  log: function log() {
    var args = Array.prototype.slice.call(arguments);
    globalScope.postMessage({
      action: 'console_log',
      data: args
    });
  },

  // Posts all arguments as a 'console_error' message and then throws.
  // NOTE: the thrown value is a string, kept as-is for existing callers.
  error: function error() {
    var args = Array.prototype.slice.call(arguments);
    globalScope.postMessage({
      action: 'console_error',
      data: args
    });
    throw 'pdf.js execution error';
  },

  // Records the current time under `name`.
  time: function time(name) {
    consoleTimer[name] = Date.now();
  },

  // Logs the time elapsed since `time(name)`. An unknown name is reported
  // through the file-level `error` function (not the method above).
  timeEnd: function timeEnd(name) {
    var time = consoleTimer[name];
    if (!time) {
      error('Unknown timer name ' + name);
    }
    this.log('Timer:', name, Date.now() - time);
  }
};
2011-10-26 07:43:41 +09:00
2014-01-16 06:28:31 +09:00
2011-10-26 07:43:41 +09:00
// Worker thread?
// When no `window` exists, install the console fallback if needed, forward
// unsupported-feature notifications, and attach the message handler.
if (typeof window === 'undefined') {
  if (!('console' in globalScope)) {
    globalScope.console = workerConsole;
  }

  // Listen for unsupported features so we can pass them on to the main thread.
  PDFJS.UnsupportedManager.listen(function (msg) {
    globalScope.postMessage({
      action: '_unsupported_feature',
      data: msg
    });
  });

  var handler = new MessageHandler('worker_processor', this);
  WorkerMessageHandler.setup(handler);
}