2014-08-14 05:04:47 +09:00
|
|
|
/* Any copyright is dedicated to the Public Domain.
|
|
|
|
* http://creativecommons.org/publicdomain/zero/1.0/ */
|
|
|
|
|
|
|
|
//
|
|
|
|
// Node tool to dump SVG output into a file.
|
|
|
|
//
|
|
|
|
|
|
|
|
var fs = require('fs');
|
2017-06-21 20:12:34 +09:00
|
|
|
var util = require('util');
|
|
|
|
var path = require('path');
|
|
|
|
var stream = require('stream');
|
2014-08-14 05:04:47 +09:00
|
|
|
|
|
|
|
// HACK few hacks to let PDF.js be loaded not as a module in global space.
|
2017-07-06 18:55:18 +09:00
|
|
|
require('./domstubs.js').setStubs(global);
|
2014-10-22 23:59:20 +09:00
|
|
|
|
2017-05-11 08:28:18 +09:00
|
|
|
// Run `gulp dist-install` to generate 'pdfjs-dist' npm package files.
|
|
|
|
var pdfjsLib = require('pdfjs-dist');
|
2014-08-14 05:04:47 +09:00
|
|
|
|
|
|
|
// Loading file from file system into typed array
|
|
|
|
var pdfPath = process.argv[2] || '../../web/compressed.tracemonkey-pldi-09.pdf';
|
|
|
|
var data = new Uint8Array(fs.readFileSync(pdfPath));
|
|
|
|
|
2017-06-21 20:12:34 +09:00
|
|
|
var outputDirectory = './svgdump';
|
|
|
|
|
|
|
|
try {
|
|
|
|
// Note: This creates a directory only one level deep. If you want to create
|
|
|
|
// multiple subdirectories on the fly, use the mkdirp module from npm.
|
|
|
|
fs.mkdirSync(outputDirectory);
|
|
|
|
} catch (e) {
|
|
|
|
if (e.code !== 'EEXIST') {
|
|
|
|
throw e;
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
2014-08-14 05:04:47 +09:00
|
|
|
// Dumps svg outputs to a folder called svgdump
|
2017-06-21 20:12:34 +09:00
|
|
|
function getFilePathForPage(pageNum) {
|
|
|
|
var name = path.basename(pdfPath, path.extname(pdfPath));
|
|
|
|
return path.join(outputDirectory, name + '-' + pageNum + '.svg');
|
2014-08-14 05:04:47 +09:00
|
|
|
}
|
|
|
|
|
2017-06-21 20:12:34 +09:00
|
|
|
/**
|
|
|
|
* A readable stream which offers a stream representing the serialization of a
|
|
|
|
* given DOM element (as defined by domstubs.js).
|
|
|
|
*
|
|
|
|
* @param {object} options
|
|
|
|
* @param {DOMElement} options.svgElement The element to serialize
|
|
|
|
*/
|
|
|
|
function ReadableSVGStream(options) {
|
|
|
|
if (!(this instanceof ReadableSVGStream)) {
|
|
|
|
return new ReadableSVGStream(options);
|
|
|
|
}
|
|
|
|
stream.Readable.call(this, options);
|
|
|
|
this.serializer = options.svgElement.getSerializer();
|
|
|
|
}
|
|
|
|
util.inherits(ReadableSVGStream, stream.Readable);
|
|
|
|
// Implements https://nodejs.org/api/stream.html#stream_readable_read_size_1
|
|
|
|
ReadableSVGStream.prototype._read = function() {
|
|
|
|
var chunk;
|
|
|
|
while ((chunk = this.serializer.getNext()) !== null) {
|
|
|
|
if (!this.push(chunk)) {
|
|
|
|
return;
|
|
|
|
}
|
|
|
|
}
|
|
|
|
this.push(null);
|
|
|
|
};
|
2014-08-14 05:04:47 +09:00
|
|
|
|
2017-06-21 20:12:34 +09:00
|
|
|
// Streams the SVG element to the given file path.
|
|
|
|
function writeSvgToFile(svgElement, filePath) {
|
|
|
|
var readableSvgStream = new ReadableSVGStream({
|
|
|
|
svgElement: svgElement,
|
|
|
|
});
|
|
|
|
var writableStream = fs.createWriteStream(filePath);
|
|
|
|
return new Promise(function(resolve, reject) {
|
|
|
|
readableSvgStream.once('error', reject);
|
|
|
|
writableStream.once('error', reject);
|
|
|
|
writableStream.once('finish', resolve);
|
|
|
|
readableSvgStream.pipe(writableStream);
|
|
|
|
}).catch(function(err) {
|
|
|
|
readableSvgStream = null; // Explicitly null because of v8 bug 6512.
|
|
|
|
writableStream.end();
|
|
|
|
throw err;
|
|
|
|
});
|
2014-08-14 05:04:47 +09:00
|
|
|
}
|
|
|
|
|
|
|
|
// Will be using promises to load document, pages and misc data instead of
|
|
|
|
// callback.
|
2017-04-05 00:18:25 +09:00
|
|
|
pdfjsLib.getDocument({
|
|
|
|
data: data,
|
2017-05-08 12:32:44 +09:00
|
|
|
// Try to export JPEG images directly if they don't need any further processing.
|
|
|
|
nativeImageDecoderSupport: pdfjsLib.NativeImageDecoding.DISPLAY
|
2017-04-05 00:18:25 +09:00
|
|
|
}).then(function (doc) {
|
2014-08-14 05:04:47 +09:00
|
|
|
var numPages = doc.numPages;
|
|
|
|
console.log('# Document Loaded');
|
|
|
|
console.log('Number of Pages: ' + numPages);
|
|
|
|
console.log();
|
|
|
|
|
|
|
|
var lastPromise = Promise.resolve(); // will be used to chain promises
|
|
|
|
var loadPage = function (pageNum) {
|
|
|
|
return doc.getPage(pageNum).then(function (page) {
|
|
|
|
console.log('# Page ' + pageNum);
|
|
|
|
var viewport = page.getViewport(1.0 /* scale */);
|
|
|
|
console.log('Size: ' + viewport.width + 'x' + viewport.height);
|
|
|
|
console.log();
|
2015-02-03 00:12:52 +09:00
|
|
|
|
2014-08-14 05:04:47 +09:00
|
|
|
return page.getOperatorList().then(function (opList) {
|
2016-03-29 06:44:27 +09:00
|
|
|
var svgGfx = new pdfjsLib.SVGGraphics(page.commonObjs, page.objs);
|
2014-08-15 05:11:27 +09:00
|
|
|
svgGfx.embedFonts = true;
|
2014-08-15 02:56:11 +09:00
|
|
|
return svgGfx.getSVG(opList, viewport).then(function (svg) {
|
2017-06-21 20:12:34 +09:00
|
|
|
return writeSvgToFile(svg, getFilePathForPage(pageNum)).then(function () {
|
|
|
|
console.log('Page: ' + pageNum);
|
|
|
|
}, function(err) {
|
|
|
|
console.log('Error: ' + err);
|
2017-06-18 19:58:53 +09:00
|
|
|
});
|
2014-08-14 05:04:47 +09:00
|
|
|
});
|
|
|
|
});
|
2017-06-21 20:12:34 +09:00
|
|
|
});
|
2014-08-14 05:04:47 +09:00
|
|
|
};
|
2015-02-03 00:12:52 +09:00
|
|
|
|
2014-08-14 05:04:47 +09:00
|
|
|
for (var i = 1; i <= numPages; i++) {
|
|
|
|
lastPromise = lastPromise.then(loadPage.bind(null, i));
|
|
|
|
}
|
|
|
|
return lastPromise;
|
|
|
|
}).then(function () {
|
|
|
|
console.log('# End of Document');
|
|
|
|
}, function (err) {
|
|
|
|
console.error('Error: ' + err);
|
|
|
|
});
|