pdf.js/src/metadata.js

87 lines
2.7 KiB
JavaScript
Raw Normal View History

2012-03-29 03:09:03 +09:00
/* -*- Mode: Java; tab-width: 2; indent-tabs-mode: nil; c-basic-offset: 2 -*- */
/* vim: set shiftwidth=2 tabstop=2 autoindent cindent expandtab: */
2012-03-29 03:07:37 +09:00
'use strict';
var Metadata = PDFJS.Metadata = (function MetadataClosure() {
2012-04-24 06:43:20 +09:00
function fixMetadata(meta) {
return meta.replace(/>\\376\\377([^<]+)/g, function(all, codes) {
var bytes = codes.replace(/\\([0-3])([0-7])([0-7])/g,
function(code, d1, d2, d3) {
return String.fromCharCode(d1 * 64 + d2 * 8 + d3 * 1);
});
var chars = '';
for (var i = 0; i < bytes.length; i += 2) {
var code = bytes.charCodeAt(i) * 256 + bytes.charCodeAt(i + 1);
chars += code >= 32 && code < 127 && code != 60 && code != 62 &&
code != 38 && false ? String.fromCharCode(code) :
'&#x' + (0x10000 + code).toString(16).substring(1) + ';';
}
return '>' + chars;
});
}
2012-03-25 03:59:51 +09:00
function Metadata(meta) {
if (typeof meta === 'string') {
2012-04-24 06:43:20 +09:00
// Ghostscript produces invalid metadata
meta = fixMetadata(meta);
2012-03-25 03:59:51 +09:00
var parser = new DOMParser();
meta = parser.parseFromString(meta, 'application/xml');
} else if (!(meta instanceof Document)) {
error('Metadata: Invalid metadata object');
}
this.metaDocument = meta;
this.metadata = {};
this.parse();
}
Metadata.prototype = {
parse: function Metadata_parse() {
2012-03-25 03:59:51 +09:00
var doc = this.metaDocument;
var rdf = doc.documentElement;
2012-03-29 02:15:59 +09:00
if (rdf.nodeName.toLowerCase() !== 'rdf:rdf') { // Wrapped in <xmpmeta>
2012-03-25 03:59:51 +09:00
rdf = rdf.firstChild;
2012-03-29 02:15:59 +09:00
while (rdf && rdf.nodeName.toLowerCase() !== 'rdf:rdf')
2012-03-25 03:59:51 +09:00
rdf = rdf.nextSibling;
}
2012-03-28 05:37:02 +09:00
2012-03-29 02:15:59 +09:00
var nodeName = (rdf) ? rdf.nodeName.toLowerCase() : null;
if (!rdf || nodeName !== 'rdf:rdf' || !rdf.hasChildNodes())
2012-03-25 03:59:51 +09:00
return;
var childNodes = rdf.childNodes, desc, namespace, entries, entry;
for (var i = 0, length = childNodes.length; i < length; i++) {
desc = childNodes[i];
2012-03-28 05:37:02 +09:00
if (desc.nodeName.toLowerCase() !== 'rdf:description')
2012-03-25 03:59:51 +09:00
continue;
entries = [];
for (var ii = 0, iLength = desc.childNodes.length; ii < iLength; ii++) {
2012-03-28 05:37:02 +09:00
if (desc.childNodes[ii].nodeName.toLowerCase() !== '#text')
2012-03-25 03:59:51 +09:00
entries.push(desc.childNodes[ii]);
}
for (ii = 0, iLength = entries.length; ii < iLength; ii++) {
var entry = entries[ii];
var name = entry.nodeName.toLowerCase();
this.metadata[name] = entry.textContent.trim();
2012-03-25 03:59:51 +09:00
}
}
},
get: function Metadata_get(name) {
2012-03-25 03:59:51 +09:00
return this.metadata[name] || null;
},
has: function Metadata_has(name) {
2012-03-25 03:59:51 +09:00
return typeof this.metadata[name] !== 'undefined';
}
};
return Metadata;
})();