Merge pull request #5124 from jordan-thoms/improve-fingerprinting

Improve fingerprinting of documents
This commit is contained in:
Yury Delendik 2014-12-15 13:30:14 -06:00
commit ee1b1252ff

View File

@ -280,6 +280,10 @@ var Page = (function PageClosure() {
* `PDFDocument` objects on the main thread created.
*/
var PDFDocument = (function PDFDocumentClosure() {
var FINGERPRINT_FIRST_BYTES = 1024;
var EMPTY_FINGERPRINT = '\x00\x00\x00\x00\x00\x00\x00' +
'\x00\x00\x00\x00\x00\x00\x00\x00\x00';
function PDFDocument(pdfManager, arg, password) {
if (isStream(arg)) {
init.call(this, pdfManager, arg, password);
@ -493,14 +497,21 @@ var PDFDocument = (function PDFDocumentClosure() {
get fingerprint() {
var xref = this.xref, hash, fileID = '';
if (xref.trailer.has('ID')) {
if (xref.trailer.has('ID') &&
xref.trailer.get('ID')[0] !== EMPTY_FINGERPRINT) {
hash = stringToBytes(xref.trailer.get('ID')[0]);
} else {
hash = calculateMD5(this.stream.bytes.subarray(0, 100), 0, 100);
if (this.stream.ensureRange) {
this.stream.ensureRange(0,
Math.min(FINGERPRINT_FIRST_BYTES, this.stream.end));
}
hash = calculateMD5(this.stream.bytes.subarray(0,
FINGERPRINT_FIRST_BYTES), 0, FINGERPRINT_FIRST_BYTES);
}
for (var i = 0, n = hash.length; i < n; i++) {
fileID += hash[i].toString(16);
var hex = hash[i].toString(16);
fileID += hex.length === 1 ? '0' + hex : hex;
}
return shadow(this, 'fingerprint', fileID);