From 1cc83c4fdc614c41cf314296cf0160693c9b60da Mon Sep 17 00:00:00 2001 From: Jonas Jenwald Date: Mon, 22 Jan 2024 12:14:30 +0100 Subject: [PATCH 1/5] Use `await` consistently in the `PartialEvaluator.buildFormXObject` method --- src/core/evaluator.js | 21 ++++++++++----------- 1 file changed, 10 insertions(+), 11 deletions(-) diff --git a/src/core/evaluator.js b/src/core/evaluator.js index b98a4079a..5bccea9ae 100644 --- a/src/core/evaluator.js +++ b/src/core/evaluator.js @@ -526,23 +526,22 @@ class PartialEvaluator { const args = group ? [matrix, null] : [matrix, bbox]; operatorList.addOp(OPS.paintFormXObjectBegin, args); - return this.getOperatorList({ + await this.getOperatorList({ stream: xobj, task, resources: dict.get("Resources") || resources, operatorList, initialState, - }).then(function () { - operatorList.addOp(OPS.paintFormXObjectEnd, []); - - if (group) { - operatorList.addOp(OPS.endGroup, [groupOptions]); - } - - if (optionalContent !== undefined) { - operatorList.addOp(OPS.endMarkedContent, []); - } }); + operatorList.addOp(OPS.paintFormXObjectEnd, []); + + if (group) { + operatorList.addOp(OPS.endGroup, [groupOptions]); + } + + if (optionalContent !== undefined) { + operatorList.addOp(OPS.endMarkedContent, []); + } } _sendImgData(objId, imgData, cacheGlobally = false) { From cf0797dfbd7fe1f7dcd9f1d4e60848a3a2a5de19 Mon Sep 17 00:00:00 2001 From: Jonas Jenwald Date: Mon, 22 Jan 2024 12:17:20 +0100 Subject: [PATCH 2/5] Use `await` consistently in the `PartialEvaluator.setGState` method --- src/core/evaluator.js | 16 ++++++++-------- 1 file changed, 8 insertions(+), 8 deletions(-) diff --git a/src/core/evaluator.js b/src/core/evaluator.js index 5bccea9ae..1958a3520 100644 --- a/src/core/evaluator.js +++ b/src/core/evaluator.js @@ -1188,15 +1188,15 @@ class PartialEvaluator { break; } } - return promise.then(function () { - if (gStateObj.length > 0) { - operatorList.addOp(OPS.setGState, [gStateObj]); - } + await promise; - if (isSimpleGState) { - localGStateCache.set(cacheKey, gStateRef, gStateObj); - } - }); + if (gStateObj.length > 0) { + operatorList.addOp(OPS.setGState, [gStateObj]); + } + + if (isSimpleGState) { + localGStateCache.set(cacheKey, gStateRef, gStateObj); + } } loadFont( From f5c01188dc8fbb586664bf68ef492c26813d5253 Mon Sep 17 00:00:00 2001 From: Jonas Jenwald Date: Mon, 22 Jan 2024 12:22:48 +0100 Subject: [PATCH 3/5] Convert the `PartialEvaluator.extractDataStructures` method to be async --- src/core/evaluator.js | 30 ++++++++++++++---------------- 1 file changed, 14 insertions(+), 16 deletions(-) diff --git a/src/core/evaluator.js b/src/core/evaluator.js index 1958a3520..4c0b29543 100644 --- a/src/core/evaluator.js +++ b/src/core/evaluator.js @@ -3428,7 +3428,7 @@ class PartialEvaluator { }); } - extractDataStructures(dict, baseDict, properties) { + async extractDataStructures(dict, baseDict, properties) { const xref = this.xref; let cidToGidBytes; // 9.10.2 @@ -3554,21 +3554,19 @@ class PartialEvaluator { properties.baseEncodingName = baseEncodingName; properties.hasEncoding = !!baseEncodingName || differences.length > 0; properties.dict = dict; - return toUnicodePromise - .then(readToUnicode => { - properties.toUnicode = readToUnicode; - return this.buildToUnicode(properties); - }) - .then(builtToUnicode => { - properties.toUnicode = builtToUnicode; - if (cidToGidBytes) { - properties.cidToGidMap = this.readCidToGidMap( - cidToGidBytes, - builtToUnicode - ); - } - return properties; - }); + + properties.toUnicode = await toUnicodePromise; + + const builtToUnicode = await this.buildToUnicode(properties); + properties.toUnicode = builtToUnicode; + + if (cidToGidBytes) { + properties.cidToGidMap = this.readCidToGidMap( + cidToGidBytes, + builtToUnicode + ); + } + return properties; } /** From f21a30dfb4c7812e4b31acbb15206f24611ae58b Mon Sep 17 00:00:00 2001 From: Jonas Jenwald Date: Mon, 22 Jan 2024 12:44:32 +0100 Subject: [PATCH 4/5] Convert the `PartialEvaluator.readToUnicode` method to be async --- src/core/evaluator.js | 100 +++++++++++++++++++++--------------------- 1 file changed, 50 insertions(+), 50 deletions(-) diff --git a/src/core/evaluator.js b/src/core/evaluator.js index 4c0b29543..68ab49bb0 100644 --- a/src/core/evaluator.js +++ b/src/core/evaluator.js @@ -3765,70 +3765,70 @@ class PartialEvaluator { return new IdentityToUnicodeMap(properties.firstChar, properties.lastChar); } - readToUnicode(cmapObj) { + async readToUnicode(cmapObj) { if (!cmapObj) { - return Promise.resolve(null); + return null; } if (cmapObj instanceof Name) { - return CMapFactory.create({ + const cmap = await CMapFactory.create({ encoding: cmapObj, fetchBuiltInCMap: this._fetchBuiltInCMapBound, useCMap: null, - }).then(function (cmap) { + }); + + if (cmap instanceof IdentityCMap) { + return new IdentityToUnicodeMap(0, 0xffff); + } + return new ToUnicodeMap(cmap.getMap()); + } + if (cmapObj instanceof BaseStream) { + try { + const cmap = await CMapFactory.create({ + encoding: cmapObj, + fetchBuiltInCMap: this._fetchBuiltInCMapBound, + useCMap: null, + }); + if (cmap instanceof IdentityCMap) { return new IdentityToUnicodeMap(0, 0xffff); } - return new ToUnicodeMap(cmap.getMap()); - }); - } else if (cmapObj instanceof BaseStream) { - return CMapFactory.create({ - encoding: cmapObj, - fetchBuiltInCMap: this._fetchBuiltInCMapBound, - useCMap: null, - }).then( - function (cmap) { - if (cmap instanceof IdentityCMap) { - return new IdentityToUnicodeMap(0, 0xffff); + const map = new Array(cmap.length); + // Convert UTF-16BE + // NOTE: cmap can be a sparse array, so use forEach instead of + // `for(;;)` to iterate over all keys. + cmap.forEach(function (charCode, token) { + // Some cmaps contain *only* CID characters (fixes issue9367.pdf). + if (typeof token === "number") { + map[charCode] = String.fromCodePoint(token); + return; } - const map = new Array(cmap.length); - // Convert UTF-16BE - // NOTE: cmap can be a sparse array, so use forEach instead of - // `for(;;)` to iterate over all keys. - cmap.forEach(function (charCode, token) { - // Some cmaps contain *only* CID characters (fixes issue9367.pdf). - if (typeof token === "number") { - map[charCode] = String.fromCodePoint(token); - return; + const str = []; + for (let k = 0; k < token.length; k += 2) { + const w1 = (token.charCodeAt(k) << 8) | token.charCodeAt(k + 1); + if ((w1 & 0xf800) !== 0xd800) { + // w1 < 0xD800 || w1 > 0xDFFF + str.push(w1); + continue; } - const str = []; - for (let k = 0; k < token.length; k += 2) { - const w1 = (token.charCodeAt(k) << 8) | token.charCodeAt(k + 1); - if ((w1 & 0xf800) !== 0xd800) { - // w1 < 0xD800 || w1 > 0xDFFF - str.push(w1); - continue; - } - k += 2; - const w2 = (token.charCodeAt(k) << 8) | token.charCodeAt(k + 1); - str.push(((w1 & 0x3ff) << 10) + (w2 & 0x3ff) + 0x10000); - } - map[charCode] = String.fromCodePoint(...str); - }); - return new ToUnicodeMap(map); - }, - reason => { - if (reason instanceof AbortException) { - return null; + k += 2; + const w2 = (token.charCodeAt(k) << 8) | token.charCodeAt(k + 1); + str.push(((w1 & 0x3ff) << 10) + (w2 & 0x3ff) + 0x10000); } - if (this.options.ignoreErrors) { - warn(`readToUnicode - ignoring ToUnicode data: "${reason}".`); - return null; - } - throw reason; + map[charCode] = String.fromCodePoint(...str); + }); + return new ToUnicodeMap(map); + } catch (reason) { + if (reason instanceof AbortException) { + return null; } - ); + if (this.options.ignoreErrors) { + warn(`readToUnicode - ignoring ToUnicode data: "${reason}".`); + return null; + } + throw reason; + } } - return Promise.resolve(null); + return null; } readCidToGidMap(glyphsData, toUnicode) { From fa583427eff9f453fba0c836e660e70c6db706ae Mon Sep 17 00:00:00 2001 From: Jonas Jenwald Date: Mon, 22 Jan 2024 13:06:32 +0100 Subject: [PATCH 5/5] Always export the "raw" /ToUnicode-data from `PartialEvaluator.preEvaluateFont` (PR 13354 follow-up) This, ever so slightly, simplifies the implementation in the `PartialEvaluator.extractDataStructures`-method. --- src/core/evaluator.js | 18 ++++++------------ 1 file changed, 6 insertions(+), 12 deletions(-) diff --git a/src/core/evaluator.js b/src/core/evaluator.js index 68ab49bb0..4ccb5e0b7 100644 --- a/src/core/evaluator.js +++ b/src/core/evaluator.js @@ -3428,13 +3428,11 @@ class PartialEvaluator { }); } - async extractDataStructures(dict, baseDict, properties) { + async extractDataStructures(dict, properties) { const xref = this.xref; let cidToGidBytes; // 9.10.2 - const toUnicodePromise = this.readToUnicode( - properties.toUnicode || dict.get("ToUnicode") || baseDict.get("ToUnicode") - ); + const toUnicodePromise = this.readToUnicode(properties.toUnicode); if (properties.composite) { // CIDSystemInfo helps to match CID to glyphs @@ -4017,7 +4015,7 @@ class PartialEvaluator { } let composite = false; - let hash, toUnicode; + let hash; if (type.name === "Type0") { // If font is a composite // - get the descendant font @@ -4042,6 +4040,8 @@ class PartialEvaluator { const firstChar = dict.get("FirstChar") || 0, lastChar = dict.get("LastChar") || (composite ? 0xffff : 0xff); const descriptor = dict.get("FontDescriptor"); + const toUnicode = dict.get("ToUnicode") || baseDict.get("ToUnicode"); + if (descriptor) { hash = new MurmurHash3_64(); @@ -4079,7 +4079,6 @@ class PartialEvaluator { hash.update(`${firstChar}-${lastChar}`); // Fixes issue10665_reduced.pdf - toUnicode = dict.get("ToUnicode") || baseDict.get("ToUnicode"); if (toUnicode instanceof BaseStream) { const stream = toUnicode.str || toUnicode; const uint8array = stream.buffer @@ -4230,7 +4229,6 @@ class PartialEvaluator { } const newProperties = await this.extractDataStructures( - dict, dict, properties ); @@ -4394,11 +4392,7 @@ class PartialEvaluator { properties.vertical = properties.cMap.vertical; } - const newProperties = await this.extractDataStructures( - dict, - baseDict, - properties - ); + const newProperties = await this.extractDataStructures(dict, properties); this.extractWidths(dict, descriptor, newProperties); return new Font(fontName.name, fontFile, newProperties);