diff --git a/src/core/core_utils.js b/src/core/core_utils.js index 71c992d3f..32ffab86d 100644 --- a/src/core/core_utils.js +++ b/src/core/core_utils.js @@ -165,6 +165,26 @@ function isWhiteSpace(ch) { return ch === 0x20 || ch === 0x09 || ch === 0x0d || ch === 0x0a; } +/** + * AcroForm field names use an array like notation to refer to + * repeated XFA elements e.g. foo.bar[nnn]. + * see: XFA Spec Chapter 3 - Repeated Elements + * + * @param {string} path - XFA path name. + * @returns {Array} - Array of Objects with the name and pos of + * each part of the path. + */ +function parseXFAPath(path) { + const positionPattern = /(.+)\[([0-9]+)\]$/; + return path.split(".").map(component => { + const m = component.match(positionPattern); + if (m) { + return { name: m[1], pos: parseInt(m[2], 10) }; + } + return { name: component, pos: 0 }; + }); +} + export { getLookupTableFactory, MissingDataException, @@ -173,6 +193,7 @@ export { getInheritableProperty, toRomanNumerals, log2, + parseXFAPath, readInt8, readUint16, readUint32, diff --git a/src/core/worker.js b/src/core/worker.js index 9d9f18b82..4fdd44e92 100644 --- a/src/core/worker.js +++ b/src/core/worker.js @@ -589,13 +589,13 @@ class WorkerMessageHandler { } xref.resetNewRef(); - return incrementalUpdate( - stream.bytes, - newXrefInfo, + return incrementalUpdate({ + originalData: stream.bytes, + xrefInfo: newXrefInfo, newRefs, xref, - xfaDatasets - ); + datasetsRef: xfaDatasets, + }); }); }); diff --git a/src/core/writer.js b/src/core/writer.js index 19442f5ea..43294bfdb 100644 --- a/src/core/writer.js +++ b/src/core/writer.js @@ -14,15 +14,11 @@ */ /* eslint no-var: error */ -import { - bytesToString, - escapeString, - parseXFAPath, - warn, -} from "../shared/util.js"; +import { bytesToString, escapeString, warn } from "../shared/util.js"; import { Dict, isDict, isName, isRef, isStream, Name } from "./primitives.js"; import { SimpleDOMNode, SimpleXMLParser } from "../shared/xml_parser.js"; import { calculateMD5 } from "./crypto.js"; +import { parseXFAPath } from "./core_utils.js"; function writeDict(dict, buffer, transform) { buffer.push("<<"); @@ -175,7 +171,13 @@ function updateXFA(datasetsRef, newRefs, xref) { newRefs.push({ ref: datasetsRef, data }); } -function incrementalUpdate(originalData, xrefInfo, newRefs, xref, datasetsRef) { +function incrementalUpdate({ + originalData, + xrefInfo, + newRefs, + xref = null, + datasetsRef = null, +}) { updateXFA(datasetsRef, newRefs, xref); const newXref = new Dict(null); diff --git a/src/shared/util.js b/src/shared/util.js index cd3a9486b..2996cac4f 100644 --- a/src/shared/util.js +++ b/src/shared/util.js @@ -910,26 +910,6 @@ const createObjectURL = (function createObjectURLClosure() { }; })(); -/** - * AcroForm field names use an array like notation to refer to - * repeated XFA elements e.g. foo.bar[nnn]. - * see: XFA Spec Chapter 3 - Repeated Elements - * - * @param {string} path - XFA path name. - * @returns {Array} - Array of Objects with the name and pos of - * each part of the path. - */ -function parseXFAPath(path) { - const positionPattern = /(.+)\[([0-9]+)\]$/; - return path.split(".").map(component => { - const m = component.match(positionPattern); - if (m) { - return { name: m[1], pos: parseInt(m[2], 10) }; - } - return { name: component, pos: 0 }; - }); -} - const XMLEntities = { /* < */ 0x3c: "<", /* > */ 0x3e: ">", @@ -1027,7 +1007,6 @@ export { createValidAbsoluteUrl, IsLittleEndianCached, IsEvalSupportedCached, - parseXFAPath, removeNullCharacters, setVerbosityLevel, shadow, diff --git a/src/shared/xml_parser.js b/src/shared/xml_parser.js index 6cc1af14b..a24162cc8 100644 --- a/src/shared/xml_parser.js +++ b/src/shared/xml_parser.js @@ -329,6 +329,18 @@ class SimpleDOMNode { return this.childNodes && this.childNodes.length > 0; } + /** + * Search a node in the tree with the given path + * foo.bar[nnn], i.e. find the nnn-th node named + * bar under a node named foo. + * + * @param {Array} paths - an array of objects as + * returned by {parseXFAPath}. + * @param {number} pos - the current position in + * the paths array. + * @returns {SimpleDOMNode} The node corresponding + * to the path or null if not found. + */ searchNode(paths, pos) { if (pos >= paths.length) { return this; diff --git a/test/unit/core_utils_spec.js b/test/unit/core_utils_spec.js index 315ab28aa..392440848 100644 --- a/test/unit/core_utils_spec.js +++ b/test/unit/core_utils_spec.js @@ -18,6 +18,7 @@ import { getInheritableProperty, isWhiteSpace, log2, + parseXFAPath, toRomanNumerals, } from "../../src/core/core_utils.js"; import { XRefMock } from "./test_utils.js"; @@ -211,4 +212,18 @@ describe("core_utils", function () { expect(isWhiteSpace(undefined)).toEqual(false); }); }); + + describe("parseXFAPath", function () { + it("should get a correctly parsed path", function () { + const path = "foo.bar[12].oof[3].rab.FOO[123].BAR[456]"; + expect(parseXFAPath(path)).toEqual([ + { name: "foo", pos: 0 }, + { name: "bar", pos: 12 }, + { name: "oof", pos: 3 }, + { name: "rab", pos: 0 }, + { name: "FOO", pos: 123 }, + { name: "BAR", pos: 456 }, + ]); + }); + }); }); diff --git a/test/unit/util_spec.js b/test/unit/util_spec.js index 845447ff1..b6062b247 100644 --- a/test/unit/util_spec.js +++ b/test/unit/util_spec.js @@ -25,7 +25,6 @@ import { isNum, isSameOrigin, isString, - parseXFAPath, removeNullCharacters, string32, stringToBytes, @@ -334,20 +333,6 @@ describe("util", function () { }); }); - describe("parseXFAPath", function () { - it("should get a correctly parsed path", function () { - const path = "foo.bar[12].oof[3].rab.FOO[123].BAR[456]"; - expect(parseXFAPath(path)).toEqual([ - { name: "foo", pos: 0 }, - { name: "bar", pos: 12 }, - { name: "oof", pos: 3 }, - { name: "rab", pos: 0 }, - { name: "FOO", pos: 123 }, - { name: "BAR", pos: 456 }, - ]); - }); - }); - describe("encodeToXmlString", function () { it("should get a correctly encoded string with some entities", function () { const str = "\"\u0397ell😂' & "; diff --git a/test/unit/writer_spec.js b/test/unit/writer_spec.js index 2f7196b96..21c917d6e 100644 --- a/test/unit/writer_spec.js +++ b/test/unit/writer_spec.js @@ -37,7 +37,7 @@ describe("Writer", function () { info: {}, }; - let data = incrementalUpdate(originalData, xrefInfo, newRefs, null, null); + let data = incrementalUpdate({ originalData, xrefInfo, newRefs }); data = bytesToString(data); const expected = diff --git a/test/unit/xml_spec.js b/test/unit/xml_spec.js index 9d04e3aa8..a17f5e5ca 100644 --- a/test/unit/xml_spec.js +++ b/test/unit/xml_spec.js @@ -13,7 +13,7 @@ * limitations under the License. */ -import { parseXFAPath } from "../../src/shared/util.js"; +import { parseXFAPath } from "../../src/core/core_utils.js"; import { SimpleXMLParser } from "../../src/shared/xml_parser.js"; describe("XML", function () { @@ -69,7 +69,7 @@ describe("XML", function () { }); it("should dump a xml tree", function () { - let xml = ` + const xml = ` @@ -87,9 +87,7 @@ describe("XML", function () { - - W😂rld - + W😂rld @@ -98,13 +96,14 @@ describe("XML", function () { `; - xml = xml.replace(/\s+/g, ""); const root = new SimpleXMLParser(true).parseFromString(xml) .documentElement; const buffer = []; root.dump(buffer); - expect(buffer.join("").replace(/\s+/g, "")).toEqual(xml); + expect(buffer.join("").replace(/\s+/g, "")).toEqual( + xml.replace(/\s+/g, "") + ); }); }); });