0d84f57cfa
The only purpose, according to the README and existing files, is to parse an integer from those lines, so (\d+) is sufficient for that. This avoids potential exponential backtracking as flagged by CodeQL. I have compared the output of the script with and without these changes and the resulting files are the same.
104 lines
3.2 KiB
JavaScript
104 lines
3.2 KiB
JavaScript
/* Copyright 2014 Mozilla Foundation
 *
 * Licensed under the Apache License, Version 2.0 (the "License");
 * you may not use this file except in compliance with the License.
 * You may obtain a copy of the License at
 *
 *     http://www.apache.org/licenses/LICENSE-2.0
 *
 * Unless required by applicable law or agreed to in writing, software
 * distributed under the License is distributed on an "AS IS" BASIS,
 * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
 * See the License for the specific language governing permissions and
 * limitations under the License.
 */
|
|
|
|
exports.parseAdobeCMap = function (content) {
|
|
let m = /(\bbegincmap\b[\s\S]*?)\bendcmap\b/.exec(content);
|
|
if (!m) {
|
|
throw new Error("cmap was not found");
|
|
}
|
|
|
|
const body = m[1].replace(/\r\n?/g, "\n");
|
|
const result = {
|
|
type: 1,
|
|
wmode: 0,
|
|
comment:
|
|
"Copyright 1990-2009 Adobe Systems Incorporated.\nAll rights reserved.\nSee ./LICENSE",
|
|
usecmap: null,
|
|
body: [],
|
|
};
|
|
m = /\/CMapType\s+(\d+)\s+def\b/.exec(body);
|
|
result.type = +m[1];
|
|
m = /\/WMode\s+(\d+)\s+def\b/.exec(body);
|
|
result.wmode = +m[1];
|
|
m = /\/([\w-]+)\s+usecmap\b/.exec(body);
|
|
if (m) {
|
|
result.usecmap = m[1];
|
|
}
|
|
const re =
|
|
/(\d+)\s+(begincodespacerange|beginnotdefrange|begincidchar|begincidrange|beginbfchar|beginbfrange)\n([\s\S]*?)\n(endcodespacerange|endnotdefrange|endcidchar|endcidrange|endbfchar|endbfrange)/g;
|
|
while ((m = re.exec(body))) {
|
|
const lines = m[3].toLowerCase().split("\n");
|
|
|
|
switch (m[2]) {
|
|
case "begincodespacerange":
|
|
result.body.push({
|
|
type: 0,
|
|
items: lines.map(function (line) {
|
|
const m2 = /<(\w+)>\s+<(\w+)>/.exec(line);
|
|
return { start: m2[1], end: m2[2] };
|
|
}),
|
|
});
|
|
break;
|
|
case "beginnotdefrange":
|
|
result.body.push({
|
|
type: 1,
|
|
items: lines.map(function (line) {
|
|
const m2 = /<(\w+)>\s+<(\w+)>\s+(\d+)/.exec(line);
|
|
return { start: m2[1], end: m2[2], code: +m2[3] };
|
|
}),
|
|
});
|
|
break;
|
|
case "begincidchar":
|
|
result.body.push({
|
|
type: 2,
|
|
items: lines.map(function (line) {
|
|
const m2 = /<(\w+)>\s+(\d+)/.exec(line);
|
|
return { char: m2[1], code: +m2[2] };
|
|
}),
|
|
});
|
|
break;
|
|
case "begincidrange":
|
|
result.body.push({
|
|
type: 3,
|
|
items: lines.map(function (line) {
|
|
const m2 = /<(\w+)>\s+<(\w+)>\s+(\d+)/.exec(line);
|
|
return { start: m2[1], end: m2[2], code: +m2[3] };
|
|
}),
|
|
});
|
|
break;
|
|
case "beginbfchar":
|
|
result.body.push({
|
|
type: 4,
|
|
items: lines.map(function (line) {
|
|
const m2 = /<(\w+)>\s+<(\w+)>/.exec(line);
|
|
return { char: m2[1], code: m2[2] };
|
|
}),
|
|
});
|
|
break;
|
|
case "beginbfrange":
|
|
result.body.push({
|
|
type: 5,
|
|
items: lines.map(function (line) {
|
|
const m2 = /<(\w+)>\s+<(\w+)>\s+<(\w+)>/.exec(line);
|
|
return { start: m2[1], end: m2[2], code: m2[3] };
|
|
}),
|
|
});
|
|
break;
|
|
}
|
|
}
|
|
|
|
return result;
|
|
};
|