pdf.js/external/cmapscompress/parse.mjs

106 lines
3.2 KiB
JavaScript

/* Copyright 2014 Mozilla Foundation
*
* Licensed under the Apache License, Version 2.0 (the "License");
* you may not use this file except in compliance with the License.
* You may obtain a copy of the License at
*
* http://www.apache.org/licenses/LICENSE-2.0
*
* Unless required by applicable law or agreed to in writing, software
* distributed under the License is distributed on an "AS IS" BASIS,
* WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
* See the License for the specific language governing permissions and
* limitations under the License.
*/
// Describes how each CMap section is parsed, keyed by its "begin…" keyword:
//  - `type`    numeric tag stored on the resulting body entry,
//  - `pattern` regular expression a single entry line has to match,
//  - `toItem`  converts the match into the item object; decimal operands are
//              turned into numbers, hex operands are kept as strings.
const CMAP_SECTIONS = {
  begincodespacerange: {
    type: 0,
    pattern: /<(\w+)>\s+<(\w+)>/,
    toItem: ([, start, end]) => ({ start, end }),
  },
  beginnotdefrange: {
    type: 1,
    pattern: /<(\w+)>\s+<(\w+)>\s+(\d+)/,
    toItem: ([, start, end, code]) => ({ start, end, code: +code }),
  },
  begincidchar: {
    type: 2,
    pattern: /<(\w+)>\s+(\d+)/,
    toItem: ([, char, code]) => ({ char, code: +code }),
  },
  begincidrange: {
    type: 3,
    pattern: /<(\w+)>\s+<(\w+)>\s+(\d+)/,
    toItem: ([, start, end, code]) => ({ start, end, code: +code }),
  },
  beginbfchar: {
    type: 4,
    pattern: /<(\w+)>\s+<(\w+)>/,
    toItem: ([, char, code]) => ({ char, code }),
  },
  beginbfrange: {
    type: 5,
    pattern: /<(\w+)>\s+<(\w+)>\s+<(\w+)>/,
    toItem: ([, start, end, code]) => ({ start, end, code }),
  },
};

/**
 * Parses the text of an Adobe CMap resource into a plain object.
 *
 * Only the part between `begincmap` and `endcmap` is inspected. Line endings
 * are normalized to "\n" before any further matching.
 *
 * @param {string} content - Full text of the CMap file.
 * @returns {{type: number, wmode: number, comment: string,
 *            usecmap: (string|null), body: Array<{type: number, items: Array<Object>}>}}
 *   `type` and `wmode` come from the `/CMapType` and `/WMode` definitions and
 *   fall back to 1 and 0 when the definition is absent; `usecmap` is the name
 *   preceding a `usecmap` operator or null; `body` holds one entry per
 *   section, in file order, with hex operands lower-cased.
 * @throws {Error} If no `begincmap … endcmap` span is present, or if a
 *   non-blank line inside a section does not match that section's format.
 */
function parseAdobeCMap(content) {
  const cmapMatch = /(\bbegincmap\b[\s\S]*?)\bendcmap\b/.exec(content);
  if (!cmapMatch) {
    throw new Error("cmap was not found");
  }
  const body = cmapMatch[1].replaceAll(/\r\n?/g, "\n");
  const result = {
    type: 1,
    wmode: 0,
    comment:
      "Copyright 1990-2009 Adobe Systems Incorporated.\nAll rights reserved.\nSee ./LICENSE",
    usecmap: null,
    body: [],
  };

  // Both definitions are optional here: when one is missing the default
  // already stored in `result` is kept instead of dereferencing a null match.
  const typeMatch = /\/CMapType\s+(\d+)\s+def\b/.exec(body);
  if (typeMatch) {
    result.type = +typeMatch[1];
  }
  const wmodeMatch = /\/WMode\s+(\d+)\s+def\b/.exec(body);
  if (wmodeMatch) {
    result.wmode = +wmodeMatch[1];
  }
  const usecmapMatch = /\/([\w-]+)\s+usecmap\b/.exec(body);
  if (usecmapMatch) {
    result.usecmap = usecmapMatch[1];
  }

  // A fresh /g regex per call, so `lastIndex` state never leaks between calls.
  const sectionRe =
    /(\d+)\s+(begincodespacerange|beginnotdefrange|begincidchar|begincidrange|beginbfchar|beginbfrange)\n([\s\S]*?)\n(endcodespacerange|endnotdefrange|endcidchar|endcidrange|endbfchar|endbfrange)/g;
  let section;
  while ((section = sectionRe.exec(body))) {
    const keyword = section[2];
    const { type, pattern, toItem } = CMAP_SECTIONS[keyword];
    const items = [];
    for (const line of section[3].toLowerCase().split("\n")) {
      if (line.trim() === "") {
        // Blank lines carry no entry; skip them rather than failing.
        continue;
      }
      const entry = pattern.exec(line);
      if (!entry) {
        throw new Error(
          `Malformed ${keyword} entry: ${JSON.stringify(line)}`
        );
      }
      items.push(toItem(entry));
    }
    result.body.push({ type, items });
  }
  return result;
}
export { parseAdobeCMap };