Improve text-selection for Type3 fonts with bogus /FontBBox-entries (issue 14999)
This extends PR 13461, by also building a fallback bounding box for Type3 fonts that contain a much too small /FontBBox-entry. *Please note:* While this patch improves things overall, copy-and-pasting still doesn't work perfectly for this document. In particular the lowercase letter "c" cannot be selected/copied, however this can be reproduced in both Adobe Reader and PDFium (in Google Chrome) too, which is caused by a lack of proper /ToUnicode-data in the PDF document.
This commit is contained in:
parent
a1ac1a61b7
commit
79cfc548fc
@ -4404,8 +4404,10 @@ class TranslatedFont {
|
||||
const fontResources = this.dict.get("Resources") || resources;
|
||||
const charProcOperatorList = Object.create(null);
|
||||
|
||||
const isEmptyBBox =
|
||||
!translatedFont.bbox || isArrayEqual(translatedFont.bbox, [0, 0, 0, 0]);
|
||||
const fontBBox = Util.normalizeRect(translatedFont.bbox || [0, 0, 0, 0]),
|
||||
width = fontBBox[2] - fontBBox[0],
|
||||
height = fontBBox[3] - fontBBox[1];
|
||||
const fontBBoxSize = Math.hypot(width, height);
|
||||
|
||||
for (const key of charProcs.getKeys()) {
|
||||
loadCharProcsPromise = loadCharProcsPromise.then(() => {
|
||||
@ -4426,7 +4428,7 @@ class TranslatedFont {
|
||||
// colour-related parameters) in the graphics state;
|
||||
// any use of such operators shall be ignored."
|
||||
if (operatorList.fnArray[0] === OPS.setCharWidthAndBounds) {
|
||||
this._removeType3ColorOperators(operatorList, isEmptyBBox);
|
||||
this._removeType3ColorOperators(operatorList, fontBBoxSize);
|
||||
}
|
||||
charProcOperatorList[key] = operatorList.getIR();
|
||||
|
||||
@ -4454,7 +4456,7 @@ class TranslatedFont {
|
||||
/**
|
||||
* @private
|
||||
*/
|
||||
_removeType3ColorOperators(operatorList, isEmptyBBox = false) {
|
||||
_removeType3ColorOperators(operatorList, fontBBoxSize = NaN) {
|
||||
if (
|
||||
typeof PDFJSDev === "undefined" ||
|
||||
PDFJSDev.test("!PRODUCTION || TESTING")
|
||||
@ -4467,12 +4469,19 @@ class TranslatedFont {
|
||||
const charBBox = Util.normalizeRect(operatorList.argsArray[0].slice(2)),
|
||||
width = charBBox[2] - charBBox[0],
|
||||
height = charBBox[3] - charBBox[1];
|
||||
const charBBoxSize = Math.hypot(width, height);
|
||||
|
||||
if (width === 0 || height === 0) {
|
||||
// Skip the d1 operator when its bounds are bogus (fixes issue14953.pdf).
|
||||
operatorList.fnArray.splice(0, 1);
|
||||
operatorList.argsArray.splice(0, 1);
|
||||
} else if (isEmptyBBox) {
|
||||
} else if (
|
||||
fontBBoxSize === 0 ||
|
||||
Math.round(charBBoxSize / fontBBoxSize) >= 10
|
||||
) {
|
||||
// Override the fontBBox when it's undefined/empty, or when it's at least
|
||||
// (approximately) one order of magnitude smaller than the charBBox
|
||||
// (fixes issue14999_reduced.pdf).
|
||||
if (!this._bbox) {
|
||||
this._bbox = [Infinity, Infinity, -Infinity, -Infinity];
|
||||
}
|
||||
|
1
test/pdfs/.gitignore
vendored
1
test/pdfs/.gitignore
vendored
@ -121,6 +121,7 @@
|
||||
!issue13916.pdf
|
||||
!issue14023.pdf
|
||||
!issue14438.pdf
|
||||
!issue14999_reduced.pdf
|
||||
!bad-PageLabels.pdf
|
||||
!decodeACSuccessive.pdf
|
||||
!issue13003.pdf
|
||||
|
BIN
test/pdfs/issue14999_reduced.pdf
Normal file
BIN
test/pdfs/issue14999_reduced.pdf
Normal file
Binary file not shown.
@ -2848,6 +2848,12 @@
|
||||
"link": false,
|
||||
"type": "text"
|
||||
},
|
||||
{ "id": "issue14999",
|
||||
"file": "pdfs/issue14999_reduced.pdf",
|
||||
"md5": "a4e664e734f6869aa66245e72d448874",
|
||||
"rounds": 1,
|
||||
"type": "text"
|
||||
},
|
||||
{ "id": "issue6901-eq",
|
||||
"file": "pdfs/issue6901.pdf",
|
||||
"md5": "1a0604b1a7a3aaf2162b425a9a84230b",
|
||||
|
Loading…
Reference in New Issue
Block a user