From cbc07f985b6819609eeb401c4f1f3e9e63409d4a Mon Sep 17 00:00:00 2001 From: Jonas Jenwald Date: Sun, 24 Feb 2019 15:22:25 +0100 Subject: [PATCH 1/2] Load built-in CMap files using the Fetch API when possible --- src/display/display_utils.js | 77 ++++++++++++++++++++++++++---------- src/pdf.js | 9 ++--- test/unit/test_utils.js | 29 +++++++------- 3 files changed, 75 insertions(+), 40 deletions(-) diff --git a/src/display/display_utils.js b/src/display/display_utils.js index 511740513..df565ebac 100644 --- a/src/display/display_utils.js +++ b/src/display/display_utils.js @@ -15,7 +15,7 @@ import { assert, CMapCompressionType, removeNullCharacters, stringToBytes, - unreachable, Util, warn + unreachable, URL, Util, warn } from '../shared/util'; const DEFAULT_LINK_REL = 'noopener noreferrer nofollow'; @@ -66,19 +66,41 @@ class DOMCMapReaderFactory { this.isCompressed = isCompressed; } - fetch({ name, }) { + async fetch({ name, }) { if (!this.baseUrl) { - return Promise.reject(new Error( + throw new Error( 'The CMap "baseUrl" parameter must be specified, ensure that ' + - 'the "cMapUrl" and "cMapPacked" API parameters are provided.')); + 'the "cMapUrl" and "cMapPacked" API parameters are provided.'); } if (!name) { - return Promise.reject(new Error('CMap name must be specified.')); + throw new Error('CMap name must be specified.'); } - return new Promise((resolve, reject) => { - let url = this.baseUrl + name + (this.isCompressed ? '.bcmap' : ''); + const url = this.baseUrl + name + (this.isCompressed ? '.bcmap' : ''); + const compressionType = (this.isCompressed ? CMapCompressionType.BINARY : + CMapCompressionType.NONE); - let request = new XMLHttpRequest(); + if ((typeof PDFJSDev !== 'undefined' && PDFJSDev.test('MOZCENTRAL')) || + (isFetchSupported() && isValidFetchUrl(url, document.baseURI))) { + return fetch(url).then(async (response) => { + if (!response.ok) { + throw new Error(response.statusText); + } + let cMapData; + if (this.isCompressed) { + cMapData = new Uint8Array(await response.arrayBuffer()); + } else { + cMapData = stringToBytes(await response.text()); + } + return { cMapData, compressionType, }; + }).catch((reason) => { + throw new Error(`Unable to load ${this.isCompressed ? 'binary ' : ''}` + + `CMap at: ${url}`); + }); + } + + // The Fetch API is not supported. + return new Promise((resolve, reject) => { + const request = new XMLHttpRequest(); request.open('GET', url, true); if (this.isCompressed) { @@ -89,27 +111,24 @@ class DOMCMapReaderFactory { return; } if (request.status === 200 || request.status === 0) { - let data; + let cMapData; if (this.isCompressed && request.response) { - data = new Uint8Array(request.response); + cMapData = new Uint8Array(request.response); } else if (!this.isCompressed && request.responseText) { - data = stringToBytes(request.responseText); + cMapData = stringToBytes(request.responseText); } - if (data) { - resolve({ - cMapData: data, - compressionType: this.isCompressed ? - CMapCompressionType.BINARY : CMapCompressionType.NONE, - }); + if (cMapData) { + resolve({ cMapData, compressionType, }); return; } } - reject(new Error('Unable to load ' + - (this.isCompressed ? 'binary ' : '') + - 'CMap at: ' + url)); + reject(new Error(request.statusText)); }; request.send(null); + }).catch((reason) => { + throw new Error(`Unable to load ${this.isCompressed ? 'binary ' : ''}` + + `CMap at: ${url}`); }); } } @@ -428,6 +447,23 @@ class DummyStatTimer { } } +function isFetchSupported() { + return (typeof fetch !== 'undefined' && + typeof Response !== 'undefined' && 'body' in Response.prototype && + // eslint-disable-next-line no-restricted-globals + typeof ReadableStream !== 'undefined'); +} + +function isValidFetchUrl(url, baseUrl) { + try { + const { protocol, } = baseUrl ? new URL(url, baseUrl) : new URL(url); + // The Fetch API only supports the http/https protocols, and not file/ftp. + return (protocol === 'http:' || protocol === 'https:'); + } catch (ex) { + return false; // `new URL()` will throw on incorrect data. + } +} + function loadScript(src) { return new Promise((resolve, reject) => { let script = document.createElement('script'); @@ -453,5 +489,6 @@ export { DOMSVGFactory, StatTimer, DummyStatTimer, + isFetchSupported, loadScript, }; diff --git a/src/pdf.js b/src/pdf.js index 3b84f475c..2250abc7f 100644 --- a/src/pdf.js +++ b/src/pdf.js @@ -12,7 +12,7 @@ * See the License for the specific language governing permissions and * limitations under the License. */ -/* eslint-disable no-unused-vars, no-restricted-globals */ +/* eslint-disable no-unused-vars */ 'use strict'; @@ -37,8 +37,7 @@ if (typeof PDFJSDev === 'undefined' || PDFJSDev.test('GENERIC')) { pdfjsDisplayAPI.setPDFNetworkStreamFactory((params) => { return new PDFNodeStream(params); }); - } else if (typeof Response !== 'undefined' && 'body' in Response.prototype && - typeof ReadableStream !== 'undefined') { + } else if (pdfjsDisplayDisplayUtils.isFetchSupported()) { let PDFFetchStream = require('./display/fetch_stream.js').PDFFetchStream; pdfjsDisplayAPI.setPDFNetworkStreamFactory((params) => { return new PDFFetchStream(params); @@ -65,8 +64,8 @@ if (typeof PDFJSDev === 'undefined' || PDFJSDev.test('GENERIC')) { return true; } }; - if (typeof Response !== 'undefined' && 'body' in Response.prototype && - typeof ReadableStream !== 'undefined' && isChromeWithFetchCredentials()) { + if (pdfjsDisplayDisplayUtils.isFetchSupported() && + isChromeWithFetchCredentials()) { PDFFetchStream = require('./display/fetch_stream.js').PDFFetchStream; } pdfjsDisplayAPI.setPDFNetworkStreamFactory((params) => { diff --git a/test/unit/test_utils.js b/test/unit/test_utils.js index 0b590b1cc..32c43f682 100644 --- a/test/unit/test_utils.js +++ b/test/unit/test_utils.js @@ -99,32 +99,31 @@ class NodeCMapReaderFactory { this.isCompressed = isCompressed; } - fetch({ name, }) { + async fetch({ name, }) { if (!this.baseUrl) { - return Promise.reject(new Error( + throw new Error( 'The CMap "baseUrl" parameter must be specified, ensure that ' + - 'the "cMapUrl" and "cMapPacked" API parameters are provided.')); + 'the "cMapUrl" and "cMapPacked" API parameters are provided.'); } if (!name) { - return Promise.reject(new Error('CMap name must be specified.')); + throw new Error('CMap name must be specified.'); } - return new Promise((resolve, reject) => { - let url = this.baseUrl + name + (this.isCompressed ? '.bcmap' : ''); + const url = this.baseUrl + name + (this.isCompressed ? '.bcmap' : ''); + const compressionType = (this.isCompressed ? CMapCompressionType.BINARY : + CMapCompressionType.NONE); - let fs = require('fs'); + return new Promise((resolve, reject) => { + const fs = require('fs'); fs.readFile(url, (error, data) => { if (error || !data) { - reject(new Error('Unable to load ' + - (this.isCompressed ? 'binary ' : '') + - 'CMap at: ' + url)); + reject(new Error(error)); return; } - resolve({ - cMapData: new Uint8Array(data), - compressionType: this.isCompressed ? - CMapCompressionType.BINARY : CMapCompressionType.NONE, - }); + resolve({ cMapData: new Uint8Array(data), compressionType, }); }); + }).catch((reason) => { + throw new Error(`Unable to load ${this.isCompressed ? 'binary ' : ''}` + + `CMap at: ${url}`); }); } } From f664e074c99b0a4a81932d13b2ab5bb3761e5da5 Mon Sep 17 00:00:00 2001 From: Jonas Jenwald Date: Tue, 26 Feb 2019 20:24:06 +0100 Subject: [PATCH 2/2] Avoid using the Fetch API, in `GENERIC` builds, for unsupported protocols (issue 10587) --- src/display/display_utils.js | 1 + src/pdf.js | 17 ++++++++++------- test/unit/display_utils_spec.js | 26 +++++++++++++++++++++++++- 3 files changed, 36 insertions(+), 8 deletions(-) diff --git a/src/display/display_utils.js b/src/display/display_utils.js index df565ebac..faaeedd9d 100644 --- a/src/display/display_utils.js +++ b/src/display/display_utils.js @@ -490,5 +490,6 @@ export { StatTimer, DummyStatTimer, isFetchSupported, + isValidFetchUrl, loadScript, }; diff --git a/src/pdf.js b/src/pdf.js index 2250abc7f..32895bae3 100644 --- a/src/pdf.js +++ b/src/pdf.js @@ -37,14 +37,17 @@ if (typeof PDFJSDev === 'undefined' || PDFJSDev.test('GENERIC')) { pdfjsDisplayAPI.setPDFNetworkStreamFactory((params) => { return new PDFNodeStream(params); }); - } else if (pdfjsDisplayDisplayUtils.isFetchSupported()) { - let PDFFetchStream = require('./display/fetch_stream.js').PDFFetchStream; - pdfjsDisplayAPI.setPDFNetworkStreamFactory((params) => { - return new PDFFetchStream(params); - }); } else { let PDFNetworkStream = require('./display/network.js').PDFNetworkStream; + let PDFFetchStream; + if (pdfjsDisplayDisplayUtils.isFetchSupported()) { + PDFFetchStream = require('./display/fetch_stream.js').PDFFetchStream; + } pdfjsDisplayAPI.setPDFNetworkStreamFactory((params) => { + if (PDFFetchStream && + pdfjsDisplayDisplayUtils.isValidFetchUrl(params.url)) { + return new PDFFetchStream(params); + } return new PDFNetworkStream(params); }); } @@ -69,8 +72,8 @@ if (typeof PDFJSDev === 'undefined' || PDFJSDev.test('GENERIC')) { PDFFetchStream = require('./display/fetch_stream.js').PDFFetchStream; } pdfjsDisplayAPI.setPDFNetworkStreamFactory((params) => { - if (PDFFetchStream && /^https?:/i.test(params.url)) { - // "fetch" is only supported for http(s), not file/ftp. + if (PDFFetchStream && + pdfjsDisplayDisplayUtils.isValidFetchUrl(params.url)) { return new PDFFetchStream(params); } return new PDFNetworkStream(params); diff --git a/test/unit/display_utils_spec.js b/test/unit/display_utils_spec.js index 474cefe8e..67f339fa7 100644 --- a/test/unit/display_utils_spec.js +++ b/test/unit/display_utils_spec.js @@ -14,7 +14,7 @@ */ import { - DOMSVGFactory, getFilenameFromUrl + DOMSVGFactory, getFilenameFromUrl, isValidFetchUrl } from '../../src/display/display_utils'; import isNodeJS from '../../src/shared/is_node'; @@ -94,4 +94,28 @@ describe('display_utils', function() { expect(result).toEqual(expected); }); }); + + describe('isValidFetchUrl', function() { + it('handles invalid Fetch URLs', function() { + expect(isValidFetchUrl(null)).toEqual(false); + expect(isValidFetchUrl(100)).toEqual(false); + expect(isValidFetchUrl('foo')).toEqual(false); + expect(isValidFetchUrl('/foo', 100)).toEqual(false); + }); + + it('handles relative Fetch URLs', function() { + expect(isValidFetchUrl('/foo', 'file://www.example.com')).toEqual(false); + expect(isValidFetchUrl('/foo', 'http://www.example.com')).toEqual(true); + }); + + it('handles unsupported Fetch protocols', function() { + expect(isValidFetchUrl('file://www.example.com')).toEqual(false); + expect(isValidFetchUrl('ftp://www.example.com')).toEqual(false); + }); + + it('handles supported Fetch protocols', function() { + expect(isValidFetchUrl('http://www.example.com')).toEqual(true); + expect(isValidFetchUrl('https://www.example.com')).toEqual(true); + }); + }); });