Merge pull request #13166 from Snuffleupagus/getDocument-URL
[api-minor] Support proper `URL`-objects, in addition to URL-strings, in `getDocument`
This commit is contained in:
		
						commit
						5be0fbe8f1
					
				| @ -111,7 +111,7 @@ function setPDFNetworkStreamFactory(pdfNetworkStreamFactory) { | |||||||
|  * Document initialization / loading parameters object. |  * Document initialization / loading parameters object. | ||||||
|  * |  * | ||||||
|  * @typedef {Object} DocumentInitParameters |  * @typedef {Object} DocumentInitParameters | ||||||
|  * @property {string} [url] - The URL of the PDF. |  * @property {string|URL} [url] - The URL of the PDF. | ||||||
|  * @property {TypedArray|Array<number>|string} [data] - Binary PDF data. Use |  * @property {TypedArray|Array<number>|string} [data] - Binary PDF data. Use | ||||||
|  *    typed arrays (Uint8Array) to improve the memory usage. If PDF data is |  *    typed arrays (Uint8Array) to improve the memory usage. If PDF data is | ||||||
|  *    BASE64-encoded, use `atob()` to convert it to a binary string first. |  *    BASE64-encoded, use `atob()` to convert it to a binary string first. | ||||||
| @ -185,16 +185,6 @@ function setPDFNetworkStreamFactory(pdfNetworkStreamFactory) { | |||||||
|  *   (see `web/debugger.js`). The default value is `false`. |  *   (see `web/debugger.js`). The default value is `false`. | ||||||
|  */ |  */ | ||||||
| 
 | 
 | ||||||
| /** |  | ||||||
|  * @typedef {Object} PDFDocumentStats |  | ||||||
|  * @property {Object<string, boolean>} streamTypes - Used stream types in the |  | ||||||
|  *   document (an item is set to true if specific stream ID was used in the |  | ||||||
|  *   document). |  | ||||||
|  * @property {Object<string, boolean>} fontTypes - Used font types in the |  | ||||||
|  *   document (an item is set to true if specific font ID was used in the |  | ||||||
|  *   document). |  | ||||||
|  */ |  | ||||||
| 
 |  | ||||||
| /** | /** | ||||||
|  * This is the main entry point for loading a PDF and interacting with it. |  * This is the main entry point for loading a PDF and interacting with it. | ||||||
|  * |  * | ||||||
| @ -202,16 +192,16 @@ function setPDFNetworkStreamFactory(pdfNetworkStreamFactory) { | |||||||
|  * XHR as fallback) is used, which means it must follow same origin rules, |  * XHR as fallback) is used, which means it must follow same origin rules, | ||||||
|  * e.g. no cross-domain requests without CORS. |  * e.g. no cross-domain requests without CORS. | ||||||
|  * |  * | ||||||
|  * @param {string|TypedArray|DocumentInitParameters|PDFDataRangeTransport} src - |  * @param {string|URL|TypedArray|PDFDataRangeTransport|DocumentInitParameters} | ||||||
|  *   Can be a URL to where a PDF file is located, a typed array (Uint8Array) |  *   src - Can be a URL where a PDF file is located, a typed array (Uint8Array) | ||||||
|  *   already populated with data or parameter object. |  *         already populated with data, or a parameter object. | ||||||
|  * @returns {PDFDocumentLoadingTask} |  * @returns {PDFDocumentLoadingTask} | ||||||
|  */ |  */ | ||||||
| function getDocument(src) { | function getDocument(src) { | ||||||
|   const task = new PDFDocumentLoadingTask(); |   const task = new PDFDocumentLoadingTask(); | ||||||
| 
 | 
 | ||||||
|   let source; |   let source; | ||||||
|   if (typeof src === "string") { |   if (typeof src === "string" || src instanceof URL) { | ||||||
|     source = { url: src }; |     source = { url: src }; | ||||||
|   } else if (isArrayBuffer(src)) { |   } else if (isArrayBuffer(src)) { | ||||||
|     source = { data: src }; |     source = { data: src }; | ||||||
| @ -221,7 +211,7 @@ function getDocument(src) { | |||||||
|     if (typeof src !== "object") { |     if (typeof src !== "object") { | ||||||
|       throw new Error( |       throw new Error( | ||||||
|         "Invalid parameter in getDocument, " + |         "Invalid parameter in getDocument, " + | ||||||
|           "need either Uint8Array, string or a parameter object" |           "need either string, URL, Uint8Array, or parameter object." | ||||||
|       ); |       ); | ||||||
|     } |     } | ||||||
|     if (!src.url && !src.data && !src.range) { |     if (!src.url && !src.data && !src.range) { | ||||||
| @ -236,49 +226,63 @@ function getDocument(src) { | |||||||
|     worker = null; |     worker = null; | ||||||
| 
 | 
 | ||||||
|   for (const key in source) { |   for (const key in source) { | ||||||
|     if (key === "url" && typeof window !== "undefined") { |     const value = source[key]; | ||||||
|       // The full path is required in the 'url' field.
 | 
 | ||||||
|       params[key] = new URL(source[key], window.location).href; |     switch (key) { | ||||||
|       continue; |       case "url": | ||||||
|     } else if (key === "range") { |         if (typeof window !== "undefined") { | ||||||
|       rangeTransport = source[key]; |           try { | ||||||
|       continue; |             // The full path is required in the 'url' field.
 | ||||||
|     } else if (key === "worker") { |             params[key] = new URL(value, window.location).href; | ||||||
|       worker = source[key]; |             continue; | ||||||
|       continue; |           } catch (ex) { | ||||||
|     } else if (key === "data") { |             warn(`Cannot create valid URL: "${ex}".`); | ||||||
|       // Converting string or array-like data to Uint8Array.
 |           } | ||||||
|       const pdfBytes = source[key]; |         } else if (typeof value === "string" || value instanceof URL) { | ||||||
|       if ( |           params[key] = value.toString(); // Support Node.js environments.
 | ||||||
|         typeof PDFJSDev !== "undefined" && |           continue; | ||||||
|         PDFJSDev.test("GENERIC") && |         } | ||||||
|         isNodeJS && |  | ||||||
|         typeof Buffer !== "undefined" && // eslint-disable-line no-undef
 |  | ||||||
|         pdfBytes instanceof Buffer // eslint-disable-line no-undef
 |  | ||||||
|       ) { |  | ||||||
|         params[key] = new Uint8Array(pdfBytes); |  | ||||||
|       } else if (pdfBytes instanceof Uint8Array) { |  | ||||||
|         // Use the data as-is when it's already a Uint8Array.
 |  | ||||||
|         params[key] = pdfBytes; |  | ||||||
|       } else if (typeof pdfBytes === "string") { |  | ||||||
|         params[key] = stringToBytes(pdfBytes); |  | ||||||
|       } else if ( |  | ||||||
|         typeof pdfBytes === "object" && |  | ||||||
|         pdfBytes !== null && |  | ||||||
|         !isNaN(pdfBytes.length) |  | ||||||
|       ) { |  | ||||||
|         params[key] = new Uint8Array(pdfBytes); |  | ||||||
|       } else if (isArrayBuffer(pdfBytes)) { |  | ||||||
|         params[key] = new Uint8Array(pdfBytes); |  | ||||||
|       } else { |  | ||||||
|         throw new Error( |         throw new Error( | ||||||
|           "Invalid PDF binary data: either typed array, " + |           "Invalid PDF url data: " + | ||||||
|             "string, or array-like object is expected in the data property." |             "either string or URL-object is expected in the url property." | ||||||
|         ); |         ); | ||||||
|       } |       case "range": | ||||||
|       continue; |         rangeTransport = value; | ||||||
|  |         continue; | ||||||
|  |       case "worker": | ||||||
|  |         worker = value; | ||||||
|  |         continue; | ||||||
|  |       case "data": | ||||||
|  |         // Converting string or array-like data to Uint8Array.
 | ||||||
|  |         if ( | ||||||
|  |           typeof PDFJSDev !== "undefined" && | ||||||
|  |           PDFJSDev.test("GENERIC") && | ||||||
|  |           isNodeJS && | ||||||
|  |           typeof Buffer !== "undefined" && // eslint-disable-line no-undef
 | ||||||
|  |           value instanceof Buffer // eslint-disable-line no-undef
 | ||||||
|  |         ) { | ||||||
|  |           params[key] = new Uint8Array(value); | ||||||
|  |         } else if (value instanceof Uint8Array) { | ||||||
|  |           break; // Use the data as-is when it's already a Uint8Array.
 | ||||||
|  |         } else if (typeof value === "string") { | ||||||
|  |           params[key] = stringToBytes(value); | ||||||
|  |         } else if ( | ||||||
|  |           typeof value === "object" && | ||||||
|  |           value !== null && | ||||||
|  |           !isNaN(value.length) | ||||||
|  |         ) { | ||||||
|  |           params[key] = new Uint8Array(value); | ||||||
|  |         } else if (isArrayBuffer(value)) { | ||||||
|  |           params[key] = new Uint8Array(value); | ||||||
|  |         } else { | ||||||
|  |           throw new Error( | ||||||
|  |             "Invalid PDF binary data: either typed array, " + | ||||||
|  |               "string, or array-like object is expected in the data property." | ||||||
|  |           ); | ||||||
|  |         } | ||||||
|  |         continue; | ||||||
|     } |     } | ||||||
|     params[key] = source[key]; |     params[key] = value; | ||||||
|   } |   } | ||||||
| 
 | 
 | ||||||
|   params.rangeChunkSize = params.rangeChunkSize || DEFAULT_RANGE_CHUNK_SIZE; |   params.rangeChunkSize = params.rangeChunkSize || DEFAULT_RANGE_CHUNK_SIZE; | ||||||
| @ -891,6 +895,16 @@ class PDFDocumentProxy { | |||||||
|     return this._transport.downloadInfoCapability.promise; |     return this._transport.downloadInfoCapability.promise; | ||||||
|   } |   } | ||||||
| 
 | 
 | ||||||
|  |   /** | ||||||
|  |    * @typedef {Object} PDFDocumentStats | ||||||
|  |    * @property {Object<string, boolean>} streamTypes - Used stream types in the | ||||||
|  |    *   document (an item is set to true if specific stream ID was used in the | ||||||
|  |    *   document). | ||||||
|  |    * @property {Object<string, boolean>} fontTypes - Used font types in the | ||||||
|  |    *   document (an item is set to true if specific font ID was used in the | ||||||
|  |    *   document). | ||||||
|  |    */ | ||||||
|  | 
 | ||||||
|   /** |   /** | ||||||
|    * @returns {Promise<PDFDocumentStats>} A promise this is resolved with |    * @returns {Promise<PDFDocumentStats>} A promise this is resolved with | ||||||
|    *   current statistics about document structures (see |    *   current statistics about document structures (see | ||||||
|  | |||||||
| @ -73,6 +73,36 @@ describe("api", function () { | |||||||
|   } |   } | ||||||
| 
 | 
 | ||||||
|   describe("getDocument", function () { |   describe("getDocument", function () { | ||||||
|  |     it("creates pdf doc from URL-string", async function () { | ||||||
|  |       const urlStr = TEST_PDFS_PATH + basicApiFileName; | ||||||
|  |       const loadingTask = getDocument(urlStr); | ||||||
|  |       const pdfDocument = await loadingTask.promise; | ||||||
|  | 
 | ||||||
|  |       expect(typeof urlStr).toEqual("string"); | ||||||
|  |       expect(pdfDocument instanceof PDFDocumentProxy).toEqual(true); | ||||||
|  |       expect(pdfDocument.numPages).toEqual(3); | ||||||
|  | 
 | ||||||
|  |       await loadingTask.destroy(); | ||||||
|  |     }); | ||||||
|  | 
 | ||||||
|  |     it("creates pdf doc from URL-object", async function () { | ||||||
|  |       if (isNodeJS) { | ||||||
|  |         pending("window.location is not supported in Node.js."); | ||||||
|  |       } | ||||||
|  |       const urlObj = new URL( | ||||||
|  |         TEST_PDFS_PATH + basicApiFileName, | ||||||
|  |         window.location | ||||||
|  |       ); | ||||||
|  |       const loadingTask = getDocument(urlObj); | ||||||
|  |       const pdfDocument = await loadingTask.promise; | ||||||
|  | 
 | ||||||
|  |       expect(urlObj instanceof URL).toEqual(true); | ||||||
|  |       expect(pdfDocument instanceof PDFDocumentProxy).toEqual(true); | ||||||
|  |       expect(pdfDocument.numPages).toEqual(3); | ||||||
|  | 
 | ||||||
|  |       await loadingTask.destroy(); | ||||||
|  |     }); | ||||||
|  | 
 | ||||||
|     it("creates pdf doc from URL", function (done) { |     it("creates pdf doc from URL", function (done) { | ||||||
|       const loadingTask = getDocument(basicApiGetDocumentParams); |       const loadingTask = getDocument(basicApiGetDocumentParams); | ||||||
| 
 | 
 | ||||||
|  | |||||||
		Loading…
	
	
			
			x
			
			
		
	
		Reference in New Issue
	
	Block a user