worker.js 21 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417418419420421422423424425426427428429430431432433434435436437438439440441442443444445446447448449450451452453454455456457458459460461462463464465466467468469470471472473474475476477478479480481482483484485486487488489490491492493494495496497498499500501502503504505506507508509510511512513514515516517518519520521522523524525526527528529530531532533534535536537538539540541542543544545546547548549550551552553554555556557558559560561562563564565566567568569570571572573574575576577578579580581582583584585586587588589590591592593594595596597
  1. /* Copyright 2017 Mozilla Foundation
  2. *
  3. * Licensed under the Apache License, Version 2.0 (the "License");
  4. * you may not use this file except in compliance with the License.
  5. * You may obtain a copy of the License at
  6. *
  7. * http://www.apache.org/licenses/LICENSE-2.0
  8. *
  9. * Unless required by applicable law or agreed to in writing, software
  10. * distributed under the License is distributed on an "AS IS" BASIS,
  11. * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
  12. * See the License for the specific language governing permissions and
  13. * limitations under the License.
  14. */
  15. 'use strict';
  16. Object.defineProperty(exports, "__esModule", {
  17. value: true
  18. });
  19. exports.WorkerMessageHandler = exports.WorkerTask = undefined;
  20. var _typeof = typeof Symbol === "function" && typeof Symbol.iterator === "symbol" ? function (obj) { return typeof obj; } : function (obj) { return obj && typeof Symbol === "function" && obj.constructor === Symbol && obj !== Symbol.prototype ? "symbol" : typeof obj; };
  21. var _util = require('../shared/util');
  22. var _pdf_manager = require('./pdf_manager');
  23. var _primitives = require('./primitives');
  24. var WorkerTask = function WorkerTaskClosure() {
  25. function WorkerTask(name) {
  26. this.name = name;
  27. this.terminated = false;
  28. this._capability = (0, _util.createPromiseCapability)();
  29. }
  30. WorkerTask.prototype = {
  31. get finished() {
  32. return this._capability.promise;
  33. },
  34. finish: function finish() {
  35. this._capability.resolve();
  36. },
  37. terminate: function terminate() {
  38. this.terminated = true;
  39. },
  40. ensureNotTerminated: function ensureNotTerminated() {
  41. if (this.terminated) {
  42. throw new Error('Worker task was terminated');
  43. }
  44. }
  45. };
  46. return WorkerTask;
  47. }();
  48. ;
  49. var PDFWorkerStream = function PDFWorkerStreamClosure() {
  50. function PDFWorkerStream(msgHandler) {
  51. this._msgHandler = msgHandler;
  52. this._contentLength = null;
  53. this._fullRequestReader = null;
  54. this._rangeRequestReaders = [];
  55. }
  56. PDFWorkerStream.prototype = {
  57. getFullReader: function getFullReader() {
  58. (0, _util.assert)(!this._fullRequestReader);
  59. this._fullRequestReader = new PDFWorkerStreamReader(this._msgHandler);
  60. return this._fullRequestReader;
  61. },
  62. getRangeReader: function getRangeReader(begin, end) {
  63. var reader = new PDFWorkerStreamRangeReader(begin, end, this._msgHandler);
  64. this._rangeRequestReaders.push(reader);
  65. return reader;
  66. },
  67. cancelAllRequests: function cancelAllRequests(reason) {
  68. if (this._fullRequestReader) {
  69. this._fullRequestReader.cancel(reason);
  70. }
  71. var readers = this._rangeRequestReaders.slice(0);
  72. readers.forEach(function (reader) {
  73. reader.cancel(reason);
  74. });
  75. }
  76. };
  77. function PDFWorkerStreamReader(msgHandler) {
  78. var _this = this;
  79. this._msgHandler = msgHandler;
  80. this._contentLength = null;
  81. this._isRangeSupported = false;
  82. this._isStreamingSupported = false;
  83. var readableStream = this._msgHandler.sendWithStream('GetReader');
  84. this._reader = readableStream.getReader();
  85. this._headersReady = this._msgHandler.sendWithPromise('ReaderHeadersReady').then(function (data) {
  86. _this._isStreamingSupported = data.isStreamingSupported;
  87. _this._isRangeSupported = data.isRangeSupported;
  88. _this._contentLength = data.contentLength;
  89. });
  90. }
  91. PDFWorkerStreamReader.prototype = {
  92. get headersReady() {
  93. return this._headersReady;
  94. },
  95. get contentLength() {
  96. return this._contentLength;
  97. },
  98. get isStreamingSupported() {
  99. return this._isStreamingSupported;
  100. },
  101. get isRangeSupported() {
  102. return this._isRangeSupported;
  103. },
  104. read: function read() {
  105. return this._reader.read().then(function (_ref) {
  106. var value = _ref.value,
  107. done = _ref.done;
  108. if (done) {
  109. return {
  110. value: undefined,
  111. done: true
  112. };
  113. }
  114. return {
  115. value: value.buffer,
  116. done: false
  117. };
  118. });
  119. },
  120. cancel: function cancel(reason) {
  121. this._reader.cancel(reason);
  122. }
  123. };
  124. function PDFWorkerStreamRangeReader(begin, end, msgHandler) {
  125. this._msgHandler = msgHandler;
  126. this.onProgress = null;
  127. var readableStream = this._msgHandler.sendWithStream('GetRangeReader', {
  128. begin: begin,
  129. end: end
  130. });
  131. this._reader = readableStream.getReader();
  132. }
  133. PDFWorkerStreamRangeReader.prototype = {
  134. get isStreamingSupported() {
  135. return false;
  136. },
  137. read: function read() {
  138. return this._reader.read().then(function (_ref2) {
  139. var value = _ref2.value,
  140. done = _ref2.done;
  141. if (done) {
  142. return {
  143. value: undefined,
  144. done: true
  145. };
  146. }
  147. return {
  148. value: value.buffer,
  149. done: false
  150. };
  151. });
  152. },
  153. cancel: function cancel(reason) {
  154. this._reader.cancel(reason);
  155. }
  156. };
  157. return PDFWorkerStream;
  158. }();
  159. var WorkerMessageHandler = {
  160. setup: function setup(handler, port) {
  161. var testMessageProcessed = false;
  162. handler.on('test', function wphSetupTest(data) {
  163. if (testMessageProcessed) {
  164. return;
  165. }
  166. testMessageProcessed = true;
  167. if (!(data instanceof Uint8Array)) {
  168. handler.send('test', 'main', false);
  169. return;
  170. }
  171. var supportTransfers = data[0] === 255;
  172. handler.postMessageTransfers = supportTransfers;
  173. var xhr = new XMLHttpRequest();
  174. var responseExists = 'response' in xhr;
  175. try {
  176. xhr.responseType;
  177. } catch (e) {
  178. responseExists = false;
  179. }
  180. if (!responseExists) {
  181. handler.send('test', false);
  182. return;
  183. }
  184. handler.send('test', {
  185. supportTypedArray: true,
  186. supportTransfers: supportTransfers
  187. });
  188. });
  189. handler.on('configure', function wphConfigure(data) {
  190. (0, _util.setVerbosityLevel)(data.verbosity);
  191. });
  192. handler.on('GetDocRequest', function wphSetupDoc(data) {
  193. return WorkerMessageHandler.createDocumentHandler(data, port);
  194. });
  195. },
  196. createDocumentHandler: function createDocumentHandler(docParams, port) {
  197. var pdfManager;
  198. var terminated = false;
  199. var cancelXHRs = null;
  200. var WorkerTasks = [];
  201. var apiVersion = docParams.apiVersion;
  202. var workerVersion = '1.10.83';
  203. if (apiVersion !== null && apiVersion !== workerVersion) {
  204. throw new Error('The API version "' + apiVersion + '" does not match ' + ('the Worker version "' + workerVersion + '".'));
  205. }
  206. var docId = docParams.docId;
  207. var docBaseUrl = docParams.docBaseUrl;
  208. var workerHandlerName = docParams.docId + '_worker';
  209. var handler = new _util.MessageHandler(workerHandlerName, docId, port);
  210. handler.postMessageTransfers = docParams.postMessageTransfers;
  211. function ensureNotTerminated() {
  212. if (terminated) {
  213. throw new Error('Worker was terminated');
  214. }
  215. }
  216. function startWorkerTask(task) {
  217. WorkerTasks.push(task);
  218. }
  219. function finishWorkerTask(task) {
  220. task.finish();
  221. var i = WorkerTasks.indexOf(task);
  222. WorkerTasks.splice(i, 1);
  223. }
  224. function loadDocument(recoveryMode) {
  225. var loadDocumentCapability = (0, _util.createPromiseCapability)();
  226. var parseSuccess = function parseSuccess() {
  227. var numPagesPromise = pdfManager.ensureDoc('numPages');
  228. var fingerprintPromise = pdfManager.ensureDoc('fingerprint');
  229. var encryptedPromise = pdfManager.ensureXRef('encrypt');
  230. Promise.all([numPagesPromise, fingerprintPromise, encryptedPromise]).then(function onDocReady(results) {
  231. var doc = {
  232. numPages: results[0],
  233. fingerprint: results[1],
  234. encrypted: !!results[2]
  235. };
  236. loadDocumentCapability.resolve(doc);
  237. }, parseFailure);
  238. };
  239. var parseFailure = function parseFailure(e) {
  240. loadDocumentCapability.reject(e);
  241. };
  242. pdfManager.ensureDoc('checkHeader', []).then(function () {
  243. pdfManager.ensureDoc('parseStartXRef', []).then(function () {
  244. pdfManager.ensureDoc('parse', [recoveryMode]).then(parseSuccess, parseFailure);
  245. }, parseFailure);
  246. }, parseFailure);
  247. return loadDocumentCapability.promise;
  248. }
  249. function getPdfManager(data, evaluatorOptions) {
  250. var pdfManagerCapability = (0, _util.createPromiseCapability)();
  251. var pdfManager;
  252. var source = data.source;
  253. if (source.data) {
  254. try {
  255. pdfManager = new _pdf_manager.LocalPdfManager(docId, source.data, source.password, evaluatorOptions, docBaseUrl);
  256. pdfManagerCapability.resolve(pdfManager);
  257. } catch (ex) {
  258. pdfManagerCapability.reject(ex);
  259. }
  260. return pdfManagerCapability.promise;
  261. }
  262. var pdfStream,
  263. cachedChunks = [];
  264. try {
  265. pdfStream = new PDFWorkerStream(handler);
  266. } catch (ex) {
  267. pdfManagerCapability.reject(ex);
  268. return pdfManagerCapability.promise;
  269. }
  270. var fullRequest = pdfStream.getFullReader();
  271. fullRequest.headersReady.then(function () {
  272. if (!fullRequest.isRangeSupported) {
  273. return;
  274. }
  275. var disableAutoFetch = source.disableAutoFetch || fullRequest.isStreamingSupported;
  276. pdfManager = new _pdf_manager.NetworkPdfManager(docId, pdfStream, {
  277. msgHandler: handler,
  278. url: source.url,
  279. password: source.password,
  280. length: fullRequest.contentLength,
  281. disableAutoFetch: disableAutoFetch,
  282. rangeChunkSize: source.rangeChunkSize
  283. }, evaluatorOptions, docBaseUrl);
  284. for (var i = 0; i < cachedChunks.length; i++) {
  285. pdfManager.sendProgressiveData(cachedChunks[i]);
  286. }
  287. cachedChunks = [];
  288. pdfManagerCapability.resolve(pdfManager);
  289. cancelXHRs = null;
  290. }).catch(function (reason) {
  291. pdfManagerCapability.reject(reason);
  292. cancelXHRs = null;
  293. });
  294. var loaded = 0;
  295. var flushChunks = function flushChunks() {
  296. var pdfFile = (0, _util.arraysToBytes)(cachedChunks);
  297. if (source.length && pdfFile.length !== source.length) {
  298. (0, _util.warn)('reported HTTP length is different from actual');
  299. }
  300. try {
  301. pdfManager = new _pdf_manager.LocalPdfManager(docId, pdfFile, source.password, evaluatorOptions, docBaseUrl);
  302. pdfManagerCapability.resolve(pdfManager);
  303. } catch (ex) {
  304. pdfManagerCapability.reject(ex);
  305. }
  306. cachedChunks = [];
  307. };
  308. var readPromise = new Promise(function (resolve, reject) {
  309. var readChunk = function readChunk(chunk) {
  310. try {
  311. ensureNotTerminated();
  312. if (chunk.done) {
  313. if (!pdfManager) {
  314. flushChunks();
  315. }
  316. cancelXHRs = null;
  317. return;
  318. }
  319. var data = chunk.value;
  320. loaded += (0, _util.arrayByteLength)(data);
  321. if (!fullRequest.isStreamingSupported) {
  322. handler.send('DocProgress', {
  323. loaded: loaded,
  324. total: Math.max(loaded, fullRequest.contentLength || 0)
  325. });
  326. }
  327. if (pdfManager) {
  328. pdfManager.sendProgressiveData(data);
  329. } else {
  330. cachedChunks.push(data);
  331. }
  332. fullRequest.read().then(readChunk, reject);
  333. } catch (e) {
  334. reject(e);
  335. }
  336. };
  337. fullRequest.read().then(readChunk, reject);
  338. });
  339. readPromise.catch(function (e) {
  340. pdfManagerCapability.reject(e);
  341. cancelXHRs = null;
  342. });
  343. cancelXHRs = function cancelXHRs() {
  344. pdfStream.cancelAllRequests('abort');
  345. };
  346. return pdfManagerCapability.promise;
  347. }
  348. function setupDoc(data) {
  349. function onSuccess(doc) {
  350. ensureNotTerminated();
  351. handler.send('GetDoc', { pdfInfo: doc });
  352. }
  353. function onFailure(e) {
  354. ensureNotTerminated();
  355. if (e instanceof _util.PasswordException) {
  356. var task = new WorkerTask('PasswordException: response ' + e.code);
  357. startWorkerTask(task);
  358. handler.sendWithPromise('PasswordRequest', e).then(function (data) {
  359. finishWorkerTask(task);
  360. pdfManager.updatePassword(data.password);
  361. pdfManagerReady();
  362. }).catch(function (ex) {
  363. finishWorkerTask(task);
  364. handler.send('PasswordException', ex);
  365. }.bind(null, e));
  366. } else if (e instanceof _util.InvalidPDFException) {
  367. handler.send('InvalidPDF', e);
  368. } else if (e instanceof _util.MissingPDFException) {
  369. handler.send('MissingPDF', e);
  370. } else if (e instanceof _util.UnexpectedResponseException) {
  371. handler.send('UnexpectedResponse', e);
  372. } else {
  373. handler.send('UnknownError', new _util.UnknownErrorException(e.message, e.toString()));
  374. }
  375. }
  376. function pdfManagerReady() {
  377. ensureNotTerminated();
  378. loadDocument(false).then(onSuccess, function loadFailure(ex) {
  379. ensureNotTerminated();
  380. if (!(ex instanceof _util.XRefParseException)) {
  381. onFailure(ex);
  382. return;
  383. }
  384. pdfManager.requestLoadedStream();
  385. pdfManager.onLoadedStream().then(function () {
  386. ensureNotTerminated();
  387. loadDocument(true).then(onSuccess, onFailure);
  388. });
  389. }, onFailure);
  390. }
  391. ensureNotTerminated();
  392. var evaluatorOptions = {
  393. forceDataSchema: data.disableCreateObjectURL,
  394. maxImageSize: data.maxImageSize === undefined ? -1 : data.maxImageSize,
  395. disableFontFace: data.disableFontFace,
  396. nativeImageDecoderSupport: data.nativeImageDecoderSupport,
  397. ignoreErrors: data.ignoreErrors,
  398. isEvalSupported: data.isEvalSupported
  399. };
  400. getPdfManager(data, evaluatorOptions).then(function (newPdfManager) {
  401. if (terminated) {
  402. newPdfManager.terminate();
  403. throw new Error('Worker was terminated');
  404. }
  405. pdfManager = newPdfManager;
  406. handler.send('PDFManagerReady', null);
  407. pdfManager.onLoadedStream().then(function (stream) {
  408. handler.send('DataLoaded', { length: stream.bytes.byteLength });
  409. });
  410. }).then(pdfManagerReady, onFailure);
  411. }
  412. handler.on('GetPage', function wphSetupGetPage(data) {
  413. return pdfManager.getPage(data.pageIndex).then(function (page) {
  414. var rotatePromise = pdfManager.ensure(page, 'rotate');
  415. var refPromise = pdfManager.ensure(page, 'ref');
  416. var userUnitPromise = pdfManager.ensure(page, 'userUnit');
  417. var viewPromise = pdfManager.ensure(page, 'view');
  418. return Promise.all([rotatePromise, refPromise, userUnitPromise, viewPromise]).then(function (results) {
  419. return {
  420. rotate: results[0],
  421. ref: results[1],
  422. userUnit: results[2],
  423. view: results[3]
  424. };
  425. });
  426. });
  427. });
  428. handler.on('GetPageIndex', function wphSetupGetPageIndex(data) {
  429. var ref = new _primitives.Ref(data.ref.num, data.ref.gen);
  430. var catalog = pdfManager.pdfDocument.catalog;
  431. return catalog.getPageIndex(ref);
  432. });
  433. handler.on('GetDestinations', function wphSetupGetDestinations(data) {
  434. return pdfManager.ensureCatalog('destinations');
  435. });
  436. handler.on('GetDestination', function wphSetupGetDestination(data) {
  437. return pdfManager.ensureCatalog('getDestination', [data.id]);
  438. });
  439. handler.on('GetPageLabels', function wphSetupGetPageLabels(data) {
  440. return pdfManager.ensureCatalog('pageLabels');
  441. });
  442. handler.on('GetPageMode', function wphSetupGetPageMode(data) {
  443. return pdfManager.ensureCatalog('pageMode');
  444. });
  445. handler.on('GetAttachments', function wphSetupGetAttachments(data) {
  446. return pdfManager.ensureCatalog('attachments');
  447. });
  448. handler.on('GetJavaScript', function wphSetupGetJavaScript(data) {
  449. return pdfManager.ensureCatalog('javaScript');
  450. });
  451. handler.on('GetOutline', function wphSetupGetOutline(data) {
  452. return pdfManager.ensureCatalog('documentOutline');
  453. });
  454. handler.on('GetMetadata', function wphSetupGetMetadata(data) {
  455. return Promise.all([pdfManager.ensureDoc('documentInfo'), pdfManager.ensureCatalog('metadata')]);
  456. });
  457. handler.on('GetData', function wphSetupGetData(data) {
  458. pdfManager.requestLoadedStream();
  459. return pdfManager.onLoadedStream().then(function (stream) {
  460. return stream.bytes;
  461. });
  462. });
  463. handler.on('GetStats', function wphSetupGetStats(data) {
  464. return pdfManager.pdfDocument.xref.stats;
  465. });
  466. handler.on('GetAnnotations', function wphSetupGetAnnotations(data) {
  467. return pdfManager.getPage(data.pageIndex).then(function (page) {
  468. return pdfManager.ensure(page, 'getAnnotationsData', [data.intent]);
  469. });
  470. });
  471. handler.on('RenderPageRequest', function wphSetupRenderPage(data) {
  472. var pageIndex = data.pageIndex;
  473. pdfManager.getPage(pageIndex).then(function (page) {
  474. var task = new WorkerTask('RenderPageRequest: page ' + pageIndex);
  475. startWorkerTask(task);
  476. var pageNum = pageIndex + 1;
  477. var start = Date.now();
  478. page.getOperatorList({
  479. handler: handler,
  480. task: task,
  481. intent: data.intent,
  482. renderInteractiveForms: data.renderInteractiveForms
  483. }).then(function (operatorList) {
  484. finishWorkerTask(task);
  485. (0, _util.info)('page=' + pageNum + ' - getOperatorList: time=' + (Date.now() - start) + 'ms, len=' + operatorList.totalLength);
  486. }, function (e) {
  487. finishWorkerTask(task);
  488. if (task.terminated) {
  489. return;
  490. }
  491. handler.send('UnsupportedFeature', { featureId: _util.UNSUPPORTED_FEATURES.unknown });
  492. var minimumStackMessage = 'worker.js: while trying to getPage() and getOperatorList()';
  493. var wrappedException;
  494. if (typeof e === 'string') {
  495. wrappedException = {
  496. message: e,
  497. stack: minimumStackMessage
  498. };
  499. } else if ((typeof e === 'undefined' ? 'undefined' : _typeof(e)) === 'object') {
  500. wrappedException = {
  501. message: e.message || e.toString(),
  502. stack: e.stack || minimumStackMessage
  503. };
  504. } else {
  505. wrappedException = {
  506. message: 'Unknown exception type: ' + (typeof e === 'undefined' ? 'undefined' : _typeof(e)),
  507. stack: minimumStackMessage
  508. };
  509. }
  510. handler.send('PageError', {
  511. pageNum: pageNum,
  512. error: wrappedException,
  513. intent: data.intent
  514. });
  515. });
  516. });
  517. }, this);
  518. handler.on('GetTextContent', function wphExtractText(data, sink) {
  519. var pageIndex = data.pageIndex;
  520. sink.onPull = function (desiredSize) {};
  521. sink.onCancel = function (reason) {};
  522. pdfManager.getPage(pageIndex).then(function (page) {
  523. var task = new WorkerTask('GetTextContent: page ' + pageIndex);
  524. startWorkerTask(task);
  525. var pageNum = pageIndex + 1;
  526. var start = Date.now();
  527. page.extractTextContent({
  528. handler: handler,
  529. task: task,
  530. sink: sink,
  531. normalizeWhitespace: data.normalizeWhitespace,
  532. combineTextItems: data.combineTextItems
  533. }).then(function () {
  534. finishWorkerTask(task);
  535. (0, _util.info)('text indexing: page=' + pageNum + ' - time=' + (Date.now() - start) + 'ms');
  536. sink.close();
  537. }, function (reason) {
  538. finishWorkerTask(task);
  539. if (task.terminated) {
  540. return;
  541. }
  542. sink.error(reason);
  543. throw reason;
  544. });
  545. });
  546. });
  547. handler.on('Cleanup', function wphCleanup(data) {
  548. return pdfManager.cleanup();
  549. });
  550. handler.on('Terminate', function wphTerminate(data) {
  551. terminated = true;
  552. if (pdfManager) {
  553. pdfManager.terminate();
  554. pdfManager = null;
  555. }
  556. if (cancelXHRs) {
  557. cancelXHRs();
  558. }
  559. var waitOn = [];
  560. WorkerTasks.forEach(function (task) {
  561. waitOn.push(task.finished);
  562. task.terminate();
  563. });
  564. return Promise.all(waitOn).then(function () {
  565. handler.destroy();
  566. handler = null;
  567. });
  568. });
  569. handler.on('Ready', function wphReady(data) {
  570. setupDoc(docParams);
  571. docParams = null;
  572. });
  573. return workerHandlerName;
  574. },
  575. initializeFromPort: function initializeFromPort(port) {
  576. var handler = new _util.MessageHandler('worker', 'main', port);
  577. WorkerMessageHandler.setup(handler, port);
  578. handler.send('ready', null);
  579. }
  580. };
  581. function isMessagePort(maybePort) {
  582. return typeof maybePort.postMessage === 'function' && 'onmessage' in maybePort;
  583. }
  584. if (typeof window === 'undefined' && !(0, _util.isNodeJS)() && typeof self !== 'undefined' && isMessagePort(self)) {
  585. WorkerMessageHandler.initializeFromPort(self);
  586. }
  587. exports.WorkerTask = WorkerTask;
  588. exports.WorkerMessageHandler = WorkerMessageHandler;