2
0

worker.js 24 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417418419420421422423424425426427428429430431432433434435436437438439440441442443444445446447448449450451452453454455456457458459460461462463464465466467468469470471472473474475476477478479480481482483484485486487488489490491492493494495496497498499500501502503504505506507508509510511512513514515516517518519520521522523524525526527528529530531532533534535536537538539540541542543544545546547548549550551552553554555556557558559560561562563564565566567568569570571572573574575576577578579580581582583584585586587588589590591592593594595596597598599600601602603604605606607608609610611612613614615616617618619620621622623624625626627628629630631632633634635636637638639640641642643644645646647648649650651652653654655656657658659660661662663664665666667668669670671672673674675676677678679680681682683684685686
  1. /* Copyright 2017 Mozilla Foundation
  2. *
  3. * Licensed under the Apache License, Version 2.0 (the "License");
  4. * you may not use this file except in compliance with the License.
  5. * You may obtain a copy of the License at
  6. *
  7. * http://www.apache.org/licenses/LICENSE-2.0
  8. *
  9. * Unless required by applicable law or agreed to in writing, software
  10. * distributed under the License is distributed on an "AS IS" BASIS,
  11. * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
  12. * See the License for the specific language governing permissions and
  13. * limitations under the License.
  14. */
  15. 'use strict';
  16. var sharedUtil = require('../shared/util.js');
  17. var corePrimitives = require('./primitives.js');
  18. var corePdfManager = require('./pdf_manager.js');
  19. var UNSUPPORTED_FEATURES = sharedUtil.UNSUPPORTED_FEATURES;
  20. var InvalidPDFException = sharedUtil.InvalidPDFException;
  21. var MessageHandler = sharedUtil.MessageHandler;
  22. var MissingPDFException = sharedUtil.MissingPDFException;
  23. var UnexpectedResponseException = sharedUtil.UnexpectedResponseException;
  24. var PasswordException = sharedUtil.PasswordException;
  25. var UnknownErrorException = sharedUtil.UnknownErrorException;
  26. var XRefParseException = sharedUtil.XRefParseException;
  27. var arrayByteLength = sharedUtil.arrayByteLength;
  28. var arraysToBytes = sharedUtil.arraysToBytes;
  29. var assert = sharedUtil.assert;
  30. var createPromiseCapability = sharedUtil.createPromiseCapability;
  31. var info = sharedUtil.info;
  32. var warn = sharedUtil.warn;
  33. var setVerbosityLevel = sharedUtil.setVerbosityLevel;
  34. var isNodeJS = sharedUtil.isNodeJS;
  35. var Ref = corePrimitives.Ref;
  36. var LocalPdfManager = corePdfManager.LocalPdfManager;
  37. var NetworkPdfManager = corePdfManager.NetworkPdfManager;
  38. var WorkerTask = function WorkerTaskClosure() {
  39. function WorkerTask(name) {
  40. this.name = name;
  41. this.terminated = false;
  42. this._capability = createPromiseCapability();
  43. }
  44. WorkerTask.prototype = {
  45. get finished() {
  46. return this._capability.promise;
  47. },
  48. finish: function () {
  49. this._capability.resolve();
  50. },
  51. terminate: function () {
  52. this.terminated = true;
  53. },
  54. ensureNotTerminated: function () {
  55. if (this.terminated) {
  56. throw new Error('Worker task was terminated');
  57. }
  58. }
  59. };
  60. return WorkerTask;
  61. }();
  62. var PDFWorkerStream = function PDFWorkerStreamClosure() {
  63. function PDFWorkerStream(params, msgHandler) {
  64. this._queuedChunks = [];
  65. var initialData = params.initialData;
  66. if (initialData && initialData.length > 0) {
  67. this._queuedChunks.push(initialData);
  68. }
  69. this._msgHandler = msgHandler;
  70. this._isRangeSupported = !params.disableRange;
  71. this._isStreamingSupported = !params.disableStream;
  72. this._contentLength = params.length;
  73. this._fullRequestReader = null;
  74. this._rangeReaders = [];
  75. msgHandler.on('OnDataRange', this._onReceiveData.bind(this));
  76. msgHandler.on('OnDataProgress', this._onProgress.bind(this));
  77. }
  78. PDFWorkerStream.prototype = {
  79. _onReceiveData: function PDFWorkerStream_onReceiveData(args) {
  80. if (args.begin === undefined) {
  81. if (this._fullRequestReader) {
  82. this._fullRequestReader._enqueue(args.chunk);
  83. } else {
  84. this._queuedChunks.push(args.chunk);
  85. }
  86. } else {
  87. var found = this._rangeReaders.some(function (rangeReader) {
  88. if (rangeReader._begin !== args.begin) {
  89. return false;
  90. }
  91. rangeReader._enqueue(args.chunk);
  92. return true;
  93. });
  94. assert(found);
  95. }
  96. },
  97. _onProgress: function PDFWorkerStream_onProgress(evt) {
  98. if (this._rangeReaders.length > 0) {
  99. var firstReader = this._rangeReaders[0];
  100. if (firstReader.onProgress) {
  101. firstReader.onProgress({ loaded: evt.loaded });
  102. }
  103. }
  104. },
  105. _removeRangeReader: function PDFWorkerStream_removeRangeReader(reader) {
  106. var i = this._rangeReaders.indexOf(reader);
  107. if (i >= 0) {
  108. this._rangeReaders.splice(i, 1);
  109. }
  110. },
  111. getFullReader: function PDFWorkerStream_getFullReader() {
  112. assert(!this._fullRequestReader);
  113. var queuedChunks = this._queuedChunks;
  114. this._queuedChunks = null;
  115. return new PDFWorkerStreamReader(this, queuedChunks);
  116. },
  117. getRangeReader: function PDFWorkerStream_getRangeReader(begin, end) {
  118. var reader = new PDFWorkerStreamRangeReader(this, begin, end);
  119. this._msgHandler.send('RequestDataRange', {
  120. begin: begin,
  121. end: end
  122. });
  123. this._rangeReaders.push(reader);
  124. return reader;
  125. },
  126. cancelAllRequests: function PDFWorkerStream_cancelAllRequests(reason) {
  127. if (this._fullRequestReader) {
  128. this._fullRequestReader.cancel(reason);
  129. }
  130. var readers = this._rangeReaders.slice(0);
  131. readers.forEach(function (rangeReader) {
  132. rangeReader.cancel(reason);
  133. });
  134. }
  135. };
  136. function PDFWorkerStreamReader(stream, queuedChunks) {
  137. this._stream = stream;
  138. this._done = false;
  139. this._queuedChunks = queuedChunks || [];
  140. this._requests = [];
  141. this._headersReady = Promise.resolve();
  142. stream._fullRequestReader = this;
  143. this.onProgress = null;
  144. }
  145. PDFWorkerStreamReader.prototype = {
  146. _enqueue: function PDFWorkerStreamReader_enqueue(chunk) {
  147. if (this._done) {
  148. return;
  149. }
  150. if (this._requests.length > 0) {
  151. var requestCapability = this._requests.shift();
  152. requestCapability.resolve({
  153. value: chunk,
  154. done: false
  155. });
  156. return;
  157. }
  158. this._queuedChunks.push(chunk);
  159. },
  160. get headersReady() {
  161. return this._headersReady;
  162. },
  163. get isRangeSupported() {
  164. return this._stream._isRangeSupported;
  165. },
  166. get isStreamingSupported() {
  167. return this._stream._isStreamingSupported;
  168. },
  169. get contentLength() {
  170. return this._stream._contentLength;
  171. },
  172. read: function PDFWorkerStreamReader_read() {
  173. if (this._queuedChunks.length > 0) {
  174. var chunk = this._queuedChunks.shift();
  175. return Promise.resolve({
  176. value: chunk,
  177. done: false
  178. });
  179. }
  180. if (this._done) {
  181. return Promise.resolve({
  182. value: undefined,
  183. done: true
  184. });
  185. }
  186. var requestCapability = createPromiseCapability();
  187. this._requests.push(requestCapability);
  188. return requestCapability.promise;
  189. },
  190. cancel: function PDFWorkerStreamReader_cancel(reason) {
  191. this._done = true;
  192. this._requests.forEach(function (requestCapability) {
  193. requestCapability.resolve({
  194. value: undefined,
  195. done: true
  196. });
  197. });
  198. this._requests = [];
  199. }
  200. };
  201. function PDFWorkerStreamRangeReader(stream, begin, end) {
  202. this._stream = stream;
  203. this._begin = begin;
  204. this._end = end;
  205. this._queuedChunk = null;
  206. this._requests = [];
  207. this._done = false;
  208. this.onProgress = null;
  209. }
  210. PDFWorkerStreamRangeReader.prototype = {
  211. _enqueue: function PDFWorkerStreamRangeReader_enqueue(chunk) {
  212. if (this._done) {
  213. return;
  214. }
  215. if (this._requests.length === 0) {
  216. this._queuedChunk = chunk;
  217. } else {
  218. var requestsCapability = this._requests.shift();
  219. requestsCapability.resolve({
  220. value: chunk,
  221. done: false
  222. });
  223. this._requests.forEach(function (requestCapability) {
  224. requestCapability.resolve({
  225. value: undefined,
  226. done: true
  227. });
  228. });
  229. this._requests = [];
  230. }
  231. this._done = true;
  232. this._stream._removeRangeReader(this);
  233. },
  234. get isStreamingSupported() {
  235. return false;
  236. },
  237. read: function PDFWorkerStreamRangeReader_read() {
  238. if (this._queuedChunk) {
  239. return Promise.resolve({
  240. value: this._queuedChunk,
  241. done: false
  242. });
  243. }
  244. if (this._done) {
  245. return Promise.resolve({
  246. value: undefined,
  247. done: true
  248. });
  249. }
  250. var requestCapability = createPromiseCapability();
  251. this._requests.push(requestCapability);
  252. return requestCapability.promise;
  253. },
  254. cancel: function PDFWorkerStreamRangeReader_cancel(reason) {
  255. this._done = true;
  256. this._requests.forEach(function (requestCapability) {
  257. requestCapability.resolve({
  258. value: undefined,
  259. done: true
  260. });
  261. });
  262. this._requests = [];
  263. this._stream._removeRangeReader(this);
  264. }
  265. };
  266. return PDFWorkerStream;
  267. }();
  268. var PDFNetworkStream;
  269. function setPDFNetworkStreamClass(cls) {
  270. PDFNetworkStream = cls;
  271. }
  272. var WorkerMessageHandler = {
  273. setup: function wphSetup(handler, port) {
  274. var testMessageProcessed = false;
  275. handler.on('test', function wphSetupTest(data) {
  276. if (testMessageProcessed) {
  277. return;
  278. }
  279. testMessageProcessed = true;
  280. if (!(data instanceof Uint8Array)) {
  281. handler.send('test', 'main', false);
  282. return;
  283. }
  284. var supportTransfers = data[0] === 255;
  285. handler.postMessageTransfers = supportTransfers;
  286. var xhr = new XMLHttpRequest();
  287. var responseExists = 'response' in xhr;
  288. try {
  289. xhr.responseType;
  290. } catch (e) {
  291. responseExists = false;
  292. }
  293. if (!responseExists) {
  294. handler.send('test', false);
  295. return;
  296. }
  297. handler.send('test', {
  298. supportTypedArray: true,
  299. supportTransfers: supportTransfers
  300. });
  301. });
  302. handler.on('configure', function wphConfigure(data) {
  303. setVerbosityLevel(data.verbosity);
  304. });
  305. handler.on('GetDocRequest', function wphSetupDoc(data) {
  306. return WorkerMessageHandler.createDocumentHandler(data, port);
  307. });
  308. },
  309. createDocumentHandler: function wphCreateDocumentHandler(docParams, port) {
  310. var pdfManager;
  311. var terminated = false;
  312. var cancelXHRs = null;
  313. var WorkerTasks = [];
  314. var docId = docParams.docId;
  315. var docBaseUrl = docParams.docBaseUrl;
  316. var workerHandlerName = docParams.docId + '_worker';
  317. var handler = new MessageHandler(workerHandlerName, docId, port);
  318. handler.postMessageTransfers = docParams.postMessageTransfers;
  319. function ensureNotTerminated() {
  320. if (terminated) {
  321. throw new Error('Worker was terminated');
  322. }
  323. }
  324. function startWorkerTask(task) {
  325. WorkerTasks.push(task);
  326. }
  327. function finishWorkerTask(task) {
  328. task.finish();
  329. var i = WorkerTasks.indexOf(task);
  330. WorkerTasks.splice(i, 1);
  331. }
  332. function loadDocument(recoveryMode) {
  333. var loadDocumentCapability = createPromiseCapability();
  334. var parseSuccess = function parseSuccess() {
  335. var numPagesPromise = pdfManager.ensureDoc('numPages');
  336. var fingerprintPromise = pdfManager.ensureDoc('fingerprint');
  337. var encryptedPromise = pdfManager.ensureXRef('encrypt');
  338. Promise.all([numPagesPromise, fingerprintPromise, encryptedPromise]).then(function onDocReady(results) {
  339. var doc = {
  340. numPages: results[0],
  341. fingerprint: results[1],
  342. encrypted: !!results[2]
  343. };
  344. loadDocumentCapability.resolve(doc);
  345. }, parseFailure);
  346. };
  347. var parseFailure = function parseFailure(e) {
  348. loadDocumentCapability.reject(e);
  349. };
  350. pdfManager.ensureDoc('checkHeader', []).then(function () {
  351. pdfManager.ensureDoc('parseStartXRef', []).then(function () {
  352. pdfManager.ensureDoc('parse', [recoveryMode]).then(parseSuccess, parseFailure);
  353. }, parseFailure);
  354. }, parseFailure);
  355. return loadDocumentCapability.promise;
  356. }
  357. function getPdfManager(data, evaluatorOptions) {
  358. var pdfManagerCapability = createPromiseCapability();
  359. var pdfManager;
  360. var source = data.source;
  361. if (source.data) {
  362. try {
  363. pdfManager = new LocalPdfManager(docId, source.data, source.password, evaluatorOptions, docBaseUrl);
  364. pdfManagerCapability.resolve(pdfManager);
  365. } catch (ex) {
  366. pdfManagerCapability.reject(ex);
  367. }
  368. return pdfManagerCapability.promise;
  369. }
  370. var pdfStream;
  371. try {
  372. if (source.chunkedViewerLoading) {
  373. pdfStream = new PDFWorkerStream(source, handler);
  374. } else {
  375. assert(PDFNetworkStream, 'pdfjs/core/network module is not loaded');
  376. pdfStream = new PDFNetworkStream(data);
  377. }
  378. } catch (ex) {
  379. pdfManagerCapability.reject(ex);
  380. return pdfManagerCapability.promise;
  381. }
  382. var fullRequest = pdfStream.getFullReader();
  383. fullRequest.headersReady.then(function () {
  384. if (!fullRequest.isStreamingSupported || !fullRequest.isRangeSupported) {
  385. fullRequest.onProgress = function (evt) {
  386. handler.send('DocProgress', {
  387. loaded: evt.loaded,
  388. total: evt.total
  389. });
  390. };
  391. }
  392. if (!fullRequest.isRangeSupported) {
  393. return;
  394. }
  395. var disableAutoFetch = source.disableAutoFetch || fullRequest.isStreamingSupported;
  396. pdfManager = new NetworkPdfManager(docId, pdfStream, {
  397. msgHandler: handler,
  398. url: source.url,
  399. password: source.password,
  400. length: fullRequest.contentLength,
  401. disableAutoFetch: disableAutoFetch,
  402. rangeChunkSize: source.rangeChunkSize
  403. }, evaluatorOptions, docBaseUrl);
  404. pdfManagerCapability.resolve(pdfManager);
  405. cancelXHRs = null;
  406. }).catch(function (reason) {
  407. pdfManagerCapability.reject(reason);
  408. cancelXHRs = null;
  409. });
  410. var cachedChunks = [],
  411. loaded = 0;
  412. var flushChunks = function () {
  413. var pdfFile = arraysToBytes(cachedChunks);
  414. if (source.length && pdfFile.length !== source.length) {
  415. warn('reported HTTP length is different from actual');
  416. }
  417. try {
  418. pdfManager = new LocalPdfManager(docId, pdfFile, source.password, evaluatorOptions, docBaseUrl);
  419. pdfManagerCapability.resolve(pdfManager);
  420. } catch (ex) {
  421. pdfManagerCapability.reject(ex);
  422. }
  423. cachedChunks = [];
  424. };
  425. var readPromise = new Promise(function (resolve, reject) {
  426. var readChunk = function (chunk) {
  427. try {
  428. ensureNotTerminated();
  429. if (chunk.done) {
  430. if (!pdfManager) {
  431. flushChunks();
  432. }
  433. cancelXHRs = null;
  434. return;
  435. }
  436. var data = chunk.value;
  437. loaded += arrayByteLength(data);
  438. if (!fullRequest.isStreamingSupported) {
  439. handler.send('DocProgress', {
  440. loaded: loaded,
  441. total: Math.max(loaded, fullRequest.contentLength || 0)
  442. });
  443. }
  444. if (pdfManager) {
  445. pdfManager.sendProgressiveData(data);
  446. } else {
  447. cachedChunks.push(data);
  448. }
  449. fullRequest.read().then(readChunk, reject);
  450. } catch (e) {
  451. reject(e);
  452. }
  453. };
  454. fullRequest.read().then(readChunk, reject);
  455. });
  456. readPromise.catch(function (e) {
  457. pdfManagerCapability.reject(e);
  458. cancelXHRs = null;
  459. });
  460. cancelXHRs = function () {
  461. pdfStream.cancelAllRequests('abort');
  462. };
  463. return pdfManagerCapability.promise;
  464. }
  465. function setupDoc(data) {
  466. function onSuccess(doc) {
  467. ensureNotTerminated();
  468. handler.send('GetDoc', { pdfInfo: doc });
  469. }
  470. function onFailure(e) {
  471. if (e instanceof PasswordException) {
  472. var task = new WorkerTask('PasswordException: response ' + e.code);
  473. startWorkerTask(task);
  474. handler.sendWithPromise('PasswordRequest', e).then(function (data) {
  475. finishWorkerTask(task);
  476. pdfManager.updatePassword(data.password);
  477. pdfManagerReady();
  478. }).catch(function (ex) {
  479. finishWorkerTask(task);
  480. handler.send('PasswordException', ex);
  481. }.bind(null, e));
  482. } else if (e instanceof InvalidPDFException) {
  483. handler.send('InvalidPDF', e);
  484. } else if (e instanceof MissingPDFException) {
  485. handler.send('MissingPDF', e);
  486. } else if (e instanceof UnexpectedResponseException) {
  487. handler.send('UnexpectedResponse', e);
  488. } else {
  489. handler.send('UnknownError', new UnknownErrorException(e.message, e.toString()));
  490. }
  491. }
  492. function pdfManagerReady() {
  493. ensureNotTerminated();
  494. loadDocument(false).then(onSuccess, function loadFailure(ex) {
  495. ensureNotTerminated();
  496. if (!(ex instanceof XRefParseException)) {
  497. onFailure(ex);
  498. return;
  499. }
  500. pdfManager.requestLoadedStream();
  501. pdfManager.onLoadedStream().then(function () {
  502. ensureNotTerminated();
  503. loadDocument(true).then(onSuccess, onFailure);
  504. });
  505. }, onFailure);
  506. }
  507. ensureNotTerminated();
  508. var evaluatorOptions = {
  509. forceDataSchema: data.disableCreateObjectURL,
  510. maxImageSize: data.maxImageSize === undefined ? -1 : data.maxImageSize,
  511. disableFontFace: data.disableFontFace,
  512. disableNativeImageDecoder: data.disableNativeImageDecoder
  513. };
  514. getPdfManager(data, evaluatorOptions).then(function (newPdfManager) {
  515. if (terminated) {
  516. newPdfManager.terminate();
  517. throw new Error('Worker was terminated');
  518. }
  519. pdfManager = newPdfManager;
  520. handler.send('PDFManagerReady', null);
  521. pdfManager.onLoadedStream().then(function (stream) {
  522. handler.send('DataLoaded', { length: stream.bytes.byteLength });
  523. });
  524. }).then(pdfManagerReady, onFailure);
  525. }
  526. handler.on('GetPage', function wphSetupGetPage(data) {
  527. return pdfManager.getPage(data.pageIndex).then(function (page) {
  528. var rotatePromise = pdfManager.ensure(page, 'rotate');
  529. var refPromise = pdfManager.ensure(page, 'ref');
  530. var userUnitPromise = pdfManager.ensure(page, 'userUnit');
  531. var viewPromise = pdfManager.ensure(page, 'view');
  532. return Promise.all([rotatePromise, refPromise, userUnitPromise, viewPromise]).then(function (results) {
  533. return {
  534. rotate: results[0],
  535. ref: results[1],
  536. userUnit: results[2],
  537. view: results[3]
  538. };
  539. });
  540. });
  541. });
  542. handler.on('GetPageIndex', function wphSetupGetPageIndex(data) {
  543. var ref = new Ref(data.ref.num, data.ref.gen);
  544. var catalog = pdfManager.pdfDocument.catalog;
  545. return catalog.getPageIndex(ref);
  546. });
  547. handler.on('GetDestinations', function wphSetupGetDestinations(data) {
  548. return pdfManager.ensureCatalog('destinations');
  549. });
  550. handler.on('GetDestination', function wphSetupGetDestination(data) {
  551. return pdfManager.ensureCatalog('getDestination', [data.id]);
  552. });
  553. handler.on('GetPageLabels', function wphSetupGetPageLabels(data) {
  554. return pdfManager.ensureCatalog('pageLabels');
  555. });
  556. handler.on('GetAttachments', function wphSetupGetAttachments(data) {
  557. return pdfManager.ensureCatalog('attachments');
  558. });
  559. handler.on('GetJavaScript', function wphSetupGetJavaScript(data) {
  560. return pdfManager.ensureCatalog('javaScript');
  561. });
  562. handler.on('GetOutline', function wphSetupGetOutline(data) {
  563. return pdfManager.ensureCatalog('documentOutline');
  564. });
  565. handler.on('GetMetadata', function wphSetupGetMetadata(data) {
  566. return Promise.all([pdfManager.ensureDoc('documentInfo'), pdfManager.ensureCatalog('metadata')]);
  567. });
  568. handler.on('GetData', function wphSetupGetData(data) {
  569. pdfManager.requestLoadedStream();
  570. return pdfManager.onLoadedStream().then(function (stream) {
  571. return stream.bytes;
  572. });
  573. });
  574. handler.on('GetStats', function wphSetupGetStats(data) {
  575. return pdfManager.pdfDocument.xref.stats;
  576. });
  577. handler.on('GetAnnotations', function wphSetupGetAnnotations(data) {
  578. return pdfManager.getPage(data.pageIndex).then(function (page) {
  579. return pdfManager.ensure(page, 'getAnnotationsData', [data.intent]);
  580. });
  581. });
  582. handler.on('RenderPageRequest', function wphSetupRenderPage(data) {
  583. var pageIndex = data.pageIndex;
  584. pdfManager.getPage(pageIndex).then(function (page) {
  585. var task = new WorkerTask('RenderPageRequest: page ' + pageIndex);
  586. startWorkerTask(task);
  587. var pageNum = pageIndex + 1;
  588. var start = Date.now();
  589. page.getOperatorList(handler, task, data.intent, data.renderInteractiveForms).then(function (operatorList) {
  590. finishWorkerTask(task);
  591. info('page=' + pageNum + ' - getOperatorList: time=' + (Date.now() - start) + 'ms, len=' + operatorList.totalLength);
  592. }, function (e) {
  593. finishWorkerTask(task);
  594. if (task.terminated) {
  595. return;
  596. }
  597. handler.send('UnsupportedFeature', { featureId: UNSUPPORTED_FEATURES.unknown });
  598. var minimumStackMessage = 'worker.js: while trying to getPage() and getOperatorList()';
  599. var wrappedException;
  600. if (typeof e === 'string') {
  601. wrappedException = {
  602. message: e,
  603. stack: minimumStackMessage
  604. };
  605. } else if (typeof e === 'object') {
  606. wrappedException = {
  607. message: e.message || e.toString(),
  608. stack: e.stack || minimumStackMessage
  609. };
  610. } else {
  611. wrappedException = {
  612. message: 'Unknown exception type: ' + typeof e,
  613. stack: minimumStackMessage
  614. };
  615. }
  616. handler.send('PageError', {
  617. pageNum: pageNum,
  618. error: wrappedException,
  619. intent: data.intent
  620. });
  621. });
  622. });
  623. }, this);
  624. handler.on('GetTextContent', function wphExtractText(data) {
  625. var pageIndex = data.pageIndex;
  626. var normalizeWhitespace = data.normalizeWhitespace;
  627. var combineTextItems = data.combineTextItems;
  628. return pdfManager.getPage(pageIndex).then(function (page) {
  629. var task = new WorkerTask('GetTextContent: page ' + pageIndex);
  630. startWorkerTask(task);
  631. var pageNum = pageIndex + 1;
  632. var start = Date.now();
  633. return page.extractTextContent(handler, task, normalizeWhitespace, combineTextItems).then(function (textContent) {
  634. finishWorkerTask(task);
  635. info('text indexing: page=' + pageNum + ' - time=' + (Date.now() - start) + 'ms');
  636. return textContent;
  637. }, function (reason) {
  638. finishWorkerTask(task);
  639. if (task.terminated) {
  640. return;
  641. }
  642. throw reason;
  643. });
  644. });
  645. });
  646. handler.on('Cleanup', function wphCleanup(data) {
  647. return pdfManager.cleanup();
  648. });
  649. handler.on('Terminate', function wphTerminate(data) {
  650. terminated = true;
  651. if (pdfManager) {
  652. pdfManager.terminate();
  653. pdfManager = null;
  654. }
  655. if (cancelXHRs) {
  656. cancelXHRs();
  657. }
  658. var waitOn = [];
  659. WorkerTasks.forEach(function (task) {
  660. waitOn.push(task.finished);
  661. task.terminate();
  662. });
  663. return Promise.all(waitOn).then(function () {
  664. handler.destroy();
  665. handler = null;
  666. });
  667. });
  668. handler.on('Ready', function wphReady(data) {
  669. setupDoc(docParams);
  670. docParams = null;
  671. });
  672. return workerHandlerName;
  673. }
  674. };
  675. function initializeWorker() {
  676. var handler = new MessageHandler('worker', 'main', self);
  677. WorkerMessageHandler.setup(handler, self);
  678. handler.send('ready', null);
  679. }
  680. if (typeof window === 'undefined' && !isNodeJS()) {
  681. initializeWorker();
  682. }
  683. exports.setPDFNetworkStreamClass = setPDFNetworkStreamClass;
  684. exports.WorkerTask = WorkerTask;
  685. exports.WorkerMessageHandler = WorkerMessageHandler;