cmap.js 21 KB

12345678910111213141516171819202122232425262728293031323334353637383940414243444546474849505152535455565758596061626364656667686970717273747576777879808182838485868788899091929394959697989910010110210310410510610710810911011111211311411511611711811912012112212312412512612712812913013113213313413513613713813914014114214314414514614714814915015115215315415515615715815916016116216316416516616716816917017117217317417517617717817918018118218318418518618718818919019119219319419519619719819920020120220320420520620720820921021121221321421521621721821922022122222322422522622722822923023123223323423523623723823924024124224324424524624724824925025125225325425525625725825926026126226326426526626726826927027127227327427527627727827928028128228328428528628728828929029129229329429529629729829930030130230330430530630730830931031131231331431531631731831932032132232332432532632732832933033133233333433533633733833934034134234334434534634734834935035135235335435535635735835936036136236336436536636736836937037137237337437537637737837938038138238338438538638738838939039139239339439539639739839940040140240340440540640740840941041141241341441541641741841942042142242342442542642742842943043143243343443543643743843944044144244344444544644744844945045145245345445545645745845946046146246346446546646746846947047147247347447547647747847948048148248348448548648748848949049149249349449549649749849950050150250350450550650750850951051151251351451551651751851952052152252352452552652752852953053153253353453553653753853954054154254354454554654754854955055155255355455555655755855956056156256356456556656756856957057157257357457557657757857958058158258358458558658758858959059159259359459559659759859960060160260360460560660760860961061161261361461561661761861962062162262362462562662762862963063163263363463563663763863964064164264364464564664764864965065165265365465565665765865966066166266366466566666766866967067167267367467567667767867968068168268368468568668768868969069169269369469569669769869970070170270
3704705706707708709710711712713714715716717718719720721722723724725726727728729730731732733734735736737738739740741742743744745746747748749750751752753754755756757758759760761762763764765766767768769770771772773774775776777778779780781782783784785786787788789790791792793794795796797798799800801802803804805806807808809810811812813814815816817818819820821822823824825826827828829830831832833834835836837838839840841842843844845846847848849850851852853854855856857858859860861862863864865866867868869870871872873874875876877878879880881882883884
  1. /* Copyright 2017 Mozilla Foundation
  2. *
  3. * Licensed under the Apache License, Version 2.0 (the "License");
  4. * you may not use this file except in compliance with the License.
  5. * You may obtain a copy of the License at
  6. *
  7. * http://www.apache.org/licenses/LICENSE-2.0
  8. *
  9. * Unless required by applicable law or agreed to in writing, software
  10. * distributed under the License is distributed on an "AS IS" BASIS,
  11. * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
  12. * See the License for the specific language governing permissions and
  13. * limitations under the License.
  14. */
  15. 'use strict';
  16. var sharedUtil = require('../shared/util.js');
  17. var corePrimitives = require('./primitives.js');
  18. var coreStream = require('./stream.js');
  19. var coreParser = require('./parser.js');
  20. var Util = sharedUtil.Util;
  21. var assert = sharedUtil.assert;
  22. var warn = sharedUtil.warn;
  23. var error = sharedUtil.error;
  24. var isInt = sharedUtil.isInt;
  25. var isString = sharedUtil.isString;
  26. var MissingDataException = sharedUtil.MissingDataException;
  27. var CMapCompressionType = sharedUtil.CMapCompressionType;
  28. var isEOF = corePrimitives.isEOF;
  29. var isName = corePrimitives.isName;
  30. var isCmd = corePrimitives.isCmd;
  31. var isStream = corePrimitives.isStream;
  32. var Stream = coreStream.Stream;
  33. var Lexer = coreParser.Lexer;
// Names of the predefined CMaps that createBuiltInCMap() will agree to fetch.
// Any name that is not in this list is rejected there with
// 'Unknown cMap name: ...'. 'Identity-H' and 'Identity-V' are not listed
// because createBuiltInCMap() handles them before consulting this list.
var BUILT_IN_CMAPS = [
'Adobe-GB1-UCS2',
'Adobe-CNS1-UCS2',
'Adobe-Japan1-UCS2',
'Adobe-Korea1-UCS2',
'78-EUC-H',
'78-EUC-V',
'78-H',
'78-RKSJ-H',
'78-RKSJ-V',
'78-V',
'78ms-RKSJ-H',
'78ms-RKSJ-V',
'83pv-RKSJ-H',
'90ms-RKSJ-H',
'90ms-RKSJ-V',
'90msp-RKSJ-H',
'90msp-RKSJ-V',
'90pv-RKSJ-H',
'90pv-RKSJ-V',
'Add-H',
'Add-RKSJ-H',
'Add-RKSJ-V',
'Add-V',
'Adobe-CNS1-0',
'Adobe-CNS1-1',
'Adobe-CNS1-2',
'Adobe-CNS1-3',
'Adobe-CNS1-4',
'Adobe-CNS1-5',
'Adobe-CNS1-6',
'Adobe-GB1-0',
'Adobe-GB1-1',
'Adobe-GB1-2',
'Adobe-GB1-3',
'Adobe-GB1-4',
'Adobe-GB1-5',
'Adobe-Japan1-0',
'Adobe-Japan1-1',
'Adobe-Japan1-2',
'Adobe-Japan1-3',
'Adobe-Japan1-4',
'Adobe-Japan1-5',
'Adobe-Japan1-6',
'Adobe-Korea1-0',
'Adobe-Korea1-1',
'Adobe-Korea1-2',
'B5-H',
'B5-V',
'B5pc-H',
'B5pc-V',
'CNS-EUC-H',
'CNS-EUC-V',
'CNS1-H',
'CNS1-V',
'CNS2-H',
'CNS2-V',
'ETHK-B5-H',
'ETHK-B5-V',
'ETen-B5-H',
'ETen-B5-V',
'ETenms-B5-H',
'ETenms-B5-V',
'EUC-H',
'EUC-V',
'Ext-H',
'Ext-RKSJ-H',
'Ext-RKSJ-V',
'Ext-V',
'GB-EUC-H',
'GB-EUC-V',
'GB-H',
'GB-V',
'GBK-EUC-H',
'GBK-EUC-V',
'GBK2K-H',
'GBK2K-V',
'GBKp-EUC-H',
'GBKp-EUC-V',
'GBT-EUC-H',
'GBT-EUC-V',
'GBT-H',
'GBT-V',
'GBTpc-EUC-H',
'GBTpc-EUC-V',
'GBpc-EUC-H',
'GBpc-EUC-V',
'H',
'HKdla-B5-H',
'HKdla-B5-V',
'HKdlb-B5-H',
'HKdlb-B5-V',
'HKgccs-B5-H',
'HKgccs-B5-V',
'HKm314-B5-H',
'HKm314-B5-V',
'HKm471-B5-H',
'HKm471-B5-V',
'HKscs-B5-H',
'HKscs-B5-V',
'Hankaku',
'Hiragana',
'KSC-EUC-H',
'KSC-EUC-V',
'KSC-H',
'KSC-Johab-H',
'KSC-Johab-V',
'KSC-V',
'KSCms-UHC-H',
'KSCms-UHC-HW-H',
'KSCms-UHC-HW-V',
'KSCms-UHC-V',
'KSCpc-EUC-H',
'KSCpc-EUC-V',
'Katakana',
'NWP-H',
'NWP-V',
'RKSJ-H',
'RKSJ-V',
'Roman',
'UniCNS-UCS2-H',
'UniCNS-UCS2-V',
'UniCNS-UTF16-H',
'UniCNS-UTF16-V',
'UniCNS-UTF32-H',
'UniCNS-UTF32-V',
'UniCNS-UTF8-H',
'UniCNS-UTF8-V',
'UniGB-UCS2-H',
'UniGB-UCS2-V',
'UniGB-UTF16-H',
'UniGB-UTF16-V',
'UniGB-UTF32-H',
'UniGB-UTF32-V',
'UniGB-UTF8-H',
'UniGB-UTF8-V',
'UniJIS-UCS2-H',
'UniJIS-UCS2-HW-H',
'UniJIS-UCS2-HW-V',
'UniJIS-UCS2-V',
'UniJIS-UTF16-H',
'UniJIS-UTF16-V',
'UniJIS-UTF32-H',
'UniJIS-UTF32-V',
'UniJIS-UTF8-H',
'UniJIS-UTF8-V',
'UniJIS2004-UTF16-H',
'UniJIS2004-UTF16-V',
'UniJIS2004-UTF32-H',
'UniJIS2004-UTF32-V',
'UniJIS2004-UTF8-H',
'UniJIS2004-UTF8-V',
'UniJISPro-UCS2-HW-V',
'UniJISPro-UCS2-V',
'UniJISPro-UTF8-V',
'UniJISX0213-UTF32-H',
'UniJISX0213-UTF32-V',
'UniJISX02132004-UTF32-H',
'UniJISX02132004-UTF32-V',
'UniKS-UCS2-H',
'UniKS-UCS2-V',
'UniKS-UTF16-H',
'UniKS-UTF16-V',
'UniKS-UTF32-H',
'UniKS-UTF32-V',
'UniKS-UTF8-H',
'UniKS-UTF8-V',
'V',
'WP-Symbol'
];
  204. var CMap = function CMapClosure() {
  205. function CMap(builtInCMap) {
  206. this.codespaceRanges = [
  207. [],
  208. [],
  209. [],
  210. []
  211. ];
  212. this.numCodespaceRanges = 0;
  213. this._map = [];
  214. this.name = '';
  215. this.vertical = false;
  216. this.useCMap = null;
  217. this.builtInCMap = builtInCMap;
  218. }
  219. CMap.prototype = {
  220. addCodespaceRange: function (n, low, high) {
  221. this.codespaceRanges[n - 1].push(low, high);
  222. this.numCodespaceRanges++;
  223. },
  224. mapCidRange: function (low, high, dstLow) {
  225. while (low <= high) {
  226. this._map[low++] = dstLow++;
  227. }
  228. },
  229. mapBfRange: function (low, high, dstLow) {
  230. var lastByte = dstLow.length - 1;
  231. while (low <= high) {
  232. this._map[low++] = dstLow;
  233. dstLow = dstLow.substr(0, lastByte) + String.fromCharCode(dstLow.charCodeAt(lastByte) + 1);
  234. }
  235. },
  236. mapBfRangeToArray: function (low, high, array) {
  237. var i = 0, ii = array.length;
  238. while (low <= high && i < ii) {
  239. this._map[low] = array[i++];
  240. ++low;
  241. }
  242. },
  243. mapOne: function (src, dst) {
  244. this._map[src] = dst;
  245. },
  246. lookup: function (code) {
  247. return this._map[code];
  248. },
  249. contains: function (code) {
  250. return this._map[code] !== undefined;
  251. },
  252. forEach: function (callback) {
  253. var map = this._map;
  254. var length = map.length;
  255. var i;
  256. if (length <= 0x10000) {
  257. for (i = 0; i < length; i++) {
  258. if (map[i] !== undefined) {
  259. callback(i, map[i]);
  260. }
  261. }
  262. } else {
  263. for (i in this._map) {
  264. callback(i, map[i]);
  265. }
  266. }
  267. },
  268. charCodeOf: function (value) {
  269. return this._map.indexOf(value);
  270. },
  271. getMap: function () {
  272. return this._map;
  273. },
  274. readCharCode: function (str, offset, out) {
  275. var c = 0;
  276. var codespaceRanges = this.codespaceRanges;
  277. var codespaceRangesLen = this.codespaceRanges.length;
  278. for (var n = 0; n < codespaceRangesLen; n++) {
  279. c = (c << 8 | str.charCodeAt(offset + n)) >>> 0;
  280. var codespaceRange = codespaceRanges[n];
  281. for (var k = 0, kk = codespaceRange.length; k < kk;) {
  282. var low = codespaceRange[k++];
  283. var high = codespaceRange[k++];
  284. if (c >= low && c <= high) {
  285. out.charcode = c;
  286. out.length = n + 1;
  287. return;
  288. }
  289. }
  290. }
  291. out.charcode = 0;
  292. out.length = 1;
  293. },
  294. get length() {
  295. return this._map.length;
  296. },
  297. get isIdentityCMap() {
  298. if (!(this.name === 'Identity-H' || this.name === 'Identity-V')) {
  299. return false;
  300. }
  301. if (this._map.length !== 0x10000) {
  302. return false;
  303. }
  304. for (var i = 0; i < 0x10000; i++) {
  305. if (this._map[i] !== i) {
  306. return false;
  307. }
  308. }
  309. return true;
  310. }
  311. };
  312. return CMap;
  313. }();
  314. var IdentityCMap = function IdentityCMapClosure() {
  315. function IdentityCMap(vertical, n) {
  316. CMap.call(this);
  317. this.vertical = vertical;
  318. this.addCodespaceRange(n, 0, 0xffff);
  319. }
  320. Util.inherit(IdentityCMap, CMap, {});
  321. IdentityCMap.prototype = {
  322. addCodespaceRange: CMap.prototype.addCodespaceRange,
  323. mapCidRange: function (low, high, dstLow) {
  324. error('should not call mapCidRange');
  325. },
  326. mapBfRange: function (low, high, dstLow) {
  327. error('should not call mapBfRange');
  328. },
  329. mapBfRangeToArray: function (low, high, array) {
  330. error('should not call mapBfRangeToArray');
  331. },
  332. mapOne: function (src, dst) {
  333. error('should not call mapCidOne');
  334. },
  335. lookup: function (code) {
  336. return isInt(code) && code <= 0xffff ? code : undefined;
  337. },
  338. contains: function (code) {
  339. return isInt(code) && code <= 0xffff;
  340. },
  341. forEach: function (callback) {
  342. for (var i = 0; i <= 0xffff; i++) {
  343. callback(i, i);
  344. }
  345. },
  346. charCodeOf: function (value) {
  347. return isInt(value) && value <= 0xffff ? value : -1;
  348. },
  349. getMap: function () {
  350. var map = new Array(0x10000);
  351. for (var i = 0; i <= 0xffff; i++) {
  352. map[i] = i;
  353. }
  354. return map;
  355. },
  356. readCharCode: CMap.prototype.readCharCode,
  357. get length() {
  358. return 0x10000;
  359. },
  360. get isIdentityCMap() {
  361. error('should not access .isIdentityCMap');
  362. }
  363. };
  364. return IdentityCMap;
  365. }();
  366. var BinaryCMapReader = function BinaryCMapReaderClosure() {
  367. function hexToInt(a, size) {
  368. var n = 0;
  369. for (var i = 0; i <= size; i++) {
  370. n = n << 8 | a[i];
  371. }
  372. return n >>> 0;
  373. }
  374. function hexToStr(a, size) {
  375. if (size === 1) {
  376. return String.fromCharCode(a[0], a[1]);
  377. }
  378. if (size === 3) {
  379. return String.fromCharCode(a[0], a[1], a[2], a[3]);
  380. }
  381. return String.fromCharCode.apply(null, a.subarray(0, size + 1));
  382. }
  383. function addHex(a, b, size) {
  384. var c = 0;
  385. for (var i = size; i >= 0; i--) {
  386. c += a[i] + b[i];
  387. a[i] = c & 255;
  388. c >>= 8;
  389. }
  390. }
  391. function incHex(a, size) {
  392. var c = 1;
  393. for (var i = size; i >= 0 && c > 0; i--) {
  394. c += a[i];
  395. a[i] = c & 255;
  396. c >>= 8;
  397. }
  398. }
  399. var MAX_NUM_SIZE = 16;
  400. var MAX_ENCODED_NUM_SIZE = 19;
  401. function BinaryCMapStream(data) {
  402. this.buffer = data;
  403. this.pos = 0;
  404. this.end = data.length;
  405. this.tmpBuf = new Uint8Array(MAX_ENCODED_NUM_SIZE);
  406. }
  407. BinaryCMapStream.prototype = {
  408. readByte: function () {
  409. if (this.pos >= this.end) {
  410. return -1;
  411. }
  412. return this.buffer[this.pos++];
  413. },
  414. readNumber: function () {
  415. var n = 0;
  416. var last;
  417. do {
  418. var b = this.readByte();
  419. if (b < 0) {
  420. error('unexpected EOF in bcmap');
  421. }
  422. last = !(b & 0x80);
  423. n = n << 7 | b & 0x7F;
  424. } while (!last);
  425. return n;
  426. },
  427. readSigned: function () {
  428. var n = this.readNumber();
  429. return n & 1 ? ~(n >>> 1) : n >>> 1;
  430. },
  431. readHex: function (num, size) {
  432. num.set(this.buffer.subarray(this.pos, this.pos + size + 1));
  433. this.pos += size + 1;
  434. },
  435. readHexNumber: function (num, size) {
  436. var last;
  437. var stack = this.tmpBuf, sp = 0;
  438. do {
  439. var b = this.readByte();
  440. if (b < 0) {
  441. error('unexpected EOF in bcmap');
  442. }
  443. last = !(b & 0x80);
  444. stack[sp++] = b & 0x7F;
  445. } while (!last);
  446. var i = size, buffer = 0, bufferSize = 0;
  447. while (i >= 0) {
  448. while (bufferSize < 8 && stack.length > 0) {
  449. buffer = stack[--sp] << bufferSize | buffer;
  450. bufferSize += 7;
  451. }
  452. num[i] = buffer & 255;
  453. i--;
  454. buffer >>= 8;
  455. bufferSize -= 8;
  456. }
  457. },
  458. readHexSigned: function (num, size) {
  459. this.readHexNumber(num, size);
  460. var sign = num[size] & 1 ? 255 : 0;
  461. var c = 0;
  462. for (var i = 0; i <= size; i++) {
  463. c = (c & 1) << 8 | num[i];
  464. num[i] = c >> 1 ^ sign;
  465. }
  466. },
  467. readString: function () {
  468. var len = this.readNumber();
  469. var s = '';
  470. for (var i = 0; i < len; i++) {
  471. s += String.fromCharCode(this.readNumber());
  472. }
  473. return s;
  474. }
  475. };
  476. function processBinaryCMap(data, cMap, extend) {
  477. return new Promise(function (resolve, reject) {
  478. var stream = new BinaryCMapStream(data);
  479. var header = stream.readByte();
  480. cMap.vertical = !!(header & 1);
  481. var useCMap = null;
  482. var start = new Uint8Array(MAX_NUM_SIZE);
  483. var end = new Uint8Array(MAX_NUM_SIZE);
  484. var char = new Uint8Array(MAX_NUM_SIZE);
  485. var charCode = new Uint8Array(MAX_NUM_SIZE);
  486. var tmp = new Uint8Array(MAX_NUM_SIZE);
  487. var code;
  488. var b;
  489. while ((b = stream.readByte()) >= 0) {
  490. var type = b >> 5;
  491. if (type === 7) {
  492. switch (b & 0x1F) {
  493. case 0:
  494. stream.readString();
  495. break;
  496. case 1:
  497. useCMap = stream.readString();
  498. break;
  499. }
  500. continue;
  501. }
  502. var sequence = !!(b & 0x10);
  503. var dataSize = b & 15;
  504. assert(dataSize + 1 <= MAX_NUM_SIZE);
  505. var ucs2DataSize = 1;
  506. var subitemsCount = stream.readNumber();
  507. var i;
  508. switch (type) {
  509. case 0:
  510. stream.readHex(start, dataSize);
  511. stream.readHexNumber(end, dataSize);
  512. addHex(end, start, dataSize);
  513. cMap.addCodespaceRange(dataSize + 1, hexToInt(start, dataSize), hexToInt(end, dataSize));
  514. for (i = 1; i < subitemsCount; i++) {
  515. incHex(end, dataSize);
  516. stream.readHexNumber(start, dataSize);
  517. addHex(start, end, dataSize);
  518. stream.readHexNumber(end, dataSize);
  519. addHex(end, start, dataSize);
  520. cMap.addCodespaceRange(dataSize + 1, hexToInt(start, dataSize), hexToInt(end, dataSize));
  521. }
  522. break;
  523. case 1:
  524. stream.readHex(start, dataSize);
  525. stream.readHexNumber(end, dataSize);
  526. addHex(end, start, dataSize);
  527. code = stream.readNumber();
  528. for (i = 1; i < subitemsCount; i++) {
  529. incHex(end, dataSize);
  530. stream.readHexNumber(start, dataSize);
  531. addHex(start, end, dataSize);
  532. stream.readHexNumber(end, dataSize);
  533. addHex(end, start, dataSize);
  534. code = stream.readNumber();
  535. }
  536. break;
  537. case 2:
  538. stream.readHex(char, dataSize);
  539. code = stream.readNumber();
  540. cMap.mapOne(hexToInt(char, dataSize), code);
  541. for (i = 1; i < subitemsCount; i++) {
  542. incHex(char, dataSize);
  543. if (!sequence) {
  544. stream.readHexNumber(tmp, dataSize);
  545. addHex(char, tmp, dataSize);
  546. }
  547. code = stream.readSigned() + (code + 1);
  548. cMap.mapOne(hexToInt(char, dataSize), code);
  549. }
  550. break;
  551. case 3:
  552. stream.readHex(start, dataSize);
  553. stream.readHexNumber(end, dataSize);
  554. addHex(end, start, dataSize);
  555. code = stream.readNumber();
  556. cMap.mapCidRange(hexToInt(start, dataSize), hexToInt(end, dataSize), code);
  557. for (i = 1; i < subitemsCount; i++) {
  558. incHex(end, dataSize);
  559. if (!sequence) {
  560. stream.readHexNumber(start, dataSize);
  561. addHex(start, end, dataSize);
  562. } else {
  563. start.set(end);
  564. }
  565. stream.readHexNumber(end, dataSize);
  566. addHex(end, start, dataSize);
  567. code = stream.readNumber();
  568. cMap.mapCidRange(hexToInt(start, dataSize), hexToInt(end, dataSize), code);
  569. }
  570. break;
  571. case 4:
  572. stream.readHex(char, ucs2DataSize);
  573. stream.readHex(charCode, dataSize);
  574. cMap.mapOne(hexToInt(char, ucs2DataSize), hexToStr(charCode, dataSize));
  575. for (i = 1; i < subitemsCount; i++) {
  576. incHex(char, ucs2DataSize);
  577. if (!sequence) {
  578. stream.readHexNumber(tmp, ucs2DataSize);
  579. addHex(char, tmp, ucs2DataSize);
  580. }
  581. incHex(charCode, dataSize);
  582. stream.readHexSigned(tmp, dataSize);
  583. addHex(charCode, tmp, dataSize);
  584. cMap.mapOne(hexToInt(char, ucs2DataSize), hexToStr(charCode, dataSize));
  585. }
  586. break;
  587. case 5:
  588. stream.readHex(start, ucs2DataSize);
  589. stream.readHexNumber(end, ucs2DataSize);
  590. addHex(end, start, ucs2DataSize);
  591. stream.readHex(charCode, dataSize);
  592. cMap.mapBfRange(hexToInt(start, ucs2DataSize), hexToInt(end, ucs2DataSize), hexToStr(charCode, dataSize));
  593. for (i = 1; i < subitemsCount; i++) {
  594. incHex(end, ucs2DataSize);
  595. if (!sequence) {
  596. stream.readHexNumber(start, ucs2DataSize);
  597. addHex(start, end, ucs2DataSize);
  598. } else {
  599. start.set(end);
  600. }
  601. stream.readHexNumber(end, ucs2DataSize);
  602. addHex(end, start, ucs2DataSize);
  603. stream.readHex(charCode, dataSize);
  604. cMap.mapBfRange(hexToInt(start, ucs2DataSize), hexToInt(end, ucs2DataSize), hexToStr(charCode, dataSize));
  605. }
  606. break;
  607. default:
  608. reject(new Error('processBinaryCMap: Unknown type: ' + type));
  609. return;
  610. }
  611. }
  612. if (useCMap) {
  613. resolve(extend(useCMap));
  614. return;
  615. }
  616. resolve(cMap);
  617. });
  618. }
  619. function BinaryCMapReader() {
  620. }
  621. BinaryCMapReader.prototype = { process: processBinaryCMap };
  622. return BinaryCMapReader;
  623. }();
  624. var CMapFactory = function CMapFactoryClosure() {
  625. function strToInt(str) {
  626. var a = 0;
  627. for (var i = 0; i < str.length; i++) {
  628. a = a << 8 | str.charCodeAt(i);
  629. }
  630. return a >>> 0;
  631. }
  632. function expectString(obj) {
  633. if (!isString(obj)) {
  634. error('Malformed CMap: expected string.');
  635. }
  636. }
  637. function expectInt(obj) {
  638. if (!isInt(obj)) {
  639. error('Malformed CMap: expected int.');
  640. }
  641. }
  642. function parseBfChar(cMap, lexer) {
  643. while (true) {
  644. var obj = lexer.getObj();
  645. if (isEOF(obj)) {
  646. break;
  647. }
  648. if (isCmd(obj, 'endbfchar')) {
  649. return;
  650. }
  651. expectString(obj);
  652. var src = strToInt(obj);
  653. obj = lexer.getObj();
  654. expectString(obj);
  655. var dst = obj;
  656. cMap.mapOne(src, dst);
  657. }
  658. }
  659. function parseBfRange(cMap, lexer) {
  660. while (true) {
  661. var obj = lexer.getObj();
  662. if (isEOF(obj)) {
  663. break;
  664. }
  665. if (isCmd(obj, 'endbfrange')) {
  666. return;
  667. }
  668. expectString(obj);
  669. var low = strToInt(obj);
  670. obj = lexer.getObj();
  671. expectString(obj);
  672. var high = strToInt(obj);
  673. obj = lexer.getObj();
  674. if (isInt(obj) || isString(obj)) {
  675. var dstLow = isInt(obj) ? String.fromCharCode(obj) : obj;
  676. cMap.mapBfRange(low, high, dstLow);
  677. } else if (isCmd(obj, '[')) {
  678. obj = lexer.getObj();
  679. var array = [];
  680. while (!isCmd(obj, ']') && !isEOF(obj)) {
  681. array.push(obj);
  682. obj = lexer.getObj();
  683. }
  684. cMap.mapBfRangeToArray(low, high, array);
  685. } else {
  686. break;
  687. }
  688. }
  689. error('Invalid bf range.');
  690. }
  691. function parseCidChar(cMap, lexer) {
  692. while (true) {
  693. var obj = lexer.getObj();
  694. if (isEOF(obj)) {
  695. break;
  696. }
  697. if (isCmd(obj, 'endcidchar')) {
  698. return;
  699. }
  700. expectString(obj);
  701. var src = strToInt(obj);
  702. obj = lexer.getObj();
  703. expectInt(obj);
  704. var dst = obj;
  705. cMap.mapOne(src, dst);
  706. }
  707. }
  708. function parseCidRange(cMap, lexer) {
  709. while (true) {
  710. var obj = lexer.getObj();
  711. if (isEOF(obj)) {
  712. break;
  713. }
  714. if (isCmd(obj, 'endcidrange')) {
  715. return;
  716. }
  717. expectString(obj);
  718. var low = strToInt(obj);
  719. obj = lexer.getObj();
  720. expectString(obj);
  721. var high = strToInt(obj);
  722. obj = lexer.getObj();
  723. expectInt(obj);
  724. var dstLow = obj;
  725. cMap.mapCidRange(low, high, dstLow);
  726. }
  727. }
  728. function parseCodespaceRange(cMap, lexer) {
  729. while (true) {
  730. var obj = lexer.getObj();
  731. if (isEOF(obj)) {
  732. break;
  733. }
  734. if (isCmd(obj, 'endcodespacerange')) {
  735. return;
  736. }
  737. if (!isString(obj)) {
  738. break;
  739. }
  740. var low = strToInt(obj);
  741. obj = lexer.getObj();
  742. if (!isString(obj)) {
  743. break;
  744. }
  745. var high = strToInt(obj);
  746. cMap.addCodespaceRange(obj.length, low, high);
  747. }
  748. error('Invalid codespace range.');
  749. }
  750. function parseWMode(cMap, lexer) {
  751. var obj = lexer.getObj();
  752. if (isInt(obj)) {
  753. cMap.vertical = !!obj;
  754. }
  755. }
  756. function parseCMapName(cMap, lexer) {
  757. var obj = lexer.getObj();
  758. if (isName(obj) && isString(obj.name)) {
  759. cMap.name = obj.name;
  760. }
  761. }
  762. function parseCMap(cMap, lexer, fetchBuiltInCMap, useCMap) {
  763. var previous;
  764. var embededUseCMap;
  765. objLoop:
  766. while (true) {
  767. try {
  768. var obj = lexer.getObj();
  769. if (isEOF(obj)) {
  770. break;
  771. } else if (isName(obj)) {
  772. if (obj.name === 'WMode') {
  773. parseWMode(cMap, lexer);
  774. } else if (obj.name === 'CMapName') {
  775. parseCMapName(cMap, lexer);
  776. }
  777. previous = obj;
  778. } else if (isCmd(obj)) {
  779. switch (obj.cmd) {
  780. case 'endcmap':
  781. break objLoop;
  782. case 'usecmap':
  783. if (isName(previous)) {
  784. embededUseCMap = previous.name;
  785. }
  786. break;
  787. case 'begincodespacerange':
  788. parseCodespaceRange(cMap, lexer);
  789. break;
  790. case 'beginbfchar':
  791. parseBfChar(cMap, lexer);
  792. break;
  793. case 'begincidchar':
  794. parseCidChar(cMap, lexer);
  795. break;
  796. case 'beginbfrange':
  797. parseBfRange(cMap, lexer);
  798. break;
  799. case 'begincidrange':
  800. parseCidRange(cMap, lexer);
  801. break;
  802. }
  803. }
  804. } catch (ex) {
  805. if (ex instanceof MissingDataException) {
  806. throw ex;
  807. }
  808. warn('Invalid cMap data: ' + ex);
  809. continue;
  810. }
  811. }
  812. if (!useCMap && embededUseCMap) {
  813. useCMap = embededUseCMap;
  814. }
  815. if (useCMap) {
  816. return extendCMap(cMap, fetchBuiltInCMap, useCMap);
  817. }
  818. return Promise.resolve(cMap);
  819. }
  820. function extendCMap(cMap, fetchBuiltInCMap, useCMap) {
  821. return createBuiltInCMap(useCMap, fetchBuiltInCMap).then(function (newCMap) {
  822. cMap.useCMap = newCMap;
  823. if (cMap.numCodespaceRanges === 0) {
  824. var useCodespaceRanges = cMap.useCMap.codespaceRanges;
  825. for (var i = 0; i < useCodespaceRanges.length; i++) {
  826. cMap.codespaceRanges[i] = useCodespaceRanges[i].slice();
  827. }
  828. cMap.numCodespaceRanges = cMap.useCMap.numCodespaceRanges;
  829. }
  830. cMap.useCMap.forEach(function (key, value) {
  831. if (!cMap.contains(key)) {
  832. cMap.mapOne(key, cMap.useCMap.lookup(key));
  833. }
  834. });
  835. return cMap;
  836. });
  837. }
  838. function createBuiltInCMap(name, fetchBuiltInCMap) {
  839. if (name === 'Identity-H') {
  840. return Promise.resolve(new IdentityCMap(false, 2));
  841. } else if (name === 'Identity-V') {
  842. return Promise.resolve(new IdentityCMap(true, 2));
  843. }
  844. if (BUILT_IN_CMAPS.indexOf(name) === -1) {
  845. return Promise.reject(new Error('Unknown cMap name: ' + name));
  846. }
  847. assert(fetchBuiltInCMap, 'Built-in CMap parameters are not provided.');
  848. return fetchBuiltInCMap(name).then(function (data) {
  849. var cMapData = data.cMapData, compressionType = data.compressionType;
  850. var cMap = new CMap(true);
  851. if (compressionType === CMapCompressionType.BINARY) {
  852. return new BinaryCMapReader().process(cMapData, cMap, function (useCMap) {
  853. return extendCMap(cMap, fetchBuiltInCMap, useCMap);
  854. });
  855. }
  856. assert(compressionType === CMapCompressionType.NONE, 'TODO: Only BINARY/NONE CMap compression is currently supported.');
  857. var lexer = new Lexer(new Stream(cMapData));
  858. return parseCMap(cMap, lexer, fetchBuiltInCMap, null);
  859. });
  860. }
  861. return {
  862. create: function (params) {
  863. var encoding = params.encoding;
  864. var fetchBuiltInCMap = params.fetchBuiltInCMap;
  865. var useCMap = params.useCMap;
  866. if (isName(encoding)) {
  867. return createBuiltInCMap(encoding.name, fetchBuiltInCMap);
  868. } else if (isStream(encoding)) {
  869. var cMap = new CMap();
  870. var lexer = new Lexer(encoding);
  871. return parseCMap(cMap, lexer, fetchBuiltInCMap, useCMap).then(function (parsedCMap) {
  872. if (parsedCMap.isIdentityCMap) {
  873. return createBuiltInCMap(parsedCMap.name, fetchBuiltInCMap);
  874. }
  875. return parsedCMap;
  876. });
  877. }
  878. return Promise.reject(new Error('Encoding required.'));
  879. }
  880. };
  881. }();
  882. exports.CMap = CMap;
  883. exports.CMapFactory = CMapFactory;
  884. exports.IdentityCMap = IdentityCMap;