cmap.js 24 KB

12345678910111213141516171819202122232425262728293031323334353637383940414243444546474849505152535455565758596061626364656667686970717273747576777879808182838485868788899091929394959697989910010110210310410510610710810911011111211311411511611711811912012112212312412512612712812913013113213313413513613713813914014114214314414514614714814915015115215315415515615715815916016116216316416516616716816917017117217317417517617717817918018118218318418518618718818919019119219319419519619719819920020120220320420520620720820921021121221321421521621721821922022122222322422522622722822923023123223323423523623723823924024124224324424524624724824925025125225325425525625725825926026126226326426526626726826927027127227327427527627727827928028128228328428528628728828929029129229329429529629729829930030130230330430530630730830931031131231331431531631731831932032132232332432532632732832933033133233333433533633733833934034134234334434534634734834935035135235335435535635735835936036136236336436536636736836937037137237337437537637737837938038138238338438538638738838939039139239339439539639739839940040140240340440540640740840941041141241341441541641741841942042142242342442542642742842943043143243343443543643743843944044144244344444544644744844945045145245345445545645745845946046146246346446546646746846947047147247347447547647747847948048148248348448548648748848949049149249349449549649749849950050150250350450550650750850951051151251351451551651751851952052152252352452552652752852953053153253353453553653753853954054154254354454554654754854955055155255355455555655755855956056156256356456556656756856957057157257357457557657757857958058158258358458558658758858959059159259359459559659759859960060160260360460560660760860961061161261361461561661761861962062162262362462562662762862963063163263363463563663763863964064164264364464564664764864965065165265365465565665765865966066166266366466566666766866967067167267367467567667767867968068168268368468568668768868969069169269369469569669769869970070170270
3704705706707708709710711712713714715716717718719720721722723724725726727728729730731732733734735
  1. /**
  2. * @licstart The following is the entire license notice for the
  3. * JavaScript code in this page
  4. *
  5. * Copyright 2022 Mozilla Foundation
  6. *
  7. * Licensed under the Apache License, Version 2.0 (the "License");
  8. * you may not use this file except in compliance with the License.
  9. * You may obtain a copy of the License at
  10. *
  11. * http://www.apache.org/licenses/LICENSE-2.0
  12. *
  13. * Unless required by applicable law or agreed to in writing, software
  14. * distributed under the License is distributed on an "AS IS" BASIS,
  15. * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
  16. * See the License for the specific language governing permissions and
  17. * limitations under the License.
  18. *
  19. * @licend The above is the entire license notice for the
  20. * JavaScript code in this page
  21. */
  22. "use strict";
  23. Object.defineProperty(exports, "__esModule", {
  24. value: true
  25. });
  26. exports.IdentityCMap = exports.CMapFactory = exports.CMap = void 0;
  27. var _util = require("../shared/util.js");
  28. var _primitives = require("./primitives.js");
  29. var _base_stream = require("./base_stream.js");
  30. var _parser = require("./parser.js");
  31. var _core_utils = require("./core_utils.js");
  32. var _stream = require("./stream.js");
  // Names of the predefined CMaps that createBuiltInCMap is willing to fetch.
  // "Identity-H" and "Identity-V" are handled separately there; any other name
  // missing from this list is rejected with an "Unknown CMap name" error.
  33. const BUILT_IN_CMAPS = ["Adobe-GB1-UCS2", "Adobe-CNS1-UCS2", "Adobe-Japan1-UCS2", "Adobe-Korea1-UCS2", "78-EUC-H", "78-EUC-V", "78-H", "78-RKSJ-H", "78-RKSJ-V", "78-V", "78ms-RKSJ-H", "78ms-RKSJ-V", "83pv-RKSJ-H", "90ms-RKSJ-H", "90ms-RKSJ-V", "90msp-RKSJ-H", "90msp-RKSJ-V", "90pv-RKSJ-H", "90pv-RKSJ-V", "Add-H", "Add-RKSJ-H", "Add-RKSJ-V", "Add-V", "Adobe-CNS1-0", "Adobe-CNS1-1", "Adobe-CNS1-2", "Adobe-CNS1-3", "Adobe-CNS1-4", "Adobe-CNS1-5", "Adobe-CNS1-6", "Adobe-GB1-0", "Adobe-GB1-1", "Adobe-GB1-2", "Adobe-GB1-3", "Adobe-GB1-4", "Adobe-GB1-5", "Adobe-Japan1-0", "Adobe-Japan1-1", "Adobe-Japan1-2", "Adobe-Japan1-3", "Adobe-Japan1-4", "Adobe-Japan1-5", "Adobe-Japan1-6", "Adobe-Korea1-0", "Adobe-Korea1-1", "Adobe-Korea1-2", "B5-H", "B5-V", "B5pc-H", "B5pc-V", "CNS-EUC-H", "CNS-EUC-V", "CNS1-H", "CNS1-V", "CNS2-H", "CNS2-V", "ETHK-B5-H", "ETHK-B5-V", "ETen-B5-H", "ETen-B5-V", "ETenms-B5-H", "ETenms-B5-V", "EUC-H", "EUC-V", "Ext-H", "Ext-RKSJ-H", "Ext-RKSJ-V", "Ext-V", "GB-EUC-H", "GB-EUC-V", "GB-H", "GB-V", "GBK-EUC-H", "GBK-EUC-V", "GBK2K-H", "GBK2K-V", "GBKp-EUC-H", "GBKp-EUC-V", "GBT-EUC-H", "GBT-EUC-V", "GBT-H", "GBT-V", "GBTpc-EUC-H", "GBTpc-EUC-V", "GBpc-EUC-H", "GBpc-EUC-V", "H", "HKdla-B5-H", "HKdla-B5-V", "HKdlb-B5-H", "HKdlb-B5-V", "HKgccs-B5-H", "HKgccs-B5-V", "HKm314-B5-H", "HKm314-B5-V", "HKm471-B5-H", "HKm471-B5-V", "HKscs-B5-H", "HKscs-B5-V", "Hankaku", "Hiragana", "KSC-EUC-H", "KSC-EUC-V", "KSC-H", "KSC-Johab-H", "KSC-Johab-V", "KSC-V", "KSCms-UHC-H", "KSCms-UHC-HW-H", "KSCms-UHC-HW-V", "KSCms-UHC-V", "KSCpc-EUC-H", "KSCpc-EUC-V", "Katakana", "NWP-H", "NWP-V", "RKSJ-H", "RKSJ-V", "Roman", "UniCNS-UCS2-H", "UniCNS-UCS2-V", "UniCNS-UTF16-H", "UniCNS-UTF16-V", "UniCNS-UTF32-H", "UniCNS-UTF32-V", "UniCNS-UTF8-H", "UniCNS-UTF8-V", "UniGB-UCS2-H", "UniGB-UCS2-V", "UniGB-UTF16-H", "UniGB-UTF16-V", "UniGB-UTF32-H", "UniGB-UTF32-V", "UniGB-UTF8-H", "UniGB-UTF8-V", "UniJIS-UCS2-H", "UniJIS-UCS2-HW-H", "UniJIS-UCS2-HW-V", "UniJIS-UCS2-V", 
"UniJIS-UTF16-H", "UniJIS-UTF16-V", "UniJIS-UTF32-H", "UniJIS-UTF32-V", "UniJIS-UTF8-H", "UniJIS-UTF8-V", "UniJIS2004-UTF16-H", "UniJIS2004-UTF16-V", "UniJIS2004-UTF32-H", "UniJIS2004-UTF32-V", "UniJIS2004-UTF8-H", "UniJIS2004-UTF8-V", "UniJISPro-UCS2-HW-V", "UniJISPro-UCS2-V", "UniJISPro-UTF8-V", "UniJISX0213-UTF32-H", "UniJISX0213-UTF32-V", "UniJISX02132004-UTF32-H", "UniJISX02132004-UTF32-V", "UniKS-UCS2-H", "UniKS-UCS2-V", "UniKS-UTF16-H", "UniKS-UTF16-V", "UniKS-UTF32-H", "UniKS-UTF32-V", "UniKS-UTF8-H", "UniKS-UTF8-V", "V", "WP-Symbol"];
  // Widest span (high - low) that a single range mapping may cover; the range
  // mapping methods of CMap throw when a range exceeds it.
  const MAX_MAP_RANGE = 2 ** 24 - 1;

  /**
   * Mapping from character codes to destination values (numbers or strings,
   * depending on which map* method stored them), together with the codespace
   * ranges used to split a string into character codes.
   */
  class CMap {
    /**
     * @param {boolean} [builtInCMap] - Stored unchanged on the instance.
     */
    constructor(builtInCMap = false) {
      // codespaceRanges[n - 1] is a flat [low, high, low, high, ...] list for
      // codes that are n characters long.
      this.codespaceRanges = [[], [], [], []];
      this.numCodespaceRanges = 0;
      // Sparse array indexed by character code.
      this._map = [];
      this.name = "";
      this.vertical = false;
      this.useCMap = null;
      this.builtInCMap = builtInCMap;
    }

    /**
     * Register the inclusive range [low, high] for codes of `n` characters.
     */
    addCodespaceRange(n, low, high) {
      this.codespaceRanges[n - 1].push(low, high);
      this.numCodespaceRanges++;
    }

    /**
     * Map the codes low..high to the consecutive numbers dstLow, dstLow + 1, ...
     * @throws {Error} When high - low exceeds MAX_MAP_RANGE.
     */
    mapCidRange(low, high, dstLow) {
      if (high - low > MAX_MAP_RANGE) {
        throw new Error("mapCidRange - ignoring data above MAX_MAP_RANGE.");
      }
      while (low <= high) {
        this._map[low++] = dstLow++;
      }
    }

    /**
     * Map the codes low..high to consecutive strings starting at `dstLow`.
     * Each step increments the last character of the string; once that would
     * pass 0xff, the preceding character is incremented instead and the last
     * character restarts at "\x00".
     * @throws {Error} When high - low exceeds MAX_MAP_RANGE.
     */
    mapBfRange(low, high, dstLow) {
      if (high - low > MAX_MAP_RANGE) {
        throw new Error("mapBfRange - ignoring data above MAX_MAP_RANGE.");
      }
      const lastByte = dstLow.length - 1;
      while (low <= high) {
        this._map[low++] = dstLow;
        const nextCharCode = dstLow.charCodeAt(lastByte) + 1;
        if (nextCharCode > 0xff) {
          // Carry into the second-to-last character.
          dstLow =
            dstLow.substring(0, lastByte - 1) +
            String.fromCharCode(dstLow.charCodeAt(lastByte - 1) + 1) +
            "\x00";
          continue;
        }
        dstLow = dstLow.substring(0, lastByte) + String.fromCharCode(nextCharCode);
      }
    }

    /**
     * Map the codes low..high to the entries of `array`, in order; stops at
     * whichever of the range or the array ends first.
     * @throws {Error} When high - low exceeds MAX_MAP_RANGE.
     */
    mapBfRangeToArray(low, high, array) {
      if (high - low > MAX_MAP_RANGE) {
        throw new Error("mapBfRangeToArray - ignoring data above MAX_MAP_RANGE.");
      }
      const ii = array.length;
      let i = 0;
      while (low <= high && i < ii) {
        this._map[low] = array[i++];
        ++low;
      }
    }

    /** Map the single code `src` to `dst`. */
    mapOne(src, dst) {
      this._map[src] = dst;
    }

    /** @returns The value stored for `code`, or undefined when unmapped. */
    lookup(code) {
      return this._map[code];
    }

    /** @returns {boolean} Whether a value is stored for `code`. */
    contains(code) {
      return this._map[code] !== undefined;
    }

    /**
     * Invoke `callback(code, value)` for every mapped code. `code` is always
     * passed as a number.
     */
    forEach(callback) {
      const map = this._map;
      const length = map.length;
      if (length <= 0x10000) {
        for (let i = 0; i < length; i++) {
          if (map[i] !== undefined) {
            callback(i, map[i]);
          }
        }
        return;
      }
      // Large maps are walked with for..in so that only the present entries
      // are visited. for..in yields string keys, so convert them back to an
      // unsigned 32-bit number to match what the dense path passes.
      for (const key in map) {
        callback(key >>> 0, map[key]);
      }
    }

    /**
     * @returns {number} The first code mapped to `value`, or -1 when none is.
     */
    charCodeOf(value) {
      const map = this._map;
      if (map.length <= 0x10000) {
        return map.indexOf(value);
      }
      for (const charCode in map) {
        if (map[charCode] === value) {
          // `>>> 0` rather than `| 0`: codes at or above 2 ** 31 must not
          // wrap around to negative numbers.
          return charCode >>> 0;
        }
      }
      return -1;
    }

    /** @returns {Array} The underlying code-indexed array (not a copy). */
    getMap() {
      return this._map;
    }

    /**
     * Read one character code from `str` starting at `offset`, trying 1, 2,
     * 3 and then 4 characters until the accumulated value falls inside a
     * codespace range of that length. Writes `out.charcode` and `out.length`;
     * when nothing matches they are set to 0 and 1.
     */
    readCharCode(str, offset, out) {
      let c = 0;
      const codespaceRanges = this.codespaceRanges;
      for (let n = 0, nn = codespaceRanges.length; n < nn; n++) {
        c = ((c << 8) | str.charCodeAt(offset + n)) >>> 0;
        const codespaceRange = codespaceRanges[n];
        for (let k = 0, kk = codespaceRange.length; k < kk; ) {
          const low = codespaceRange[k++];
          const high = codespaceRange[k++];
          if (c >= low && c <= high) {
            out.charcode = c;
            out.length = n + 1;
            return;
          }
        }
      }
      out.charcode = 0;
      out.length = 1;
    }

    /**
     * @returns {number} The length (in characters) of the first codespace
     *   range containing `charCode`, or 1 when no range contains it.
     */
    getCharCodeLength(charCode) {
      const codespaceRanges = this.codespaceRanges;
      for (let n = 0, nn = codespaceRanges.length; n < nn; n++) {
        const codespaceRange = codespaceRanges[n];
        for (let k = 0, kk = codespaceRange.length; k < kk; ) {
          const low = codespaceRange[k++];
          const high = codespaceRange[k++];
          if (charCode >= low && charCode <= high) {
            return n + 1;
          }
        }
      }
      return 1;
    }

    /** Length of the underlying array (highest array-index code + 1). */
    get length() {
      return this._map.length;
    }

    /**
     * True only when the map is named "Identity-H" or "Identity-V" and maps
     * every code in 0..0xffff to itself, with nothing beyond 0xffff.
     */
    get isIdentityCMap() {
      if (!(this.name === "Identity-H" || this.name === "Identity-V")) {
        return false;
      }
      if (this._map.length !== 0x10000) {
        return false;
      }
      for (let i = 0; i < 0x10000; i++) {
        if (this._map[i] !== i) {
          return false;
        }
      }
      return true;
    }
  }
  173. exports.CMap = CMap;
  /**
   * CMap in which every integer code up to 0xffff maps to itself. Nothing is
   * stored; answers are computed on demand, and every mutating map* method is
   * routed to `unreachable`.
   */
  class IdentityCMap extends CMap {
    /**
     * @param {boolean} vertical - Stored on the instance as `vertical`.
     * @param {number} n - Code length (in characters) of the single
     *   0..0xffff codespace range that gets registered.
     */
    constructor(vertical, n) {
      super();
      this.vertical = vertical;
      this.addCodespaceRange(n, 0, 0xffff);
    }

    mapCidRange(low, high, dstLow) {
      (0, _util.unreachable)("should not call mapCidRange");
    }

    mapBfRange(low, high, dstLow) {
      (0, _util.unreachable)("should not call mapBfRange");
    }

    mapBfRangeToArray(low, high, array) {
      (0, _util.unreachable)("should not call mapBfRangeToArray");
    }

    mapOne(src, dst) {
      (0, _util.unreachable)("should not call mapCidOne");
    }

    /** @returns `code` itself when it is an integer <= 0xffff, else undefined. */
    lookup(code) {
      if (Number.isInteger(code) && code <= 0xffff) {
        return code;
      }
      return undefined;
    }

    /** @returns {boolean} Whether `code` is an integer <= 0xffff. */
    contains(code) {
      if (!Number.isInteger(code)) {
        return false;
      }
      return code <= 0xffff;
    }

    /** Calls `callback(code, code)` for each code from 0 through 0xffff. */
    forEach(callback) {
      let code = 0;
      while (code < 0x10000) {
        callback(code, code);
        code++;
      }
    }

    /** @returns `value` itself when it is an integer <= 0xffff, else -1. */
    charCodeOf(value) {
      if (Number.isInteger(value) && value <= 0xffff) {
        return value;
      }
      return -1;
    }

    /** @returns {Array<number>} A fresh 0x10000-entry array with map[i] === i. */
    getMap() {
      return Array.from({ length: 0x10000 }, (_unused, index) => index);
    }

    get length() {
      return 0x10000;
    }

    get isIdentityCMap() {
      (0, _util.unreachable)("should not access .isIdentityCMap");
    }
  }
  220. exports.IdentityCMap = IdentityCMap;
  221. const BinaryCMapReader = function BinaryCMapReaderClosure() {
  /**
   * Combine the bytes a[0]..a[size] (most significant first) into one
   * unsigned 32-bit integer.
   */
  function hexToInt(a, size) {
    let value = 0;
    let index = 0;
    while (index <= size) {
      value = (value << 8) | a[index];
      index += 1;
    }
    return value >>> 0;
  }
  /**
   * Build a string whose character codes are the bytes a[0]..a[size].
   * The 2-byte and 4-byte cases are spelled out explicitly; every other size
   * goes through `subarray`.
   */
  function hexToStr(a, size) {
    switch (size) {
      case 1:
        return String.fromCharCode(a[0], a[1]);
      case 3:
        return String.fromCharCode(a[0], a[1], a[2], a[3]);
      default:
        return String.fromCharCode(...a.subarray(0, size + 1));
    }
  }
  /**
   * Add the big-endian number in b[0..size] to the one in a[0..size], in
   * place in `a`. A carry out of the most significant byte is dropped.
   */
  function addHex(a, b, size) {
    let carry = 0;
    let index = size;
    while (index >= 0) {
      const sum = carry + a[index] + b[index];
      a[index] = sum & 255;
      carry = sum >> 8;
      index--;
    }
  }
  /**
   * Increment the big-endian number in a[0..size] by one, in place. Stops as
   * soon as there is no carry left to propagate.
   */
  function incHex(a, size) {
    let carry = 1;
    for (let index = size; index >= 0; index--) {
      if (carry <= 0) {
        break;
      }
      const sum = carry + a[index];
      a[index] = sum & 255;
      carry = sum >> 8;
    }
  }
  // Size, in bytes, of the scratch buffers used for decoded numbers.
  const MAX_NUM_SIZE = 16;
  // Size, in bytes, of the scratch buffer that holds the 7-bit groups of one
  // encoded number before they are repacked into 8-bit bytes.
  const MAX_ENCODED_NUM_SIZE = 19;

  /**
   * Cursor over a byte array that decodes the primitive values used by the
   * binary CMap format.
   */
  class BinaryCMapStream {
    /**
     * @param {Uint8Array} data - Bytes to read from; `subarray` is called on it.
     */
    constructor(data) {
      this.buffer = data;
      this.pos = 0;
      this.end = data.length;
      this.tmpBuf = new Uint8Array(MAX_ENCODED_NUM_SIZE);
    }

    /** @returns {number} The next byte, or -1 once the end has been reached. */
    readByte() {
      if (this.pos >= this.end) {
        return -1;
      }
      return this.buffer[this.pos++];
    }

    /**
     * Read a variable-length number: each byte contributes its low 7 bits,
     * most significant group first, and a set high bit means more bytes follow.
     * @throws {FormatError} When the data ends in the middle of a number.
     */
    readNumber() {
      let n = 0;
      let last;
      do {
        const b = this.readByte();
        if (b < 0) {
          throw new _util.FormatError("unexpected EOF in bcmap");
        }
        last = !(b & 0x80);
        n = (n << 7) | (b & 0x7f);
      } while (!last);
      return n;
    }

    /**
     * Read a variable-length number whose lowest bit is a sign flag: an even
     * n decodes to n >>> 1, an odd n to ~(n >>> 1).
     */
    readSigned() {
      const n = this.readNumber();
      return n & 1 ? ~(n >>> 1) : n >>> 1;
    }

    /** Copy the next size + 1 raw bytes into num[0..size] and skip past them. */
    readHex(num, size) {
      num.set(this.buffer.subarray(this.pos, this.pos + size + 1));
      this.pos += size + 1;
    }

    /**
     * Read a variable-length number and store it big-endian in num[0..size],
     * zero-filling the leading bytes.
     * @throws {FormatError} When the data ends in the middle of a number.
     */
    readHexNumber(num, size) {
      let last;
      const stack = this.tmpBuf;
      let sp = 0;
      do {
        const b = this.readByte();
        if (b < 0) {
          throw new _util.FormatError("unexpected EOF in bcmap");
        }
        last = !(b & 0x80);
        stack[sp++] = b & 0x7f;
      } while (!last);
      let i = size;
      let buffer = 0;
      let bufferSize = 0;
      while (i >= 0) {
        // Pull 7-bit groups (least significant first) until a full byte is
        // available or the stack is drained. The drain test has to look at
        // `sp`: `stack` is a fixed-size typed array, so its length never
        // shrinks and cannot signal exhaustion.
        while (bufferSize < 8 && sp > 0) {
          buffer |= stack[--sp] << bufferSize;
          bufferSize += 7;
        }
        num[i] = buffer & 255;
        i--;
        buffer >>= 8;
        bufferSize -= 8;
      }
    }

    /**
     * Like readHexNumber, but the lowest bit of the encoded value is a sign
     * flag: the value is shifted right by one bit across all bytes and, when
     * the flag was set, every resulting byte is inverted.
     */
    readHexSigned(num, size) {
      this.readHexNumber(num, size);
      const sign = num[size] & 1 ? 255 : 0;
      let c = 0;
      for (let i = 0; i <= size; i++) {
        // Carry the bit shifted out of the previous byte into this one.
        c = ((c & 1) << 8) | num[i];
        num[i] = (c >> 1) ^ sign;
      }
    }

    /**
     * Read a length-prefixed string: a number giving the character count,
     * followed by that many numbers, one character code each.
     */
    readString() {
      const len = this.readNumber();
      let s = "";
      for (let i = 0; i < len; i++) {
        s += String.fromCharCode(this.readNumber());
      }
      return s;
    }
  }
  // Decoder for binary CMap data: walks the records found in a byte array and
  // applies them to a CMap object.
  334. class BinaryCMapReader {
  /**
   * Decode `data` into `cMap`.
   *
   * @param data - Byte array handed to BinaryCMapStream.
   * @param cMap - Receives `vertical`, codespace ranges and mappings through
   *   addCodespaceRange / mapOne / mapCidRange / mapBfRange.
   * @param extend - Called with the referenced CMap name when the data names
   *   one (metadata record 1); its result is returned.
   * @returns The result of `extend(name)` when a CMap name was read,
   *   otherwise `cMap`.
   * @throws {Error} On an out-of-range dataSize or an unknown record type.
   */
  335. async process(data, cMap, extend) {
  336. const stream = new BinaryCMapStream(data);
  // The first byte is a header; its lowest bit is the vertical flag.
  337. const header = stream.readByte();
  338. cMap.vertical = !!(header & 1);
  339. let useCMap = null;
  // Scratch buffers holding big-endian values; they are reused across records.
  340. const start = new Uint8Array(MAX_NUM_SIZE);
  341. const end = new Uint8Array(MAX_NUM_SIZE);
  342. const char = new Uint8Array(MAX_NUM_SIZE);
  343. const charCode = new Uint8Array(MAX_NUM_SIZE);
  344. const tmp = new Uint8Array(MAX_NUM_SIZE);
  345. let code;
  346. let b;
  // Each record starts with one byte: the top 3 bits select the record type.
  347. while ((b = stream.readByte()) >= 0) {
  348. const type = b >> 5;
  // Type 7 is metadata, selected by the low 5 bits: for 0 a string is read
  // and discarded, for 1 the string names the CMap to extend from.
  349. if (type === 7) {
  350. switch (b & 0x1f) {
  351. case 0:
  352. stream.readString();
  353. break;
  354. case 1:
  355. useCMap = stream.readString();
  356. break;
  357. }
  358. continue;
  359. }
  // Bit 0x10: when set, items after the first do not carry a start delta;
  // each one begins right after the previous item.
  360. const sequence = !!(b & 0x10);
  // Low 4 bits: value size in bytes, minus one. Since this is at most 15,
  // the guard below cannot trigger while MAX_NUM_SIZE is 16.
  361. const dataSize = b & 15;
  362. if (dataSize + 1 > MAX_NUM_SIZE) {
  363. throw new Error("BinaryCMapReader.process: Invalid dataSize.");
  364. }
  // Source codes of record types 4 and 5 are always two bytes wide.
  365. const ucs2DataSize = 1;
  366. const subitemsCount = stream.readNumber();
  367. switch (type) {
  // Type 0: codespace ranges. The first start is stored raw; every end is a
  // delta from its start, and later starts are deltas from previous end + 1.
  368. case 0:
  369. stream.readHex(start, dataSize);
  370. stream.readHexNumber(end, dataSize);
  371. addHex(end, start, dataSize);
  372. cMap.addCodespaceRange(dataSize + 1, hexToInt(start, dataSize), hexToInt(end, dataSize));
  373. for (let i = 1; i < subitemsCount; i++) {
  374. incHex(end, dataSize);
  375. stream.readHexNumber(start, dataSize);
  376. addHex(start, end, dataSize);
  377. stream.readHexNumber(end, dataSize);
  378. addHex(end, start, dataSize);
  379. cMap.addCodespaceRange(dataSize + 1, hexToInt(start, dataSize), hexToInt(end, dataSize));
  380. }
  381. break;
  // Type 1: ranges with an attached number. They are decoded only to advance
  // the stream; nothing is stored on cMap.
  382. case 1:
  383. stream.readHex(start, dataSize);
  384. stream.readHexNumber(end, dataSize);
  385. addHex(end, start, dataSize);
  386. stream.readNumber();
  387. for (let i = 1; i < subitemsCount; i++) {
  388. incHex(end, dataSize);
  389. stream.readHexNumber(start, dataSize);
  390. addHex(start, end, dataSize);
  391. stream.readHexNumber(end, dataSize);
  392. addHex(end, start, dataSize);
  393. stream.readNumber();
  394. }
  395. break;
  // Type 2: single code -> number mappings. Later codes are deltas from the
  // previous code + 1; later numbers are signed deltas from previous + 1.
  396. case 2:
  397. stream.readHex(char, dataSize);
  398. code = stream.readNumber();
  399. cMap.mapOne(hexToInt(char, dataSize), code);
  400. for (let i = 1; i < subitemsCount; i++) {
  401. incHex(char, dataSize);
  402. if (!sequence) {
  403. stream.readHexNumber(tmp, dataSize);
  404. addHex(char, tmp, dataSize);
  405. }
  406. code = stream.readSigned() + (code + 1);
  407. cMap.mapOne(hexToInt(char, dataSize), code);
  408. }
  409. break;
  // Type 3: code range -> consecutive numbers (mapCidRange). The first number
  // of each range is read in full, not as a delta.
  410. case 3:
  411. stream.readHex(start, dataSize);
  412. stream.readHexNumber(end, dataSize);
  413. addHex(end, start, dataSize);
  414. code = stream.readNumber();
  415. cMap.mapCidRange(hexToInt(start, dataSize), hexToInt(end, dataSize), code);
  416. for (let i = 1; i < subitemsCount; i++) {
  417. incHex(end, dataSize);
  418. if (!sequence) {
  419. stream.readHexNumber(start, dataSize);
  420. addHex(start, end, dataSize);
  421. } else {
  422. start.set(end);
  423. }
  424. stream.readHexNumber(end, dataSize);
  425. addHex(end, start, dataSize);
  426. code = stream.readNumber();
  427. cMap.mapCidRange(hexToInt(start, dataSize), hexToInt(end, dataSize), code);
  428. }
  429. break;
  // Type 4: single two-byte code -> string mappings. Later strings are signed
  // deltas from the previous string + 1.
  430. case 4:
  431. stream.readHex(char, ucs2DataSize);
  432. stream.readHex(charCode, dataSize);
  433. cMap.mapOne(hexToInt(char, ucs2DataSize), hexToStr(charCode, dataSize));
  434. for (let i = 1; i < subitemsCount; i++) {
  435. incHex(char, ucs2DataSize);
  436. if (!sequence) {
  437. stream.readHexNumber(tmp, ucs2DataSize);
  438. addHex(char, tmp, ucs2DataSize);
  439. }
  440. incHex(charCode, dataSize);
  441. stream.readHexSigned(tmp, dataSize);
  442. addHex(charCode, tmp, dataSize);
  443. cMap.mapOne(hexToInt(char, ucs2DataSize), hexToStr(charCode, dataSize));
  444. }
  445. break;
  // Type 5: two-byte code range -> consecutive strings (mapBfRange). The first
  // string of each range is stored raw.
  446. case 5:
  447. stream.readHex(start, ucs2DataSize);
  448. stream.readHexNumber(end, ucs2DataSize);
  449. addHex(end, start, ucs2DataSize);
  450. stream.readHex(charCode, dataSize);
  451. cMap.mapBfRange(hexToInt(start, ucs2DataSize), hexToInt(end, ucs2DataSize), hexToStr(charCode, dataSize));
  452. for (let i = 1; i < subitemsCount; i++) {
  453. incHex(end, ucs2DataSize);
  454. if (!sequence) {
  455. stream.readHexNumber(start, ucs2DataSize);
  456. addHex(start, end, ucs2DataSize);
  457. } else {
  458. start.set(end);
  459. }
  460. stream.readHexNumber(end, ucs2DataSize);
  461. addHex(end, start, ucs2DataSize);
  462. stream.readHex(charCode, dataSize);
  463. cMap.mapBfRange(hexToInt(start, ucs2DataSize), hexToInt(end, ucs2DataSize), hexToStr(charCode, dataSize));
  464. }
  465. break;
  466. default:
  467. throw new Error(`BinaryCMapReader.process - unknown type: ${type}`);
  468. }
  469. }
  // A referenced CMap name hands control to the caller-supplied `extend`.
  470. if (useCMap) {
  471. return extend(useCMap);
  472. }
  473. return cMap;
  474. }
  475. }
  476. return BinaryCMapReader;
  477. }();
  478. const CMapFactory = function CMapFactoryClosure() {
  /**
   * Interpret the character codes of `str` as big-endian bytes and combine
   * them into one unsigned 32-bit integer. An empty string yields 0.
   */
  function strToInt(str) {
    let value = 0;
    let index = 0;
    while (index < str.length) {
      value = (value << 8) | str.charCodeAt(index);
      index += 1;
    }
    return value >>> 0;
  }
  /**
   * Assert that `obj` is a string.
   * @throws {FormatError} When it is anything else.
   */
  function expectString(obj) {
    if (typeof obj === "string") {
      return;
    }
    throw new _util.FormatError("Malformed CMap: expected string.");
  }
  /**
   * Assert that `obj` is an integer.
   * @throws {FormatError} When it is anything else.
   */
  function expectInt(obj) {
    if (Number.isInteger(obj)) {
      return;
    }
    throw new _util.FormatError("Malformed CMap: expected int.");
  }
  /**
   * Consume (source string, destination string) pairs from `lexer` until the
   * "endbfchar" command or EOF, registering each with cMap.mapOne. The source
   * is converted to an integer code; the destination is stored as a string.
   * A non-string token makes expectString throw.
   */
  function parseBfChar(cMap, lexer) {
    for (
      let token = lexer.getObj();
      token !== _primitives.EOF;
      token = lexer.getObj()
    ) {
      if ((0, _primitives.isCmd)(token, "endbfchar")) {
        return;
      }
      expectString(token);
      const srcCode = strToInt(token);
      const dstToken = lexer.getObj();
      expectString(dstToken);
      cMap.mapOne(srcCode, dstToken);
    }
  }
  /**
   * Consume (low string, high string, destination) triples from `lexer` until
   * the "endbfrange" command. The destination is either a string or integer
   * (forwarded to cMap.mapBfRange, integers being turned into a one-character
   * string first) or a "[" ... "]" list (forwarded to cMap.mapBfRangeToArray).
   *
   * @throws {FormatError} On EOF before "endbfrange", or when a destination is
   *   none of the accepted forms.
   */
  function parseBfRange(cMap, lexer) {
    for (;;) {
      const lowToken = lexer.getObj();
      if (lowToken === _primitives.EOF) {
        break;
      }
      if ((0, _primitives.isCmd)(lowToken, "endbfrange")) {
        return;
      }
      expectString(lowToken);
      const low = strToInt(lowToken);

      const highToken = lexer.getObj();
      expectString(highToken);
      const high = strToInt(highToken);

      const dstToken = lexer.getObj();
      if (Number.isInteger(dstToken)) {
        cMap.mapBfRange(low, high, String.fromCharCode(dstToken));
        continue;
      }
      if (typeof dstToken === "string") {
        cMap.mapBfRange(low, high, dstToken);
        continue;
      }
      if (!(0, _primitives.isCmd)(dstToken, "[")) {
        break;
      }

      // Collect everything up to the closing bracket (or EOF).
      const array = [];
      for (
        let item = lexer.getObj();
        !(0, _primitives.isCmd)(item, "]") && item !== _primitives.EOF;
        item = lexer.getObj()
      ) {
        array.push(item);
      }
      cMap.mapBfRangeToArray(low, high, array);
    }
    throw new _util.FormatError("Invalid bf range.");
  }
  /**
   * Consume (source string, integer) pairs from `lexer` until the
   * "endcidchar" command or EOF, registering each with cMap.mapOne. Tokens of
   * the wrong type make expectString / expectInt throw.
   */
  function parseCidChar(cMap, lexer) {
    for (
      let token = lexer.getObj();
      token !== _primitives.EOF;
      token = lexer.getObj()
    ) {
      if ((0, _primitives.isCmd)(token, "endcidchar")) {
        return;
      }
      expectString(token);
      const srcCode = strToInt(token);
      const cid = lexer.getObj();
      expectInt(cid);
      cMap.mapOne(srcCode, cid);
    }
  }
  /**
   * Consume (low string, high string, integer) triples from `lexer` until the
   * "endcidrange" command or EOF, registering each with cMap.mapCidRange.
   * Tokens of the wrong type make expectString / expectInt throw.
   */
  function parseCidRange(cMap, lexer) {
    for (
      let token = lexer.getObj();
      token !== _primitives.EOF;
      token = lexer.getObj()
    ) {
      if ((0, _primitives.isCmd)(token, "endcidrange")) {
        return;
      }
      expectString(token);
      const low = strToInt(token);

      const highToken = lexer.getObj();
      expectString(highToken);
      const high = strToInt(highToken);

      const firstCid = lexer.getObj();
      expectInt(firstCid);
      cMap.mapCidRange(low, high, firstCid);
    }
  }
  /**
   * Consume (low string, high string) pairs from `lexer` until the
   * "endcodespacerange" command, registering each with
   * cMap.addCodespaceRange; the code length is the length of the high string.
   *
   * @throws {FormatError} On EOF before "endcodespacerange" or on a token that
   *   is not a string.
   */
  function parseCodespaceRange(cMap, lexer) {
    for (;;) {
      const lowToken = lexer.getObj();
      if (lowToken === _primitives.EOF) {
        break;
      }
      if ((0, _primitives.isCmd)(lowToken, "endcodespacerange")) {
        return;
      }
      if (typeof lowToken !== "string") {
        break;
      }
      const low = strToInt(lowToken);

      const highToken = lexer.getObj();
      if (typeof highToken !== "string") {
        break;
      }
      cMap.addCodespaceRange(highToken.length, low, strToInt(highToken));
    }
    throw new _util.FormatError("Invalid codespace range.");
  }
  /**
   * Read the next token and, when it is an integer, set cMap.vertical to its
   * truthiness. Any other token leaves cMap untouched.
   */
  function parseWMode(cMap, lexer) {
    const wMode = lexer.getObj();
    if (!Number.isInteger(wMode)) {
      return;
    }
    cMap.vertical = Boolean(wMode);
  }
  /**
   * Read the next token and, when it is a Name, copy its `name` to cMap.name.
   * Any other token leaves cMap untouched.
   */
  function parseCMapName(cMap, lexer) {
    const token = lexer.getObj();
    if (!(token instanceof _primitives.Name)) {
      return;
    }
    cMap.name = token.name;
  }
  /**
   * Parse a textual CMap from `lexer` into `cMap`.
   *
   * Tokens are read until EOF or the "endcmap" command. Name tokens "WMode"
   * and "CMapName" trigger their dedicated parsers, "begin..." commands
   * delegate to the matching section parser, and "usecmap" records the most
   * recent Name token as the CMap to extend from. Any exception other than
   * MissingDataException is reported through `warn` and parsing carries on
   * with the next token.
   *
   * @param cMap - Object that receives the parsed data.
   * @param lexer - Token source; only `getObj()` is used.
   * @param fetchBuiltInCMap - Passed through to extendCMap.
   * @param useCMap - Name of a CMap to extend from; takes precedence over one
   *   named inside the data.
   * @returns The result of extendCMap when there is a CMap to extend from,
   *   otherwise `cMap`.
   */
  async function parseCMap(cMap, lexer, fetchBuiltInCMap, useCMap) {
    const sectionParsers = new Map([
      ["begincodespacerange", parseCodespaceRange],
      ["beginbfchar", parseBfChar],
      ["begincidchar", parseCidChar],
      ["beginbfrange", parseBfRange],
      ["begincidrange", parseCidRange],
    ]);
    let lastName;
    let embeddedName;
    let finished = false;

    while (!finished) {
      try {
        const token = lexer.getObj();
        if (token === _primitives.EOF) {
          finished = true;
        } else if (token instanceof _primitives.Name) {
          switch (token.name) {
            case "WMode":
              parseWMode(cMap, lexer);
              break;
            case "CMapName":
              parseCMapName(cMap, lexer);
              break;
          }
          lastName = token;
        } else if (token instanceof _primitives.Cmd) {
          const command = token.cmd;
          if (command === "endcmap") {
            finished = true;
          } else if (command === "usecmap") {
            if (lastName instanceof _primitives.Name) {
              embeddedName = lastName.name;
            }
          } else {
            const parseSection = sectionParsers.get(command);
            if (parseSection) {
              parseSection(cMap, lexer);
            }
          }
        }
      } catch (ex) {
        if (ex instanceof _core_utils.MissingDataException) {
          throw ex;
        }
        (0, _util.warn)("Invalid cMap data: " + ex);
      }
    }

    const baseName = useCMap || embeddedName;
    if (baseName) {
      return extendCMap(cMap, fetchBuiltInCMap, baseName);
    }
    return cMap;
  }
  /**
   * Load the CMap called `useCMap`, attach it as cMap.useCMap and merge it
   * into `cMap`: when cMap declares no codespace ranges it receives copies of
   * the loaded ones, and every code the loaded CMap maps but cMap does not is
   * copied over.
   *
   * @returns The same `cMap` object, after merging.
   */
  async function extendCMap(cMap, fetchBuiltInCMap, useCMap) {
    const base = await createBuiltInCMap(useCMap, fetchBuiltInCMap);
    cMap.useCMap = base;

    if (cMap.numCodespaceRanges === 0) {
      for (const [index, ranges] of base.codespaceRanges.entries()) {
        cMap.codespaceRanges[index] = ranges.slice();
      }
      cMap.numCodespaceRanges = base.numCodespaceRanges;
    }

    // Entries already present in cMap take precedence over the base CMap.
    base.forEach(key => {
      if (cMap.contains(key)) {
        return;
      }
      cMap.mapOne(key, base.lookup(key));
    });
    return cMap;
  }
  /**
   * Create the predefined CMap called `name`.
   *
   * "Identity-H" and "Identity-V" yield an IdentityCMap directly. Any other
   * name must appear in BUILT_IN_CMAPS; its data is obtained from
   * `fetchBuiltInCMap(name)` and decoded according to the returned
   * `compressionType`.
   *
   * @throws {Error} For an unknown name, a missing `fetchBuiltInCMap`, or an
   *   unsupported `compressionType`.
   */
  async function createBuiltInCMap(name, fetchBuiltInCMap) {
    switch (name) {
      case "Identity-H":
        return new IdentityCMap(false, 2);
      case "Identity-V":
        return new IdentityCMap(true, 2);
    }
    if (!BUILT_IN_CMAPS.includes(name)) {
      throw new Error("Unknown CMap name: " + name);
    }
    if (!fetchBuiltInCMap) {
      throw new Error("Built-in CMap parameters are not provided.");
    }

    const { cMapData, compressionType } = await fetchBuiltInCMap(name);
    const cMap = new CMap(true);

    switch (compressionType) {
      case _util.CMapCompressionType.BINARY: {
        const extend = baseName => extendCMap(cMap, fetchBuiltInCMap, baseName);
        return new BinaryCMapReader().process(cMapData, cMap, extend);
      }
      case _util.CMapCompressionType.NONE: {
        const lexer = new _parser.Lexer(new _stream.Stream(cMapData));
        return parseCMap(cMap, lexer, fetchBuiltInCMap, null);
      }
    }
    throw new Error(`Invalid CMap "compressionType" value: ${compressionType}`);
  }
  716. return {
  717. async create(params) {
  718. const encoding = params.encoding;
  719. const fetchBuiltInCMap = params.fetchBuiltInCMap;
  720. const useCMap = params.useCMap;
  721. if (encoding instanceof _primitives.Name) {
  722. return createBuiltInCMap(encoding.name, fetchBuiltInCMap);
  723. } else if (encoding instanceof _base_stream.BaseStream) {
  724. const parsedCMap = await parseCMap(new CMap(), new _parser.Lexer(encoding), fetchBuiltInCMap, useCMap);
  725. if (parsedCMap.isIdentityCMap) {
  726. return createBuiltInCMap(parsedCMap.name, fetchBuiltInCMap);
  727. }
  728. return parsedCMap;
  729. }
  730. throw new Error("Encoding required.");
  731. }
  732. };
  733. }();
  734. exports.CMapFactory = CMapFactory;