cmap.js 24 KB

12345678910111213141516171819202122232425262728293031323334353637383940414243444546474849505152535455565758596061626364656667686970717273747576777879808182838485868788899091929394959697989910010110210310410510610710810911011111211311411511611711811912012112212312412512612712812913013113213313413513613713813914014114214314414514614714814915015115215315415515615715815916016116216316416516616716816917017117217317417517617717817918018118218318418518618718818919019119219319419519619719819920020120220320420520620720820921021121221321421521621721821922022122222322422522622722822923023123223323423523623723823924024124224324424524624724824925025125225325425525625725825926026126226326426526626726826927027127227327427527627727827928028128228328428528628728828929029129229329429529629729829930030130230330430530630730830931031131231331431531631731831932032132232332432532632732832933033133233333433533633733833934034134234334434534634734834935035135235335435535635735835936036136236336436536636736836937037137237337437537637737837938038138238338438538638738838939039139239339439539639739839940040140240340440540640740840941041141241341441541641741841942042142242342442542642742842943043143243343443543643743843944044144244344444544644744844945045145245345445545645745845946046146246346446546646746846947047147247347447547647747847948048148248348448548648748848949049149249349449549649749849950050150250350450550650750850951051151251351451551651751851952052152252352452552652752852953053153253353453553653753853954054154254354454554654754854955055155255355455555655755855956056156256356456556656756856957057157257357457557657757857958058158258358458558658758858959059159259359459559659759859960060160260360460560660760860961061161261361461561661761861962062162262362462562662762862963063163263363463563663763863964064164264364464564664764864965065165265365465565665765865966066166266366466566666766866967067167267367467567667767867968068168268368468568668768868969069169269369469569669769869970070170270
3704705706707708709710711712713714715716717718719720721722723724725726727728729730731732733734735736737738739740741742743744745746747748749750751752753754755756757758759760761762763764765766767768769770771772773774775776777778779780781782783784785786787788789790791792793794795796797798799800801802803804805806807808809810811812813814815816817818819820821822823824825826827828829830831832833834835836837838839840841842843844845846847848849850851852853854855856857858859860861862863864865866867868869870871872873874875876877878879880881882883884885886887888889890891892893894895896897898899900901902903904905906907908909910911912913914915916917918919920921922923924925926927928929930931932933934935936937938939
  1. /**
  2. * @licstart The following is the entire license notice for the
  3. * Javascript code in this page
  4. *
  5. * Copyright 2021 Mozilla Foundation
  6. *
  7. * Licensed under the Apache License, Version 2.0 (the "License");
  8. * you may not use this file except in compliance with the License.
  9. * You may obtain a copy of the License at
  10. *
  11. * http://www.apache.org/licenses/LICENSE-2.0
  12. *
  13. * Unless required by applicable law or agreed to in writing, software
  14. * distributed under the License is distributed on an "AS IS" BASIS,
  15. * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
  16. * See the License for the specific language governing permissions and
  17. * limitations under the License.
  18. *
  19. * @licend The above is the entire license notice for the
  20. * Javascript code in this page
  21. */
  22. "use strict";
  23. Object.defineProperty(exports, "__esModule", {
  24. value: true
  25. });
  26. exports.IdentityCMap = exports.CMapFactory = exports.CMap = void 0;
  27. var _util = require("../shared/util.js");
  28. var _primitives = require("./primitives.js");
  29. var _parser = require("./parser.js");
  30. var _core_utils = require("./core_utils.js");
  31. var _stream = require("./stream.js");
  // Names of the predefined CMaps that `createBuiltInCMap` accepts. Any other
  // name (apart from the Identity-H / Identity-V special cases handled there)
  // is rejected with "Unknown CMap name".
  const BUILT_IN_CMAPS = [
    "Adobe-GB1-UCS2", "Adobe-CNS1-UCS2", "Adobe-Japan1-UCS2", "Adobe-Korea1-UCS2",
    "78-EUC-H", "78-EUC-V", "78-H", "78-RKSJ-H", "78-RKSJ-V", "78-V",
    "78ms-RKSJ-H", "78ms-RKSJ-V",
    "83pv-RKSJ-H",
    "90ms-RKSJ-H", "90ms-RKSJ-V", "90msp-RKSJ-H", "90msp-RKSJ-V",
    "90pv-RKSJ-H", "90pv-RKSJ-V",
    "Add-H", "Add-RKSJ-H", "Add-RKSJ-V", "Add-V",
    "Adobe-CNS1-0", "Adobe-CNS1-1", "Adobe-CNS1-2", "Adobe-CNS1-3",
    "Adobe-CNS1-4", "Adobe-CNS1-5", "Adobe-CNS1-6",
    "Adobe-GB1-0", "Adobe-GB1-1", "Adobe-GB1-2", "Adobe-GB1-3",
    "Adobe-GB1-4", "Adobe-GB1-5",
    "Adobe-Japan1-0", "Adobe-Japan1-1", "Adobe-Japan1-2", "Adobe-Japan1-3",
    "Adobe-Japan1-4", "Adobe-Japan1-5", "Adobe-Japan1-6",
    "Adobe-Korea1-0", "Adobe-Korea1-1", "Adobe-Korea1-2",
    "B5-H", "B5-V", "B5pc-H", "B5pc-V",
    "CNS-EUC-H", "CNS-EUC-V", "CNS1-H", "CNS1-V", "CNS2-H", "CNS2-V",
    "ETHK-B5-H", "ETHK-B5-V", "ETen-B5-H", "ETen-B5-V",
    "ETenms-B5-H", "ETenms-B5-V",
    "EUC-H", "EUC-V",
    "Ext-H", "Ext-RKSJ-H", "Ext-RKSJ-V", "Ext-V",
    "GB-EUC-H", "GB-EUC-V", "GB-H", "GB-V",
    "GBK-EUC-H", "GBK-EUC-V", "GBK2K-H", "GBK2K-V",
    "GBKp-EUC-H", "GBKp-EUC-V",
    "GBT-EUC-H", "GBT-EUC-V", "GBT-H", "GBT-V",
    "GBTpc-EUC-H", "GBTpc-EUC-V", "GBpc-EUC-H", "GBpc-EUC-V",
    "H",
    "HKdla-B5-H", "HKdla-B5-V", "HKdlb-B5-H", "HKdlb-B5-V",
    "HKgccs-B5-H", "HKgccs-B5-V", "HKm314-B5-H", "HKm314-B5-V",
    "HKm471-B5-H", "HKm471-B5-V", "HKscs-B5-H", "HKscs-B5-V",
    "Hankaku", "Hiragana",
    "KSC-EUC-H", "KSC-EUC-V", "KSC-H", "KSC-Johab-H", "KSC-Johab-V", "KSC-V",
    "KSCms-UHC-H", "KSCms-UHC-HW-H", "KSCms-UHC-HW-V", "KSCms-UHC-V",
    "KSCpc-EUC-H", "KSCpc-EUC-V",
    "Katakana",
    "NWP-H", "NWP-V",
    "RKSJ-H", "RKSJ-V",
    "Roman",
    "UniCNS-UCS2-H", "UniCNS-UCS2-V", "UniCNS-UTF16-H", "UniCNS-UTF16-V",
    "UniCNS-UTF32-H", "UniCNS-UTF32-V", "UniCNS-UTF8-H", "UniCNS-UTF8-V",
    "UniGB-UCS2-H", "UniGB-UCS2-V", "UniGB-UTF16-H", "UniGB-UTF16-V",
    "UniGB-UTF32-H", "UniGB-UTF32-V", "UniGB-UTF8-H", "UniGB-UTF8-V",
    "UniJIS-UCS2-H", "UniJIS-UCS2-HW-H", "UniJIS-UCS2-HW-V", "UniJIS-UCS2-V",
    "UniJIS-UTF16-H", "UniJIS-UTF16-V", "UniJIS-UTF32-H", "UniJIS-UTF32-V",
    "UniJIS-UTF8-H", "UniJIS-UTF8-V",
    "UniJIS2004-UTF16-H", "UniJIS2004-UTF16-V",
    "UniJIS2004-UTF32-H", "UniJIS2004-UTF32-V",
    "UniJIS2004-UTF8-H", "UniJIS2004-UTF8-V",
    "UniJISPro-UCS2-HW-V", "UniJISPro-UCS2-V", "UniJISPro-UTF8-V",
    "UniJISX0213-UTF32-H", "UniJISX0213-UTF32-V",
    "UniJISX02132004-UTF32-H", "UniJISX02132004-UTF32-V",
    "UniKS-UCS2-H", "UniKS-UCS2-V", "UniKS-UTF16-H", "UniKS-UTF16-V",
    "UniKS-UTF32-H", "UniKS-UTF32-V", "UniKS-UTF8-H", "UniKS-UTF8-V",
    "V",
    "WP-Symbol",
  ];

  // Widest (high - low) span the CMap map*Range methods accept: 2^24 - 1.
  const MAX_MAP_RANGE = 0xffffff;
  /**
   * Character-code map. Associates character codes with the values stored
   * through the map* methods (integers for the cid* entries, strings for the
   * bf* entries) and keeps the codespace ranges used to split a byte string
   * into character codes.
   */
  class CMap {
    /**
     * @param {boolean} [builtInCMap] - Stored verbatim on the instance.
     */
    constructor(builtInCMap = false) {
      // codespaceRanges[n - 1] is a flat [low, high, low, high, ...] list of
      // the ranges whose codes are n bytes long (n = 1..4).
      this.codespaceRanges = [[], [], [], []];
      this.numCodespaceRanges = 0;
      // Sparse array indexed by character code.
      this._map = [];
      this.name = "";
      this.vertical = false;
      this.useCMap = null;
      this.builtInCMap = builtInCMap;
    }

    /**
     * Registers the inclusive range [low, high] for codes that are `n` bytes
     * long.
     * @param {number} n - Code length in bytes; indexes `codespaceRanges[n - 1]`.
     * @param {number} low
     * @param {number} high
     */
    addCodespaceRange(n, low, high) {
      this.codespaceRanges[n - 1].push(low, high);
      this.numCodespaceRanges++;
    }

    /**
     * Maps low..high (inclusive) to dstLow, dstLow + 1, ...
     * @throws {Error} When the span exceeds MAX_MAP_RANGE.
     */
    mapCidRange(low, high, dstLow) {
      if (high - low > MAX_MAP_RANGE) {
        throw new Error("mapCidRange - ignoring data above MAX_MAP_RANGE.");
      }
      while (low <= high) {
        this._map[low++] = dstLow++;
      }
    }

    /**
     * Maps low..high (inclusive) to successive strings, starting at `dstLow`
     * and incrementing its last character for every step.
     * @throws {Error} When the span exceeds MAX_MAP_RANGE.
     */
    mapBfRange(low, high, dstLow) {
      if (high - low > MAX_MAP_RANGE) {
        throw new Error("mapBfRange - ignoring data above MAX_MAP_RANGE.");
      }
      const lastByte = dstLow.length - 1;
      while (low <= high) {
        this._map[low++] = dstLow;
        // Normally only the last character has to be incremented.
        const nextCharCode = dstLow.charCodeAt(lastByte) + 1;
        if (nextCharCode > 0xff) {
          // Carry into the preceding character and reset the last one.
          // NOTE(review): the carry is propagated by one position only, and a
          // one-character `dstLow` has no preceding character to carry into.
          dstLow =
            dstLow.substring(0, lastByte - 1) +
            String.fromCharCode(dstLow.charCodeAt(lastByte - 1) + 1) +
            "\x00";
          continue;
        }
        dstLow =
          dstLow.substring(0, lastByte) + String.fromCharCode(nextCharCode);
      }
    }

    /**
     * Maps low, low + 1, ... to array[0], array[1], ... and stops at `high` or
     * at the end of `array`, whichever comes first.
     * @throws {Error} When the span exceeds MAX_MAP_RANGE.
     */
    mapBfRangeToArray(low, high, array) {
      if (high - low > MAX_MAP_RANGE) {
        throw new Error("mapBfRangeToArray - ignoring data above MAX_MAP_RANGE.");
      }
      const ii = array.length;
      let i = 0;
      while (low <= high && i < ii) {
        this._map[low] = array[i++];
        ++low;
      }
    }

    /** Stores a single src -> dst entry. */
    mapOne(src, dst) {
      this._map[src] = dst;
    }

    /** @returns the value stored for `code`, or `undefined`. */
    lookup(code) {
      return this._map[code];
    }

    /** @returns {boolean} Whether a value is stored for `code`. */
    contains(code) {
      return this._map[code] !== undefined;
    }

    /**
     * Calls `callback(code, value)` for every stored entry.
     *
     * Maps whose length is at most 0x10000 are scanned by index. Longer maps
     * are enumerated with `for...in` so that the holes of a sparse map are
     * not visited; on that path `code` is passed as a string key.
     */
    forEach(callback) {
      const map = this._map;
      const length = map.length;
      if (length <= 0x10000) {
        for (let i = 0; i < length; i++) {
          if (map[i] !== undefined) {
            callback(i, map[i]);
          }
        }
      } else {
        for (const i in map) {
          callback(i, map[i]);
        }
      }
    }

    /**
     * Reverse lookup.
     * @returns {number} The first code mapped to `value`, or -1.
     */
    charCodeOf(value) {
      const map = this._map;
      if (map.length <= 0x10000) {
        return map.indexOf(value);
      }
      for (const charCode in map) {
        if (map[charCode] === value) {
          // `charCode | 0` would wrap codes >= 2^31 to negative numbers, so
          // convert the string key without the 32-bit signed truncation.
          return Number(charCode);
        }
      }
      return -1;
    }

    /** @returns {Array} The backing (sparse) array itself, not a copy. */
    getMap() {
      return this._map;
    }

    /**
     * Reads one character code from `str` starting at `offset`, trying 1 to 4
     * bytes until the accumulated value falls inside a codespace range of the
     * matching length. The result is written to `out.charcode` and
     * `out.length`; when nothing matches, `out` is set to charcode 0 with
     * length 1.
     */
    readCharCode(str, offset, out) {
      let c = 0;
      const codespaceRanges = this.codespaceRanges;
      for (let n = 0, nn = codespaceRanges.length; n < nn; n++) {
        // `>>> 0` keeps the accumulated value unsigned.
        c = ((c << 8) | str.charCodeAt(offset + n)) >>> 0;
        const codespaceRange = codespaceRanges[n];
        for (let k = 0, kk = codespaceRange.length; k < kk; ) {
          const low = codespaceRange[k++];
          const high = codespaceRange[k++];
          if (c >= low && c <= high) {
            out.charcode = c;
            out.length = n + 1;
            return;
          }
        }
      }
      out.charcode = 0;
      out.length = 1;
    }

    /**
     * @returns {number} The byte length of the first codespace range that
     *   contains `charCode`, or 1 when no range does.
     */
    getCharCodeLength(charCode) {
      const codespaceRanges = this.codespaceRanges;
      for (let n = 0, nn = codespaceRanges.length; n < nn; n++) {
        const codespaceRange = codespaceRanges[n];
        for (let k = 0, kk = codespaceRange.length; k < kk; ) {
          const low = codespaceRange[k++];
          const high = codespaceRange[k++];
          if (charCode >= low && charCode <= high) {
            return n + 1;
          }
        }
      }
      return 1;
    }

    /** Length of the backing array (highest mapped code + 1). */
    get length() {
      return this._map.length;
    }

    /**
     * True only when the map is named Identity-H or Identity-V and maps every
     * code in 0..0xffff to itself, with nothing beyond 0xffff.
     */
    get isIdentityCMap() {
      if (!(this.name === "Identity-H" || this.name === "Identity-V")) {
        return false;
      }
      if (this._map.length !== 0x10000) {
        return false;
      }
      for (let i = 0; i < 0x10000; i++) {
        if (this._map[i] !== i) {
          return false;
        }
      }
      return true;
    }
  }
  172. exports.CMap = CMap;
  /**
   * CMap that maps every code in 0..0xffff to itself without materialising
   * the table. The mutating map* methods must never be called on it.
   */
  class IdentityCMap extends CMap {
    /**
     * @param {boolean} vertical - Stored as the `vertical` flag.
     * @param {number} n - Byte length registered for the 0..0xffff codespace.
     */
    constructor(vertical, n) {
      super();
      this.vertical = vertical;
      this.addCodespaceRange(n, 0, 0xffff);
    }

    mapCidRange(low, high, dstLow) {
      (0, _util.unreachable)("should not call mapCidRange");
    }

    mapBfRange(low, high, dstLow) {
      (0, _util.unreachable)("should not call mapBfRange");
    }

    mapBfRangeToArray(low, high, array) {
      (0, _util.unreachable)("should not call mapBfRangeToArray");
    }

    mapOne(src, dst) {
      // The message now names the method that was actually called.
      (0, _util.unreachable)("should not call mapOne");
    }

    /**
     * @returns {number|undefined} `code` itself when it is an integer in
     *   0..0xffff, otherwise `undefined`.
     */
    lookup(code) {
      // The lower bound keeps negative integers from being reported as
      // mapped, matching the 0..0xffff range that forEach/getMap expose.
      return Number.isInteger(code) && code >= 0 && code <= 0xffff
        ? code
        : undefined;
    }

    /** @returns {boolean} Whether `code` is an integer in 0..0xffff. */
    contains(code) {
      return Number.isInteger(code) && code >= 0 && code <= 0xffff;
    }

    /** Calls `callback(i, i)` for every i in 0..0xffff. */
    forEach(callback) {
      for (let i = 0; i <= 0xffff; i++) {
        callback(i, i);
      }
    }

    /**
     * @returns {number} `value` itself when it is an integer in 0..0xffff,
     *   otherwise -1.
     */
    charCodeOf(value) {
      return Number.isInteger(value) && value >= 0 && value <= 0xffff
        ? value
        : -1;
    }

    /** @returns {Array<number>} A freshly built 0x10000-entry identity table. */
    getMap() {
      // Sometimes identity maps must be instantiated, but it's rare.
      const map = new Array(0x10000);
      for (let i = 0; i <= 0xffff; i++) {
        map[i] = i;
      }
      return map;
    }

    get length() {
      return 0x10000;
    }

    // eslint-disable-next-line getter-return
    get isIdentityCMap() {
      (0, _util.unreachable)("should not access .isIdentityCMap");
    }
  }
  219. exports.IdentityCMap = IdentityCMap;
  220. const BinaryCMapReader = function BinaryCMapReaderClosure() {
  /**
   * Interprets bytes a[0..size] (big-endian, `size` is the last index) as an
   * unsigned 32-bit integer.
   */
  function hexToInt(a, size) {
    let value = 0;
    let index = 0;
    while (index <= size) {
      value = (value << 8) | a[index];
      index += 1;
    }
    // Reinterpret the signed 32-bit accumulator as unsigned.
    return value >>> 0;
  }
  /**
   * Builds a string with one character per byte from a[0..size] (`size` is
   * the last index). The two- and four-byte cases are spelled out directly.
   */
  function hexToStr(a, size) {
    switch (size) {
      case 1:
        return String.fromCharCode(a[0], a[1]);
      case 3:
        return String.fromCharCode(a[0], a[1], a[2], a[3]);
      default:
        return String.fromCharCode(...a.subarray(0, size + 1));
    }
  }
  /**
   * In-place big-endian addition: a[0..size] += b[0..size]. A carry out of
   * a[0] is dropped.
   */
  function addHex(a, b, size) {
    let carry = 0;
    let idx = size;
    while (idx >= 0) {
      const sum = carry + a[idx] + b[idx];
      a[idx] = sum & 255;
      carry = sum >> 8;
      idx--;
    }
  }
  /**
   * In-place big-endian increment of a[0..size] by one. Stops as soon as the
   * carry is absorbed; a carry out of a[0] is dropped.
   */
  function incHex(a, size) {
    let carry = 1;
    for (let idx = size; idx >= 0; idx--) {
      if (!(carry > 0)) {
        break;
      }
      const sum = carry + a[idx];
      a[idx] = sum & 255;
      carry = sum >> 8;
    }
  }
  // Size, in bytes, of the scratch buffers that hold a decoded number.
  const MAX_NUM_SIZE = 16;
  // Size, in bytes, of the buffer that collects the 7-bit groups of one
  // encoded number before they are repacked.
  const MAX_ENCODED_NUM_SIZE = 19; // ceil(MAX_NUM_SIZE * 8 / 7)

  /**
   * Cursor over binary CMap data. Numbers are stored as big-endian groups of
   * 7 bits; every byte except the last of a number has its high bit set.
   */
  class BinaryCMapStream {
    /**
     * @param {Uint8Array} data - Bytes to read; `subarray` is called on it.
     */
    constructor(data) {
      this.buffer = data;
      this.pos = 0;
      this.end = data.length;
      this.tmpBuf = new Uint8Array(MAX_ENCODED_NUM_SIZE);
    }

    /** @returns {number} The next byte, or -1 once the data is exhausted. */
    readByte() {
      if (this.pos >= this.end) {
        return -1;
      }
      return this.buffer[this.pos++];
    }

    /**
     * Reads one variable-length number into a plain integer.
     * @throws {FormatError} When the data ends in the middle of a number.
     */
    readNumber() {
      let n = 0;
      let last;
      do {
        const b = this.readByte();
        if (b < 0) {
          throw new _util.FormatError("unexpected EOF in bcmap");
        }
        last = !(b & 0x80);
        n = (n << 7) | (b & 0x7f);
      } while (!last);
      return n;
    }

    /**
     * Reads a number whose lowest bit is the sign: odd n decodes to
     * ~(n >>> 1), even n to n >>> 1.
     */
    readSigned() {
      const n = this.readNumber();
      return n & 1 ? ~(n >>> 1) : n >>> 1;
    }

    /** Copies the next size + 1 raw bytes into `num` and advances past them. */
    readHex(num, size) {
      num.set(this.buffer.subarray(this.pos, this.pos + size + 1));
      this.pos += size + 1;
    }

    /**
     * Reads one variable-length number and stores it big-endian in
     * num[0..size], zero-filling the leading bytes.
     * @throws {FormatError} When the data ends in the middle of a number.
     */
    readHexNumber(num, size) {
      let last;
      const stack = this.tmpBuf;
      let sp = 0;
      do {
        const b = this.readByte();
        if (b < 0) {
          throw new _util.FormatError("unexpected EOF in bcmap");
        }
        last = !(b & 0x80);
        stack[sp++] = b & 0x7f;
      } while (!last);
      let i = size,
        buffer = 0,
        bufferSize = 0;
      while (i >= 0) {
        // Refill the bit buffer from the collected 7-bit groups, least
        // significant group first. The guard must look at the stack pointer:
        // `stack` is a fixed-size typed array, so its length never reaches 0
        // and testing it let the loop read stack[-1], stack[-2], ...
        while (bufferSize < 8 && sp > 0) {
          buffer |= stack[--sp] << bufferSize;
          bufferSize += 7;
        }
        num[i] = buffer & 255;
        i--;
        buffer >>= 8;
        bufferSize -= 8;
      }
    }

    /**
     * Like readHexNumber, then undoes the sign encoding in place: the value
     * is shifted right by one bit across num[0..size] and every byte is
     * inverted when the original lowest bit was set.
     */
    readHexSigned(num, size) {
      this.readHexNumber(num, size);
      const sign = num[size] & 1 ? 255 : 0;
      let c = 0;
      for (let i = 0; i <= size; i++) {
        // Carry the bit shifted out of the previous byte into this one.
        c = ((c & 1) << 8) | num[i];
        num[i] = (c >> 1) ^ sign;
      }
    }

    /** Reads a length followed by that many numbers, one per character. */
    readString() {
      const len = this.readNumber();
      let s = "";
      for (let i = 0; i < len; i++) {
        s += String.fromCharCode(this.readNumber());
      }
      return s;
    }
  }
  class BinaryCMapReader {
    /**
     * Decodes binary CMap `data` and applies every record to `cMap`.
     *
     * After the header byte the data is a sequence of records. The top three
     * bits of a record's first byte select its type; for types 0-5, bit 4 is
     * the "sequence" flag, the low four bits are the data size minus one, and
     * a sub-item count follows. Type 7 records carry a string.
     *
     * @param {Uint8Array} data
     * @param {CMap} cMap - Map that receives the decoded entries.
     * @param {function(string)} extend - Called with the name read from a
     *   type 7 / subtype 1 record; its result becomes the return value.
     * @returns {Promise} `extend(name)` when such a name was present,
     *   otherwise `cMap`.
     * @throws {Error} On an invalid data size or an unknown record type.
     */
    async process(data, cMap, extend) {
      const stream = new BinaryCMapStream(data);
      // Bit 0 of the header byte is the vertical flag.
      cMap.vertical = !!(stream.readByte() & 1);

      // The source codes of type 4/5 records always use this size (two bytes).
      const UCS2_DATA_SIZE = 1;

      const start = new Uint8Array(MAX_NUM_SIZE);
      const end = new Uint8Array(MAX_NUM_SIZE);
      const char = new Uint8Array(MAX_NUM_SIZE);
      const charCode = new Uint8Array(MAX_NUM_SIZE);
      const delta = new Uint8Array(MAX_NUM_SIZE);
      let parentName = null;
      let code;

      // end = start + (next encoded number)
      const readEnd = size => {
        stream.readHexNumber(end, size);
        addHex(end, start, size);
      };
      // Moves to the next range: either it starts right after the previous
      // end (contiguous), or at (previous end + 1) + (next encoded number).
      const advanceStart = (size, contiguous) => {
        incHex(end, size);
        if (contiguous) {
          start.set(end);
        } else {
          stream.readHexNumber(start, size);
          addHex(start, end, size);
        }
      };
      // Moves to the next single code: previous + 1, plus an encoded gap
      // unless the codes are contiguous.
      const advanceChar = (size, contiguous) => {
        incHex(char, size);
        if (!contiguous) {
          stream.readHexNumber(delta, size);
          addHex(char, delta, size);
        }
      };

      for (let b = stream.readByte(); b >= 0; b = stream.readByte()) {
        const type = b >> 5;
        if (type === 7) {
          const subtype = b & 0x1f;
          if (subtype === 0) {
            // The string is consumed and discarded.
            stream.readString();
          } else if (subtype === 1) {
            parentName = stream.readString();
          }
          continue;
        }

        const sequence = (b & 0x10) !== 0;
        const dataSize = b & 15;
        if (dataSize + 1 > MAX_NUM_SIZE) {
          throw new Error("BinaryCMapReader.process: Invalid dataSize.");
        }
        const subitemsCount = stream.readNumber();

        switch (type) {
          case 0:
            // Codespace ranges.
            stream.readHex(start, dataSize);
            readEnd(dataSize);
            cMap.addCodespaceRange(
              dataSize + 1,
              hexToInt(start, dataSize),
              hexToInt(end, dataSize)
            );
            for (let k = 1; k < subitemsCount; k++) {
              advanceStart(dataSize, false);
              readEnd(dataSize);
              cMap.addCodespaceRange(
                dataSize + 1,
                hexToInt(start, dataSize),
                hexToInt(end, dataSize)
              );
            }
            break;
          case 1:
            // Ranges that are decoded to keep the stream position in sync
            // but are not stored in the map.
            stream.readHex(start, dataSize);
            readEnd(dataSize);
            stream.readNumber();
            for (let k = 1; k < subitemsCount; k++) {
              advanceStart(dataSize, false);
              readEnd(dataSize);
              stream.readNumber();
            }
            break;
          case 2:
            // Single code -> number entries.
            stream.readHex(char, dataSize);
            code = stream.readNumber();
            cMap.mapOne(hexToInt(char, dataSize), code);
            for (let k = 1; k < subitemsCount; k++) {
              advanceChar(dataSize, sequence);
              code = stream.readSigned() + (code + 1);
              cMap.mapOne(hexToInt(char, dataSize), code);
            }
            break;
          case 3:
            // Code range -> number range entries.
            stream.readHex(start, dataSize);
            readEnd(dataSize);
            code = stream.readNumber();
            cMap.mapCidRange(
              hexToInt(start, dataSize),
              hexToInt(end, dataSize),
              code
            );
            for (let k = 1; k < subitemsCount; k++) {
              advanceStart(dataSize, sequence);
              readEnd(dataSize);
              code = stream.readNumber();
              cMap.mapCidRange(
                hexToInt(start, dataSize),
                hexToInt(end, dataSize),
                code
              );
            }
            break;
          case 4:
            // Single code -> string entries.
            stream.readHex(char, UCS2_DATA_SIZE);
            stream.readHex(charCode, dataSize);
            cMap.mapOne(
              hexToInt(char, UCS2_DATA_SIZE),
              hexToStr(charCode, dataSize)
            );
            for (let k = 1; k < subitemsCount; k++) {
              advanceChar(UCS2_DATA_SIZE, sequence);
              // Destination = previous + 1 + signed delta.
              incHex(charCode, dataSize);
              stream.readHexSigned(delta, dataSize);
              addHex(charCode, delta, dataSize);
              cMap.mapOne(
                hexToInt(char, UCS2_DATA_SIZE),
                hexToStr(charCode, dataSize)
              );
            }
            break;
          case 5:
            // Code range -> string range entries.
            stream.readHex(start, UCS2_DATA_SIZE);
            readEnd(UCS2_DATA_SIZE);
            stream.readHex(charCode, dataSize);
            cMap.mapBfRange(
              hexToInt(start, UCS2_DATA_SIZE),
              hexToInt(end, UCS2_DATA_SIZE),
              hexToStr(charCode, dataSize)
            );
            for (let k = 1; k < subitemsCount; k++) {
              advanceStart(UCS2_DATA_SIZE, sequence);
              readEnd(UCS2_DATA_SIZE);
              stream.readHex(charCode, dataSize);
              cMap.mapBfRange(
                hexToInt(start, UCS2_DATA_SIZE),
                hexToInt(end, UCS2_DATA_SIZE),
                hexToStr(charCode, dataSize)
              );
            }
            break;
          default:
            throw new Error(`BinaryCMapReader.process - unknown type: ${type}`);
        }
      }

      return parentName ? extend(parentName) : cMap;
    }
  }
  475. return BinaryCMapReader;
  476. }();
  477. const CMapFactory = function CMapFactoryClosure() {
  /**
   * Packs the char codes of `str` big-endian into an unsigned 32-bit integer
   * (8 bits per character).
   */
  function strToInt(str) {
    const count = str.length;
    let packed = 0;
    let pos = 0;
    while (pos < count) {
      packed = (packed << 8) | str.charCodeAt(pos);
      pos += 1;
    }
    return packed >>> 0;
  }
  /**
   * Guard: passes silently for strings.
   * @throws {FormatError} When `obj` is not a string.
   */
  function expectString(obj) {
    if ((0, _util.isString)(obj)) {
      return;
    }
    throw new _util.FormatError("Malformed CMap: expected string.");
  }
  /**
   * Guard: passes silently for integers.
   * @throws {FormatError} When `obj` is not an integer.
   */
  function expectInt(obj) {
    if (Number.isInteger(obj)) {
      return;
    }
    throw new _util.FormatError("Malformed CMap: expected int.");
  }
  /**
   * Consumes <src string> <dst string> pairs from `lexer` and stores each
   * with `cMap.mapOne` until "endbfchar" (or EOF) is reached.
   * @throws {FormatError} When either element of a pair is not a string.
   */
  function parseBfChar(cMap, lexer) {
    for (;;) {
      const srcObj = lexer.getObj();
      if (
        srcObj === _primitives.EOF ||
        (0, _primitives.isCmd)(srcObj, "endbfchar")
      ) {
        return;
      }
      expectString(srcObj);
      const src = strToInt(srcObj);
      const dstObj = lexer.getObj();
      expectString(dstObj);
      // The destination string is stored as-is.
      cMap.mapOne(src, dstObj);
    }
  }
  /**
   * Consumes <low> <high> <destination> triples until "endbfrange". The
   * destination is an integer (turned into a one-character string), a string,
   * or a "[" ... "]" list of per-code values.
   * @throws {FormatError} "Invalid bf range." on EOF or on an unexpected
   *   destination; also when low/high are not strings.
   */
  function parseBfRange(cMap, lexer) {
    for (;;) {
      const lowObj = lexer.getObj();
      if (lowObj === _primitives.EOF) {
        break;
      }
      if ((0, _primitives.isCmd)(lowObj, "endbfrange")) {
        return;
      }
      expectString(lowObj);
      const low = strToInt(lowObj);

      const highObj = lexer.getObj();
      expectString(highObj);
      const high = strToInt(highObj);

      const dstObj = lexer.getObj();
      if (Number.isInteger(dstObj)) {
        cMap.mapBfRange(low, high, String.fromCharCode(dstObj));
        continue;
      }
      if ((0, _util.isString)(dstObj)) {
        cMap.mapBfRange(low, high, dstObj);
        continue;
      }
      if (!(0, _primitives.isCmd)(dstObj, "[")) {
        break;
      }

      // Collect everything up to the closing bracket (or EOF).
      const array = [];
      for (
        let item = lexer.getObj();
        !(0, _primitives.isCmd)(item, "]") && item !== _primitives.EOF;
        item = lexer.getObj()
      ) {
        array.push(item);
      }
      cMap.mapBfRangeToArray(low, high, array);
    }
    throw new _util.FormatError("Invalid bf range.");
  }
  /**
   * Consumes <src string> <dst integer> pairs from `lexer` and stores each
   * with `cMap.mapOne` until "endcidchar" (or EOF) is reached.
   * @throws {FormatError} When the source is not a string or the destination
   *   is not an integer.
   */
  function parseCidChar(cMap, lexer) {
    for (;;) {
      const srcObj = lexer.getObj();
      if (
        srcObj === _primitives.EOF ||
        (0, _primitives.isCmd)(srcObj, "endcidchar")
      ) {
        return;
      }
      expectString(srcObj);
      const src = strToInt(srcObj);
      const dstObj = lexer.getObj();
      expectInt(dstObj);
      cMap.mapOne(src, dstObj);
    }
  }
  /**
   * Consumes <low string> <high string> <dstLow integer> triples from `lexer`
   * and forwards each to `cMap.mapCidRange` until "endcidrange" (or EOF).
   * @throws {FormatError} When an element has the wrong type.
   */
  function parseCidRange(cMap, lexer) {
    for (;;) {
      const lowObj = lexer.getObj();
      if (
        lowObj === _primitives.EOF ||
        (0, _primitives.isCmd)(lowObj, "endcidrange")
      ) {
        return;
      }
      expectString(lowObj);
      const low = strToInt(lowObj);

      const highObj = lexer.getObj();
      expectString(highObj);
      const high = strToInt(highObj);

      const dstObj = lexer.getObj();
      expectInt(dstObj);
      cMap.mapCidRange(low, high, dstObj);
    }
  }
  /**
   * Consumes <low string> <high string> pairs until "endcodespacerange" and
   * registers each with `cMap.addCodespaceRange`, using the length of the
   * high string as the code length.
   * @throws {FormatError} "Invalid codespace range." on EOF or when either
   *   element of a pair is not a string.
   */
  function parseCodespaceRange(cMap, lexer) {
    for (;;) {
      const lowObj = lexer.getObj();
      if (lowObj === _primitives.EOF) {
        break;
      }
      if ((0, _primitives.isCmd)(lowObj, "endcodespacerange")) {
        return;
      }
      if (!(0, _util.isString)(lowObj)) {
        break;
      }
      const low = strToInt(lowObj);

      const highObj = lexer.getObj();
      if (!(0, _util.isString)(highObj)) {
        break;
      }
      const high = strToInt(highObj);
      cMap.addCodespaceRange(highObj.length, low, high);
    }
    throw new _util.FormatError("Invalid codespace range.");
  }
  /**
   * Reads the object following /WMode and, when it is an integer, sets
   * `cMap.vertical` to whether it is non-zero. Anything else is ignored.
   */
  function parseWMode(cMap, lexer) {
    const wmode = lexer.getObj();
    if (!Number.isInteger(wmode)) {
      return;
    }
    cMap.vertical = Boolean(wmode);
  }
  /**
   * Reads the object following /CMapName and, when it is a name object whose
   * `name` is a string, copies that string to `cMap.name`.
   */
  function parseCMapName(cMap, lexer) {
    const nameObj = lexer.getObj();
    if (!(0, _primitives.isName)(nameObj)) {
      return;
    }
    if (!(0, _util.isString)(nameObj.name)) {
      return;
    }
    cMap.name = nameObj.name;
  }
  /**
   * Walks the objects produced by `lexer` and fills `cMap` from the WMode and
   * CMapName entries and from the begin.../end... sections, until "endcmap"
   * or EOF.
   *
   * A failure while handling one object is reported through `warn` and
   * parsing resumes with the next object; MissingDataException is re-thrown.
   *
   * @param {CMap} cMap
   * @param {Lexer} lexer
   * @param {function} fetchBuiltInCMap - Forwarded to `extendCMap`.
   * @param {string} [useCMap] - Name of the CMap to extend from. When falsy,
   *   the name that preceded a "usecmap" operator in the data is used.
   * @returns {Promise<CMap>} `cMap`, extended when a parent name is known.
   */
  async function parseCMap(cMap, lexer, fetchBuiltInCMap, useCMap) {
    let lastName;
    let embeddedUseCMap;
    let finished = false;

    while (!finished) {
      try {
        const obj = lexer.getObj();
        if (obj === _primitives.EOF) {
          finished = true;
        } else if ((0, _primitives.isName)(obj)) {
          if (obj.name === "WMode") {
            parseWMode(cMap, lexer);
          } else if (obj.name === "CMapName") {
            parseCMapName(cMap, lexer);
          }
          // Remembered because "usecmap" refers to the name just before it.
          lastName = obj;
        } else if ((0, _primitives.isCmd)(obj)) {
          switch (obj.cmd) {
            case "endcmap":
              finished = true;
              break;
            case "usecmap":
              if ((0, _primitives.isName)(lastName)) {
                embeddedUseCMap = lastName.name;
              }
              break;
            case "begincodespacerange":
              parseCodespaceRange(cMap, lexer);
              break;
            case "beginbfchar":
              parseBfChar(cMap, lexer);
              break;
            case "begincidchar":
              parseCidChar(cMap, lexer);
              break;
            case "beginbfrange":
              parseBfRange(cMap, lexer);
              break;
            case "begincidrange":
              parseCidRange(cMap, lexer);
              break;
          }
        }
      } catch (ex) {
        if (ex instanceof _core_utils.MissingDataException) {
          throw ex;
        }
        (0, _util.warn)("Invalid cMap data: " + ex);
      }
    }

    // An explicitly supplied parent wins over the one embedded in the data.
    const parentName = useCMap || embeddedUseCMap;
    if (parentName) {
      return extendCMap(cMap, fetchBuiltInCMap, parentName);
    }
    return cMap;
  }
  /**
   * Loads the built-in CMap called `useCMap`, attaches it as `cMap.useCMap`,
   * and merges it into `cMap`:
   *  - when `cMap` declares no codespace ranges, the parent's are copied;
   *  - every parent entry whose key `cMap` does not already contain is added.
   * @returns {Promise<CMap>} The same `cMap` instance.
   */
  async function extendCMap(cMap, fetchBuiltInCMap, useCMap) {
    const parent = await createBuiltInCMap(useCMap, fetchBuiltInCMap);
    cMap.useCMap = parent;

    if (cMap.numCodespaceRanges === 0) {
      // Copy each per-length list so the two maps do not share arrays.
      for (const [index, ranges] of parent.codespaceRanges.entries()) {
        cMap.codespaceRanges[index] = ranges.slice();
      }
      cMap.numCodespaceRanges = parent.numCodespaceRanges;
    }

    // Entries already present in `cMap` take precedence over the parent's.
    parent.forEach(key => {
      if (cMap.contains(key)) {
        return;
      }
      cMap.mapOne(key, parent.lookup(key));
    });
    return cMap;
  }
  /**
   * Creates the predefined CMap called `name`.
   *
   * Identity-H / Identity-V are built directly. Any other name must be listed
   * in BUILT_IN_CMAPS; its data is obtained through `fetchBuiltInCMap(name)`
   * and decoded according to the reported compression type.
   *
   * @param {string} name
   * @param {function(string): Promise<{cMapData, compressionType}>} fetchBuiltInCMap
   * @returns {Promise<CMap>}
   * @throws {Error} For an unknown name, a missing fetcher, or an unsupported
   *   compression type.
   */
  async function createBuiltInCMap(name, fetchBuiltInCMap) {
    if (name === "Identity-H" || name === "Identity-V") {
      const vertical = name === "Identity-V";
      return new IdentityCMap(vertical, 2);
    }
    if (!BUILT_IN_CMAPS.includes(name)) {
      throw new Error("Unknown CMap name: " + name);
    }
    if (!fetchBuiltInCMap) {
      throw new Error("Built-in CMap parameters are not provided.");
    }

    const fetched = await fetchBuiltInCMap(name);
    const cMapData = fetched.cMapData;
    const compressionType = fetched.compressionType;
    const cMap = new CMap(true);

    switch (compressionType) {
      case _util.CMapCompressionType.BINARY: {
        const extend = useCMap => extendCMap(cMap, fetchBuiltInCMap, useCMap);
        return new BinaryCMapReader().process(cMapData, cMap, extend);
      }
      case _util.CMapCompressionType.NONE: {
        const lexer = new _parser.Lexer(new _stream.Stream(cMapData));
        return parseCMap(cMap, lexer, fetchBuiltInCMap, null);
      }
      default:
        throw new Error(
          "TODO: Only BINARY/NONE CMap compression is currently supported."
        );
    }
  }
  715. return {
  716. async create(params) {
  717. const encoding = params.encoding;
  718. const fetchBuiltInCMap = params.fetchBuiltInCMap;
  719. const useCMap = params.useCMap;
  720. if ((0, _primitives.isName)(encoding)) {
  721. return createBuiltInCMap(encoding.name, fetchBuiltInCMap);
  722. } else if ((0, _primitives.isStream)(encoding)) {
  723. const parsedCMap = await parseCMap(new CMap(), new _parser.Lexer(encoding), fetchBuiltInCMap, useCMap);
  724. if (parsedCMap.isIdentityCMap) {
  725. return createBuiltInCMap(parsedCMap.name, fetchBuiltInCMap);
  726. }
  727. return parsedCMap;
  728. }
  729. throw new Error("Encoding required.");
  730. }
  731. };
  732. }();
  733. exports.CMapFactory = CMapFactory;