123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379 |
- /**
- * @licstart The following is the entire license notice for the
- * Javascript code in this page
- *
- * Copyright 2021 Mozilla Foundation
- *
- * Licensed under the Apache License, Version 2.0 (the "License");
- * you may not use this file except in compliance with the License.
- * You may obtain a copy of the License at
- *
- * http://www.apache.org/licenses/LICENSE-2.0
- *
- * Unless required by applicable law or agreed to in writing, software
- * distributed under the License is distributed on an "AS IS" BASIS,
- * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
- * See the License for the specific language governing permissions and
- * limitations under the License.
- *
- * @licend The above is the entire license notice for the
- * Javascript code in this page
- */
- "use strict";
- Object.defineProperty(exports, "__esModule", {
- value: true
- });
- exports.StructTreeRoot = exports.StructTreePage = void 0;
- var _primitives = require("./primitives.js");
- var _util = require("../shared/util.js");
- var _name_number_tree = require("./name_number_tree.js");
- const MAX_DEPTH = 40;
- const StructElementType = {
- PAGE_CONTENT: "PAGE_CONTENT",
- STREAM_CONTENT: "STREAM_CONTENT",
- OBJECT: "OBJECT",
- ELEMENT: "ELEMENT"
- };
- class StructTreeRoot {
- constructor(rootDict) {
- this.dict = rootDict;
- this.roleMap = new Map();
- }
- init() {
- this.readRoleMap();
- }
- readRoleMap() {
- const roleMapDict = this.dict.get("RoleMap");
- if (!(0, _primitives.isDict)(roleMapDict)) {
- return;
- }
- roleMapDict.forEach((key, value) => {
- if (!(0, _primitives.isName)(value)) {
- return;
- }
- this.roleMap.set(key, value.name);
- });
- }
- }
- exports.StructTreeRoot = StructTreeRoot;
- class StructElementNode {
- constructor(tree, dict) {
- this.tree = tree;
- this.dict = dict;
- this.kids = [];
- this.parseKids();
- }
- get role() {
- const nameObj = this.dict.get("S");
- const name = (0, _primitives.isName)(nameObj) ? nameObj.name : "";
- const {
- root
- } = this.tree;
- if (root.roleMap.has(name)) {
- return root.roleMap.get(name);
- }
- return name;
- }
- parseKids() {
- let pageObjId = null;
- const objRef = this.dict.getRaw("Pg");
- if ((0, _primitives.isRef)(objRef)) {
- pageObjId = objRef.toString();
- }
- const kids = this.dict.get("K");
- if (Array.isArray(kids)) {
- for (const kid of kids) {
- const element = this.parseKid(pageObjId, kid);
- if (element) {
- this.kids.push(element);
- }
- }
- } else {
- const element = this.parseKid(pageObjId, kids);
- if (element) {
- this.kids.push(element);
- }
- }
- }
- parseKid(pageObjId, kid) {
- if (Number.isInteger(kid)) {
- if (this.tree.pageDict.objId !== pageObjId) {
- return null;
- }
- return new StructElement({
- type: StructElementType.PAGE_CONTENT,
- mcid: kid,
- pageObjId
- });
- }
- let kidDict = null;
- if ((0, _primitives.isRef)(kid)) {
- kidDict = this.dict.xref.fetch(kid);
- } else if ((0, _primitives.isDict)(kid)) {
- kidDict = kid;
- }
- if (!kidDict) {
- return null;
- }
- const pageRef = kidDict.getRaw("Pg");
- if ((0, _primitives.isRef)(pageRef)) {
- pageObjId = pageRef.toString();
- }
- const type = (0, _primitives.isName)(kidDict.get("Type")) ? kidDict.get("Type").name : null;
- if (type === "MCR") {
- if (this.tree.pageDict.objId !== pageObjId) {
- return null;
- }
- return new StructElement({
- type: StructElementType.STREAM_CONTENT,
- refObjId: (0, _primitives.isRef)(kidDict.getRaw("Stm")) ? kidDict.getRaw("Stm").toString() : null,
- pageObjId,
- mcid: kidDict.get("MCID")
- });
- }
- if (type === "OBJR") {
- if (this.tree.pageDict.objId !== pageObjId) {
- return null;
- }
- return new StructElement({
- type: StructElementType.OBJECT,
- refObjId: (0, _primitives.isRef)(kidDict.getRaw("Obj")) ? kidDict.getRaw("Obj").toString() : null,
- pageObjId
- });
- }
- return new StructElement({
- type: StructElementType.ELEMENT,
- dict: kidDict
- });
- }
- }
- class StructElement {
- constructor({
- type,
- dict = null,
- mcid = null,
- pageObjId = null,
- refObjId = null
- }) {
- this.type = type;
- this.dict = dict;
- this.mcid = mcid;
- this.pageObjId = pageObjId;
- this.refObjId = refObjId;
- this.parentNode = null;
- }
- }
- class StructTreePage {
- constructor(structTreeRoot, pageDict) {
- this.root = structTreeRoot;
- this.rootDict = structTreeRoot ? structTreeRoot.dict : null;
- this.pageDict = pageDict;
- this.nodes = [];
- }
- parse() {
- if (!this.root || !this.rootDict) {
- return;
- }
- const parentTree = this.rootDict.get("ParentTree");
- if (!parentTree) {
- return;
- }
- const id = this.pageDict.get("StructParents");
- if (!Number.isInteger(id)) {
- return;
- }
- const numberTree = new _name_number_tree.NumberTree(parentTree, this.rootDict.xref);
- const parentArray = numberTree.get(id);
- if (!Array.isArray(parentArray)) {
- return;
- }
- const map = new Map();
- for (const ref of parentArray) {
- if ((0, _primitives.isRef)(ref)) {
- this.addNode(this.rootDict.xref.fetch(ref), map);
- }
- }
- }
- addNode(dict, map, level = 0) {
- if (level > MAX_DEPTH) {
- (0, _util.warn)("StructTree MAX_DEPTH reached.");
- return null;
- }
- if (map.has(dict)) {
- return map.get(dict);
- }
- const element = new StructElementNode(this, dict);
- map.set(dict, element);
- const parent = dict.get("P");
- if (!parent || (0, _primitives.isName)(parent.get("Type"), "StructTreeRoot")) {
- if (!this.addTopLevelNode(dict, element)) {
- map.delete(dict);
- }
- return element;
- }
- const parentNode = this.addNode(parent, map, level + 1);
- if (!parentNode) {
- return element;
- }
- let save = false;
- for (const kid of parentNode.kids) {
- if (kid.type === StructElementType.ELEMENT && kid.dict === dict) {
- kid.parentNode = element;
- save = true;
- }
- }
- if (!save) {
- map.delete(dict);
- }
- return element;
- }
- addTopLevelNode(dict, element) {
- const obj = this.rootDict.get("K");
- if (!obj) {
- return false;
- }
- if ((0, _primitives.isDict)(obj)) {
- if (obj.objId !== dict.objId) {
- return false;
- }
- this.nodes[0] = element;
- return true;
- }
- if (!Array.isArray(obj)) {
- return true;
- }
- let save = false;
- for (let i = 0; i < obj.length; i++) {
- const kidRef = obj[i];
- if (kidRef && kidRef.toString() === dict.objId) {
- this.nodes[i] = element;
- save = true;
- }
- }
- return save;
- }
- get serializable() {
- function nodeToSerializable(node, parent, level = 0) {
- if (level > MAX_DEPTH) {
- (0, _util.warn)("StructTree too deep to be fully serialized.");
- return;
- }
- const obj = Object.create(null);
- obj.role = node.role;
- obj.children = [];
- parent.children.push(obj);
- const alt = node.dict.get("Alt");
- if ((0, _util.isString)(alt)) {
- obj.alt = (0, _util.stringToPDFString)(alt);
- }
- for (const kid of node.kids) {
- const kidElement = kid.type === StructElementType.ELEMENT ? kid.parentNode : null;
- if (kidElement) {
- nodeToSerializable(kidElement, obj, level + 1);
- continue;
- } else if (kid.type === StructElementType.PAGE_CONTENT || kid.type === StructElementType.STREAM_CONTENT) {
- obj.children.push({
- type: "content",
- id: `page${kid.pageObjId}_mcid${kid.mcid}`
- });
- } else if (kid.type === StructElementType.OBJECT) {
- obj.children.push({
- type: "object",
- id: kid.refObjId
- });
- }
- }
- }
- const root = Object.create(null);
- root.children = [];
- root.role = "Root";
- for (const child of this.nodes) {
- if (!child) {
- continue;
- }
- nodeToSerializable(child, root);
- }
- return root;
- }
- }
- exports.StructTreePage = StructTreePage;
|