| 123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417418419420421422423424425426427428429430431432433434435436437438439440441442443444445446447448449450451452453454455456457458459460461462463464465466467468469470471472473474475476477478479480481482483484485486487488489490491492493494495496497498499500501502503504505506507508509510511512513514515516517518519520521522523524525526527528529530531532533534535536537538539540541542543544545546547548549550551552553554555556557558559560561562563564565566567568569570571572573574575576577578579580581582583584585586587588589590591592593594595596597598599600601602603604605606607608609610611612613614615616617618619620621622623624625626627628629630631632633634635636637638639640641642643644645646647648649650651652653654655656657658659660661662663664665666667668669670671672673674675676677678679680681682683684685686687688689690691692693694695696697698699700701702
70370470570670770870971071171271371471571671771871972072172272372472572672772872973073173273373473573673773873974074174274374474574674774874975075175275375475575675775875976076176276376476576676776876977077177277377477577677777877978078178278378478578678778878979079179279379479579679779879980080180280380480580680780880981081181281381481581681781881982082182282382482582682782882983083183283383483583683783883984084184284384484584684784884985085185285385485585685785885986086186286386486586686786886987087187287387487587687787887988088188288388488588688788888989089189289389489589689789889990090190290390490590690790890991091191291391491591691791891992092192292392492592692792892993093193293393493593693793893994094194294394494594694794894995095195295395495595695795895996096196296396496596696796896997097197297397497597697797897998098198298398498598698798898999099199299399499599699799899910001001100210031004100510061007100810091010101110121013101410151016101710181019102010211022102310241025102610271028102910301031103210331034103510361037103810391040104110421043104410451046104710481049105010511052105310541055105610571058105910601061106210631064106510661067106810691070107110721073107410751076107710781079108010811082108310841085108610871088108910901091109210931094109510961097109810991100110111021103110411051106110711081109111011111112111311141115111611171118111911201121112211231124112511261127112811291130113111321133113411351136113711381139114011411142114311441145114611471148114911501151115211531154115511561157115811591160116111621163116411651166116711681169117011711172117311741175117611771178117911801181118211831184118511861187118811891190119111921193119411951196119711981199120012011202120312041205120612071208120912101211121212131214121512161217121812191220122112221223122412251226122712281229123012311232123312341235123612371238123912401241124212431244124512461247124812491250125112521253125412551256125712581259126012611262126312641265126612671268126912701271127212731274127512761
27712781279128012811282128312841285128612871288128912901291129212931294129512961297129812991300130113021303130413051306130713081309131013111312131313141315131613171318131913201321132213231324132513261327132813291330133113321333133413351336133713381339134013411342134313441345134613471348134913501351135213531354135513561357135813591360136113621363136413651366136713681369137013711372137313741375137613771378137913801381138213831384138513861387138813891390139113921393139413951396139713981399140014011402140314041405140614071408140914101411141214131414141514161417141814191420142114221423142414251426142714281429143014311432143314341435143614371438143914401441144214431444144514461447144814491450145114521453145414551456145714581459146014611462146314641465146614671468146914701471147214731474147514761477147814791480148114821483148414851486148714881489149014911492149314941495149614971498149915001501150215031504150515061507150815091510151115121513151415151516151715181519152015211522152315241525152615271528152915301531153215331534153515361537153815391540154115421543154415451546154715481549155015511552155315541555155615571558155915601561156215631564156515661567156815691570157115721573157415751576157715781579158015811582158315841585158615871588158915901591159215931594159515961597159815991600160116021603160416051606160716081609161016111612161316141615161616171618161916201621162216231624162516261627162816291630163116321633163416351636163716381639164016411642164316441645164616471648164916501651165216531654165516561657 |
- /* Copyright 2012 Mozilla Foundation
- *
- * Licensed under the Apache License, Version 2.0 (the "License");
- * you may not use this file except in compliance with the License.
- * You may obtain a copy of the License at
- *
- * http://www.apache.org/licenses/LICENSE-2.0
- *
- * Unless required by applicable law or agreed to in writing, software
- * distributed under the License is distributed on an "AS IS" BASIS,
- * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
- * See the License for the specific language governing permissions and
- * limitations under the License.
- */
- import {
- collectActions,
- MissingDataException,
- PDF_VERSION_REGEXP,
- recoverJsURL,
- toRomanNumerals,
- XRefEntryException,
- } from "./core_utils.js";
- import {
- createValidAbsoluteUrl,
- DocumentActionEventType,
- FormatError,
- info,
- objectSize,
- PermissionFlag,
- shadow,
- stringToPDFString,
- stringToUTF8String,
- warn,
- } from "../shared/util.js";
- import {
- Dict,
- isDict,
- isName,
- isRefsEqual,
- Name,
- Ref,
- RefSet,
- RefSetCache,
- } from "./primitives.js";
- import { NameTree, NumberTree } from "./name_number_tree.js";
- import { BaseStream } from "./base_stream.js";
- import { clearGlobalCaches } from "./cleanup_helper.js";
- import { ColorSpace } from "./colorspace.js";
- import { FileSpec } from "./file_spec.js";
- import { GlobalImageCache } from "./image_utils.js";
- import { MetadataParser } from "./metadata_parser.js";
- import { StructTreeRoot } from "./struct_tree.js";
/**
 * Normalize a destination entry into an explicit destination array.
 *
 * When `dest` is a `Dict`, its "D" entry is used in its place; any other
 * value is inspected as-is.
 *
 * @param {*} dest - A destination array, a dictionary with a "D" entry,
 *   or any other value.
 * @returns {Array|null} The destination array, or `null` when the (possibly
 *   unwrapped) value is not an array.
 */
function fetchDestination(dest) {
  const candidate = dest instanceof Dict ? dest.get("D") : dest;
  if (Array.isArray(candidate)) {
    return candidate;
  }
  return null;
}
- class Catalog {
- constructor(pdfManager, xref) {
- this.pdfManager = pdfManager;
- this.xref = xref;
- this._catDict = xref.getCatalogObj();
- if (!(this._catDict instanceof Dict)) {
- throw new FormatError("Catalog object is not a dictionary.");
- }
- // Given that `XRef.parse` will both fetch *and* validate the /Pages-entry,
- // the following call must always succeed here:
- this.toplevelPagesDict; // eslint-disable-line no-unused-expressions
- this._actualNumPages = null;
- this.fontCache = new RefSetCache();
- this.builtInCMapCache = new Map();
- this.standardFontDataCache = new Map();
- this.globalImageCache = new GlobalImageCache();
- this.pageKidsCountCache = new RefSetCache();
- this.pageIndexCache = new RefSetCache();
- this.nonBlendModesSet = new RefSet();
- }
- get version() {
- const version = this._catDict.get("Version");
- if (version instanceof Name) {
- if (PDF_VERSION_REGEXP.test(version.name)) {
- return shadow(this, "version", version.name);
- }
- warn(`Invalid PDF catalog version: ${version.name}`);
- }
- return shadow(this, "version", null);
- }
- get lang() {
- const lang = this._catDict.get("Lang");
- return shadow(
- this,
- "lang",
- typeof lang === "string" ? stringToPDFString(lang) : null
- );
- }
- /**
- * @type {boolean} `true` for pure XFA documents,
- * `false` for XFA Foreground documents.
- */
- get needsRendering() {
- const needsRendering = this._catDict.get("NeedsRendering");
- return shadow(
- this,
- "needsRendering",
- typeof needsRendering === "boolean" ? needsRendering : false
- );
- }
- get collection() {
- let collection = null;
- try {
- const obj = this._catDict.get("Collection");
- if (obj instanceof Dict && obj.size > 0) {
- collection = obj;
- }
- } catch (ex) {
- if (ex instanceof MissingDataException) {
- throw ex;
- }
- info("Cannot fetch Collection entry; assuming no collection is present.");
- }
- return shadow(this, "collection", collection);
- }
- get acroForm() {
- let acroForm = null;
- try {
- const obj = this._catDict.get("AcroForm");
- if (obj instanceof Dict && obj.size > 0) {
- acroForm = obj;
- }
- } catch (ex) {
- if (ex instanceof MissingDataException) {
- throw ex;
- }
- info("Cannot fetch AcroForm entry; assuming no forms are present.");
- }
- return shadow(this, "acroForm", acroForm);
- }
- get acroFormRef() {
- const value = this._catDict.getRaw("AcroForm");
- return shadow(this, "acroFormRef", value instanceof Ref ? value : null);
- }
- get metadata() {
- const streamRef = this._catDict.getRaw("Metadata");
- if (!(streamRef instanceof Ref)) {
- return shadow(this, "metadata", null);
- }
- let metadata = null;
- try {
- const suppressEncryption = !(
- this.xref.encrypt && this.xref.encrypt.encryptMetadata
- );
- const stream = this.xref.fetch(streamRef, suppressEncryption);
- if (stream instanceof BaseStream && stream.dict instanceof Dict) {
- const type = stream.dict.get("Type");
- const subtype = stream.dict.get("Subtype");
- if (isName(type, "Metadata") && isName(subtype, "XML")) {
- // XXX: This should examine the charset the XML document defines,
- // however since there are currently no real means to decode arbitrary
- // charsets, let's just hope that the author of the PDF was reasonable
- // enough to stick with the XML default charset, which is UTF-8.
- const data = stringToUTF8String(stream.getString());
- if (data) {
- metadata = new MetadataParser(data).serializable;
- }
- }
- }
- } catch (ex) {
- if (ex instanceof MissingDataException) {
- throw ex;
- }
- info(`Skipping invalid Metadata: "${ex}".`);
- }
- return shadow(this, "metadata", metadata);
- }
- get markInfo() {
- let markInfo = null;
- try {
- markInfo = this._readMarkInfo();
- } catch (ex) {
- if (ex instanceof MissingDataException) {
- throw ex;
- }
- warn("Unable to read mark info.");
- }
- return shadow(this, "markInfo", markInfo);
- }
- /**
- * @private
- */
- _readMarkInfo() {
- const obj = this._catDict.get("MarkInfo");
- if (!(obj instanceof Dict)) {
- return null;
- }
- const markInfo = {
- Marked: false,
- UserProperties: false,
- Suspects: false,
- };
- for (const key in markInfo) {
- const value = obj.get(key);
- if (typeof value === "boolean") {
- markInfo[key] = value;
- }
- }
- return markInfo;
- }
- get structTreeRoot() {
- let structTree = null;
- try {
- structTree = this._readStructTreeRoot();
- } catch (ex) {
- if (ex instanceof MissingDataException) {
- throw ex;
- }
- warn("Unable read to structTreeRoot info.");
- }
- return shadow(this, "structTreeRoot", structTree);
- }
- /**
- * @private
- */
- _readStructTreeRoot() {
- const obj = this._catDict.get("StructTreeRoot");
- if (!(obj instanceof Dict)) {
- return null;
- }
- const root = new StructTreeRoot(obj);
- root.init();
- return root;
- }
- get toplevelPagesDict() {
- const pagesObj = this._catDict.get("Pages");
- if (!(pagesObj instanceof Dict)) {
- throw new FormatError("Invalid top-level pages dictionary.");
- }
- return shadow(this, "toplevelPagesDict", pagesObj);
- }
- get documentOutline() {
- let obj = null;
- try {
- obj = this._readDocumentOutline();
- } catch (ex) {
- if (ex instanceof MissingDataException) {
- throw ex;
- }
- warn("Unable to read document outline.");
- }
- return shadow(this, "documentOutline", obj);
- }
- /**
- * @private
- */
- _readDocumentOutline() {
- let obj = this._catDict.get("Outlines");
- if (!(obj instanceof Dict)) {
- return null;
- }
- obj = obj.getRaw("First");
- if (!(obj instanceof Ref)) {
- return null;
- }
- const root = { items: [] };
- const queue = [{ obj, parent: root }];
- // To avoid recursion, keep track of the already processed items.
- const processed = new RefSet();
- processed.put(obj);
- const xref = this.xref,
- blackColor = new Uint8ClampedArray(3);
- while (queue.length > 0) {
- const i = queue.shift();
- const outlineDict = xref.fetchIfRef(i.obj);
- if (outlineDict === null) {
- continue;
- }
- if (!outlineDict.has("Title")) {
- throw new FormatError("Invalid outline item encountered.");
- }
- const data = { url: null, dest: null, action: null };
- Catalog.parseDestDictionary({
- destDict: outlineDict,
- resultObj: data,
- docBaseUrl: this.pdfManager.docBaseUrl,
- docAttachments: this.attachments,
- });
- const title = outlineDict.get("Title");
- const flags = outlineDict.get("F") || 0;
- const color = outlineDict.getArray("C");
- const count = outlineDict.get("Count");
- let rgbColor = blackColor;
- // We only need to parse the color when it's valid, and non-default.
- if (
- Array.isArray(color) &&
- color.length === 3 &&
- (color[0] !== 0 || color[1] !== 0 || color[2] !== 0)
- ) {
- rgbColor = ColorSpace.singletons.rgb.getRgb(color, 0);
- }
- const outlineItem = {
- action: data.action,
- attachment: data.attachment,
- dest: data.dest,
- url: data.url,
- unsafeUrl: data.unsafeUrl,
- newWindow: data.newWindow,
- setOCGState: data.setOCGState,
- title: stringToPDFString(title),
- color: rgbColor,
- count: Number.isInteger(count) ? count : undefined,
- bold: !!(flags & 2),
- italic: !!(flags & 1),
- items: [],
- };
- i.parent.items.push(outlineItem);
- obj = outlineDict.getRaw("First");
- if (obj instanceof Ref && !processed.has(obj)) {
- queue.push({ obj, parent: outlineItem });
- processed.put(obj);
- }
- obj = outlineDict.getRaw("Next");
- if (obj instanceof Ref && !processed.has(obj)) {
- queue.push({ obj, parent: i.parent });
- processed.put(obj);
- }
- }
- return root.items.length > 0 ? root.items : null;
- }
- get permissions() {
- let permissions = null;
- try {
- permissions = this._readPermissions();
- } catch (ex) {
- if (ex instanceof MissingDataException) {
- throw ex;
- }
- warn("Unable to read permissions.");
- }
- return shadow(this, "permissions", permissions);
- }
- /**
- * @private
- */
- _readPermissions() {
- const encrypt = this.xref.trailer.get("Encrypt");
- if (!(encrypt instanceof Dict)) {
- return null;
- }
- let flags = encrypt.get("P");
- if (typeof flags !== "number") {
- return null;
- }
- // PDF integer objects are represented internally in signed 2's complement
- // form. Therefore, convert the signed decimal integer to a signed 2's
- // complement binary integer so we can use regular bitwise operations on it.
- flags += 2 ** 32;
- const permissions = [];
- for (const key in PermissionFlag) {
- const value = PermissionFlag[key];
- if (flags & value) {
- permissions.push(value);
- }
- }
- return permissions;
- }
- get optionalContentConfig() {
- let config = null;
- try {
- const properties = this._catDict.get("OCProperties");
- if (!properties) {
- return shadow(this, "optionalContentConfig", null);
- }
- const defaultConfig = properties.get("D");
- if (!defaultConfig) {
- return shadow(this, "optionalContentConfig", null);
- }
- const groupsData = properties.get("OCGs");
- if (!Array.isArray(groupsData)) {
- return shadow(this, "optionalContentConfig", null);
- }
- const groups = [];
- const groupRefs = [];
- // Ensure all the optional content groups are valid.
- for (const groupRef of groupsData) {
- if (!(groupRef instanceof Ref)) {
- continue;
- }
- groupRefs.push(groupRef);
- const group = this.xref.fetchIfRef(groupRef);
- groups.push({
- id: groupRef.toString(),
- name:
- typeof group.get("Name") === "string"
- ? stringToPDFString(group.get("Name"))
- : null,
- intent:
- typeof group.get("Intent") === "string"
- ? stringToPDFString(group.get("Intent"))
- : null,
- });
- }
- config = this._readOptionalContentConfig(defaultConfig, groupRefs);
- config.groups = groups;
- } catch (ex) {
- if (ex instanceof MissingDataException) {
- throw ex;
- }
- warn(`Unable to read optional content config: ${ex}`);
- }
- return shadow(this, "optionalContentConfig", config);
- }
- _readOptionalContentConfig(config, contentGroupRefs) {
- function parseOnOff(refs) {
- const onParsed = [];
- if (Array.isArray(refs)) {
- for (const value of refs) {
- if (!(value instanceof Ref)) {
- continue;
- }
- if (contentGroupRefs.includes(value)) {
- onParsed.push(value.toString());
- }
- }
- }
- return onParsed;
- }
- function parseOrder(refs, nestedLevels = 0) {
- if (!Array.isArray(refs)) {
- return null;
- }
- const order = [];
- for (const value of refs) {
- if (value instanceof Ref && contentGroupRefs.includes(value)) {
- parsedOrderRefs.put(value); // Handle "hidden" groups, see below.
- order.push(value.toString());
- continue;
- }
- // Handle nested /Order arrays (see e.g. issue 9462 and bug 1240641).
- const nestedOrder = parseNestedOrder(value, nestedLevels);
- if (nestedOrder) {
- order.push(nestedOrder);
- }
- }
- if (nestedLevels > 0) {
- return order;
- }
- const hiddenGroups = [];
- for (const groupRef of contentGroupRefs) {
- if (parsedOrderRefs.has(groupRef)) {
- continue;
- }
- hiddenGroups.push(groupRef.toString());
- }
- if (hiddenGroups.length) {
- order.push({ name: null, order: hiddenGroups });
- }
- return order;
- }
- function parseNestedOrder(ref, nestedLevels) {
- if (++nestedLevels > MAX_NESTED_LEVELS) {
- warn("parseNestedOrder - reached MAX_NESTED_LEVELS.");
- return null;
- }
- const value = xref.fetchIfRef(ref);
- if (!Array.isArray(value)) {
- return null;
- }
- const nestedName = xref.fetchIfRef(value[0]);
- if (typeof nestedName !== "string") {
- return null;
- }
- const nestedOrder = parseOrder(value.slice(1), nestedLevels);
- if (!nestedOrder || !nestedOrder.length) {
- return null;
- }
- return { name: stringToPDFString(nestedName), order: nestedOrder };
- }
- const xref = this.xref,
- parsedOrderRefs = new RefSet(),
- MAX_NESTED_LEVELS = 10;
- return {
- name:
- typeof config.get("Name") === "string"
- ? stringToPDFString(config.get("Name"))
- : null,
- creator:
- typeof config.get("Creator") === "string"
- ? stringToPDFString(config.get("Creator"))
- : null,
- baseState:
- config.get("BaseState") instanceof Name
- ? config.get("BaseState").name
- : null,
- on: parseOnOff(config.get("ON")),
- off: parseOnOff(config.get("OFF")),
- order: parseOrder(config.get("Order")),
- groups: null,
- };
- }
- setActualNumPages(num = null) {
- this._actualNumPages = num;
- }
- get hasActualNumPages() {
- return this._actualNumPages !== null;
- }
- get _pagesCount() {
- const obj = this.toplevelPagesDict.get("Count");
- if (!Number.isInteger(obj)) {
- throw new FormatError(
- "Page count in top-level pages dictionary is not an integer."
- );
- }
- return shadow(this, "_pagesCount", obj);
- }
- get numPages() {
- return this.hasActualNumPages ? this._actualNumPages : this._pagesCount;
- }
- get destinations() {
- const obj = this._readDests(),
- dests = Object.create(null);
- if (obj instanceof NameTree) {
- for (const [key, value] of obj.getAll()) {
- const dest = fetchDestination(value);
- if (dest) {
- dests[stringToPDFString(key)] = dest;
- }
- }
- } else if (obj instanceof Dict) {
- obj.forEach(function (key, value) {
- const dest = fetchDestination(value);
- if (dest) {
- dests[key] = dest;
- }
- });
- }
- return shadow(this, "destinations", dests);
- }
- getDestination(id) {
- const obj = this._readDests();
- if (obj instanceof NameTree) {
- const dest = fetchDestination(obj.get(id));
- if (dest) {
- return dest;
- }
- // Fallback to checking the *entire* NameTree, in an attempt to handle
- // corrupt PDF documents with out-of-order NameTrees (fixes issue 10272).
- const allDest = this.destinations[id];
- if (allDest) {
- warn(`Found "${id}" at an incorrect position in the NameTree.`);
- return allDest;
- }
- } else if (obj instanceof Dict) {
- const dest = fetchDestination(obj.get(id));
- if (dest) {
- return dest;
- }
- }
- return null;
- }
- /**
- * @private
- */
- _readDests() {
- const obj = this._catDict.get("Names");
- if (obj && obj.has("Dests")) {
- return new NameTree(obj.getRaw("Dests"), this.xref);
- } else if (this._catDict.has("Dests")) {
- // Simple destination dictionary.
- return this._catDict.get("Dests");
- }
- return undefined;
- }
- get pageLabels() {
- let obj = null;
- try {
- obj = this._readPageLabels();
- } catch (ex) {
- if (ex instanceof MissingDataException) {
- throw ex;
- }
- warn("Unable to read page labels.");
- }
- return shadow(this, "pageLabels", obj);
- }
- /**
- * @private
- */
- _readPageLabels() {
- const obj = this._catDict.getRaw("PageLabels");
- if (!obj) {
- return null;
- }
- const pageLabels = new Array(this.numPages);
- let style = null,
- prefix = "";
- const numberTree = new NumberTree(obj, this.xref);
- const nums = numberTree.getAll();
- let currentLabel = "",
- currentIndex = 1;
- for (let i = 0, ii = this.numPages; i < ii; i++) {
- const labelDict = nums.get(i);
- if (labelDict !== undefined) {
- if (!(labelDict instanceof Dict)) {
- throw new FormatError("PageLabel is not a dictionary.");
- }
- if (
- labelDict.has("Type") &&
- !isName(labelDict.get("Type"), "PageLabel")
- ) {
- throw new FormatError("Invalid type in PageLabel dictionary.");
- }
- if (labelDict.has("S")) {
- const s = labelDict.get("S");
- if (!(s instanceof Name)) {
- throw new FormatError("Invalid style in PageLabel dictionary.");
- }
- style = s.name;
- } else {
- style = null;
- }
- if (labelDict.has("P")) {
- const p = labelDict.get("P");
- if (typeof p !== "string") {
- throw new FormatError("Invalid prefix in PageLabel dictionary.");
- }
- prefix = stringToPDFString(p);
- } else {
- prefix = "";
- }
- if (labelDict.has("St")) {
- const st = labelDict.get("St");
- if (!(Number.isInteger(st) && st >= 1)) {
- throw new FormatError("Invalid start in PageLabel dictionary.");
- }
- currentIndex = st;
- } else {
- currentIndex = 1;
- }
- }
- switch (style) {
- case "D":
- currentLabel = currentIndex;
- break;
- case "R":
- case "r":
- currentLabel = toRomanNumerals(currentIndex, style === "r");
- break;
- case "A":
- case "a":
- const LIMIT = 26; // Use only the characters A-Z, or a-z.
- const A_UPPER_CASE = 0x41,
- A_LOWER_CASE = 0x61;
- const baseCharCode = style === "a" ? A_LOWER_CASE : A_UPPER_CASE;
- const letterIndex = currentIndex - 1;
- const character = String.fromCharCode(
- baseCharCode + (letterIndex % LIMIT)
- );
- currentLabel = character.repeat(Math.floor(letterIndex / LIMIT) + 1);
- break;
- default:
- if (style) {
- throw new FormatError(
- `Invalid style "${style}" in PageLabel dictionary.`
- );
- }
- currentLabel = "";
- }
- pageLabels[i] = prefix + currentLabel;
- currentIndex++;
- }
- return pageLabels;
- }
- get pageLayout() {
- const obj = this._catDict.get("PageLayout");
- // Purposely use a non-standard default value, rather than 'SinglePage', to
- // allow differentiating between `undefined` and /SinglePage since that does
- // affect the Scroll mode (continuous/non-continuous) used in Adobe Reader.
- let pageLayout = "";
- if (obj instanceof Name) {
- switch (obj.name) {
- case "SinglePage":
- case "OneColumn":
- case "TwoColumnLeft":
- case "TwoColumnRight":
- case "TwoPageLeft":
- case "TwoPageRight":
- pageLayout = obj.name;
- }
- }
- return shadow(this, "pageLayout", pageLayout);
- }
- get pageMode() {
- const obj = this._catDict.get("PageMode");
- let pageMode = "UseNone"; // Default value.
- if (obj instanceof Name) {
- switch (obj.name) {
- case "UseNone":
- case "UseOutlines":
- case "UseThumbs":
- case "FullScreen":
- case "UseOC":
- case "UseAttachments":
- pageMode = obj.name;
- }
- }
- return shadow(this, "pageMode", pageMode);
- }
- get viewerPreferences() {
- const obj = this._catDict.get("ViewerPreferences");
- if (!(obj instanceof Dict)) {
- return shadow(this, "viewerPreferences", null);
- }
- let prefs = null;
- for (const key of obj.getKeys()) {
- const value = obj.get(key);
- let prefValue;
- switch (key) {
- case "HideToolbar":
- case "HideMenubar":
- case "HideWindowUI":
- case "FitWindow":
- case "CenterWindow":
- case "DisplayDocTitle":
- case "PickTrayByPDFSize":
- if (typeof value === "boolean") {
- prefValue = value;
- }
- break;
- case "NonFullScreenPageMode":
- if (value instanceof Name) {
- switch (value.name) {
- case "UseNone":
- case "UseOutlines":
- case "UseThumbs":
- case "UseOC":
- prefValue = value.name;
- break;
- default:
- prefValue = "UseNone";
- }
- }
- break;
- case "Direction":
- if (value instanceof Name) {
- switch (value.name) {
- case "L2R":
- case "R2L":
- prefValue = value.name;
- break;
- default:
- prefValue = "L2R";
- }
- }
- break;
- case "ViewArea":
- case "ViewClip":
- case "PrintArea":
- case "PrintClip":
- if (value instanceof Name) {
- switch (value.name) {
- case "MediaBox":
- case "CropBox":
- case "BleedBox":
- case "TrimBox":
- case "ArtBox":
- prefValue = value.name;
- break;
- default:
- prefValue = "CropBox";
- }
- }
- break;
- case "PrintScaling":
- if (value instanceof Name) {
- switch (value.name) {
- case "None":
- case "AppDefault":
- prefValue = value.name;
- break;
- default:
- prefValue = "AppDefault";
- }
- }
- break;
- case "Duplex":
- if (value instanceof Name) {
- switch (value.name) {
- case "Simplex":
- case "DuplexFlipShortEdge":
- case "DuplexFlipLongEdge":
- prefValue = value.name;
- break;
- default:
- prefValue = "None";
- }
- }
- break;
- case "PrintPageRange":
- // The number of elements must be even.
- if (Array.isArray(value) && value.length % 2 === 0) {
- const isValid = value.every((page, i, arr) => {
- return (
- Number.isInteger(page) &&
- page > 0 &&
- (i === 0 || page >= arr[i - 1]) &&
- page <= this.numPages
- );
- });
- if (isValid) {
- prefValue = value;
- }
- }
- break;
- case "NumCopies":
- if (Number.isInteger(value) && value > 0) {
- prefValue = value;
- }
- break;
- default:
- warn(`Ignoring non-standard key in ViewerPreferences: ${key}.`);
- continue;
- }
- if (prefValue === undefined) {
- warn(`Bad value, for key "${key}", in ViewerPreferences: ${value}.`);
- continue;
- }
- if (!prefs) {
- prefs = Object.create(null);
- }
- prefs[key] = prefValue;
- }
- return shadow(this, "viewerPreferences", prefs);
- }
- get openAction() {
- const obj = this._catDict.get("OpenAction");
- const openAction = Object.create(null);
- if (obj instanceof Dict) {
- // Convert the OpenAction dictionary into a format that works with
- // `parseDestDictionary`, to avoid having to re-implement those checks.
- const destDict = new Dict(this.xref);
- destDict.set("A", obj);
- const resultObj = { url: null, dest: null, action: null };
- Catalog.parseDestDictionary({ destDict, resultObj });
- if (Array.isArray(resultObj.dest)) {
- openAction.dest = resultObj.dest;
- } else if (resultObj.action) {
- openAction.action = resultObj.action;
- }
- } else if (Array.isArray(obj)) {
- openAction.dest = obj;
- }
- return shadow(
- this,
- "openAction",
- objectSize(openAction) > 0 ? openAction : null
- );
- }
- get attachments() {
- const obj = this._catDict.get("Names");
- let attachments = null;
- if (obj instanceof Dict && obj.has("EmbeddedFiles")) {
- const nameTree = new NameTree(obj.getRaw("EmbeddedFiles"), this.xref);
- for (const [key, value] of nameTree.getAll()) {
- const fs = new FileSpec(value, this.xref);
- if (!attachments) {
- attachments = Object.create(null);
- }
- attachments[stringToPDFString(key)] = fs.serializable;
- }
- }
- return shadow(this, "attachments", attachments);
- }
- get xfaImages() {
- const obj = this._catDict.get("Names");
- let xfaImages = null;
- if (obj instanceof Dict && obj.has("XFAImages")) {
- const nameTree = new NameTree(obj.getRaw("XFAImages"), this.xref);
- for (const [key, value] of nameTree.getAll()) {
- if (!xfaImages) {
- xfaImages = new Dict(this.xref);
- }
- xfaImages.set(stringToPDFString(key), value);
- }
- }
- return shadow(this, "xfaImages", xfaImages);
- }
- _collectJavaScript() {
- const obj = this._catDict.get("Names");
- let javaScript = null;
- function appendIfJavaScriptDict(name, jsDict) {
- if (!(jsDict instanceof Dict)) {
- return;
- }
- if (!isName(jsDict.get("S"), "JavaScript")) {
- return;
- }
- let js = jsDict.get("JS");
- if (js instanceof BaseStream) {
- js = js.getString();
- } else if (typeof js !== "string") {
- return;
- }
- if (javaScript === null) {
- javaScript = new Map();
- }
- js = stringToPDFString(js).replace(/\u0000/g, "");
- javaScript.set(name, js);
- }
- if (obj instanceof Dict && obj.has("JavaScript")) {
- const nameTree = new NameTree(obj.getRaw("JavaScript"), this.xref);
- for (const [key, value] of nameTree.getAll()) {
- appendIfJavaScriptDict(stringToPDFString(key), value);
- }
- }
- // Append OpenAction "JavaScript" actions, if any, to the JavaScript map.
- const openAction = this._catDict.get("OpenAction");
- if (openAction) {
- appendIfJavaScriptDict("OpenAction", openAction);
- }
- return javaScript;
- }
- get javaScript() {
- const javaScript = this._collectJavaScript();
- return shadow(
- this,
- "javaScript",
- javaScript ? [...javaScript.values()] : null
- );
- }
- get jsActions() {
- const javaScript = this._collectJavaScript();
- let actions = collectActions(
- this.xref,
- this._catDict,
- DocumentActionEventType
- );
- if (javaScript) {
- if (!actions) {
- actions = Object.create(null);
- }
- for (const [key, val] of javaScript) {
- if (key in actions) {
- actions[key].push(val);
- } else {
- actions[key] = [val];
- }
- }
- }
- return shadow(this, "jsActions", actions);
- }
- async fontFallback(id, handler) {
- const translatedFonts = await Promise.all(this.fontCache);
- for (const translatedFont of translatedFonts) {
- if (translatedFont.loadedName === id) {
- translatedFont.fallback(handler);
- return;
- }
- }
- }
- async cleanup(manuallyTriggered = false) {
- clearGlobalCaches();
- this.globalImageCache.clear(/* onlyData = */ manuallyTriggered);
- this.pageKidsCountCache.clear();
- this.pageIndexCache.clear();
- this.nonBlendModesSet.clear();
- const translatedFonts = await Promise.all(this.fontCache);
- for (const { dict } of translatedFonts) {
- delete dict.cacheKey;
- }
- this.fontCache.clear();
- this.builtInCMapCache.clear();
- this.standardFontDataCache.clear();
- }
- async getPageDict(pageIndex) {
- const nodesToVisit = [this.toplevelPagesDict];
- const visitedNodes = new RefSet();
- const pagesRef = this._catDict.getRaw("Pages");
- if (pagesRef instanceof Ref) {
- visitedNodes.put(pagesRef);
- }
- const xref = this.xref,
- pageKidsCountCache = this.pageKidsCountCache,
- pageIndexCache = this.pageIndexCache;
- let currentPageIndex = 0;
- while (nodesToVisit.length) {
- const currentNode = nodesToVisit.pop();
- if (currentNode instanceof Ref) {
- const count = pageKidsCountCache.get(currentNode);
- // Skip nodes where the page can't be.
- if (count >= 0 && currentPageIndex + count <= pageIndex) {
- currentPageIndex += count;
- continue;
- }
- // Prevent circular references in the /Pages tree.
- if (visitedNodes.has(currentNode)) {
- throw new FormatError("Pages tree contains circular reference.");
- }
- visitedNodes.put(currentNode);
- const obj = await xref.fetchAsync(currentNode);
- if (obj instanceof Dict) {
- let type = obj.getRaw("Type");
- if (type instanceof Ref) {
- type = await xref.fetchAsync(type);
- }
- if (isName(type, "Page") || !obj.has("Kids")) {
- // Cache the Page reference, since it can *greatly* improve
- // performance by reducing redundant lookups in long documents
- // where all nodes are found at *one* level of the tree.
- if (!pageKidsCountCache.has(currentNode)) {
- pageKidsCountCache.put(currentNode, 1);
- }
- // Help improve performance of the `getPageIndex` method.
- if (!pageIndexCache.has(currentNode)) {
- pageIndexCache.put(currentNode, currentPageIndex);
- }
- if (currentPageIndex === pageIndex) {
- return [obj, currentNode];
- }
- currentPageIndex++;
- continue;
- }
- }
- nodesToVisit.push(obj);
- continue;
- }
- // Must be a child page dictionary.
- if (!(currentNode instanceof Dict)) {
- throw new FormatError(
- "Page dictionary kid reference points to wrong type of object."
- );
- }
- const { objId } = currentNode;
- let count = currentNode.getRaw("Count");
- if (count instanceof Ref) {
- count = await xref.fetchAsync(count);
- }
- if (Number.isInteger(count) && count >= 0) {
- // Cache the Kids count, since it can reduce redundant lookups in
- // documents where all nodes are found at *one* level of the tree.
- if (objId && !pageKidsCountCache.has(objId)) {
- pageKidsCountCache.put(objId, count);
- }
- // Skip nodes where the page can't be.
- if (currentPageIndex + count <= pageIndex) {
- currentPageIndex += count;
- continue;
- }
- }
- let kids = currentNode.getRaw("Kids");
- if (kids instanceof Ref) {
- kids = await xref.fetchAsync(kids);
- }
- if (!Array.isArray(kids)) {
- // Prevent errors in corrupt PDF documents that violate the
- // specification by *inlining* Page dicts directly in the Kids
- // array, rather than using indirect objects (fixes issue9540.pdf).
- let type = currentNode.getRaw("Type");
- if (type instanceof Ref) {
- type = await xref.fetchAsync(type);
- }
- if (isName(type, "Page") || !currentNode.has("Kids")) {
- if (currentPageIndex === pageIndex) {
- return [currentNode, null];
- }
- currentPageIndex++;
- continue;
- }
- throw new FormatError("Page dictionary kids object is not an array.");
- }
- // Always check all `Kids` nodes, to avoid getting stuck in an empty
- // node further down in the tree (see issue5644.pdf, issue8088.pdf),
- // and to ensure that we actually find the correct `Page` dict.
- for (let last = kids.length - 1; last >= 0; last--) {
- nodesToVisit.push(kids[last]);
- }
- }
- throw new Error(`Page index ${pageIndex} not found.`);
- }
- /**
- * Eagerly fetches the entire /Pages-tree; should ONLY be used as a fallback.
- * @returns {Promise<Map>}
- */
- async getAllPageDicts(recoveryMode = false) {
- const { ignoreErrors } = this.pdfManager.evaluatorOptions;
- const queue = [{ currentNode: this.toplevelPagesDict, posInKids: 0 }];
- const visitedNodes = new RefSet();
- const pagesRef = this._catDict.getRaw("Pages");
- if (pagesRef instanceof Ref) {
- visitedNodes.put(pagesRef);
- }
- const map = new Map(),
- xref = this.xref,
- pageIndexCache = this.pageIndexCache;
- let pageIndex = 0;
- function addPageDict(pageDict, pageRef) {
- // Help improve performance of the `getPageIndex` method.
- if (pageRef && !pageIndexCache.has(pageRef)) {
- pageIndexCache.put(pageRef, pageIndex);
- }
- map.set(pageIndex++, [pageDict, pageRef]);
- }
- function addPageError(error) {
- if (error instanceof XRefEntryException && !recoveryMode) {
- throw error;
- }
- if (recoveryMode && ignoreErrors && pageIndex === 0) {
- // Ensure that the viewer will always load (fixes issue15590.pdf).
- warn(`getAllPageDicts - Skipping invalid first page: "${error}".`);
- error = Dict.empty;
- }
- map.set(pageIndex++, [error, null]);
- }
- while (queue.length > 0) {
- const queueItem = queue.at(-1);
- const { currentNode, posInKids } = queueItem;
- let kids = currentNode.getRaw("Kids");
- if (kids instanceof Ref) {
- try {
- kids = await xref.fetchAsync(kids);
- } catch (ex) {
- addPageError(ex);
- break;
- }
- }
- if (!Array.isArray(kids)) {
- addPageError(
- new FormatError("Page dictionary kids object is not an array.")
- );
- break;
- }
- if (posInKids >= kids.length) {
- queue.pop();
- continue;
- }
- const kidObj = kids[posInKids];
- let obj;
- if (kidObj instanceof Ref) {
- // Prevent circular references in the /Pages tree.
- if (visitedNodes.has(kidObj)) {
- addPageError(
- new FormatError("Pages tree contains circular reference.")
- );
- break;
- }
- visitedNodes.put(kidObj);
- try {
- obj = await xref.fetchAsync(kidObj);
- } catch (ex) {
- addPageError(ex);
- break;
- }
- } else {
- // Prevent errors in corrupt PDF documents that violate the
- // specification by *inlining* Page dicts directly in the Kids
- // array, rather than using indirect objects (see issue9540.pdf).
- obj = kidObj;
- }
- if (!(obj instanceof Dict)) {
- addPageError(
- new FormatError(
- "Page dictionary kid reference points to wrong type of object."
- )
- );
- break;
- }
- let type = obj.getRaw("Type");
- if (type instanceof Ref) {
- try {
- type = await xref.fetchAsync(type);
- } catch (ex) {
- addPageError(ex);
- break;
- }
- }
- if (isName(type, "Page") || !obj.has("Kids")) {
- addPageDict(obj, kidObj instanceof Ref ? kidObj : null);
- } else {
- queue.push({ currentNode: obj, posInKids: 0 });
- }
- queueItem.posInKids++;
- }
- return map;
- }
- getPageIndex(pageRef) {
- const cachedPageIndex = this.pageIndexCache.get(pageRef);
- if (cachedPageIndex !== undefined) {
- return Promise.resolve(cachedPageIndex);
- }
- // The page tree nodes have the count of all the leaves below them. To get
- // how many pages are before we just have to walk up the tree and keep
- // adding the count of siblings to the left of the node.
- const xref = this.xref;
- function pagesBeforeRef(kidRef) {
- let total = 0,
- parentRef;
- return xref
- .fetchAsync(kidRef)
- .then(function (node) {
- if (
- isRefsEqual(kidRef, pageRef) &&
- !isDict(node, "Page") &&
- !(node instanceof Dict && !node.has("Type") && node.has("Contents"))
- ) {
- throw new FormatError(
- "The reference does not point to a /Page dictionary."
- );
- }
- if (!node) {
- return null;
- }
- if (!(node instanceof Dict)) {
- throw new FormatError("Node must be a dictionary.");
- }
- parentRef = node.getRaw("Parent");
- return node.getAsync("Parent");
- })
- .then(function (parent) {
- if (!parent) {
- return null;
- }
- if (!(parent instanceof Dict)) {
- throw new FormatError("Parent must be a dictionary.");
- }
- return parent.getAsync("Kids");
- })
- .then(function (kids) {
- if (!kids) {
- return null;
- }
- const kidPromises = [];
- let found = false;
- for (const kid of kids) {
- if (!(kid instanceof Ref)) {
- throw new FormatError("Kid must be a reference.");
- }
- if (isRefsEqual(kid, kidRef)) {
- found = true;
- break;
- }
- kidPromises.push(
- xref.fetchAsync(kid).then(function (obj) {
- if (!(obj instanceof Dict)) {
- throw new FormatError("Kid node must be a dictionary.");
- }
- if (obj.has("Count")) {
- total += obj.get("Count");
- } else {
- // Page leaf node.
- total++;
- }
- })
- );
- }
- if (!found) {
- throw new FormatError("Kid reference not found in parent's kids.");
- }
- return Promise.all(kidPromises).then(function () {
- return [total, parentRef];
- });
- });
- }
- let total = 0;
- const next = ref =>
- pagesBeforeRef(ref).then(args => {
- if (!args) {
- this.pageIndexCache.put(pageRef, total);
- return total;
- }
- const [count, parentRef] = args;
- total += count;
- return next(parentRef);
- });
- return next(pageRef);
- }
- get baseUrl() {
- const uri = this._catDict.get("URI");
- if (uri instanceof Dict) {
- const base = uri.get("Base");
- if (typeof base === "string") {
- const absoluteUrl = createValidAbsoluteUrl(base, null, {
- tryConvertEncoding: true,
- });
- if (absoluteUrl) {
- return shadow(this, "baseUrl", absoluteUrl.href);
- }
- }
- }
- return shadow(this, "baseUrl", null);
- }
- /**
- * @typedef {Object} ParseDestDictionaryParameters
- * @property {Dict} destDict - The dictionary containing the destination.
- * @property {Object} resultObj - The object where the parsed destination
- * properties will be placed.
- * @property {string} [docBaseUrl] - The document base URL that is used when
- * attempting to recover valid absolute URLs from relative ones.
- * @property {Object} [docAttachments] - The document attachments (may not
- * exist in most PDF documents).
- */
- /**
- * Helper function used to parse the contents of destination dictionaries.
- * @param {ParseDestDictionaryParameters} params
- */
- static parseDestDictionary(params) {
- const destDict = params.destDict;
- if (!(destDict instanceof Dict)) {
- warn("parseDestDictionary: `destDict` must be a dictionary.");
- return;
- }
- const resultObj = params.resultObj;
- if (typeof resultObj !== "object") {
- warn("parseDestDictionary: `resultObj` must be an object.");
- return;
- }
- const docBaseUrl = params.docBaseUrl || null;
- const docAttachments = params.docAttachments || null;
- let action = destDict.get("A"),
- url,
- dest;
- if (!(action instanceof Dict)) {
- if (destDict.has("Dest")) {
- // A /Dest entry should *only* contain a Name or an Array, but some bad
- // PDF generators ignore that and treat it as an /A entry.
- action = destDict.get("Dest");
- } else {
- action = destDict.get("AA");
- if (action instanceof Dict) {
- if (action.has("D")) {
- // MouseDown
- action = action.get("D");
- } else if (action.has("U")) {
- // MouseUp
- action = action.get("U");
- }
- }
- }
- }
- if (action instanceof Dict) {
- const actionType = action.get("S");
- if (!(actionType instanceof Name)) {
- warn("parseDestDictionary: Invalid type in Action dictionary.");
- return;
- }
- const actionName = actionType.name;
- switch (actionName) {
- case "ResetForm":
- const flags = action.get("Flags");
- const include = ((typeof flags === "number" ? flags : 0) & 1) === 0;
- const fields = [];
- const refs = [];
- for (const obj of action.get("Fields") || []) {
- if (obj instanceof Ref) {
- refs.push(obj.toString());
- } else if (typeof obj === "string") {
- fields.push(stringToPDFString(obj));
- }
- }
- resultObj.resetForm = { fields, refs, include };
- break;
- case "URI":
- url = action.get("URI");
- if (url instanceof Name) {
- // Some bad PDFs do not put parentheses around relative URLs.
- url = "/" + url.name;
- }
- break;
- case "GoTo":
- dest = action.get("D");
- break;
- case "Launch":
- // We neither want, nor can, support arbitrary 'Launch' actions.
- // However, in practice they are mostly used for linking to other PDF
- // files, which we thus attempt to support (utilizing `docBaseUrl`).
- /* falls through */
- case "GoToR":
- const urlDict = action.get("F");
- if (urlDict instanceof Dict) {
- // We assume that we found a FileSpec dictionary
- // and fetch the URL without checking any further.
- url = urlDict.get("F") || null;
- } else if (typeof urlDict === "string") {
- url = urlDict;
- }
- // NOTE: the destination is relative to the *remote* document.
- let remoteDest = action.get("D");
- if (remoteDest) {
- if (remoteDest instanceof Name) {
- remoteDest = remoteDest.name;
- }
- if (typeof url === "string") {
- const baseUrl = url.split("#")[0];
- if (typeof remoteDest === "string") {
- url = baseUrl + "#" + remoteDest;
- } else if (Array.isArray(remoteDest)) {
- url = baseUrl + "#" + JSON.stringify(remoteDest);
- }
- }
- }
- // The 'NewWindow' property, equal to `LinkTarget.BLANK`.
- const newWindow = action.get("NewWindow");
- if (typeof newWindow === "boolean") {
- resultObj.newWindow = newWindow;
- }
- break;
- case "GoToE":
- const target = action.get("T");
- let attachment;
- if (docAttachments && target instanceof Dict) {
- const relationship = target.get("R");
- const name = target.get("N");
- if (isName(relationship, "C") && typeof name === "string") {
- attachment = docAttachments[stringToPDFString(name)];
- }
- }
- if (attachment) {
- resultObj.attachment = attachment;
- } else {
- warn(`parseDestDictionary - unimplemented "GoToE" action.`);
- }
- break;
- case "Named":
- const namedAction = action.get("N");
- if (namedAction instanceof Name) {
- resultObj.action = namedAction.name;
- }
- break;
- case "SetOCGState":
- const state = action.get("State");
- const preserveRB = action.get("PreserveRB");
- if (!Array.isArray(state) || state.length === 0) {
- break;
- }
- const stateArr = [];
- for (const elem of state) {
- if (elem instanceof Name) {
- switch (elem.name) {
- case "ON":
- case "OFF":
- case "Toggle":
- stateArr.push(elem.name);
- break;
- }
- } else if (elem instanceof Ref) {
- stateArr.push(elem.toString());
- }
- }
- if (stateArr.length !== state.length) {
- break; // Some of the original entries are not valid.
- }
- resultObj.setOCGState = {
- state: stateArr,
- preserveRB: typeof preserveRB === "boolean" ? preserveRB : true,
- };
- break;
- case "JavaScript":
- const jsAction = action.get("JS");
- let js;
- if (jsAction instanceof BaseStream) {
- js = jsAction.getString();
- } else if (typeof jsAction === "string") {
- js = jsAction;
- }
- const jsURL = js && recoverJsURL(stringToPDFString(js));
- if (jsURL) {
- url = jsURL.url;
- resultObj.newWindow = jsURL.newWindow;
- break;
- }
- /* falls through */
- default:
- if (actionName === "JavaScript" || actionName === "SubmitForm") {
- // Don't bother the user with a warning for actions that require
- // scripting support, since those will be handled separately.
- break;
- }
- warn(`parseDestDictionary - unsupported action: "${actionName}".`);
- break;
- }
- } else if (destDict.has("Dest")) {
- // Simple destination.
- dest = destDict.get("Dest");
- }
- if (typeof url === "string") {
- const absoluteUrl = createValidAbsoluteUrl(url, docBaseUrl, {
- addDefaultProtocol: true,
- tryConvertEncoding: true,
- });
- if (absoluteUrl) {
- resultObj.url = absoluteUrl.href;
- }
- resultObj.unsafeUrl = url;
- }
- if (dest) {
- if (dest instanceof Name) {
- dest = dest.name;
- }
- if (typeof dest === "string") {
- resultObj.dest = stringToPDFString(dest);
- } else if (Array.isArray(dest)) {
- resultObj.dest = dest;
- }
- }
- }
- }
- export { Catalog };
|