UNPKG

pdfjs-dist/lib/core/parser.js

Version:
34.5 kB · JavaScript · View Raw
/**
* @licstart The following is the entire license notice for the
* JavaScript code in this page
*
* Copyright 2022 Mozilla Foundation
*
* Licensed under the Apache License, Version 2.0 (the "License");
* you may not use this file except in compliance with the License.
* You may obtain a copy of the License at
*
*     http://www.apache.org/licenses/LICENSE-2.0
*
* Unless required by applicable law or agreed to in writing, software
* distributed under the License is distributed on an "AS IS" BASIS,
* WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
* See the License for the specific language governing permissions and
* limitations under the License.
*
* @licend The above is the entire license notice for the
* JavaScript code in this page
*/
"use strict";

Object.defineProperty(exports, "__esModule", {
  value: true
});
exports.Parser = exports.Linearization = exports.Lexer = void 0;

var _util = require("../shared/util.js");

var _primitives = require("./primitives.js");

var _core_utils = require("./core_utils.js");

var _ascii_85_stream = require("./ascii_85_stream.js");

var _ascii_hex_stream = require("./ascii_hex_stream.js");

var _ccitt_stream = require("./ccitt_stream.js");

var _flate_stream = require("./flate_stream.js");

var _jbig2_stream = require("./jbig2_stream.js");

var _jpeg_stream = require("./jpeg_stream.js");

var _jpx_stream = require("./jpx_stream.js");

var _lzw_stream = require("./lzw_stream.js");

var _stream = require("./stream.js");

var _predictor_stream = require("./predictor_stream.js");

var _run_length_stream = require("./run_length_stream.js");

// Inline images are only cached by `Parser.makeInlineImage` when their data
// is shorter than this many bytes.
const MAX_LENGTH_TO_CACHE = 1000;
// Upper bound on the inline-image dictionary length that
// `Parser.makeInlineImage` will checksum for its cache key.
// NOTE(review): 5552 looks like the classic Adler-32 "NMAX" block size - confirm.
const MAX_ADLER32_LENGTH = 5552;
59
/**
 * Computes an Adler-32 style checksum over a byte sequence.
 *
 * The two running sums are only reduced modulo 65521 once, at the end, so
 * this is intended for short inputs. The result is assembled with 32-bit
 * bitwise operators and can therefore be negative when the high half has its
 * top bit set.
 *
 * @param {ArrayLike<number>} bytes - Input values; only the low 8 bits of
 *   each element are used.
 * @returns {number} `(b % 65521) << 16 | (a % 65521)` as a signed 32-bit int.
 */
function computeAdler32(bytes) {
  const bytesLength = bytes.length;
  let a = 1;
  let b = 0;

  for (let i = 0; i < bytesLength; ++i) {
    // Mask to a byte so signed/oversized elements cannot skew the sums.
    a += bytes[i] & 0xff;
    b += a;
  }

  return ((b % 65521) << 16) | (a % 65521);
}
72
/**
 * Builds PDF objects (arrays, dictionaries, references, streams and inline
 * images) from the tokens produced by a lexer, using a two-token look-ahead
 * buffer (`buf1`, `buf2`).
 */
class Parser {
  /**
   * @param {Object} params
   * @param {Object} params.lexer - Token source; `getObj()` and `stream` are
   *   used throughout, `peekObj()`/`knownCommands`/`beginInlineImagePos` by
   *   the inline-image code.
   * @param {Object} params.xref - Handed to every `Dict` created here; its
   *   `fetchIfRef` and `stats` members are used while applying filters.
   * @param {boolean} [params.allowStreams=false] - When false, a dictionary
   *   followed by `stream` is returned as a plain dictionary.
   * @param {boolean} [params.recoveryMode=false] - When true, an array or
   *   dictionary cut short by EOF is returned instead of throwing.
   */
  constructor({ lexer, xref, allowStreams = false, recoveryMode = false }) {
    this.lexer = lexer;
    this.xref = xref;
    this.allowStreams = allowStreams;
    this.recoveryMode = recoveryMode;
    this.imageCache = Object.create(null);
    this.refill();
  }

  /** Reloads both look-ahead slots from the lexer. */
  refill() {
    this.buf1 = this.lexer.getObj();
    this.buf2 = this.lexer.getObj();
  }

  /**
   * Advances the look-ahead window by one token. When the incoming token is
   * the `ID` command the lexer is NOT consulted, because what follows is raw
   * inline-image data rather than tokens.
   */
  shift() {
    if (this.buf2 instanceof _primitives.Cmd && this.buf2.cmd === "ID") {
      this.buf1 = this.buf2;
      this.buf2 = null;
    } else {
      this.buf1 = this.buf2;
      this.buf2 = this.lexer.getObj();
    }
  }

  /**
   * Like `shift()`, but reports lexer failures as `false` instead of
   * throwing. `MissingDataException` is always re-thrown.
   *
   * @returns {boolean} Whether the shift succeeded.
   */
  tryShift() {
    try {
      this.shift();
      return true;
    } catch (e) {
      if (e instanceof _core_utils.MissingDataException) {
        throw e;
      }

      return false;
    }
  }

  /**
   * Reads the next complete object.
   *
   * @param {Object|null} [cipherTransform=null] - When given, strings are
   *   passed through `decryptString` and streams through `createStream`.
   * @returns {*} The parsed object (array, Dict, Ref, stream, or the raw
   *   token for anything else).
   * @throws {ParserEOFException} On EOF inside an array or dictionary, unless
   *   `recoveryMode` is set.
   */
  getObj(cipherTransform = null) {
    const buf1 = this.buf1;
    this.shift();

    if (buf1 instanceof _primitives.Cmd) {
      switch (buf1.cmd) {
        case "BI":
          return this.makeInlineImage(cipherTransform);

        case "[": {
          const array = [];

          while (!(0, _primitives.isCmd)(this.buf1, "]") && this.buf1 !== _primitives.EOF) {
            array.push(this.getObj(cipherTransform));
          }

          if (this.buf1 === _primitives.EOF) {
            if (this.recoveryMode) {
              return array;
            }

            throw new _core_utils.ParserEOFException("End of file inside array.");
          }

          this.shift();
          return array;
        }

        case "<<": {
          const dict = new _primitives.Dict(this.xref);

          while (!(0, _primitives.isCmd)(this.buf1, ">>") && this.buf1 !== _primitives.EOF) {
            if (!(this.buf1 instanceof _primitives.Name)) {
              (0, _util.info)("Malformed dictionary: key must be a name object");
              this.shift();
              continue;
            }

            const key = this.buf1.name;
            this.shift();

            if (this.buf1 === _primitives.EOF) {
              break;
            }

            dict.set(key, this.getObj(cipherTransform));
          }

          if (this.buf1 === _primitives.EOF) {
            if (this.recoveryMode) {
              return dict;
            }

            throw new _core_utils.ParserEOFException("End of file inside dictionary.");
          }

          // `buf1` is still ">>" here, so `buf2` is the token right after the
          // dictionary; `makeStream` consumes the tokens itself.
          if ((0, _primitives.isCmd)(this.buf2, "stream")) {
            return this.allowStreams ? this.makeStream(dict, cipherTransform) : dict;
          }

          this.shift();
          return dict;
        }

        default:
          return buf1;
      }
    }

    if (Number.isInteger(buf1)) {
      // "<int> <int> R" is an indirect reference.
      if (Number.isInteger(this.buf1) && (0, _primitives.isCmd)(this.buf2, "R")) {
        const ref = _primitives.Ref.get(buf1, this.buf1);

        this.shift();
        this.shift();
        return ref;
      }

      return buf1;
    }

    if (typeof buf1 === "string") {
      if (cipherTransform) {
        return cipherTransform.decryptString(buf1);
      }

      return buf1;
    }

    return buf1;
  }

  /**
   * Scans raw inline-image data for the terminating `EI` operator when no
   * filter-specific end marker can be used.
   *
   * A candidate is "E", "I", then a space/LF/CR. It is accepted only if the
   * next few bytes look like text and, when `lexer.knownCommands` is
   * available, the following token is not an unknown command.
   *
   * @param {Object} stream - Positioned at the first byte of image data.
   * @returns {number} Length of the image data, measured from the stream
   *   position on entry.
   */
  findDefaultInlineStreamEnd(stream) {
    const E = 0x45,
          I = 0x49,
          SPACE = 0x20,
          LF = 0xa,
          CR = 0xd,
          NUL = 0x0;
    const lexer = this.lexer,
          startPos = stream.pos,
          n = 10;
    let state = 0,
        ch,
        maybeEIPos;

    while ((ch = stream.getByte()) !== -1) {
      if (state === 0) {
        state = ch === E ? 1 : 0;
      } else if (state === 1) {
        state = ch === I ? 2 : 0;
      } else {
        (0, _util.assert)(state === 2, "findDefaultInlineStreamEnd - invalid state.");

        if (ch === SPACE || ch === LF || ch === CR) {
          maybeEIPos = stream.pos;
          const followingBytes = stream.peekBytes(n);

          for (let i = 0, ii = followingBytes.length; i < ii; i++) {
            ch = followingBytes[i];

            // A lone NUL byte is tolerated; two in a row are not.
            if (ch === NUL && followingBytes[i + 1] !== NUL) {
              continue;
            }

            // Anything outside LF/CR/0x20-0x7f means we are still inside
            // binary image data, so this "EI" was a false positive.
            if (ch !== LF && ch !== CR && (ch < SPACE || ch > 0x7f)) {
              state = 0;
              break;
            }
          }

          if (state !== 2) {
            continue;
          }

          if (lexer.knownCommands) {
            const nextObj = lexer.peekObj();

            if (nextObj instanceof _primitives.Cmd && !lexer.knownCommands[nextObj.cmd]) {
              state = 0;
            }
          } else {
            (0, _util.warn)("findDefaultInlineStreamEnd - `lexer.knownCommands` is undefined.");
          }

          if (state === 2) {
            break;
          }
        } else {
          state = 0;
        }
      }
    }

    if (ch === -1) {
      (0, _util.warn)("findDefaultInlineStreamEnd: " + "Reached the end of the stream without finding a valid EI marker");

      if (maybeEIPos) {
        (0, _util.warn)('... trying to recover by using the last "EI" occurrence.');
        stream.skip(-(stream.pos - maybeEIPos));
      }
    }

    // Exclude "<ws>EI<ws>" from the data; if the byte four positions back is
    // not whitespace, only "EI<ws>" (three bytes) is excluded.
    let endOffset = 4;
    stream.skip(-endOffset);
    ch = stream.peekByte();
    stream.skip(endOffset);

    if (!(0, _core_utils.isWhiteSpace)(ch)) {
      endOffset--;
    }

    return stream.pos - endOffset - startPos;
  }

  /**
   * Finds the end of DCT (JPEG) inline-image data by walking 0xFF-prefixed
   * markers until the 0xFFD9 marker, skipping length-prefixed segments.
   * Falls back to `findDefaultInlineStreamEnd` if that marker is never found.
   *
   * @param {Object} stream - Positioned at the first byte of image data.
   * @returns {number} Length of the image data.
   */
  findDCTDecodeInlineStreamEnd(stream) {
    const startPos = stream.pos;
    let foundEOI = false,
        b,
        markerLength;

    while ((b = stream.getByte()) !== -1) {
      if (b !== 0xff) {
        continue;
      }

      switch (stream.getByte()) {
        case 0x00:
          break;

        case 0xff:
          // Re-examine this 0xff as a possible marker prefix.
          stream.skip(-1);
          break;

        case 0xd9:
          foundEOI = true;
          break;

        case 0xc0:
        case 0xc1:
        case 0xc2:
        case 0xc3:
        case 0xc5:
        case 0xc6:
        case 0xc7:
        case 0xc9:
        case 0xca:
        case 0xcb:
        case 0xcd:
        case 0xce:
        case 0xcf:
        case 0xc4:
        case 0xcc:
        case 0xda:
        case 0xdb:
        case 0xdc:
        case 0xdd:
        case 0xde:
        case 0xdf:
        case 0xe0:
        case 0xe1:
        case 0xe2:
        case 0xe3:
        case 0xe4:
        case 0xe5:
        case 0xe6:
        case 0xe7:
        case 0xe8:
        case 0xe9:
        case 0xea:
        case 0xeb:
        case 0xec:
        case 0xed:
        case 0xee:
        case 0xef:
        case 0xfe:
          markerLength = stream.getUint16();

          if (markerLength > 2) {
            // The length field counts its own two bytes.
            stream.skip(markerLength - 2);
          } else {
            // Implausible length: un-read it and keep scanning byte-wise.
            stream.skip(-2);
          }

          break;
      }

      if (foundEOI) {
        break;
      }
    }

    const length = stream.pos - startPos;

    if (b === -1) {
      (0, _util.warn)("Inline DCTDecode image stream: " + "EOI marker not found, searching for /EI/ instead.");
      stream.skip(-length);
      return this.findDefaultInlineStreamEnd(stream);
    }

    this.inlineStreamSkipEI(stream);
    return length;
  }

  /**
   * Finds the end of ASCII85 inline-image data by looking for "~" followed
   * (after optional whitespace) by ">". A "~", whitespace, then "EI" is also
   * accepted as the end. Falls back to `findDefaultInlineStreamEnd` on EOF.
   *
   * @param {Object} stream - Positioned at the first byte of image data.
   * @returns {number} Length of the image data.
   */
  findASCII85DecodeInlineStreamEnd(stream) {
    const TILDE = 0x7e,
          GT = 0x3e;
    const startPos = stream.pos;
    let ch;

    while ((ch = stream.getByte()) !== -1) {
      if (ch === TILDE) {
        const tildePos = stream.pos;
        ch = stream.peekByte();

        while ((0, _core_utils.isWhiteSpace)(ch)) {
          stream.skip();
          ch = stream.peekByte();
        }

        if (ch === GT) {
          stream.skip();
          break;
        }

        // Only when whitespace was actually skipped after the tilde.
        if (stream.pos > tildePos) {
          const maybeEI = stream.peekBytes(2);

          if (maybeEI[0] === 0x45 && maybeEI[1] === 0x49) {
            break;
          }
        }
      }
    }

    const length = stream.pos - startPos;

    if (ch === -1) {
      (0, _util.warn)("Inline ASCII85Decode image stream: " + "EOD marker not found, searching for /EI/ instead.");
      stream.skip(-length);
      return this.findDefaultInlineStreamEnd(stream);
    }

    this.inlineStreamSkipEI(stream);
    return length;
  }

  /**
   * Finds the end of ASCIIHex inline-image data by looking for ">".
   * Falls back to `findDefaultInlineStreamEnd` on EOF.
   *
   * @param {Object} stream - Positioned at the first byte of image data.
   * @returns {number} Length of the image data, including the ">" byte.
   */
  findASCIIHexDecodeInlineStreamEnd(stream) {
    const GT = 0x3e;
    const startPos = stream.pos;
    let ch;

    while ((ch = stream.getByte()) !== -1) {
      if (ch === GT) {
        break;
      }
    }

    const length = stream.pos - startPos;

    if (ch === -1) {
      (0, _util.warn)("Inline ASCIIHexDecode image stream: " + "EOD marker not found, searching for /EI/ instead.");
      stream.skip(-length);
      return this.findDefaultInlineStreamEnd(stream);
    }

    this.inlineStreamSkipEI(stream);
    return length;
  }

  /**
   * Advances `stream` past the next "EI" byte pair plus one following byte,
   * or to the end of the stream if none is found.
   *
   * @param {Object} stream
   */
  inlineStreamSkipEI(stream) {
    const E = 0x45,
          I = 0x49;
    let state = 0,
        ch;

    while ((ch = stream.getByte()) !== -1) {
      if (state === 0) {
        state = ch === E ? 1 : 0;
      } else if (state === 1) {
        state = ch === I ? 2 : 0;
      } else if (state === 2) {
        break;
      }
    }
  }

  /**
   * Parses an inline image: the key/value pairs up to `ID`, then the raw
   * image data, whose end is located with a filter-specific scanner.
   *
   * Small images are cached in `this.imageCache`, keyed by checksums of the
   * image bytes and of the dictionary bytes.
   *
   * @param {Object|null} cipherTransform
   * @returns {Object} The (possibly cached) filtered image stream.
   * @throws {FormatError} If a dictionary key is not a name object.
   */
  makeInlineImage(cipherTransform) {
    const lexer = this.lexer;
    const stream = lexer.stream;
    const dict = new _primitives.Dict(this.xref);
    let dictLength;

    while (!(0, _primitives.isCmd)(this.buf1, "ID") && this.buf1 !== _primitives.EOF) {
      if (!(this.buf1 instanceof _primitives.Name)) {
        throw new _util.FormatError("Dictionary key must be a name object");
      }

      const key = this.buf1.name;
      this.shift();

      if (this.buf1 === _primitives.EOF) {
        break;
      }

      dict.set(key, this.getObj(cipherTransform));
    }

    if (lexer.beginInlineImagePos !== -1) {
      dictLength = stream.pos - lexer.beginInlineImagePos;
    }

    const filter = dict.get("F", "Filter");
    let filterName;

    if (filter instanceof _primitives.Name) {
      filterName = filter.name;
    } else if (Array.isArray(filter)) {
      // Only the first filter decides how the end of the data is located.
      const filterZero = this.xref.fetchIfRef(filter[0]);

      if (filterZero instanceof _primitives.Name) {
        filterName = filterZero.name;
      }
    }

    const startPos = stream.pos;
    let length;

    switch (filterName) {
      case "DCT":
      case "DCTDecode":
        length = this.findDCTDecodeInlineStreamEnd(stream);
        break;

      case "A85":
      case "ASCII85Decode":
        length = this.findASCII85DecodeInlineStreamEnd(stream);
        break;

      case "AHx":
      case "ASCIIHexDecode":
        length = this.findASCIIHexDecodeInlineStreamEnd(stream);
        break;

      default:
        length = this.findDefaultInlineStreamEnd(stream);
    }

    let imageStream = stream.makeSubStream(startPos, length, dict);
    let cacheKey;

    // `dictLength` stays undefined when the lexer never saw "BI"; the
    // comparison is then false and caching is skipped.
    if (length < MAX_LENGTH_TO_CACHE && dictLength < MAX_ADLER32_LENGTH) {
      const imageBytes = imageStream.getBytes();
      imageStream.reset();
      const initialStreamPos = stream.pos;
      stream.pos = lexer.beginInlineImagePos;
      const dictBytes = stream.getBytes(dictLength);
      stream.pos = initialStreamPos;
      cacheKey = computeAdler32(imageBytes) + "_" + computeAdler32(dictBytes);
      const cacheEntry = this.imageCache[cacheKey];

      if (cacheEntry !== undefined) {
        this.buf2 = _primitives.Cmd.get("EI");
        this.shift();
        cacheEntry.reset();
        return cacheEntry;
      }
    }

    if (cipherTransform) {
      imageStream = cipherTransform.createStream(imageStream, length);
    }

    imageStream = this.filter(imageStream, dict, length);
    imageStream.dict = dict;

    if (cacheKey !== undefined) {
      imageStream.cacheKey = `inline_${length}_${cacheKey}`;
      this.imageCache[cacheKey] = imageStream;
    }

    // Re-prime the look-ahead buffer as if "EI" had just been lexed.
    this.buf2 = _primitives.Cmd.get("EI");
    this.shift();
    return imageStream;
  }

  /**
   * Searches forward from `startPos` for `signature`, scanning the stream in
   * fixed-size blocks.
   *
   * @param {number} startPos - Stream offset to start from.
   * @param {Uint8Array} signature - Byte sequence to look for.
   * @returns {number} Distance from `startPos` to the match, or -1. On a
   *   match the stream is left positioned at the start of the signature.
   */
  _findStreamLength(startPos, signature) {
    const { stream } = this.lexer;
    stream.pos = startPos;
    const SCAN_BLOCK_LENGTH = 2048;
    const signatureLength = signature.length;

    while (stream.pos < stream.end) {
      const scanBytes = stream.peekBytes(SCAN_BLOCK_LENGTH);
      // Stop short of the block end so a signature straddling two blocks is
      // found in the next (overlapping) block.
      const scanLength = scanBytes.length - signatureLength;

      if (scanLength <= 0) {
        break;
      }

      let pos = 0;

      while (pos < scanLength) {
        let j = 0;

        while (j < signatureLength && scanBytes[pos + j] === signature[j]) {
          j++;
        }

        if (j >= signatureLength) {
          stream.pos += pos;
          return stream.pos - startPos;
        }

        pos++;
      }

      stream.pos += scanLength;
    }

    return -1;
  }

  /**
   * Builds a stream object for the dictionary that was just parsed. Uses the
   * dictionary's `Length` when it leads to an `endstream` token, otherwise
   * scans for the "endstream" keyword (or that keyword missing its final
   * character, when followed by whitespace).
   *
   * @param {Dict} dict - The stream dictionary.
   * @param {Object|null} cipherTransform
   * @returns {Object} The decrypted/filtered stream with `dict` attached.
   * @throws {FormatError} If no endstream keyword can be located.
   */
  makeStream(dict, cipherTransform) {
    const lexer = this.lexer;
    let stream = lexer.stream;
    lexer.skipToNextLine();
    // The lexer has already read one byte past the line break.
    const startPos = stream.pos - 1;
    let length = dict.get("Length");

    if (!Number.isInteger(length)) {
      (0, _util.info)(`Bad length "${length && length.toString()}" in stream.`);
      length = 0;
    }

    stream.pos = startPos + length;
    lexer.nextChar();

    if (this.tryShift() && (0, _primitives.isCmd)(this.buf2, "endstream")) {
      this.shift();
    } else {
      // The bytes of "endstream".
      const ENDSTREAM_SIGNATURE = new Uint8Array([0x65, 0x6e, 0x64, 0x73, 0x74, 0x72, 0x65, 0x61, 0x6d]);

      let actualLength = this._findStreamLength(startPos, ENDSTREAM_SIGNATURE);

      if (actualLength < 0) {
        const MAX_TRUNCATION = 1;

        for (let i = 1; i <= MAX_TRUNCATION; i++) {
          const end = ENDSTREAM_SIGNATURE.length - i;
          const TRUNCATED_SIGNATURE = ENDSTREAM_SIGNATURE.slice(0, end);

          const maybeLength = this._findStreamLength(startPos, TRUNCATED_SIGNATURE);

          if (maybeLength >= 0) {
            // Only accept the truncated keyword when whitespace follows it.
            const lastByte = stream.peekBytes(end + 1)[end];

            if (!(0, _core_utils.isWhiteSpace)(lastByte)) {
              break;
            }

            (0, _util.info)(`Found "${(0, _util.bytesToString)(TRUNCATED_SIGNATURE)}" when ` + "searching for endstream command.");
            actualLength = maybeLength;
            break;
          }
        }

        if (actualLength < 0) {
          throw new _util.FormatError("Missing endstream command.");
        }
      }

      length = actualLength;
      lexer.nextChar();
      this.shift();
      this.shift();
    }

    this.shift();
    stream = stream.makeSubStream(startPos, length, dict);

    if (cipherTransform) {
      stream = cipherTransform.createStream(stream, length);
    }

    stream = this.filter(stream, dict, length);
    stream.dict = dict;
    return stream;
  }

  /**
   * Wraps `stream` in the decoder(s) named by the dictionary's filter entry
   * (`F`/`Filter`), pairing each with its `DP`/`DecodeParms` entry.
   *
   * @param {Object} stream
   * @param {Dict} dict
   * @param {number} length - Encoded length; only passed to the first filter.
   * @returns {Object} The outermost decoding stream, or `stream` unchanged
   *   when there is no filter.
   * @throws {FormatError} If an entry of a filter array is not a name.
   */
  filter(stream, dict, length) {
    let filter = dict.get("F", "Filter");
    let params = dict.get("DP", "DecodeParms");

    if (filter instanceof _primitives.Name) {
      if (Array.isArray(params)) {
        (0, _util.warn)("/DecodeParms should not be an Array, when /Filter is a Name.");
      }

      return this.makeFilter(stream, filter.name, length, params);
    }

    let maybeLength = length;

    if (Array.isArray(filter)) {
      const filterArray = filter;
      const paramsArray = params;

      for (let i = 0, ii = filterArray.length; i < ii; ++i) {
        filter = this.xref.fetchIfRef(filterArray[i]);

        if (!(filter instanceof _primitives.Name)) {
          throw new _util.FormatError(`Bad filter name "${filter}"`);
        }

        params = null;

        if (Array.isArray(paramsArray) && i in paramsArray) {
          params = this.xref.fetchIfRef(paramsArray[i]);
        }

        stream = this.makeFilter(stream, filter.name, maybeLength, params);
        // The length is unknown after the first decoding stage.
        maybeLength = null;
      }
    }

    return stream;
  }

  /**
   * Creates the decoding stream for a single named filter.
   *
   * @param {Object} stream - Source stream.
   * @param {string} name - Filter name, full or abbreviated.
   * @param {number|null} maybeLength - Encoded length when known.
   * @param {Dict|null} params - Decode parameters for this filter.
   * @returns {Object} The decoder; `stream` itself for an unsupported filter;
   *   a `NullStream` for a zero length or when constructing the decoder
   *   throws (other than `MissingDataException`, which propagates).
   */
  makeFilter(stream, name, maybeLength, params) {
    if (maybeLength === 0) {
      (0, _util.warn)(`Empty "${name}" stream.`);
      return new _stream.NullStream();
    }

    const xrefStats = this.xref.stats;

    try {
      switch (name) {
        case "Fl":
        case "FlateDecode":
          xrefStats.addStreamType(_util.StreamType.FLATE);

          if (params) {
            return new _predictor_stream.PredictorStream(new _flate_stream.FlateStream(stream, maybeLength), maybeLength, params);
          }

          return new _flate_stream.FlateStream(stream, maybeLength);

        case "LZW":
        case "LZWDecode": {
          xrefStats.addStreamType(_util.StreamType.LZW);
          let earlyChange = 1;

          if (params) {
            if (params.has("EarlyChange")) {
              earlyChange = params.get("EarlyChange");
            }

            return new _predictor_stream.PredictorStream(new _lzw_stream.LZWStream(stream, maybeLength, earlyChange), maybeLength, params);
          }

          return new _lzw_stream.LZWStream(stream, maybeLength, earlyChange);
        }

        case "DCT":
        case "DCTDecode":
          xrefStats.addStreamType(_util.StreamType.DCT);
          return new _jpeg_stream.JpegStream(stream, maybeLength, params);

        case "JPX":
        case "JPXDecode":
          xrefStats.addStreamType(_util.StreamType.JPX);
          return new _jpx_stream.JpxStream(stream, maybeLength, params);

        case "A85":
        case "ASCII85Decode":
          xrefStats.addStreamType(_util.StreamType.A85);
          return new _ascii_85_stream.Ascii85Stream(stream, maybeLength);

        case "AHx":
        case "ASCIIHexDecode":
          xrefStats.addStreamType(_util.StreamType.AHX);
          return new _ascii_hex_stream.AsciiHexStream(stream, maybeLength);

        case "CCF":
        case "CCITTFaxDecode":
          xrefStats.addStreamType(_util.StreamType.CCF);
          return new _ccitt_stream.CCITTFaxStream(stream, maybeLength, params);

        case "RL":
        case "RunLengthDecode":
          xrefStats.addStreamType(_util.StreamType.RLX);
          return new _run_length_stream.RunLengthStream(stream, maybeLength);

        case "JBIG2Decode":
          xrefStats.addStreamType(_util.StreamType.JBIG);
          return new _jbig2_stream.Jbig2Stream(stream, maybeLength, params);
      }

      (0, _util.warn)(`Filter "${name}" is not supported.`);
      return stream;
    } catch (ex) {
      if (ex instanceof _core_utils.MissingDataException) {
        throw ex;
      }

      (0, _util.warn)(`Invalid stream: "${ex}"`);
      return new _stream.NullStream();
    }
  }
}
788
// Publish the Parser class on the CommonJS exports object.
exports.Parser = Parser;
// Per-byte classification table used by the lexer, indexed by byte value:
//   1 - treated as whitespace (NUL, TAB, LF, FF, CR, SPACE)
//   2 - delimiter that ends a token ( % ( ) / < > [ ] { } )
//   0 - regular character
// prettier-ignore
const specialChars = [
  1, 0, 0, 0, 0, 0, 0, 0, 0, 1, 1, 0, 1, 1, 0, 0, // 0x
  0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, // 1x
  1, 0, 0, 0, 0, 2, 0, 0, 2, 2, 0, 0, 0, 0, 0, 2, // 2x
  0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 2, 0, 2, 0, // 3x
  0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, // 4x
  0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 2, 0, 2, 0, 0, // 5x
  0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, // 6x
  0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 2, 0, 2, 0, 0, // 7x
  0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, // 8x
  0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, // 9x
  0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, // ax
  0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, // bx
  0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, // cx
  0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, // dx
  0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, // ex
  0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0  // fx
];
791
/**
 * Converts the character code of a hexadecimal digit to its numeric value.
 *
 * @param {number} ch - Character code.
 * @returns {number} 0-15 for "0"-"9", "A"-"F" and "a"-"f"; -1 otherwise.
 */
function toHexDigit(ch) {
  if (ch >= 0x30 && ch <= 0x39) {
    // "0"-"9": the low nibble is the digit value.
    return ch & 0x0f;
  }

  if ((ch >= 0x41 && ch <= 0x46) || (ch >= 0x61 && ch <= 0x66)) {
    // "A"-"F" / "a"-"f": the low nibble is 1-6, so add 9 to get 10-15.
    return (ch & 0x0f) + 9;
  }

  return -1;
}
803
/**
 * Tokenizer for PDF syntax. Reads bytes from `stream` and produces numbers,
 * strings, names, booleans, `null`, commands and the EOF sentinel.
 */
class Lexer {
  /**
   * @param {Object} stream - Byte source; `getByte()`, `peekByte()` and a
   *   readable/writable `pos` are used.
   * @param {Object|null} [knownCommands=null] - Optional lookup of valid
   *   command names, used to split run-together commands.
   */
  constructor(stream, knownCommands = null) {
    this.stream = stream;
    this.nextChar();
    // Scratch buffer shared by the string/name readers.
    this.strBuf = [];
    this.knownCommands = knownCommands;
    this._hexStringNumWarn = 0;
    // Stream position right after the most recent "BI" command, or -1.
    this.beginInlineImagePos = -1;
  }

  /**
   * Reads the next byte and makes it the current character.
   * @returns {number} The byte, as returned by `stream.getByte()`.
   */
  nextChar() {
    return this.currentChar = this.stream.getByte();
  }

  /**
   * @returns {number} The upcoming byte, without consuming it.
   */
  peekChar() {
    return this.stream.peekByte();
  }

  /**
   * Reads a number starting at the current character. Tolerates a doubled
   * leading minus sign, line breaks after the sign, and minus signs in the
   * middle of the digits (ignored with a warning).
   *
   * @returns {number}
   * @throws {FormatError} If no digit is found. A lone "." or "-" followed
   *   by whitespace or EOF yields 0 instead.
   */
  getNumber() {
    let ch = this.currentChar;
    let eNotation = false;
    let divideBy = 0;
    let sign = 0;

    if (ch === 0x2d) {
      sign = -1;
      ch = this.nextChar();

      if (ch === 0x2d) {
        // Ignore a second minus sign.
        ch = this.nextChar();
      }
    } else if (ch === 0x2b) {
      sign = 1;
      ch = this.nextChar();
    }

    if (ch === 0x0a || ch === 0x0d) {
      do {
        ch = this.nextChar();
      } while (ch === 0x0a || ch === 0x0d);
    }

    if (ch === 0x2e) {
      divideBy = 10;
      ch = this.nextChar();
    }

    if (ch < 0x30 || ch > 0x39) {
      if ((0, _core_utils.isWhiteSpace)(ch) || ch === -1) {
        if (divideBy === 10 && sign === 0) {
          (0, _util.warn)("Lexer.getNumber - treating a single decimal point as zero.");
          return 0;
        }

        if (divideBy === 0 && sign === -1) {
          (0, _util.warn)("Lexer.getNumber - treating a single minus sign as zero.");
          return 0;
        }
      }

      throw new _util.FormatError(`Invalid number: ${String.fromCharCode(ch)} (charCode ${ch})`);
    }

    sign = sign || 1;
    let baseValue = ch - 0x30;
    let powerValue = 0;
    let powerValueSign = 1;

    while ((ch = this.nextChar()) >= 0) {
      if (ch >= 0x30 && ch <= 0x39) {
        const currentDigit = ch - 0x30;

        if (eNotation) {
          powerValue = powerValue * 10 + currentDigit;
        } else {
          if (divideBy !== 0) {
            divideBy *= 10;
          }

          baseValue = baseValue * 10 + currentDigit;
        }
      } else if (ch === 0x2e) {
        if (divideBy === 0) {
          divideBy = 1;
        } else {
          // A second decimal point ends the number.
          break;
        }
      } else if (ch === 0x2d) {
        (0, _util.warn)("Badly formatted number: minus sign in the middle");
      } else if (ch === 0x45 || ch === 0x65) {
        // "E"/"e" only starts an exponent when a sign or digit follows.
        ch = this.peekChar();

        if (ch === 0x2b || ch === 0x2d) {
          powerValueSign = ch === 0x2d ? -1 : 1;
          this.nextChar();
        } else if (ch < 0x30 || ch > 0x39) {
          break;
        }

        eNotation = true;
      } else {
        break;
      }
    }

    if (divideBy !== 0) {
      baseValue /= divideBy;
    }

    if (eNotation) {
      baseValue *= 10 ** (powerValueSign * powerValue);
    }

    return sign * baseValue;
  }

  /**
   * Reads a literal string. The current character is the opening "(".
   * Handles nested parentheses, backslash escapes, 1-3 digit octal escapes
   * and backslash line continuations.
   *
   * @returns {string}
   */
  getString() {
    let numParen = 1;
    let done = false;
    const strBuf = this.strBuf;
    strBuf.length = 0;
    let ch = this.nextChar();

    while (true) {
      // Set when `ch` already holds the next unprocessed character.
      let charBuffered = false;

      switch (ch | 0) {
        case -1:
          (0, _util.warn)("Unterminated string");
          done = true;
          break;

        case 0x28:
          ++numParen;
          strBuf.push("(");
          break;

        case 0x29:
          if (--numParen === 0) {
            this.nextChar();
            done = true;
          } else {
            strBuf.push(")");
          }

          break;

        case 0x5c:
          ch = this.nextChar();

          switch (ch) {
            case -1:
              (0, _util.warn)("Unterminated string");
              done = true;
              break;

            case 0x6e:
              strBuf.push("\n");
              break;

            case 0x72:
              strBuf.push("\r");
              break;

            case 0x74:
              strBuf.push("\t");
              break;

            case 0x62:
              strBuf.push("\b");
              break;

            case 0x66:
              strBuf.push("\f");
              break;

            case 0x5c:
            case 0x28:
            case 0x29:
              strBuf.push(String.fromCharCode(ch));
              break;

            case 0x30:
            case 0x31:
            case 0x32:
            case 0x33:
            case 0x34:
            case 0x35:
            case 0x36:
            case 0x37: {
              let x = ch & 0x0f;
              ch = this.nextChar();
              charBuffered = true;

              if (ch >= 0x30 && ch <= 0x37) {
                x = (x << 3) + (ch & 0x0f);
                ch = this.nextChar();

                if (ch >= 0x30 && ch <= 0x37) {
                  charBuffered = false;
                  x = (x << 3) + (ch & 0x0f);
                }
              }

              strBuf.push(String.fromCharCode(x));
              break;
            }

            case 0x0d:
              // Backslash + CR (+ LF) is a line continuation.
              if (this.peekChar() === 0x0a) {
                this.nextChar();
              }

              break;

            case 0x0a:
              break;

            default:
              strBuf.push(String.fromCharCode(ch));
              break;
          }

          break;

        default:
          strBuf.push(String.fromCharCode(ch));
          break;
      }

      if (done) {
        break;
      }

      if (!charBuffered) {
        ch = this.nextChar();
      }
    }

    return strBuf.join("");
  }

  /**
   * Reads a name. The current character is the leading "/". "#xx" hex
   * escapes are decoded; malformed escapes are kept literally with a
   * warning.
   *
   * @returns {Name} Result of `Name.get` for the decoded text.
   */
  getName() {
    let ch, previousCh;
    const strBuf = this.strBuf;
    strBuf.length = 0;

    while ((ch = this.nextChar()) >= 0 && !specialChars[ch]) {
      if (ch === 0x23) {
        ch = this.nextChar();

        if (specialChars[ch]) {
          (0, _util.warn)("Lexer_getName: " + "NUMBER SIGN (#) should be followed by a hexadecimal number.");
          strBuf.push("#");
          break;
        }

        const x = toHexDigit(ch);

        if (x !== -1) {
          previousCh = ch;
          ch = this.nextChar();
          const x2 = toHexDigit(ch);

          if (x2 === -1) {
            (0, _util.warn)(`Lexer_getName: Illegal digit (${String.fromCharCode(ch)}) ` + "in hexadecimal number.");
            strBuf.push("#", String.fromCharCode(previousCh));

            if (specialChars[ch]) {
              break;
            }

            strBuf.push(String.fromCharCode(ch));
            continue;
          }

          strBuf.push(String.fromCharCode(x << 4 | x2));
        } else {
          strBuf.push("#", String.fromCharCode(ch));
        }
      } else {
        strBuf.push(String.fromCharCode(ch));
      }
    }

    if (strBuf.length > 127) {
      (0, _util.warn)(`Name token is longer than allowed by the spec: ${strBuf.length}`);
    }

    return _primitives.Name.get(strBuf.join(""));
  }

  /**
   * Rate-limited warning for invalid characters inside a hex string: the
   * first few are reported individually, then one summary, then nothing.
   *
   * @param {number} ch - The offending character code.
   */
  _hexStringWarn(ch) {
    const MAX_HEX_STRING_NUM_WARN = 5;

    if (this._hexStringNumWarn++ === MAX_HEX_STRING_NUM_WARN) {
      (0, _util.warn)("getHexString - ignoring additional invalid characters.");
      return;
    }

    if (this._hexStringNumWarn > MAX_HEX_STRING_NUM_WARN) {
      return;
    }

    (0, _util.warn)(`getHexString - ignoring invalid character: ${ch}`);
  }

  /**
   * Reads a hexadecimal string. The current character is the first one
   * after the opening "<". Whitespace is skipped and invalid characters are
   * ignored with a warning.
   *
   * @returns {string} One character per decoded byte.
   */
  getHexString() {
    const strBuf = this.strBuf;
    strBuf.length = 0;
    let ch = this.currentChar;
    // Value of the pending high nibble, or -1 when none is pending.
    let firstDigit = -1;
    this._hexStringNumWarn = 0;

    while (true) {
      if (ch < 0) {
        (0, _util.warn)("Unterminated hex string");
        break;
      } else if (ch === 0x3e) {
        this.nextChar();
        break;
      } else if (specialChars[ch] === 1) {
        ch = this.nextChar();
        continue;
      } else {
        const digit = toHexDigit(ch);

        if (digit === -1) {
          this._hexStringWarn(ch);
        } else if (firstDigit === -1) {
          firstDigit = digit;
        } else {
          strBuf.push(String.fromCharCode(firstDigit << 4 | digit));
          firstDigit = -1;
        }

        ch = this.nextChar();
      }
    }

    // PDF spec, "Hexadecimal Strings": with an odd number of digits the
    // missing final digit is assumed to be 0, so the lone high nibble must
    // not be dropped.
    if (firstDigit !== -1) {
      strBuf.push(String.fromCharCode(firstDigit << 4));
    }

    return strBuf.join("");
  }

  /**
   * Reads the next token, skipping whitespace and "%" comments.
   *
   * @returns {*} A number, string, Name, boolean, `null`, Cmd, or the EOF
   *   sentinel.
   * @throws {FormatError} On a stray ")" or an over-long command token.
   */
  getObj() {
    let comment = false;
    let ch = this.currentChar;

    while (true) {
      if (ch < 0) {
        return _primitives.EOF;
      }

      if (comment) {
        if (ch === 0x0a || ch === 0x0d) {
          comment = false;
        }
      } else if (ch === 0x25) {
        comment = true;
      } else if (specialChars[ch] !== 1) {
        break;
      }

      ch = this.nextChar();
    }

    switch (ch | 0) {
      case 0x30:
      case 0x31:
      case 0x32:
      case 0x33:
      case 0x34:
      case 0x35:
      case 0x36:
      case 0x37:
      case 0x38:
      case 0x39:
      case 0x2b:
      case 0x2d:
      case 0x2e:
        return this.getNumber();

      case 0x28:
        return this.getString();

      case 0x2f:
        return this.getName();

      case 0x5b:
        this.nextChar();
        return _primitives.Cmd.get("[");

      case 0x5d:
        this.nextChar();
        return _primitives.Cmd.get("]");

      case 0x3c:
        ch = this.nextChar();

        if (ch === 0x3c) {
          this.nextChar();
          return _primitives.Cmd.get("<<");
        }

        return this.getHexString();

      case 0x3e:
        ch = this.nextChar();

        if (ch === 0x3e) {
          this.nextChar();
          return _primitives.Cmd.get(">>");
        }

        return _primitives.Cmd.get(">");

      case 0x7b:
        this.nextChar();
        return _primitives.Cmd.get("{");

      case 0x7d:
        this.nextChar();
        return _primitives.Cmd.get("}");

      case 0x29:
        this.nextChar();
        throw new _util.FormatError(`Illegal character: ${ch}`);
    }

    let str = String.fromCharCode(ch);

    // A non-printable byte directly followed by a printable one is emitted
    // as a single-character command of its own.
    if (ch < 0x20 || ch > 0x7f) {
      const nextCh = this.peekChar();

      if (nextCh >= 0x20 && nextCh <= 0x7f) {
        this.nextChar();
        return _primitives.Cmd.get(str);
      }
    }

    const knownCommands = this.knownCommands;
    let knownCommandFound = knownCommands && knownCommands[str] !== undefined;

    while ((ch = this.nextChar()) >= 0 && !specialChars[ch]) {
      const possibleCommand = str + String.fromCharCode(ch);

      // Stop at the known command if one more character would make it
      // unknown (splits commands written without separating whitespace).
      if (knownCommandFound && knownCommands[possibleCommand] === undefined) {
        break;
      }

      if (str.length === 128) {
        throw new _util.FormatError(`Command token too long: ${str.length}`);
      }

      str = possibleCommand;
      knownCommandFound = knownCommands && knownCommands[str] !== undefined;
    }

    if (str === "true") {
      return true;
    }

    if (str === "false") {
      return false;
    }

    if (str === "null") {
      return null;
    }

    if (str === "BI") {
      this.beginInlineImagePos = this.stream.pos;
    }

    return _primitives.Cmd.get(str);
  }

  /**
   * Returns the next token without consuming it: lexer and stream state are
   * restored afterwards. Lexing errors other than `MissingDataException`
   * are logged, and `undefined` is returned.
   *
   * @returns {*} The upcoming token, or `undefined` on a lexing error.
   */
  peekObj() {
    const streamPos = this.stream.pos,
          currentChar = this.currentChar,
          beginInlineImagePos = this.beginInlineImagePos;
    let nextObj;

    try {
      nextObj = this.getObj();
    } catch (ex) {
      if (ex instanceof _core_utils.MissingDataException) {
        throw ex;
      }

      (0, _util.warn)(`peekObj: ${ex}`);
    }

    this.stream.pos = streamPos;
    this.currentChar = currentChar;
    this.beginInlineImagePos = beginInlineImagePos;
    return nextObj;
  }

  /**
   * Advances past the next line break (CR, LF or CRLF), leaving the current
   * character at the first character of the following line.
   */
  skipToNextLine() {
    let ch = this.currentChar;

    while (ch >= 0) {
      if (ch === 0x0d) {
        ch = this.nextChar();

        if (ch === 0x0a) {
          this.nextChar();
        }

        break;
      } else if (ch === 0x0a) {
        this.nextChar();
        break;
      }

      ch = this.nextChar();
    }
  }
}
1336
// Publish the Lexer class on the CommonJS exports object.
exports.Lexer = Lexer;
1338
/**
 * Reader for the linearization parameter dictionary found at the start of a
 * linearized PDF file.
 */
class Linearization {
  /**
   * Parses "<int> <int> obj <dict>" from the start of `stream` and validates
   * the linearization parameters.
   *
   * @param {Object} stream - Source stream; its `length` must equal the
   *   dictionary's "L" entry.
   * @returns {Object|null} `null` when the leading object is not a
   *   linearization dictionary (no positive numeric "Linearized" entry);
   *   otherwise an object with `length`, `hints`, `objectNumberFirst`,
   *   `endFirst`, `numPages`, `mainXRefEntriesOffset` and `pageFirst`.
   * @throws {Error} If a required parameter is missing or invalid, or "L"
   *   does not match the stream length.
   */
  static create(stream) {
    // Returns a positive (or, optionally, non-negative) integer entry.
    function getInt(linDict, name, allowZeroValue = false) {
      const obj = linDict.get(name);

      if (Number.isInteger(obj) && (allowZeroValue ? obj >= 0 : obj > 0)) {
        return obj;
      }

      throw new Error(`The "${name}" parameter in the linearization ` + "dictionary is invalid.");
    }

    // Returns the "H" array: 2 or 4 positive integers.
    function getHints(linDict) {
      const hints = linDict.get("H");
      let hintsLength;

      if (Array.isArray(hints) && ((hintsLength = hints.length) === 2 || hintsLength === 4)) {
        for (let index = 0; index < hintsLength; index++) {
          const hint = hints[index];

          if (!(Number.isInteger(hint) && hint > 0)) {
            throw new Error(`Hint (${index}) in the linearization dictionary is invalid.`);
          }
        }

        return hints;
      }

      throw new Error("Hint array in the linearization dictionary is invalid.");
    }

    const parser = new Parser({
      lexer: new Lexer(stream),
      xref: null
    });
    const obj1 = parser.getObj();
    const obj2 = parser.getObj();
    const obj3 = parser.getObj();
    const linDict = parser.getObj();
    let obj, length;

    if (!(Number.isInteger(obj1) && Number.isInteger(obj2) && (0, _primitives.isCmd)(obj3, "obj") && linDict instanceof _primitives.Dict && typeof (obj = linDict.get("Linearized")) === "number" && obj > 0)) {
      return null;
    } else if ((length = getInt(linDict, "L")) !== stream.length) {
      throw new Error('The "L" parameter in the linearization dictionary ' + "does not equal the stream length.");
    }

    return {
      length,
      hints: getHints(linDict),
      objectNumberFirst: getInt(linDict, "O"),
      endFirst: getInt(linDict, "E"),
      numPages: getInt(linDict, "N"),
      mainXRefEntriesOffset: getInt(linDict, "T"),
      // "P" is optional and, unlike the others, may legitimately be 0.
      pageFirst: linDict.has("P") ? getInt(linDict, "P", true) : 0
    };
  }
}
1398
// Publish the Linearization class on the CommonJS exports object.
exports.Linearization = Linearization;
\No newline at end of file
1	`/**`
2	`* @licstart The following is the entire license notice for the`
3	`* JavaScript code in this page`
4	`*`
5	`* Copyright 2022 Mozilla Foundation`
6	`*`
7	`* Licensed under the Apache License, Version 2.0 (the "License");`
8	`* you may not use this file except in compliance with the License.`
9	`* You may obtain a copy of the License at`
10	`*`
11	`* http://www.apache.org/licenses/LICENSE-2.0`
12	`*`
13	`* Unless required by applicable law or agreed to in writing, software`
14	`* distributed under the License is distributed on an "AS IS" BASIS,`
15	`* WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.`
16	`* See the License for the specific language governing permissions and`
17	`* limitations under the License.`
18	`*`
19	`* @licend The above is the entire license notice for the`
20	`* JavaScript code in this page`
21	`*/`
22	`"use strict";`
23
24	`Object.defineProperty(exports, "__esModule", {`
25	`value: true`
26	`});`
27	`exports.Parser = exports.Linearization = exports.Lexer = void 0;`
28
29	`var _util = require("../shared/util.js");`
30
31	`var _primitives = require("./primitives.js");`
32
33	`var _core_utils = require("./core_utils.js");`
34
35	`var _ascii_85_stream = require("./ascii_85_stream.js");`
36
37	`var _ascii_hex_stream = require("./ascii_hex_stream.js");`
38
39	`var _ccitt_stream = require("./ccitt_stream.js");`
40