/**
 * @licstart The following is the entire license notice for the
 * JavaScript code in this page
 *
 * Copyright 2022 Mozilla Foundation
 *
 * Licensed under the Apache License, Version 2.0 (the "License");
 * you may not use this file except in compliance with the License.
 * You may obtain a copy of the License at
 *
 *     http://www.apache.org/licenses/LICENSE-2.0
 *
 * Unless required by applicable law or agreed to in writing, software
 * distributed under the License is distributed on an "AS IS" BASIS,
 * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
 * See the License for the specific language governing permissions and
 * limitations under the License.
 *
 * @licend The above is the entire license notice for the
 * JavaScript code in this page
 */
|
"use strict";
|
|
Object.defineProperty(exports, "__esModule", {
|
value: true
|
});
|
exports.WorkerTask = exports.WorkerMessageHandler = void 0;
|
|
var _util = require("../shared/util.js");
|
|
var _primitives = require("./primitives.js");
|
|
var _core_utils = require("./core_utils.js");
|
|
var _pdf_manager = require("./pdf_manager.js");
|
|
var _cleanup_helper = require("./cleanup_helper.js");
|
|
var _writer = require("./writer.js");
|
|
var _is_node = require("../shared/is_node.js");
|
|
var _message_handler = require("../shared/message_handler.js");
|
|
var _worker_stream = require("./worker_stream.js");
|
|
/**
 * Bookkeeping object for one unit of work running in the worker.
 *
 * A task carries a name, a `terminated` flag that cooperative code can poll
 * through `ensureNotTerminated()`, and a promise (`finished`) that is resolved
 * once `finish()` has been called.
 */
class WorkerTask {
  /**
   * @param {string} name - Label identifying the task.
   */
  constructor(name) {
    this.name = name;
    this.terminated = false;
    this._capability = (0, _util.createPromiseCapability)();
  }

  /**
   * @returns {Promise<void>} The promise that `finish()` resolves.
   */
  get finished() {
    return this._capability.promise;
  }

  /** Marks the task as done by resolving the `finished` promise. */
  finish() {
    this._capability.resolve();
  }

  /**
   * Flags the task as terminated. This only sets the flag; running code is
   * expected to notice it via `ensureNotTerminated()`.
   */
  terminate() {
    this.terminated = true;
  }

  /**
   * @throws {Error} "Worker task was terminated" when `terminate()` has
   *   already been called on this task.
   */
  ensureNotTerminated() {
    if (this.terminated) {
      throw new Error("Worker task was terminated");
    }
  }
}
|
|
exports.WorkerTask = WorkerTask;
|
|
/**
 * Worker-side dispatcher: registers the message handlers through which the
 * API side configures the worker, opens a document and queries it.
 */
class WorkerMessageHandler {
  /**
   * Registers the document-independent handlers ("test", "configure" and
   * "GetDocRequest") on `handler`.
   *
   * @param {Object} handler - Message handler exposing `on` and `send`.
   * @param {Object} port - Communication port, forwarded unchanged to
   *   `createDocumentHandler` for every "GetDocRequest".
   */
  static setup(handler, port) {
    let testMessageProcessed = false;

    handler.on("test", function wphSetupTest(data) {
      // Only the first "test" message is answered; later ones are ignored.
      if (testMessageProcessed) {
        return;
      }

      testMessageProcessed = true;
      // Reply with whether the payload arrived as a `Uint8Array`.
      handler.send("test", data instanceof Uint8Array);
    });

    handler.on("configure", function wphConfigure(data) {
      (0, _util.setVerbosityLevel)(data.verbosity);
    });

    handler.on("GetDocRequest", function wphSetupDoc(data) {
      return WorkerMessageHandler.createDocumentHandler(data, port);
    });
  }

  /**
   * Creates a dedicated message handler for one document and registers all
   * per-document handlers on it. Loading itself starts when the "Ready"
   * message is received.
   *
   * @param {Object} docParams - Document parameters; this method reads
   *   `apiVersion`, `docId`, `docBaseUrl`, `source`, `enableXfa` and the
   *   evaluator option fields.
   * @param {Object} port - Communication port given to the new handler.
   * @returns {string} The name of the created handler (`<docId>_worker`).
   * @throws {Error} If the API and worker versions differ, if
   *   `Array.prototype` has enumerable properties, or if `ReadableStream` is
   *   not available.
   */
  static createDocumentHandler(docParams, port) {
    let pdfManager;
    let terminated = false;
    let cancelXHRs = null;
    const WorkerTasks = [];
    const verbosity = (0, _util.getVerbosityLevel)();
    const apiVersion = docParams.apiVersion;
    const workerVersion = "2.16.105";

    if (apiVersion !== workerVersion) {
      throw new Error(`The API version "${apiVersion}" does not match ` + `the Worker version "${workerVersion}".`);
    }

    // Detect enumerable additions to `Array.prototype`: `for...in` over an
    // empty array must not yield anything.
    const enumerableProperties = [];

    for (const property in []) {
      enumerableProperties.push(property);
    }

    if (enumerableProperties.length) {
      throw new Error("The `Array.prototype` contains unexpected enumerable properties: " + enumerableProperties.join(", ") + "; thus breaking e.g. `for...in` iteration of `Array`s.");
    }

    if (typeof ReadableStream === "undefined") {
      const partialMsg = "The browser/environment lacks native support for critical " + "functionality used by the PDF.js library (e.g. `ReadableStream`); ";

      if (_is_node.isNodeJS) {
        throw new Error(partialMsg + "please use a `legacy`-build instead.");
      }

      throw new Error(partialMsg + "please update to a supported browser.");
    }

    const docId = docParams.docId;
    const docBaseUrl = docParams.docBaseUrl;
    const workerHandlerName = docParams.docId + "_worker";
    let handler = new _message_handler.MessageHandler(workerHandlerName, docId, port);

    /** Throws once a "Terminate" message has been processed. */
    function ensureNotTerminated() {
      if (terminated) {
        throw new Error("Worker was terminated");
      }
    }

    /** Registers `task` so that "Terminate" can wait for and flag it. */
    function startWorkerTask(task) {
      WorkerTasks.push(task);
    }

    /** Resolves `task.finished` and removes the task from the registry. */
    function finishWorkerTask(task) {
      task.finish();
      const i = WorkerTasks.indexOf(task);

      // `splice(-1, 1)` would drop the *last* registered task, so an
      // unregistered task must never reach `splice`.
      if (i >= 0) {
        WorkerTasks.splice(i, 1);
      }
    }

    /**
     * Runs the document parsing steps in order and collects the basic
     * document information.
     *
     * @param {boolean} recoveryMode - Forwarded to the "parse",
     *   "checkFirstPage" and "checkLastPage" steps.
     * @returns {Promise<Object>} `{ numPages, fingerprints, htmlForXfa }`;
     *   `htmlForXfa` is `null` unless the document reports `isPureXfa`.
     */
    async function loadDocument(recoveryMode) {
      await pdfManager.ensureDoc("checkHeader");
      await pdfManager.ensureDoc("parseStartXRef");
      await pdfManager.ensureDoc("parse", [recoveryMode]);
      await pdfManager.ensureDoc("checkFirstPage", [recoveryMode]);
      await pdfManager.ensureDoc("checkLastPage", [recoveryMode]);
      const isPureXfa = await pdfManager.ensureDoc("isPureXfa");

      if (isPureXfa) {
        const task = new WorkerTask("loadXfaFonts");
        startWorkerTask(task);
        // Font loading failures are deliberately ignored here; the task is
        // finished either way.
        await Promise.all([pdfManager.loadXfaFonts(handler, task).catch(reason => {}).then(() => finishWorkerTask(task)), pdfManager.loadXfaImages()]);
      }

      const [numPages, fingerprints] = await Promise.all([pdfManager.ensureDoc("numPages"), pdfManager.ensureDoc("fingerprints")]);
      const htmlForXfa = isPureXfa ? await pdfManager.ensureDoc("htmlForXfa") : null;
      return {
        numPages,
        fingerprints,
        htmlForXfa
      };
    }

    /**
     * Creates the PDF manager for the document: a `LocalPdfManager` when the
     * data is supplied directly (or once the whole stream has been read), or
     * a `NetworkPdfManager` when the stream reports range support.
     *
     * @param {Object} data - Document parameters; `data.source` is read.
     * @param {Object} evaluatorOptions - Passed through to the manager.
     * @param {boolean} enableXfa - Passed through to the manager.
     * @returns {Promise<Object>} Resolves with the created manager, rejects
     *   with any error raised while creating it or reading the stream.
     */
    function getPdfManager(data, evaluatorOptions, enableXfa) {
      const pdfManagerCapability = (0, _util.createPromiseCapability)();
      let newPdfManager;
      const source = data.source;

      if (source.data) {
        try {
          newPdfManager = new _pdf_manager.LocalPdfManager(docId, source.data, source.password, handler, evaluatorOptions, enableXfa, docBaseUrl);
          pdfManagerCapability.resolve(newPdfManager);
        } catch (ex) {
          pdfManagerCapability.reject(ex);
        }

        return pdfManagerCapability.promise;
      }

      let pdfStream;
      let cachedChunks = [];

      try {
        pdfStream = new _worker_stream.PDFWorkerStream(handler);
      } catch (ex) {
        pdfManagerCapability.reject(ex);
        return pdfManagerCapability.promise;
      }

      const fullRequest = pdfStream.getFullReader();

      fullRequest.headersReady.then(function () {
        if (!fullRequest.isRangeSupported) {
          return;
        }

        const disableAutoFetch = source.disableAutoFetch || fullRequest.isStreamingSupported;
        newPdfManager = new _pdf_manager.NetworkPdfManager(docId, pdfStream, {
          msgHandler: handler,
          password: source.password,
          length: fullRequest.contentLength,
          disableAutoFetch,
          rangeChunkSize: source.rangeChunkSize
        }, evaluatorOptions, enableXfa, docBaseUrl);

        // Hand over the chunks that arrived before the manager existed.
        for (const chunk of cachedChunks) {
          newPdfManager.sendProgressiveData(chunk);
        }

        cachedChunks = [];
        pdfManagerCapability.resolve(newPdfManager);
        cancelXHRs = null;
      }).catch(function (reason) {
        pdfManagerCapability.reject(reason);
        cancelXHRs = null;
      });

      let loaded = 0;

      // Builds a `LocalPdfManager` from all buffered chunks.
      const flushChunks = function () {
        const pdfFile = (0, _util.arraysToBytes)(cachedChunks);

        if (source.length && pdfFile.length !== source.length) {
          (0, _util.warn)("reported HTTP length is different from actual");
        }

        try {
          newPdfManager = new _pdf_manager.LocalPdfManager(docId, pdfFile, source.password, handler, evaluatorOptions, enableXfa, docBaseUrl);
          pdfManagerCapability.resolve(newPdfManager);
        } catch (ex) {
          pdfManagerCapability.reject(ex);
        }

        cachedChunks = [];
      };

      // Note: `resolve` is never called; this promise is only used to funnel
      // read errors into the `catch` below.
      const readPromise = new Promise(function (resolve, reject) {
        const readChunk = function ({
          value,
          done
        }) {
          try {
            ensureNotTerminated();

            if (done) {
              // No manager was created while streaming, so build one from
              // the buffered data.
              if (!newPdfManager) {
                flushChunks();
              }

              cancelXHRs = null;
              return;
            }

            loaded += (0, _util.arrayByteLength)(value);

            if (!fullRequest.isStreamingSupported) {
              handler.send("DocProgress", {
                loaded,
                total: Math.max(loaded, fullRequest.contentLength || 0)
              });
            }

            if (newPdfManager) {
              newPdfManager.sendProgressiveData(value);
            } else {
              cachedChunks.push(value);
            }

            fullRequest.read().then(readChunk, reject);
          } catch (e) {
            reject(e);
          }
        };

        fullRequest.read().then(readChunk, reject);
      });

      readPromise.catch(function (e) {
        pdfManagerCapability.reject(e);
        cancelXHRs = null;
      });

      cancelXHRs = function (reason) {
        pdfStream.cancelAllRequests(reason);
      };

      return pdfManagerCapability.promise;
    }

    /**
     * Creates the PDF manager for `data` and loads the document, reporting
     * the outcome with "GetDoc" or "DocException" messages.
     *
     * @param {Object} data - The document parameters.
     */
    function setupDoc(data) {
      function onSuccess(doc) {
        ensureNotTerminated();
        handler.send("GetDoc", {
          pdfInfo: doc
        });
      }

      function onFailure(ex) {
        ensureNotTerminated();

        if (ex instanceof _util.PasswordException) {
          const task = new WorkerTask(`PasswordException: response ${ex.code}`);
          startWorkerTask(task);
          // Ask for a password and retry loading once one is supplied.
          handler.sendWithPromise("PasswordRequest", ex).then(function ({
            password
          }) {
            finishWorkerTask(task);
            pdfManager.updatePassword(password);
            pdfManagerReady();
          }).catch(function () {
            finishWorkerTask(task);
            handler.send("DocException", ex);
          });
        } else if (ex instanceof _util.InvalidPDFException || ex instanceof _util.MissingPDFException || ex instanceof _util.UnexpectedResponseException || ex instanceof _util.UnknownErrorException) {
          handler.send("DocException", ex);
        } else {
          // Anything else is wrapped before being reported.
          handler.send("DocException", new _util.UnknownErrorException(ex.message, ex.toString()));
        }
      }

      function pdfManagerReady() {
        ensureNotTerminated();
        loadDocument(false).then(onSuccess, function (reason) {
          ensureNotTerminated();

          if (!(reason instanceof _core_utils.XRefParseException)) {
            onFailure(reason);
            return;
          }

          // On an XRef parsing failure, wait for the complete stream and
          // load again in recovery mode.
          pdfManager.requestLoadedStream();
          pdfManager.onLoadedStream().then(function () {
            ensureNotTerminated();
            loadDocument(true).then(onSuccess, onFailure);
          });
        });
      }

      ensureNotTerminated();
      const evaluatorOptions = {
        maxImageSize: data.maxImageSize,
        disableFontFace: data.disableFontFace,
        ignoreErrors: data.ignoreErrors,
        isEvalSupported: data.isEvalSupported,
        fontExtraProperties: data.fontExtraProperties,
        useSystemFonts: data.useSystemFonts,
        cMapUrl: data.cMapUrl,
        standardFontDataUrl: data.standardFontDataUrl
      };

      getPdfManager(data, evaluatorOptions, data.enableXfa).then(function (newPdfManager) {
        if (terminated) {
          // The worker was terminated while the manager was being created.
          newPdfManager.terminate(new _util.AbortException("Worker was terminated."));
          throw new Error("Worker was terminated");
        }

        pdfManager = newPdfManager;
        pdfManager.onLoadedStream().then(function (stream) {
          handler.send("DataLoaded", {
            length: stream.bytes.byteLength
          });
        });
      }).then(pdfManagerReady, onFailure);
    }

    handler.on("GetPage", function wphSetupGetPage(data) {
      return pdfManager.getPage(data.pageIndex).then(function (page) {
        return Promise.all([pdfManager.ensure(page, "rotate"), pdfManager.ensure(page, "ref"), pdfManager.ensure(page, "userUnit"), pdfManager.ensure(page, "view")]).then(function ([rotate, ref, userUnit, view]) {
          return {
            rotate,
            ref,
            userUnit,
            view
          };
        });
      });
    });

    handler.on("GetPageIndex", function wphSetupGetPageIndex(data) {
      const pageRef = _primitives.Ref.get(data.num, data.gen);

      return pdfManager.ensureCatalog("getPageIndex", [pageRef]);
    });

    handler.on("GetDestinations", function wphSetupGetDestinations(data) {
      return pdfManager.ensureCatalog("destinations");
    });

    handler.on("GetDestination", function wphSetupGetDestination(data) {
      return pdfManager.ensureCatalog("getDestination", [data.id]);
    });

    handler.on("GetPageLabels", function wphSetupGetPageLabels(data) {
      return pdfManager.ensureCatalog("pageLabels");
    });

    handler.on("GetPageLayout", function wphSetupGetPageLayout(data) {
      return pdfManager.ensureCatalog("pageLayout");
    });

    handler.on("GetPageMode", function wphSetupGetPageMode(data) {
      return pdfManager.ensureCatalog("pageMode");
    });

    handler.on("GetViewerPreferences", function (data) {
      return pdfManager.ensureCatalog("viewerPreferences");
    });

    handler.on("GetOpenAction", function (data) {
      return pdfManager.ensureCatalog("openAction");
    });

    handler.on("GetAttachments", function wphSetupGetAttachments(data) {
      return pdfManager.ensureCatalog("attachments");
    });

    handler.on("GetJavaScript", function wphSetupGetJavaScript(data) {
      return pdfManager.ensureCatalog("javaScript");
    });

    handler.on("GetDocJSActions", function wphSetupGetDocJSActions(data) {
      return pdfManager.ensureCatalog("jsActions");
    });

    handler.on("GetPageJSActions", function ({
      pageIndex
    }) {
      return pdfManager.getPage(pageIndex).then(function (page) {
        return pdfManager.ensure(page, "jsActions");
      });
    });

    handler.on("GetOutline", function wphSetupGetOutline(data) {
      return pdfManager.ensureCatalog("documentOutline");
    });

    handler.on("GetOptionalContentConfig", function (data) {
      return pdfManager.ensureCatalog("optionalContentConfig");
    });

    handler.on("GetPermissions", function (data) {
      return pdfManager.ensureCatalog("permissions");
    });

    handler.on("GetMetadata", function wphSetupGetMetadata(data) {
      return Promise.all([pdfManager.ensureDoc("documentInfo"), pdfManager.ensureCatalog("metadata")]);
    });

    handler.on("GetMarkInfo", function wphSetupGetMarkInfo(data) {
      return pdfManager.ensureCatalog("markInfo");
    });

    handler.on("GetData", function wphSetupGetData(data) {
      pdfManager.requestLoadedStream();
      return pdfManager.onLoadedStream().then(function (stream) {
        return stream.bytes;
      });
    });

    handler.on("GetAnnotations", function ({
      pageIndex,
      intent
    }) {
      return pdfManager.getPage(pageIndex).then(function (page) {
        const task = new WorkerTask(`GetAnnotations: page ${pageIndex}`);
        startWorkerTask(task);
        return page.getAnnotationsData(handler, task, intent).then(data => {
          finishWorkerTask(task);
          return data;
        }, reason => {
          // The failure is not propagated: the reply resolves with
          // `undefined` once the task has been finished.
          finishWorkerTask(task);
        });
      });
    });

    handler.on("GetFieldObjects", function (data) {
      return pdfManager.ensureDoc("fieldObjects");
    });

    handler.on("HasJSActions", function (data) {
      return pdfManager.ensureDoc("hasJSActions");
    });

    handler.on("GetCalculationOrderIds", function (data) {
      return pdfManager.ensureDoc("calculationOrderIds");
    });

    handler.on("SaveDocument", function ({
      isPureXfa,
      numPages,
      annotationStorage,
      filename
    }) {
      pdfManager.requestLoadedStream();
      const newAnnotationsByPage = !isPureXfa ? (0, _core_utils.getNewAnnotationsMap)(annotationStorage) : null;
      // The first five entries are fixed; everything pushed afterwards is
      // collected into `refs` by the destructuring below.
      const promises = [pdfManager.onLoadedStream(), pdfManager.ensureCatalog("acroForm"), pdfManager.ensureCatalog("acroFormRef"), pdfManager.ensureDoc("xref"), pdfManager.ensureDoc("startXRef")];

      if (newAnnotationsByPage) {
        for (const [pageIndex, annotations] of newAnnotationsByPage) {
          promises.push(pdfManager.getPage(pageIndex).then(page => {
            const task = new WorkerTask(`Save (editor): page ${pageIndex}`);
            // Register the task so that "Terminate" can see it and so that
            // `finishWorkerTask` removes this task rather than another one.
            startWorkerTask(task);
            return page.saveNewAnnotations(handler, task, annotations).finally(function () {
              finishWorkerTask(task);
            });
          }));
        }
      }

      if (isPureXfa) {
        promises.push(pdfManager.serializeXfaData(annotationStorage));
      } else {
        for (let pageIndex = 0; pageIndex < numPages; pageIndex++) {
          promises.push(pdfManager.getPage(pageIndex).then(function (page) {
            const task = new WorkerTask(`Save: page ${pageIndex}`);
            startWorkerTask(task);
            return page.save(handler, task, annotationStorage).finally(function () {
              finishWorkerTask(task);
            });
          }));
        }
      }

      return Promise.all(promises).then(function ([stream, acroForm, acroFormRef, xref, startXRef, ...refs]) {
        let newRefs = [];
        let xfaData = null;

        if (isPureXfa) {
          xfaData = refs[0];

          // Nothing to write: return the original bytes unchanged.
          if (!xfaData) {
            return stream.bytes;
          }
        } else {
          newRefs = refs.flat(2);

          // Nothing to write: return the original bytes unchanged.
          if (newRefs.length === 0) {
            return stream.bytes;
          }
        }

        const xfa = acroForm instanceof _primitives.Dict && acroForm.get("XFA") || null;
        let xfaDatasetsRef = null;
        let hasXfaDatasetsEntry = false;

        if (Array.isArray(xfa)) {
          // The array is scanned in (name, value) pairs for "datasets".
          for (let i = 0, ii = xfa.length; i < ii; i += 2) {
            if (xfa[i] === "datasets") {
              xfaDatasetsRef = xfa[i + 1];
              acroFormRef = null;
              hasXfaDatasetsEntry = true;
            }
          }

          if (xfaDatasetsRef === null) {
            xfaDatasetsRef = xref.getNewRef();
          }
        } else if (xfa) {
          acroFormRef = null;
          (0, _util.warn)("Unsupported XFA type.");
        }

        let newXrefInfo = Object.create(null);

        if (xref.trailer) {
          // Copy the string-valued entries of the Info dictionary.
          const infoObj = Object.create(null);
          const xrefInfo = xref.trailer.get("Info") || null;

          if (xrefInfo instanceof _primitives.Dict) {
            xrefInfo.forEach((key, value) => {
              if (typeof value === "string") {
                infoObj[key] = (0, _util.stringToPDFString)(value);
              }
            });
          }

          newXrefInfo = {
            rootRef: xref.trailer.getRaw("Root") || null,
            encryptRef: xref.trailer.getRaw("Encrypt") || null,
            newRef: xref.getNewRef(),
            infoRef: xref.trailer.getRaw("Info") || null,
            info: infoObj,
            fileIds: xref.trailer.get("ID") || null,
            startXRef,
            filename
          };
        }

        xref.resetNewRef();
        return (0, _writer.incrementalUpdate)({
          originalData: stream.bytes,
          xrefInfo: newXrefInfo,
          newRefs,
          xref,
          hasXfa: !!xfa,
          xfaDatasetsRef,
          hasXfaDatasetsEntry,
          acroFormRef,
          acroForm,
          xfaData
        });
      });
    });

    handler.on("GetOperatorList", function wphSetupRenderPage(data, sink) {
      const pageIndex = data.pageIndex;
      pdfManager.getPage(pageIndex).then(function (page) {
        const task = new WorkerTask(`GetOperatorList: page ${pageIndex}`);
        startWorkerTask(task);
        // Timing is only collected at INFOS verbosity or above.
        const start = verbosity >= _util.VerbosityLevel.INFOS ? Date.now() : 0;
        page.getOperatorList({
          handler,
          sink,
          task,
          intent: data.intent,
          cacheKey: data.cacheKey,
          annotationStorage: data.annotationStorage
        }).then(function (operatorListInfo) {
          finishWorkerTask(task);

          if (start) {
            (0, _util.info)(`page=${pageIndex + 1} - getOperatorList: time=` + `${Date.now() - start}ms, len=${operatorListInfo.length}`);
          }

          sink.close();
        }, function (reason) {
          finishWorkerTask(task);

          // Failures of a terminated task are not reported.
          if (task.terminated) {
            return;
          }

          handler.send("UnsupportedFeature", {
            featureId: _util.UNSUPPORTED_FEATURES.errorOperatorList
          });
          sink.error(reason);
        });
      });
    });

    handler.on("GetTextContent", function wphExtractText(data, sink) {
      const pageIndex = data.pageIndex;
      pdfManager.getPage(pageIndex).then(function (page) {
        const task = new WorkerTask("GetTextContent: page " + pageIndex);
        startWorkerTask(task);
        // Timing is only collected at INFOS verbosity or above.
        const start = verbosity >= _util.VerbosityLevel.INFOS ? Date.now() : 0;
        page.extractTextContent({
          handler,
          task,
          sink,
          includeMarkedContent: data.includeMarkedContent,
          combineTextItems: data.combineTextItems
        }).then(function () {
          finishWorkerTask(task);

          if (start) {
            (0, _util.info)(`page=${pageIndex + 1} - getTextContent: time=` + `${Date.now() - start}ms`);
          }

          sink.close();
        }, function (reason) {
          finishWorkerTask(task);

          // Failures of a terminated task are not reported.
          if (task.terminated) {
            return;
          }

          sink.error(reason);
        });
      });
    });

    handler.on("GetStructTree", function wphGetStructTree(data) {
      return pdfManager.getPage(data.pageIndex).then(function (page) {
        return pdfManager.ensure(page, "getStructTree");
      });
    });

    handler.on("FontFallback", function (data) {
      return pdfManager.fontFallback(data.id, handler);
    });

    handler.on("Cleanup", function wphCleanup(data) {
      return pdfManager.cleanup(true);
    });

    handler.on("Terminate", function wphTerminate(data) {
      terminated = true;
      const waitOn = [];

      if (pdfManager) {
        pdfManager.terminate(new _util.AbortException("Worker was terminated."));
        const cleanupPromise = pdfManager.cleanup();
        waitOn.push(cleanupPromise);
        pdfManager = null;
      } else {
        (0, _cleanup_helper.clearGlobalCaches)();
      }

      if (cancelXHRs) {
        cancelXHRs(new _util.AbortException("Worker was terminated."));
      }

      // Flag every registered task and wait until each has finished.
      for (const task of WorkerTasks) {
        waitOn.push(task.finished);
        task.terminate();
      }

      return Promise.all(waitOn).then(function () {
        handler.destroy();
        handler = null;
      });
    });

    handler.on("Ready", function wphReady(data) {
      setupDoc(docParams);
      // Drop the reference to the parameters once loading has started.
      docParams = null;
    });

    return workerHandlerName;
  }

  /**
   * Creates the main "worker" message handler on `port`, registers the
   * global handlers and announces readiness with a "ready" message.
   *
   * @param {Object} port - Communication port to the API side.
   */
  static initializeFromPort(port) {
    const handler = new _message_handler.MessageHandler("worker", "main", port);
    WorkerMessageHandler.setup(handler, port);
    handler.send("ready", null);
  }
}
|
|
exports.WorkerMessageHandler = WorkerMessageHandler;
|
|
/**
 * Duck-type check for a message port.
 *
 * @param {*} maybePort - Value to inspect.
 * @returns {boolean} `true` when the value has a `postMessage` function and
 *   an `onmessage` property (own or inherited); `false` otherwise, including
 *   for `null`, `undefined` and primitives.
 */
function isMessagePort(maybePort) {
  // The `in` operator throws on non-objects, so rule those out first.
  const isObjectLike = maybePort !== null && (typeof maybePort === "object" || typeof maybePort === "function");

  if (!isObjectLike) {
    return false;
  }

  return typeof maybePort.postMessage === "function" && "onmessage" in maybePort;
}
|
|
// Initialize automatically when there is no `window`, the environment is not
// Node.js, and the global `self` looks like a message port.
if (typeof window === "undefined" && !_is_node.isNodeJS && typeof self !== "undefined" && isMessagePort(self)) {
  WorkerMessageHandler.initializeFromPort(self);
}
|