In practice it's not uncommon for PDF documents to re-use the same TilingPatterns more than once, and parsing them is essentially equal to parsing of a (small) page since a `getOperatorList` call is required. By caching the internal TilingPattern representation we can thus avoid having to re-parse the same data over and over, and there's also *less* asynchronous parsing required for repeated TilingPatterns. Initially I had intended to include (standard) benchmark results with this patch, however it's not entirely clear that this is actually necessary here given the preliminary results. When testing this manually in the development viewer, using `pdfBug=Stats`, the following (approximate) reduction in rendering times were observed when comparing `master` against this patch: - http://pubs.usgs.gov/sim/3067/pdf/sim3067sheet-2.pdf (from issue 2765): `6800 ms` -> `4100 ms`. - https://github.com/mozilla/pdf.js/files/1046131/stepped.pdf (from issue 8473): `54000 ms` -> `13000 ms` - https://github.com/mozilla/pdf.js/files/1046130/proof.pdf (from issue 8473): `5900 ms` -> `2500 ms` As always, whenever you're dealing with documents which are "slow", there's usually a certain level of subjectivity involved with regards to what's deemed acceptable performance. Hence it's not clear to me that we want to regard any of the referenced issues as fixed, however the improvements are significant enough to warrant caching of TilingPatterns in my opinion.
260 lines
6.1 KiB
JavaScript
260 lines
6.1 KiB
JavaScript
/* Copyright 2019 Mozilla Foundation
|
|
*
|
|
* Licensed under the Apache License, Version 2.0 (the "License");
|
|
* you may not use this file except in compliance with the License.
|
|
* You may obtain a copy of the License at
|
|
*
|
|
* http://www.apache.org/licenses/LICENSE-2.0
|
|
*
|
|
* Unless required by applicable law or agreed to in writing, software
|
|
* distributed under the License is distributed on an "AS IS" BASIS,
|
|
* WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
|
|
* See the License for the specific language governing permissions and
|
|
* limitations under the License.
|
|
*/
|
|
|
|
import { assert, info, shadow, unreachable } from "../shared/util.js";
|
|
import { RefSetCache } from "./primitives.js";
|
|
|
|
class BaseLocalCache {
|
|
constructor(options) {
|
|
if (this.constructor === BaseLocalCache) {
|
|
unreachable("Cannot initialize BaseLocalCache.");
|
|
}
|
|
if (!options || !options.onlyRefs) {
|
|
this._nameRefMap = new Map();
|
|
this._imageMap = new Map();
|
|
}
|
|
this._imageCache = new RefSetCache();
|
|
}
|
|
|
|
getByName(name) {
|
|
const ref = this._nameRefMap.get(name);
|
|
if (ref) {
|
|
return this.getByRef(ref);
|
|
}
|
|
return this._imageMap.get(name) || null;
|
|
}
|
|
|
|
getByRef(ref) {
|
|
return this._imageCache.get(ref) || null;
|
|
}
|
|
|
|
set(name, ref, data) {
|
|
unreachable("Abstract method `set` called.");
|
|
}
|
|
}
|
|
|
|
class LocalImageCache extends BaseLocalCache {
|
|
set(name, ref = null, data) {
|
|
if (!name) {
|
|
throw new Error('LocalImageCache.set - expected "name" argument.');
|
|
}
|
|
if (ref) {
|
|
if (this._imageCache.has(ref)) {
|
|
return;
|
|
}
|
|
this._nameRefMap.set(name, ref);
|
|
this._imageCache.put(ref, data);
|
|
return;
|
|
}
|
|
// name
|
|
if (this._imageMap.has(name)) {
|
|
return;
|
|
}
|
|
this._imageMap.set(name, data);
|
|
}
|
|
}
|
|
|
|
class LocalColorSpaceCache extends BaseLocalCache {
|
|
set(name = null, ref = null, data) {
|
|
if (!name && !ref) {
|
|
throw new Error(
|
|
'LocalColorSpaceCache.set - expected "name" and/or "ref" argument.'
|
|
);
|
|
}
|
|
if (ref) {
|
|
if (this._imageCache.has(ref)) {
|
|
return;
|
|
}
|
|
if (name) {
|
|
// Optional when `ref` is defined.
|
|
this._nameRefMap.set(name, ref);
|
|
}
|
|
this._imageCache.put(ref, data);
|
|
return;
|
|
}
|
|
// name
|
|
if (this._imageMap.has(name)) {
|
|
return;
|
|
}
|
|
this._imageMap.set(name, data);
|
|
}
|
|
}
|
|
|
|
class LocalFunctionCache extends BaseLocalCache {
|
|
constructor(options) {
|
|
super({ onlyRefs: true });
|
|
}
|
|
|
|
getByName(name) {
|
|
unreachable("Should not call `getByName` method.");
|
|
}
|
|
|
|
set(name = null, ref, data) {
|
|
if (!ref) {
|
|
throw new Error('LocalFunctionCache.set - expected "ref" argument.');
|
|
}
|
|
if (this._imageCache.has(ref)) {
|
|
return;
|
|
}
|
|
this._imageCache.put(ref, data);
|
|
}
|
|
}
|
|
|
|
class LocalGStateCache extends BaseLocalCache {
|
|
set(name, ref = null, data) {
|
|
if (!name) {
|
|
throw new Error('LocalGStateCache.set - expected "name" argument.');
|
|
}
|
|
if (ref) {
|
|
if (this._imageCache.has(ref)) {
|
|
return;
|
|
}
|
|
this._nameRefMap.set(name, ref);
|
|
this._imageCache.put(ref, data);
|
|
return;
|
|
}
|
|
// name
|
|
if (this._imageMap.has(name)) {
|
|
return;
|
|
}
|
|
this._imageMap.set(name, data);
|
|
}
|
|
}
|
|
|
|
class LocalTilingPatternCache extends BaseLocalCache {
|
|
set(name, ref = null, data) {
|
|
if (!name) {
|
|
throw new Error(
|
|
'LocalTilingPatternCache.set - expected "name" argument.'
|
|
);
|
|
}
|
|
if (ref) {
|
|
if (this._imageCache.has(ref)) {
|
|
return;
|
|
}
|
|
this._nameRefMap.set(name, ref);
|
|
this._imageCache.put(ref, data);
|
|
return;
|
|
}
|
|
// name
|
|
if (this._imageMap.has(name)) {
|
|
return;
|
|
}
|
|
this._imageMap.set(name, data);
|
|
}
|
|
}
|
|
|
|
class GlobalImageCache {
|
|
static get NUM_PAGES_THRESHOLD() {
|
|
return shadow(this, "NUM_PAGES_THRESHOLD", 2);
|
|
}
|
|
|
|
static get MAX_IMAGES_TO_CACHE() {
|
|
return shadow(this, "MAX_IMAGES_TO_CACHE", 10);
|
|
}
|
|
|
|
constructor() {
|
|
if (
|
|
typeof PDFJSDev === "undefined" ||
|
|
PDFJSDev.test("!PRODUCTION || TESTING")
|
|
) {
|
|
assert(
|
|
GlobalImageCache.NUM_PAGES_THRESHOLD > 1,
|
|
"GlobalImageCache - invalid NUM_PAGES_THRESHOLD constant."
|
|
);
|
|
}
|
|
this._refCache = new RefSetCache();
|
|
this._imageCache = new RefSetCache();
|
|
}
|
|
|
|
shouldCache(ref, pageIndex) {
|
|
const pageIndexSet = this._refCache.get(ref);
|
|
const numPages = pageIndexSet
|
|
? pageIndexSet.size + (pageIndexSet.has(pageIndex) ? 0 : 1)
|
|
: 1;
|
|
|
|
if (numPages < GlobalImageCache.NUM_PAGES_THRESHOLD) {
|
|
return false;
|
|
}
|
|
if (
|
|
!this._imageCache.has(ref) &&
|
|
this._imageCache.size >= GlobalImageCache.MAX_IMAGES_TO_CACHE
|
|
) {
|
|
return false;
|
|
}
|
|
return true;
|
|
}
|
|
|
|
addPageIndex(ref, pageIndex) {
|
|
let pageIndexSet = this._refCache.get(ref);
|
|
if (!pageIndexSet) {
|
|
pageIndexSet = new Set();
|
|
this._refCache.put(ref, pageIndexSet);
|
|
}
|
|
pageIndexSet.add(pageIndex);
|
|
}
|
|
|
|
getData(ref, pageIndex) {
|
|
const pageIndexSet = this._refCache.get(ref);
|
|
if (!pageIndexSet) {
|
|
return null;
|
|
}
|
|
if (pageIndexSet.size < GlobalImageCache.NUM_PAGES_THRESHOLD) {
|
|
return null;
|
|
}
|
|
if (!this._imageCache.has(ref)) {
|
|
return null;
|
|
}
|
|
// Ensure that we keep track of all pages containing the image reference.
|
|
pageIndexSet.add(pageIndex);
|
|
|
|
return this._imageCache.get(ref);
|
|
}
|
|
|
|
setData(ref, data) {
|
|
if (!this._refCache.has(ref)) {
|
|
throw new Error(
|
|
'GlobalImageCache.setData - expected "addPageIndex" to have been called.'
|
|
);
|
|
}
|
|
if (this._imageCache.has(ref)) {
|
|
return;
|
|
}
|
|
if (this._imageCache.size >= GlobalImageCache.MAX_IMAGES_TO_CACHE) {
|
|
info(
|
|
"GlobalImageCache.setData - ignoring image above MAX_IMAGES_TO_CACHE."
|
|
);
|
|
return;
|
|
}
|
|
this._imageCache.put(ref, data);
|
|
}
|
|
|
|
clear(onlyData = false) {
|
|
if (!onlyData) {
|
|
this._refCache.clear();
|
|
}
|
|
this._imageCache.clear();
|
|
}
|
|
}
|
|
|
|
export {
|
|
LocalImageCache,
|
|
LocalColorSpaceCache,
|
|
LocalFunctionCache,
|
|
LocalGStateCache,
|
|
LocalTilingPatternCache,
|
|
GlobalImageCache,
|
|
};
|