mirror of
https://github.com/foliojs/pdfkit.git
synced 2025-12-08 20:15:54 +00:00
* pdf/a1b support initial commit Added mixin for support pdf/a1b and a few of the things it requires (xmp metadata, colour profile). Currently, the CIDSet stream is the only error it comes back with the test case I'm using, will try sorting it out next. * Adding CIDSet when generating PDF/A PDF/A1 b/a requires a CIDSet. This is not checked by a validator and other converters seem to add a CIDSet with a value of FF FF FF FF 0C, so this commit does the same. When extending support for PDF/A 2/3/4, we may not add a CIDSet (I think for PDF/A3 it's not required?) or we will look for a proper way to generate the CIDSet. At this point, PDFKit should be able to generate PDF/A1b which can pass veraPDF validation and PDF/A1a if tagged is enabled. All you have to do is set pdfa: '1a' or pdfa: '1b' in the options passed to new PDFDocument. * pdf/a intro docs * generalising subsets, reimplementing pdfa1 and added control over metadata added a generalised subsets mixin which can pull in a subset at runtime. reimplemented pdfa1 mixin as some features should be standardised across all subsets, such as storing /Info as xmp metadata for pdf >1.3 added a metadata class and mixing to control and write the metadata to a pdf * added tests for pdfa1 and metadata and moved joinTokens in helpers Addeds tests for pdfa1 subset and metadata. Moved joinTokens into helpers.js as it's now used in at least two places. Added tests for document to when metadata should be added (pdf version 1.4 or newer) and when it shouldn't (pdf version 1.3) * updated pdf/a docs to reflect latest changes * store color profile as icc file * Updated changelog to include PDF/A support in Unreleased section
398 lines
9.1 KiB
JavaScript
398 lines
9.1 KiB
JavaScript
/*
|
|
PDFDocument - represents an entire PDF document
|
|
By Devon Govett
|
|
*/
|
|
|
|
import stream from 'stream';
|
|
import fs from 'fs';
|
|
import PDFObject from './object';
|
|
import PDFReference from './reference';
|
|
import PDFPage from './page';
|
|
import PDFNameTree from './name_tree';
|
|
import PDFSecurity from './security';
|
|
import ColorMixin from './mixins/color';
|
|
import VectorMixin from './mixins/vector';
|
|
import FontsMixin from './mixins/fonts';
|
|
import TextMixin from './mixins/text';
|
|
import ImagesMixin from './mixins/images';
|
|
import AnnotationsMixin from './mixins/annotations';
|
|
import OutlineMixin from './mixins/outline';
|
|
import MarkingsMixin from './mixins/markings';
|
|
import AcroFormMixin from './mixins/acroform';
|
|
import AttachmentsMixin from './mixins/attachments';
|
|
import LineWrapper from './line_wrapper';
|
|
import SubsetMixin from './mixins/subsets';
|
|
import MetadataMixin from './mixins/metadata';
|
|
|
|
class PDFDocument extends stream.Readable {
|
|
constructor(options = {}) {
|
|
super(options);
|
|
this.options = options;
|
|
|
|
// PDF version
|
|
switch (options.pdfVersion) {
|
|
case '1.4':
|
|
this.version = 1.4;
|
|
break;
|
|
case '1.5':
|
|
this.version = 1.5;
|
|
break;
|
|
case '1.6':
|
|
this.version = 1.6;
|
|
break;
|
|
case '1.7':
|
|
case '1.7ext3':
|
|
this.version = 1.7;
|
|
break;
|
|
default:
|
|
this.version = 1.3;
|
|
break;
|
|
}
|
|
|
|
// Whether streams should be compressed
|
|
this.compress =
|
|
this.options.compress != null ? this.options.compress : true;
|
|
|
|
this._pageBuffer = [];
|
|
this._pageBufferStart = 0;
|
|
|
|
// The PDF object store
|
|
this._offsets = [];
|
|
this._waiting = 0;
|
|
this._ended = false;
|
|
this._offset = 0;
|
|
const Pages = this.ref({
|
|
Type: 'Pages',
|
|
Count: 0,
|
|
Kids: []
|
|
});
|
|
|
|
const Names = this.ref({
|
|
Dests: new PDFNameTree()
|
|
});
|
|
|
|
this._root = this.ref({
|
|
Type: 'Catalog',
|
|
Pages,
|
|
Names
|
|
});
|
|
|
|
if (this.options.lang) {
|
|
this._root.data.Lang = new String(this.options.lang);
|
|
}
|
|
|
|
// The current page
|
|
this.page = null;
|
|
|
|
// Initialize mixins
|
|
this.initMetadata();
|
|
this.initColor();
|
|
this.initVector();
|
|
this.initFonts(options.font);
|
|
this.initText();
|
|
this.initImages();
|
|
this.initOutline();
|
|
this.initMarkings(options);
|
|
this.initSubset(options);
|
|
|
|
// Initialize the metadata
|
|
this.info = {
|
|
Producer: 'PDFKit',
|
|
Creator: 'PDFKit',
|
|
CreationDate: new Date()
|
|
};
|
|
|
|
if (this.options.info) {
|
|
for (let key in this.options.info) {
|
|
const val = this.options.info[key];
|
|
this.info[key] = val;
|
|
}
|
|
}
|
|
|
|
if (this.options.displayTitle) {
|
|
this._root.data.ViewerPreferences = this.ref({
|
|
DisplayDocTitle: true
|
|
});
|
|
}
|
|
|
|
// Generate file ID
|
|
this._id = PDFSecurity.generateFileID(this.info);
|
|
|
|
// Initialize security settings
|
|
this._security = PDFSecurity.create(this, options);
|
|
|
|
// Write the header
|
|
// PDF version
|
|
this._write(`%PDF-${this.version}`);
|
|
|
|
// 4 binary chars, as recommended by the spec
|
|
this._write('%\xFF\xFF\xFF\xFF');
|
|
|
|
// Add the first page
|
|
if (this.options.autoFirstPage !== false) {
|
|
this.addPage();
|
|
}
|
|
}
|
|
|
|
addPage(options) {
|
|
if (options == null) {
|
|
({ options } = this);
|
|
}
|
|
|
|
// end the current page if needed
|
|
if (!this.options.bufferPages) {
|
|
this.flushPages();
|
|
}
|
|
|
|
// create a page object
|
|
this.page = new PDFPage(this, options);
|
|
this._pageBuffer.push(this.page);
|
|
|
|
// add the page to the object store
|
|
const pages = this._root.data.Pages.data;
|
|
pages.Kids.push(this.page.dictionary);
|
|
pages.Count++;
|
|
|
|
// reset x and y coordinates
|
|
this.x = this.page.margins.left;
|
|
this.y = this.page.margins.top;
|
|
|
|
// flip PDF coordinate system so that the origin is in
|
|
// the top left rather than the bottom left
|
|
this._ctm = [1, 0, 0, 1, 0, 0];
|
|
this.transform(1, 0, 0, -1, 0, this.page.height);
|
|
|
|
this.emit('pageAdded');
|
|
|
|
return this;
|
|
}
|
|
|
|
continueOnNewPage(options) {
|
|
const pageMarkings = this.endPageMarkings(this.page);
|
|
|
|
this.addPage(options);
|
|
|
|
this.initPageMarkings(pageMarkings);
|
|
|
|
return this;
|
|
}
|
|
|
|
bufferedPageRange() {
|
|
return { start: this._pageBufferStart, count: this._pageBuffer.length };
|
|
}
|
|
|
|
switchToPage(n) {
|
|
let page;
|
|
if (!(page = this._pageBuffer[n - this._pageBufferStart])) {
|
|
throw new Error(
|
|
`switchToPage(${n}) out of bounds, current buffer covers pages ${
|
|
this._pageBufferStart
|
|
} to ${this._pageBufferStart + this._pageBuffer.length - 1}`
|
|
);
|
|
}
|
|
|
|
return (this.page = page);
|
|
}
|
|
|
|
flushPages() {
|
|
// this local variable exists so we're future-proof against
|
|
// reentrant calls to flushPages.
|
|
const pages = this._pageBuffer;
|
|
this._pageBuffer = [];
|
|
this._pageBufferStart += pages.length;
|
|
for (let page of pages) {
|
|
this.endPageMarkings(page);
|
|
page.end();
|
|
}
|
|
}
|
|
|
|
addNamedDestination(name, ...args) {
|
|
if (args.length === 0) {
|
|
args = ['XYZ', null, null, null];
|
|
}
|
|
if (args[0] === 'XYZ' && args[2] !== null) {
|
|
args[2] = this.page.height - args[2];
|
|
}
|
|
args.unshift(this.page.dictionary);
|
|
this._root.data.Names.data.Dests.add(name, args);
|
|
}
|
|
|
|
addNamedEmbeddedFile(name, ref) {
|
|
if (!this._root.data.Names.data.EmbeddedFiles) {
|
|
// disabling /Limits for this tree fixes attachments not showing in Adobe Reader
|
|
this._root.data.Names.data.EmbeddedFiles = new PDFNameTree({ limits: false });
|
|
}
|
|
|
|
// add filespec to EmbeddedFiles
|
|
this._root.data.Names.data.EmbeddedFiles.add(name, ref);
|
|
}
|
|
|
|
addNamedJavaScript(name, js) {
|
|
if (!this._root.data.Names.data.JavaScript) {
|
|
this._root.data.Names.data.JavaScript = new PDFNameTree();
|
|
}
|
|
let data = {
|
|
JS: new String(js),
|
|
S: 'JavaScript'
|
|
};
|
|
this._root.data.Names.data.JavaScript.add(name, data);
|
|
}
|
|
|
|
ref(data) {
|
|
const ref = new PDFReference(this, this._offsets.length + 1, data);
|
|
this._offsets.push(null); // placeholder for this object's offset once it is finalized
|
|
this._waiting++;
|
|
return ref;
|
|
}
|
|
|
|
_read() {}
|
|
// do nothing, but this method is required by node
|
|
|
|
_write(data) {
|
|
if (!Buffer.isBuffer(data)) {
|
|
data = Buffer.from(data + '\n', 'binary');
|
|
}
|
|
|
|
this.push(data);
|
|
return (this._offset += data.length);
|
|
}
|
|
|
|
addContent(data) {
|
|
this.page.write(data);
|
|
return this;
|
|
}
|
|
|
|
_refEnd(ref) {
|
|
this._offsets[ref.id - 1] = ref.offset;
|
|
if (--this._waiting === 0 && this._ended) {
|
|
this._finalize();
|
|
return (this._ended = false);
|
|
}
|
|
}
|
|
|
|
write(filename, fn) {
|
|
// print a deprecation warning with a stacktrace
|
|
const err = new Error(`\
|
|
PDFDocument#write is deprecated, and will be removed in a future version of PDFKit. \
|
|
Please pipe the document into a Node stream.\
|
|
`);
|
|
|
|
console.warn(err.stack);
|
|
|
|
this.pipe(fs.createWriteStream(filename));
|
|
this.end();
|
|
return this.once('end', fn);
|
|
}
|
|
|
|
end() {
|
|
this.flushPages();
|
|
|
|
this._info = this.ref();
|
|
for (let key in this.info) {
|
|
let val = this.info[key];
|
|
if (typeof val === 'string') {
|
|
val = new String(val);
|
|
}
|
|
|
|
let entry = this.ref(val);
|
|
entry.end();
|
|
|
|
this._info.data[key] = entry;
|
|
}
|
|
|
|
this._info.end();
|
|
|
|
for (let name in this._fontFamilies) {
|
|
const font = this._fontFamilies[name];
|
|
font.finalize();
|
|
}
|
|
|
|
this.endOutline();
|
|
this.endMarkings();
|
|
|
|
if (this.subset) {
|
|
this.endSubset();
|
|
}
|
|
|
|
this.endMetadata();
|
|
|
|
this._root.end();
|
|
this._root.data.Pages.end();
|
|
this._root.data.Names.end();
|
|
this.endAcroForm();
|
|
|
|
if (this._root.data.ViewerPreferences) {
|
|
this._root.data.ViewerPreferences.end();
|
|
}
|
|
|
|
if (this._security) {
|
|
this._security.end();
|
|
}
|
|
|
|
if (this._waiting === 0) {
|
|
return this._finalize();
|
|
} else {
|
|
return (this._ended = true);
|
|
}
|
|
}
|
|
|
|
_finalize() {
|
|
// generate xref
|
|
const xRefOffset = this._offset;
|
|
this._write('xref');
|
|
this._write(`0 ${this._offsets.length + 1}`);
|
|
this._write('0000000000 65535 f ');
|
|
|
|
for (let offset of this._offsets) {
|
|
offset = `0000000000${offset}`.slice(-10);
|
|
this._write(offset + ' 00000 n ');
|
|
}
|
|
|
|
// trailer
|
|
const trailer = {
|
|
Size: this._offsets.length + 1,
|
|
Root: this._root,
|
|
Info: this._info,
|
|
ID: [this._id, this._id]
|
|
};
|
|
if (this._security) {
|
|
trailer.Encrypt = this._security.dictionary;
|
|
}
|
|
|
|
this._write('trailer');
|
|
this._write(PDFObject.convert(trailer));
|
|
|
|
this._write('startxref');
|
|
this._write(`${xRefOffset}`);
|
|
this._write('%%EOF');
|
|
|
|
// end the stream
|
|
return this.push(null);
|
|
}
|
|
|
|
toString() {
|
|
return '[object PDFDocument]';
|
|
}
|
|
}
|
|
|
|
const mixin = methods => {
|
|
Object.assign(PDFDocument.prototype, methods);
|
|
};
|
|
|
|
mixin(MetadataMixin);
|
|
mixin(ColorMixin);
|
|
mixin(VectorMixin);
|
|
mixin(FontsMixin);
|
|
mixin(TextMixin);
|
|
mixin(ImagesMixin);
|
|
mixin(AnnotationsMixin);
|
|
mixin(OutlineMixin);
|
|
mixin(MarkingsMixin);
|
|
mixin(AcroFormMixin);
|
|
mixin(AttachmentsMixin);
|
|
mixin(SubsetMixin);
|
|
|
|
PDFDocument.LineWrapper = LineWrapper;
|
|
|
|
export default PDFDocument;
|