Files
docx-js/src/patcher/from-docx.ts

147 lines
4.8 KiB
TypeScript
Raw Normal View History

2023-02-08 03:18:11 +00:00
import * as JSZip from "jszip";
2023-02-18 20:36:24 +00:00
import { Element, js2xml } from "xml-js";
2023-02-25 19:33:12 +00:00
import { ParagraphChild } from "@file/paragraph";
import { FileChild } from "@file/file-child";
2023-03-03 23:47:50 +00:00
import { IMediaData, Media } from "@file/media";
import { IViewWrapper } from "@file/document-wrapper";
import { File } from "@file/file";
import { IContext } from "@file/xml-components";
import { ImageReplacer } from "@export/packer/image-replacer";
2023-02-25 19:33:12 +00:00
2023-02-16 20:17:48 +00:00
import { replacer } from "./replacer";
2023-02-17 10:38:03 +00:00
import { findLocationOfText } from "./traverser";
2023-02-18 20:36:24 +00:00
import { toJson } from "./util";
2023-03-03 23:47:50 +00:00
import { appendRelationship, getNextRelationshipIndex } from "./relationship-manager";
import { appendContentType } from "./content-types-manager";
2023-02-08 03:18:11 +00:00
// eslint-disable-next-line functional/prefer-readonly-type
type InputDataType = Buffer | string | number[] | Uint8Array | ArrayBuffer | Blob | NodeJS.ReadableStream;
2023-02-25 19:33:12 +00:00
export enum PatchType {
DOCUMENT = "file",
PARAGRAPH = "paragraph",
2023-02-17 10:38:03 +00:00
}
2023-02-25 19:33:12 +00:00
type ParagraphPatch = {
readonly type: PatchType.PARAGRAPH;
readonly children: readonly ParagraphChild[];
};
type FilePatch = {
readonly type: PatchType.DOCUMENT;
readonly children: readonly FileChild[];
};
2023-03-03 23:47:50 +00:00
interface IRelationshipReplacement {
readonly key: string;
readonly mediaDatas: readonly IMediaData[];
}
2023-02-25 22:18:31 +00:00
export type IPatch = ParagraphPatch | FilePatch;
2023-02-25 19:33:12 +00:00
2023-02-17 10:38:03 +00:00
export interface PatchDocumentOptions {
2023-02-25 22:18:31 +00:00
readonly patches: { readonly [key: string]: IPatch };
2023-02-16 20:17:48 +00:00
}
2023-03-03 23:47:50 +00:00
const imageReplacer = new ImageReplacer();
2023-02-16 20:17:48 +00:00
export const patchDocument = async (data: InputDataType, options: PatchDocumentOptions): Promise<Buffer> => {
2023-02-08 03:18:11 +00:00
const zipContent = await JSZip.loadAsync(data);
2023-03-03 23:47:50 +00:00
const context: IContext = {
file: {
Media: new Media(),
} as unknown as File,
viewWrapper: {} as unknown as IViewWrapper,
stack: [],
};
2023-02-17 10:38:03 +00:00
const map = new Map<string, Element>();
2023-02-08 03:18:11 +00:00
2023-03-03 23:47:50 +00:00
// eslint-disable-next-line functional/prefer-readonly-type
const relationshipReplacement: IRelationshipReplacement[] = [];
let hasMedia = false;
2023-02-08 03:18:11 +00:00
for (const [key, value] of Object.entries(zipContent.files)) {
const json = toJson(await value.async("text"));
2023-03-03 23:47:50 +00:00
if (key.startsWith("word/") && !key.endsWith(".xml.rels")) {
2023-02-25 22:18:31 +00:00
for (const [patchKey, patchValue] of Object.entries(options.patches)) {
const patchText = `{{${patchKey}}}`;
const renderedParagraphs = findLocationOfText(json, patchText);
2023-02-25 22:18:56 +00:00
// TODO: mutates json. Make it immutable
2023-03-03 23:47:50 +00:00
replacer(json, patchValue, patchText, renderedParagraphs, context);
}
const mediaDatas = imageReplacer.getMediaData(JSON.stringify(json), context.file.Media);
if (mediaDatas.length > 0) {
hasMedia = true;
// eslint-disable-next-line functional/immutable-data
relationshipReplacement.push({
key,
mediaDatas,
});
2023-02-17 10:38:03 +00:00
}
2023-02-16 20:17:48 +00:00
}
2023-02-08 03:18:11 +00:00
map.set(key, json);
}
2023-03-03 23:47:50 +00:00
for (const { key, mediaDatas } of relationshipReplacement) {
// eslint-disable-next-line functional/immutable-data
const relationshipsJson = map.get(`word/_rels/${key.split("/").pop()}.rels`);
if (relationshipsJson) {
const index = getNextRelationshipIndex(relationshipsJson);
const newJson = imageReplacer.replace(JSON.stringify(map.get(key)), mediaDatas, index);
map.set(key, JSON.parse(newJson) as Element);
for (const { fileName } of mediaDatas) {
appendRelationship(
relationshipsJson,
index,
"http://schemas.openxmlformats.org/officeDocument/2006/relationships/image",
`media/${fileName}`,
);
}
}
}
if (hasMedia) {
const contentTypesJson = map.get("[Content_Types].xml");
if (!contentTypesJson) {
throw new Error("Could not find content types file");
}
appendContentType(contentTypesJson, "image/png", "png");
appendContentType(contentTypesJson, "image/jpeg", "jpeg");
appendContentType(contentTypesJson, "image/jpeg", "jpg");
appendContentType(contentTypesJson, "image/bmp", "bmp");
appendContentType(contentTypesJson, "image/gif", "gif");
}
2023-02-08 03:18:11 +00:00
const zip = new JSZip();
for (const [key, value] of map) {
const output = toXml(value);
zip.file(key, output);
}
2023-03-03 23:47:50 +00:00
for (const { stream, fileName } of context.file.Media.Array) {
zip.file(`word/media/${fileName}`, stream);
}
return zip.generateAsync({
2023-02-08 03:18:11 +00:00
type: "nodebuffer",
mimeType: "application/vnd.openxmlformats-officedocument.wordprocessingml.document",
compression: "DEFLATE",
});
};
2023-02-17 10:38:03 +00:00
const toXml = (jsonObj: Element): string => {
2023-02-08 03:18:11 +00:00
const output = js2xml(jsonObj);
return output;
};