File size: 4,056 Bytes
1b756c8
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
import { ClassicPreset } from 'rete';
import { BaseWorkflowNode } from './base-node';
import { pdfSocket } from '../sockets';
import type { PDFData, SocketData, MultiPDFData } from '../types';
import { PDFDocument } from 'pdf-lib';
import { readFileAsArrayBuffer, initializeQpdf } from '../../utils/helpers.js';

/**
 * Error raised when a PDF cannot be used because it is password-protected.
 *
 * The offending file's name is kept on the instance so that callers can
 * identify which upload needs a password.
 */
export class EncryptedPDFError extends Error {
  /** Name of the file that was found to be password-protected. */
  public readonly filename: string;

  /**
   * @param filename - Name of the password-protected file; embedded in the
   *   error message and stored on {@link EncryptedPDFError.filename}.
   */
  constructor(filename: string) {
    const message = `PDF "${filename}" is password-protected`;
    super(message);
    this.filename = filename;
    this.name = 'EncryptedPDFError';
  }
}

/**
 * Workflow node that holds one or more uploaded PDF files and exposes them
 * on its single `pdf` output.
 *
 * Files are parsed with pdf-lib when they are added. Password-protected
 * files are rejected by {@link PDFInputNode.addFile} with an
 * {@link EncryptedPDFError}; they can be added through
 * {@link PDFInputNode.addDecryptedFile} once a password is known.
 */
export class PDFInputNode extends BaseWorkflowNode {
  readonly category = 'Input' as const;
  readonly icon = 'ph-file-pdf';
  readonly description = 'Upload one or more PDF files';

  /** Successfully loaded files, in the order they were added. */
  private files: PDFData[] = [];

  constructor() {
    super('PDF Input');
    this.addOutput('pdf', new ClassicPreset.Output(pdfSocket, 'PDF'));
  }

  /**
   * Reads, parses and appends a PDF file to this node.
   *
   * @param file - The uploaded file to add.
   * @throws {EncryptedPDFError} If the normal load fails but the file can be
   *   loaded with `ignoreEncryption: true`.
   * @throws {Error} If the file cannot be loaded either way (reported as
   *   possibly corrupted).
   */
  async addFile(file: File): Promise<void> {
    const arrayBuffer = await readFileAsArrayBuffer(file);
    const bytes = new Uint8Array(arrayBuffer as ArrayBuffer);

    let document: PDFDocument;
    try {
      // Keep the document from this load: a success here is both the
      // "not encrypted" check and the parse we actually need, so the file
      // is not parsed a second time.
      document = await PDFDocument.load(bytes, { throwOnInvalidObject: false });
    } catch {
      // The normal load failed. Retry while ignoring encryption purely to
      // tell "encrypted" apart from "unreadable"; the result is discarded.
      try {
        await PDFDocument.load(bytes, {
          ignoreEncryption: true,
          throwOnInvalidObject: false,
        });
      } catch {
        throw new Error(
          `Failed to load "${file.name}" - file may be corrupted`
        );
      }
      throw new EncryptedPDFError(file.name);
    }

    this.files.push({
      type: 'pdf',
      document,
      bytes,
      filename: file.name,
    });
  }

  /**
   * Decrypts a password-protected PDF with qpdf and appends the decrypted
   * result to this node.
   *
   * The file is written to a temporary path in qpdf's `FS`, qpdf is run with
   * `--password=<password> --decrypt`, and the output is read back and
   * parsed with pdf-lib. Both temporary paths are unlinked afterwards
   * whether or not decryption succeeded.
   *
   * @param file - The encrypted file to add.
   * @param password - Password passed to qpdf.
   * @throws Whatever qpdf's `FS`/`callMain` or `PDFDocument.load` throw.
   *   NOTE(review): a wrong password presumably surfaces as a failure to
   *   read the output file — confirm against the qpdf wrapper.
   */
  async addDecryptedFile(file: File, password: string): Promise<void> {
    const arrayBuffer = await readFileAsArrayBuffer(file);
    const bytes = new Uint8Array(arrayBuffer as ArrayBuffer);
    const qpdf = await initializeQpdf();
    // Timestamp + random suffix keeps the temp paths of separate calls apart.
    const uid = `${Date.now()}_${Math.random().toString(36).slice(2, 9)}`;
    const inputPath = `/tmp/input_decrypt_${uid}.pdf`;
    const outputPath = `/tmp/output_decrypt_${uid}.pdf`;

    try {
      qpdf.FS.writeFile(inputPath, bytes);
      qpdf.callMain([
        inputPath,
        '--password=' + password,
        '--decrypt',
        outputPath,
      ]);
      const decryptedData = qpdf.FS.readFile(outputPath, {
        encoding: 'binary',
      });
      const decryptedBytes = new Uint8Array(decryptedData);
      const document = await PDFDocument.load(decryptedBytes, {
        throwOnInvalidObject: false,
      });
      this.files.push({
        type: 'pdf',
        document,
        bytes: decryptedBytes,
        filename: file.name,
      });
    } finally {
      // Best-effort cleanup: either path may not exist if an earlier step
      // failed, so unlink errors are deliberately ignored.
      try {
        qpdf.FS.unlink(inputPath);
      } catch {
        /* cleanup */
      }
      try {
        qpdf.FS.unlink(outputPath);
      } catch {
        /* cleanup */
      }
    }
  }

  /**
   * Replaces all held files with a single file.
   *
   * The current files are discarded before the new file is loaded, so the
   * node is left empty if loading throws.
   *
   * @param file - The file that becomes the node's only content.
   * @throws Same errors as {@link PDFInputNode.addFile}.
   */
  async setFile(file: File): Promise<void> {
    this.files = [];
    await this.addFile(file);
  }

  /**
   * Replaces all held files with the given list, loaded one after another
   * in order.
   *
   * The current files are discarded first. If loading a file throws, files
   * earlier in the list stay added and later ones are not processed.
   *
   * @param fileList - Files to load, in output order.
   * @throws Same errors as {@link PDFInputNode.addFile}.
   */
  async setFiles(fileList: File[]): Promise<void> {
    this.files = [];
    for (const file of fileList) {
      await this.addFile(file);
    }
  }

  /**
   * Removes the file at the given position.
   *
   * Indices that are not integers within `0 .. getFileCount() - 1` are
   * ignored. Without this guard `splice` would treat a negative index as an
   * offset from the end (so `-1` would delete the last file) and `NaN` as 0.
   *
   * @param index - Zero-based position of the file to remove.
   */
  removeFile(index: number): void {
    if (!Number.isInteger(index) || index < 0 || index >= this.files.length) {
      return;
    }
    this.files.splice(index, 1);
  }

  /** @returns `true` when at least one file is held. */
  hasFile(): boolean {
    return this.files.length > 0;
  }

  /** @returns The number of files currently held. */
  getFileCount(): number {
    return this.files.length;
  }

  /** @returns The filenames of all held files, in insertion order. */
  getFilenames(): string[] {
    return this.files.map((f) => f.filename);
  }

  /**
   * @returns A display label: `''` when empty, the filename when exactly one
   *   file is held, otherwise `"<count> files"`.
   */
  getFilename(): string {
    if (this.files.length === 0) return '';
    if (this.files.length === 1) return this.files[0].filename;
    return `${this.files.length} files`;
  }

  /**
   * Produces the value for the `pdf` output.
   *
   * @param _inputs - Unused; this node has no inputs.
   * @returns The single held file as-is, or a `multi-pdf` wrapper around all
   *   held files when there is more than one.
   * @throws {Error} If no files have been added.
   */
  async data(
    _inputs: Record<string, SocketData[]>
  ): Promise<Record<string, SocketData>> {
    if (this.files.length === 0) {
      throw new Error('No PDF files uploaded in PDF Input node');
    }

    if (this.files.length === 1) {
      return { pdf: this.files[0] };
    }

    const multiData: MultiPDFData = {
      type: 'multi-pdf',
      // Shallow copy so a consumer that reorders or trims `items` cannot
      // alter this node's own file list.
      items: [...this.files],
    };
    return { pdf: multiData };
  }
}