-
Notifications
You must be signed in to change notification settings - Fork 2.2k
/
buffer.ts
73 lines (69 loc) · 2.73 KB
/
buffer.ts
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
import type { readFile as ReadFileT } from "node:fs/promises";
import { Document } from "@langchain/core/documents";
import { getEnv } from "@langchain/core/utils/env";
import { BaseDocumentLoader } from "../base.js";
/**
* Abstract class that extends the `BaseDocumentLoader` class. It
* represents a document loader that loads documents from a buffer. The
* `load()` method is implemented to read the buffer contents and metadata
* based on the type of `filePathOrBlob`, and then calls the `parse()`
* method to parse the buffer and return the documents.
*/
export abstract class BufferLoader extends BaseDocumentLoader {
constructor(public filePathOrBlob: string | Blob) {
super();
}
/**
* Abstract method that needs to be implemented by subclasses. It is used
* to parse the buffer and return the documents.
* @param raw The buffer to be parsed.
* @param metadata Metadata of the document.
* @returns Promise that resolves with an array of `Document` objects.
*/
protected abstract parse(
raw: Buffer,
metadata: Document["metadata"]
): Promise<Document[]>;
/**
* Method that reads the buffer contents and metadata based on the type of
* `filePathOrBlob`, and then calls the `parse()` method to parse the
* buffer and return the documents.
* @returns Promise that resolves with an array of `Document` objects.
*/
public async load(): Promise<Document[]> {
let buffer: Buffer;
let metadata: Record<string, string>;
if (typeof this.filePathOrBlob === "string") {
const { readFile } = await BufferLoader.imports();
buffer = await readFile(this.filePathOrBlob);
metadata = { source: this.filePathOrBlob };
} else {
buffer = await this.filePathOrBlob
.arrayBuffer()
.then((ab) => Buffer.from(ab));
metadata = { source: "blob", blobType: this.filePathOrBlob.type };
}
return this.parse(buffer, metadata);
}
/**
* Static method that imports the `readFile` function from the
* `fs/promises` module in Node.js. It is used to dynamically import the
* function when needed. If the import fails, it throws an error
* indicating that the `fs/promises` module is not available in the
* current environment.
* @returns Promise that resolves with an object containing the `readFile` function.
*/
static async imports(): Promise<{
readFile: typeof ReadFileT;
}> {
try {
const { readFile } = await import("node:fs/promises");
return { readFile };
} catch (e) {
console.error(e);
throw new Error(
`Failed to load fs/promises. TextLoader available only on environment 'node'. It appears you are running environment '${getEnv()}'. See https://<link to docs> for alternatives.`
);
}
}
}