24 lines
1.2 KiB
TypeScript
24 lines
1.2 KiB
TypeScript
|
/// <reference types="node" resolution-mode="require"/>
|
||
|
import { Document } from "@langchain/core/documents";
|
||
|
import { BufferLoader } from "langchain/document_loaders/fs/buffer";
|
||
|
/**
|
||
|
* A class that extends the `BufferLoader` class. It represents a document
|
||
|
* loader that loads documents from DOCX files.
|
||
|
*/
|
||
|
export declare class DocxLoader extends BufferLoader {
|
||
|
constructor(filePathOrBlob: string | Blob);
|
||
|
/**
|
||
|
* A method that takes a `raw` buffer and `metadata` as parameters and
|
||
|
* returns a promise that resolves to an array of `Document` instances. It
|
||
|
* uses the `extractRawText` function from the `mammoth` module to extract
|
||
|
* the raw text content from the buffer. If the extracted text content is
|
||
|
* empty, it returns an empty array. Otherwise, it creates a new
|
||
|
* `Document` instance with the extracted text content and the provided
|
||
|
* metadata, and returns it as an array.
|
||
|
* @param raw The raw buffer from which to extract text content.
|
||
|
* @param metadata The metadata to be associated with the created `Document` instance.
|
||
|
* @returns A promise that resolves to an array of `Document` instances.
|
||
|
*/
|
||
|
parse(raw: Buffer, metadata: Document["metadata"]): Promise<Document[]>;
|
||
|
}
|