agsamantha/node_modules/@langchain/community/dist/document_loaders/web/pdf.d.ts
2024-10-02 15:15:21 -05:00

33 lines
1.1 KiB
TypeScript

/// <reference path="../../../src/types/pdf-parse.d.ts" />
import { Document } from "@langchain/core/documents";
import { BaseDocumentLoader } from "@langchain/core/document_loaders/base";
/**
* A document loader for loading data from PDFs.
* @example
* ```typescript
* const loader = new WebPDFLoader(new Blob());
* const docs = await loader.load();
* console.log({ docs });
* ```
*/
export declare class WebPDFLoader extends BaseDocumentLoader {
protected blob: Blob;
protected splitPages: boolean;
private pdfjs;
protected parsedItemSeparator: string;
constructor(blob: Blob, { splitPages, pdfjs, parsedItemSeparator, }?: {
splitPages?: boolean | undefined;
pdfjs?: typeof PDFLoaderImports | undefined;
parsedItemSeparator?: string | undefined;
});
/**
* Loads the contents of the PDF as documents.
* @returns An array of Documents representing the retrieved data.
*/
load(): Promise<Document[]>;
}
declare function PDFLoaderImports(): Promise<{
getDocument: typeof import("pdf-parse/lib/pdf.js/v1.10.100/build/pdf.js").getDocument;
version: string;
}>;
export {};