agsamantha/node_modules/@langchain/community/dist/embeddings/tensorflow.js
2024-10-02 15:15:21 -05:00

83 lines
2.8 KiB
JavaScript

import { load } from "@tensorflow-models/universal-sentence-encoder";
import * as tf from "@tensorflow/tfjs-core";
import { Embeddings } from "@langchain/core/embeddings";
/**
* Class that extends the Embeddings class and provides methods for
* generating embeddings using the Universal Sentence Encoder model from
* TensorFlow.js.
* @example
* ```typescript
* const embeddings = new TensorFlowEmbeddings();
* const store = new MemoryVectorStore(embeddings);
*
* const documents = [
* "A document",
* "Some other piece of text",
* "One more",
* "And another",
* ];
*
* await store.addDocuments(
* documents.map((pageContent) => new Document({ pageContent }))
* );
* ```
*/
export class TensorFlowEmbeddings extends Embeddings {
constructor(fields) {
super(fields ?? {});
Object.defineProperty(this, "_cached", {
enumerable: true,
configurable: true,
writable: true,
value: void 0
});
try {
tf.backend();
}
catch (e) {
throw new Error("No TensorFlow backend found, see instructions at ...");
}
}
/**
* Private method that loads the Universal Sentence Encoder model if it
* hasn't been loaded already. It returns a promise that resolves to the
* loaded model.
* @returns Promise that resolves to the loaded Universal Sentence Encoder model.
*/
async load() {
if (this._cached === undefined) {
this._cached = load();
}
return this._cached;
}
_embed(texts) {
return this.caller.call(async () => {
const model = await this.load();
return model.embed(texts);
});
}
/**
* Method that takes a document as input and returns a promise that
* resolves to an embedding for the document. It calls the _embed method
* with the document as the input and processes the result to return a
* single embedding.
* @param document Document to generate an embedding for.
* @returns Promise that resolves to an embedding for the input document.
*/
embedQuery(document) {
return this._embed([document])
.then((embeddings) => embeddings.array())
.then((embeddings) => embeddings[0]);
}
/**
* Method that takes an array of documents as input and returns a promise
* that resolves to a 2D array of embeddings for each document. It calls
* the _embed method with the documents as the input and processes the
* result to return the embeddings.
* @param documents Array of documents to generate embeddings for.
* @returns Promise that resolves to a 2D array of embeddings for each input document.
*/
embedDocuments(documents) {
return this._embed(documents).then((embeddings) => embeddings.array());
}
}