import { flatten } from 'lodash' import { Pinecone } from '@pinecone-database/pinecone' import { PineconeStoreParams, PineconeStore } from '@langchain/pinecone' import { Embeddings } from '@langchain/core/embeddings' import { Document } from '@langchain/core/documents' import { ICommonObject, INode, INodeData, INodeOutputsValue, INodeParams, IndexingResult } from '../../../src/Interface' import { getBaseClasses, getCredentialData, getCredentialParam } from '../../../src/utils' import { addMMRInputParams, resolveVectorStoreOrRetriever } from '../VectorStoreUtils' import { index } from '../../../src/indexing' class Pinecone_VectorStores implements INode { label: string name: string version: number description: string type: string icon: string category: string badge: string baseClasses: string[] inputs: INodeParams[] credential: INodeParams outputs: INodeOutputsValue[] constructor() { this.label = 'Pinecone' this.name = 'pinecone' this.version = 3.0 this.type = 'Pinecone' this.icon = 'pinecone.svg' this.category = 'Vector Stores' this.description = `Upsert embedded data and perform similarity or mmr search using Pinecone, a leading fully managed hosted vector database` this.baseClasses = [this.type, 'VectorStoreRetriever', 'BaseRetriever'] this.badge = 'NEW' this.credential = { label: 'Connect Credential', name: 'credential', type: 'credential', credentialNames: ['pineconeApi'] } this.inputs = [ { label: 'Document', name: 'document', type: 'Document', list: true, optional: true }, { label: 'Embeddings', name: 'embeddings', type: 'Embeddings' }, { label: 'Record Manager', name: 'recordManager', type: 'RecordManager', description: 'Keep track of the record to prevent duplication', optional: true }, { label: 'Pinecone Index', name: 'pineconeIndex', type: 'string' }, { label: 'Pinecone Namespace', name: 'pineconeNamespace', type: 'string', placeholder: 'my-first-namespace', additionalParams: true, optional: true }, { label: 'Pinecone Metadata Filter', name: 'pineconeMetadataFilter', type: 'json', optional: true, additionalParams: true }, { label: 'Top K', name: 'topK', description: 'Number of top results to fetch. Default to 4', placeholder: '4', type: 'number', additionalParams: true, optional: true } ] addMMRInputParams(this.inputs) this.outputs = [ { label: 'Pinecone Retriever', name: 'retriever', baseClasses: this.baseClasses }, { label: 'Pinecone Vector Store', name: 'vectorStore', baseClasses: [this.type, ...getBaseClasses(PineconeStore)] } ] } //@ts-ignore vectorStoreMethods = { async upsert(nodeData: INodeData, options: ICommonObject): Promise> { const _index = nodeData.inputs?.pineconeIndex as string const pineconeNamespace = nodeData.inputs?.pineconeNamespace as string const docs = nodeData.inputs?.document as Document[] const embeddings = nodeData.inputs?.embeddings as Embeddings const recordManager = nodeData.inputs?.recordManager const credentialData = await getCredentialData(nodeData.credential ?? '', options) const pineconeApiKey = getCredentialParam('pineconeApiKey', credentialData, nodeData) const client = new Pinecone({ apiKey: pineconeApiKey }) const pineconeIndex = client.Index(_index) const flattenDocs = docs && docs.length ? flatten(docs) : [] const finalDocs = [] for (let i = 0; i < flattenDocs.length; i += 1) { if (flattenDocs[i] && flattenDocs[i].pageContent) { finalDocs.push(new Document(flattenDocs[i])) } } const obj: PineconeStoreParams = { pineconeIndex } if (pineconeNamespace) obj.namespace = pineconeNamespace try { if (recordManager) { const vectorStore = await PineconeStore.fromExistingIndex(embeddings, obj) await recordManager.createSchema() const res = await index({ docsSource: finalDocs, recordManager, vectorStore, options: { cleanup: recordManager?.cleanup, sourceIdKey: recordManager?.sourceIdKey ?? 'source', vectorStoreName: pineconeNamespace } }) return res } else { await PineconeStore.fromDocuments(finalDocs, embeddings, obj) return { numAdded: finalDocs.length, addedDocs: finalDocs } } } catch (e) { throw new Error(e) } } } async init(nodeData: INodeData, _: string, options: ICommonObject): Promise { const index = nodeData.inputs?.pineconeIndex as string const pineconeNamespace = nodeData.inputs?.pineconeNamespace as string const pineconeMetadataFilter = nodeData.inputs?.pineconeMetadataFilter const embeddings = nodeData.inputs?.embeddings as Embeddings const credentialData = await getCredentialData(nodeData.credential ?? '', options) const pineconeApiKey = getCredentialParam('pineconeApiKey', credentialData, nodeData) const client = new Pinecone({ apiKey: pineconeApiKey }) await client.describeIndex(index) const pineconeIndex = client.Index(index) const obj: PineconeStoreParams = { pineconeIndex } if (pineconeNamespace) obj.namespace = pineconeNamespace if (pineconeMetadataFilter) { const metadatafilter = typeof pineconeMetadataFilter === 'object' ? pineconeMetadataFilter : JSON.parse(pineconeMetadataFilter) obj.filter = metadatafilter } const vectorStore = await PineconeStore.fromExistingIndex(embeddings, obj) return resolveVectorStoreOrRetriever(nodeData, vectorStore, obj.filter) } } module.exports = { nodeClass: Pinecone_VectorStores }