Meilisearch - Added metadata as filterable attributes and polling on enqueued tasks (#3042)

* added polling for enqueued tasks,metadata filterable

* delete index feature with polling on task

* added search filter interface

* Update pnpm-lock.yaml

---------

Co-authored-by: Henry Heng <henryheng@flowiseai.com>
This commit is contained in:
Mohamed Yasser Oaf
2024-08-23 18:27:07 +03:00
committed by GitHub
parent 72a03dc6e8
commit 0f58d31493
2 changed files with 116 additions and 12 deletions
@@ -55,7 +55,7 @@ class MeilisearchRetriever_node implements INode {
label: 'Host', label: 'Host',
name: 'host', name: 'host',
type: 'string', type: 'string',
description: 'This is the URL for the desired Meilisearch instance' description: "This is the URL for the desired Meilisearch instance, the URL must not end with a '/'"
}, },
{ {
label: 'Index Uid', label: 'Index Uid',
@@ -63,11 +63,17 @@ class MeilisearchRetriever_node implements INode {
type: 'string', type: 'string',
description: 'UID for the index to answer from' description: 'UID for the index to answer from'
}, },
{
label: 'Delete Index if exists',
name: 'deleteIndex',
type: 'boolean',
optional: true
},
{ {
label: 'Top K', label: 'Top K',
name: 'K', name: 'K',
type: 'number', type: 'number',
description: 'number of top searches to return as context', description: 'number of top searches to return as context, default is 4',
additionalParams: true, additionalParams: true,
optional: true optional: true
}, },
@@ -75,7 +81,15 @@ class MeilisearchRetriever_node implements INode {
label: 'Semantic Ratio', label: 'Semantic Ratio',
name: 'semanticRatio', name: 'semanticRatio',
type: 'number', type: 'number',
description: 'percentage of sematic reasoning in meilisearch hybrid search', description: 'percentage of sematic reasoning in meilisearch hybrid search, default is 0.75',
additionalParams: true,
optional: true
},
{
label: 'Search Filter',
name: 'searchFilter',
type: 'string',
description: 'search filter to apply on searchable attributes',
additionalParams: true, additionalParams: true,
optional: true optional: true
} }
@@ -104,6 +118,7 @@ class MeilisearchRetriever_node implements INode {
const docs = nodeData.inputs?.document as Document[] const docs = nodeData.inputs?.document as Document[]
const host = nodeData.inputs?.host as string const host = nodeData.inputs?.host as string
const indexUid = nodeData.inputs?.indexUid as string const indexUid = nodeData.inputs?.indexUid as string
const deleteIndex = nodeData.inputs?.deleteIndex as boolean
const embeddings = nodeData.inputs?.embeddings as Embeddings const embeddings = nodeData.inputs?.embeddings as Embeddings
let embeddingDimension: number = 384 let embeddingDimension: number = 384
const client = new Meilisearch({ const client = new Meilisearch({
@@ -132,17 +147,52 @@ class MeilisearchRetriever_node implements INode {
finalDocs.push(documentForIndexing) finalDocs.push(documentForIndexing)
} }
} }
let taskUid_created: number = 0
if (deleteIndex) {
try {
const deleteResponse = await client.deleteIndex(indexUid)
taskUid_created = deleteResponse.taskUid
let deleteTaskStatus = await client.getTask(taskUid_created)
while (deleteTaskStatus.status !== 'succeeded') {
deleteTaskStatus = await client.getTask(taskUid_created)
if (deleteTaskStatus.error !== null || deleteTaskStatus.status === 'failed') {
throw new Error('Error during index deletion task: ' + deleteTaskStatus.error)
}
}
} catch (error) {
console.error(error)
console.warn('Error occured when deleting your index, if it did not exist, we will create one for you... ')
}
}
let index: any let index: any
try { try {
index = await client.getIndex(indexUid) index = await client.getIndex(indexUid)
} catch (error) { } catch (error) {
console.error('Error fetching index:', error) console.warn('Index not found, creating a new index...')
await client.createIndex(indexUid, { primaryKey: 'objectID' })
} finally { try {
index = await client.getIndex(indexUid) const createResponse = await client.createIndex(indexUid, { primaryKey: 'objectID' })
taskUid_created = createResponse.taskUid
let createTaskStatus = await client.getTask(taskUid_created)
while (createTaskStatus.status !== 'succeeded') {
createTaskStatus = await client.getTask(taskUid_created)
if (createTaskStatus.error !== null || createTaskStatus.status === 'failed') {
throw new Error('Error during index creation task: ' + createTaskStatus.error)
}
}
index = await client.getIndex(indexUid)
} catch (taskError) {
console.error('Error during index creation process:', taskError)
}
} }
try { try {
await index.updateFilterableAttributes(['metadata'])
await index.updateSettings({ await index.updateSettings({
embedders: { embedders: {
ollama: { ollama: {
@@ -151,23 +201,72 @@ class MeilisearchRetriever_node implements INode {
} }
} }
}) })
await index.addDocuments(finalDocs) const addResponse = await index.addDocuments(finalDocs)
taskUid_created = addResponse.taskUid
let AddTaskStatus = await client.getTask(taskUid_created)
while (AddTaskStatus.status !== 'succeeded') {
AddTaskStatus = await client.getTask(taskUid_created)
if (AddTaskStatus.error !== null || AddTaskStatus.status === 'failed') {
throw new Error('Error during documents adding task: ' + AddTaskStatus.error)
}
}
index = await client.getIndex(indexUid)
} catch (error) { } catch (error) {
console.error('Error occurred while adding documents:', error) console.error('Error occurred while adding documents:', error)
} }
return return { numAdded: finalDocs.length, addedDocs: finalDocs }
} }
} }
async init(nodeData: INodeData, _: string, options: ICommonObject): Promise<any> { async init(nodeData: INodeData, _: string, options: ICommonObject): Promise<any> {
const credentialData = await getCredentialData(nodeData.credential ?? '', options) const credentialData = await getCredentialData(nodeData.credential ?? '', options)
const meilisearchSearchApiKey = getCredentialParam('meilisearchSearchApiKey', credentialData, nodeData) const meilisearchSearchApiKey = getCredentialParam('meilisearchSearchApiKey', credentialData, nodeData)
const meilisearchAdminApiKey = getCredentialParam('meilisearchAdminApiKey', credentialData, nodeData)
const host = nodeData.inputs?.host as string const host = nodeData.inputs?.host as string
const indexUid = nodeData.inputs?.indexUid as string const indexUid = nodeData.inputs?.indexUid as string
const K = nodeData.inputs?.K as string const K = nodeData.inputs?.K as string
const semanticRatio = nodeData.inputs?.semanticRatio as string const semanticRatio = nodeData.inputs?.semanticRatio as string
const embeddings = nodeData.inputs?.embeddings as Embeddings const embeddings = nodeData.inputs?.embeddings as Embeddings
const searchFilter = nodeData.inputs?.searchFilter as string
const hybridsearchretriever = new MeilisearchRetriever(host, meilisearchSearchApiKey, indexUid, K, semanticRatio, embeddings) const experimentalEndpoint = host + '/experimental-features/'
const token = meilisearchAdminApiKey
const experimentalOptions = {
method: 'PATCH',
headers: {
'Content-Type': 'application/json',
Authorization: `Bearer ${token}`
},
body: JSON.stringify({
vectorStore: true
})
}
try {
const response = await fetch(experimentalEndpoint, experimentalOptions)
if (!response.ok) {
throw new Error(`Failed to enable vectorStore: ${response.statusText}`)
}
const data = await response.json()
const vectorStoreEnabled = data.vectorStore
if (vectorStoreEnabled !== true) {
throw new Error('Failed to enable vectorStore, vectorStrore property returned is not true')
}
} catch (error) {
console.error('Error enabling vectorStore feature:', error)
}
const hybridsearchretriever = new MeilisearchRetriever(
host,
meilisearchSearchApiKey,
indexUid,
K,
semanticRatio,
embeddings,
searchFilter
)
return hybridsearchretriever return hybridsearchretriever
} }
} }
@@ -13,6 +13,7 @@ export class MeilisearchRetriever extends BaseRetriever {
private K: string private K: string
private semanticRatio: string private semanticRatio: string
private embeddings: Embeddings private embeddings: Embeddings
private searchFilter: string
constructor( constructor(
host: string, host: string,
meilisearchSearchApiKey: any, meilisearchSearchApiKey: any,
@@ -20,6 +21,7 @@ export class MeilisearchRetriever extends BaseRetriever {
K: string, K: string,
semanticRatio: string, semanticRatio: string,
embeddings: Embeddings, embeddings: Embeddings,
searchFilter: string,
fields?: CustomRetrieverInput fields?: CustomRetrieverInput
) { ) {
super(fields) super(fields)
@@ -27,9 +29,10 @@ export class MeilisearchRetriever extends BaseRetriever {
this.host = host this.host = host
this.indexUid = indexUid this.indexUid = indexUid
this.embeddings = embeddings this.embeddings = embeddings
this.searchFilter = searchFilter
if (semanticRatio == '') { if (semanticRatio == '') {
this.semanticRatio = '0.5' this.semanticRatio = '0.75'
} else { } else {
let semanticRatio_Float = parseFloat(semanticRatio) let semanticRatio_Float = parseFloat(semanticRatio)
if (semanticRatio_Float > 1.0) { if (semanticRatio_Float > 1.0) {
@@ -59,6 +62,7 @@ export class MeilisearchRetriever extends BaseRetriever {
const questionEmbedding = await this.embeddings.embedQuery(query) const questionEmbedding = await this.embeddings.embedQuery(query)
// Perform the search // Perform the search
const searchResults = await index.search(query, { const searchResults = await index.search(query, {
filter: this.searchFilter,
vector: questionEmbedding, vector: questionEmbedding,
limit: parseInt(this.K), // Optional: Limit the number of results limit: parseInt(this.K), // Optional: Limit the number of results
attributesToRetrieve: ['*'], // Optional: Specify which fields to retrieve attributesToRetrieve: ['*'], // Optional: Specify which fields to retrieve
@@ -80,7 +84,8 @@ export class MeilisearchRetriever extends BaseRetriever {
new Document({ new Document({
pageContent: hit.pageContent, pageContent: hit.pageContent,
metadata: { metadata: {
objectID: hit.objectID objectID: hit.objectID,
...hit.metadata
} }
}) })
) )