mirror of
https://github.com/farcasclaudiu/Flowise.git
synced 2026-06-29 11:01:18 +03:00
Adding support for LLM Caching.
This commit is contained in:
@@ -0,0 +1,44 @@
|
|||||||
|
import { INode, INodeData, INodeOutputsValue, INodeParams } from '../../../src/Interface'
|
||||||
|
import { InMemoryCache } from 'langchain/cache'
|
||||||
|
import { getBaseClasses } from '../../../src'
|
||||||
|
|
||||||
|
class LocalMemoryCache implements INode {
|
||||||
|
label: string
|
||||||
|
name: string
|
||||||
|
version: number
|
||||||
|
description: string
|
||||||
|
type: string
|
||||||
|
icon: string
|
||||||
|
category: string
|
||||||
|
baseClasses: string[]
|
||||||
|
inputs: INodeParams[]
|
||||||
|
outputs: INodeOutputsValue[]
|
||||||
|
inMemoryCache: any
|
||||||
|
|
||||||
|
constructor() {
|
||||||
|
this.label = 'Local (Builtin) Cache'
|
||||||
|
this.name = 'localCache'
|
||||||
|
this.version = 1.0
|
||||||
|
this.type = 'LLMCache'
|
||||||
|
this.icon = 'memorycache.png'
|
||||||
|
this.category = 'LLM Cache'
|
||||||
|
this.baseClasses = [this.type, 'LLMCacheBase']
|
||||||
|
this.inputs = []
|
||||||
|
this.outputs = [
|
||||||
|
{
|
||||||
|
label: 'LLM Cache',
|
||||||
|
name: 'cache',
|
||||||
|
baseClasses: [this.type, ...getBaseClasses(InMemoryCache)]
|
||||||
|
}
|
||||||
|
]
|
||||||
|
}
|
||||||
|
|
||||||
|
async init(nodeData: INodeData): Promise<any> {
|
||||||
|
if (!this.inMemoryCache) {
|
||||||
|
this.inMemoryCache = InMemoryCache.global()
|
||||||
|
}
|
||||||
|
return this.inMemoryCache
|
||||||
|
}
|
||||||
|
}
|
||||||
|
|
||||||
|
module.exports = { nodeClass: LocalMemoryCache }
|
||||||
Binary file not shown.
|
After Width: | Height: | Size: 2.7 KiB |
@@ -1,6 +1,8 @@
|
|||||||
import { ICommonObject, INode, INodeData, INodeParams } from '../../../src/Interface'
|
import { ICommonObject, INode, INodeData, INodeParams } from '../../../src/Interface'
|
||||||
import { getBaseClasses, getCredentialData, getCredentialParam } from '../../../src/utils'
|
import { getBaseClasses, getCredentialData, getCredentialParam } from '../../../src/utils'
|
||||||
import { OpenAI, OpenAIInput } from 'langchain/llms/openai'
|
import { OpenAI, OpenAIInput } from 'langchain/llms/openai'
|
||||||
|
import { BaseLLMParams } from 'langchain/dist/llms/base'
|
||||||
|
import { BaseCache } from 'langchain/schema'
|
||||||
|
|
||||||
class OpenAI_LLMs implements INode {
|
class OpenAI_LLMs implements INode {
|
||||||
label: string
|
label: string
|
||||||
@@ -17,7 +19,7 @@ class OpenAI_LLMs implements INode {
|
|||||||
constructor() {
|
constructor() {
|
||||||
this.label = 'OpenAI'
|
this.label = 'OpenAI'
|
||||||
this.name = 'openAI'
|
this.name = 'openAI'
|
||||||
this.version = 2.0
|
this.version = 3.0
|
||||||
this.type = 'OpenAI'
|
this.type = 'OpenAI'
|
||||||
this.icon = 'openai.png'
|
this.icon = 'openai.png'
|
||||||
this.category = 'LLMs'
|
this.category = 'LLMs'
|
||||||
@@ -30,6 +32,12 @@ class OpenAI_LLMs implements INode {
|
|||||||
credentialNames: ['openAIApi']
|
credentialNames: ['openAIApi']
|
||||||
}
|
}
|
||||||
this.inputs = [
|
this.inputs = [
|
||||||
|
{
|
||||||
|
label: 'Cache',
|
||||||
|
name: 'llmCache',
|
||||||
|
type: 'LLMCache',
|
||||||
|
optional: true
|
||||||
|
},
|
||||||
{
|
{
|
||||||
label: 'Model Name',
|
label: 'Model Name',
|
||||||
name: 'modelName',
|
name: 'modelName',
|
||||||
@@ -149,7 +157,9 @@ class OpenAI_LLMs implements INode {
|
|||||||
const credentialData = await getCredentialData(nodeData.credential ?? '', options)
|
const credentialData = await getCredentialData(nodeData.credential ?? '', options)
|
||||||
const openAIApiKey = getCredentialParam('openAIApiKey', credentialData, nodeData)
|
const openAIApiKey = getCredentialParam('openAIApiKey', credentialData, nodeData)
|
||||||
|
|
||||||
const obj: Partial<OpenAIInput> & { openAIApiKey?: string } = {
|
const llmCache = nodeData.inputs?.llmCache as BaseCache
|
||||||
|
|
||||||
|
const obj: Partial<OpenAIInput> & BaseLLMParams & { openAIApiKey?: string } = {
|
||||||
temperature: parseFloat(temperature),
|
temperature: parseFloat(temperature),
|
||||||
modelName,
|
modelName,
|
||||||
openAIApiKey,
|
openAIApiKey,
|
||||||
@@ -164,8 +174,9 @@ class OpenAI_LLMs implements INode {
|
|||||||
if (batchSize) obj.batchSize = parseInt(batchSize, 10)
|
if (batchSize) obj.batchSize = parseInt(batchSize, 10)
|
||||||
if (bestOf) obj.bestOf = parseInt(bestOf, 10)
|
if (bestOf) obj.bestOf = parseInt(bestOf, 10)
|
||||||
|
|
||||||
let parsedBaseOptions: any | undefined = undefined
|
if (llmCache) obj.cache = llmCache
|
||||||
|
|
||||||
|
let parsedBaseOptions: any | undefined = undefined
|
||||||
if (baseOptions) {
|
if (baseOptions) {
|
||||||
try {
|
try {
|
||||||
parsedBaseOptions = typeof baseOptions === 'object' ? baseOptions : JSON.parse(baseOptions)
|
parsedBaseOptions = typeof baseOptions === 'object' ? baseOptions : JSON.parse(baseOptions)
|
||||||
|
|||||||
@@ -42,7 +42,7 @@
|
|||||||
"google-auth-library": "^9.0.0",
|
"google-auth-library": "^9.0.0",
|
||||||
"graphql": "^16.6.0",
|
"graphql": "^16.6.0",
|
||||||
"html-to-text": "^9.0.5",
|
"html-to-text": "^9.0.5",
|
||||||
"langchain": "^0.0.152",
|
"langchain": "^0.0.154",
|
||||||
"langfuse-langchain": "^1.0.14-alpha.0",
|
"langfuse-langchain": "^1.0.14-alpha.0",
|
||||||
"langsmith": "^0.0.32",
|
"langsmith": "^0.0.32",
|
||||||
"linkifyjs": "^4.1.1",
|
"linkifyjs": "^4.1.1",
|
||||||
|
|||||||
@@ -1,6 +1,7 @@
|
|||||||
/**
|
/**
|
||||||
* Types
|
* Types
|
||||||
*/
|
*/
|
||||||
|
import { BaseCache } from 'langchain/schema'
|
||||||
|
|
||||||
export type NodeParamsType =
|
export type NodeParamsType =
|
||||||
| 'asyncOptions'
|
| 'asyncOptions'
|
||||||
@@ -176,3 +177,9 @@ export class VectorStoreRetriever {
|
|||||||
this.vectorStore = fields.vectorStore
|
this.vectorStore = fields.vectorStore
|
||||||
}
|
}
|
||||||
}
|
}
|
||||||
|
|
||||||
|
export interface LLMCacheBase {
|
||||||
|
name: string
|
||||||
|
description: string
|
||||||
|
baseCache: BaseCache
|
||||||
|
}
|
||||||
|
|||||||
@@ -151,6 +151,7 @@ export class CustomChainHandler extends BaseCallbackHandler {
|
|||||||
socketIOClientId = ''
|
socketIOClientId = ''
|
||||||
skipK = 0 // Skip streaming for first K numbers of handleLLMStart
|
skipK = 0 // Skip streaming for first K numbers of handleLLMStart
|
||||||
returnSourceDocuments = false
|
returnSourceDocuments = false
|
||||||
|
cachedResponse = true
|
||||||
|
|
||||||
constructor(socketIO: Server, socketIOClientId: string, skipK?: number, returnSourceDocuments?: boolean) {
|
constructor(socketIO: Server, socketIOClientId: string, skipK?: number, returnSourceDocuments?: boolean) {
|
||||||
super()
|
super()
|
||||||
@@ -161,6 +162,7 @@ export class CustomChainHandler extends BaseCallbackHandler {
|
|||||||
}
|
}
|
||||||
|
|
||||||
handleLLMStart() {
|
handleLLMStart() {
|
||||||
|
this.cachedResponse = false
|
||||||
if (this.skipK > 0) this.skipK -= 1
|
if (this.skipK > 0) this.skipK -= 1
|
||||||
}
|
}
|
||||||
|
|
||||||
@@ -175,13 +177,31 @@ export class CustomChainHandler extends BaseCallbackHandler {
|
|||||||
}
|
}
|
||||||
|
|
||||||
handleLLMEnd() {
|
handleLLMEnd() {
|
||||||
this.socketIO.to(this.socketIOClientId).emit('end')
|
/* send the end event from handleChainEnd */
|
||||||
|
// this.socketIO.to(this.socketIOClientId).emit('end')
|
||||||
}
|
}
|
||||||
|
|
||||||
handleChainEnd(outputs: ChainValues): void | Promise<void> {
|
handleChainEnd(outputs: ChainValues): void | Promise<void> {
|
||||||
if (this.returnSourceDocuments) {
|
if (this.returnSourceDocuments) {
|
||||||
this.socketIO.to(this.socketIOClientId).emit('sourceDocuments', outputs?.sourceDocuments)
|
this.socketIO.to(this.socketIOClientId).emit('sourceDocuments', outputs?.sourceDocuments)
|
||||||
}
|
}
|
||||||
|
/*
|
||||||
|
Langchain does not call handleLLMStart, handleLLMEnd, handleLLMNewToken when the chain is cached.
|
||||||
|
Callback Order is "Chain Start -> LLM Start --> LLM Token --> LLM End -> Chain End" for normal responses.
|
||||||
|
Callback Order is "Chain Start -> Chain End" for cached responses.
|
||||||
|
*/
|
||||||
|
if (this.cachedResponse) {
|
||||||
|
const cachedValue = outputs.text as string
|
||||||
|
//split at whitespace, and keep the whitespace. This is to preserve the original formatting.
|
||||||
|
const result = cachedValue.split(/(\s+)/)
|
||||||
|
result.forEach((token: string, index: number) => {
|
||||||
|
if (index === 0) {
|
||||||
|
this.socketIO.to(this.socketIOClientId).emit('start', token)
|
||||||
|
}
|
||||||
|
this.socketIO.to(this.socketIOClientId).emit('token', token)
|
||||||
|
})
|
||||||
|
}
|
||||||
|
this.socketIO.to(this.socketIOClientId).emit('end')
|
||||||
}
|
}
|
||||||
}
|
}
|
||||||
|
|
||||||
|
|||||||
Reference in New Issue
Block a user