Flowise/packages/components/nodes/tools/Arxiv/Arxiv.ts

145 lines
5.4 KiB
TypeScript

import { ICommonObject, INode, INodeData, INodeParams } from '../../../src/Interface'
import { getBaseClasses } from '../../../src/utils'
import { ArxivParameters, desc, ArxivTool } from './core'
class Arxiv_Tools implements INode {
label: string
name: string
version: number
description: string
type: string
icon: string
category: string
baseClasses: string[]
inputs: INodeParams[]
constructor() {
this.label = 'Arxiv'
this.name = 'arxiv'
this.version = 1.0
this.type = 'Arxiv'
this.icon = 'arxiv.png'
this.category = 'Tools'
this.description = 'Search and read content from academic papers on Arxiv'
this.baseClasses = [this.type, ...getBaseClasses(ArxivTool)]
this.inputs = [
{
label: 'Name',
name: 'arxivName',
type: 'string',
default: 'arxiv_search',
description: 'Name of the tool',
additionalParams: true,
optional: true
},
{
label: 'Description',
name: 'arxivDescription',
type: 'string',
rows: 4,
default: desc,
description: 'Describe to LLM when it should use this tool',
additionalParams: true,
optional: true
},
{
label: 'Top K Results',
name: 'topKResults',
type: 'number',
description: 'Number of top results to return from Arxiv search',
default: '3',
step: 1,
optional: true,
additionalParams: true
},
{
label: 'Max Query Length',
name: 'maxQueryLength',
type: 'number',
description: 'Maximum length of the search query',
default: '300',
step: 1,
optional: true,
additionalParams: true
},
{
label: 'Max Content Length',
name: 'docContentCharsMax',
type: 'number',
description: 'Maximum length of the returned content. Set to 0 for unlimited',
default: '10000',
step: 1,
optional: true,
additionalParams: true
},
{
label: 'Load Full Content',
name: 'loadFullContent',
type: 'boolean',
description:
'Download PDFs and extract full paper content instead of just summaries. Warning: This is slower and uses more resources.',
default: false,
optional: true,
additionalParams: true
},
{
label: 'Continue On Failure',
name: 'continueOnFailure',
type: 'boolean',
description:
'Continue processing other papers if one fails to download/parse (only applies when Load Full Content is enabled)',
default: false,
optional: true,
additionalParams: true
},
{
label: 'Use Legacy Build',
name: 'legacyBuild',
type: 'boolean',
description: 'Use legacy PDF.js build for PDF parsing (only applies when Load Full Content is enabled)',
default: false,
optional: true,
additionalParams: true
}
]
}
async init(nodeData: INodeData, _: string, options: ICommonObject): Promise<any> {
const name = (nodeData.inputs?.name as string) || (nodeData.inputs?.arxivName as string)
const description = (nodeData.inputs?.description as string) || (nodeData.inputs?.arxivDescription as string)
const topKResults = nodeData.inputs?.topKResults as string
const maxQueryLength = nodeData.inputs?.maxQueryLength as string
const docContentCharsMax = nodeData.inputs?.docContentCharsMax as string
const loadFullContent = nodeData.inputs?.loadFullContent as boolean
const continueOnFailure = nodeData.inputs?.continueOnFailure as boolean
const legacyBuild = nodeData.inputs?.legacyBuild as boolean
let logger
const orgId = options.orgId
if (process.env.DEBUG === 'true') {
logger = options.logger
}
const obj: ArxivParameters = {}
if (description) obj.description = description
if (name)
obj.name = name
.toLowerCase()
.replace(/ /g, '_')
.replace(/[^a-z0-9_-]/g, '')
if (topKResults) obj.topKResults = parseInt(topKResults, 10)
if (maxQueryLength) obj.maxQueryLength = parseInt(maxQueryLength, 10)
if (docContentCharsMax) {
const maxChars = parseInt(docContentCharsMax, 10)
obj.docContentCharsMax = maxChars === 0 ? undefined : maxChars
}
if (loadFullContent !== undefined) obj.loadFullContent = loadFullContent
if (continueOnFailure !== undefined) obj.continueOnFailure = continueOnFailure
if (legacyBuild !== undefined) obj.legacyBuild = legacyBuild
return new ArxivTool(obj, logger, orgId)
}
}
module.exports = { nodeClass: Arxiv_Tools }