UNPKG

@n8n/n8n-nodes-langchain

Version:

![Banner image](https://user-images.githubusercontent.com/10284570/173569848-c624317f-42b1-45a6-ab09-f0ea3c247648.png)

335 lines 13.8 kB
"use strict"; Object.defineProperty(exports, "__esModule", { value: true }); exports.DocumentDefaultDataLoader = void 0; const textsplitters_1 = require("@langchain/textsplitters"); const n8n_workflow_1 = require("n8n-workflow"); const ai_utilities_1 = require("@n8n/ai-utilities"); require("mammoth"); require("epub2"); require("pdf-parse"); function getInputs(parameters) { const inputs = []; const textSplittingMode = parameters?.textSplittingMode; if (!textSplittingMode || textSplittingMode === 'custom') { inputs.push({ displayName: 'Text Splitter', maxConnections: 1, type: 'ai_textSplitter', required: true, }); } return inputs; } class DocumentDefaultDataLoader { constructor() { this.description = { displayName: 'Default Data Loader', name: 'documentDefaultDataLoader', icon: 'node:default-data-loader', iconColor: 'gray', group: ['transform'], version: [1, 1.1], defaultVersion: 1.1, description: 'Load data from previous step in the workflow', defaults: { name: 'Default Data Loader', }, codex: { categories: ['AI'], subcategories: { AI: ['Document Loaders'], }, resources: { primaryDocumentation: [ { url: 'https://docs.n8n.io/integrations/builtin/cluster-nodes/sub-nodes/n8n-nodes-langchain.documentdefaultdataloader/', }, ], }, }, inputs: `={{ ((parameter) => { ${getInputs.toString()}; return getInputs(parameter) })($parameter) }}`, outputs: [n8n_workflow_1.NodeConnectionTypes.AiDocument], outputNames: ['Document'], builderHint: { inputs: { ai_textSplitter: { required: true, displayOptions: { show: { textSplittingMode: ['custom'] } }, }, }, }, properties: [ { displayName: 'This will load data from a previous step in the workflow. <a href="/templates/1962" target="_blank">Example</a>', name: 'notice', type: 'notice', default: '', }, { displayName: 'Type of Data', name: 'dataType', type: 'options', default: 'json', required: true, noDataExpression: true, options: [ { name: 'JSON', value: 'json', description: 'Process JSON data from previous step in the workflow', }, { name: 'Binary', value: 'binary', description: 'Process binary data from previous step in the workflow', }, ], }, { displayName: 'Mode', name: 'jsonMode', type: 'options', default: 'allInputData', required: true, displayOptions: { show: { dataType: ['json'], }, }, options: [ { name: 'Load All Input Data', value: 'allInputData', description: 'Use all JSON data that flows into the parent agent or chain', }, { name: 'Load Specific Data', value: 'expressionData', description: 'Load a subset of data, and/or data from any previous step in the workflow', }, ], }, { displayName: 'Mode', name: 'binaryMode', type: 'options', default: 'allInputData', required: true, displayOptions: { show: { dataType: ['binary'], }, }, options: [ { name: 'Load All Input Data', value: 'allInputData', description: 'Use all Binary data that flows into the parent agent or chain', }, { name: 'Load Specific Data', value: 'specificField', description: 'Load data from a specific field in the parent agent or chain', }, ], }, { displayName: 'Data Format', name: 'loader', type: 'options', default: 'auto', required: true, displayOptions: { show: { dataType: ['binary'], }, }, options: [ { name: 'Automatically Detect by Mime Type', value: 'auto', description: 'Uses the mime type to detect the format', }, { name: 'CSV', value: 'csvLoader', description: 'Load CSV files', }, { name: 'Docx', value: 'docxLoader', description: 'Load Docx documents', }, { name: 'EPub', value: 'epubLoader', description: 'Load EPub files', }, { name: 'JSON', value: 'jsonLoader', description: 'Load JSON files', }, { name: 'PDF', value: 'pdfLoader', description: 'Load PDF documents', }, { name: 'Text', value: 'textLoader', description: 'Load plain text files', }, ], }, { displayName: 'Data', name: 'jsonData', type: 'string', typeOptions: { rows: 6, }, default: '', required: true, description: 'Drag and drop fields from the input pane, or use an expression', displayOptions: { show: { dataType: ['json'], jsonMode: ['expressionData'], }, }, }, { displayName: 'Input Data Field Name', name: 'binaryDataKey', type: 'string', default: 'data', required: true, description: 'The name of the field in the agent or chain’s input that contains the binary file to be processed', displayOptions: { show: { dataType: ['binary'], }, hide: { binaryMode: ['allInputData'], }, }, }, { displayName: 'Text Splitting', name: 'textSplittingMode', type: 'options', default: 'simple', required: true, noDataExpression: true, displayOptions: { show: { '@version': [1.1], }, }, options: [ { name: 'Simple', value: 'simple', description: 'Splits every 1000 characters with a 200 character overlap', }, { name: 'Custom', value: 'custom', description: 'Connect a custom text-splitting sub-node', }, ], }, { displayName: 'Options', name: 'options', type: 'collection', placeholder: 'Add Option', default: {}, options: [ { displayName: 'JSON Pointers', name: 'pointers', type: 'string', default: '', description: 'Pointers to extract from JSON, e.g. "/text" or "/text, /meta/title"', displayOptions: { show: { '/loader': ['jsonLoader', 'auto'], }, }, }, { displayName: 'CSV Separator', name: 'separator', type: 'string', description: 'Separator to use for CSV', default: ',', displayOptions: { show: { '/loader': ['csvLoader', 'auto'], }, }, }, { displayName: 'CSV Column', name: 'column', type: 'string', default: '', description: 'Column to extract from CSV', displayOptions: { show: { '/loader': ['csvLoader', 'auto'], }, }, }, { displayName: 'Split Pages in PDF', description: 'Whether to split PDF pages into separate documents', name: 'splitPages', type: 'boolean', default: true, displayOptions: { show: { '/loader': ['pdfLoader', 'auto'], }, }, }, { ...ai_utilities_1.metadataFilterField, displayName: 'Metadata', description: 'Metadata to add to each document. Could be used for filtering during retrieval', placeholder: 'Add property', }, ], }, ], }; } async supplyData(itemIndex) { const node = this.getNode(); const dataType = this.getNodeParameter('dataType', itemIndex, 'json'); let textSplitter; if (node.typeVersion === 1.1) { const textSplittingMode = this.getNodeParameter('textSplittingMode', itemIndex, 'simple'); if (textSplittingMode === 'simple') { textSplitter = new textsplitters_1.RecursiveCharacterTextSplitter({ chunkSize: 1000, chunkOverlap: 200 }); } else if (textSplittingMode === 'custom') { textSplitter = (await this.getInputConnectionData(n8n_workflow_1.NodeConnectionTypes.AiTextSplitter, 0)); } } else { textSplitter = (await this.getInputConnectionData(n8n_workflow_1.NodeConnectionTypes.AiTextSplitter, 0)); } const binaryDataKey = this.getNodeParameter('binaryDataKey', itemIndex, ''); const processor = dataType === 'binary' ? new ai_utilities_1.N8nBinaryLoader(this, 'options.', binaryDataKey, textSplitter) : new ai_utilities_1.N8nJsonLoader(this, 'options.', textSplitter); return { response: (0, ai_utilities_1.logWrapper)(processor, this), }; } } exports.DocumentDefaultDataLoader = DocumentDefaultDataLoader; //# sourceMappingURL=DocumentDefaultDataLoader.node.js.map