import { RecursiveCharacterTextSplitter } from 'langchain/text_splitter';
import { BaseChunker } from './BaseChunker';
/**
 * Shape of the options object this module passes to
 * `RecursiveCharacterTextSplitter`.
 *
 * NOTE(review): the field meanings below follow LangChain's text-splitter
 * options and are not defined in this file — verify them against the
 * installed `langchain` version.
 */
interface TextSplitterChunkParams {
  /** Upper bound on the size of a chunk (presumably in characters — confirm). */
  chunkSize: number;
  /** Amount of content repeated between consecutive chunks (presumably same unit as `chunkSize`). */
  chunkOverlap: number;
  /** Presumably controls whether the separator a split occurred on stays in the output — confirm. */
  keepSeparator: boolean;
}
/**
 * Splitter settings used when constructing `WebPageChunker`:
 * `chunkSize` 500, `chunkOverlap` 0, `keepSeparator` disabled.
 */
const TEXT_SPLITTER_CHUNK_PARAMS: TextSplitterChunkParams = {
  chunkSize: 500,
  chunkOverlap: 0,
  keepSeparator: false,
};
/**
 * Chunker that supplies `BaseChunker` with a `RecursiveCharacterTextSplitter`
 * configured from `TEXT_SPLITTER_CHUNK_PARAMS`.
 *
 * NOTE(review): the name suggests it is intended for web page content, but
 * nothing in this file enforces that — confirm against callers.
 */
class WebPageChunker extends BaseChunker {
  /**
   * Builds the text splitter from the module-level settings and passes it to
   * the `BaseChunker` constructor. Takes no arguments.
   */
  constructor() {
    const textSplitter = new RecursiveCharacterTextSplitter(
      TEXT_SPLITTER_CHUNK_PARAMS
    );
    super(textSplitter);
  }
}

export { WebPageChunker };