From 4be8308b55acbfa293826ab7234d2429073447e3 Mon Sep 17 00:00:00 2001
From: bhavnicksm
Date: Mon, 23 Dec 2024 21:59:46 +0530
Subject: [PATCH] Add LateChunker support to chunker and module exports

- Introduced LateChunker to the chunking module and updated the __init__.py files to include it in the public API.
- Enhanced the chunking capabilities by integrating LateChunker, following recent improvements in its functionality.

This commit builds on the previous work done for LateChunking, ensuring it is accessible for users of the chonkie library.
---
 src/chonkie/__init__.py         | 4 ++++
 src/chonkie/chunker/__init__.py | 2 ++
 2 files changed, 6 insertions(+)

diff --git a/src/chonkie/__init__.py b/src/chonkie/__init__.py
index 5945266..a635839 100644
--- a/src/chonkie/__init__.py
+++ b/src/chonkie/__init__.py
@@ -7,6 +7,7 @@
     SentenceChunker,
     TokenChunker,
     WordChunker,
+    LateChunker,
 )
 from .embeddings import (
     AutoEmbeddings,
@@ -26,6 +27,7 @@
     SemanticSentence,
     Sentence,
     SentenceChunk,
+    LateChunk,
 )
 
 __version__ = "0.3.0"
@@ -47,6 +49,7 @@
     "SemanticChunk",
     "Sentence",
     "SemanticSentence",
+    "LateChunk",
 ]
 
 # Add all chunker classes to __all__
@@ -57,6 +60,7 @@
     "SentenceChunker",
     "SemanticChunker",
     "SDPMChunker",
+    "LateChunker",
 ]
 
 # Add all embeddings classes to __all__
diff --git a/src/chonkie/chunker/__init__.py b/src/chonkie/chunker/__init__.py
index e04c980..24f62dc 100644
--- a/src/chonkie/chunker/__init__.py
+++ b/src/chonkie/chunker/__init__.py
@@ -6,6 +6,7 @@
 from .sentence import SentenceChunker
 from .token import TokenChunker
 from .word import WordChunker
+from .late import LateChunker
 
 __all__ = [
     "BaseChunker",
@@ -14,4 +15,5 @@
     "SentenceChunker",
     "SemanticChunker",
     "SDPMChunker",
+    "LateChunker",
 ]