Struct LateChunkingStrategy

Source

pub struct LateChunkingStrategy { /* private fields */ }

Expand description

Context-aware chunking strategy for use with late-chunking embedding models

Splits text using HierarchicalChunker and records precise byte-offset spans in each chunk’s metadata. A late-chunking embedding provider (Jina API or a local candle model) can then use these spans to extract per-chunk representations from a single full-document forward pass.

§Examples

use graphrag_core::text::late_chunking::{LateChunkingStrategy, LateChunkingConfig};
use graphrag_core::core::{ChunkingStrategy, DocumentId};

let strategy = LateChunkingStrategy::with_defaults(DocumentId::new("doc-1".to_string()));
let chunks = strategy.chunk("First paragraph.\n\nSecond paragraph.");

for chunk in &chunks {
    // position_in_document ∈ [0.0, 1.0] — used by embedding provider for pooling
    assert!(chunk.metadata.position_in_document.is_some());
}

Struct LateChunkingStrategy Copy item path

§Examples

Implementations§

impl LateChunkingStrategy

pub fn new(config: LateChunkingConfig, document_id: DocumentId) -> Self

pub fn with_defaults(document_id: DocumentId) -> Self

pub fn with_max_doc_tokens(self, max_tokens: u32) -> Self

pub fn estimate_tokens(text: &str) -> u32

pub fn fits_in_context(&self, text: &str) -> bool

pub fn split_into_sections(&self, text: &str) -> Vec<String>

Trait Implementations§

impl ChunkingStrategy for LateChunkingStrategy

fn chunk(&self, text: &str) -> Vec<TextChunk>

Auto Trait Implementations§

impl Freeze for LateChunkingStrategy

impl RefUnwindSafe for LateChunkingStrategy

impl Send for LateChunkingStrategy

impl Sync for LateChunkingStrategy

impl Unpin for LateChunkingStrategy

impl UnsafeUnpin for LateChunkingStrategy

impl UnwindSafe for LateChunkingStrategy

Blanket Implementations§

impl<T> Any for T where T: 'static + ?Sized,

fn type_id(&self) -> TypeId

impl<T> Borrow<T> for T where T: ?Sized,

fn borrow(&self) -> &T

impl<T> BorrowMut<T> for T where T: ?Sized,

fn borrow_mut(&mut self) -> &mut T

impl<T> From<T> for T

fn from(t: T) -> T

impl<T> Instrument for T

fn instrument(self, span: Span) -> Instrumented<Self>

fn in_current_span(self) -> Instrumented<Self>

impl<T, U> Into<U> for T where U: From<T>,

fn into(self) -> U

impl<T> IntoEither for T

fn into_either(self, into_left: bool) -> Either<Self, Self>

fn into_either_with<F>(self, into_left: F) -> Either<Self, Self> where F: FnOnce(&Self) -> bool,

impl<T> Pointable for T

const ALIGN: usize

type Init = T

unsafe fn init(init: <T as Pointable>::Init) -> usize

unsafe fn deref<'a>(ptr: usize) -> &'a T

unsafe fn deref_mut<'a>(ptr: usize) -> &'a mut T

unsafe fn drop(ptr: usize)

impl<T, U> TryFrom<U> for T where U: Into<T>,

type Error = Infallible

fn try_from(value: U) -> Result<T, <T as TryFrom<U>>::Error>

impl<T, U> TryInto<U> for T where U: TryFrom<T>,

type Error = <U as TryFrom<T>>::Error

fn try_into(self) -> Result<U, <U as TryFrom<T>>::Error>

impl<V, T> VZip<V> for T where V: MultiLane<T>,

fn vzip(self) -> V

impl<T> WithSubscriber for T

fn with_subscriber<S>(self, subscriber: S) -> WithDispatch<Self> where S: Into<Dispatch>,

fn with_current_subscriber(self) -> WithDispatch<Self>

impl<T> ErasedDestructor for T where T: 'static,

Struct LateChunkingStrategy

impl<T> Any for T
where T: 'static + ?Sized,

impl<T> Borrow<T> for T
where T: ?Sized,

impl<T> BorrowMut<T> for T
where T: ?Sized,

impl<T, U> Into<U> for T
where U: From<T>,

fn into_either_with<F>(self, into_left: F) -> Either<Self, Self>
where F: FnOnce(&Self) -> bool,

impl<T, U> TryFrom<U> for T
where U: Into<T>,

impl<T, U> TryInto<U> for T
where U: TryFrom<T>,

impl<V, T> VZip<V> for T
where V: MultiLane<T>,

fn with_subscriber<S>(self, subscriber: S) -> WithDispatch<Self>
where S: Into<Dispatch>,

impl<T> ErasedDestructor for T
where T: 'static,