Struct Data

Source

pub struct Data {
    pub id: Uuid,
    pub name: String,
    pub raw_data_location: String,
    pub original_data_location: String,
    pub extension: String,
    pub mime_type: String,
    pub content_hash: String,
    pub owner_id: Uuid,
    pub created_at: DateTime<Utc>,
    pub updated_at: Option<DateTime<Utc>>,
    pub label: Option<String>,
    pub original_extension: Option<String>,
    pub original_mime_type: Option<String>,
    pub loader_engine: Option<String>,
    pub raw_content_hash: Option<String>,
    pub tenant_id: Option<Uuid>,
    pub external_metadata: Option<String>,
    pub node_set: Option<String>,
    pub pipeline_status: Option<String>,
    pub token_count: i64,
    pub data_size: i64,
    pub last_accessed: Option<DateTime<Utc>>,
    pub importance_weight: Option<f64>,
}

Expand description

Represents a piece of data in the system, such as a file or a block of inline text. Fields match the Python cognee data table schema for cross-SDK compatibility.

Fields§

§id: Uuid

Unique identifier for this data record (UUID v5, deterministic from content hash)

§name: String

Display name derived from the source (filename, URL, or text_<md5>.txt for inline text)

§raw_data_location: String

file:// URI pointing to the stored raw content in the file storage backend

§original_data_location: String

Original source location before any processing (file path, URL, or same as raw_data_location for inline text)

§extension: String

File extension of the stored content (e.g. “txt”, “pdf”, “html”)

§mime_type: String

MIME type of the stored content (e.g. “text/plain”, “application/pdf”)

§content_hash: String

MD5 hex digest of the raw content bytes (content-only, no owner mixing)

§owner_id: Uuid

ID of the user or agent that owns this data record

§created_at: DateTime<Utc>

Timestamp when this record was first created

§updated_at: Option<DateTime<Utc>>

Timestamp of the last update to this record, if any

§label: Option<String>

Human-readable label for the data item (from DataItem wrapper or user-provided)

§original_extension: Option<String>

Original file extension before any conversion

§original_mime_type: Option<String>

Original MIME type before any conversion

§loader_engine: Option<String>

Python loader engine name (e.g. “text_loader”, “pypdf_loader”)

§raw_content_hash: Option<String>

MD5 hash of the extracted-text file stored by the loader at ADD time (Python parity, ingest_data.py:195). Equals content_hash only when the extracted text is byte-identical to the raw input (plain text); for inputs the loader transforms (PDF, CSV, HTML, image, audio) the two hashes differ.

§tenant_id: Option<Uuid>

Tenant/organisation ID for multi-tenant isolation

§external_metadata: Option<String>

Arbitrary JSON metadata blob

§node_set: Option<String>

JSON list of node IDs associated with this data item

§pipeline_status: Option<String>

Pipeline processing status

§token_count: i64

Token count of the data (-1 = not yet computed)

§data_size: i64

Size of the data in bytes (-1 = not yet computed)

§last_accessed: Option<DateTime<Utc>>

Last access timestamp

§importance_weight: Option<f64>

Importance weight for ranking (0.0 to 1.0). Influences relevance scoring.

Struct Data

Fields§

Implementations§

impl Data

pub fn builder( id: Uuid, name: impl Into<String>, raw_data_location: impl Into<String>, original_data_location: impl Into<String>, extension: impl Into<String>, mime_type: impl Into<String>, content_hash: impl Into<String>, owner_id: Uuid, ) -> DataBuilder

Trait Implementations§

impl Clone for Data

fn clone(&self) -> Data

fn clone_from(&mut self, source: &Self)

impl Debug for Data

fn fmt(&self, f: &mut Formatter<'_>) -> Result

impl<'de> Deserialize<'de> for Data

fn deserialize<__D>(__deserializer: __D) -> Result<Self, __D::Error> where __D: Deserializer<'de>,

impl Serialize for Data

fn serialize<__S>(&self, __serializer: __S) -> Result<__S::Ok, __S::Error> where __S: Serializer,

Auto Trait Implementations§

impl Freeze for Data

impl RefUnwindSafe for Data

impl Send for Data

impl Sync for Data

impl Unpin for Data

impl UnsafeUnpin for Data

impl UnwindSafe for Data

Blanket Implementations§

impl<T> Any for T where T: 'static + ?Sized,

fn type_id(&self) -> TypeId

impl<T> Borrow<T> for T where T: ?Sized,

fn borrow(&self) -> &T

impl<T> BorrowMut<T> for T where T: ?Sized,

fn borrow_mut(&mut self) -> &mut T

impl<T> CloneToUninit for T where T: Clone,

unsafe fn clone_to_uninit(&self, dest: *mut u8)

impl<T> DeserializeOwned for T where T: for<'de> Deserialize<'de>,

impl<T> DynClone for T where T: Clone,

fn __clone_box(&self, _: Private) -> *mut ()

impl<T> From<T> for T

fn from(t: T) -> T

impl<T, U> Into<U> for T where U: From<T>,

fn into(self) -> U

impl<T> ToOwned for T where T: Clone,

type Owned = T

fn to_owned(&self) -> T

fn clone_into(&self, target: &mut T)

impl<T, U> TryFrom<U> for T where U: Into<T>,

type Error = Infallible

fn try_from(value: U) -> Result<T, <T as TryFrom<U>>::Error>

impl<T, U> TryInto<U> for T where U: TryFrom<T>,

type Error = <U as TryFrom<T>>::Error

fn try_into(self) -> Result<U, <U as TryFrom<T>>::Error>

Struct Data

fn deserialize<D>(deserializer: D) -> Result<Self, D::Error>
where D: Deserializer<'de>,

fn serialize<S>(&self, serializer: S) -> Result<S::Ok, S::Error>
where S: Serializer,

impl<T> Any for T
where T: 'static + ?Sized,

impl<T> Borrow<T> for T
where T: ?Sized,

impl<T> BorrowMut<T> for T
where T: ?Sized,

impl<T> CloneToUninit for T
where T: Clone,

impl<T> DeserializeOwned for T
where T: for<'de> Deserialize<'de>,

impl<T> DynClone for T
where T: Clone,

impl<T, U> Into<U> for T
where U: From<T>,

impl<T> ToOwned for T
where T: Clone,

impl<T, U> TryFrom<U> for T
where U: Into<T>,

impl<T, U> TryInto<U> for T
where U: TryFrom<T>,