TrainingDataExtractor

Struct TrainingDataExtractor 

Source
pub struct TrainingDataExtractor { /* private fields */ }
Expand description

Training data extractor

Implementations§

Source§

impl TrainingDataExtractor

Source

pub fn new(min_confidence: f32) -> Self

Create a new training data extractor

§Arguments
  • min_confidence - Minimum confidence threshold for auto-labeling (0.6-0.9)
§Examples
use organizational_intelligence_plugin::training::TrainingDataExtractor;

let extractor = TrainingDataExtractor::new(0.75);
Source

pub fn extract_training_data( &self, commits: &[CommitInfo], _repository_name: &str, ) -> Result<Vec<TrainingExample>>

Extract training examples from commit history

Filters commits and auto-labels them using a rule-based classifier.

§Arguments
  • commits - Raw commit history
  • repository_name - Name of the repository (declared as _repository_name in the signature, which suggests it is currently unused)
§Returns
  • Ok(Vec<TrainingExample>) - Labeled training examples
  • Err - If extraction fails
§Examples
use organizational_intelligence_plugin::training::TrainingDataExtractor;
use organizational_intelligence_plugin::git::CommitInfo;

let extractor = TrainingDataExtractor::new(0.75);
let commits = vec![
    CommitInfo {
        hash: "abc123".to_string(),
        message: "fix: null pointer dereference".to_string(),
        author: "dev@example.com".to_string(),
        timestamp: 1234567890,
        files_changed: 2,
        lines_added: 10,
        lines_removed: 5,
    },
];

let examples = extractor.extract_training_data(&commits, "test-repo").unwrap();
assert_eq!(examples.len(), 1);
Source

pub fn create_splits( &self, examples: &[TrainingExample], repositories: &[String], ) -> Result<TrainingDataset>

Create train/validation/test splits

Uses 70/15/15 split (train/validation/test) as recommended by the spec.

§Arguments
  • examples - Labeled training examples
  • repositories - List of repository names
§Returns
  • Ok(TrainingDataset) - Dataset with splits
  • Err - If split fails
§Examples
use organizational_intelligence_plugin::training::TrainingDataExtractor;
use organizational_intelligence_plugin::training::TrainingExample;
use organizational_intelligence_plugin::classifier::DefectCategory;

let extractor = TrainingDataExtractor::new(0.75);
let examples = vec![
    TrainingExample {
        message: "fix: bug".to_string(),
        label: DefectCategory::MemorySafety,
        confidence: 0.85,
        commit_hash: "abc".to_string(),
        author: "dev".to_string(),
        timestamp: 123,
        lines_added: 5,
        lines_removed: 2,
        files_changed: 1,
        error_code: None,
        clippy_lint: None,
        has_suggestion: false,
        suggestion_applicability: None,
        source: organizational_intelligence_plugin::citl::TrainingSource::CommitMessage,
    },
];

let dataset = extractor.create_splits(&examples, &["repo1".to_string()]).unwrap();
assert!(dataset.train.len() + dataset.validation.len() + dataset.test.len() == 1);
Source

pub fn get_statistics(&self, examples: &[TrainingExample]) -> String

Get statistics about extracted training data

§Arguments
  • examples - Training examples
§Returns
  • Formatted statistics string

Trait Implementations§

Source§

impl Default for TrainingDataExtractor

Source§

fn default() -> Self

Returns the “default value” for a type. Read more

Auto Trait Implementations§

Blanket Implementations§

Source§

impl<T> Any for T
where T: 'static + ?Sized,

Source§

fn type_id(&self) -> TypeId

Gets the TypeId of self. Read more
Source§

impl<T> Borrow<T> for T
where T: ?Sized,

Source§

fn borrow(&self) -> &T

Immutably borrows from an owned value. Read more
Source§

impl<T> BorrowMut<T> for T
where T: ?Sized,

Source§

fn borrow_mut(&mut self) -> &mut T

Mutably borrows from an owned value. Read more
Source§

impl<T> From<T> for T

Source§

fn from(t: T) -> T

Returns the argument unchanged.

Source§

impl<T> Instrument for T

Source§

fn instrument(self, span: Span) -> Instrumented<Self>

Instruments this type with the provided Span, returning an Instrumented wrapper. Read more
Source§

fn in_current_span(self) -> Instrumented<Self>

Instruments this type with the current Span, returning an Instrumented wrapper. Read more
Source§

impl<T, U> Into<U> for T
where U: From<T>,

Source§

fn into(self) -> U

Calls U::from(self).

That is, this conversion is whatever the implementation of From<T> for U chooses to do.

Source§

impl<T> IntoEither for T

Source§

fn into_either(self, into_left: bool) -> Either<Self, Self>

Converts self into a Left variant of Either<Self, Self> if into_left is true. Converts self into a Right variant of Either<Self, Self> otherwise. Read more
Source§

fn into_either_with<F>(self, into_left: F) -> Either<Self, Self>
where F: FnOnce(&Self) -> bool,

Converts self into a Left variant of Either<Self, Self> if into_left(&self) returns true. Converts self into a Right variant of Either<Self, Self> otherwise. Read more
Source§

impl<T> Pointable for T

Source§

const ALIGN: usize

The alignment of pointer.
Source§

type Init = T

The type for initializers.
Source§

unsafe fn init(init: <T as Pointable>::Init) -> usize

Initializes a value with the given initializer. Read more
Source§

unsafe fn deref<'a>(ptr: usize) -> &'a T

Dereferences the given pointer. Read more
Source§

unsafe fn deref_mut<'a>(ptr: usize) -> &'a mut T

Mutably dereferences the given pointer. Read more
Source§

unsafe fn drop(ptr: usize)

Drops the object pointed to by the given pointer. Read more
Source§

impl<T> PolicyExt for T
where T: ?Sized,

Source§

fn and<P, B, E>(self, other: P) -> And<T, P>
where T: Policy<B, E>, P: Policy<B, E>,

Create a new Policy that returns Action::Follow only if self and other return Action::Follow. Read more
Source§

fn or<P, B, E>(self, other: P) -> Or<T, P>
where T: Policy<B, E>, P: Policy<B, E>,

Create a new Policy that returns Action::Follow if either self or other returns Action::Follow. Read more
Source§

impl<T> Same for T

Source§

type Output = T

Should always be Self
Source§

impl<SS, SP> SupersetOf<SS> for SP
where SS: SubsetOf<SP>,

Source§

fn to_subset(&self) -> Option<SS>

The inverse inclusion map: attempts to construct the equivalent subset element from self. Read more
Source§

fn is_in_subset(&self) -> bool

Checks if self is actually part of its subset SS (and can be converted to it).
Source§

fn to_subset_unchecked(&self) -> SS

Use with care! Same as self.to_subset but without any property checks. Always succeeds.
Source§

fn from_subset(element: &SS) -> SP

The inclusion map: converts element to the equivalent element of its superset.
Source§

impl<T, U> TryFrom<U> for T
where U: Into<T>,

Source§

type Error = Infallible

The type returned in the event of a conversion error.
Source§

fn try_from(value: U) -> Result<T, <T as TryFrom<U>>::Error>

Performs the conversion.
Source§

impl<T, U> TryInto<U> for T
where U: TryFrom<T>,

Source§

type Error = <U as TryFrom<T>>::Error

The type returned in the event of a conversion error.
Source§

fn try_into(self) -> Result<U, <U as TryFrom<T>>::Error>

Performs the conversion.
Source§

impl<V, T> VZip<V> for T
where V: MultiLane<T>,

Source§

fn vzip(self) -> V

Source§

impl<T> WithSubscriber for T

Source§

fn with_subscriber<S>(self, subscriber: S) -> WithDispatch<Self>
where S: Into<Dispatch>,

Attaches the provided Subscriber to this type, returning a WithDispatch wrapper. Read more
Source§

fn with_current_subscriber(self) -> WithDispatch<Self>

Attaches the current default Subscriber to this type, returning a WithDispatch wrapper. Read more
Source§

impl<T> Allocation for T
where T: RefUnwindSafe + Send + Sync,