pub struct TextInput {
pub texts: Vec<String>,
}Expand description
Input for text embedding
Fields§
§texts: Vec<String>Implementations§
Source§impl TextInput
impl TextInput
pub fn new(texts: Vec<String>) -> Self
Sourcepub fn from_str(texts: &[&str]) -> Self
pub fn from_str(texts: &[&str]) -> Self
Examples found in repository?
examples/embed-mul-token.rs (lines 11-17)
3fn main() -> gte::util::result::Result<()> {
4 const TOKENIZER_PATH: &str = "models/gte-multilingual-base/tokenizer.json";
5 const MODEL_PATH: &str = "models/gte-multilingual-base/onnx/model.onnx";
6
7 let params = gte::params::Parameters::default().with_output_id("token_embeddings");
8 let pipeline = gte::embed::pipeline::TextEmbeddingPipeline::new(TOKENIZER_PATH, ¶ms)?;
9 let model = orp::model::Model::new(MODEL_PATH, orp::params::RuntimeParameters::default())?;
10
11 let inputs = gte::embed::input::TextInput::from_str(&[
12 "What is the capital of France?",
13 "How to implement quick sort in python?",
14 "Die Hauptstadt von Frankreich ist Paris.",
15 "La capital de Francia es París.",
16 "London is the capital of the UK",
17 ]);
18
19 let outputs = model.inference(inputs, &pipeline, ¶ms)?;
20 let distances = gte::util::test::distances_to_first(&outputs);
21
22 println!("Distances: {:?}", distances);
23
24 Ok(())
25}More examples
examples/embed-mul-sentence.rs (lines 14-20)
3fn main() -> gte::util::result::Result<()> {
4 const TOKENIZER_PATH: &str = "models/gte-multilingual-base/tokenizer.json";
5 const MODEL_PATH: &str = "models/gte-multilingual-base/onnx/model.onnx";
6
7 let params = gte::params::Parameters::default()
8 .with_output_id("sentence_embedding")
9 .with_mode(gte::embed::output::ExtractorMode::Raw);
10
11 let pipeline = gte::embed::pipeline::TextEmbeddingPipeline::new(TOKENIZER_PATH, ¶ms)?;
12 let model = orp::model::Model::new(MODEL_PATH, orp::params::RuntimeParameters::default())?;
13
14 let inputs = gte::embed::input::TextInput::from_str(&[
15 "What is the capital of France?",
16 "How to implement quick sort in python?",
17 "Die Hauptstadt von Frankreich ist Paris.",
18 "La capital de Francia es París.",
19 "London is the capital of the UK",
20 ]);
21
22 let outputs = model.inference(inputs, &pipeline, ¶ms)?;
23 let distances = gte::util::test::distances_to_first(&outputs);
24
25 println!("Distances: {:?}", distances);
26
27 Ok(())
28}examples/embed.rs (lines 14-19)
6fn main() -> gte::util::result::Result<()> {
7 const TOKENIZER_PATH: &str = "models/gte-modernbert-base/tokenizer.json";
8 const MODEL_PATH: &str = "models/gte-modernbert-base/onnx/model.onnx";
9
10 let params = gte::params::Parameters::default();
11 let pipeline = gte::embed::pipeline::TextEmbeddingPipeline::new(TOKENIZER_PATH, ¶ms)?;
12 let model = orp::model::Model::new(MODEL_PATH, orp::params::RuntimeParameters::default())?;
13
14 let inputs = gte::embed::input::TextInput::from_str(&[
15 "what is the capital of China?",
16 "how to implement quick sort in python?",
17 "Beijing",
18 "sorting algorithms",
19 ]);
20
21 const EXPECTED_DISTANCES: [f32; 3] = [0.4289073944091797, 0.7130911254882812, 0.33664554595947266];
22 const EPSILON: f32 = 0.000001;
23
24 let outputs = model.inference(inputs, &pipeline, ¶ms)?;
25 let distances = gte::util::test::distances_to_first(&outputs);
26
27 println!("Distances: {:?}", distances);
28 assert!(gte::util::test::is_close_to_a(&distances.view(), &EXPECTED_DISTANCES, EPSILON));
29
30 Ok(())
31}Trait Implementations§
Auto Trait Implementations§
impl Freeze for TextInput
impl RefUnwindSafe for TextInput
impl Send for TextInput
impl Sync for TextInput
impl Unpin for TextInput
impl UnwindSafe for TextInput
Blanket Implementations§
Source§impl<T> BorrowMut<T> for Twhere
T: ?Sized,
impl<T> BorrowMut<T> for Twhere
T: ?Sized,
Source§fn borrow_mut(&mut self) -> &mut T
fn borrow_mut(&mut self) -> &mut T
Mutably borrows from an owned value. Read more
Source§impl<T> Instrument for T
impl<T> Instrument for T
Source§fn instrument(self, span: Span) -> Instrumented<Self>
fn instrument(self, span: Span) -> Instrumented<Self>
Source§fn in_current_span(self) -> Instrumented<Self>
fn in_current_span(self) -> Instrumented<Self>
Source§impl<T> IntoEither for T
impl<T> IntoEither for T
Source§fn into_either(self, into_left: bool) -> Either<Self, Self>
fn into_either(self, into_left: bool) -> Either<Self, Self>
Converts
self into a Left variant of Either<Self, Self>
if into_left is true.
Converts self into a Right variant of Either<Self, Self>
otherwise. Read moreSource§fn into_either_with<F>(self, into_left: F) -> Either<Self, Self>
fn into_either_with<F>(self, into_left: F) -> Either<Self, Self>
Converts
self into a Left variant of Either<Self, Self>
if into_left(&self) returns true.
Converts self into a Right variant of Either<Self, Self>
otherwise. Read more