List of all items
Structs
- abstractive_summary::CompressionSummarizer
- abstractive_summary::EnhancedCentroidSummarizer
- abstractive_summary::FusionSummarizer
- abstractive_summary::ScoredSentence
- advanced_classification::CountVectorizer
- advanced_classification::FastTextClassifier
- advanced_classification::NaiveBayesClassifier
- advanced_classification::TfidfTransformer
- alignment::AlignedCorpus
- batch_tokenizer::BatchConfig
- batch_tokenizer::BatchConfigExt
- batch_tokenizer::BatchEncoding
- bert_finetune::BertFineTuner
- bert_finetune::ClassificationHead
- bert_finetune::FineTuneConfig
- bpe_tokenizer::BpeVocab
- classification::BernoulliNaiveBayes
- classification::CrossValidationResult
- classification::FeatureHasher
- classification::FoldResult
- classification::MultiLabelClassifier
- classification::MultiLabelPrediction
- classification::MultinomialNaiveBayes
- classification::TextClassificationMetrics
- classification::TextClassificationPipeline
- classification::TextDataset
- classification::TextFeatureSelector
- classification::TfidfCosineClassifier
- cleansing::AdvancedTextCleaner
- coreference::CoreferenceChain
- coreference::Mention
- crosslingual::CrossLingualConfig
- crosslingual::CrossLingualNer
- crosslingual::CrossLingualNerConfig
- ctm::CorrelatedTopicModel
- ctm::CtmConfig
- ctm::CtmResult
- dialog::DialogPolicy
- dialog::DialogState
- dialog::EntityExtractor
- dialog::ExtractedEntity
- dialog::IntentClassifier
- dialog::PolicyAction
- dialog::SlotFiller
- discourse::CueLexicon
- discourse::DiscourseAnalysis
- discourse::DiscourseAnalyzer
- discourse::RhetoricalStructure
- discourse::RstNode
- doc_similarity::DocumentCluster
- doc_similarity::LatentSemanticAnalysis
- doc_similarity::MinHasher
- doc_similarity::Shingler
- doc_similarity::TfIdfEngine
- doc_similarity::WordShingler
- domain_processors::financial::FinancialTextProcessor
- domain_processors::legal::LegalTextProcessor
- domain_processors::medical::MedicalTextProcessor
- domain_processors::news::NewsTextProcessor
- domain_processors::patent::PatentTextProcessor
- domain_processors::scientific::ScientificTextProcessor
- domain_processors::social_media::SocialMediaTextProcessor
- domain_processors::types::DomainProcessorConfig
- domain_processors::types::ProcessedDomainText
- domain_processors::unified::UnifiedDomainProcessor
- dtm::DtmConfig
- dtm::DtmResult
- dtm::DynamicTopicModel
- embeddings::Word2Vec
- embeddings::Word2VecConfig
- embeddings::contrastive::ContrastiveModel
- embeddings::contrastive::SimCSEConfig
- embeddings::contrastive::SimCSETrainer
- embeddings::crosslingual::AlignmentMatrix
- embeddings::crosslingual::CrossLingualConfig
- embeddings::fasttext::FastText
- embeddings::fasttext::FastTextConfig
- embeddings::glove::CooccurrenceMatrix
- embeddings::glove::GloVe
- embeddings::glove::GloVeTrainer
- embeddings::glove::GloVeTrainerConfig
- embeddings::sentence::SentenceEmbedder
- embeddings::sentence::SentenceEmbedderConfig
- embeddings::sentence_encoder::SemanticSimilarity
- embeddings::sentence_encoder::SentenceEncoder
- embeddings::sentence_encoder::SimCseConfig
- embeddings::sentence_encoder::SimCseTrainer
- embeddings::universal::CrossLingualConfig
- embeddings::universal::TransformerEncoderLayer
- embeddings::universal::UniversalSentenceEncoder
- embeddings::universal::UseConfig
- enhanced_vectorize::EnhancedCountVectorizer
- enhanced_vectorize::EnhancedTfidfVectorizer
- evaluation::bleu::BleuConfig
- evaluation::meteor::MeteorConfig
- evaluation::meteor::MeteorScore
- evaluation::ner::ClassMetrics
- evaluation::ner::NerEvaluationResult
- evaluation::ner::NerSpan
- evaluation::online_lda::OnlineLda
- evaluation::online_lda::OnlineLdaConfig
- evaluation::perplexity::PerplexityReport
- evaluation::rouge::RougeScore
- evaluation::sequence_labeler::SequenceLabelMetrics
- evaluation::sequence_labeler::ViterbiDecoder
- evaluation::sts::StsReport
- event_extraction::Argument
- event_extraction::Event
- event_extraction::EventExtractor
- event_extraction::TriggerLexicon
- gpt_bpe::Gpt2BpeTokenizer
- hdp::HdpConfig
- hdp::HdpModel
- hdp::HdpResult
- huggingface_compat::adapter::HfModelAdapter
- huggingface_compat::config::HfConfig
- huggingface_compat::config::HfTokenizerConfig
- huggingface_compat::conversion::FormatConverter
- huggingface_compat::hub::HfHub
- huggingface_compat::hub::HfModelInfo
- huggingface_compat::manager::HfModelManager
- huggingface_compat::pipelines::ClassificationResult
- huggingface_compat::pipelines::FeatureExtractionPipeline
- huggingface_compat::pipelines::FillMaskPipeline
- huggingface_compat::pipelines::FillMaskResult
- huggingface_compat::pipelines::QuestionAnsweringPipeline
- huggingface_compat::pipelines::QuestionAnsweringResult
- huggingface_compat::pipelines::SummarizationPipeline
- huggingface_compat::pipelines::SummarizationResult
- huggingface_compat::pipelines::TextClassificationPipeline
- huggingface_compat::pipelines::TextGenerationPipeline
- huggingface_compat::pipelines::TextGenerationResult
- huggingface_compat::pipelines::TokenClassificationPipeline
- huggingface_compat::pipelines::TokenClassificationResult
- huggingface_compat::pipelines::TranslationPipeline
- huggingface_compat::pipelines::TranslationResult
- huggingface_compat::pipelines::ZeroShotClassificationPipeline
- huggingface_compat::tokenizer::HfEncodedInput
- huggingface_compat::tokenizer::HfTokenizer
- information_extraction::advanced_ner::AdvancedNerExtractor
- information_extraction::advanced_ner::CoreferenceCluster
- information_extraction::advanced_ner::RakeExtractor
- information_extraction::advanced_ner::SvoRelationExtractor
- information_extraction::advanced_ner::SvoTriple
- information_extraction::confidence::ConfidenceScorer
- information_extraction::coreference::CoreferenceChain
- information_extraction::coreference::CoreferenceMention
- information_extraction::coreference::CoreferenceResolver
- information_extraction::dep_relations::CorefResolver
- information_extraction::dep_relations::DependencyRelation
- information_extraction::dep_relations::DependencyRelationExtractor
- information_extraction::dep_relations::RelationPattern
- information_extraction::document::DocumentInformationExtractor
- information_extraction::document::DocumentSummary
- information_extraction::document::StructuredDocumentInformation
- information_extraction::document::Topic
- information_extraction::entities::Entity
- information_extraction::entities::EntityCluster
- information_extraction::extractors::KeyPhraseExtractor
- information_extraction::extractors::PatternExtractor
- information_extraction::extractors::RuleBasedNER
- information_extraction::linking::EntityLinker
- information_extraction::linking::KnowledgeBaseEntry
- information_extraction::linking::LinkedEntity
- information_extraction::patterns::DATE_PATTERN
- information_extraction::patterns::EMAIL_PATTERN
- information_extraction::patterns::MONEY_PATTERN
- information_extraction::patterns::PERCENTAGE_PATTERN
- information_extraction::patterns::PHONE_PATTERN
- information_extraction::patterns::TIME_PATTERN
- information_extraction::patterns::URL_PATTERN
- information_extraction::pipeline::AdvancedExtractedInformation
- information_extraction::pipeline::AdvancedExtractionPipeline
- information_extraction::pipeline::ExtractedInformation
- information_extraction::pipeline::InformationExtractionPipeline
- information_extraction::relations::Event
- information_extraction::relations::Relation
- information_extraction::relations::RelationExtractor
- information_extraction::seq_patterns::Match
- information_extraction::seq_patterns::Pattern
- information_extraction::seq_patterns::PatternMatcher
- information_extraction::seq_patterns::Token
- information_extraction::temporal::TemporalExtractor
- keyword_extraction::Keyword
- keyword_extraction::RakeKeywordExtractor
- keyword_extraction::TextRankKeywordExtractor
- keyword_extraction::TfIdfKeywordExtractor
- keywords::Rake
- keywords::Yake
- language_detection::LanguageDetectionOutput
- language_model::NgramModel
- language_models::BigramLM
- language_models::NgramLM
- language_models::PerplexityEval
- language_models::UnigramLM
- lemmatization::RuleBasedLemmatizer
- lemmatization::WordNetLemmatizer
- ml_integration::BatchTextProcessor
- ml_integration::MLTextPreprocessor
- ml_integration::TextFeatures
- ml_integration::TextMLPipeline
- ml_sentiment::ClassMetrics
- ml_sentiment::EvaluationMetrics
- ml_sentiment::MLSentimentAnalyzer
- ml_sentiment::MLSentimentConfig
- ml_sentiment::TrainingMetrics
- model_registry::ModelMetadata
- model_registry::ModelRegistry
- model_registry::PrebuiltModels
- model_registry::SerializableModelData
- multilingual::LanguageDetectionResult
- multilingual::LanguageDetector
- multilingual::MultilingualProcessor
- multilingual::ProcessedText
- multilingual::StopWords
- multilingual::Transliterator
- multilingual::UnicodeTokenizer
- multilingual::UnicodeTokenizerConfig
- named_entity_recognition::NerEntity
- named_entity_recognition::NerPatternConfig
- ner::Entity
- ner::NerConfig
- ner::NerExtractor
- neural_architectures::AdditiveAttention
- neural_architectures::BiLSTM
- neural_architectures::CNNLSTMHybrid
- neural_architectures::Conv1D
- neural_architectures::CrossAttention
- neural_architectures::Dropout
- neural_architectures::GRUCell
- neural_architectures::LSTMCell
- neural_architectures::LayerNorm
- neural_architectures::MaxPool1D
- neural_architectures::MultiHeadAttention
- neural_architectures::MultiScaleCNN
- neural_architectures::PositionwiseFeedForward
- neural_architectures::ResidualBlock1D
- neural_architectures::SelfAttention
- neural_architectures::TextCNN
- neural_nlp::attention_viz::AttentionHeatmap
- neural_nlp::attention_viz::AttentionVisualization
- neural_nlp::bert_classifier::BertClassifier
- neural_nlp::bert_classifier::BertClassifierConfig
- neural_nlp::neural_ner::NeuralNer
- neural_nlp::neural_ner::NeuralNerConfig
- neural_nlp::transformer_encoder::TransformerEncoderConfig
- neural_nlp::transformer_encoder::TransformerTextEncoder
- parallel::ParallelCorpusProcessor
- parallel::ParallelTextProcessor
- parallel::ParallelTokenizer
- parallel::ParallelVectorizer
- paraphrasing::ParaphraseConfig
- paraphrasing::ParaphraseResult
- paraphrasing::Paraphraser
- performance::AdvancedPerformanceMonitor
- performance::BottleneckAnalysis
- performance::DetailedPerformanceReport
- performance::NetworkIOSummary
- performance::OperationMonitor
- performance::OptimizationApplication
- performance::OptimizationRecommendation
- performance::PerformanceDataPoint
- performance::PerformanceSummary
- performance::PerformanceThresholds
- performance::ResourceUtilizationSummary
- performance::TrendAnalysis
- pipeline::BatchProcessor
- pipeline::NlpPipeline
- pipeline::PipelineBuilder
- pos_tagging::ContextualDisambiguator
- pos_tagging::MorphologicalAnalyzer
- pos_tagging::PosAwareLemmatizer
- pos_tagging::core::PosTagger
- pos_tagging::patterns::ADJ_PATTERNS
- pos_tagging::patterns::ADV_PATTERNS
- pos_tagging::patterns::ALL_CAPS_PATTERN
- pos_tagging::patterns::NOUN_PATTERNS
- pos_tagging::patterns::PROPER_NOUN_PATTERN
- pos_tagging::patterns::PatternMatcher
- pos_tagging::patterns::VERB_PATTERNS
- pos_tagging::types::PosTagResult
- pos_tagging::types::PosTaggerConfig
- pos_tagging::types::PosTaggingResult
- pos_tagging_original::ContextualDisambiguator
- pos_tagging_original::MorphologicalAnalyzer
- pos_tagging_original::PosAwareLemmatizer
- pos_tagging_original::PosTagResult
- pos_tagging_original::PosTagger
- pos_tagging_original::PosTaggerConfig
- pos_tagging_original::PosTaggingResult
- preprocess::BasicNormalizer
- preprocess::BasicTextCleaner
- preprocess::TextPreprocessor
- question_answering::AnswerSpan
- question_answering::QAContext
- regex_lite::Match
- regex_lite::RegexLite
- segmentation::SentenceSegmenter
- segmentation::TextChunk
- segmentation::TextChunker
- semantic_similarity::ConceptNode
- semantic_similarity::ConceptualSimilarity
- semantic_similarity::DistributionalSimilarity
- semantic_similarity::LcsSimilarity
- semantic_similarity::NGramSemanticSimilarity
- semantic_similarity::SemanticEditDistance
- semantic_similarity::SemanticSimilarityEnsemble
- semantic_similarity::SentenceEmbeddingSimilarity
- semantic_similarity::SoftCosineSimilarity
- semantic_similarity::TopicBasedSimilarity
- semantic_similarity::WeightedJaccard
- semantic_similarity::WordMoversDistance
- sentence_embeddings::SentenceEmbedder
- sentence_embeddings::SentenceEmbedderConfig
- sentence_embeddings::SimCseConfig
- sentence_embeddings::SimCseTrainer
- sentence_embeddings::autograd_projection::DifferentiableProjection
- sentence_embeddings::autograd_projection::ProjectionConfig
- sentence_embeddings::cross_lingual::AlignedEncoder
- sentence_embeddings::cross_lingual::CrossLingualAligner
- sentence_embeddings::encoder::SentenceEncoder
- sentence_embeddings::encoder::SentenceEncoderConfig
- sentence_embeddings::simcse::SimCSELoss
- sentence_embeddings::simcse::SimCSETrainer
- sentence_embeddings::trainer::SimcseConfig
- sentence_embeddings::trainer::SimcseTrainer
- sentence_embeddings::trainer::TrainStep
- sentence_embeddings::universal::UniversalSentenceEncoder
- sentencepiece::SpecialTokens
- sentencepiece::UnigramConfig
- sentencepiece::UnigramTokenizer
- sentencepiece::VocabPiece
- sentiment::AggregatedSentiment
- sentiment::AspectSentiment
- sentiment::AspectSentimentAnalyzer
- sentiment::LexiconSentimentAnalyzer
- sentiment::NaiveBayesSentiment
- sentiment::RuleBasedSentimentAnalyzer
- sentiment::SentimentLexicon
- sentiment::SentimentResult
- sentiment::SentimentRules
- sentiment::SentimentWordCounts
- sentiment::VaderResult
- sentiment::VaderSentimentAnalyzer
- simd_ops::basic_ops::SimdStringOps
- simd_ops::edit_distance::SimdEditDistance
- simd_ops::pattern_matching::SimdPatternMatcher
- simd_ops::text_analysis::AdvancedSIMDTextProcessor
- simd_ops::text_analysis::SimdTextAnalyzer
- simd_ops::text_analysis::TextAnalysisResult
- simd_ops::text_analysis::TextProcessingResult
- simd_ops::vectorized_ops::SimdNgramGenerator
- simd_ops::vectorized_ops::SimdParallelProcessor
- simd_ops::vectorized_ops::SimdTextNormalizer
- simd_ops::vectorized_ops::SimdTextSimilarity
- simd_ops::vectorized_ops::VectorizedStringOps
- similarity::SearchIndexConfig
- similarity::SemanticSearchIndex
- similarity::SemanticSimilarity
- sparse::ApproximateSparseMatrix
- sparse::BitPackedSparseVector
- sparse::BlockSparseMatrix
- sparse::CompressedBlock
- sparse::CooMatrix
- sparse::CscMatrix
- sparse::CsrMatrix
- sparse::DokMatrix
- sparse::HierarchicalSparseMatrix
- sparse::QuantizedSparseVector
- sparse::SparseMatrixBuilder
- sparse::SparseMemoryPool
- sparse::SparseVector
- sparse::StreamingSparseProcessor
- sparse_vectorize::MemoryStats
- sparse_vectorize::SparseCountVectorizer
- sparse_vectorize::SparseTfidfVectorizer
- spelling::DictionaryCorrector
- spelling::DictionaryCorrectorConfig
- spelling::ErrorModel
- spelling::NGramModel
- spelling::StatisticalCorrector
- spelling::StatisticalCorrectorConfig
- stemming::PorterStemmer
- stemming::SimpleLemmatizer
- stemming::SnowballStemmer
- stemming::lancaster::LancasterStemmer
- stemming::rule_lemmatizer::LemmaRule
- stemming::rule_lemmatizer::LemmatizerConfig
- stemming::rule_lemmatizer::RuleCondition
- stemming::rule_lemmatizer::RuleLemmatizer
- stemming::rule_lemmatizer::RuleLemmatizerBuilder
- streaming::AdvancedStreamingMetrics
- streaming::AdvancedStreamingProcessor
- streaming::CachedCorpus
- streaming::ChunkedCorpusReader
- streaming::CorpusIndex
- streaming::CorpusIterator
- streaming::CorpusStatistics
- streaming::DocumentStats
- streaming::MemoryMappedCorpus
- streaming::MemoryMonitor
- streaming::MultiFileCorpus
- streaming::MultiFileIterator
- streaming::ProgressTracker
- streaming::StreamingTextProcessor
- streaming::StreamingVectorizer
- string_metrics::AlignmentResult
- string_metrics::DamerauLevenshteinMetric
- string_metrics::Metaphone
- string_metrics::NeedlemanWunsch
- string_metrics::Nysiis
- string_metrics::SmithWaterman
- string_metrics::Soundex
- summarization::CentroidSummarizer
- summarization::KeywordExtractor
- summarization::TextRank
- summarize_advanced::ExtractiveSummarizer
- summarize_advanced::TextRankSummarizer
- text_classification::NaiveBayesClassifier
- text_classification::TextCnnLite
- text_classification::TfIdfLogisticClassifier
- text_coordinator::AdaptationTriggers
- text_coordinator::AdaptiveLearningSystem
- text_coordinator::AdaptiveOptimizationParams
- text_coordinator::AdaptiveTextEngine
- text_coordinator::AdvancedBatchClassificationResult
- text_coordinator::AdvancedClassificationResult
- text_coordinator::AdvancedMultipleTextResult
- text_coordinator::AdvancedSemanticSimilarityResult
- text_coordinator::AdvancedTextAnalytics
- text_coordinator::AdvancedTextConfig
- text_coordinator::AdvancedTextCoordinator
- text_coordinator::AdvancedTextPerformanceReport
- text_coordinator::AdvancedTextResult
- text_coordinator::AdvancedTopicModelingResult
- text_coordinator::AnalyticsPipeline
- text_coordinator::ClassificationResult
- text_coordinator::CrossModalAttention
- text_coordinator::DynamicModelSelector
- text_coordinator::EnhancedTopicModelingResult
- text_coordinator::GarbageCollectionOptimizer
- text_coordinator::HardwareCapabilityDetector
- text_coordinator::HistoricalAnalysis
- text_coordinator::InsightGenerator
- text_coordinator::MemoryUsagePredictor
- text_coordinator::ModelPerformanceMetrics
- text_coordinator::MultiModalFusionStrategies
- text_coordinator::MultiModalTextCoordinator
- text_coordinator::NamedEntity
- text_coordinator::NeuralProcessingEnsemble
- text_coordinator::NeuralProcessingOutputs
- text_coordinator::OptimizationRecommendation
- text_coordinator::PerformanceBottleneck
- text_coordinator::PerformanceMetricsSnapshot
- text_coordinator::PerformanceMonitor
- text_coordinator::PerformanceOptimizer
- text_coordinator::PredictiveTextInsights
- text_coordinator::PredictiveTextModeler
- text_coordinator::ProcessingTimingBreakdown
- text_coordinator::SimilarityAnalytics
- text_coordinator::SystemUtilization
- text_coordinator::TextAnalyticsEngine
- text_coordinator::TextAnomaly
- text_coordinator::TextAnomalyDetector
- text_coordinator::TextAudioProcessor
- text_coordinator::TextCacheManager
- text_coordinator::TextComplexityAnalysis
- text_coordinator::TextImageProcessor
- text_coordinator::TextMemoryOptimizer
- text_coordinator::TextMemoryPool
- text_coordinator::TextPerformanceMetrics
- text_coordinator::TextPerformanceTracker
- text_coordinator::TextProcessingResult
- text_coordinator::TextQualityMetrics
- text_coordinator::TextStyleAnalysis
- text_coordinator::TopicAnalytics
- text_coordinator::TopicModelingParams
- text_coordinator::TopicModelingResult
- text_coordinator::TopicQualityMetrics
- text_preprocess::PreprocessConfig
- text_preprocess::PreprocessResult
- text_preprocess::TextPreprocessor
- text_similarity::Bm25Config
- text_similarity::Bm25Scorer
- text_similarity::SimilarityResult
- text_similarity::TfIdfCosineSimilarity
- text_statistics::ReadabilityMetrics
- text_statistics::TextMetrics
- text_statistics::TextStatistics
- text_summarization::ScoredSentence
- token_filter::CompositeFilter
- token_filter::CustomFilter
- token_filter::FrequencyFilter
- token_filter::LengthFilter
- token_filter::RegexFilter
- token_filter::StopwordsFilter
- tokenization::bpe::BpeTokenizer
- tokenization::bpe::BpeVocab
- tokenization::byte_level_bpe::ByteLevelBpeConfig
- tokenization::byte_level_bpe::ByteLevelBpeTokenizer
- tokenization::hf_json::HfAddedToken
- tokenization::hf_json::HfModel
- tokenization::hf_json::HfTokenizerJson
- tokenization::language_agnostic::LanguageAgnosticTokenizer
- tokenization::llama::LlamaTokenizer
- tokenization::llama::LlamaTokenizerConfig
- tokenization::multilingual_bpe::LanguageCorpus
- tokenization::multilingual_bpe::MultilingualBpeConfig
- tokenization::multilingual_bpe::MultilingualBpeTokenizer
- tokenization::unicode_bpe::UnicodeBpeConfig
- tokenization::unicode_bpe::UnicodeBpeTokenizer
- tokenization::unicode_normalizer::UnicodeNormalizer
- tokenization::unicode_normalizer::UnicodeNormalizerConfig
- tokenization::wordpiece::BasicTokenizer
- tokenization::wordpiece::WordPieceTokenizer
- tokenize::CharacterTokenizer
- tokenize::NgramTokenizer
- tokenize::RegexTokenizer
- tokenize::SentenceTokenizer
- tokenize::WhitespaceTokenizer
- tokenize::WordTokenizer
- tokenize::bpe::BpeConfig
- tokenize::bpe::BpeTokenizer
- tokenize::bpe::BpeVocabulary
- tokenizer::BPETokenizer
- tokenizer::SimpleCharTokenizer
- tokenizer::SimpleWhitespaceTokenizer
- tokenizer::WordPieceTokenizer
- tokenizers::bert::BatchEncoding
- tokenizers::bert::BertEncoding
- tokenizers::bert::BertTokenizer
- tokenizers::bpe_enhanced::BpeVocab
- tokenizers::bpe_enhanced::ByteLevelBpe
- tokenizers::bpe_enhanced::ChatTemplate
- tokenizers::bpe_enhanced::Message
- tokenizers::bpe_enhanced::SpecialTokens
- tokenizers::hf_json::HfAddedToken
- tokenizers::hf_json::HfNormalizerConfig
- tokenizers::hf_json::HfTokenizerJson
- tokenizers::roberta::RobertaTokenizer
- tokenizers::unicode::UnicodeTokenizer
- tokenizers::unicode::UnicodeTokenizerConfig
- topic::hdp::Hdp
- topic::hdp::HdpConfig
- topic::hdp::HdpState
- topic::hdp::HdpTopicConfig
- topic::hdp::HdpTopicModel
- topic_coherence::TopicCoherence
- topic_coherence::TopicDiversity
- topic_model::GibbsLda
- topic_model::GibbsLdaConfig
- topic_model::NmfConfig
- topic_model::NmfTopicModel
- topic_model::TopicCoherenceScorer
- topic_modeling::LatentDirichletAllocation
- topic_modeling::LdaBuilder
- topic_modeling::LdaConfig
- topic_modeling::Topic
- transformer::FeedForward
- transformer::LayerNorm
- transformer::MultiHeadAttention
- transformer::PositionalEncoding
- transformer::TokenEmbedding
- transformer::TransformerConfig
- transformer::TransformerDecoder
- transformer::TransformerDecoderLayer
- transformer::TransformerEncoder
- transformer::TransformerEncoderLayer
- transformer::TransformerModel
- transliteration::ScriptTransliterator
- transliteration::TranslitConfig
- transliteration::cyrillic::CyrillicTransliterator
- transliteration::hepburn::HepburnTransliterator
- transliteration::pinyin::PinyinTransliterator
- vectorize::CountVectorizer
- vectorize::TfidfVectorizer
- visualization::AttentionVisualizer
- visualization::Color
- visualization::EmbeddingVisualizer
- visualization::SentimentVisualizer
- visualization::TextAnalyticsDashboard
- visualization::TopicVisualizer
- visualization::VisualizationConfig
- visualization::WordCloud
- vocabulary::Vocabulary
- weighted_distance::DamerauLevenshteinWeights
- weighted_distance::LevenshteinWeights
- weighted_distance::WeightedDamerauLevenshtein
- weighted_distance::WeightedLevenshtein
Enums
- alignment::AlignmentMethod
- batch_tokenizer::PaddingSide
- batch_tokenizer::PaddingStrategy
- batch_tokenizer::TruncationStrategy
- bert_finetune::FineTuneTask
- coreference::GenderNumber
- coreference::MentionType
- crosslingual::NerLabel
- dialog::DialogAct
- dialog::EntityKind
- dialog::PolicyState
- discourse::DiscourseRelation
- domain_processors::types::Domain
- embeddings::Word2VecAlgorithm
- embeddings::contrastive::ContrastiveLoss
- embeddings::crosslingual::AlignmentMethod
- embeddings::sentence::PoolingStrategy
- embeddings::sentence_encoder::PoolingStrategy
- embeddings::universal::UsePooling
- error::TextError
- evaluation::bleu::SmoothingMethod
- evaluation::sequence_labeler::BioTag
- evaluation::sts::StsDatasetFormat
- event_extraction::EventType
- huggingface_compat::pipelines::HfPipeline
- information_extraction::coreference::MentionType
- information_extraction::dep_relations::PronounGender
- information_extraction::entities::EntityType
- information_extraction::seq_patterns::PatternElement
- keyword_extraction::KeywordMethod
- language_detection::DetectedLanguage
- language_detection::DetectionStrategy
- language_model::SmoothingMethod
- ml_integration::FeatureExtractionMode
- model_registry::ModelType
- multilingual::Language
- multilingual::ScriptFamily
- named_entity_recognition::NerEntityType
- ner::EntityType
- neural_architectures::ActivationFunction
- neural_nlp::neural_ner::NerTag
- paraphrasing::ParaphraseStrategy
- performance::TrendDirection
- pipeline::PipelineStep
- question_answering::QAMethod
- question_answering::QuestionType
- semantic_similarity::PoolingStrategy
- semantic_similarity::TopicSimilarityMetric
- sentence_embeddings::PoolingStrategy
- sentence_embeddings::encoder::PoolingStrategy
- sentence_embeddings::similarity::PairwiseSimilarityMetric
- sentence_embeddings::universal::UniversalPoolingStrategy
- sentiment::Sentiment
- similarity::SimilarityMetric
- sparse::AdaptiveSparseMatrix
- spelling::EditOp
- stemming::rule_lemmatizer::PosTag
- summarize_advanced::SentenceSimilarity
- text_coordinator::AdaptationStrategy
- text_coordinator::EnsembleVotingStrategy
- text_coordinator::OptimizationStrategy
- text_preprocess::EmailHandling
- text_preprocess::MentionHandling
- text_preprocess::UrlHandling
- text_similarity::SimilarityMethod
- text_summarization::SummarizationMethod
- tokenization::hf_json::HfModelType
- tokenization::unicode_normalizer::NormForm
- tokenization::unicode_normalizer::Script
- tokenizers::bpe_enhanced::BpeError
- tokenizers::bpe_enhanced::ChatStyle
- topic::hdp::TopicError
- topic_modeling::LdaLearningMethod
- transliteration::ChineseSystem
- transliteration::JapaneseScript
- transliteration::Script
- transliteration::cyrillic::CyrillicScheme
- transliteration::pinyin::PinyinStyle
- visualization::ColorScheme
Traits
- embeddings::WordEmbedding
- evaluation::perplexity::LanguageModelLike
- lemmatization::Lemmatizer
- model_registry::RegistrableModel
- preprocess::TextCleaner
- preprocess::TextNormalizer
- sentence_embeddings::similarity::SentenceEncoderLike
- spelling::SpellingCorrector
- stemming::Stemmer
- string_metrics::PhoneticAlgorithm
- string_metrics::StringMetric
- text_coordinator::NeuralArchitecture
- token_filter::TokenFilter
- tokenize::Tokenizer
- tokenizer::TransformerTokenizer
- transliteration::Transliterator
- vectorize::Vectorizer
- weighted_distance::WeightedStringMetric
Functions
- abstractive_summary::rouge_l
- abstractive_summary::rouge_n
- advanced_distance::damerau_levenshtein
- advanced_distance::fuzzy_match
- advanced_distance::fuzzy_search
- advanced_distance::jaro
- advanced_distance::jaro_winkler
- advanced_distance::lcs
- advanced_distance::lcs_length
- advanced_distance::levenshtein
- advanced_distance::needleman_wunsch
- advanced_distance::normalized_levenshtein
- advanced_distance::smith_waterman
- advanced_distance::weighted_levenshtein
- alignment::alignment_f1
- alignment::ibm_model1
- alignment::symmetrize_alignments
- alignment::word_alignment
- batch_tokenizer::batch_encode
- batch_tokenizer::batch_encode_ext
- bpe_tokenizer::bpe_decode
- bpe_tokenizer::bpe_encode
- bpe_tokenizer::bpe_tokenize
- bpe_tokenizer::train_bpe
- classification::cross_validate_nb
- cleansing::expand_contractions
- cleansing::normalize_all_numbers
- cleansing::normalize_binary_numbers
- cleansing::normalize_currencies
- cleansing::normalize_dashes
- cleansing::normalize_dates
- cleansing::normalize_fractions
- cleansing::normalize_hex_numbers
- cleansing::normalize_ip_addresses
- cleansing::normalize_measurements
- cleansing::normalize_numbers
- cleansing::normalize_ordinals
- cleansing::normalize_percentages
- cleansing::normalize_quotes
- cleansing::normalize_roman_numerals
- cleansing::normalize_scientific_notation
- cleansing::normalize_temperatures
- cleansing::normalize_times
- cleansing::normalize_unicode
- cleansing::normalize_versions
- cleansing::normalize_whitespace
- cleansing::remove_accents
- cleansing::replace_emails
- cleansing::replace_phone_numbers
- cleansing::replace_urls
- cleansing::strip_html_tags
- coreference::antecedent_score
- coreference::gender_number_agreement
- coreference::infer_gender_number
- coreference::replace_pronouns
- coreference::resolve_coreferences
- coreference::resolve_pronouns
- crosslingual::align_embeddings
- crosslingual::compute_character_ngram_features
- ctm::inference::cholesky_inverse
- ctm::inference::e_step_doc
- ctm::inference::logistic_normal_ll
- ctm::inference::m_step_global
- ctm::model::log_likelihood
- ctm::model::softmax
- ctm::model::top_words
- ctm::model::topic_correlation_matrix
- dialog::classify_intent
- dialog::response_template
- discourse::coherence_score
- discourse::coherence_score_with_lexicon
- discourse::detect_discourse_relation
- distance::cosine_similarity
- distance::jaccard_similarity
- distance::jaro_winkler_similarity
- distance::levenshtein_distance
- distance::normalized_levenshtein_distance
- distance::text_cosine_similarity
- dtm::inference::kalman_backward
- dtm::inference::kalman_forward
- dtm::model::top_words_at_time
- dtm::model::topic_evolution
- embeddings::contrastive::nt_xent_loss_value
- embeddings::cosine_similarity
- embeddings::crosslingual::align_embeddings
- embeddings::crosslingual::alignment_quality
- embeddings::crosslingual::alignment_quality_score
- embeddings::crosslingual::translate_batch
- embeddings::crosslingual::translate_embedding
- embeddings::embedding_cosine_similarity
- embeddings::glove::cosine_similarity
- embeddings::pairwise_similarity
- embeddings::sentence::cosine_similarity
- embeddings::sentence::l2_norm
- evaluation::bleu::corpus_bleu
- evaluation::bleu::sentence_bleu
- evaluation::meteor::meteor_score
- evaluation::meteor::meteor_score_multi
- evaluation::ner::conll_format_report
- evaluation::ner::evaluate_ner
- evaluation::ner::evaluate_ner_checked
- evaluation::ner::extract_spans_from_bio
- evaluation::perplexity::load_token_corpus
- evaluation::perplexity::perplexity_evaluate
- evaluation::rouge::rouge_l
- evaluation::rouge::rouge_l_summary
- evaluation::rouge::rouge_n
- evaluation::rouge::rouge_n_multi
- evaluation::sequence_labeler::evaluate_sequence_labeling
- evaluation::sts::load_sts_from_tsv
- evaluation::sts::sts_evaluate
- event_extraction::event_coref
- event_extraction::event_coref_with_threshold
- event_extraction::extract_events
- information_extraction::advanced_ner::simple_coreference
- information_extraction::seq_patterns::build_ner_pattern_matcher
- keyword_extraction::extract_keywords
- keywords::english_stop_words
- keywords::textrank_keywords
- language_detection::detect_language
- language_detection::detect_language_with_strategy
- multilingual::is_cjk_char
- multilingual::is_combining_mark
- multilingual::is_cyrillic
- named_entity_recognition::extract_entities
- pipeline::basic_pipeline
- pipeline::lemmatization_pipeline
- pipeline::ngram_pipeline
- pipeline::stemming_pipeline
- pos_tagging::lexicon::initialize_lexicon
- question_answering::classify_question
- question_answering::extract_answer
- question_answering::tf_idf_similarity
- segmentation::token_byte_ranges
- sentence_embeddings::cross_lingual::procrustes_align
- sentence_embeddings::infonce::cosine_similarity_matrix
- sentence_embeddings::infonce::infonce_loss
- sentence_embeddings::infonce::top1_accuracy
- sentence_embeddings::similarity::semantic_similarity_matrix
- sentence_embeddings::similarity::semantic_similarity_tokens
- sentence_embeddings::similarity::semantic_similarity_vecs
- sentence_embeddings::similarity::vector_similarity
- sentiment::aggregate_sentiment
- sentiment::analyze_and_aggregate
- similarity::compute_similarity
- similarity::most_similar
- similarity::pairwise_similarity
- similarity::spearman_correlation
- similarity::sts_evaluate
- sparse_vectorize::sparse_cosine_similarity
- spelling::extract_words
- spelling::normalize_string
- spelling::split_sentences
- stemming::create_pos_aware_lemmatizer
- stemming::create_pos_aware_lemmatizer_with_config
- text_preprocess::edit_distance
- text_preprocess::normalize_whitespace
- text_preprocess::remove_diacritics_from_text
- text_preprocess::strip_html_tags
- text_similarity::bm25_score
- text_similarity::char_ngram_jaccard_similarity
- text_similarity::edit_distance_similarity
- text_similarity::jaccard_token_similarity
- text_similarity::text_similarity
- text_similarity::tfidf_cosine_similarity
- text_summarization::score_position
- text_summarization::score_textrank
- text_summarization::score_tfidf
- text_summarization::summarize
- tokenization::bpe::compute_merges
- tokenization::byte_level_bpe::bytes_to_unicode
- tokenization::hf_json::detect_model_type
- tokenization::unicode_normalizer::detect_script
- topic_model::select_n_topics
- transliteration::strip_diacritics
- utils::count_tokens
- utils::count_tokens_batch
- utils::count_tokens_batch_parallel
- utils::extract_collocations
- utils::extract_ngrams
- utils::filter_tokens
- utils::train_test_split
Type Aliases
- alignment::AlignmentPair
- error::Result
- evaluation::online_lda::SparseDoc
- sentence_embeddings::autograd_projection::ProjResult
- sentence_embeddings::cross_lingual::AlignResult
Statics
- transliteration::CYRILLIC_TO_LATIN
- transliteration::GREEK_TO_LATIN
- transliteration::HIRAGANA_TO_ROMAJI
- transliteration::KATAKANA_TO_ROMAJI