1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24 25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48 49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72 73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96 97 98 99 100 101 102 103 104 105 106 107 108 109 110 111 112 113 114 115 116 117 118 119 120 121 122 123 124 125 126 127 128 129 130 131 132 133 134 135 136 137 138 139 140 141 142 143 144 145 146 147 148 149 150 151 152 153 154 155 156 157 158 159 160 161 162 163 164 165 166 167 168 169 170 171 172 173 174 175
use crate::util::ShouldSkip;
use crate::{Query, ScoreMode};
/// Rescoring can help to improve precision by reordering just the top (e.g. 100 - 500)
/// documents returned by the [query](https://www.elastic.co/guide/en/elasticsearch/reference/current/search-search.html#request-body-search-query)
/// and [post_filter](https://www.elastic.co/guide/en/elasticsearch/reference/current/filter-search-results.html#post-filter)
/// phases, using a secondary (usually more costly) algorithm, instead of applying the costly algorithm to all documents in the index.
///
/// A `rescore` request is executed on each shard before it returns its results to be sorted by the node handling the overall search request.
///
/// Currently the rescore API has only one implementation: the query rescorer, which uses a query to tweak the scoring.
/// In the future, alternative rescorers may be made available, for example, a pair-wise rescorer.
///
/// To create a `rescore` query with a simple `term` query:
/// ```
/// # use elasticsearch_dsl::rescoring::*;
/// # use elasticsearch_dsl::queries::*;
/// # use elasticsearch_dsl::queries::params::*;
/// # let rescore =
/// Rescore::new(Query::term("title", "test"));
/// ```
/// To create a `rescore` query with a simple `term` query and optional fields:
/// ```
/// # use elasticsearch_dsl::rescoring::*;
/// # use elasticsearch_dsl::queries::*;
/// # use elasticsearch_dsl::queries::params::*;
/// # let query =
/// Rescore::new(Query::term("title", "test"))
/// .rescore_query_weight(0.2)
/// .window_size(100);
/// ```
/// <https://www.elastic.co/guide/en/elasticsearch/reference/current/filter-search-results.html#rescore>
#[derive(Debug, Clone, PartialEq, Serialize)]
pub struct Rescore {
/// Settings of the query rescorer; serialized under the `query` key.
query: RescoreQuery,
/// Number of docs examined on each shard. Left out of the serialized output
/// whenever `ShouldSkip::should_skip` returns `true` for it (presumably when
/// unset - confirm against the `ShouldSkip` impl for `Option`).
#[serde(skip_serializing_if = "ShouldSkip::should_skip")]
window_size: Option<u64>,
}
/// Inner body of a [Rescore] request: the secondary query together with the
/// options that control how its score is combined with the original score.
#[derive(Debug, Clone, PartialEq, Serialize)]
struct RescoreQuery {
/// Secondary query run on the top results. This field carries no
/// `skip_serializing_if` attribute, so it is always written out.
rescore_query: Option<Query>,
/// Relative importance of the rescore query; omitted from the output when
/// `ShouldSkip::should_skip` returns `true` for it.
#[serde(skip_serializing_if = "ShouldSkip::should_skip")]
rescore_query_weight: Option<f32>,
/// Relative importance of the original query; omitted from the output when
/// `ShouldSkip::should_skip` returns `true` for it.
#[serde(skip_serializing_if = "ShouldSkip::should_skip")]
query_weight: Option<f32>,
/// How the two scores are combined; omitted from the output when
/// `ShouldSkip::should_skip` returns `true` for it.
#[serde(skip_serializing_if = "ShouldSkip::should_skip")]
score_mode: Option<ScoreMode>,
}
impl Rescore {
    /// Builds a [Rescore] around the given secondary query.
    ///
    /// - `query` - Second query which will be executed on the top-k results returned by the original query.
    ///
    /// Every optional setting (`window_size`, both weights and `score_mode`) starts out unset.
    pub fn new<T: Into<Option<Query>>>(query: T) -> Self {
        let query = RescoreQuery {
            rescore_query: query.into(),
            rescore_query_weight: None,
            query_weight: None,
            score_mode: None,
        };

        Self {
            query,
            window_size: None,
        }
    }

    /// Sets `window_size`, the number of docs which will be examined on each shard.
    /// It defaults to 10.
    pub fn window_size(self, window_size: u64) -> Self {
        Self {
            window_size: Some(window_size),
            ..self
        }
    }

    /// Sets `rescore_query_weight`, the relative importance of the rescore query.
    /// It defaults to 1.
    pub fn rescore_query_weight<T: num_traits::AsPrimitive<f32>>(
        self,
        rescore_query_weight: T,
    ) -> Self {
        // Rebuild only the inner query settings; every other field is carried over as-is.
        let query = RescoreQuery {
            rescore_query_weight: Some(rescore_query_weight.as_()),
            ..self.query
        };

        Self { query, ..self }
    }

    /// Sets `query_weight`, the relative importance of the original query.
    /// It defaults to 1.
    pub fn query_weight<T: num_traits::AsPrimitive<f32>>(self, query_weight: T) -> Self {
        // Rebuild only the inner query settings; every other field is carried over as-is.
        let query = RescoreQuery {
            query_weight: Some(query_weight.as_()),
            ..self.query
        };

        Self { query, ..self }
    }

    /// Sets `score_mode`, which controls the way the scores are combined.
    pub fn score_mode(self, score_mode: ScoreMode) -> Self {
        let query = RescoreQuery {
            score_mode: Some(score_mode),
            ..self.query
        };

        Self { query, ..self }
    }
}
impl ShouldSkip for Rescore {
    /// A rescore is skippable when it has no secondary query, or when that
    /// query itself reports that it should be skipped.
    fn should_skip(&self) -> bool {
        match &self.query.rescore_query {
            Some(inner) => ShouldSkip::should_skip(inner),
            None => true,
        }
    }
}
impl IntoIterator for Rescore {
    type Item = Self;
    type IntoIter = std::option::IntoIter<Self>;

    /// Turns a single [Rescore] into an iterator that yields it exactly once.
    fn into_iter(self) -> Self::IntoIter {
        let single: Option<Self> = Some(self);
        single.into_iter()
    }
}
#[cfg(test)]
mod tests {
    use super::*;
    use crate::util::assert_serialize_rescore;

    /// The skip decision of a rescore follows the query it wraps.
    #[test]
    fn should_skip() {
        let without_bound = Rescore::new(Query::range("field"));
        assert!(without_bound.should_skip());

        let with_bound = Rescore::new(Query::range("field").gte(1));
        assert!(!with_bound.should_skip());
    }

    /// Checks the JSON shape with and without the optional settings.
    #[test]
    fn serialization() {
        // Only the mandatory rescore query is set.
        let minimal = Rescore::new(Query::term("title", "test"));
        let minimal_json = json!({
            "query": {
                "rescore_query": {
                    "term": {
                        "title": {
                            "value": "test"
                        }
                    }
                }
            }
        });
        assert_serialize_rescore(minimal, minimal_json);

        // Every optional setting is populated.
        let complete = Rescore::new(Query::term("title", "test"))
            .rescore_query_weight(0.2)
            .query_weight(0.5)
            .window_size(100)
            .score_mode(ScoreMode::Max);
        let complete_json = json!({
            "window_size": 100,
            "query": {
                "query_weight": 0.5,
                "rescore_query_weight": 0.2,
                "score_mode": "max",
                "rescore_query": {
                    "term": {
                        "title": {
                            "value": "test"
                        }
                    }
                }
            }
        });
        assert_serialize_rescore(complete, complete_json);
    }
}