Skip to main content

reifydb_engine/expression/
lookup.rs

1// SPDX-License-Identifier: Apache-2.0
2// Copyright (c) 2025 ReifyDB
3
4use reifydb_core::value::column::{Column, data::ColumnData};
5use reifydb_rql::expression::ColumnExpression;
6use reifydb_type::value::{
7	Value,
8	blob::Blob,
9	date::Date,
10	datetime::{CREATED_AT_COLUMN_NAME, DateTime, UPDATED_AT_COLUMN_NAME},
11	decimal::Decimal,
12	dictionary::DictionaryEntryId,
13	duration::Duration,
14	identity::IdentityId,
15	int::Int,
16	row_number::ROW_NUMBER_COLUMN_NAME,
17	time::Time,
18	r#type::Type,
19	uint::Uint,
20	uuid::{Uuid4, Uuid7},
21};
22
23use crate::{Result, expression::context::EvalContext, vm::stack::Variable};
24
/// Builds a typed column from the leading `$take` values of `$col`.
///
/// Each value that matches `Value::$variant($x)` contributes `$transform` together with a `true`
/// validity flag; every other value contributes `$default` together with a `false` flag. The two
/// resulting vectors are passed to `ColumnData::$constructor`, and the expansion evaluates to
/// `Ok($col.with_new_data(..))`, so it must be used where a `Result` is expected.
macro_rules! extract_typed_column {
	($col:expr, $take:expr, $variant:ident($x:ident) => $transform:expr, $default:expr, $constructor:ident) => {{
		// Single pass over at most `$take` values, splitting payloads from validity flags.
		let (data, bitvec): (Vec<_>, Vec<bool>) = $col
			.data()
			.iter()
			.take($take)
			.map(|value| match value {
				Value::$variant($x) => ($transform, true),
				_ => ($default, false),
			})
			.unzip();
		Ok($col.with_new_data(ColumnData::$constructor(data, bitvec)))
	}};
}
49
50pub(crate) fn column_lookup(ctx: &EvalContext, column: &ColumnExpression) -> Result<Column> {
51	let name = column.0.name.text();
52
53	if name == ROW_NUMBER_COLUMN_NAME && !ctx.columns.row_numbers.is_empty() {
54		let row_numbers: Vec<u64> = ctx.columns.row_numbers.iter().map(|r| r.value()).collect();
55		return Ok(Column::new(ROW_NUMBER_COLUMN_NAME.to_string(), ColumnData::uint8(row_numbers)));
56	}
57
58	if name == CREATED_AT_COLUMN_NAME && !ctx.columns.created_at.is_empty() {
59		return Ok(Column::new(
60			CREATED_AT_COLUMN_NAME.to_string(),
61			ColumnData::datetime(ctx.columns.created_at.to_vec()),
62		));
63	}
64
65	if name == UPDATED_AT_COLUMN_NAME && !ctx.columns.updated_at.is_empty() {
66		return Ok(Column::new(
67			UPDATED_AT_COLUMN_NAME.to_string(),
68			ColumnData::datetime(ctx.columns.updated_at.to_vec()),
69		));
70	}
71
72	if let Some(col) = ctx.columns.iter().find(|c| c.name() == name) {
73		return extract_column_data(col, ctx);
74	}
75
76	if let Some(Variable::Columns {
77		columns: scalar_cols,
78	}) = ctx.symbols.get(name)
79		&& scalar_cols.is_scalar()
80		&& let Some(col) = scalar_cols.columns.first()
81	{
82		return extract_column_data(col, ctx);
83	}
84
85	Ok(Column::new(name.to_string(), ColumnData::none_typed(Type::Boolean, ctx.row_count)))
86}
87
88fn extract_column_data(col: &Column, ctx: &EvalContext) -> Result<Column> {
89	let take = ctx.take.unwrap_or(usize::MAX);
90
91	// Use the column's actual data type instead of checking the first value
92	// This handles cases where the first value is Undefined
93	let col_type = col.data().get_type();
94
95	// Unwrap Option to get the effective data type
96	let effective_type = match col_type {
97		Type::Option(inner) => *inner,
98		other => other,
99	};
100
101	extract_column_data_by_type(col, take, effective_type)
102}
103
104fn extract_column_data_by_type(col: &Column, take: usize, col_type: Type) -> Result<Column> {
105	match col_type {
106		Type::Boolean => extract_typed_column!(col, take, Boolean(b) => b, false, bool_with_bitvec),
107		Type::Float4 => extract_typed_column!(col, take, Float4(v) => v.value(), 0.0f32, float4_with_bitvec),
108		Type::Float8 => extract_typed_column!(col, take, Float8(v) => v.value(), 0.0f64, float8_with_bitvec),
109		Type::Int1 => extract_typed_column!(col, take, Int1(n) => n, 0, int1_with_bitvec),
110		Type::Int2 => extract_typed_column!(col, take, Int2(n) => n, 0, int2_with_bitvec),
111		Type::Int4 => extract_typed_column!(col, take, Int4(n) => n, 0, int4_with_bitvec),
112		Type::Int8 => extract_typed_column!(col, take, Int8(n) => n, 0, int8_with_bitvec),
113		Type::Int16 => extract_typed_column!(col, take, Int16(n) => n, 0, int16_with_bitvec),
114		Type::Utf8 => extract_typed_column!(col, take, Utf8(s) => s.clone(), "".to_string(), utf8_with_bitvec),
115		Type::Uint1 => extract_typed_column!(col, take, Uint1(n) => n, 0, uint1_with_bitvec),
116		Type::Uint2 => extract_typed_column!(col, take, Uint2(n) => n, 0, uint2_with_bitvec),
117		Type::Uint4 => extract_typed_column!(col, take, Uint4(n) => n, 0, uint4_with_bitvec),
118		Type::Uint8 => extract_typed_column!(col, take, Uint8(n) => n, 0, uint8_with_bitvec),
119		Type::Uint16 => extract_typed_column!(col, take, Uint16(n) => n, 0, uint16_with_bitvec),
120		Type::Date => extract_typed_column!(col, take, Date(d) => d, Date::default(), date_with_bitvec),
121		Type::DateTime => {
122			extract_typed_column!(col, take, DateTime(dt) => dt, DateTime::default(), datetime_with_bitvec)
123		}
124		Type::Time => extract_typed_column!(col, take, Time(t) => t, Time::default(), time_with_bitvec),
125		Type::Duration => {
126			extract_typed_column!(col, take, Duration(i) => i, Duration::default(), duration_with_bitvec)
127		}
128		Type::IdentityId => {
129			extract_typed_column!(col, take, IdentityId(i) => i, IdentityId::default(), identity_id_with_bitvec)
130		}
131		Type::Uuid4 => {
132			extract_typed_column!(col, take, Uuid4(i) => i, Uuid4::default(), uuid4_with_bitvec)
133		}
134		Type::Uuid7 => {
135			extract_typed_column!(col, take, Uuid7(i) => i, Uuid7::default(), uuid7_with_bitvec)
136		}
137		Type::DictionaryId => {
138			extract_typed_column!(col, take, DictionaryId(i) => i, DictionaryEntryId::default(), dictionary_id_with_bitvec)
139		}
140		Type::Blob => {
141			extract_typed_column!(col, take, Blob(b) => b.clone(), Blob::new(vec![]), blob_with_bitvec)
142		}
143		Type::Int => extract_typed_column!(col, take, Int(b) => b.clone(), Int::zero(), int_with_bitvec),
144		Type::Uint => extract_typed_column!(col, take, Uint(b) => b.clone(), Uint::zero(), uint_with_bitvec),
145		Type::Any => {
146			extract_typed_column!(col, take, Any(boxed) => Box::new(*boxed.clone()), Box::new(Value::none()), any_with_bitvec)
147		}
148		Type::Decimal => {
149			extract_typed_column!(col, take, Decimal(b) => b.clone(), Decimal::from_i64(0), decimal_with_bitvec)
150		}
151		Type::Option(inner) => extract_column_data_by_type(col, take, *inner),
152		Type::List(_) => {
153			extract_typed_column!(col, take, Any(boxed) => Box::new(*boxed.clone()), Box::new(Value::none()), any_with_bitvec)
154		}
155		Type::Record(_) => {
156			extract_typed_column!(col, take, Any(boxed) => Box::new(*boxed.clone()), Box::new(Value::none()), any_with_bitvec)
157		}
158		Type::Tuple(_) => {
159			extract_typed_column!(col, take, Any(boxed) => Box::new(*boxed.clone()), Box::new(Value::none()), any_with_bitvec)
160		}
161	}
162}
163
#[cfg(test)]
pub mod tests {
	use reifydb_core::{
		interface::identifier::{ColumnIdentifier, ColumnShape},
		value::column::{Column, columns::Columns, data::ColumnData},
	};
	use reifydb_routine::function::registry::Functions;
	use reifydb_rql::expression::ColumnExpression;
	use reifydb_runtime::context::{RuntimeContext, clock::Clock};
	use reifydb_type::{fragment::Fragment, params::Params, value::identity::IdentityId};

	use super::column_lookup;
	use crate::{expression::context::EvalContext, vm::stack::SymbolTable};

	/// Looking up a name that is absent from the frame must still produce one entry per row of the
	/// evaluation context instead of an empty column.
	#[test]
	fn test_column_not_found_returns_correct_row_count() {
		// Fixtures borrowed by the evaluation context.
		let params = Params::None;
		let symbols = SymbolTable::new();
		let functions = Functions::empty();
		let runtime_ctx = RuntimeContext::with_clock(Clock::Real);

		// A five-row frame whose only column is `existing_col`.
		let five_rows =
			Columns::new(vec![Column::new("existing_col".to_string(), ColumnData::int4([1, 2, 3, 4, 5]))]);

		let base = EvalContext {
			params: &params,
			symbols: &symbols,
			functions: &functions,
			runtime_context: &runtime_ctx,
			arena: None,
			identity: IdentityId::root(),
			is_aggregate_context: false,
			columns: Columns::empty(),
			row_count: 1,
			target: None,
			take: None,
		};
		let ctx = base.with_eval(five_rows, 5);

		// Reference a column that the frame does not contain.
		let missing = ColumnExpression(ColumnIdentifier {
			shape: ColumnShape::Alias(Fragment::internal("nonexistent_col")),
			name: Fragment::internal("nonexistent_col"),
		});
		let looked_up = column_lookup(&ctx, &missing).unwrap();

		// Expect five rows (the context's row_count), not zero.
		assert_eq!(
			looked_up.data().len(),
			5,
			"Column not found should return column with ctx.row_count rows, not 0"
		);
	}
}