Skip to main content

activecube_rs/sql/
clickhouse.rs

1use std::collections::HashMap;
2
3use crate::compiler::ir::*;
4use crate::compiler::ir::{CompileResult, JoinType};
5use crate::sql::dialect::SqlDialect;
6
/// SQL dialect that renders query IR as ClickHouse-flavoured SQL.
///
/// The type carries no state, so it is cheap to copy and can be created with
/// either [`ClickHouseDialect::new`] or `Default::default()`.
#[derive(Debug, Clone, Copy, Default, PartialEq, Eq)]
pub struct ClickHouseDialect;

impl ClickHouseDialect {
    /// Creates a new (stateless) ClickHouse dialect.
    #[must_use]
    pub const fn new() -> Self {
        Self
    }
}
20
21impl SqlDialect for ClickHouseDialect {
22    fn compile(&self, ir: &QueryIR) -> CompileResult {
23        if let Some(ref builder) = ir.custom_query_builder {
24            return (builder.0)(ir);
25        }
26
27        let mut bindings = Vec::new();
28        let mut alias_remap: Vec<(String, String)> = Vec::new();
29
30        if ir.joins.is_empty() {
31            let inner_sql = self.compile_inner(ir, &mut bindings, &mut alias_remap);
32            return CompileResult { sql: inner_sql, bindings, alias_remap };
33        }
34
35        // When JOINs are present, force aliases on function expression columns
36        // (e.g. `argMaxMerge(latest_balance)`) so the outer SELECT can reference
37        // them by simple identifier names. Without aliases, `_main.argMaxMerge(x)`
38        // is parsed as a function call — a ClickHouse syntax error.
39        let mut ir_mod = ir.clone();
40        let mut mc_counter = 0u32;
41        for sel in &mut ir_mod.selects {
42            if let SelectExpr::Column { column, alias } = sel {
43                if column.contains('(') && alias.is_none() {
44                    let a = format!("__mc_{mc_counter}");
45                    mc_counter += 1;
46                    alias_remap.push((a.clone(), column.clone()));
47                    *alias = Some(a);
48                }
49            }
50        }
51
52        let mut jc_counter = 0u32;
53        for join in &mut ir_mod.joins {
54            for sel in &mut join.selects {
55                if let SelectExpr::Column { column, alias } = sel {
56                    if column.contains('(') && alias.is_none() {
57                        let a = format!("__jc_{jc_counter}");
58                        jc_counter += 1;
59                        *alias = Some(a);
60                    }
61                }
62            }
63        }
64
65        let inner_sql = self.compile_inner(&ir_mod, &mut bindings, &mut alias_remap);
66
67        // Build outer SELECT with explicit column listing.
68        // Always backtick-quote to prevent ClickHouse auto-prefixing ambiguous
69        // names when multiple JOINed tables share column names.
70        let main_cols: Vec<String> = ir_mod.selects.iter().map(|s| {
71            let col = match s {
72                SelectExpr::Column { column, alias } => alias.as_ref().unwrap_or(column).clone(),
73                SelectExpr::Aggregate { alias, .. } | SelectExpr::DimAggregate { alias, .. } => alias.clone(),
74            };
75            format!("_main.`{}` AS `{}`", col, col)
76        }).collect();
77
78        let mut sql = String::from("SELECT ");
79        sql.push_str(&main_cols.join(", "));
80
81        // Collect joined column aliases for the outer SELECT
82        for join in &ir_mod.joins {
83            for sel in &join.selects {
84                let col_name = match sel {
85                    SelectExpr::Column { column, alias } => alias.as_ref().unwrap_or(column).clone(),
86                    SelectExpr::Aggregate { alias, .. } | SelectExpr::DimAggregate { alias, .. } => alias.clone(),
87                };
88                let outer_alias = format!("{}.{}", join.alias, col_name);
89                if let SelectExpr::Column { column, alias: Some(_) } = sel {
90                    if column.contains('(') {
91                        let outer_original = format!("{}.{}", join.alias, column);
92                        alias_remap.push((outer_alias.clone(), outer_original));
93                    }
94                }
95                sql.push_str(&format!(", {}.`{}` AS `{}`",
96                    join.alias, col_name, outer_alias));
97            }
98        }
99
100        sql.push_str(&format!(" FROM ({}) AS _main", inner_sql));
101
102        // Build a lookup for main query aliases to resolve ON condition columns
103        // that might be function expressions (aliased above).
104        let main_alias_map: HashMap<String, String> = ir_mod.selects.iter()
105            .filter_map(|s| {
106                if let SelectExpr::Column { column, alias: Some(a) } = s {
107                    if column.contains('(') { Some((column.clone(), a.clone())) } else { None }
108                } else { None }
109            })
110            .collect();
111
112        for join in &ir_mod.joins {
113            let join_kw = join.join_type.sql_keyword();
114
115            if join.is_aggregate {
116                // Mode B: subquery JOIN for AggregatingMergeTree targets
117                sql.push_str(&format!(" {} (SELECT ", join_kw));
118                let mut sub_parts: Vec<String> = Vec::new();
119                for gb_col in &join.group_by {
120                    sub_parts.push(quote_col(gb_col));
121                }
122                for sel in &join.selects {
123                    match sel {
124                        SelectExpr::Column { column, alias } => {
125                            let col = if column.contains('(') { column.clone() } else { format!("`{column}`") };
126                            if let Some(a) = alias {
127                                sub_parts.push(format!("{col} AS `{a}`"));
128                            } else if column.contains('(') || !join.group_by.contains(column) {
129                                sub_parts.push(col);
130                            }
131                        }
132                        SelectExpr::Aggregate { function, column, alias, condition } => {
133                            let func = function.to_lowercase();
134                            let qcol = quote_col(column);
135                            let expr = match (func.as_str(), column.as_str(), condition) {
136                                ("count", "*", None) => format!("count() AS `{alias}`"),
137                                ("count", "*", Some(cond)) => format!("countIf({cond}) AS `{alias}`"),
138                                ("count", _, None) => format!("uniqExact({qcol}) AS `{alias}`"),
139                                ("count", _, Some(cond)) => format!("uniqExactIf({qcol}, {cond}) AS `{alias}`"),
140                                ("uniq", _, None) => format!("uniq({qcol}) AS `{alias}`"),
141                                ("uniq", _, Some(cond)) => format!("uniqIf({qcol}, {cond}) AS `{alias}`"),
142                                (f, _, None) => format!("{f}({qcol}) AS `{alias}`"),
143                                (f, _, Some(cond)) => format!("{f}If({qcol}, {cond}) AS `{alias}`"),
144                            };
145                            sub_parts.push(expr);
146                        }
147                        SelectExpr::DimAggregate { agg_type, value_column, compare_column, alias, condition } => {
148                            let func = match agg_type {
149                                DimAggType::ArgMax => "argMax",
150                                DimAggType::ArgMin => "argMin",
151                            };
152                            let qv = quote_col(value_column);
153                            let qc = quote_col(compare_column);
154                            let expr = match condition {
155                                None => format!("{func}({qv}, {qc}) AS `{alias}`"),
156                                Some(cond) => format!("{func}If({qv}, {qc}, {cond}) AS `{alias}`"),
157                            };
158                            sub_parts.push(expr);
159                        }
160                    }
161                }
162                sql.push_str(&sub_parts.join(", "));
163                sql.push_str(&format!(" FROM `{}`.`{}`", join.schema, join.table));
164                if !join.group_by.is_empty() {
165                    sql.push_str(" GROUP BY ");
166                    let gb: Vec<String> = join.group_by.iter().map(|c| quote_col(c)).collect();
167                    sql.push_str(&gb.join(", "));
168                }
169                sql.push_str(&format!(") AS {}", join.alias));
170            } else {
171                // Mode A: direct JOIN for MergeTree / ReplacingMergeTree targets
172                sql.push_str(&format!(" {} `{}`.`{}` AS {}",
173                    join_kw, join.schema, join.table, join.alias));
174                if join.use_final {
175                    sql.push_str(" FINAL");
176                }
177            }
178
179            if join.join_type == JoinType::Cross {
180                // CROSS JOIN has no ON clause
181                continue;
182            }
183
184            // ON conditions — use alias if the local column was a func expression
185            let on_parts: Vec<String> = join.conditions.iter().map(|(local, remote)| {
186                let local_ref = main_alias_map.get(local).unwrap_or(local);
187                format!("_main.`{}` = {}.`{}`", local_ref, join.alias, remote)
188            }).collect();
189            sql.push_str(" ON ");
190            sql.push_str(&on_parts.join(" AND "));
191        }
192
193        CompileResult { sql, bindings, alias_remap }
194    }
195
196    fn quote_identifier(&self, name: &str) -> String {
197        format!("`{name}`")
198    }
199
200    fn name(&self) -> &str {
201        "ClickHouse"
202    }
203}
204
205impl ClickHouseDialect {
206    fn compile_inner(
207        &self,
208        ir: &QueryIR,
209        bindings: &mut Vec<SqlValue>,
210        alias_remap: &mut Vec<(String, String)>,
211    ) -> String {
212        let mut sql = String::new();
213
214        let mut augmented_selects = ir.selects.clone();
215        let mut agg_alias_map: HashMap<String, String> = HashMap::new();
216        let mut alias_counter = 0u32;
217
218        let having_cols: std::collections::HashSet<String> =
219            collect_filter_columns(&ir.having).into_iter().collect();
220        let has_having_agg = having_cols.iter().any(|c| c.contains('('));
221
222        if has_having_agg {
223            for sel in &mut augmented_selects {
224                if let SelectExpr::Column { column, alias } = sel {
225                    if column.contains('(') && having_cols.contains(column.as_str()) {
226                        if alias.is_none() {
227                            let a = format!("__f_{alias_counter}");
228                            alias_counter += 1;
229                            alias_remap.push((a.clone(), column.clone()));
230                            agg_alias_map.insert(column.clone(), a.clone());
231                            *alias = Some(a);
232                        } else if let Some(existing) = alias {
233                            agg_alias_map.insert(column.clone(), existing.clone());
234                        }
235                    }
236                }
237            }
238            for col in &having_cols {
239                if col.contains('(') && !agg_alias_map.contains_key(col.as_str()) {
240                    let a = format!("__f_{alias_counter}");
241                    alias_counter += 1;
242                    agg_alias_map.insert(col.clone(), a.clone());
243                    augmented_selects.push(SelectExpr::Column {
244                        column: col.clone(),
245                        alias: Some(a),
246                    });
247                }
248            }
249        }
250
251        for sel in &augmented_selects {
252            if let SelectExpr::DimAggregate { agg_type, value_column, compare_column, alias, .. } = sel {
253                let func = match agg_type {
254                    DimAggType::ArgMax => "argMax",
255                    DimAggType::ArgMin => "argMin",
256                };
257                let qv = quote_col(value_column);
258                let qc = quote_col(compare_column);
259                let expr = format!("{func}({qv}, {qc})");
260                agg_alias_map.insert(expr, alias.clone());
261            }
262        }
263
264        sql.push_str("SELECT ");
265        let select_parts: Vec<String> = augmented_selects.iter().map(|s| match s {
266            SelectExpr::Column { column, alias } => {
267                let col = if column.contains('(') { column.clone() } else { format!("`{column}`") };
268                match alias {
269                    Some(a) => format!("{col} AS `{a}`"),
270                    None => col,
271                }
272            },
273            SelectExpr::Aggregate { function, column, alias, condition } => {
274                let func = function.to_uppercase();
275                let qcol = quote_col(column);
276                match (func.as_str(), column.as_str(), condition) {
277                    ("COUNT", "*", None) => format!("count() AS `{alias}`"),
278                    ("COUNT", "*", Some(cond)) => format!("countIf({cond}) AS `{alias}`"),
279                    ("COUNT", _, None) => format!("uniqExact({qcol}) AS `{alias}`"),
280                    ("COUNT", _, Some(cond)) => format!("uniqExactIf({qcol}, {cond}) AS `{alias}`"),
281                    ("UNIQ", _, None) => format!("uniq({qcol}) AS `{alias}`"),
282                    ("UNIQ", _, Some(cond)) => format!("uniqIf({qcol}, {cond}) AS `{alias}`"),
283                    (_, _, None) => format!("{f}({qcol}) AS `{alias}`", f = func.to_lowercase()),
284                    (_, _, Some(cond)) => format!("{f}If({qcol}, {cond}) AS `{alias}`", f = func.to_lowercase()),
285                }
286            }
287            SelectExpr::DimAggregate { agg_type, value_column, compare_column, alias, condition } => {
288                let func = match agg_type {
289                    DimAggType::ArgMax => "argMax",
290                    DimAggType::ArgMin => "argMin",
291                };
292                let qv = quote_col(value_column);
293                let qc = quote_col(compare_column);
294                match condition {
295                    None => format!("{func}({qv}, {qc}) AS `{alias}`"),
296                    Some(cond) => format!("{func}If({qv}, {qc}, {cond}) AS `{alias}`"),
297                }
298            }
299        }).collect();
300        sql.push_str(&select_parts.join(", "));
301
302        if let Some(ref subquery) = ir.from_subquery {
303            sql.push_str(&format!(" FROM ({}) AS _t", subquery));
304        } else {
305            sql.push_str(&format!(" FROM `{}`.`{}`", ir.schema, ir.table));
306            if ir.use_final {
307                sql.push_str(" FINAL");
308            }
309        }
310
311        let where_clause = compile_filter(&ir.filters, bindings);
312        if !where_clause.is_empty() {
313            sql.push_str(" WHERE ");
314            sql.push_str(&where_clause);
315        }
316
317        let effective_group_by = if !ir.group_by.is_empty() {
318            ir.group_by.clone()
319        } else {
320            let has_agg_cols = augmented_selects.iter().any(|s| match s {
321                SelectExpr::Column { column, .. } => column.contains("Merge("),
322                SelectExpr::Aggregate { .. } | SelectExpr::DimAggregate { .. } => true,
323            });
324            if has_agg_cols {
325                augmented_selects.iter().filter_map(|s| match s {
326                    SelectExpr::Column { column, .. } if !column.contains("Merge(") && !column.contains('(') => {
327                        Some(column.clone())
328                    }
329                    _ => None,
330                }).collect()
331            } else {
332                vec![]
333            }
334        };
335
336        if !effective_group_by.is_empty() {
337            sql.push_str(" GROUP BY ");
338            let cols: Vec<String> = effective_group_by.iter().map(|c| quote_col(c)).collect();
339            sql.push_str(&cols.join(", "));
340        }
341
342        if has_having_agg {
343            let having_clause = compile_filter_with_aliases(&ir.having, bindings, &agg_alias_map);
344            if !having_clause.is_empty() {
345                sql.push_str(" HAVING ");
346                sql.push_str(&having_clause);
347            }
348        } else {
349            let having_clause = compile_filter(&ir.having, bindings);
350            if !having_clause.is_empty() {
351                sql.push_str(" HAVING ");
352                sql.push_str(&having_clause);
353            }
354        }
355
356        if !ir.order_by.is_empty() {
357            sql.push_str(" ORDER BY ");
358            let parts: Vec<String> = ir.order_by.iter().map(|o| {
359                let col = if o.column.contains('(') {
360                    agg_alias_map.get(&o.column)
361                        .map(|a| format!("`{a}`"))
362                        .unwrap_or_else(|| o.column.clone())
363                } else {
364                    format!("`{}`", o.column)
365                };
366                let dir = if o.descending { "DESC" } else { "ASC" };
367                format!("{col} {dir}")
368            }).collect();
369            sql.push_str(&parts.join(", "));
370        }
371
372        if let Some(ref lb) = ir.limit_by {
373            let by_cols: Vec<String> = lb.columns.iter().map(|c| format!("`{c}`")).collect();
374            sql.push_str(&format!(" LIMIT {} BY {}", lb.count, by_cols.join(", ")));
375            if lb.offset > 0 {
376                sql.push_str(&format!(" OFFSET {}", lb.offset));
377            }
378        }
379
380        sql.push_str(&format!(" LIMIT {}", ir.limit));
381        if ir.offset > 0 {
382            sql.push_str(&format!(" OFFSET {}", ir.offset));
383        }
384
385        sql
386    }
387}
388
389/// Collect all column names referenced in a filter tree.
390fn collect_filter_columns(node: &FilterNode) -> Vec<String> {
391    match node {
392        FilterNode::Empty => vec![],
393        FilterNode::Condition { column, .. } => vec![column.clone()],
394        FilterNode::And(children) | FilterNode::Or(children) => {
395            children.iter().flat_map(collect_filter_columns).collect()
396        }
397        FilterNode::ArrayIncludes { array_columns, .. } => array_columns.clone(),
398    }
399}
400
401/// Like `compile_filter` but replaces aggregate expression columns with their
402/// SELECT aliases so ClickHouse can resolve them in HAVING scope.
403fn compile_filter_with_aliases(
404    node: &FilterNode,
405    bindings: &mut Vec<SqlValue>,
406    aliases: &HashMap<String, String>,
407) -> String {
408    match node {
409        FilterNode::Empty => String::new(),
410        FilterNode::Condition { column, op, value } => {
411            let effective_col = aliases.get(column)
412                .map(|a| a.as_str())
413                .unwrap_or(column.as_str());
414            compile_condition(effective_col, op, value, bindings)
415        }
416        FilterNode::And(children) => {
417            let parts: Vec<String> = children.iter()
418                .map(|c| compile_filter_with_aliases(c, bindings, aliases))
419                .filter(|s| !s.is_empty())
420                .collect();
421            match parts.len() {
422                0 => String::new(),
423                1 => parts.into_iter().next().unwrap(),
424                _ => format!("({})", parts.join(" AND ")),
425            }
426        }
427        FilterNode::Or(children) => {
428            let parts: Vec<String> = children.iter()
429                .map(|c| compile_filter_with_aliases(c, bindings, aliases))
430                .filter(|s| !s.is_empty())
431                .collect();
432            match parts.len() {
433                0 => String::new(),
434                1 => parts.into_iter().next().unwrap(),
435                _ => format!("({})", parts.join(" OR ")),
436            }
437        }
438        FilterNode::ArrayIncludes { array_columns, element_conditions } => {
439            compile_array_includes(array_columns, element_conditions, bindings)
440        }
441    }
442}
443
444fn compile_filter(node: &FilterNode, bindings: &mut Vec<SqlValue>) -> String {
445    match node {
446        FilterNode::Empty => String::new(),
447        FilterNode::Condition { column, op, value } => {
448            compile_condition(column, op, value, bindings)
449        }
450        FilterNode::And(children) => {
451            let parts: Vec<String> = children.iter()
452                .map(|c| compile_filter(c, bindings))
453                .filter(|s| !s.is_empty())
454                .collect();
455            match parts.len() {
456                0 => String::new(),
457                1 => parts.into_iter().next().unwrap(),
458                _ => format!("({})", parts.join(" AND ")),
459            }
460        }
461        FilterNode::Or(children) => {
462            let parts: Vec<String> = children.iter()
463                .map(|c| compile_filter(c, bindings))
464                .filter(|s| !s.is_empty())
465                .collect();
466            match parts.len() {
467                0 => String::new(),
468                1 => parts.into_iter().next().unwrap(),
469                _ => format!("({})", parts.join(" OR ")),
470            }
471        }
472        FilterNode::ArrayIncludes { array_columns, element_conditions } => {
473            compile_array_includes(array_columns, element_conditions, bindings)
474        }
475    }
476}
477
478/// Compile ArrayIncludes into one or more `arrayExists(lambda, arrays)` expressions.
479fn compile_array_includes(
480    array_columns: &[String],
481    element_conditions: &[Vec<FilterNode>],
482    bindings: &mut Vec<SqlValue>,
483) -> String {
484    let params: Vec<String> = (0..array_columns.len())
485        .map(|i| format!("_p{i}"))
486        .collect();
487    let arrays_sql: Vec<String> = array_columns.iter()
488        .map(|c| quote_col(c))
489        .collect();
490    let arrays_ref = arrays_sql.join(", ");
491    let params_ref = params.join(", ");
492
493    let col_to_param: std::collections::HashMap<&str, &str> = array_columns.iter()
494        .zip(params.iter())
495        .map(|(c, p)| (c.as_str(), p.as_str()))
496        .collect();
497
498    let exists_parts: Vec<String> = element_conditions.iter().map(|conds| {
499        let cond_parts: Vec<String> = conds.iter()
500            .map(|c| compile_filter_with_param_remap(c, bindings, &col_to_param))
501            .filter(|s| !s.is_empty())
502            .collect();
503        let cond_sql = match cond_parts.len() {
504            0 => "1".to_string(),
505            1 => cond_parts.into_iter().next().unwrap(),
506            _ => format!("({})", cond_parts.join(" AND ")),
507        };
508        format!("arrayExists(({params_ref}) -> {cond_sql}, {arrays_ref})")
509    }).collect();
510
511    match exists_parts.len() {
512        0 => String::new(),
513        1 => exists_parts.into_iter().next().unwrap(),
514        _ => format!("({})", exists_parts.join(" AND ")),
515    }
516}
517
518/// Compile a filter node but remap column names to lambda parameter names.
519/// Lambda parameters must NOT be backtick-quoted in ClickHouse.
520fn compile_filter_with_param_remap(
521    node: &FilterNode,
522    bindings: &mut Vec<SqlValue>,
523    col_to_param: &std::collections::HashMap<&str, &str>,
524) -> String {
525    match node {
526        FilterNode::Empty => String::new(),
527        FilterNode::Condition { column, op, value } => {
528            if let Some(&param) = col_to_param.get(column.as_str()) {
529                compile_condition_raw(param, op, value, bindings)
530            } else {
531                compile_condition(column, op, value, bindings)
532            }
533        }
534        FilterNode::And(children) => {
535            let parts: Vec<String> = children.iter()
536                .map(|c| compile_filter_with_param_remap(c, bindings, col_to_param))
537                .filter(|s| !s.is_empty())
538                .collect();
539            match parts.len() {
540                0 => String::new(),
541                1 => parts.into_iter().next().unwrap(),
542                _ => format!("({})", parts.join(" AND ")),
543            }
544        }
545        FilterNode::Or(children) => {
546            let parts: Vec<String> = children.iter()
547                .map(|c| compile_filter_with_param_remap(c, bindings, col_to_param))
548                .filter(|s| !s.is_empty())
549                .collect();
550            match parts.len() {
551                0 => String::new(),
552                1 => parts.into_iter().next().unwrap(),
553                _ => format!("({})", parts.join(" OR ")),
554            }
555        }
556        FilterNode::ArrayIncludes { array_columns, element_conditions } => {
557            compile_array_includes(array_columns, element_conditions, bindings)
558        }
559    }
560}
561
/// Backtick-quotes a plain column name; text containing `(` is treated as a
/// function expression and returned unchanged.
fn quote_col(column: &str) -> String {
    match column.find('(') {
        Some(_) => column.to_owned(),
        None => ["`", column, "`"].concat(),
    }
}
569
570/// Like compile_condition but uses the column name as-is (no backtick quoting).
571/// Used for lambda parameters in arrayExists.
572fn compile_condition_raw(
573    col: &str, op: &CompareOp, value: &SqlValue, bindings: &mut Vec<SqlValue>,
574) -> String {
575    compile_condition_inner(col, op, value, bindings)
576}
577
578fn compile_condition(
579    column: &str, op: &CompareOp, value: &SqlValue, bindings: &mut Vec<SqlValue>,
580) -> String {
581    let col = quote_col(column);
582    compile_condition_inner(&col, op, value, bindings)
583}
584
585fn compile_condition_inner(
586    col: &str, op: &CompareOp, value: &SqlValue, bindings: &mut Vec<SqlValue>,
587) -> String {
588    match op {
589        CompareOp::In | CompareOp::NotIn => {
590            if let SqlValue::String(csv) = value {
591                let items: Vec<&str> = csv.split(',').collect();
592                let placeholders: Vec<&str> = items.iter().map(|_| "?").collect();
593                for item in &items {
594                    bindings.push(SqlValue::String(item.trim().to_string()));
595                }
596                format!("{col} {} ({})", op.sql_op(), placeholders.join(", "))
597            } else {
598                bindings.push(value.clone());
599                format!("{col} {} (?)", op.sql_op())
600            }
601        }
602        CompareOp::Includes => {
603            if let SqlValue::String(s) = value {
604                bindings.push(SqlValue::String(format!("%{s}%")));
605            } else {
606                bindings.push(value.clone());
607            }
608            format!("{col} LIKE ?")
609        }
610        CompareOp::IsNull | CompareOp::IsNotNull => {
611            format!("{col} {}", op.sql_op())
612        }
613        _ => {
614            if let SqlValue::Expression(expr) = value {
615                format!("{col} {} {expr}", op.sql_op())
616            } else {
617                bindings.push(value.clone());
618                format!("{col} {} ?", op.sql_op())
619            }
620        }
621    }
622}
623
624#[cfg(test)]
625mod tests {
626    use super::*;
627
628    fn ch() -> ClickHouseDialect { ClickHouseDialect::new() }
629
630    #[test]
631    fn test_simple_select() {
632        let ir = QueryIR {
633            cube: "DEXTrades".into(), schema: "default".into(),
634            table: "dwd_dex_trades".into(),
635            selects: vec![
636                SelectExpr::Column { column: "tx_hash".into(), alias: None },
637                SelectExpr::Column { column: "token_a_amount".into(), alias: None },
638            ],
639            filters: FilterNode::Empty, having: FilterNode::Empty,
640            group_by: vec![], order_by: vec![], limit: 10, offset: 0,
641            limit_by: None,
642            use_final: false,
643            joins: vec![],
644            custom_query_builder: None,
645            from_subquery: None,
646        };
647        let r = ch().compile(&ir);
648        assert_eq!(r.sql, "SELECT `tx_hash`, `token_a_amount` FROM `default`.`dwd_dex_trades` LIMIT 10");
649        assert!(r.bindings.is_empty());
650    }
651
652    #[test]
653    fn test_final_keyword() {
654        let ir = QueryIR {
655            cube: "T".into(), schema: "db".into(), table: "tokens".into(),
656            selects: vec![SelectExpr::Column { column: "id".into(), alias: None }],
657            filters: FilterNode::Empty, having: FilterNode::Empty,
658            group_by: vec![], order_by: vec![], limit: 10, offset: 0,
659            limit_by: None,
660            use_final: true,
661            joins: vec![],
662            custom_query_builder: None,
663            from_subquery: None,
664        };
665        let r = ch().compile(&ir);
666        assert!(r.sql.contains("FROM `db`.`tokens` FINAL"), "FINAL should be appended, got: {}", r.sql);
667    }
668
669    #[test]
670    fn test_uniq_uses_native_function() {
671        let ir = QueryIR {
672            cube: "T".into(), schema: "db".into(), table: "t".into(),
673            selects: vec![
674                SelectExpr::Aggregate { function: "UNIQ".into(), column: "wallet".into(), alias: "__uniq".into(), condition: None },
675            ],
676            filters: FilterNode::Empty, having: FilterNode::Empty,
677            group_by: vec![], order_by: vec![], limit: 10, offset: 0,
678            limit_by: None, use_final: false, joins: vec![], custom_query_builder: None, from_subquery: None,
679        };
680        let r = ch().compile(&ir);
681        assert!(r.sql.contains("uniq(`wallet`) AS `__uniq`"), "ClickHouse should use native uniq(), got: {}", r.sql);
682    }
683
684    #[test]
685    fn test_count_star() {
686        let ir = QueryIR {
687            cube: "T".into(), schema: "db".into(), table: "t".into(),
688            selects: vec![
689                SelectExpr::Aggregate { function: "COUNT".into(), column: "*".into(), alias: "__count".into(), condition: None },
690            ],
691            filters: FilterNode::Empty, having: FilterNode::Empty,
692            group_by: vec![], order_by: vec![], limit: 10, offset: 0,
693            limit_by: None, use_final: false, joins: vec![], custom_query_builder: None, from_subquery: None,
694        };
695        let r = ch().compile(&ir);
696        assert!(r.sql.contains("count() AS `__count`"), "ClickHouse should use count() not COUNT(*), got: {}", r.sql);
697    }
698
699    #[test]
700    fn test_aggregate_lowercase() {
701        let ir = QueryIR {
702            cube: "T".into(), schema: "db".into(), table: "t".into(),
703            selects: vec![
704                SelectExpr::Aggregate { function: "SUM".into(), column: "amount".into(), alias: "__sum".into(), condition: None },
705                SelectExpr::Aggregate { function: "AVG".into(), column: "price".into(), alias: "__avg".into(), condition: None },
706            ],
707            filters: FilterNode::Empty, having: FilterNode::Empty,
708            group_by: vec![], order_by: vec![], limit: 10, offset: 0,
709            limit_by: None, use_final: false, joins: vec![], custom_query_builder: None, from_subquery: None,
710        };
711        let r = ch().compile(&ir);
712        assert!(r.sql.contains("sum(`amount`) AS `__sum`"), "ClickHouse functions should be lowercase, got: {}", r.sql);
713        assert!(r.sql.contains("avg(`price`) AS `__avg`"), "got: {}", r.sql);
714    }
715
716    #[test]
717    fn test_where_and_order() {
718        let ir = QueryIR {
719            cube: "T".into(), schema: "db".into(), table: "t".into(),
720            selects: vec![SelectExpr::Column { column: "id".into(), alias: None }],
721            filters: FilterNode::And(vec![
722                FilterNode::Condition { column: "chain_id".into(), op: CompareOp::Eq, value: SqlValue::Int(1) },
723                FilterNode::Condition { column: "amount_usd".into(), op: CompareOp::Gt, value: SqlValue::Float(1000.0) },
724            ]),
725            having: FilterNode::Empty, group_by: vec![],
726            order_by: vec![OrderExpr { column: "block_timestamp".into(), descending: true }],
727            limit: 25, offset: 0,
728            limit_by: None, use_final: false, joins: vec![], custom_query_builder: None, from_subquery: None,
729        };
730        let r = ch().compile(&ir);
731        assert!(r.sql.contains("WHERE (`chain_id` = ? AND `amount_usd` > ?)"));
732        assert!(r.sql.contains("ORDER BY `block_timestamp` DESC"));
733        assert_eq!(r.bindings.len(), 2);
734    }
735
736    #[test]
737    fn test_having_with_aggregate_expr() {
738        let ir = QueryIR {
739            cube: "T".into(), schema: "db".into(), table: "t".into(),
740            selects: vec![
741                SelectExpr::Column { column: "token_address".into(), alias: None },
742                SelectExpr::Aggregate { function: "SUM".into(), column: "amount_usd".into(), alias: "__sum".into(), condition: None },
743            ],
744            filters: FilterNode::Empty,
745            having: FilterNode::Condition {
746                column: "sum(`amount_usd`)".into(), op: CompareOp::Gt, value: SqlValue::Float(1000000.0),
747            },
748            group_by: vec!["token_address".into()], order_by: vec![], limit: 25, offset: 0,
749            limit_by: None, use_final: false, joins: vec![], custom_query_builder: None, from_subquery: None,
750        };
751        let r = ch().compile(&ir);
752        assert!(r.sql.contains("GROUP BY `token_address`"));
753        assert!(r.sql.contains("HAVING `__f_0` > ?"), "expected alias in HAVING, got: {}", r.sql);
754        assert!(r.sql.contains("sum(`amount_usd`) AS `__f_0`"), "expected alias in SELECT, got: {}", r.sql);
755        assert_eq!(r.bindings.len(), 1);
756    }
757
758    #[test]
759    fn test_having_appends_missing_agg_column() {
760        let ir = QueryIR {
761            cube: "T".into(), schema: "db".into(), table: "t".into(),
762            selects: vec![
763                SelectExpr::Column { column: "pool_address".into(), alias: None },
764                SelectExpr::Column { column: "argMaxMerge(latest_liquidity_usd_state)".into(), alias: None },
765            ],
766            filters: FilterNode::Empty,
767            having: FilterNode::And(vec![
768                FilterNode::Condition {
769                    column: "argMaxMerge(latest_liquidity_usd_state)".into(),
770                    op: CompareOp::Gt, value: SqlValue::Float(2.0),
771                },
772                FilterNode::Condition {
773                    column: "argMaxMerge(latest_token_a_amount_state)".into(),
774                    op: CompareOp::Gt, value: SqlValue::Float(3.0),
775                },
776            ]),
777            group_by: vec!["pool_address".into()], order_by: vec![], limit: 25, offset: 0,
778            limit_by: None, use_final: false, joins: vec![], custom_query_builder: None, from_subquery: None,
779        };
780        let r = ch().compile(&ir);
781        assert!(r.sql.contains("argMaxMerge(latest_liquidity_usd_state) AS `__f_0`"),
782            "existing HAVING col should be aliased, got: {}", r.sql);
783        assert!(r.sql.contains("argMaxMerge(latest_token_a_amount_state) AS `__f_1`"),
784            "missing agg col should be appended, got: {}", r.sql);
785        assert!(r.sql.contains("HAVING (`__f_0` > ? AND `__f_1` > ?)"),
786            "HAVING should use aliases, got: {}", r.sql);
787        assert_eq!(r.bindings.len(), 2);
788        assert_eq!(r.alias_remap.len(), 1);
789        assert_eq!(r.alias_remap[0], ("__f_0".to_string(), "argMaxMerge(latest_liquidity_usd_state)".to_string()));
790    }
791
792    #[test]
793    fn test_limit_by() {
794        let ir = QueryIR {
795            cube: "T".into(), schema: "db".into(), table: "t".into(),
796            selects: vec![
797                SelectExpr::Column { column: "owner".into(), alias: None },
798                SelectExpr::Column { column: "amount".into(), alias: None },
799            ],
800            filters: FilterNode::Empty, having: FilterNode::Empty,
801            group_by: vec![], 
802            order_by: vec![OrderExpr { column: "amount".into(), descending: true }],
803            limit: 100, offset: 0,
804            limit_by: Some(LimitByExpr { count: 3, offset: 0, columns: vec!["owner".into()] }),
805            use_final: false, joins: vec![], custom_query_builder: None, from_subquery: None,
806        };
807        let r = ch().compile(&ir);
808        let sql = &r.sql;
809        assert!(sql.contains("LIMIT 3 BY `owner`"), "LIMIT BY should be present, got: {sql}");
810        assert!(sql.contains("ORDER BY `amount` DESC"), "ORDER BY should be present, got: {sql}");
811        assert!(sql.contains("LIMIT 100"), "outer LIMIT should be present, got: {sql}");
812        let order_by_pos = sql.find("ORDER BY").unwrap();
813        let limit_by_pos = sql.find("LIMIT 3 BY").unwrap();
814        let limit_pos = sql.rfind("LIMIT 100").unwrap();
815        assert!(order_by_pos < limit_by_pos, "ORDER BY should come before LIMIT BY in ClickHouse");
816        assert!(limit_by_pos < limit_pos, "LIMIT BY should come before outer LIMIT");
817    }
818
819    #[test]
820    fn test_limit_by_with_offset() {
821        let ir = QueryIR {
822            cube: "T".into(), schema: "db".into(), table: "t".into(),
823            selects: vec![SelectExpr::Column { column: "id".into(), alias: None }],
824            filters: FilterNode::Empty, having: FilterNode::Empty,
825            group_by: vec![], order_by: vec![], limit: 10, offset: 0,
826            limit_by: Some(LimitByExpr { count: 5, offset: 2, columns: vec!["token".into(), "wallet".into()] }),
827            use_final: false, joins: vec![], custom_query_builder: None, from_subquery: None,
828        };
829        let r = ch().compile(&ir);
830        assert!(r.sql.contains("LIMIT 5 BY `token`, `wallet` OFFSET 2"), "multi-column LIMIT BY with offset, got: {}", r.sql);
831    }
832
833    #[test]
834    fn test_join_direct() {
835        let ir = QueryIR {
836            cube: "DEXTrades".into(), schema: "dexes_dwd".into(),
837            table: "sol_dex_trades".into(),
838            selects: vec![
839                SelectExpr::Column { column: "tx_hash".into(), alias: None },
840                SelectExpr::Column { column: "buy_token_address".into(), alias: None },
841            ],
842            filters: FilterNode::Empty, having: FilterNode::Empty,
843            group_by: vec![], order_by: vec![], limit: 25, offset: 0,
844            limit_by: None, use_final: false,
845            joins: vec![JoinExpr {
846                schema: "dexes_dim".into(), table: "sol_tokens".into(),
847                alias: "_j0".into(),
848                conditions: vec![("buy_token_address".into(), "token_address".into())],
849                selects: vec![
850                    SelectExpr::Column { column: "name".into(), alias: None },
851                    SelectExpr::Column { column: "symbol".into(), alias: None },
852                ],
853                group_by: vec![], use_final: true, is_aggregate: false,
854                target_cube: "TokenSearch".into(), join_field: "joinBuyToken".into(),
855                join_type: JoinType::Left,
856            }],
857            custom_query_builder: None,
858            from_subquery: None,
859        };
860        let r = ch().compile(&ir);
861        assert!(r.sql.contains("FROM (SELECT"), "main query should be wrapped, got: {}", r.sql);
862        assert!(r.sql.contains("LEFT JOIN `dexes_dim`.`sol_tokens` AS _j0 FINAL"),
863            "direct JOIN with FINAL after alias, got: {}", r.sql);
864        assert!(r.sql.contains("_main.`buy_token_address` = _j0.`token_address`"),
865            "ON condition, got: {}", r.sql);
866        assert!(r.sql.contains("_j0.`name` AS `_j0.name`"), "joined col alias, got: {}", r.sql);
867    }
868
869    #[test]
870    fn test_join_aggregate_subquery() {
871        let ir = QueryIR {
872            cube: "DEXTrades".into(), schema: "dexes_dwd".into(),
873            table: "sol_dex_trades".into(),
874            selects: vec![
875                SelectExpr::Column { column: "tx_hash".into(), alias: None },
876                SelectExpr::Column { column: "buy_token_address".into(), alias: None },
877            ],
878            filters: FilterNode::Empty, having: FilterNode::Empty,
879            group_by: vec![], order_by: vec![], limit: 10, offset: 0,
880            limit_by: None, use_final: false,
881            joins: vec![JoinExpr {
882                schema: "dexes_dws".into(), table: "sol_token_market_cap".into(),
883                alias: "_j0".into(),
884                conditions: vec![("buy_token_address".into(), "token_address".into())],
885                selects: vec![
886                    SelectExpr::Column { column: "argMaxMerge(latest_market_cap_usd_state)".into(), alias: None },
887                ],
888                group_by: vec!["token_address".into()],
889                use_final: false, is_aggregate: true,
890                target_cube: "TokenMarketCap".into(), join_field: "joinBuyTokenMarketCap".into(),
891                join_type: JoinType::Left,
892            }],
893            custom_query_builder: None,
894            from_subquery: None,
895        };
896        let r = ch().compile(&ir);
897        assert!(r.sql.contains("LEFT JOIN (SELECT"), "aggregate should use subquery, got: {}", r.sql);
898        assert!(r.sql.contains("GROUP BY `token_address`"), "subquery GROUP BY, got: {}", r.sql);
899        assert!(r.sql.contains("FROM `dexes_dws`.`sol_token_market_cap`"), "subquery FROM, got: {}", r.sql);
900        assert!(r.sql.contains("argMaxMerge(latest_market_cap_usd_state) AS `__jc_0`"),
901            "join func expr should be aliased in subquery, got: {}", r.sql);
902        assert!(r.sql.contains("_j0.`__jc_0` AS `_j0.__jc_0`"),
903            "outer SELECT should use alias for join func col, got: {}", r.sql);
904    }
905
906    #[test]
907    fn test_join_main_query_func_expression_columns() {
908        let ir = QueryIR {
909            cube: "TokenHolders".into(), schema: "dws".into(),
910            table: "sol_token_holders".into(),
911            selects: vec![
912                SelectExpr::Column { column: "token".into(), alias: None },
913                SelectExpr::Column { column: "holder".into(), alias: None },
914                SelectExpr::Column { column: "argMaxMerge(latest_balance)".into(), alias: None },
915                SelectExpr::Column { column: "argMaxMerge(latest_balance_usd)".into(), alias: None },
916                SelectExpr::Column { column: "minMerge(first_seen)".into(), alias: None },
917                SelectExpr::Column { column: "maxMerge(last_seen)".into(), alias: None },
918            ],
919            filters: FilterNode::Empty, having: FilterNode::Empty,
920            group_by: vec![], order_by: vec![
921                OrderExpr { column: "argMaxMerge(latest_balance_usd)".into(), descending: true },
922            ],
923            limit: 100, offset: 0,
924            limit_by: None, use_final: false,
925            joins: vec![JoinExpr {
926                schema: "dim".into(), table: "sol_tokens".into(),
927                alias: "_j0".into(),
928                conditions: vec![("token".into(), "token_address".into())],
929                selects: vec![
930                    SelectExpr::Column { column: "name".into(), alias: None },
931                    SelectExpr::Column { column: "symbol".into(), alias: None },
932                ],
933                group_by: vec![], use_final: true, is_aggregate: false,
934                target_cube: "TokenSearch".into(), join_field: "joinToken".into(),
935                join_type: JoinType::Left,
936            }],
937            custom_query_builder: None,
938            from_subquery: None,
939        };
940        let r = ch().compile(&ir);
941        let sql = &r.sql;
942
943        assert!(sql.contains("_main.`__mc_0` AS `__mc_0`"),
944            "func expr should use alias __mc_0 in outer SELECT, got: {sql}");
945        assert!(sql.contains("_main.`__mc_1` AS `__mc_1`"),
946            "func expr should use alias __mc_1, got: {sql}");
947        assert!(sql.contains("_main.`token` AS `token`"),
948            "simple col should be backtick-quoted, got: {sql}");
949
950        assert!(!sql.contains("_main.argMaxMerge("),
951            "outer SELECT must NOT have bare _main.argMaxMerge(...), got: {sql}");
952
953        assert!(sql.contains("argMaxMerge(latest_balance) AS `__mc_0`"),
954            "inner query should alias func expr, got: {sql}");
955
956        assert!(r.alias_remap.iter().any(|(a, o)| a == "__mc_0" && o == "argMaxMerge(latest_balance)"),
957            "alias_remap should map __mc_0 → original, got: {:?}", r.alias_remap);
958        assert!(r.alias_remap.iter().any(|(a, o)| a == "__mc_1" && o == "argMaxMerge(latest_balance_usd)"),
959            "alias_remap should map __mc_1, got: {:?}", r.alias_remap);
960    }
961
962    #[test]
963    fn test_join_inner_type() {
964        let ir = QueryIR {
965            cube: "DEXTrades".into(), schema: "dexes_dwd".into(),
966            table: "sol_dex_trades".into(),
967            selects: vec![
968                SelectExpr::Column { column: "tx_hash".into(), alias: None },
969            ],
970            filters: FilterNode::Empty, having: FilterNode::Empty,
971            group_by: vec![], order_by: vec![], limit: 10, offset: 0,
972            limit_by: None, use_final: false,
973            joins: vec![JoinExpr {
974                schema: "dexes_dim".into(), table: "sol_tokens".into(),
975                alias: "_j0".into(),
976                conditions: vec![("buy_token_address".into(), "token_address".into())],
977                selects: vec![
978                    SelectExpr::Column { column: "name".into(), alias: None },
979                ],
980                group_by: vec![], use_final: false, is_aggregate: false,
981                target_cube: "TokenSearch".into(), join_field: "joinBuyToken".into(),
982                join_type: JoinType::Inner,
983            }],
984            custom_query_builder: None,
985            from_subquery: None,
986        };
987        let r = ch().compile(&ir);
988        assert!(r.sql.contains("INNER JOIN `dexes_dim`.`sol_tokens` AS _j0"),
989            "should use INNER JOIN, got: {}", r.sql);
990    }
991
992    #[test]
993    fn test_join_full_outer_type() {
994        let ir = QueryIR {
995            cube: "T".into(), schema: "db".into(), table: "t".into(),
996            selects: vec![
997                SelectExpr::Column { column: "id".into(), alias: None },
998            ],
999            filters: FilterNode::Empty, having: FilterNode::Empty,
1000            group_by: vec![], order_by: vec![], limit: 10, offset: 0,
1001            limit_by: None, use_final: false,
1002            joins: vec![JoinExpr {
1003                schema: "db2".into(), table: "t2".into(),
1004                alias: "_j0".into(),
1005                conditions: vec![("id".into(), "ref_id".into())],
1006                selects: vec![
1007                    SelectExpr::Column { column: "val".into(), alias: None },
1008                ],
1009                group_by: vec![], use_final: false, is_aggregate: false,
1010                target_cube: "Other".into(), join_field: "joinOther".into(),
1011                join_type: JoinType::Full,
1012            }],
1013            custom_query_builder: None,
1014            from_subquery: None,
1015        };
1016        let r = ch().compile(&ir);
1017        assert!(r.sql.contains("FULL OUTER JOIN `db2`.`t2` AS _j0"),
1018            "should use FULL OUTER JOIN, got: {}", r.sql);
1019    }
1020
1021    #[test]
1022    fn test_custom_query_builder() {
1023        let ir = QueryIR {
1024            cube: "Custom".into(), schema: "db".into(), table: "t".into(),
1025            selects: vec![
1026                SelectExpr::Column { column: "id".into(), alias: None },
1027            ],
1028            filters: FilterNode::Empty, having: FilterNode::Empty,
1029            group_by: vec![], order_by: vec![], limit: 10, offset: 0,
1030            limit_by: None, use_final: false, joins: vec![],
1031            custom_query_builder: Some(QueryBuilderFn(std::sync::Arc::new(|_ir| {
1032                CompileResult {
1033                    sql: "SELECT 1 FROM custom_view".into(),
1034                    bindings: vec![],
1035                    alias_remap: vec![],
1036                }
1037            }))),
1038            from_subquery: None,
1039        };
1040        let r = ch().compile(&ir);
1041        assert_eq!(r.sql, "SELECT 1 FROM custom_view",
1042            "custom builder should bypass standard compilation, got: {}", r.sql);
1043    }
1044
1045    #[test]
1046    fn test_from_subquery() {
1047        let ir = QueryIR {
1048            cube: "DEXTradeByTokens".into(), schema: "dwd".into(),
1049            table: "sol_trades".into(),
1050            selects: vec![
1051                SelectExpr::Column { column: "amount".into(), alias: None },
1052                SelectExpr::Column { column: "side_type".into(), alias: None },
1053            ],
1054            filters: FilterNode::Condition {
1055                column: "token".into(), op: CompareOp::Eq,
1056                value: SqlValue::String("SOL".into()),
1057            },
1058            having: FilterNode::Empty,
1059            group_by: vec![], order_by: vec![], limit: 10, offset: 0,
1060            limit_by: None, use_final: false, joins: vec![],
1061            custom_query_builder: None,
1062            from_subquery: Some(
1063                "SELECT amount, 'buy' AS side_type, token FROM dwd.sol_a UNION ALL SELECT amount, 'sell' AS side_type, token FROM dwd.sol_b".into()
1064            ),
1065        };
1066        let r = ch().compile(&ir);
1067        assert!(r.sql.starts_with("SELECT `amount`, `side_type` FROM (SELECT"),
1068            "should use subquery in FROM, got: {}", r.sql);
1069        assert!(r.sql.contains("UNION ALL"),
1070            "subquery should contain UNION ALL, got: {}", r.sql);
1071        assert!(r.sql.contains(") AS _t"),
1072            "subquery should be aliased as _t, got: {}", r.sql);
1073        assert!(r.sql.contains("WHERE `token` = ?"),
1074            "WHERE clause should be applied to subquery result, got: {}", r.sql);
1075        assert!(!r.sql.contains("FROM `dwd`.`sol_trades`"),
1076            "should NOT use schema.table when from_subquery is set, got: {}", r.sql);
1077    }
1078
1079    #[test]
1080    fn test_array_includes_single_condition() {
1081        let ir = QueryIR {
1082            cube: "Instructions".into(), schema: "dexes_dwd2".into(),
1083            table: "sol_instructions".into(),
1084            selects: vec![SelectExpr::Column { column: "tx_hash".into(), alias: None }],
1085            filters: FilterNode::ArrayIncludes {
1086                array_columns: vec![
1087                    "instruction_arg_names".into(),
1088                    "instruction_arg_types".into(),
1089                    "instruction_arg_values".into(),
1090                ],
1091                element_conditions: vec![vec![
1092                    FilterNode::Condition {
1093                        column: "instruction_arg_names".into(),
1094                        op: CompareOp::Eq,
1095                        value: SqlValue::String("amount_in".into()),
1096                    },
1097                ]],
1098            },
1099            having: FilterNode::Empty,
1100            group_by: vec![], order_by: vec![], limit: 10, offset: 0,
1101            limit_by: None, use_final: false, joins: vec![],
1102            custom_query_builder: None, from_subquery: None,
1103        };
1104        let r = ch().compile(&ir);
1105        assert!(r.sql.contains("arrayExists((_p0, _p1, _p2) -> _p0 = ?"),
1106            "should generate arrayExists with lambda params, got: {}", r.sql);
1107        assert!(r.sql.contains("`instruction_arg_names`, `instruction_arg_types`, `instruction_arg_values`"),
1108            "should reference all parallel array columns, got: {}", r.sql);
1109        assert_eq!(r.bindings.len(), 1);
1110    }
1111
1112    #[test]
1113    fn test_array_includes_multiple_conditions() {
1114        let ir = QueryIR {
1115            cube: "Instructions".into(), schema: "dexes_dwd2".into(),
1116            table: "sol_instructions".into(),
1117            selects: vec![SelectExpr::Column { column: "tx_hash".into(), alias: None }],
1118            filters: FilterNode::ArrayIncludes {
1119                array_columns: vec![
1120                    "instruction_arg_names".into(),
1121                    "instruction_arg_values".into(),
1122                ],
1123                element_conditions: vec![
1124                    vec![
1125                        FilterNode::Condition {
1126                            column: "instruction_arg_names".into(),
1127                            op: CompareOp::Eq,
1128                            value: SqlValue::String("amount_in".into()),
1129                        },
1130                        FilterNode::Condition {
1131                            column: "instruction_arg_values".into(),
1132                            op: CompareOp::Gt,
1133                            value: SqlValue::String("10000".into()),
1134                        },
1135                    ],
1136                    vec![
1137                        FilterNode::Condition {
1138                            column: "instruction_arg_names".into(),
1139                            op: CompareOp::Eq,
1140                            value: SqlValue::String("owner".into()),
1141                        },
1142                    ],
1143                ],
1144            },
1145            having: FilterNode::Empty,
1146            group_by: vec![], order_by: vec![], limit: 10, offset: 0,
1147            limit_by: None, use_final: false, joins: vec![],
1148            custom_query_builder: None, from_subquery: None,
1149        };
1150        let r = ch().compile(&ir);
1151        let sql = &r.sql;
1152        let count = sql.matches("arrayExists").count();
1153        assert_eq!(count, 2, "should have two arrayExists calls (AND-ed), got: {sql}");
1154        assert!(sql.contains(" AND arrayExists("),
1155            "two arrayExists should be AND-ed, got: {sql}");
1156        assert_eq!(r.bindings.len(), 3);
1157    }
1158
1159    #[test]
1160    fn test_array_includes_with_in_operator() {
1161        let ir = QueryIR {
1162            cube: "Instructions".into(), schema: "dexes_dwd2".into(),
1163            table: "sol_instructions".into(),
1164            selects: vec![SelectExpr::Column { column: "tx_hash".into(), alias: None }],
1165            filters: FilterNode::ArrayIncludes {
1166                array_columns: vec![
1167                    "instruction_arg_names".into(),
1168                    "instruction_arg_values".into(),
1169                ],
1170                element_conditions: vec![vec![
1171                    FilterNode::Condition {
1172                        column: "instruction_arg_names".into(),
1173                        op: CompareOp::Eq,
1174                        value: SqlValue::String("authorityType".into()),
1175                    },
1176                    FilterNode::Condition {
1177                        column: "instruction_arg_values".into(),
1178                        op: CompareOp::In,
1179                        value: SqlValue::String("0,1".into()),
1180                    },
1181                ]],
1182            },
1183            having: FilterNode::Empty,
1184            group_by: vec![], order_by: vec![], limit: 10, offset: 0,
1185            limit_by: None, use_final: false, joins: vec![],
1186            custom_query_builder: None, from_subquery: None,
1187        };
1188        let r = ch().compile(&ir);
1189        assert!(r.sql.contains("arrayExists((_p0, _p1) -> (_p0 = ? AND _p1 IN (?, ?))"),
1190            "should generate arrayExists with AND-ed conditions, got: {}", r.sql);
1191        assert_eq!(r.bindings.len(), 3);
1192    }
1193
1194    #[test]
1195    fn test_array_includes_combined_with_regular_filter() {
1196        let ir = QueryIR {
1197            cube: "Instructions".into(), schema: "dexes_dwd2".into(),
1198            table: "sol_instructions".into(),
1199            selects: vec![SelectExpr::Column { column: "tx_hash".into(), alias: None }],
1200            filters: FilterNode::And(vec![
1201                FilterNode::Condition {
1202                    column: "instruction_program_address".into(),
1203                    op: CompareOp::Eq,
1204                    value: SqlValue::String("pAMMBay6oceH9fJKBRHGP5D4bD4sWpmSwMn52FMfXEA".into()),
1205                },
1206                FilterNode::ArrayIncludes {
1207                    array_columns: vec!["instruction_arg_names".into(), "instruction_arg_values".into()],
1208                    element_conditions: vec![vec![
1209                        FilterNode::Condition {
1210                            column: "instruction_arg_names".into(),
1211                            op: CompareOp::Eq,
1212                            value: SqlValue::String("amount".into()),
1213                        },
1214                    ]],
1215                },
1216            ]),
1217            having: FilterNode::Empty,
1218            group_by: vec![], order_by: vec![], limit: 10, offset: 0,
1219            limit_by: None, use_final: false, joins: vec![],
1220            custom_query_builder: None, from_subquery: None,
1221        };
1222        let r = ch().compile(&ir);
1223        let sql = &r.sql;
1224        assert!(sql.contains("`instruction_program_address` = ?"),
1225            "should have regular condition, got: {sql}");
1226        assert!(sql.contains("arrayExists("),
1227            "should have arrayExists, got: {sql}");
1228        assert!(sql.contains(" AND "),
1229            "regular + array conditions should be AND-ed, got: {sql}");
1230    }
1231}