Skip to main content

sql_cli/sql/parser/expressions/
primary.rs

1// Primary expression parsing
2// Handles literals, identifiers, function calls, and parenthesized expressions
3
4use crate::sql::parser::ast::{ColumnRef, SqlExpression, WindowSpec};
5use crate::sql::parser::lexer::Token;
6use tracing::{debug, trace};
7
8use super::{log_parse_decision, trace_parse_entry, trace_parse_exit, ExpressionParser};
9
10/// Parser context for primary expressions
11pub struct PrimaryExpressionContext<'a> {
12    pub columns: &'a [String],
13    pub in_method_args: bool,
14}
15
16impl<'a> Default for PrimaryExpressionContext<'a> {
17    fn default() -> Self {
18        Self {
19            columns: &[],
20            in_method_args: false,
21        }
22    }
23}
24
25/// Parse a primary expression (literals, identifiers, functions, parentheses)
26/// This is the bottom of the expression hierarchy
27pub fn parse_primary<P>(
28    parser: &mut P,
29    ctx: &PrimaryExpressionContext,
30) -> Result<SqlExpression, String>
31where
32    P: ParsePrimary + ExpressionParser + ?Sized,
33{
34    trace_parse_entry("parse_primary", ExpressionParser::current_token(parser));
35
36    // Special case: check if a number literal could actually be a column name
37    // This handles cases where columns are named with pure numbers like "202204"
38    if let Token::NumberLiteral(num_str) = ExpressionParser::current_token(parser) {
39        if ctx.columns.iter().any(|col| col == num_str) {
40            log_parse_decision(
41                "parse_primary",
42                ExpressionParser::current_token(parser),
43                "Number literal matches column name, treating as column",
44            );
45            let expr = SqlExpression::Column(ColumnRef::unquoted(num_str.clone()));
46            ExpressionParser::advance(parser);
47            let result = Ok(expr);
48            trace_parse_exit("parse_primary", &result);
49            return result;
50        }
51    }
52
53    let result = match ExpressionParser::current_token(parser) {
54        Token::Case => {
55            debug!("Parsing CASE expression");
56            parser.parse_case_expression()
57        }
58
59        Token::DateTime => {
60            debug!("Parsing DateTime constructor");
61            parse_datetime_constructor(parser)
62        }
63
64        Token::Unnest => {
65            debug!("Parsing UNNEST expression");
66            parse_unnest(parser)
67        }
68
69        Token::Identifier(id) => {
70            let id_upper = id.to_uppercase();
71            let id_clone = id.clone();
72
73            // Check for boolean literals first
74            if id_upper == "TRUE" {
75                log_parse_decision(
76                    "parse_primary",
77                    ExpressionParser::current_token(parser),
78                    "Boolean literal TRUE",
79                );
80                ExpressionParser::advance(parser);
81                Ok(SqlExpression::BooleanLiteral(true))
82            } else if id_upper == "FALSE" {
83                log_parse_decision(
84                    "parse_primary",
85                    ExpressionParser::current_token(parser),
86                    "Boolean literal FALSE",
87                );
88                ExpressionParser::advance(parser);
89                Ok(SqlExpression::BooleanLiteral(false))
90            } else {
91                ExpressionParser::advance(parser);
92
93                // Check for table.column notation or method calls
94                if matches!(ExpressionParser::current_token(parser), Token::Dot) {
95                    ExpressionParser::advance(parser); // consume dot
96
97                    if let Token::Identifier(next_id) = ExpressionParser::current_token(parser) {
98                        let next_id = next_id.clone();
99                        ExpressionParser::advance(parser);
100
101                        // Check if this is a method call (followed by parentheses)
102                        if matches!(ExpressionParser::current_token(parser), Token::LeftParen) {
103                            debug!(object = %id_clone, method = %next_id, "Parsing method call");
104                            ExpressionParser::advance(parser); // consume (
105
106                            // Handle empty argument list
107                            let args = if matches!(
108                                ExpressionParser::current_token(parser),
109                                Token::RightParen
110                            ) {
111                                Vec::new()
112                            } else {
113                                parser.parse_expression_list()?
114                            };
115                            ExpressionParser::consume(parser, Token::RightParen)?;
116
117                            log_parse_decision(
118                                "parse_primary",
119                                &Token::Identifier(next_id.clone()),
120                                "Method call",
121                            );
122                            Ok(SqlExpression::MethodCall {
123                                object: id_clone,
124                                method: next_id,
125                                args,
126                            })
127                        } else {
128                            // It's a qualified column reference
129                            let col_ref = ColumnRef::qualified(id_clone, next_id.clone());
130                            log_parse_decision(
131                                "parse_primary",
132                                &Token::Identifier(next_id),
133                                "Qualified column reference",
134                            );
135                            Ok(SqlExpression::Column(col_ref))
136                        }
137                    } else {
138                        Err("Expected identifier after '.'".to_string())
139                    }
140                // Check if this is a function call
141                } else if matches!(ExpressionParser::current_token(parser), Token::LeftParen) {
142                    debug!(function = %id_upper, "Parsing function call");
143                    ExpressionParser::advance(parser); // consume (
144                    let (args, has_distinct) = parser.parse_function_args()?;
145                    ExpressionParser::consume(parser, Token::RightParen)?;
146
147                    // Check for OVER clause for window functions
148                    if matches!(ExpressionParser::current_token(parser), Token::Over) {
149                        debug!(function = %id_upper, "Window function detected");
150                        ExpressionParser::advance(parser); // consume OVER
151                        ExpressionParser::consume(parser, Token::LeftParen)?;
152                        let window_spec = parser.parse_window_spec()?;
153                        ExpressionParser::consume(parser, Token::RightParen)?;
154                        Ok(SqlExpression::WindowFunction {
155                            name: id_upper,
156                            args,
157                            window_spec,
158                        })
159                    } else {
160                        Ok(SqlExpression::FunctionCall {
161                            name: id_upper,
162                            args,
163                            distinct: has_distinct,
164                        })
165                    }
166                } else {
167                    // Otherwise treat as simple column
168                    log_parse_decision(
169                        "parse_primary",
170                        &Token::Identifier(id_clone.clone()),
171                        "Column reference",
172                    );
173                    Ok(SqlExpression::Column(ColumnRef::unquoted(id_clone)))
174                }
175            }
176        }
177
178        Token::QuotedIdentifier(id) => {
179            let expr = if ctx.in_method_args {
180                // In method arguments, treat quoted identifiers as string literals
181                log_parse_decision(
182                    "parse_primary",
183                    ExpressionParser::current_token(parser),
184                    "Quoted identifier in method args - treating as string",
185                );
186                SqlExpression::StringLiteral(id.clone())
187            } else {
188                // Otherwise it's a column name like "Customer Id"
189                log_parse_decision(
190                    "parse_primary",
191                    ExpressionParser::current_token(parser),
192                    "Quoted identifier as column name",
193                );
194                SqlExpression::Column(ColumnRef::quoted(id.clone()))
195            };
196            ExpressionParser::advance(parser);
197            Ok(expr)
198        }
199
200        Token::StringLiteral(s) => {
201            trace!("String literal: {}", s);
202            let expr = SqlExpression::StringLiteral(s.clone());
203            ExpressionParser::advance(parser);
204            Ok(expr)
205        }
206
207        Token::NumberLiteral(n) => {
208            trace!("Number literal: {}", n);
209            let expr = SqlExpression::NumberLiteral(n.clone());
210            ExpressionParser::advance(parser);
211            Ok(expr)
212        }
213
214        Token::Null => {
215            trace!("NULL literal");
216            ExpressionParser::advance(parser);
217            Ok(SqlExpression::Null)
218        }
219
220        // Handle LEFT and RIGHT as function names when followed by parentheses
221        Token::Left | Token::Right => {
222            let func_name = match ExpressionParser::current_token(parser) {
223                Token::Left => "LEFT".to_string(),
224                Token::Right => "RIGHT".to_string(),
225                _ => unreachable!(),
226            };
227
228            ExpressionParser::advance(parser);
229
230            // Check if this is a function call
231            if matches!(ExpressionParser::current_token(parser), Token::LeftParen) {
232                debug!(function = %func_name, "Parsing LEFT/RIGHT function call");
233                ExpressionParser::advance(parser); // consume (
234                let (args, _has_distinct) = parser.parse_function_args()?;
235                ExpressionParser::consume(parser, Token::RightParen)?;
236
237                Ok(SqlExpression::FunctionCall {
238                    name: func_name,
239                    args,
240                    distinct: false,
241                })
242            } else {
243                // If not followed by parenthesis, this is likely a JOIN keyword - error
244                Err(format!(
245                    "{} keyword unexpected in expression context",
246                    func_name
247                ))
248            }
249        }
250
251        Token::LeftParen => {
252            debug!("Parsing parenthesized expression or subquery");
253            ExpressionParser::advance(parser); // consume (
254
255            // Check if this is a subquery (starts with SELECT)
256            if matches!(ExpressionParser::current_token(parser), Token::Select) {
257                debug!("Detected subquery - parsing SELECT statement");
258                let subquery = parser.parse_subquery()?;
259                ExpressionParser::consume(parser, Token::RightParen)?;
260                Ok(SqlExpression::ScalarSubquery {
261                    query: Box::new(subquery),
262                })
263            } else {
264                // Regular parenthesized expression
265                debug!("Regular parenthesized expression");
266                let expr = parser.parse_logical_or()?;
267                ExpressionParser::consume(parser, Token::RightParen)?;
268                Ok(expr)
269            }
270        }
271
272        Token::Not => {
273            debug!("Parsing NOT expression");
274            parse_not_expression(parser)
275        }
276
277        Token::Star => {
278            // Handle * as a literal (like in COUNT(*))
279            trace!("Star token as literal");
280            ExpressionParser::advance(parser);
281            Ok(SqlExpression::StringLiteral("*".to_string()))
282        }
283
284        // Handle window-related keywords that can also be column names
285        Token::Row => {
286            trace!("ROW token treated as identifier in expression context");
287            ExpressionParser::advance(parser);
288            Ok(SqlExpression::Column(ColumnRef::unquoted(
289                "row".to_string(),
290            )))
291        }
292
293        Token::Rows => {
294            trace!("ROWS token treated as identifier in expression context");
295            ExpressionParser::advance(parser);
296            Ok(SqlExpression::Column(ColumnRef::unquoted(
297                "rows".to_string(),
298            )))
299        }
300
301        Token::Range => {
302            trace!("RANGE token treated as identifier in expression context");
303            ExpressionParser::advance(parser);
304            Ok(SqlExpression::Column(ColumnRef::unquoted(
305                "range".to_string(),
306            )))
307        }
308
309        Token::Minus => {
310            // Unary minus: -expr is parsed as 0 - expr
311            debug!("Parsing unary minus expression");
312            ExpressionParser::advance(parser);
313            let operand = parse_primary(parser, ctx)?;
314            Ok(SqlExpression::BinaryOp {
315                left: Box::new(SqlExpression::NumberLiteral("0".to_string())),
316                op: "-".to_string(),
317                right: Box::new(operand),
318            })
319        }
320
321        _ => {
322            let err = format!(
323                "Unexpected token in primary expression: {:?}",
324                ExpressionParser::current_token(parser)
325            );
326            debug!(error = %err);
327            Err(err)
328        }
329    };
330
331    trace_parse_exit("parse_primary", &result);
332    result
333}
334
335/// Parse DateTime constructor
336fn parse_datetime_constructor<P>(parser: &mut P) -> Result<SqlExpression, String>
337where
338    P: ParsePrimary + ExpressionParser + ?Sized,
339{
340    ExpressionParser::advance(parser); // consume DateTime
341    ExpressionParser::consume(parser, Token::LeftParen)?;
342
343    // Check if empty parentheses for DateTime() - today's date
344    if matches!(ExpressionParser::current_token(parser), Token::RightParen) {
345        ExpressionParser::advance(parser); // consume )
346        debug!("DateTime() - today's date");
347        return Ok(SqlExpression::DateTimeToday {
348            hour: None,
349            minute: None,
350            second: None,
351        });
352    }
353
354    // Parse year
355    let year = if let Token::NumberLiteral(n) = ExpressionParser::current_token(parser) {
356        n.parse::<i32>().map_err(|_| "Invalid year")?
357    } else {
358        return Err("Expected year in DateTime constructor".to_string());
359    };
360    ExpressionParser::advance(parser);
361    ExpressionParser::consume(parser, Token::Comma)?;
362
363    // Parse month
364    let month = if let Token::NumberLiteral(n) = ExpressionParser::current_token(parser) {
365        n.parse::<u32>().map_err(|_| "Invalid month")?
366    } else {
367        return Err("Expected month in DateTime constructor".to_string());
368    };
369    ExpressionParser::advance(parser);
370    ExpressionParser::consume(parser, Token::Comma)?;
371
372    // Parse day
373    let day = if let Token::NumberLiteral(n) = ExpressionParser::current_token(parser) {
374        n.parse::<u32>().map_err(|_| "Invalid day")?
375    } else {
376        return Err("Expected day in DateTime constructor".to_string());
377    };
378    ExpressionParser::advance(parser);
379
380    // Check for optional time components
381    let mut hour = None;
382    let mut minute = None;
383    let mut second = None;
384
385    if matches!(ExpressionParser::current_token(parser), Token::Comma) {
386        ExpressionParser::advance(parser); // consume comma
387
388        // Parse hour
389        if let Token::NumberLiteral(n) = ExpressionParser::current_token(parser) {
390            hour = Some(n.parse::<u32>().map_err(|_| "Invalid hour")?);
391            ExpressionParser::advance(parser);
392
393            // Check for minute
394            if matches!(ExpressionParser::current_token(parser), Token::Comma) {
395                ExpressionParser::advance(parser); // consume comma
396
397                if let Token::NumberLiteral(n) = ExpressionParser::current_token(parser) {
398                    minute = Some(n.parse::<u32>().map_err(|_| "Invalid minute")?);
399                    ExpressionParser::advance(parser);
400
401                    // Check for second
402                    if matches!(ExpressionParser::current_token(parser), Token::Comma) {
403                        ExpressionParser::advance(parser); // consume comma
404
405                        if let Token::NumberLiteral(n) = ExpressionParser::current_token(parser) {
406                            second = Some(n.parse::<u32>().map_err(|_| "Invalid second")?);
407                            ExpressionParser::advance(parser);
408                        }
409                    }
410                }
411            }
412        }
413    }
414
415    ExpressionParser::consume(parser, Token::RightParen)?;
416
417    debug!(year = year, month = month, day = day, hour = ?hour, minute = ?minute, second = ?second, "DateTime constructor parsed");
418
419    Ok(SqlExpression::DateTimeConstructor {
420        year,
421        month,
422        day,
423        hour,
424        minute,
425        second,
426    })
427}
428
429/// Parse NOT expression
430fn parse_not_expression<P>(parser: &mut P) -> Result<SqlExpression, String>
431where
432    P: ParsePrimary + ExpressionParser + ?Sized,
433{
434    ExpressionParser::advance(parser); // consume NOT
435
436    // Check if this is a NOT IN expression
437    if let Ok(inner_expr) = parser.parse_comparison() {
438        // After parsing the inner expression, check if we're followed by IN
439        if matches!(ExpressionParser::current_token(parser), Token::In) {
440            debug!("NOT IN expression detected");
441            ExpressionParser::advance(parser); // consume IN
442            ExpressionParser::consume(parser, Token::LeftParen)?;
443            let values = parser.parse_expression_list()?;
444            ExpressionParser::consume(parser, Token::RightParen)?;
445
446            Ok(SqlExpression::NotInList {
447                expr: Box::new(inner_expr),
448                values,
449            })
450        } else {
451            // Regular NOT expression
452            debug!("Regular NOT expression");
453            Ok(SqlExpression::Not {
454                expr: Box::new(inner_expr),
455            })
456        }
457    } else {
458        Err("Expected expression after NOT".to_string())
459    }
460}
461
462/// Parse UNNEST expression
463/// Syntax: UNNEST(column_expr, 'delimiter')
464fn parse_unnest<P>(parser: &mut P) -> Result<SqlExpression, String>
465where
466    P: ParsePrimary + ExpressionParser + ?Sized,
467{
468    debug!("parse_unnest: starting");
469    ExpressionParser::advance(parser); // consume UNNEST
470    ExpressionParser::consume(parser, Token::LeftParen)?;
471
472    // Parse the column expression (first argument)
473    let column = parser.parse_logical_or()?;
474    debug!("parse_unnest: parsed column expression");
475
476    // Expect comma
477    ExpressionParser::consume(parser, Token::Comma)?;
478
479    // Parse the delimiter (second argument - must be a string literal)
480    let delimiter = match ExpressionParser::current_token(parser) {
481        Token::StringLiteral(s) => {
482            let delim = s.clone();
483            ExpressionParser::advance(parser);
484            delim
485        }
486        _ => {
487            return Err("UNNEST delimiter must be a string literal".to_string());
488        }
489    };
490
491    debug!(delimiter = %delimiter, "parse_unnest: parsed delimiter");
492
493    ExpressionParser::consume(parser, Token::RightParen)?;
494
495    debug!("parse_unnest: complete");
496    Ok(SqlExpression::Unnest {
497        column: Box::new(column),
498        delimiter,
499    })
500}
501
502/// Trait that parsers must implement to use primary expression parsing
503pub trait ParsePrimary {
504    fn current_token(&self) -> &Token;
505    fn advance(&mut self);
506    fn consume(&mut self, expected: Token) -> Result<(), String>;
507
508    // These methods are called from parse_primary
509    fn parse_case_expression(&mut self) -> Result<SqlExpression, String>;
510    fn parse_function_args(&mut self) -> Result<(Vec<SqlExpression>, bool), String>;
511    fn parse_window_spec(&mut self) -> Result<WindowSpec, String>;
512    fn parse_logical_or(&mut self) -> Result<SqlExpression, String>;
513    fn parse_comparison(&mut self) -> Result<SqlExpression, String>;
514    fn parse_expression_list(&mut self) -> Result<Vec<SqlExpression>, String>;
515
516    // For subquery parsing (without parenthesis balance validation)
517    fn parse_subquery(&mut self) -> Result<crate::sql::parser::ast::SelectStatement, String>;
518}