reifydb-type 0.4.12

Core type system and value representations for ReifyDB
Documentation
// SPDX-License-Identifier: Apache-2.0
// Copyright (c) 2025 ReifyDB

use std::borrow::Cow;

use num_bigint::BigInt;

use crate::{
	error::{Error, TypeError},
	fragment::Fragment,
	value::{int::Int, r#type::Type},
};

pub fn parse_int(fragment: Fragment) -> Result<Int, Error> {
	// Fragment is already owned, no conversion needed
	let raw_value = fragment.text();

	// Fast path: check if we need any string processing
	let needs_trimming = raw_value.as_bytes().first().is_some_and(|&b| b.is_ascii_whitespace())
		|| raw_value.as_bytes().last().is_some_and(|&b| b.is_ascii_whitespace());
	let has_underscores = raw_value.as_bytes().contains(&b'_');

	let value = match (needs_trimming, has_underscores) {
		(false, false) => Cow::Borrowed(raw_value), // Fast path -
		// no processing
		// needed
		(true, false) => Cow::Borrowed(raw_value.trim()),
		(false, true) => Cow::Owned(raw_value.replace('_', "")),
		(true, true) => Cow::Owned(raw_value.trim().replace('_', "")),
	};

	if value.is_empty() {
		return Err(TypeError::InvalidNumberFormat {
			target: Type::Int,
			fragment,
		}
		.into());
	}

	// Try parsing as BigInt first
	match value.parse::<BigInt>() {
		Ok(v) => Ok(Int::from(v)),
		Err(_) => {
			// If BigInt parsing fails, try parsing as f64 for
			// scientific notation and truncation
			if let Ok(f) = value.parse::<f64>() {
				if f.is_infinite() {
					Err(TypeError::NumberOutOfRange {
						target: Type::Int,
						fragment,
						descriptor: None,
					}
					.into())
				} else {
					let truncated = f.trunc();
					// Convert the truncated float to BigInt
					if let Ok(bigint) = format!("{:.0}", truncated).parse::<BigInt>() {
						Ok(Int::from(bigint))
					} else {
						Err(TypeError::InvalidNumberFormat {
							target: Type::Int,
							fragment,
						}
						.into())
					}
				}
			} else {
				Err(TypeError::InvalidNumberFormat {
					target: Type::Int,
					fragment,
				}
				.into())
			}
		}
	}
}

#[cfg(test)]
pub mod tests {
	use super::*;

	#[test]
	fn test_parse_int_valid_zero() {
		assert_eq!(parse_int(Fragment::testing("0")).unwrap(), Int::zero());
	}

	#[test]
	fn test_parse_int_valid_positive() {
		let result = parse_int(Fragment::testing("12345")).unwrap();
		assert_eq!(format!("{}", result), "12345");
	}

	#[test]
	fn test_parse_int_valid_negative() {
		let result = parse_int(Fragment::testing("-12345")).unwrap();
		assert_eq!(format!("{}", result), "-12345");
	}

	#[test]
	fn test_parse_int_large_positive() {
		let large_num = "123456789012345678901234567890";
		let result = parse_int(Fragment::testing(large_num)).unwrap();
		assert_eq!(format!("{}", result), large_num);
	}

	#[test]
	fn test_parse_int_large_negative() {
		let large_num = "-123456789012345678901234567890";
		let result = parse_int(Fragment::testing(large_num)).unwrap();
		assert_eq!(format!("{}", result), large_num);
	}

	#[test]
	fn test_parse_int_scientific_notation() {
		let result = parse_int(Fragment::testing("1e5")).unwrap();
		assert_eq!(format!("{}", result), "100000");
	}

	#[test]
	fn test_parse_int_scientific_negative() {
		let result = parse_int(Fragment::testing("-1.5e3")).unwrap();
		assert_eq!(format!("{}", result), "-1500");
	}

	#[test]
	fn test_parse_int_float_truncation() {
		let result = parse_int(Fragment::testing("123.789")).unwrap();
		assert_eq!(format!("{}", result), "123");
	}

	#[test]
	fn test_parse_int_float_truncation_negative() {
		let result = parse_int(Fragment::testing("-123.789")).unwrap();
		assert_eq!(format!("{}", result), "-123");
	}

	#[test]
	fn test_parse_int_with_underscores() {
		let result = parse_int(Fragment::testing("1_234_567")).unwrap();
		assert_eq!(format!("{}", result), "1234567");
	}

	#[test]
	fn test_parse_int_with_leading_space() {
		let result = parse_int(Fragment::testing(" 12345")).unwrap();
		assert_eq!(format!("{}", result), "12345");
	}

	#[test]
	fn test_parse_int_with_trailing_space() {
		let result = parse_int(Fragment::testing("12345 ")).unwrap();
		assert_eq!(format!("{}", result), "12345");
	}

	#[test]
	fn test_parse_int_with_both_spaces() {
		let result = parse_int(Fragment::testing(" -12345 ")).unwrap();
		assert_eq!(format!("{}", result), "-12345");
	}

	#[test]
	fn test_parse_int_invalid_empty() {
		assert!(parse_int(Fragment::testing("")).is_err());
	}

	#[test]
	fn test_parse_int_invalid_whitespace() {
		assert!(parse_int(Fragment::testing("   ")).is_err());
	}

	#[test]
	fn test_parse_int_invalid_text() {
		assert!(parse_int(Fragment::testing("abc")).is_err());
	}

	#[test]
	fn test_parse_int_invalid_multiple_dots() {
		assert!(parse_int(Fragment::testing("1.2.3")).is_err());
	}

	#[test]
	fn test_parse_int_infinity() {
		assert!(parse_int(Fragment::testing("inf")).is_err());
	}

	#[test]
	fn test_parse_int_negative_infinity() {
		assert!(parse_int(Fragment::testing("-inf")).is_err());
	}
}