animalese 0.2.0

//! Animalese sound generator
//!
//! Recreates the Animal Crossing "animalese" speech effect by playing phonetic
//! sound sprites with pitch variation and intonation.
//!
//! ## Features
//!
//! - **8 voice types**: Female (f1-f4) and male (m1-m4) voices
//! - **Pitch control**: Shift pitch and add random variation for natural sound
//! - **Intonation**: Apply pitch glides for questions, statements, and excitement
//! - **Sound effects**: Built-in SFX for keyboard interactions
//! - **Bundled assets**: Audio files included in the crate
//!
//! ## Quick Start
//!
//! ```no_run
//! use animalese::Animalese;
//!
//! let engine = Animalese::new()?;
//! engine.speak("hello world")?;
//!
//! // Questions with rising intonation
//! engine.speak_question("What's that?")?;
//!
//! // Excited speech
//! engine.speak_excited("Amazing!")?;
//! # Ok::<(), Box<dyn std::error::Error>>(())
//! ```

use kira::{
    manager::{AudioManager, AudioManagerSettings, backend::DefaultBackend},
    sound::static_sound::{StaticSoundData, StaticSoundHandle},
    tween::Tween,
    Volume,
};
use std::path::{Path, PathBuf};
use std::sync::{Arc, Mutex};
use std::time::Duration;
use rand::Rng;

/// Returns the path to bundled voice assets
///
/// Most users don't need this - just use `Animalese::new()`.
/// Only useful if you need to know where the bundled assets are located.
pub fn bundled_assets_path() -> PathBuf {
    PathBuf::from(env!("CARGO_MANIFEST_DIR"))
        .join("assets")
        .join("audio")
        .join("voice")
}

/// Voice types available
#[derive(Debug, Clone, Copy, PartialEq, Eq)]
pub enum VoiceType {
    F1, F2, F3, F4,
    M1, M2, M3, M4,
}

impl VoiceType {
    fn filename(&self) -> &'static str {
        match self {
            VoiceType::F1 => "f1.ogg",
            VoiceType::F2 => "f2.ogg",
            VoiceType::F3 => "f3.ogg",
            VoiceType::F4 => "f4.ogg",
            VoiceType::M1 => "m1.ogg",
            VoiceType::M2 => "m2.ogg",
            VoiceType::M3 => "m3.ogg",
            VoiceType::M4 => "m4.ogg",
        }
    }
}

/// Voice profile configuration
#[derive(Debug, Clone)]
pub struct VoiceProfile {
    pub voice_type: VoiceType,
    pub pitch_shift: f32,      // Fixed pitch shift in semitones
    pub pitch_variation: f32,  // Random variation range in semitones
    pub volume: f32,           // Volume multiplier (0.0 to 1.0)
    pub intonation: f32,       // Pitch glide over sentence: -1.0 (falling) to 1.0 (rising)
}

impl Default for VoiceProfile {
    fn default() -> Self {
        Self {
            voice_type: VoiceType::F1,
            pitch_shift: 0.0,
            pitch_variation: 0.8,
            volume: 0.65,
            intonation: 0.0,
        }
    }
}

/// Maps letters to their sprite positions in the audio file
/// Each letter gets 200ms starting at letter_index * 200ms
fn letter_to_sprite_time(c: char) -> Option<Duration> {
    let c = c.to_ascii_lowercase();
    if !c.is_ascii_lowercase() {
        return None;
    }

    let index = (c as u32 - 'a' as u32) as u64;
    Some(Duration::from_millis(index * 200))
}

/// Special sprite times for non-letter sounds
fn special_to_sprite_time(name: &str) -> Option<Duration> {
    match name {
        "ok" => Some(Duration::from_millis(5200)),
        "gwah" => Some(Duration::from_millis(5800)),
        "deska" => Some(Duration::from_millis(6400)),
        _ => None,
    }
}

/// SFX sprite times (600ms each)
fn sfx_to_sprite_time(name: &str) -> Option<Duration> {
    let index = match name {
        "backspace" => 0,
        "enter" => 1,
        "tab" => 2,
        "question" => 3,
        "exclamation" => 4,
        "at" => 5,
        "pound" => 6,
        "dollar" => 7,
        "caret" => 8,
        "ampersand" => 9,
        "asterisk" => 10,
        "parenthesis_open" => 11,
        "parenthesis_closed" => 12,
        "bracket_open" => 13,
        "bracket_closed" => 14,
        "brace_open" => 15,
        "brace_closed" => 16,
        "tilde" => 17,
        "default" => 18,
        "arrow_left" => 19,
        "arrow_up" => 20,
        "arrow_right" => 21,
        "arrow_down" => 22,
        "slash_forward" => 23,
        "slash_back" => 24,
        "percent" => 25,
        _ => return None,
    };
    Some(Duration::from_millis(index * 600))
}

/// Calculate playback rate from pitch shift in semitones
/// rate = 2^(semitones / 12)
fn semitones_to_rate(semitones: f32) -> f32 {
    2.0_f32.powf(semitones / 12.0)
}

/// Animalese sound engine with kira-based playback
pub struct Animalese {
    manager: Arc<Mutex<AudioManager>>,
    voice_path: String,
    sfx_path: String,
    profile: Arc<Mutex<VoiceProfile>>,
    active_sounds: Arc<Mutex<Vec<StaticSoundHandle>>>,
}

impl Animalese {
    /// Create a new Animalese engine with bundled assets
    ///
    /// # Example
    /// ```no_run
    /// use animalese::Animalese;
    ///
    /// let engine = Animalese::new().unwrap();
    /// engine.speak("hello world").unwrap();
    /// ```
    pub fn new() -> Result<Self, Box<dyn std::error::Error>> {
        Self::with_custom_assets(bundled_assets_path().to_string_lossy().to_string())
    }

    /// Create an Animalese engine with custom audio assets
    ///
    /// Only use this if you have custom audio files that match the expected
    /// format (sprite sheets with 200ms letter sounds, etc).
    ///
    /// # Arguments
    /// * `assets_path` - Path to your custom assets/audio/voice directory
    ///
    /// # Example
    /// ```no_run
    /// use animalese::Animalese;
    ///
    /// let engine = Animalese::with_custom_assets("./my_assets/voice").unwrap();
    /// ```
    pub fn with_custom_assets(assets_path: impl Into<String>) -> Result<Self, Box<dyn std::error::Error>> {
        let voice_path = assets_path.into();

        // SFX file is in parent directory of voice
        let sfx_path = Path::new(&voice_path)
            .parent()
            .ok_or("Invalid assets path")?
            .join("sfx.ogg")
            .to_string_lossy()
            .to_string();

        // Initialize kira audio manager
        let manager = AudioManager::<DefaultBackend>::new(AudioManagerSettings::default())?;

        let profile = Arc::new(Mutex::new(VoiceProfile::default()));
        let active_sounds = Arc::new(Mutex::new(Vec::new()));

        Ok(Self {
            manager: Arc::new(Mutex::new(manager)),
            voice_path,
            sfx_path,
            profile,
            active_sounds,
        })
    }

    /// Set the voice profile
    pub fn set_profile(&mut self, new_profile: VoiceProfile) {
        if let Ok(mut profile) = self.profile.lock() {
            *profile = new_profile;
        }
    }

    /// Get a copy of the current voice profile
    pub fn profile(&self) -> VoiceProfile {
        self.profile.lock().unwrap().clone()
    }

    /// Play a letter sound with the current voice profile
    pub fn play_letter(&self, c: char) -> Result<(), Box<dyn std::error::Error>> {
        self.play_letter_with_duration(c, None)
    }

    /// Play a letter sound with optional max duration (for fast typing)
    pub fn play_letter_with_duration(&self, c: char, max_duration: Option<Duration>) -> Result<(), Box<dyn std::error::Error>> {
        self.play_letter_with_options(c, max_duration, 0.0)
    }

    /// Play a letter sound with optional duration and intonation adjustment
    fn play_letter_with_options(&self, c: char, max_duration: Option<Duration>, intonation_shift: f32) -> Result<(), Box<dyn std::error::Error>> {
        let sprite_time = letter_to_sprite_time(c)
            .ok_or("Not a valid letter")?;

        self.play_sprite(&self.voice_path, sprite_time, Duration::from_millis(200), true, max_duration, intonation_shift)
    }

    /// Play a special sound (ok, gwah, deska)
    pub fn play_special(&self, name: &str) -> Result<(), Box<dyn std::error::Error>> {
        let sprite_time = special_to_sprite_time(name)
            .ok_or("Unknown special sound")?;

        self.play_sprite(&self.voice_path, sprite_time, Duration::from_millis(600), true, None, 0.0)
    }

    /// Play a sound effect (enter, backspace, etc)
    pub fn play_sfx(&self, name: &str) -> Result<(), Box<dyn std::error::Error>> {
        let sprite_time = sfx_to_sprite_time(name)
            .ok_or("Unknown SFX sound")?;

        self.play_sprite(&self.sfx_path, sprite_time, Duration::from_millis(600), false, None, 0.0)
    }

    /// Play text as animalese speech with intonation
    pub fn speak(&self, text: &str) -> Result<(), Box<dyn std::error::Error>> {
        let profile = self.profile.lock().unwrap();
        let base_intonation = profile.intonation;
        drop(profile);

        // Check if text ends with question mark for automatic rising intonation
        let has_question = text.trim_end().ends_with('?');
        let intonation = if has_question && base_intonation == 0.0 {
            0.5 // Apply gentle rising intonation for questions
        } else {
            base_intonation
        };

        // Count letters for position calculation
        let letters: Vec<char> = text.chars().filter(|c| c.is_ascii_alphabetic()).collect();
        let total_letters = letters.len() as f32;

        if total_letters == 0.0 {
            return Ok(());
        }

        let mut letter_index = 0.0;
        for c in text.chars() {
            if c.is_ascii_alphabetic() {
                // Calculate position (0.0 to 1.0) in the sentence
                let position = letter_index / total_letters;

                // Apply intonation curve
                // Positive intonation = rising (pitch increases)
                // Negative intonation = falling (pitch decreases)
                let intonation_shift = intonation * position * 3.0; // Scale to ~3 semitones max

                self.play_letter_with_options(c, None, intonation_shift)?;
                letter_index += 1.0;

                // Small delay between letters to simulate speech cadence
                std::thread::sleep(Duration::from_millis(50));
            }
        }
        Ok(())
    }

    /// Speak text with rising intonation (for questions)
    ///
    /// Automatically applies a rising pitch contour, perfect for questions
    /// or uncertain statements.
    ///
    /// # Example
    /// ```no_run
    /// use animalese::Animalese;
    ///
    /// let engine = Animalese::new().unwrap();
    /// engine.speak_question("What's that").unwrap();
    /// ```
    pub fn speak_question(&self, text: &str) -> Result<(), Box<dyn std::error::Error>> {
        // Temporarily set intonation to rising
        let original_intonation = {
            let mut profile = self.profile.lock().unwrap();
            let original = profile.intonation;
            profile.intonation = 0.6; // Moderate rising intonation
            original
        };

        let result = self.speak(text);

        // Restore original intonation
        if let Ok(mut profile) = self.profile.lock() {
            profile.intonation = original_intonation;
        }

        result
    }

    /// Speak text with excitement (higher pitch, rising intonation)
    ///
    /// Applies higher pitch and rising intonation for excited or enthusiastic
    /// speech. Great for exclamations!
    ///
    /// # Example
    /// ```no_run
    /// use animalese::Animalese;
    ///
    /// let engine = Animalese::new().unwrap();
    /// engine.speak_excited("Amazing!").unwrap();
    /// ```
    pub fn speak_excited(&self, text: &str) -> Result<(), Box<dyn std::error::Error>> {
        // Temporarily boost pitch and add rising intonation
        let (original_pitch, original_intonation) = {
            let mut profile = self.profile.lock().unwrap();
            let orig_pitch = profile.pitch_shift;
            let orig_intonation = profile.intonation;
            profile.pitch_shift += 2.0; // Raise pitch by 2 semitones
            profile.intonation = 0.4; // Gentle rising intonation
            (orig_pitch, orig_intonation)
        };

        let result = self.speak(text);

        // Restore original settings
        if let Ok(mut profile) = self.profile.lock() {
            profile.pitch_shift = original_pitch;
            profile.intonation = original_intonation;
        }

        result
    }

    /// Speak text with falling intonation (for statements)
    ///
    /// Applies a gentle falling pitch contour, typical of declarative
    /// statements and confident assertions.
    ///
    /// # Example
    /// ```no_run
    /// use animalese::Animalese;
    ///
    /// let engine = Animalese::new().unwrap();
    /// engine.speak_statement("I see").unwrap();
    /// ```
    pub fn speak_statement(&self, text: &str) -> Result<(), Box<dyn std::error::Error>> {
        // Temporarily set intonation to falling
        let original_intonation = {
            let mut profile = self.profile.lock().unwrap();
            let original = profile.intonation;
            profile.intonation = -0.3; // Gentle falling intonation
            original
        };

        let result = self.speak(text);

        // Restore original intonation
        if let Ok(mut profile) = self.profile.lock() {
            profile.intonation = original_intonation;
        }

        result
    }

    /// Internal method to play a sprite with kira
    fn play_sprite(&self, audio_path: &str, start: Duration, duration: Duration, apply_pitch: bool, max_duration: Option<Duration>, intonation_shift: f32) -> Result<(), Box<dyn std::error::Error>> {
        // Determine the full file path
        let file_path = if audio_path.ends_with(".ogg") {
            // It's already a full path to sfx.ogg
            audio_path.to_string()
        } else {
            // It's the voice directory, append the voice filename
            let profile = self.profile.lock().unwrap();
            let filename = profile.voice_type.filename();
            Path::new(audio_path).join(filename)
                .to_string_lossy()
                .to_string()
        };

        // Calculate parameters
        let actual_duration = max_duration.unwrap_or(duration);

        // Load sound data and slice to extract only the sprite region
        let start_time = start.as_secs_f64();
        let end_time = start_time + actual_duration.as_secs_f64();
        let mut sound_data = StaticSoundData::from_file(&file_path)?
            .slice(start_time..end_time);

        if apply_pitch {
            let profile = self.profile.lock().unwrap();
            let mut rng = rand::thread_rng();
            let random_variation = rng.gen_range(-1.0..=1.0) * profile.pitch_variation;
            let final_pitch = profile.pitch_shift + random_variation + intonation_shift;
            let playback_rate = semitones_to_rate(final_pitch);
            let volume = profile.volume;

            // Configure sound with pitch and volume
            sound_data = sound_data
                .playback_rate(playback_rate as f64)
                .volume(Volume::Amplitude(volume as f64))
                .fade_in_tween(Tween {
                    duration: std::time::Duration::from_millis(5),
                    ..Default::default()
                });
        } else {
            let profile = self.profile.lock().unwrap();
            let volume = profile.volume;

            sound_data = sound_data
                .volume(Volume::Amplitude(volume as f64))
                .fade_in_tween(Tween {
                    duration: std::time::Duration::from_millis(5),
                    ..Default::default()
                });
        }

        // Play the sound
        let mut manager = self.manager.lock().unwrap();
        let handle = manager.play(sound_data)?;

        // Store handle to keep it alive
        let mut active = self.active_sounds.lock().unwrap();
        active.push(handle);

        // Clean up finished sounds
        active.retain(|h| h.state() != kira::sound::PlaybackState::Stopped);

        Ok(())
    }

    /// Stop all currently playing sounds
    pub fn stop(&self) {
        let mut active = self.active_sounds.lock().unwrap();
        for handle in active.iter_mut() {
            let _ = handle.stop(Tween::default());
        }
        active.clear();
    }
}

#[cfg(test)]
mod tests {
    use super::*;
    use std::time::Duration;

    #[test]
    fn test_letter_to_sprite_time() {
        assert_eq!(letter_to_sprite_time('a'), Some(Duration::from_millis(0)));
        assert_eq!(letter_to_sprite_time('b'), Some(Duration::from_millis(200)));
        assert_eq!(letter_to_sprite_time('z'), Some(Duration::from_millis(5000)));
        assert_eq!(letter_to_sprite_time('A'), Some(Duration::from_millis(0)));
        assert_eq!(letter_to_sprite_time('1'), None);
    }

    #[test]
    fn test_semitones_to_rate() {
        assert!((semitones_to_rate(0.0) - 1.0).abs() < 0.001);
        assert!((semitones_to_rate(12.0) - 2.0).abs() < 0.001);
        assert!((semitones_to_rate(-12.0) - 0.5).abs() < 0.001);
    }

    #[test]
    fn test_special_sounds() {
        assert_eq!(special_to_sprite_time("ok"), Some(Duration::from_millis(5200)));
        assert_eq!(special_to_sprite_time("gwah"), Some(Duration::from_millis(5800)));
        assert_eq!(special_to_sprite_time("deska"), Some(Duration::from_millis(6400)));
        assert_eq!(special_to_sprite_time("unknown"), None);
    }

    #[test]
    fn test_voice_profile_default() {
        let profile = VoiceProfile::default();
        assert_eq!(profile.voice_type, VoiceType::F1);
        assert_eq!(profile.pitch_shift, 0.0);
        assert_eq!(profile.pitch_variation, 0.8);
        assert_eq!(profile.volume, 0.65);
        assert_eq!(profile.intonation, 0.0);
    }

    #[test]
    fn test_intonation_values() {
        let mut profile = VoiceProfile::default();

        // Test setting various intonation values
        profile.intonation = 0.5;
        assert_eq!(profile.intonation, 0.5);

        profile.intonation = -0.5;
        assert_eq!(profile.intonation, -0.5);

        profile.intonation = 1.0;
        assert_eq!(profile.intonation, 1.0);

        profile.intonation = -1.0;
        assert_eq!(profile.intonation, -1.0);
    }
}