aptu_core/ai/
provider.rs

1// SPDX-License-Identifier: Apache-2.0
2
3//! AI provider trait and shared implementations.
4//!
5//! Defines the `AiProvider` trait that all AI providers must implement,
6//! along with default implementations for shared logic like prompt building,
7//! request sending, and response parsing.
8
9use anyhow::{Context, Result};
10use async_trait::async_trait;
11use regex::Regex;
12use reqwest::Client;
13use secrecy::SecretString;
14use std::sync::LazyLock;
15use tracing::{debug, instrument};
16
17use super::AiResponse;
18use super::registry::PROVIDER_ANTHROPIC;
19use super::types::{
20    ChatCompletionRequest, ChatCompletionResponse, ChatMessage, IssueDetails, ResponseFormat,
21    TriageResponse,
22};
23use crate::history::AiStats;
24
25use super::prompts::{
26    build_create_system_prompt, build_pr_label_system_prompt, build_pr_review_system_prompt,
27    build_triage_system_prompt,
28};
29
30/// Maximum number of characters retained from an AI provider error response body.
31const MAX_ERROR_BODY_LENGTH: usize = 200;
32
33/// Redacts error body to prevent leaking sensitive API details.
34/// Truncates to [`MAX_ERROR_BODY_LENGTH`] characters and appends "[truncated]" if longer.
35fn redact_api_error_body(body: &str) -> String {
36    if body.chars().count() <= MAX_ERROR_BODY_LENGTH {
37        body.to_owned()
38    } else {
39        let truncated: String = body.chars().take(MAX_ERROR_BODY_LENGTH).collect();
40        format!("{truncated} [truncated]")
41    }
42}
43
44/// Parses JSON response from AI provider, detecting truncated responses.
45///
46/// If the JSON parsing fails with an EOF error (indicating the response was cut off),
47/// returns a `TruncatedResponse` error that can be retried. Other JSON errors are
48/// wrapped as `InvalidAIResponse`.
49///
50/// # Arguments
51///
52/// * `text` - The JSON text to parse
53/// * `provider` - The name of the AI provider (for error context)
54///
55/// # Returns
56///
57/// Parsed value of type T, or an error if parsing fails
58fn parse_ai_json<T: serde::de::DeserializeOwned>(text: &str, provider: &str) -> Result<T> {
59    match serde_json::from_str::<T>(text) {
60        Ok(value) => Ok(value),
61        Err(e) => {
62            // Check if this is an EOF error (truncated response)
63            if e.is_eof() {
64                Err(anyhow::anyhow!(
65                    crate::error::AptuError::TruncatedResponse {
66                        provider: provider.to_string(),
67                    }
68                ))
69            } else {
70                Err(anyhow::anyhow!(crate::error::AptuError::InvalidAIResponse(
71                    e
72                )))
73            }
74        }
75    }
76}
77
78/// Maximum length for issue body to stay within token limits.
79pub const MAX_BODY_LENGTH: usize = 4000;
80
81/// Maximum number of comments to include in the prompt.
82pub const MAX_COMMENTS: usize = 5;
83
84/// Maximum number of files to include in PR review prompt.
85pub const MAX_FILES: usize = 20;
86
87/// Maximum total diff size (in characters) for PR review prompt.
88pub const MAX_TOTAL_DIFF_SIZE: usize = 50_000;
89
90/// Maximum number of labels to include in the prompt.
91pub const MAX_LABELS: usize = 30;
92
93/// Maximum number of milestones to include in the prompt.
94pub const MAX_MILESTONES: usize = 10;
95
96/// Maximum characters per file's full content included in the PR review prompt.
97/// Content pre-truncated by `fetch_file_contents` may already be within this limit,
98/// but the prompt builder applies it as a second safety cap.
99pub const MAX_FULL_CONTENT_CHARS: usize = 4_000;
100
101/// Estimated overhead for XML tags, section headers, and schema preamble added by
102/// `build_pr_review_user_prompt`. Used to ensure the prompt budget accounts for
103/// non-content characters when estimating total prompt size.
104const PROMPT_OVERHEAD_CHARS: usize = 1_000;
105
106/// Preamble appended to every user-turn prompt to request a JSON response matching the schema.
107const SCHEMA_PREAMBLE: &str = "\n\nRespond with valid JSON matching this schema:\n";
108
109/// Matches structural XML delimiter tags (case-insensitive) used as prompt delimiters.
110/// These must be stripped from user-controlled fields to prevent prompt injection.
111///
112/// Covers: `pull_request`, `issue_content`, `issue_body`, `pr_diff`, `commit_message`, `pr_comment`, `file_content`.
113///
114/// The pattern uses a simple alternation with no quantifiers, so `ReDoS` is not a concern:
115/// regex engine complexity is O(n) in the input length regardless of content.
116static XML_DELIMITERS: LazyLock<Regex> = LazyLock::new(|| {
117    Regex::new(
118        r"(?i)</?(?:pull_request|issue_content|issue_body|pr_diff|commit_message|pr_comment|file_content)>",
119    )
120    .expect("valid regex")
121});
122
123/// Removes `<pull_request>` / `</pull_request>` and `<issue_content>` / `</issue_content>`
124/// XML delimiter tags from a user-supplied string, preventing prompt injection via XML tag
125/// smuggling.
126///
127/// Tags are removed entirely (replaced with empty string) rather than substituted with a
128/// placeholder. A visible placeholder such as `[sanitized]` could cause the LLM to reason
129/// about the substitution marker itself, which is unnecessary and potentially confusing.
130///
131/// Nested or malformed XML is not a concern: the only delimiters this code inserts into
132/// prompts are the exact strings `<pull_request>` / `</pull_request>` and
133/// `<issue_content>` / `</issue_content>` (no attributes, no nesting). Stripping those
134/// fixed forms is sufficient to prevent a user-supplied value from breaking out of the
135/// delimiter boundary.
136///
137/// Applied to all user-controlled fields inside prompt delimiter blocks:
138/// - Issue triage: `issue.title`, `issue.body`, comment author/body, related issue
139///   title/state, label name/description, milestone title/description.
140/// - PR review: `pr.title`, `pr.body`, `file.filename`, `file.status`, patch content.
141fn sanitize_prompt_field(s: &str) -> String {
142    XML_DELIMITERS.replace_all(s, "").into_owned()
143}
144
145/// AI provider trait for issue triage and creation.
146///
147/// Defines the interface that all AI providers must implement.
148/// Default implementations are provided for shared logic.
149#[async_trait]
150pub trait AiProvider: Send + Sync {
151    /// Returns the name of the provider (e.g., "gemini", "openrouter").
152    fn name(&self) -> &str;
153
154    /// Returns the API URL for this provider.
155    fn api_url(&self) -> &str;
156
157    /// Returns the environment variable name for the API key.
158    fn api_key_env(&self) -> &str;
159
160    /// Returns the HTTP client for making requests.
161    fn http_client(&self) -> &Client;
162
163    /// Returns the API key for authentication.
164    fn api_key(&self) -> &SecretString;
165
166    /// Returns the model name.
167    fn model(&self) -> &str;
168
169    /// Returns the maximum tokens for API responses.
170    fn max_tokens(&self) -> u32;
171
172    /// Returns the temperature for API requests.
173    fn temperature(&self) -> f32;
174
175    /// Returns whether this provider is Anthropic-compatible and supports
176    /// `cache_control` on message blocks.
177    ///
178    /// Default implementation checks `self.name() == "anthropic"`. Providers
179    /// that route through a different name but support Anthropic prompt caching
180    /// can override this method.
181    fn is_anthropic(&self) -> bool {
182        self.name() == PROVIDER_ANTHROPIC
183    }
184
185    /// Returns the maximum retry attempts for rate-limited requests.
186    ///
187    /// Default implementation returns 3. Providers can override
188    /// to use a different retry limit.
189    fn max_attempts(&self) -> u32 {
190        3
191    }
192
193    /// Returns the circuit breaker for this provider (optional).
194    ///
195    /// Default implementation returns None. Providers can override
196    /// to provide circuit breaker functionality.
197    fn circuit_breaker(&self) -> Option<&super::CircuitBreaker> {
198        None
199    }
200
201    /// Builds HTTP headers for API requests.
202    ///
203    /// Default implementation includes Authorization and Content-Type headers.
204    /// Providers can override to add custom headers.
205    fn build_headers(&self) -> reqwest::header::HeaderMap {
206        let mut headers = reqwest::header::HeaderMap::new();
207        if let Ok(val) = "application/json".parse() {
208            headers.insert("Content-Type", val);
209        }
210        headers
211    }
212
213    /// Validates the model configuration.
214    ///
215    /// Default implementation does nothing. Providers can override
216    /// to enforce constraints (e.g., free tier validation).
217    fn validate_model(&self) -> Result<()> {
218        Ok(())
219    }
220
221    /// Returns the custom guidance string for system prompt injection, if set.
222    ///
223    /// Default implementation returns `None`. Providers that store custom guidance
224    /// (e.g., from `AiConfig`) override this to supply it.
225    fn custom_guidance(&self) -> Option<&str> {
226        None
227    }
228
229    /// Sends a chat completion request to the provider's API (HTTP-only, no retry).
230    ///
231    /// Default implementation handles HTTP headers, error responses (401, 429).
232    /// Does not include retry logic - use `send_and_parse()` for retry behavior.
233    #[instrument(skip(self, request), fields(provider = self.name(), model = self.model()))]
234    async fn send_request_inner(
235        &self,
236        request: &ChatCompletionRequest,
237    ) -> Result<ChatCompletionResponse> {
238        use secrecy::ExposeSecret;
239        use tracing::warn;
240
241        use crate::error::AptuError;
242
243        let mut req = self.http_client().post(self.api_url());
244
245        // Add Authorization header (skip for Anthropic, which uses x-api-key)
246        if !self.is_anthropic() {
247            req = req.header(
248                "Authorization",
249                format!("Bearer {}", self.api_key().expose_secret()),
250            );
251        }
252
253        // Add custom headers from provider
254        for (key, value) in &self.build_headers() {
255            req = req.header(key.clone(), value.clone());
256        }
257
258        let response = req
259            .json(request)
260            .send()
261            .await
262            .context(format!("Failed to send request to {} API", self.name()))?;
263
264        // Check for HTTP errors
265        let status = response.status();
266        if !status.is_success() {
267            if status.as_u16() == 401 {
268                anyhow::bail!(
269                    "Invalid {} API key. Check your {} environment variable.",
270                    self.name(),
271                    self.api_key_env()
272                );
273            } else if status.as_u16() == 429 {
274                warn!("Rate limited by {} API", self.name());
275                // Parse Retry-After header (seconds), default to 0 if not present
276                let retry_after = response
277                    .headers()
278                    .get("Retry-After")
279                    .and_then(|h| h.to_str().ok())
280                    .and_then(|s| s.parse::<u64>().ok())
281                    .unwrap_or(0);
282                debug!(retry_after, "Parsed Retry-After header");
283                return Err(AptuError::RateLimited {
284                    provider: self.name().to_string(),
285                    retry_after,
286                }
287                .into());
288            }
289            let error_body = response.text().await.unwrap_or_default();
290            anyhow::bail!(
291                "{} API error (HTTP {}): {}",
292                self.name(),
293                status.as_u16(),
294                redact_api_error_body(&error_body)
295            );
296        }
297
298        // Parse response
299        let completion: ChatCompletionResponse = response
300            .json()
301            .await
302            .context(format!("Failed to parse {} API response", self.name()))?;
303
304        Ok(completion)
305    }
306
307    /// Sends a chat completion request and parses the response with retry logic.
308    ///
309    /// This method wraps both HTTP request and JSON parsing in a single retry loop,
310    /// allowing truncated responses to be retried. Includes circuit breaker handling.
311    ///
312    /// # Arguments
313    ///
314    /// * `request` - The chat completion request to send
315    ///
316    /// # Returns
317    ///
318    /// A tuple of (parsed response, stats) extracted from the API response
319    ///
320    /// # Errors
321    ///
322    /// Returns an error if:
323    /// - API request fails (network, timeout, rate limit)
324    /// - Response cannot be parsed as valid JSON (including truncated responses)
325    #[instrument(skip(self, request), fields(provider = self.name(), model = self.model()))]
326    async fn send_and_parse<T: serde::de::DeserializeOwned + Send>(
327        &self,
328        request: &ChatCompletionRequest,
329    ) -> Result<(T, AiStats)> {
330        use tracing::{info, warn};
331
332        use crate::error::AptuError;
333        use crate::retry::{extract_retry_after, is_retryable_anyhow};
334
335        // Check circuit breaker before attempting request
336        if let Some(cb) = self.circuit_breaker()
337            && cb.is_open()
338        {
339            return Err(AptuError::CircuitOpen.into());
340        }
341
342        // Start timing (outside retry loop to measure total time including retries)
343        let start = std::time::Instant::now();
344
345        // Custom retry loop that respects retry_after from RateLimited errors
346        let mut attempt: u32 = 0;
347        let max_attempts: u32 = self.max_attempts();
348
349        // Helper function to avoid closure-in-expression clippy warning
350        #[allow(clippy::items_after_statements)]
351        async fn try_request<T: serde::de::DeserializeOwned>(
352            provider: &(impl AiProvider + ?Sized),
353            request: &ChatCompletionRequest,
354        ) -> Result<(T, ChatCompletionResponse)> {
355            // Send HTTP request
356            let completion = provider.send_request_inner(request).await?;
357
358            // Extract message content
359            let content = completion
360                .choices
361                .first()
362                .and_then(|c| {
363                    c.message
364                        .content
365                        .clone()
366                        .or_else(|| c.message.reasoning.clone())
367                })
368                .context("No response from AI model")?;
369
370            debug!(response_length = content.len(), "Received AI response");
371
372            // Parse JSON response (inside retry loop, so truncated responses are retried)
373            let parsed: T = parse_ai_json(&content, provider.name())?;
374
375            Ok((parsed, completion))
376        }
377
378        let (parsed, completion): (T, ChatCompletionResponse) = loop {
379            attempt += 1;
380
381            let result = try_request(self, request).await;
382
383            match result {
384                Ok(success) => break success,
385                Err(err) => {
386                    // Check if error is retryable
387                    if !is_retryable_anyhow(&err) || attempt >= max_attempts {
388                        return Err(err);
389                    }
390
391                    // Extract retry_after if present, otherwise use exponential backoff
392                    let delay = if let Some(retry_after_duration) = extract_retry_after(&err) {
393                        debug!(
394                            retry_after_secs = retry_after_duration.as_secs(),
395                            "Using Retry-After value from rate limit error"
396                        );
397                        retry_after_duration
398                    } else {
399                        // Use exponential backoff with jitter: 1s, 2s, 4s + 0-500ms
400                        let backoff_secs = 2_u64.pow(attempt.saturating_sub(1));
401                        let jitter_ms = fastrand::u64(0..500);
402                        std::time::Duration::from_millis(backoff_secs * 1000 + jitter_ms)
403                    };
404
405                    let error_msg = err.to_string();
406                    warn!(
407                        error = %error_msg,
408                        delay_secs = delay.as_secs(),
409                        attempt,
410                        max_attempts,
411                        "Retrying after error"
412                    );
413
414                    // Drop err before await to avoid holding non-Send value across await
415                    drop(err);
416                    tokio::time::sleep(delay).await;
417                }
418            }
419        };
420
421        // Record success in circuit breaker
422        if let Some(cb) = self.circuit_breaker() {
423            cb.record_success();
424        }
425
426        // Calculate duration (total time including any retries)
427        #[allow(clippy::cast_possible_truncation)]
428        let duration_ms = start.elapsed().as_millis() as u64;
429
430        // Build AI stats from usage info (trust API's cost field)
431        let (input_tokens, output_tokens, cost_usd, cache_read_tokens, cache_write_tokens) =
432            if let Some(usage) = completion.usage {
433                (
434                    usage.prompt_tokens,
435                    usage.completion_tokens,
436                    usage.cost,
437                    usage.cache_read_tokens,
438                    usage.cache_write_tokens,
439                )
440            } else {
441                // If no usage info, default to 0
442                debug!("No usage information in API response");
443                (0, 0, None, 0, 0)
444            };
445
446        let ai_stats = AiStats {
447            provider: self.name().to_string(),
448            model: self.model().to_string(),
449            input_tokens,
450            output_tokens,
451            duration_ms,
452            cost_usd,
453            fallback_provider: None,
454            prompt_chars: 0,
455            cache_read_tokens,
456            cache_write_tokens,
457        };
458
459        // Emit structured metrics
460        info!(
461            duration_ms,
462            input_tokens,
463            output_tokens,
464            cache_read_tokens,
465            cache_write_tokens,
466            cost_usd = ?cost_usd,
467            model = %self.model(),
468            "AI request completed"
469        );
470
471        // Log cache hit/miss details
472        debug!(
473            cache_read_tokens = %cache_read_tokens,
474            cache_write_tokens = %cache_write_tokens,
475            "Cache token usage"
476        );
477
478        Ok((parsed, ai_stats))
479    }
480
481    /// Analyzes a GitHub issue using the provider's API.
482    ///
483    /// Returns a structured triage response with summary, labels, questions, duplicates, and usage stats.
484    ///
485    /// # Arguments
486    ///
487    /// * `issue` - Issue details to analyze
488    ///
489    /// # Errors
490    ///
491    /// Returns an error if:
492    /// - API request fails (network, timeout, rate limit)
493    /// - Response cannot be parsed as valid JSON
494    #[instrument(skip(self, issue), fields(issue_number = issue.number, repo = %format!("{}/{}", issue.owner, issue.repo)))]
495    async fn analyze_issue(&self, issue: &IssueDetails) -> Result<AiResponse> {
496        debug!(model = %self.model(), "Calling {} API", self.name());
497
498        // Build request
499        let system_content = if let Some(override_prompt) =
500            super::context::load_system_prompt_override("triage_system").await
501        {
502            override_prompt
503        } else {
504            Self::build_system_prompt(self.custom_guidance())
505        };
506
507        let mut messages = vec![
508            ChatMessage {
509                role: "system".to_string(),
510                content: Some(system_content),
511                reasoning: None,
512                cache_control: None,
513            },
514            ChatMessage {
515                role: "user".to_string(),
516                content: Some(Self::build_user_prompt(issue)),
517                reasoning: None,
518                cache_control: None,
519            },
520        ];
521
522        // Inject cache control on system message for Anthropic
523        if self.is_anthropic()
524            && let Some(msg) = messages.first_mut()
525        {
526            msg.cache_control = Some(super::types::CacheControl::ephemeral());
527        }
528
529        let request = ChatCompletionRequest {
530            model: self.model().to_string(),
531            messages,
532            response_format: Some(ResponseFormat {
533                format_type: "json_object".to_string(),
534                json_schema: None,
535            }),
536            max_tokens: Some(self.max_tokens()),
537            temperature: Some(self.temperature()),
538        };
539
540        // Send request and parse JSON with retry logic
541        let (triage, ai_stats) = self.send_and_parse::<TriageResponse>(&request).await?;
542
543        debug!(
544            input_tokens = ai_stats.input_tokens,
545            output_tokens = ai_stats.output_tokens,
546            duration_ms = ai_stats.duration_ms,
547            cost_usd = ?ai_stats.cost_usd,
548            "AI analysis complete"
549        );
550
551        Ok(AiResponse {
552            triage,
553            stats: ai_stats,
554        })
555    }
556
557    /// Creates a formatted GitHub issue using the provider's API.
558    ///
559    /// Takes raw issue title and body, formats them using AI (conventional commit style,
560    /// structured body), and returns the formatted content with suggested labels.
561    ///
562    /// # Arguments
563    ///
564    /// * `title` - Raw issue title from user
565    /// * `body` - Raw issue body/description from user
566    /// * `repo` - Repository name for context (owner/repo format)
567    ///
568    /// # Errors
569    ///
570    /// Returns an error if:
571    /// - API request fails (network, timeout, rate limit)
572    /// - Response cannot be parsed as valid JSON
573    #[instrument(skip(self), fields(repo = %repo))]
574    async fn create_issue(
575        &self,
576        title: &str,
577        body: &str,
578        repo: &str,
579    ) -> Result<(super::types::CreateIssueResponse, AiStats)> {
580        debug!(model = %self.model(), "Calling {} API for issue creation", self.name());
581
582        // Build request
583        let system_content = if let Some(override_prompt) =
584            super::context::load_system_prompt_override("create_system").await
585        {
586            override_prompt
587        } else {
588            Self::build_create_system_prompt(self.custom_guidance())
589        };
590
591        let mut messages = vec![
592            ChatMessage {
593                role: "system".to_string(),
594                content: Some(system_content),
595                reasoning: None,
596                cache_control: None,
597            },
598            ChatMessage {
599                role: "user".to_string(),
600                content: Some(Self::build_create_user_prompt(title, body, repo)),
601                reasoning: None,
602                cache_control: None,
603            },
604        ];
605
606        // Inject cache control on system message for Anthropic
607        if self.is_anthropic()
608            && let Some(msg) = messages.first_mut()
609        {
610            msg.cache_control = Some(super::types::CacheControl::ephemeral());
611        }
612
613        let request = ChatCompletionRequest {
614            model: self.model().to_string(),
615            messages,
616            response_format: Some(ResponseFormat {
617                format_type: "json_object".to_string(),
618                json_schema: None,
619            }),
620            max_tokens: Some(self.max_tokens()),
621            temperature: Some(self.temperature()),
622        };
623
624        // Send request and parse JSON with retry logic
625        let (create_response, ai_stats) = self
626            .send_and_parse::<super::types::CreateIssueResponse>(&request)
627            .await?;
628
629        debug!(
630            title_len = create_response.formatted_title.len(),
631            body_len = create_response.formatted_body.len(),
632            labels = create_response.suggested_labels.len(),
633            input_tokens = ai_stats.input_tokens,
634            output_tokens = ai_stats.output_tokens,
635            duration_ms = ai_stats.duration_ms,
636            "Issue formatting complete with stats"
637        );
638
639        Ok((create_response, ai_stats))
640    }
641
642    /// Builds the system prompt for issue triage.
643    #[must_use]
644    fn build_system_prompt(custom_guidance: Option<&str>) -> String {
645        let context = super::context::load_custom_guidance(custom_guidance);
646        build_triage_system_prompt(&context)
647    }
648
649    /// Builds the user prompt containing the issue details.
650    #[must_use]
651    fn build_user_prompt(issue: &IssueDetails) -> String {
652        use std::fmt::Write;
653
654        let mut prompt = String::new();
655
656        prompt.push_str("<issue_content>\n");
657        let _ = writeln!(prompt, "Title: {}\n", sanitize_prompt_field(&issue.title));
658
659        // Sanitize body before truncation (injection tag could straddle the boundary)
660        let sanitized_body = sanitize_prompt_field(&issue.body);
661        let body = if sanitized_body.len() > MAX_BODY_LENGTH {
662            format!(
663                "{}...\n[APTU: body truncated by size budget -- do not speculate on missing content]",
664                &sanitized_body[..MAX_BODY_LENGTH],
665            )
666        } else if sanitized_body.is_empty() {
667            "[No description provided]".to_string()
668        } else {
669            sanitized_body
670        };
671        let _ = writeln!(prompt, "Body:\n{body}\n");
672
673        // Include existing labels
674        if !issue.labels.is_empty() {
675            let _ = writeln!(prompt, "Existing Labels: {}\n", issue.labels.join(", "));
676        }
677
678        // Include recent comments (limited)
679        if !issue.comments.is_empty() {
680            prompt.push_str("Recent Comments:\n");
681            for comment in issue.comments.iter().take(MAX_COMMENTS) {
682                let sanitized_comment_body = sanitize_prompt_field(&comment.body);
683                let comment_body = if sanitized_comment_body.len() > 500 {
684                    format!("{}...", &sanitized_comment_body[..500])
685                } else {
686                    sanitized_comment_body
687                };
688                let _ = writeln!(
689                    prompt,
690                    "- @{}: {}",
691                    sanitize_prompt_field(&comment.author),
692                    comment_body
693                );
694            }
695            prompt.push('\n');
696        }
697
698        // Include related issues from search (for context)
699        if !issue.repo_context.is_empty() {
700            prompt.push_str("Related Issues in Repository (for context):\n");
701            for related in issue.repo_context.iter().take(10) {
702                let _ = writeln!(
703                    prompt,
704                    "- #{} [{}] {}",
705                    related.number,
706                    sanitize_prompt_field(&related.state),
707                    sanitize_prompt_field(&related.title)
708                );
709            }
710            prompt.push('\n');
711        }
712
713        // Include repository structure (source files)
714        if !issue.repo_tree.is_empty() {
715            prompt.push_str("Repository Structure (source files):\n");
716            for path in issue.repo_tree.iter().take(20) {
717                let _ = writeln!(prompt, "- {path}");
718            }
719            prompt.push('\n');
720        }
721
722        // Include available labels
723        if !issue.available_labels.is_empty() {
724            prompt.push_str("Available Labels:\n");
725            for label in issue.available_labels.iter().take(MAX_LABELS) {
726                let description = if label.description.is_empty() {
727                    String::new()
728                } else {
729                    format!(" - {}", sanitize_prompt_field(&label.description))
730                };
731                let _ = writeln!(
732                    prompt,
733                    "- {} (color: #{}){}",
734                    sanitize_prompt_field(&label.name),
735                    label.color,
736                    description
737                );
738            }
739            prompt.push('\n');
740        }
741
742        // Include available milestones
743        if !issue.available_milestones.is_empty() {
744            prompt.push_str("Available Milestones:\n");
745            for milestone in issue.available_milestones.iter().take(MAX_MILESTONES) {
746                let description = if milestone.description.is_empty() {
747                    String::new()
748                } else {
749                    format!(" - {}", sanitize_prompt_field(&milestone.description))
750                };
751                let _ = writeln!(
752                    prompt,
753                    "- {}{}",
754                    sanitize_prompt_field(&milestone.title),
755                    description
756                );
757            }
758            prompt.push('\n');
759        }
760
761        prompt.push_str("</issue_content>");
762        prompt.push_str(SCHEMA_PREAMBLE);
763        prompt.push_str(crate::ai::prompts::TRIAGE_SCHEMA);
764
765        prompt
766    }
767
768    /// Builds the system prompt for issue creation/formatting.
769    #[must_use]
770    fn build_create_system_prompt(custom_guidance: Option<&str>) -> String {
771        let context = super::context::load_custom_guidance(custom_guidance);
772        build_create_system_prompt(&context)
773    }
774
775    /// Builds the user prompt for issue creation/formatting.
776    #[must_use]
777    fn build_create_user_prompt(title: &str, body: &str, _repo: &str) -> String {
778        let sanitized_title = sanitize_prompt_field(title);
779        let sanitized_body = sanitize_prompt_field(body);
780        format!(
781            "Please format this GitHub issue:\n\nTitle: {sanitized_title}\n\nBody:\n{sanitized_body}{}{}",
782            SCHEMA_PREAMBLE,
783            crate::ai::prompts::CREATE_SCHEMA
784        )
785    }
786
787    /// Reviews a pull request using the provider's API.
788    ///
789    /// Analyzes PR metadata and file diffs to provide structured review feedback.
790    ///
791    /// # Arguments
792    ///
793    /// * `pr` - Pull request details including files and diffs
794    ///
795    /// # Errors
796    ///
797    /// Returns an error if:
798    /// - API request fails (network, timeout, rate limit)
799    /// - Response cannot be parsed as valid JSON
800    #[instrument(skip(self, pr, ast_context, call_graph), fields(pr_number = pr.number, repo = %format!("{}/{}", pr.owner, pr.repo)))]
801    async fn review_pr(
802        &self,
803        pr: &super::types::PrDetails,
804        mut ast_context: String,
805        mut call_graph: String,
806        review_config: &crate::config::ReviewConfig,
807    ) -> Result<(super::types::PrReviewResponse, AiStats)> {
808        debug!(model = %self.model(), "Calling {} API for PR review", self.name());
809
810        // Estimate preliminary size; enforce drop order for budget control
811        let mut estimated_size = pr.title.len()
812            + pr.body.len()
813            + pr.files
814                .iter()
815                .map(|f| f.patch.as_ref().map_or(0, String::len))
816                .sum::<usize>()
817            + pr.files
818                .iter()
819                .map(|f| f.full_content.as_ref().map_or(0, String::len))
820                .sum::<usize>()
821            + ast_context.len()
822            + call_graph.len()
823            + PROMPT_OVERHEAD_CHARS;
824
825        let max_prompt_chars = review_config.max_prompt_chars;
826
827        // Drop call_graph if over budget
828        if estimated_size > max_prompt_chars {
829            tracing::warn!(
830                section = "call_graph",
831                chars = call_graph.len(),
832                "Dropping section: prompt budget exceeded"
833            );
834            let dropped_chars = call_graph.len();
835            call_graph.clear();
836            estimated_size -= dropped_chars;
837        }
838
839        // Drop ast_context if still over budget
840        if estimated_size > max_prompt_chars {
841            tracing::warn!(
842                section = "ast_context",
843                chars = ast_context.len(),
844                "Dropping section: prompt budget exceeded"
845            );
846            let dropped_chars = ast_context.len();
847            ast_context.clear();
848            estimated_size -= dropped_chars;
849        }
850
851        // Step 3: Drop largest file patches first if still over budget
852        let mut pr_mut = pr.clone();
853        if estimated_size > max_prompt_chars {
854            // Collect files with their patch sizes
855            let mut file_sizes: Vec<(usize, usize)> = pr_mut
856                .files
857                .iter()
858                .enumerate()
859                .map(|(idx, f)| (idx, f.patch.as_ref().map_or(0, String::len)))
860                .collect();
861            // Sort by patch size descending
862            file_sizes.sort_by_key(|x| std::cmp::Reverse(x.1));
863
864            for (file_idx, patch_size) in file_sizes {
865                if estimated_size <= max_prompt_chars {
866                    break;
867                }
868                if patch_size > 0 {
869                    tracing::warn!(
870                        file = %pr_mut.files[file_idx].filename,
871                        patch_chars = patch_size,
872                        "Dropping file patch: prompt budget exceeded"
873                    );
874                    pr_mut.files[file_idx].patch = None;
875                    estimated_size -= patch_size;
876                }
877            }
878        }
879
880        // Step 4: drop full_content on all files
881        if estimated_size > max_prompt_chars {
882            for file in &mut pr_mut.files {
883                if let Some(fc) = file.full_content.take() {
884                    estimated_size = estimated_size.saturating_sub(fc.len());
885                    tracing::warn!(
886                        bytes = fc.len(),
887                        filename = %file.filename,
888                        "prompt budget: dropping full_content"
889                    );
890                }
891            }
892        }
893
894        tracing::info!(
895            prompt_chars = estimated_size,
896            max_chars = max_prompt_chars,
897            "PR review prompt assembled"
898        );
899
900        // Build request
901        let mut system_content = if let Some(override_prompt) =
902            super::context::load_system_prompt_override("pr_review_system").await
903        {
904            override_prompt
905        } else {
906            Self::build_pr_review_system_prompt(self.custom_guidance())
907        };
908
909        // Prepend repository instructions if available
910        if let Some(ref instructions) = pr.instructions {
911            // Escape XML delimiters to prevent tag injection
912            let escaped_instructions = instructions
913                .replace('&', "&amp;")
914                .replace('<', "&lt;")
915                .replace('>', "&gt;");
916            system_content = format!(
917                "<repo_instructions>\n{escaped_instructions}\n</repo_instructions>\n\n{system_content}"
918            );
919        }
920
921        // Assemble full prompt to measure actual size
922        let assembled_prompt =
923            Self::build_pr_review_user_prompt(&pr_mut, &ast_context, &call_graph);
924        let actual_prompt_chars = assembled_prompt.len();
925
926        tracing::info!(
927            actual_prompt_chars,
928            estimated_prompt_chars = estimated_size,
929            max_chars = max_prompt_chars,
930            "Actual assembled prompt size vs. estimate"
931        );
932
933        let mut messages = vec![
934            ChatMessage {
935                role: "system".to_string(),
936                content: Some(system_content),
937                reasoning: None,
938                cache_control: None,
939            },
940            ChatMessage {
941                role: "user".to_string(),
942                content: Some(assembled_prompt),
943                reasoning: None,
944                cache_control: None,
945            },
946        ];
947
948        // Inject cache control on system message for Anthropic
949        if self.is_anthropic()
950            && let Some(msg) = messages.first_mut()
951        {
952            msg.cache_control = Some(super::types::CacheControl::ephemeral());
953        }
954
955        let request = ChatCompletionRequest {
956            model: self.model().to_string(),
957            messages,
958            response_format: Some(ResponseFormat {
959                format_type: "json_object".to_string(),
960                json_schema: None,
961            }),
962            max_tokens: Some(self.max_tokens()),
963            temperature: Some(self.temperature()),
964        };
965
966        // Send request and parse JSON with retry logic
967        let (review, mut ai_stats) = self
968            .send_and_parse::<super::types::PrReviewResponse>(&request)
969            .await?;
970
971        ai_stats.prompt_chars = actual_prompt_chars;
972
973        debug!(
974            verdict = %review.verdict,
975            input_tokens = ai_stats.input_tokens,
976            output_tokens = ai_stats.output_tokens,
977            duration_ms = ai_stats.duration_ms,
978            prompt_chars = ai_stats.prompt_chars,
979            "PR review complete with stats"
980        );
981
982        Ok((review, ai_stats))
983    }
984
985    /// Suggests labels for a pull request using the provider's API.
986    ///
987    /// Analyzes PR title, body, and file paths to suggest relevant labels.
988    ///
989    /// # Arguments
990    ///
991    /// * `title` - Pull request title
992    /// * `body` - Pull request description
993    /// * `file_paths` - List of file paths changed in the PR
994    ///
995    /// # Errors
996    ///
997    /// Returns an error if:
998    /// - API request fails (network, timeout, rate limit)
999    /// - Response cannot be parsed as valid JSON
1000    #[instrument(skip(self), fields(title = %title))]
1001    async fn suggest_pr_labels(
1002        &self,
1003        title: &str,
1004        body: &str,
1005        file_paths: &[String],
1006    ) -> Result<(Vec<String>, AiStats)> {
1007        debug!(model = %self.model(), "Calling {} API for PR label suggestion", self.name());
1008
1009        // Build request
1010        let system_content = if let Some(override_prompt) =
1011            super::context::load_system_prompt_override("pr_label_system").await
1012        {
1013            override_prompt
1014        } else {
1015            Self::build_pr_label_system_prompt(self.custom_guidance())
1016        };
1017
1018        let mut messages = vec![
1019            ChatMessage {
1020                role: "system".to_string(),
1021                content: Some(system_content),
1022                reasoning: None,
1023                cache_control: None,
1024            },
1025            ChatMessage {
1026                role: "user".to_string(),
1027                content: Some(Self::build_pr_label_user_prompt(title, body, file_paths)),
1028                reasoning: None,
1029                cache_control: None,
1030            },
1031        ];
1032
1033        // Inject cache control on system message for Anthropic
1034        if self.is_anthropic()
1035            && let Some(msg) = messages.first_mut()
1036        {
1037            msg.cache_control = Some(super::types::CacheControl::ephemeral());
1038        }
1039
1040        let request = ChatCompletionRequest {
1041            model: self.model().to_string(),
1042            messages,
1043            response_format: Some(ResponseFormat {
1044                format_type: "json_object".to_string(),
1045                json_schema: None,
1046            }),
1047            max_tokens: Some(self.max_tokens()),
1048            temperature: Some(self.temperature()),
1049        };
1050
1051        // Send request and parse JSON with retry logic
1052        let (response, ai_stats) = self
1053            .send_and_parse::<super::types::PrLabelResponse>(&request)
1054            .await?;
1055
1056        debug!(
1057            label_count = response.suggested_labels.len(),
1058            input_tokens = ai_stats.input_tokens,
1059            output_tokens = ai_stats.output_tokens,
1060            duration_ms = ai_stats.duration_ms,
1061            "PR label suggestion complete with stats"
1062        );
1063
1064        Ok((response.suggested_labels, ai_stats))
1065    }
1066
1067    /// Builds the system prompt for PR review.
1068    #[must_use]
1069    fn build_pr_review_system_prompt(custom_guidance: Option<&str>) -> String {
1070        let context = super::context::load_custom_guidance(custom_guidance);
1071        build_pr_review_system_prompt(&context)
1072    }
1073
1074    /// Builds the user prompt for PR review.
1075    ///
1076    /// All user-controlled fields (title, body, filename, status, patch) are sanitized via
1077    /// [`sanitize_prompt_field`] before being written into the prompt to prevent prompt
1078    /// injection via XML tag smuggling.
1079    #[must_use]
1080    #[allow(clippy::too_many_lines)]
1081    fn build_pr_review_user_prompt(
1082        pr: &super::types::PrDetails,
1083        ast_context: &str,
1084        call_graph: &str,
1085    ) -> String {
1086        use std::fmt::Write;
1087
1088        let mut prompt = String::new();
1089
1090        prompt.push_str("<pull_request>\n");
1091        let _ = writeln!(prompt, "Title: {}\n", sanitize_prompt_field(&pr.title));
1092        let _ = writeln!(prompt, "Branch: {} -> {}\n", pr.head_branch, pr.base_branch);
1093
1094        // PR description - sanitize before truncation
1095        let sanitized_body = sanitize_prompt_field(&pr.body);
1096        let body = if sanitized_body.is_empty() {
1097            "[No description provided]".to_string()
1098        } else if sanitized_body.len() > MAX_BODY_LENGTH {
1099            format!(
1100                "{}...\n[APTU: description truncated by size budget -- do not speculate on missing content]",
1101                &sanitized_body[..MAX_BODY_LENGTH],
1102            )
1103        } else {
1104            sanitized_body
1105        };
1106        let _ = writeln!(prompt, "Description:\n{body}\n");
1107
1108        // File changes with limits
1109        prompt.push_str("Files Changed:\n");
1110        let mut total_diff_size = 0;
1111        let mut files_included = 0;
1112        let mut files_skipped = 0;
1113
1114        for file in &pr.files {
1115            // Check file count limit
1116            if files_included >= MAX_FILES {
1117                files_skipped += 1;
1118                continue;
1119            }
1120
1121            let _ = writeln!(
1122                prompt,
1123                "- {} ({}) +{} -{}\n",
1124                sanitize_prompt_field(&file.filename),
1125                sanitize_prompt_field(&file.status),
1126                file.additions,
1127                file.deletions
1128            );
1129
1130            // Include patch if available (sanitize then truncate large patches)
1131            if let Some(patch) = &file.patch {
1132                const MAX_PATCH_LENGTH: usize = 2000;
1133                let sanitized_patch = sanitize_prompt_field(patch);
1134                let patch_content = if sanitized_patch.len() > MAX_PATCH_LENGTH {
1135                    format!(
1136                        "{}...\n[APTU: patch truncated by size budget -- do not speculate on missing content]",
1137                        &sanitized_patch[..MAX_PATCH_LENGTH],
1138                    )
1139                } else {
1140                    sanitized_patch
1141                };
1142
1143                // Check if adding this patch would exceed total diff size limit
1144                let patch_size = patch_content.len();
1145                if total_diff_size + patch_size > MAX_TOTAL_DIFF_SIZE {
1146                    let _ = writeln!(
1147                        prompt,
1148                        "```diff\n[APTU: patch omitted due to size budget -- do not speculate on missing content]\n```\n"
1149                    );
1150                    files_skipped += 1;
1151                    continue;
1152                }
1153
1154                // Add annotation if patch was truncated by GitHub API
1155                if file.patch_truncated {
1156                    let _ = writeln!(
1157                        prompt,
1158                        "[APTU: patch truncated by GitHub API -- do not speculate on missing content]\n```diff\n{patch_content}\n```\n"
1159                    );
1160                } else {
1161                    let _ = writeln!(prompt, "```diff\n{patch_content}\n```\n");
1162                }
1163                total_diff_size += patch_size;
1164            }
1165
1166            // Include full file content if available (cap at MAX_FULL_CONTENT_CHARS)
1167            if let Some(content) = &file.full_content {
1168                let sanitized = sanitize_prompt_field(content);
1169                let is_truncated = sanitized.len() > MAX_FULL_CONTENT_CHARS;
1170                let displayed = if is_truncated {
1171                    sanitized[..MAX_FULL_CONTENT_CHARS].to_string()
1172                } else {
1173                    sanitized
1174                };
1175                let _ = writeln!(
1176                    prompt,
1177                    "<file_content path=\"{}\">\n{}\n</file_content>",
1178                    sanitize_prompt_field(&file.filename),
1179                    displayed
1180                );
1181                if is_truncated {
1182                    let _ = writeln!(
1183                        prompt,
1184                        "[APTU: file content truncated by size budget -- do not speculate on missing content]\n"
1185                    );
1186                } else {
1187                    let _ = writeln!(prompt);
1188                }
1189            }
1190
1191            files_included += 1;
1192        }
1193
1194        // Add truncation message if files were skipped
1195        if files_skipped > 0 {
1196            let _ = writeln!(
1197                prompt,
1198                "\n[{files_skipped} files omitted due to size limits (MAX_FILES={MAX_FILES}, MAX_TOTAL_DIFF_SIZE={MAX_TOTAL_DIFF_SIZE})]"
1199            );
1200        }
1201
1202        prompt.push_str("</pull_request>");
1203        if !ast_context.is_empty() {
1204            prompt.push_str(ast_context);
1205        }
1206        if !call_graph.is_empty() {
1207            prompt.push_str(call_graph);
1208        }
1209        prompt.push_str(SCHEMA_PREAMBLE);
1210        prompt.push_str(crate::ai::prompts::PR_REVIEW_SCHEMA);
1211
1212        prompt
1213    }
1214
1215    /// Builds the system prompt for PR label suggestion.
1216    #[must_use]
1217    fn build_pr_label_system_prompt(custom_guidance: Option<&str>) -> String {
1218        let context = super::context::load_custom_guidance(custom_guidance);
1219        build_pr_label_system_prompt(&context)
1220    }
1221
1222    /// Builds the user prompt for PR label suggestion.
1223    #[must_use]
1224    fn build_pr_label_user_prompt(title: &str, body: &str, file_paths: &[String]) -> String {
1225        use std::fmt::Write;
1226
1227        let mut prompt = String::new();
1228
1229        // Sanitize title and body to prevent prompt injection
1230        let sanitized_title = sanitize_prompt_field(title);
1231        let sanitized_body = sanitize_prompt_field(body);
1232
1233        prompt.push_str("<pull_request>\n");
1234        let _ = writeln!(prompt, "Title: {sanitized_title}\n");
1235
1236        // PR description
1237        let body_content = if sanitized_body.is_empty() {
1238            "[No description provided]".to_string()
1239        } else if sanitized_body.len() > MAX_BODY_LENGTH {
1240            format!(
1241                "{}...\n[APTU: description truncated by size budget -- do not speculate on missing content]",
1242                &sanitized_body[..MAX_BODY_LENGTH],
1243            )
1244        } else {
1245            sanitized_body.clone()
1246        };
1247        let _ = writeln!(prompt, "Description:\n{body_content}\n");
1248
1249        // File paths
1250        if !file_paths.is_empty() {
1251            prompt.push_str("Files Changed:\n");
1252            for path in file_paths.iter().take(20) {
1253                let _ = writeln!(prompt, "- {path}");
1254            }
1255            if file_paths.len() > 20 {
1256                let _ = writeln!(prompt, "- ... and {} more files", file_paths.len() - 20);
1257            }
1258            prompt.push('\n');
1259        }
1260
1261        prompt.push_str("</pull_request>");
1262        prompt.push_str(SCHEMA_PREAMBLE);
1263        prompt.push_str(crate::ai::prompts::PR_LABEL_SCHEMA);
1264
1265        prompt
1266    }
1267}
1268
1269#[cfg(test)]
1270mod tests {
1271    use super::*;
1272
1273    /// Shared struct for `parse_ai_json` error-path tests.
1274    /// The field is only used via serde deserialization; `_message` silences `dead_code`.
1275    #[derive(Debug, serde::Deserialize)]
1276    struct ErrorTestResponse {
1277        _message: String,
1278    }
1279
1280    struct TestProvider;
1281
1282    impl AiProvider for TestProvider {
1283        fn name(&self) -> &'static str {
1284            "test"
1285        }
1286
1287        fn api_url(&self) -> &'static str {
1288            "https://test.example.com"
1289        }
1290
1291        fn api_key_env(&self) -> &'static str {
1292            "TEST_API_KEY"
1293        }
1294
1295        fn http_client(&self) -> &Client {
1296            unimplemented!()
1297        }
1298
1299        fn api_key(&self) -> &SecretString {
1300            unimplemented!()
1301        }
1302
1303        fn model(&self) -> &'static str {
1304            "test-model"
1305        }
1306
1307        fn max_tokens(&self) -> u32 {
1308            2048
1309        }
1310
1311        fn temperature(&self) -> f32 {
1312            0.3
1313        }
1314    }
1315
1316    #[test]
1317    fn test_build_system_prompt_contains_json_schema() {
1318        let system_prompt = TestProvider::build_system_prompt(None);
1319        // Schema description strings are unique to the schema file and must NOT appear in the
1320        // system prompt after moving schema injection to the user turn.
1321        assert!(
1322            !system_prompt
1323                .contains("A 2-3 sentence summary of what the issue is about and its impact")
1324        );
1325
1326        // Schema MUST appear in the user prompt
1327        let issue = IssueDetails::builder()
1328            .owner("test".to_string())
1329            .repo("repo".to_string())
1330            .number(1)
1331            .title("Test".to_string())
1332            .body("Body".to_string())
1333            .labels(vec![])
1334            .comments(vec![])
1335            .url("https://github.com/test/repo/issues/1".to_string())
1336            .build();
1337        let user_prompt = TestProvider::build_user_prompt(&issue);
1338        assert!(
1339            user_prompt
1340                .contains("A 2-3 sentence summary of what the issue is about and its impact")
1341        );
1342        assert!(user_prompt.contains("suggested_labels"));
1343    }
1344
1345    #[test]
1346    fn test_build_user_prompt_with_delimiters() {
1347        let issue = IssueDetails::builder()
1348            .owner("test".to_string())
1349            .repo("repo".to_string())
1350            .number(1)
1351            .title("Test issue".to_string())
1352            .body("This is the body".to_string())
1353            .labels(vec!["bug".to_string()])
1354            .comments(vec![])
1355            .url("https://github.com/test/repo/issues/1".to_string())
1356            .build();
1357
1358        let prompt = TestProvider::build_user_prompt(&issue);
1359        assert!(prompt.starts_with("<issue_content>"));
1360        assert!(prompt.contains("</issue_content>"));
1361        assert!(prompt.contains("Respond with valid JSON matching this schema"));
1362        assert!(prompt.contains("Title: Test issue"));
1363        assert!(prompt.contains("This is the body"));
1364        assert!(prompt.contains("Existing Labels: bug"));
1365    }
1366
1367    #[test]
1368    fn test_build_user_prompt_truncates_long_body() {
1369        let long_body = "x".repeat(5000);
1370        let issue = IssueDetails::builder()
1371            .owner("test".to_string())
1372            .repo("repo".to_string())
1373            .number(1)
1374            .title("Test".to_string())
1375            .body(long_body)
1376            .labels(vec![])
1377            .comments(vec![])
1378            .url("https://github.com/test/repo/issues/1".to_string())
1379            .build();
1380
1381        let prompt = TestProvider::build_user_prompt(&issue);
1382        assert!(prompt.contains(
1383            "[APTU: body truncated by size budget -- do not speculate on missing content]"
1384        ));
1385    }
1386
1387    #[test]
1388    fn test_build_user_prompt_empty_body() {
1389        let issue = IssueDetails::builder()
1390            .owner("test".to_string())
1391            .repo("repo".to_string())
1392            .number(1)
1393            .title("Test".to_string())
1394            .body(String::new())
1395            .labels(vec![])
1396            .comments(vec![])
1397            .url("https://github.com/test/repo/issues/1".to_string())
1398            .build();
1399
1400        let prompt = TestProvider::build_user_prompt(&issue);
1401        assert!(prompt.contains("[No description provided]"));
1402    }
1403
1404    #[test]
1405    fn test_build_create_system_prompt_contains_json_schema() {
1406        let system_prompt = TestProvider::build_create_system_prompt(None);
1407        // Schema description strings are unique to the schema file and must NOT appear in system prompt.
1408        assert!(
1409            !system_prompt
1410                .contains("Well-formatted issue title following conventional commit style")
1411        );
1412
1413        // Schema MUST appear in the user prompt
1414        let user_prompt =
1415            TestProvider::build_create_user_prompt("My title", "My body", "test/repo");
1416        assert!(
1417            user_prompt.contains("Well-formatted issue title following conventional commit style")
1418        );
1419        assert!(user_prompt.contains("formatted_body"));
1420    }
1421
1422    #[test]
1423    fn test_build_pr_review_user_prompt_respects_file_limit() {
1424        use super::super::types::{PrDetails, PrFile};
1425
1426        let mut files = Vec::new();
1427        for i in 0..25 {
1428            files.push(PrFile {
1429                filename: format!("file{i}.rs"),
1430                status: "modified".to_string(),
1431                additions: 10,
1432                deletions: 5,
1433                patch: Some(format!("patch content {i}")),
1434                patch_truncated: false,
1435                full_content: None,
1436            });
1437        }
1438
1439        let pr = PrDetails {
1440            owner: "test".to_string(),
1441            repo: "repo".to_string(),
1442            number: 1,
1443            title: "Test PR".to_string(),
1444            body: "Description".to_string(),
1445            head_branch: "feature".to_string(),
1446            base_branch: "main".to_string(),
1447            url: "https://github.com/test/repo/pull/1".to_string(),
1448            files,
1449            labels: vec![],
1450            head_sha: String::new(),
1451            review_comments: vec![],
1452            instructions: None,
1453        };
1454
1455        let prompt = TestProvider::build_pr_review_user_prompt(&pr, "", "");
1456        assert!(prompt.contains("files omitted due to size limits"));
1457        assert!(prompt.contains("MAX_FILES=20"));
1458    }
1459
1460    #[test]
1461    fn test_build_pr_review_user_prompt_respects_diff_size_limit() {
1462        use super::super::types::{PrDetails, PrFile};
1463
1464        // Create patches that will exceed the limit when combined
1465        // Each patch is ~30KB, so two will exceed 50KB limit
1466        let patch1 = "x".repeat(30_000);
1467        let patch2 = "y".repeat(30_000);
1468
1469        let files = vec![
1470            PrFile {
1471                filename: "file1.rs".to_string(),
1472                status: "modified".to_string(),
1473                additions: 100,
1474                deletions: 50,
1475                patch: Some(patch1),
1476                patch_truncated: false,
1477                full_content: None,
1478            },
1479            PrFile {
1480                filename: "file2.rs".to_string(),
1481                status: "modified".to_string(),
1482                additions: 100,
1483                deletions: 50,
1484                patch: Some(patch2),
1485                patch_truncated: false,
1486                full_content: None,
1487            },
1488        ];
1489
1490        let pr = PrDetails {
1491            owner: "test".to_string(),
1492            repo: "repo".to_string(),
1493            number: 1,
1494            title: "Test PR".to_string(),
1495            body: "Description".to_string(),
1496            head_branch: "feature".to_string(),
1497            base_branch: "main".to_string(),
1498            url: "https://github.com/test/repo/pull/1".to_string(),
1499            files,
1500            labels: vec![],
1501            head_sha: String::new(),
1502            review_comments: vec![],
1503            instructions: None,
1504        };
1505
1506        let prompt = TestProvider::build_pr_review_user_prompt(&pr, "", "");
1507        // Both files should be listed
1508        assert!(prompt.contains("file1.rs"));
1509        assert!(prompt.contains("file2.rs"));
1510        // The second patch should be limited - verify the prompt doesn't contain both full patches
1511        // by checking that the total size is less than what two full 30KB patches would be
1512        assert!(prompt.len() < 65_000);
1513    }
1514
1515    #[test]
1516    fn test_build_pr_review_user_prompt_with_no_patches() {
1517        use super::super::types::{PrDetails, PrFile};
1518
1519        let files = vec![PrFile {
1520            filename: "file1.rs".to_string(),
1521            status: "added".to_string(),
1522            additions: 10,
1523            deletions: 0,
1524            patch: None,
1525            patch_truncated: false,
1526            full_content: None,
1527        }];
1528
1529        let pr = PrDetails {
1530            owner: "test".to_string(),
1531            repo: "repo".to_string(),
1532            number: 1,
1533            title: "Test PR".to_string(),
1534            body: "Description".to_string(),
1535            head_branch: "feature".to_string(),
1536            base_branch: "main".to_string(),
1537            url: "https://github.com/test/repo/pull/1".to_string(),
1538            files,
1539            labels: vec![],
1540            head_sha: String::new(),
1541            review_comments: vec![],
1542            instructions: None,
1543        };
1544
1545        let prompt = TestProvider::build_pr_review_user_prompt(&pr, "", "");
1546        assert!(prompt.contains("file1.rs"));
1547        assert!(prompt.contains("added"));
1548        assert!(!prompt.contains("files omitted"));
1549    }
1550
1551    #[test]
1552    fn test_sanitize_strips_opening_tag() {
1553        let result = sanitize_prompt_field("hello <pull_request> world");
1554        assert_eq!(result, "hello  world");
1555    }
1556
1557    #[test]
1558    fn test_sanitize_strips_closing_tag() {
1559        let result = sanitize_prompt_field("evil </pull_request> content");
1560        assert_eq!(result, "evil  content");
1561    }
1562
1563    #[test]
1564    fn test_sanitize_case_insensitive() {
1565        let result = sanitize_prompt_field("<PULL_REQUEST>");
1566        assert_eq!(result, "");
1567    }
1568
1569    #[test]
1570    fn test_prompt_sanitizes_before_truncation() {
1571        use super::super::types::{PrDetails, PrFile};
1572
1573        // Body exactly at the limit with an injection tag after the truncation boundary.
1574        // The tag must be removed even though it appears near the end of the original body.
1575        let mut body = "a".repeat(MAX_BODY_LENGTH - 5);
1576        body.push_str("</pull_request>");
1577
1578        let pr = PrDetails {
1579            owner: "test".to_string(),
1580            repo: "repo".to_string(),
1581            number: 1,
1582            title: "Fix </pull_request><evil>injection</evil>".to_string(),
1583            body,
1584            head_branch: "feature".to_string(),
1585            base_branch: "main".to_string(),
1586            url: "https://github.com/test/repo/pull/1".to_string(),
1587            files: vec![PrFile {
1588                filename: "file.rs".to_string(),
1589                status: "modified".to_string(),
1590                additions: 1,
1591                deletions: 0,
1592                patch: Some("</pull_request>injected".to_string()),
1593                patch_truncated: false,
1594                full_content: None,
1595            }],
1596            labels: vec![],
1597            head_sha: String::new(),
1598            review_comments: vec![],
1599            instructions: None,
1600        };
1601
1602        let prompt = TestProvider::build_pr_review_user_prompt(&pr, "", "");
1603        // The sanitizer removes only <pull_request> / </pull_request> delimiters.
1604        // The structural tags written by the builder itself remain; what must be absent
1605        // are the delimiter sequences that were injected inside user-controlled fields.
1606        assert!(
1607            !prompt.contains("</pull_request><evil>"),
1608            "closing delimiter injected in title must be removed"
1609        );
1610        assert!(
1611            !prompt.contains("</pull_request>injected"),
1612            "closing delimiter injected in patch must be removed"
1613        );
1614    }
1615
1616    #[test]
1617    fn test_sanitize_strips_issue_content_tag() {
1618        let input = "hello </issue_content> world";
1619        let result = sanitize_prompt_field(input);
1620        assert!(
1621            !result.contains("</issue_content>"),
1622            "should strip closing issue_content tag"
1623        );
1624        assert!(
1625            result.contains("hello"),
1626            "should keep non-injection content"
1627        );
1628    }
1629
1630    #[test]
1631    fn test_build_user_prompt_sanitizes_title_injection() {
1632        let issue = IssueDetails::builder()
1633            .owner("test".to_string())
1634            .repo("repo".to_string())
1635            .number(1)
1636            .title("Normal title </issue_content> injected".to_string())
1637            .body("Clean body".to_string())
1638            .labels(vec![])
1639            .comments(vec![])
1640            .url("https://github.com/test/repo/issues/1".to_string())
1641            .build();
1642
1643        let prompt = TestProvider::build_user_prompt(&issue);
1644        assert!(
1645            !prompt.contains("</issue_content> injected"),
1646            "injection tag in title must be removed from prompt"
1647        );
1648        assert!(
1649            prompt.contains("Normal title"),
1650            "non-injection content must be preserved"
1651        );
1652    }
1653
1654    #[test]
1655    fn test_build_create_user_prompt_sanitizes_title_injection() {
1656        let title = "My issue </issue_content><script>evil</script>";
1657        let body = "Body </issue_content> more text";
1658        let prompt = TestProvider::build_create_user_prompt(title, body, "owner/repo");
1659        assert!(
1660            !prompt.contains("</issue_content>"),
1661            "injection tag must be stripped from create prompt"
1662        );
1663        assert!(
1664            prompt.contains("My issue"),
1665            "non-injection title content must be preserved"
1666        );
1667        assert!(
1668            prompt.contains("Body"),
1669            "non-injection body content must be preserved"
1670        );
1671    }
1672
1673    #[test]
1674    fn test_build_pr_label_system_prompt_contains_json_schema() {
1675        let system_prompt = TestProvider::build_pr_label_system_prompt(None);
1676        // "label1" is unique to the schema example values and must NOT appear in system prompt.
1677        assert!(!system_prompt.contains("label1"));
1678
1679        // Schema MUST appear in the user prompt
1680        let user_prompt = TestProvider::build_pr_label_user_prompt(
1681            "feat: add thing",
1682            "body",
1683            &["src/lib.rs".to_string()],
1684        );
1685        assert!(user_prompt.contains("label1"));
1686        assert!(user_prompt.contains("suggested_labels"));
1687    }
1688
1689    #[test]
1690    fn test_build_pr_label_user_prompt_with_title_and_body() {
1691        let title = "feat: add new feature";
1692        let body = "This PR adds a new feature";
1693        let files = vec!["src/main.rs".to_string(), "tests/test.rs".to_string()];
1694
1695        let prompt = TestProvider::build_pr_label_user_prompt(title, body, &files);
1696        assert!(prompt.starts_with("<pull_request>"));
1697        assert!(prompt.contains("</pull_request>"));
1698        assert!(prompt.contains("Respond with valid JSON matching this schema"));
1699        assert!(prompt.contains("feat: add new feature"));
1700        assert!(prompt.contains("This PR adds a new feature"));
1701        assert!(prompt.contains("src/main.rs"));
1702        assert!(prompt.contains("tests/test.rs"));
1703    }
1704
1705    #[test]
1706    fn test_build_pr_label_user_prompt_empty_body() {
1707        let title = "fix: bug fix";
1708        let body = "";
1709        let files = vec!["src/lib.rs".to_string()];
1710
1711        let prompt = TestProvider::build_pr_label_user_prompt(title, body, &files);
1712        assert!(prompt.contains("[No description provided]"));
1713        assert!(prompt.contains("src/lib.rs"));
1714    }
1715
1716    #[test]
1717    fn test_build_pr_label_user_prompt_truncates_long_body() {
1718        let title = "test";
1719        let long_body = "x".repeat(5000);
1720        let files = vec![];
1721
1722        let prompt = TestProvider::build_pr_label_user_prompt(title, &long_body, &files);
1723        assert!(prompt.contains(
1724            "[APTU: description truncated by size budget -- do not speculate on missing content]"
1725        ));
1726    }
1727
1728    #[test]
1729    fn test_build_pr_label_user_prompt_respects_file_limit() {
1730        let title = "test";
1731        let body = "test";
1732        let mut files = Vec::new();
1733        for i in 0..25 {
1734            files.push(format!("file{i}.rs"));
1735        }
1736
1737        let prompt = TestProvider::build_pr_label_user_prompt(title, body, &files);
1738        assert!(prompt.contains("file0.rs"));
1739        assert!(prompt.contains("file19.rs"));
1740        assert!(!prompt.contains("file20.rs"));
1741        assert!(prompt.contains("... and 5 more files"));
1742    }
1743
1744    #[test]
1745    fn test_build_pr_label_user_prompt_empty_files() {
1746        let title = "test";
1747        let body = "test";
1748        let files: Vec<String> = vec![];
1749
1750        let prompt = TestProvider::build_pr_label_user_prompt(title, body, &files);
1751        assert!(prompt.contains("Title: test"));
1752        assert!(prompt.contains("Description:\ntest"));
1753        assert!(!prompt.contains("Files Changed:"));
1754    }
1755
1756    #[test]
1757    fn test_parse_ai_json_with_valid_json() {
1758        #[derive(serde::Deserialize)]
1759        struct TestResponse {
1760            message: String,
1761        }
1762
1763        let json = r#"{"message": "hello"}"#;
1764        let result: Result<TestResponse> = parse_ai_json(json, "test-provider");
1765        assert!(result.is_ok());
1766        let response = result.unwrap();
1767        assert_eq!(response.message, "hello");
1768    }
1769
1770    #[test]
1771    fn test_parse_ai_json_with_truncated_json() {
1772        let json = r#"{"message": "hello"#;
1773        let result: Result<ErrorTestResponse> = parse_ai_json(json, "test-provider");
1774        assert!(result.is_err());
1775        let err = result.unwrap_err();
1776        assert!(
1777            err.to_string()
1778                .contains("Truncated response from test-provider")
1779        );
1780    }
1781
1782    #[test]
1783    fn test_parse_ai_json_with_malformed_json() {
1784        let json = r#"{"message": invalid}"#;
1785        let result: Result<ErrorTestResponse> = parse_ai_json(json, "test-provider");
1786        assert!(result.is_err());
1787        let err = result.unwrap_err();
1788        assert!(err.to_string().contains("Invalid JSON response from AI"));
1789    }
1790
1791    #[tokio::test]
1792    async fn test_load_system_prompt_override_returns_none_when_absent() {
1793        let result =
1794            super::super::context::load_system_prompt_override("__nonexistent_test_override__")
1795                .await;
1796        assert!(result.is_none());
1797    }
1798
1799    #[tokio::test]
1800    async fn test_load_system_prompt_override_returns_content_when_present() {
1801        use std::io::Write;
1802        let dir = tempfile::tempdir().expect("create tempdir");
1803        let file_path = dir.path().join("test_override.md");
1804        let mut f = std::fs::File::create(&file_path).expect("create file");
1805        writeln!(f, "Custom override content").expect("write file");
1806        drop(f);
1807
1808        let content = tokio::fs::read_to_string(&file_path).await.ok();
1809        assert_eq!(content.as_deref(), Some("Custom override content\n"));
1810    }
1811
1812    #[test]
1813    fn test_build_pr_review_prompt_omits_call_graph_when_oversized() {
1814        use super::super::types::{PrDetails, PrFile};
1815
1816        // Arrange: simulate review_pr dropping call_graph due to budget.
1817        // When call_graph is oversized, review_pr clears it before calling build_pr_review_user_prompt.
1818        let pr = PrDetails {
1819            owner: "test".to_string(),
1820            repo: "repo".to_string(),
1821            number: 1,
1822            title: "Budget drop test".to_string(),
1823            body: "body".to_string(),
1824            head_branch: "feat".to_string(),
1825            base_branch: "main".to_string(),
1826            url: "https://github.com/test/repo/pull/1".to_string(),
1827            files: vec![PrFile {
1828                filename: "lib.rs".to_string(),
1829                status: "modified".to_string(),
1830                additions: 1,
1831                deletions: 0,
1832                patch: Some("+line".to_string()),
1833                patch_truncated: false,
1834                full_content: None,
1835            }],
1836            labels: vec![],
1837            head_sha: String::new(),
1838            review_comments: vec![],
1839            instructions: None,
1840        };
1841
1842        // Act: call build_pr_review_user_prompt with empty call_graph (dropped by review_pr)
1843        // and non-empty ast_context (retained because it fits after call_graph drop)
1844        let ast_context = "Y".repeat(500);
1845        let call_graph = "";
1846        let prompt = TestProvider::build_pr_review_user_prompt(&pr, &ast_context, call_graph);
1847
1848        // Assert: call_graph absent, ast_context present
1849        assert!(
1850            !prompt.contains(&"X".repeat(10)),
1851            "call_graph content must not appear in prompt after budget drop"
1852        );
1853        assert!(
1854            prompt.contains(&"Y".repeat(10)),
1855            "ast_context content must appear in prompt (fits within budget)"
1856        );
1857    }
1858
1859    #[test]
1860    fn test_build_pr_review_prompt_omits_ast_after_call_graph() {
1861        use super::super::types::{PrDetails, PrFile};
1862
1863        // Arrange: simulate review_pr dropping both call_graph and ast_context due to budget.
1864        let pr = PrDetails {
1865            owner: "test".to_string(),
1866            repo: "repo".to_string(),
1867            number: 1,
1868            title: "Budget drop test".to_string(),
1869            body: "body".to_string(),
1870            head_branch: "feat".to_string(),
1871            base_branch: "main".to_string(),
1872            url: "https://github.com/test/repo/pull/1".to_string(),
1873            files: vec![PrFile {
1874                filename: "lib.rs".to_string(),
1875                status: "modified".to_string(),
1876                additions: 1,
1877                deletions: 0,
1878                patch: Some("+line".to_string()),
1879                patch_truncated: false,
1880                full_content: None,
1881            }],
1882            labels: vec![],
1883            head_sha: String::new(),
1884            review_comments: vec![],
1885            instructions: None,
1886        };
1887
1888        // Act: call build_pr_review_user_prompt with both empty (dropped by review_pr)
1889        let ast_context = "";
1890        let call_graph = "";
1891        let prompt = TestProvider::build_pr_review_user_prompt(&pr, ast_context, call_graph);
1892
1893        // Assert: both absent, PR title retained
1894        assert!(
1895            !prompt.contains(&"C".repeat(10)),
1896            "call_graph content must not appear after budget drop"
1897        );
1898        assert!(
1899            !prompt.contains(&"A".repeat(10)),
1900            "ast_context content must not appear after budget drop"
1901        );
1902        assert!(
1903            prompt.contains("Budget drop test"),
1904            "PR title must be retained in prompt"
1905        );
1906    }
1907
1908    #[test]
1909    fn test_build_pr_review_prompt_drops_patches_when_over_budget() {
1910        use super::super::types::{PrDetails, PrFile};
1911
1912        // Arrange: simulate review_pr dropping patches due to budget.
1913        // Create 3 files with patches of different sizes.
1914        let pr = PrDetails {
1915            owner: "test".to_string(),
1916            repo: "repo".to_string(),
1917            number: 1,
1918            title: "Patch drop test".to_string(),
1919            body: "body".to_string(),
1920            head_branch: "feat".to_string(),
1921            base_branch: "main".to_string(),
1922            url: "https://github.com/test/repo/pull/1".to_string(),
1923            files: vec![
1924                PrFile {
1925                    filename: "large.rs".to_string(),
1926                    status: "modified".to_string(),
1927                    additions: 100,
1928                    deletions: 50,
1929                    patch: Some("L".repeat(5000)),
1930                    patch_truncated: false,
1931                    full_content: None,
1932                },
1933                PrFile {
1934                    filename: "medium.rs".to_string(),
1935                    status: "modified".to_string(),
1936                    additions: 50,
1937                    deletions: 25,
1938                    patch: Some("M".repeat(3000)),
1939                    patch_truncated: false,
1940                    full_content: None,
1941                },
1942                PrFile {
1943                    filename: "small.rs".to_string(),
1944                    status: "modified".to_string(),
1945                    additions: 10,
1946                    deletions: 5,
1947                    patch: Some("S".repeat(1000)),
1948                    patch_truncated: false,
1949                    full_content: None,
1950                },
1951            ],
1952            labels: vec![],
1953            head_sha: String::new(),
1954            review_comments: vec![],
1955            instructions: None,
1956        };
1957
1958        // Act: simulate review_pr dropping largest patches first
1959        let mut pr_mut = pr.clone();
1960        pr_mut.files[0].patch = None; // Drop largest patch
1961        pr_mut.files[1].patch = None; // Drop medium patch
1962        // Keep smallest patch
1963
1964        let ast_context = "";
1965        let call_graph = "";
1966        let prompt = TestProvider::build_pr_review_user_prompt(&pr_mut, ast_context, call_graph);
1967
1968        // Assert: largest patches absent, smallest present
1969        assert!(
1970            !prompt.contains(&"L".repeat(10)),
1971            "largest patch must be absent after drop"
1972        );
1973        assert!(
1974            !prompt.contains(&"M".repeat(10)),
1975            "medium patch must be absent after drop"
1976        );
1977        assert!(
1978            prompt.contains(&"S".repeat(10)),
1979            "smallest patch must be present"
1980        );
1981    }
1982
1983    #[test]
1984    fn test_build_pr_review_prompt_drops_full_content_as_last_resort() {
1985        use super::super::types::{PrDetails, PrFile};
1986
1987        // Arrange: simulate review_pr dropping full_content as last resort.
1988        let pr = PrDetails {
1989            owner: "test".to_string(),
1990            repo: "repo".to_string(),
1991            number: 1,
1992            title: "Full content drop test".to_string(),
1993            body: "body".to_string(),
1994            head_branch: "feat".to_string(),
1995            base_branch: "main".to_string(),
1996            url: "https://github.com/test/repo/pull/1".to_string(),
1997            files: vec![
1998                PrFile {
1999                    filename: "file1.rs".to_string(),
2000                    status: "modified".to_string(),
2001                    additions: 10,
2002                    deletions: 5,
2003                    patch: None,
2004                    patch_truncated: false,
2005                    full_content: Some("F".repeat(5000)),
2006                },
2007                PrFile {
2008                    filename: "file2.rs".to_string(),
2009                    status: "modified".to_string(),
2010                    additions: 10,
2011                    deletions: 5,
2012                    patch: None,
2013                    patch_truncated: false,
2014                    full_content: Some("C".repeat(3000)),
2015                },
2016            ],
2017            labels: vec![],
2018            head_sha: String::new(),
2019            review_comments: vec![],
2020            instructions: None,
2021        };
2022
2023        // Act: simulate review_pr dropping all full_content
2024        let mut pr_mut = pr.clone();
2025        for file in &mut pr_mut.files {
2026            file.full_content = None;
2027        }
2028
2029        let ast_context = "";
2030        let call_graph = "";
2031        let prompt = TestProvider::build_pr_review_user_prompt(&pr_mut, ast_context, call_graph);
2032
2033        // Assert: no file_content XML blocks appear
2034        assert!(
2035            !prompt.contains("<file_content"),
2036            "file_content blocks must not appear when full_content is cleared"
2037        );
2038        assert!(
2039            !prompt.contains(&"F".repeat(10)),
2040            "full_content from file1 must not appear"
2041        );
2042        assert!(
2043            !prompt.contains(&"C".repeat(10)),
2044            "full_content from file2 must not appear"
2045        );
2046    }
2047
2048    #[test]
2049    fn test_redact_api_error_body_truncates() {
2050        // Arrange: Create a long error body
2051        let long_body = "x".repeat(300);
2052
2053        // Act: Redact the error body
2054        let result = redact_api_error_body(&long_body);
2055
2056        // Assert: Result should be truncated and marked
2057        assert!(result.len() < long_body.len());
2058        assert!(result.ends_with("[truncated]"));
2059        assert_eq!(result.len(), 200 + " [truncated]".len());
2060    }
2061
2062    #[test]
2063    fn test_redact_api_error_body_short() {
2064        // Arrange: Create a short error body
2065        let short_body = "Short error";
2066
2067        // Act: Redact the error body
2068        let result = redact_api_error_body(short_body);
2069
2070        // Assert: Result should be unchanged
2071        assert_eq!(result, short_body);
2072    }
2073
2074    #[test]
2075    fn test_full_content_truncation_annotation_added() {
2076        use super::super::types::{PrDetails, PrFile};
2077
2078        // Arrange: PR with file content that will be truncated
2079        let pr = PrDetails {
2080            owner: "test".to_string(),
2081            repo: "repo".to_string(),
2082            number: 1,
2083            title: "Test PR".to_string(),
2084            body: "body".to_string(),
2085            head_branch: "feat".to_string(),
2086            base_branch: "main".to_string(),
2087            url: "https://github.com/test/repo/pull/1".to_string(),
2088            files: vec![PrFile {
2089                filename: "large_file.rs".to_string(),
2090                status: "modified".to_string(),
2091                additions: 10,
2092                deletions: 5,
2093                patch: Some("--- a/file\n+++ b/file\n@@ -1 @@\n+added".to_string()),
2094                patch_truncated: false,
2095                full_content: Some("x".repeat(10000)), // Will be truncated
2096            }],
2097            labels: vec![],
2098            head_sha: String::new(),
2099            review_comments: vec![],
2100            instructions: None,
2101        };
2102
2103        // Act: build prompt
2104        let prompt = TestProvider::build_pr_review_user_prompt(&pr, "", "");
2105
2106        // Assert: truncation annotation is present outside file_content tags
2107        assert!(
2108            prompt.contains("[APTU: file content truncated by size budget -- do not speculate on missing content]"),
2109            "truncation annotation must be present for truncated full_content"
2110        );
2111        // Verify annotation is outside the XML tags
2112        let file_content_end = prompt
2113            .find("</file_content>")
2114            .expect("file_content tags must exist");
2115        let annotation_pos = prompt
2116            .find("[APTU: file content truncated")
2117            .expect("annotation must exist");
2118        assert!(
2119            annotation_pos > file_content_end,
2120            "annotation must be outside </file_content> tags"
2121        );
2122    }
2123
2124    #[test]
2125    fn test_all_truncation_annotations_consistent_format() {
2126        use super::super::types::{IssueDetails, PrDetails, PrFile};
2127
2128        // Arrange: issue with truncated body
2129        let issue = IssueDetails::builder()
2130            .owner("test".to_string())
2131            .repo("repo".to_string())
2132            .number(1)
2133            .title("Test Issue".to_string())
2134            .body("x".repeat(40000)) // Will be truncated
2135            .labels(vec![])
2136            .url("https://github.com/test/repo/issues/1".to_string())
2137            .comments(vec![])
2138            .build();
2139
2140        // Act: build triage prompt
2141        let prompt = TestProvider::build_user_prompt(&issue);
2142
2143        // Assert: body truncation uses consistent format
2144        assert!(
2145            prompt.contains(
2146                "[APTU: body truncated by size budget -- do not speculate on missing content]"
2147            ),
2148            "body truncation must use [APTU: ...] format"
2149        );
2150
2151        // Arrange: PR with truncated description and patch
2152        let pr = PrDetails {
2153            owner: "test".to_string(),
2154            repo: "repo".to_string(),
2155            number: 1,
2156            title: "Test PR".to_string(),
2157            body: "x".repeat(40000), // Will be truncated
2158            head_branch: "feat".to_string(),
2159            base_branch: "main".to_string(),
2160            url: "https://github.com/test/repo/pull/1".to_string(),
2161            files: vec![
2162                PrFile {
2163                    filename: "file1.rs".to_string(),
2164                    status: "modified".to_string(),
2165                    additions: 10,
2166                    deletions: 5,
2167                    patch: Some("x".repeat(3000)), // Will be truncated
2168                    patch_truncated: false,
2169                    full_content: None,
2170                },
2171                PrFile {
2172                    filename: "file2.rs".to_string(),
2173                    status: "modified".to_string(),
2174                    additions: 10,
2175                    deletions: 5,
2176                    patch: Some("--- a/file\n+++ b/file\n@@ -1 @@\n+added".to_string()),
2177                    patch_truncated: true, // GitHub API truncated
2178                    full_content: None,
2179                },
2180            ],
2181            labels: vec![],
2182            head_sha: String::new(),
2183            review_comments: vec![],
2184            instructions: None,
2185        };
2186
2187        // Act: build review prompt
2188        let prompt = TestProvider::build_pr_review_user_prompt(&pr, "", "");
2189
2190        // Assert: all truncation annotations use consistent [APTU: ...] format
2191        assert!(
2192            prompt.contains("[APTU: description truncated by size budget -- do not speculate on missing content]"),
2193            "description truncation must use [APTU: ...] format"
2194        );
2195        assert!(
2196            prompt.contains(
2197                "[APTU: patch truncated by size budget -- do not speculate on missing content]"
2198            ),
2199            "patch budget truncation must use [APTU: ...] format"
2200        );
2201        assert!(
2202            prompt.contains(
2203                "[APTU: patch truncated by GitHub API -- do not speculate on missing content]"
2204            ),
2205            "GitHub API patch truncation must use [APTU: ...] format"
2206        );
2207    }
2208}
aptu_core/ai/provider.rs

aptu_core/ai/
provider.rs