use super::config::ContextConfig;
use super::partitions::ContextPartitions;
use super::pressure::PressureAction;
use super::summarizer::Summarizer;
use super::token_engine::ContextTokenEngine;
use crate::types::message::{Content, ContentPart, Message};
#[derive(Default)]
pub struct CompressResult {
pub tokens_saved: u32,
pub summary: Option<String>,
pub archived: Vec<Message>,
pub prefix_invalidated_at: Option<usize>,
}
pub trait Compressor: Send + Sync {
fn compress(
&self,
partitions: &mut ContextPartitions,
target_tokens: u32,
max_tokens: u32,
preserve_k: usize,
summarizer: &dyn Summarizer,
engine: &ContextTokenEngine,
) -> CompressResult;
}
pub struct SnipCompactor {
pub per_msg_ratio: f64,
}
impl Compressor for SnipCompactor {
fn compress(
&self,
partitions: &mut ContextPartitions,
_target_tokens: u32,
max_tokens: u32,
preserve_k: usize,
_summarizer: &dyn Summarizer,
engine: &ContextTokenEngine,
) -> CompressResult {
let per_msg_limit = ((max_tokens as f64 * self.per_msg_ratio) as u32).max(50);
let mut saved = 0u32;
let partition = &mut partitions.history;
let prefix_keep = prefix_keep_for(partition.messages.len(), preserve_k);
let indices =
oversized_text_message_indices(&partition.messages, per_msg_limit, prefix_keep, engine);
for &i in &indices {
let msg = &mut partition.messages[i];
let original_tokens = msg.token_count.unwrap_or_else(|| engine.count_message(msg));
if let Content::Text(ref t) = msg.content {
let head_limit = per_msg_limit / 2;
let tail_limit = per_msg_limit.saturating_sub(head_limit);
let head_text = engine.truncate(t, head_limit);
let chars: Vec<char> = t.chars().collect();
let mut low = head_text.chars().count();
let mut high = chars.len();
let mut suffix_start = chars.len();
while low <= high {
let mid = (low + high) / 2;
if mid >= chars.len() {
break;
}
let candidate: String = chars[mid..].iter().collect();
let tokens = engine.count(&candidate);
if tokens <= tail_limit {
suffix_start = mid;
if mid == 0 {
break;
}
high = mid - 1;
} else {
low = mid + 1;
}
}
let tail_text: String = chars[suffix_start..].iter().collect();
let omitted = original_tokens
.saturating_sub(head_limit)
.saturating_sub(tail_limit);
msg.content = Content::Text(format!(
"{}… [… {} tokens omitted …] …{}",
head_text, omitted, tail_text
));
msg.token_count = Some(per_msg_limit);
saved += original_tokens.saturating_sub(per_msg_limit);
}
}
partition.token_count = partition.token_count.saturating_sub(saved);
CompressResult {
tokens_saved: saved,
prefix_invalidated_at: indices.iter().min().copied(),
..Default::default()
}
}
}
fn prefix_keep_for(len: usize, preserve_k: usize) -> usize {
if len >= preserve_k.saturating_mul(3) {
preserve_k
} else {
0
}
}
fn oversized_text_message_indices(
messages: &[Message],
per_msg_limit: u32,
prefix_keep: usize,
engine: &ContextTokenEngine,
) -> Vec<usize> {
messages
.iter()
.enumerate()
.filter(|(i, msg)| {
if *i < prefix_keep {
return false;
}
if !matches!(msg.content, Content::Text(_)) {
return false;
}
let toks = msg.token_count.unwrap_or_else(|| engine.count_message(msg));
toks > per_msg_limit && toks > 10
})
.map(|(i, _)| i)
.collect()
}
fn utc_now() -> String {
format!("{:?}", std::time::SystemTime::now())
}
fn extract_json_excerpt(output: &str) -> Option<String> {
let val: serde_json::Value = serde_json::from_str(output).ok()?;
match val {
serde_json::Value::Object(map) => {
let mut summary_parts = Vec::new();
let mut keys = Vec::new();
for (k, v) in &map {
keys.push(k.as_str());
if v.is_number() || v.is_boolean() {
summary_parts.push(format!("{}: {}", k, v));
} else if let Some(s) = v.as_str() {
if s.len() <= 50 {
summary_parts.push(format!("{}: \"{}\"", k, s));
}
}
}
Some(format!(
"JSON Keys: [{}]\nJSON Fields: {{{}}}",
keys.join(", "),
summary_parts.join(", ")
))
}
serde_json::Value::Array(arr) => {
if arr.is_empty() {
return Some("JSON Array: []".to_string());
}
let mut headers = Vec::new();
if let Some(serde_json::Value::Object(first_map)) = arr.first() {
for k in first_map.keys() {
headers.push(k.as_str());
}
}
let len = arr.len();
Some(format!(
"JSON Array: {} items. Keys: [{}]",
len,
headers.join(", ")
))
}
_ => None,
}
}
fn excerpt_text(
text: &str,
head_tokens: u32,
tail_tokens: u32,
engine: &ContextTokenEngine,
) -> String {
let total_tokens = engine.count(text);
if total_tokens <= head_tokens + tail_tokens {
return text.to_string();
}
let head = engine.truncate(text, head_tokens);
let chars: Vec<char> = text.chars().collect();
let mut low = head.chars().count();
let mut high = chars.len();
let mut suffix_start = chars.len();
while low <= high {
let mid = (low + high) / 2;
if mid >= chars.len() {
break;
}
let candidate: String = chars[mid..].iter().collect();
let tokens = engine.count(&candidate);
if tokens <= tail_tokens {
suffix_start = mid;
if mid == 0 {
break;
}
high = mid - 1;
} else {
low = mid + 1;
}
}
let tail: String = chars[suffix_start..].iter().collect();
let remaining = total_tokens
.saturating_sub(head_tokens)
.saturating_sub(tail_tokens);
format!("{}… [… {} tokens omitted …] …{}", head, remaining, tail)
}
fn excerptable_tool_result_indices(
messages: &[Message],
preserved_refs: &[String],
prefix_keep: usize,
engine: &ContextTokenEngine,
) -> Vec<usize> {
messages
.iter()
.enumerate()
.filter_map(|(i, msg)| {
if i < prefix_keep {
return None;
}
let toks = msg.token_count.unwrap_or_else(|| engine.count_message(msg));
if toks < 200 {
return None;
}
let Content::Parts(parts) = &msg.content else {
return None;
};
let call_id = parts.iter().find_map(|p| match p {
ContentPart::ToolResult { call_id, .. } => Some(call_id.to_string()),
_ => None,
})?;
(!preserved_refs.contains(&call_id)).then_some(i)
})
.collect()
}
pub struct MicroCompactor;
impl Compressor for MicroCompactor {
fn compress(
&self,
partitions: &mut ContextPartitions,
_target_tokens: u32,
_max_tokens: u32,
preserve_k: usize,
_summarizer: &dyn Summarizer,
engine: &ContextTokenEngine,
) -> CompressResult {
let find_tool_name = |call_id: &str, msgs: &[Message]| -> Option<String> {
for m in msgs {
for tc in &m.tool_calls {
if tc.id == call_id {
return Some(tc.name.to_string());
}
}
}
None
};
let prefix_keep = prefix_keep_for(partitions.history.messages.len(), preserve_k);
let indices = excerptable_tool_result_indices(
&partitions.history.messages,
&partitions.task_state.preserved_refs,
prefix_keep,
engine,
);
let messages_clone = partitions.history.messages.clone();
let partition = &mut partitions.history;
let mut saved = 0u32;
for &i in &indices {
let msg = &mut partition.messages[i];
let original_tokens = msg.token_count.unwrap_or_else(|| engine.count_message(msg));
if let Content::Parts(ref mut parts) = msg.content {
let tool_result_index = parts
.iter()
.position(|p| matches!(p, ContentPart::ToolResult { .. }));
if let Some(idx) = tool_result_index {
if let ContentPart::ToolResult {
call_id,
output,
is_error: _,
} = &mut parts[idx]
{
let tool_name = find_tool_name(call_id, &messages_clone)
.unwrap_or_else(|| "unknown".to_string());
let new_output = if original_tokens > 2000 {
if let Some(json_excerpt) = extract_json_excerpt(output) {
format!(
"[tool result: {} | {} | {} tokens]\n{}",
call_id, tool_name, original_tokens, json_excerpt
)
} else {
let excerpt = excerpt_text(output, 30, 10, engine);
format!(
"[tool result: {} | {} | {} tokens]\n{}",
call_id, tool_name, original_tokens, excerpt
)
}
} else {
let excerpt = excerpt_text(output, 150, 50, engine);
format!(
"[tool result: {} | {} | {} tokens]\n{}",
call_id, tool_name, original_tokens, excerpt
)
};
let new_tokens = engine.count(&new_output);
msg.content = Content::Text(new_output);
msg.token_count = Some(new_tokens);
saved += original_tokens.saturating_sub(new_tokens);
}
}
}
}
partition.token_count = partition.token_count.saturating_sub(saved);
CompressResult {
tokens_saved: saved,
prefix_invalidated_at: indices.iter().min().copied(),
..Default::default()
}
}
}
pub fn plan_drop_oldest(
messages: &[Message],
total_tokens: u32,
target_tokens: u32,
keep: usize,
engine: &ContextTokenEngine,
) -> (usize, u32) {
let limit = messages.len().saturating_sub(keep);
let mut saved = 0u32;
let mut n = 0usize;
for (i, msg) in messages.iter().take(limit).enumerate() {
if total_tokens.saturating_sub(saved) <= target_tokens {
break;
}
saved += msg.token_count.unwrap_or_else(|| engine.count_message(msg));
n = i + 1;
}
(n, saved)
}
pub struct CollapseCompactor;
impl Compressor for CollapseCompactor {
fn compress(
&self,
partitions: &mut ContextPartitions,
target_tokens: u32,
_max_tokens: u32,
preserve_k: usize,
_summarizer: &dyn Summarizer,
engine: &ContextTokenEngine,
) -> CompressResult {
let partition = &mut partitions.history;
let keep = preserve_k * 2; let (n, saved) =
plan_drop_oldest(&partition.messages, partition.token_count, target_tokens, keep, engine);
if n == 0 {
return CompressResult::default();
}
let archived: Vec<Message> = partition.messages.drain(..n).collect();
partition.token_count = partition.token_count.saturating_sub(saved);
CompressResult {
tokens_saved: saved,
archived,
prefix_invalidated_at: Some(0),
..Default::default()
}
}
}
pub struct AutoCompactor;
impl Compressor for AutoCompactor {
fn compress(
&self,
partitions: &mut ContextPartitions,
_target_tokens: u32,
_max_tokens: u32,
preserve_k: usize,
_summarizer: &dyn Summarizer,
engine: &ContextTokenEngine,
) -> CompressResult {
let partition = &mut partitions.history;
if partition.messages.is_empty() {
return CompressResult::default();
}
let original_tokens = partition.token_count;
let keep = preserve_k * 2;
let limit = partition.messages.len().saturating_sub(keep);
let (archived, kept): (Vec<Message>, Vec<Message>) = if limit > 0 {
let archived_msgs = partition.messages.drain(..limit).collect();
let kept_msgs = partition.messages.drain(..).collect();
(archived_msgs, kept_msgs)
} else {
(vec![], partition.messages.drain(..).collect())
};
if archived.is_empty() {
partition.messages = kept;
return CompressResult::default();
}
partition.messages = kept;
let kept_tokens: u32 = partition
.messages
.iter()
.map(|m| m.token_count.unwrap_or_else(|| engine.count_message(m)))
.sum();
partition.token_count = kept_tokens;
CompressResult {
tokens_saved: original_tokens.saturating_sub(kept_tokens),
archived,
prefix_invalidated_at: Some(0),
..Default::default()
}
}
}
#[derive(Debug, Clone, PartialEq)]
pub enum CompactionStep {
Excerpt { msg_idx: Vec<usize> },
Snip { msg_idx: Vec<usize>, per_msg_limit: u32 },
DropOldest { count: usize },
}
impl CompactionStep {
pub fn invalidates_prefix_at(&self) -> Option<usize> {
match self {
CompactionStep::Excerpt { msg_idx } | CompactionStep::Snip { msg_idx, .. } => {
msg_idx.iter().min().copied()
}
CompactionStep::DropOldest { count } => (*count > 0).then_some(0),
}
}
}
pub fn plan_cache_cost(steps: &[CompactionStep]) -> Option<usize> {
steps.iter().filter_map(|s| s.invalidates_prefix_at()).min()
}
pub struct CompressionPipeline {
stages: Vec<(PressureAction, Box<dyn Compressor>)>,
preserve_recent_turns: usize,
}
impl CompressionPipeline {
pub fn new(config: &ContextConfig) -> Self {
Self {
preserve_recent_turns: config.preserve_recent_turns,
stages: vec![
(
PressureAction::SnipCompact,
Box::new(SnipCompactor {
per_msg_ratio: config.snip_per_msg_ratio,
}),
),
(PressureAction::MicroCompact, Box::new(MicroCompactor)),
(PressureAction::ContextCollapse, Box::new(CollapseCompactor)),
(PressureAction::AutoCompact, Box::new(AutoCompactor)),
],
}
}
pub fn compress(
&self,
partitions: &mut ContextPartitions,
action: PressureAction,
max_tokens: u32,
target_tokens: u32,
engine: &ContextTokenEngine,
) -> (u32, Option<String>, Vec<Message>, Option<usize>) {
if action == PressureAction::None {
return (0, None, vec![], None);
}
let mut total_saved = 0;
let mut all_archived = vec![];
let mut cache_at: Option<usize> = None;
let summarizer = super::summarizer::RuleSummarizer;
for (stage_action, compressor) in &self.stages {
if *stage_action <= action {
if partitions.total_tokens(engine) <= target_tokens {
break;
}
let res = compressor.compress(
partitions,
target_tokens,
max_tokens,
self.preserve_recent_turns,
&summarizer,
engine,
);
total_saved += res.tokens_saved;
cache_at = [cache_at, res.prefix_invalidated_at].into_iter().flatten().min();
all_archived.extend(res.archived);
}
}
let summary = if all_archived.is_empty() {
None
} else {
let s = summarizer.summarize(&all_archived, action, target_tokens);
partitions.task_state.log_compression(action.label(), s.clone());
Some(s)
};
(total_saved, summary, all_archived, cache_at)
}
}
#[cfg(test)]
mod tests {
use super::*;
use crate::context::config::ContextConfig;
use crate::context::partitions::ContextPartitions;
use crate::context::token_engine::ContextTokenEngine;
use crate::types::message::Message;
fn engine() -> ContextTokenEngine {
ContextTokenEngine::char_approx()
}
fn config() -> ContextConfig {
ContextConfig::default()
}
fn summarizer() -> super::super::summarizer::RuleSummarizer {
super::super::summarizer::RuleSummarizer
}
const MAX: u32 = 1_000;
#[test]
fn snip_compactor_truncates_oversized_messages() {
let cfg = ContextConfig {
snip_per_msg_ratio: 0.10,
..Default::default()
};
let compactor = SnipCompactor {
per_msg_ratio: cfg.snip_per_msg_ratio,
};
let mut ctx = ContextPartitions::new(&cfg);
ctx.history.push(Message::user("a".repeat(800)), 200);
let result = compactor.compress(&mut ctx, 0, MAX, 0, &summarizer(), &engine());
assert!(result.tokens_saved > 0);
if let Content::Text(ref t) = ctx.history.messages[0].content {
assert!(t.contains("… [… 100 tokens omitted …] …"), "got: {t}");
}
}
#[test]
fn snip_compactor_leaves_small_messages_untouched() {
let cfg = ContextConfig {
snip_per_msg_ratio: 0.10,
..Default::default()
};
let compactor = SnipCompactor {
per_msg_ratio: cfg.snip_per_msg_ratio,
};
let mut ctx = ContextPartitions::new(&cfg);
ctx.history.push(Message::user("short"), 5);
let result = compactor.compress(&mut ctx, 0, MAX, 2, &summarizer(), &engine());
assert_eq!(result.tokens_saved, 0);
}
#[test]
fn micro_compactor_replaces_tool_results_with_measured_placeholder() {
use crate::types::message::{ContentPart, Role};
use compact_str::CompactString;
let compactor = MicroCompactor;
let mut ctx = ContextPartitions::new(&config());
let parts = vec![ContentPart::ToolResult {
call_id: CompactString::new("c1"),
output: "a".repeat(1200),
is_error: false,
}];
let msg = Message {
role: Role::Tool,
content: Content::Parts(parts),
tool_calls: vec![],
token_count: Some(300),
};
ctx.history.messages.push(msg);
ctx.history.token_count = 300;
let result = compactor.compress(&mut ctx, 0, MAX, 0, &summarizer(), &engine());
assert!(result.tokens_saved > 0);
let text = ctx.history.messages[0].content.as_text().unwrap();
assert!(
text.contains("[tool result: c1 | unknown | 300 tokens]"),
"got: {text}"
);
}
#[test]
fn collapse_compactor_drops_oldest_to_reach_target() {
let compactor = CollapseCompactor;
let mut ctx = ContextPartitions::new(&config());
for _ in 0..8 {
ctx.history.push(Message::user("msg"), 50);
}
let result = compactor.compress(&mut ctx, 250, MAX, 2, &summarizer(), &engine());
assert!(result.tokens_saved > 0);
assert!(ctx.history.messages.len() < 8);
assert!(!result.archived.is_empty(), "drained messages are returned to the pipeline");
assert!(result.summary.is_none(), "compactor no longer self-summarizes");
assert!(ctx.task_state.compression_log.is_empty(), "compactor no longer logs");
}
#[test]
fn rule_summarizer_formats_correctly() {
use crate::context::summarizer::RuleSummarizer;
use crate::types::message::{Content, Message, Role};
let summarizer = RuleSummarizer;
let mut messages = vec![];
messages.push(Message {
role: Role::User,
content: Content::Text("hello".to_string()),
tool_calls: vec![],
token_count: Some(5),
});
messages.push(Message {
role: Role::Assistant,
content: Content::Text("world".to_string()),
tool_calls: vec![],
token_count: Some(6),
});
let summary = summarizer.summarize(&messages, PressureAction::SnipCompact, 100);
assert!(summary.contains("[Compressed: snip_compact]"));
assert!(summary.contains("2 messages / 11 tokens archived"));
assert!(summary.contains("last assistant output: world"));
}
#[test]
fn micro_compactor_preserves_refs_in_preserved_refs() {
use crate::types::message::{ContentPart, Role};
use compact_str::CompactString;
let compactor = MicroCompactor;
let mut ctx = ContextPartitions::new(&config());
ctx.task_state.preserved_refs = vec!["keep_me".to_string()];
let parts = vec![ContentPart::ToolResult {
call_id: CompactString::new("keep_me"),
output: "a".repeat(1200),
is_error: false,
}];
let msg = Message {
role: Role::Tool,
content: Content::Parts(parts),
tool_calls: vec![],
token_count: Some(300),
};
ctx.history.messages.push(msg);
ctx.history.token_count = 300;
let result = compactor.compress(&mut ctx, 0, MAX, 2, &summarizer(), &engine());
assert_eq!(result.tokens_saved, 0);
let text_opt = ctx.history.messages[0].content.as_text();
assert!(
text_opt.is_none(),
"should not be replaced to text placeholder"
);
}
#[test]
fn auto_compactor_merges_all_except_last_two_turns() {
let compactor = AutoCompactor;
let mut ctx = ContextPartitions::new(&config());
for i in 0..10 {
ctx.history.push(Message::user(format!("msg {i}")), 10);
}
let result = compactor.compress(&mut ctx, 0, MAX, 2, &summarizer(), &engine());
assert!(result.tokens_saved > 0);
assert_eq!(ctx.history.messages.len(), 4); assert!(!result.archived.is_empty(), "drained messages returned to the pipeline");
assert!(result.summary.is_none(), "compactor no longer self-summarizes");
assert!(ctx.task_state.compression_log.is_empty(), "compactor no longer logs");
}
#[test]
fn plan_drop_oldest_respects_target_and_preserve_floor() {
let msgs: Vec<Message> = (0..8)
.map(|i| {
let mut m = Message::user(format!("m{i}"));
m.token_count = Some(50);
m
})
.collect();
assert_eq!(plan_drop_oldest(&msgs, 400, 250, 2, &engine()), (3, 150));
assert_eq!(plan_drop_oldest(&msgs, 400, 0, 2, &engine()), (6, 300));
assert_eq!(plan_drop_oldest(&msgs, 400, 500, 2, &engine()), (0, 0));
}
#[test]
fn prefix_keep_yields_without_drop_fallback() {
assert_eq!(prefix_keep_for(6, 2), 2, "len 6 >= 6 → protect oldest 2");
assert_eq!(prefix_keep_for(5, 2), 0, "len 5 < 6 → would leave an untouchable message");
assert_eq!(prefix_keep_for(3, 2), 0);
assert_eq!(prefix_keep_for(0, 2), 0);
}
#[test]
fn compaction_step_prefix_cost() {
assert_eq!(CompactionStep::Excerpt { msg_idx: vec![5, 8] }.invalidates_prefix_at(), Some(5));
assert_eq!(
CompactionStep::Snip { msg_idx: vec![3, 9], per_msg_limit: 50 }.invalidates_prefix_at(),
Some(3)
);
assert_eq!(CompactionStep::DropOldest { count: 4 }.invalidates_prefix_at(), Some(0));
assert_eq!(CompactionStep::DropOldest { count: 0 }.invalidates_prefix_at(), None);
assert_eq!(CompactionStep::Excerpt { msg_idx: vec![] }.invalidates_prefix_at(), None);
}
#[test]
fn plan_cache_cost_is_the_earliest_break() {
let late = vec![
CompactionStep::Excerpt { msg_idx: vec![6] },
CompactionStep::Snip { msg_idx: vec![7], per_msg_limit: 50 },
];
assert_eq!(plan_cache_cost(&late), Some(6));
let mut with_drop = late.clone();
with_drop.push(CompactionStep::DropOldest { count: 3 });
assert_eq!(plan_cache_cost(&with_drop), Some(0));
assert_eq!(plan_cache_cost(&[]), None);
}
#[test]
fn pipeline_reports_accurate_prefix_invalidation() {
let cfg = config();
let mut ctx = baseline_partitions();
let (_s, _u, _a, cache_at) = CompressionPipeline::new(&cfg).compress(
&mut ctx,
PressureAction::SnipCompact,
MAX,
500,
&engine(),
);
assert_eq!(cache_at, Some(3), "snip protected the oldest 2 → earliest touch is msg 3");
let mut ctx2 = baseline_partitions();
let (_s2, _u2, _a2, cache_at2) = CompressionPipeline::new(&cfg).compress(
&mut ctx2,
PressureAction::AutoCompact,
MAX,
500,
&engine(),
);
assert_eq!(cache_at2, Some(0), "dropping the oldest breaks the cache prefix at 0");
}
use crate::types::message::Role;
use compact_str::CompactString;
fn baseline_partitions() -> ContextPartitions {
let cfg = config();
let mut ctx = ContextPartitions::new(&cfg);
ctx.history.push(Message::user("u0 ".repeat(120)), 300);
ctx.history.push(Message::assistant("a0 ".repeat(120)), 300);
ctx.history.messages.push(Message {
role: Role::Tool,
content: Content::Parts(vec![ContentPart::ToolResult {
call_id: CompactString::new("call_1"),
output: serde_json::json!({"rows": 42, "ok": true, "name": "alpha"}).to_string()
+ &"-pad".repeat(400),
is_error: false,
}]),
tool_calls: vec![],
token_count: Some(400),
});
ctx.history.token_count += 400;
ctx.history.push(Message::user("u1 ".repeat(120)), 300);
ctx.history.push(Message::assistant("a1 ".repeat(120)), 300);
ctx.history.messages.push(Message {
role: Role::Tool,
content: Content::Parts(vec![ContentPart::ToolResult {
call_id: CompactString::new("call_2"),
output: "y".repeat(1600),
is_error: false,
}]),
tool_calls: vec![],
token_count: Some(400),
});
ctx.history.token_count += 400;
ctx
}
fn run_baseline(action: PressureAction) -> (u32, u32, Option<String>, usize, usize, u32) {
let mut ctx = baseline_partitions();
let before = ctx.total_tokens(&engine());
let (saved, summary, archived, _cache_at) =
CompressionPipeline::new(&config()).compress(&mut ctx, action, MAX, 500, &engine());
let archived_len = archived.len();
let msgs_after = ctx.history.messages.len();
let total_after = ctx.total_tokens(&engine());
(before, saved, summary, archived_len, msgs_after, total_after)
}
#[test]
fn baseline_snip_only_caps_text_no_archival() {
let (before, saved, summary, archived, msgs, total) = run_baseline(PressureAction::SnipCompact);
assert_eq!(before, 2001);
assert_eq!(saved, 500, "2 non-prefix oversized turns × 250 (oldest 2 protected; was 1000)");
assert_eq!(archived, 0);
assert!(summary.is_none());
assert_eq!(msgs, 6, "snip mutates in place, drops no messages");
assert_eq!(total, 1501);
}
#[test]
fn baseline_micro_excerpts_tool_results() {
let (before, saved, summary, archived, msgs, total) = run_baseline(PressureAction::MicroCompact);
assert_eq!(before, 2001);
assert_eq!(saved, 862, "snip(500, prefix-protected) + excerpt(362); was 1362");
assert_eq!(archived, 0);
assert!(summary.is_none());
assert_eq!(msgs, 6);
assert_eq!(total, 1139);
}
#[test]
fn baseline_collapse_drops_oldest_and_summarizes() {
let (before, saved, summary, archived, msgs, total) =
run_baseline(PressureAction::ContextCollapse);
assert_eq!(before, 2001);
assert_eq!(saved, 1462);
assert_eq!(archived, 2, "drops the 2 oldest messages above the preserve floor");
assert_eq!(msgs, 4, "preserve_recent_turns=2 → 4 messages kept");
assert_eq!(total, 539);
let summary = summary.expect("collapse summarizes archived messages");
assert!(
summary.contains("[Compressed: context_collapse]"),
"summary routes the collapse action: {summary}"
);
}
#[test]
fn baseline_auto_attributes_summary_to_auto_compact() {
let (before, saved, summary, archived, msgs, total) = run_baseline(PressureAction::AutoCompact);
assert_eq!(before, 2001);
assert_eq!(saved, 1462);
assert_eq!(archived, 2);
assert_eq!(msgs, 4);
assert_eq!(total, 539);
let summary = summary.expect("auto-compact summarizes the archived messages");
assert!(summary.contains("[Compressed: auto_compact]"), "got: {summary}");
}
#[test]
fn baseline_saved_is_monotonic_in_action_level() {
let snip = run_baseline(PressureAction::SnipCompact).1;
let micro = run_baseline(PressureAction::MicroCompact).1;
let collapse = run_baseline(PressureAction::ContextCollapse).1;
let auto = run_baseline(PressureAction::AutoCompact).1;
assert!(snip <= micro, "{snip} <= {micro}");
assert!(micro <= collapse, "{micro} <= {collapse}");
assert!(collapse <= auto, "{collapse} <= {auto}");
}
#[test]
fn pipeline_stops_cascade_when_target_reached() {
let cfg = ContextConfig {
snip_per_msg_ratio: 0.25,
preserve_recent_turns: 0,
..Default::default()
};
let pipeline = CompressionPipeline::new(&cfg);
let mut ctx = ContextPartitions::new(&cfg);
ctx.history.push(Message::user("a".repeat(3600)), 900);
let (saved, summary, archived, _cache_at) = pipeline.compress(
&mut ctx,
PressureAction::AutoCompact,
1_000,
500,
&engine(),
);
assert!(saved > 0);
assert!(summary.is_none(), "auto compactor should not run after snip reaches target");
assert!(archived.is_empty(), "heavier archival stages should not run");
assert_eq!(ctx.history.messages.len(), 1);
assert!(ctx.total_tokens(&engine()) <= 500);
}
}