Skip to main content

sol_parser_sdk/grpc/
instruction_parser.rs

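//! Instruction parser with full support for outer instructions and inner instructions.
//!
//! Design principles:
//! - Simplicity: a single entry function and a clear parsing flow
//! - High performance: zero-copy, inlining optimisation, parallel processing
//! - Readability: every step carries an explicit comment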
7
8use crate::core::{
9    events::*, merger::merge_events, pumpfun_fee_enrich::enrich_pumpfun_same_tx_post_merge,
10};
11use crate::grpc::types::EventTypeFilter;
12use crate::instr::read_pubkey_fast;
13use solana_sdk::pubkey::Pubkey;
14use solana_sdk::signature::Signature;
15use std::collections::HashMap;
16use yellowstone_grpc_proto::prelude::{Transaction, TransactionStatusMeta};
17
18/// 解析交易中的所有指令事件(instruction + inner instruction)
19///
20/// # 解析流程
21/// 1. 解析主指令(outer instructions)- 8字节 discriminator
22/// 2. 解析内部指令(inner instructions)- 16字节 discriminator
23/// 3. 合并相关事件(instruction + inner instruction)
24/// 4. 填充账户上下文
25///
26/// # 性能优化
27/// - 零分配泄漏:`program_invokes` 全程 `Pubkey` 键,与账户填充 / `fill_data` 共用同一表
28/// - 零拷贝读取指令账户字节、`read_pubkey_fast` 解码
29/// - 热路径 `#[inline]`
30/// - `should_parse_instructions` 提前跳过整段 ix 解析
31#[inline]
32pub fn parse_instructions_enhanced(
33    meta: &TransactionStatusMeta,
34    transaction: &Option<Transaction>,
35    sig: Signature,
36    slot: u64,
37    tx_idx: u64,
38    block_us: Option<i64>,
39    grpc_us: i64,
40    filter: Option<&EventTypeFilter>,
41) -> Vec<DexEvent> {
42    let Some(tx) = transaction else { return Vec::new() };
43    let Some(msg) = &tx.message else { return Vec::new() };
44
45    let recent_blockhash = if msg.recent_blockhash.is_empty() {
46        None
47    } else {
48        Some(bs58::encode(&msg.recent_blockhash).into_string())
49    };
50
51    // 提前检查:是否需要解析 instruction(根据 filter)
52    if !should_parse_instructions(filter) {
53        return Vec::new();
54    }
55
56    // 与 log 解析一致:同笔交易内若有 PumpFun create,则本 tx 的 buy 事件标记为 is_created_buy(创建者首次买入)
57    let is_created_buy = crate::logs::optimized_matcher::detect_pumpfun_create(&meta.log_messages);
58
59    // 构建账户查找表
60    let keys_len = msg.account_keys.len();
61    let writable_len = meta.loaded_writable_addresses.len();
62    let get_key = |i: usize| -> Option<&Vec<u8>> {
63        if i < keys_len {
64            msg.account_keys.get(i)
65        } else if i < keys_len + writable_len {
66            meta.loaded_writable_addresses.get(i - keys_len)
67        } else {
68            meta.loaded_readonly_addresses.get(i - keys_len - writable_len)
69        }
70    };
71
72    let mut result = Vec::with_capacity(8);
73    let mut invokes: HashMap<Pubkey, Vec<(i32, i32)>> = HashMap::with_capacity(8);
74
75    // 步骤 1: 解析所有主指令
76    for (i, ix) in msg.instructions.iter().enumerate() {
77        let pid = get_key(ix.program_id_index as usize)
78            .map_or(Pubkey::default(), |k| read_pubkey_fast(k));
79
80        invokes.entry(pid).or_default().push((i as i32, -1));
81
82        // 解析主指令(8字节 discriminator)
83        if let Some(event) = parse_outer_instruction(
84            &ix.data,
85            &pid,
86            sig,
87            slot,
88            tx_idx,
89            block_us,
90            grpc_us,
91            &ix.accounts,
92            &get_key,
93            filter,
94            is_created_buy,
95        ) {
96            result.push((i, None, event)); // (outer_idx, inner_idx, event)
97        }
98    }
99
100    // 步骤 2: 解析所有 inner instructions
101    for inner in &meta.inner_instructions {
102        let outer_idx = inner.index as usize;
103
104        for (j, inner_ix) in inner.instructions.iter().enumerate() {
105            let pid = get_key(inner_ix.program_id_index as usize)
106                .map_or(Pubkey::default(), |k| read_pubkey_fast(k));
107
108            invokes.entry(pid).or_default().push((outer_idx as i32, j as i32));
109
110            // 解析 inner instruction(16字节 discriminator)
111            if let Some(event) = parse_inner_instruction(
112                &inner_ix.data,
113                &pid,
114                sig,
115                slot,
116                tx_idx,
117                block_us,
118                grpc_us,
119                filter,
120                is_created_buy,
121            ) {
122                result.push((outer_idx, Some(j), event)); // (outer_idx, Some(inner_idx), event)
123            }
124        }
125    }
126
127    // 步骤 3: 合并相关事件(instruction + inner instruction)
128    let mut merged = merge_instruction_events(result);
129    enrich_pumpfun_same_tx_post_merge(&mut merged);
130
131    for e in merged.iter_mut() {
132        if let Some(m) = e.metadata_mut() {
133            m.recent_blockhash = recent_blockhash.clone();
134        }
135    }
136
137    // 步骤 4: 填充账户上下文(invokes 与 fill_data 均使用 Pubkey 键,无堆泄漏)
138    let mut final_result = Vec::with_capacity(merged.len());
139    for mut event in merged {
140        crate::core::account_dispatcher::fill_accounts_with_owned_keys(
141            &mut event,
142            meta,
143            transaction,
144            &invokes,
145        );
146        crate::core::common_filler::fill_data(&mut event, meta, transaction, &invokes);
147        final_result.push(event);
148    }
149
150    final_result
151}
152
153// ============================================================================
154// 辅助函数
155// ============================================================================
156
157/// 解析单个主指令(outer instruction)
158///
159/// 主指令使用 8 字节 discriminator
160#[inline(always)]
161fn parse_outer_instruction<'a>(
162    data: &[u8],
163    program_id: &Pubkey,
164    sig: Signature,
165    slot: u64,
166    tx_idx: u64,
167    block_us: Option<i64>,
168    grpc_us: i64,
169    account_indices: &[u8],
170    get_key: &dyn Fn(usize) -> Option<&'a Vec<u8>>,
171    filter: Option<&EventTypeFilter>,
172    _is_created_buy: bool,
173) -> Option<DexEvent> {
174    // 检查指令数据长度(至少8字节 discriminator)
175    if data.len() < 8 {
176        return None;
177    }
178
179    // 常见 DEX 指令账户数远小于 64;栈上缓冲避免每笔 outer 一次 Vec 分配
180    const STACK_CAP: usize = 64;
181    if account_indices.len() <= STACK_CAP {
182        let mut stack = [Pubkey::default(); STACK_CAP];
183        let mut n = 0usize;
184        for &idx in account_indices {
185            if let Some(k) = get_key(idx as usize) {
186                stack[n] = read_pubkey_fast(k);
187                n += 1;
188            }
189        }
190        crate::instr::parse_instruction_unified(
191            data,
192            &stack[..n],
193            sig,
194            slot,
195            tx_idx,
196            block_us,
197            grpc_us,
198            filter,
199            program_id,
200        )
201    } else {
202        let accounts: Vec<Pubkey> = account_indices
203            .iter()
204            .filter_map(|&idx| get_key(idx as usize).map(|k| read_pubkey_fast(k)))
205            .collect();
206        crate::instr::parse_instruction_unified(
207            data, &accounts, sig, slot, tx_idx, block_us, grpc_us, filter, program_id,
208        )
209    }
210}
211
212/// 解析单个 inner instruction
213///
214/// Inner instructions 使用 16 字节 discriminator(前8字节是event hash,后8字节是magic)
215#[inline(always)]
216fn parse_inner_instruction(
217    data: &[u8],
218    program_id: &Pubkey,
219    sig: Signature,
220    slot: u64,
221    tx_idx: u64,
222    block_us: Option<i64>,
223    grpc_us: i64,
224    filter: Option<&EventTypeFilter>,
225    is_created_buy: bool,
226) -> Option<DexEvent> {
227    // 检查数据长度(至少16字节 discriminator)
228    if data.len() < 16 {
229        return None;
230    }
231
232    let metadata = EventMetadata {
233        signature: sig,
234        slot,
235        tx_index: tx_idx,
236        block_time_us: block_us.unwrap_or(0),
237        grpc_recv_us: grpc_us,
238        recent_blockhash: None, // set later on merged events in parse_instructions_enhanced
239    };
240
241    // 提取 16 字节 discriminator
242    let mut discriminator = [0u8; 16];
243    discriminator.copy_from_slice(&data[..16]);
244    let inner_data = &data[16..];
245
246    use crate::instr::{all_inner, program_ids, pump_amm_inner, pump_inner, raydium_clmm_inner};
247
248    // 根据 program_id 路由到对应的 inner instruction 解析器
249    if *program_id == program_ids::PUMPFUN_PROGRAM_ID {
250        if let Some(f) = filter {
251            if !f.includes_pumpfun() {
252                return None;
253            }
254        }
255        pump_inner::parse_pumpfun_inner_instruction(
256            &discriminator,
257            inner_data,
258            metadata,
259            is_created_buy,
260        )
261    } else if *program_id == program_ids::PUMPSWAP_PROGRAM_ID {
262        if let Some(f) = filter {
263            if !f.includes_pumpswap() {
264                return None;
265            }
266        }
267        pump_amm_inner::parse_pumpswap_inner_instruction(&discriminator, inner_data, metadata)
268    } else if *program_id == program_ids::RAYDIUM_CLMM_PROGRAM_ID {
269        raydium_clmm_inner::parse_raydium_clmm_inner_instruction(
270            &discriminator,
271            inner_data,
272            metadata,
273        )
274    } else if *program_id == program_ids::RAYDIUM_CPMM_PROGRAM_ID {
275        all_inner::raydium_cpmm::parse(&discriminator, inner_data, metadata)
276    } else if *program_id == program_ids::RAYDIUM_AMM_V4_PROGRAM_ID {
277        all_inner::raydium_amm::parse(&discriminator, inner_data, metadata)
278    } else if *program_id == program_ids::ORCA_WHIRLPOOL_PROGRAM_ID {
279        all_inner::orca::parse(&discriminator, inner_data, metadata)
280    } else if *program_id == program_ids::METEORA_POOLS_PROGRAM_ID {
281        all_inner::meteora_amm::parse(&discriminator, inner_data, metadata)
282    } else if *program_id == program_ids::METEORA_DAMM_V2_PROGRAM_ID {
283        if let Some(f) = filter {
284            if !f.includes_meteora_damm_v2() {
285                return None;
286            }
287        }
288        all_inner::meteora_damm::parse(&discriminator, inner_data, metadata)
289    } else if *program_id == program_ids::BONK_PROGRAM_ID {
290        all_inner::bonk::parse(&discriminator, inner_data, metadata)
291    } else {
292        None
293    }
294}
295
296/// 合并相关的 instruction 和 inner instruction 事件
297///
298/// 合并策略:
299/// 1. 同一个 outer_idx 的 instruction 和 inner instruction 可以合并
300/// 2. Inner instruction 在 outer instruction 之后出现(排序保证主指令在前)
301/// 3. 同一 outer 下若有多个 inner,依次链式合并进同一条事件,再输出
302/// 4. 合并后返回更完整的事件
303#[inline(always)]
304fn merge_instruction_events(events: Vec<(usize, Option<usize>, DexEvent)>) -> Vec<DexEvent> {
305    if events.is_empty() {
306        return Vec::new();
307    }
308
309    // 按 (outer_idx, inner_idx) 排序,确保顺序:同一 outer 下 **主指令在前、inner 在后**
310    // (`None` 若用 MAX 会把 outer 排到 inner 后面,导致无法 merge)
311    let mut events = events;
312    events.sort_by_key(|(outer, inner, _)| (*outer, inner.map_or(0, |i| i + 1)));
313
314    let mut result = Vec::with_capacity(events.len());
315    let mut pending_outer: Option<(usize, DexEvent)> = None;
316
317    for (outer_idx, inner_idx, event) in events {
318        match inner_idx {
319            None => {
320                // 这是一个 outer instruction
321                // 先处理之前的 pending_outer
322                if let Some((_, outer_event)) = pending_outer.take() {
323                    result.push(outer_event);
324                }
325                // 保存当前的 outer instruction,等待可能的 inner instruction
326                pending_outer = Some((outer_idx, event));
327            }
328            Some(_) => {
329                // 这是一个 inner instruction
330                if let Some((pending_outer_idx, mut outer_event)) = pending_outer.take() {
331                    if pending_outer_idx == outer_idx {
332                        // 合并进当前 outer(可多次:多段 inner 链式叠在同一条事件上)
333                        merge_events(&mut outer_event, event);
334                        pending_outer = Some((outer_idx, outer_event));
335                    } else {
336                        // 不匹配,分别保留
337                        result.push(outer_event);
338                        result.push(event);
339                    }
340                } else {
341                    // 没有 pending outer,直接添加 inner event
342                    result.push(event);
343                }
344            }
345        }
346    }
347
348    // 处理最后一个 pending_outer
349    if let Some((_, outer_event)) = pending_outer {
350        result.push(outer_event);
351    }
352
353    result
354}
355
356/// 检查是否需要解析 instructions(根据 filter)
357#[inline(always)]
358fn should_parse_instructions(filter: Option<&EventTypeFilter>) -> bool {
359    // 如果没有 filter,总是解析
360    let Some(filter) = filter else { return true };
361
362    // 如果 filter.include_only 为空,总是解析
363    let Some(ref include_only) = filter.include_only else { return true };
364
365    // PumpFun:外层 BUY/SELL 在 `instr/pump.rs` 不解析,但每笔买 inner 里仍有 Trade CPI;
366    // 仅走 `log_messages` 时,若 RPC 截断日志会 **丢多笔 Trade**。
367    // 打开 instruction+inner 解析,与日志在 `dedupe_log_instruction_events` 中按序去重合并。
368    if filter.includes_pumpfun() {
369        return true;
370    }
371
372    if filter.includes_pump_fees() {
373        return true;
374    }
375
376    // 其它协议:按需解析
377    include_only.iter().any(|t| {
378        use crate::grpc::types::EventType::*;
379        matches!(
380            t,
381            PumpFunMigrate
382                | MeteoraDammV2Swap
383                | MeteoraDammV2AddLiquidity
384                | MeteoraDammV2CreatePosition
385                | MeteoraDammV2ClosePosition
386                | MeteoraDammV2RemoveLiquidity
387        )
388    })
389}
390
#[cfg(test)]
mod tests {
    use super::*;

    /// Builds the fixed metadata shared by the merge tests.
    fn sample_metadata() -> EventMetadata {
        use solana_sdk::signature::Signature;

        EventMetadata {
            signature: Signature::default(),
            slot: 100,
            tx_index: 1,
            block_time_us: 1000,
            grpc_recv_us: 2000,
            recent_blockhash: None,
        }
    }

    /// Asserts that `events` holds exactly one event and that it is a PumpFun trade.
    fn expect_single_trade(events: &[DexEvent]) -> &PumpFunTradeEvent {
        assert_eq!(events.len(), 1);
        match &events[0] {
            DexEvent::PumpFunTrade(trade) => trade,
            _ => panic!("Expected PumpFunTrade event"),
        }
    }

    #[test]
    fn test_should_parse_instructions() {
        use crate::grpc::types::EventType;

        // No filter: parse.
        assert!(should_parse_instructions(None));

        // Filter without an include list: parse.
        let no_include = EventTypeFilter { include_only: None, exclude_types: None };
        assert!(should_parse_instructions(Some(&no_include)));

        // Include list naming an event type that needs instruction parsing.
        let migrate_only = EventTypeFilter {
            include_only: Some(vec![EventType::PumpFunMigrate]),
            exclude_types: None,
        };
        assert!(should_parse_instructions(Some(&migrate_only)));

        // PumpFun subscription: instruction + inner parsing is required so that
        // trades are not lost when only (possibly truncated) logs are available.
        let trade_only = EventTypeFilter {
            include_only: Some(vec![EventType::PumpFunTrade]),
            exclude_types: None,
        };
        assert!(should_parse_instructions(Some(&trade_only)));
    }

    #[test]
    fn test_merge_instruction_events() {
        // Scenario: one outer event plus one inner event on the same outer index.
        let from_outer = DexEvent::PumpFunTrade(PumpFunTradeEvent {
            metadata: sample_metadata(),
            bonding_curve: Pubkey::new_unique(),
            ..Default::default()
        });
        let from_inner = DexEvent::PumpFunTrade(PumpFunTradeEvent {
            metadata: sample_metadata(),
            sol_amount: 1000,
            token_amount: 2000,
            ..Default::default()
        });

        let merged = merge_instruction_events(vec![
            (0, None, from_outer),    // outer instruction at index 0
            (0, Some(0), from_inner), // first inner instruction of outer 0
        ]);

        // Both inputs collapse into a single event carrying data from each side.
        let trade = expect_single_trade(&merged);
        assert_eq!(trade.sol_amount, 1000); // from the inner event
        assert_eq!(trade.token_amount, 2000); // from the inner event
        assert_ne!(trade.bonding_curve, Pubkey::default()); // from the outer event
    }

    #[test]
    fn test_merge_instruction_events_chains_multiple_inners_same_outer() {
        let bc = Pubkey::new_unique();
        let fee = Pubkey::new_unique();

        let from_outer = DexEvent::PumpFunTrade(PumpFunTradeEvent {
            metadata: sample_metadata(),
            bonding_curve: bc,
            ..Default::default()
        });
        let inner_trade = DexEvent::PumpFunTrade(PumpFunTradeEvent {
            metadata: sample_metadata(),
            sol_amount: 1000,
            token_amount: 2000,
            is_buy: true,
            ..Default::default()
        });
        // The second inner event only carries `fee_recipient` and no amounts;
        // merging it must not wipe the amounts set by the first inner event.
        let inner_fee_only = DexEvent::PumpFunTrade(PumpFunTradeEvent {
            metadata: sample_metadata(),
            fee_recipient: fee,
            ..Default::default()
        });

        let merged = merge_instruction_events(vec![
            (0, None, from_outer),
            (0, Some(0), inner_trade),
            (0, Some(1), inner_fee_only),
        ]);

        let trade = expect_single_trade(&merged);
        assert_eq!(trade.bonding_curve, bc);
        assert_eq!(trade.sol_amount, 1000);
        assert_eq!(trade.token_amount, 2000);
        assert_eq!(trade.fee_recipient, fee);
    }
}