Skip to main content

sol_parser_sdk/grpc/
instruction_parser.rs

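//! Instruction parser - full support for outer instructions and inner instructions.
//!
//! Design principles:
//! - Simplicity: a single entry point with a clear, step-by-step parsing flow.
//! - Performance: hot-path helpers are inlined and account keys for outer instructions are
//!   decoded into a stack buffer where possible. Note that this file itself contains no
//!   parallel code; any parallelism is the caller's responsibility.
//! - Readability: every step carries an explicit comment.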
7
8use crate::core::{
9    events::*, merger::merge_events, pumpfun_fee_enrich::enrich_pumpfun_same_tx_post_merge,
10};
11use crate::grpc::types::EventTypeFilter;
12use crate::instr::read_pubkey_fast;
13use solana_sdk::pubkey::Pubkey;
14use solana_sdk::signature::Signature;
15use std::collections::HashMap;
16use yellowstone_grpc_proto::prelude::{Transaction, TransactionStatusMeta};
17
18/// 解析交易中的所有指令事件(instruction + inner instruction)
19///
20/// # 解析流程
21/// 1. 解析主指令(outer instructions)- 8字节 discriminator
22/// 2. 解析内部指令(inner instructions)- 16字节 discriminator
23/// 3. 合并相关事件(instruction + inner instruction)
24/// 4. 填充账户上下文
25///
26/// # 性能优化
27/// - 零分配泄漏:`program_invokes` 全程 `Pubkey` 键,与账户填充 / `fill_data` 共用同一表
28/// - 零拷贝读取指令账户字节、`read_pubkey_fast` 解码
29/// - 热路径 `#[inline]`
30/// - `should_parse_instructions` 提前跳过整段 ix 解析
31#[inline]
32pub fn parse_instructions_enhanced(
33    meta: &TransactionStatusMeta,
34    transaction: &Option<Transaction>,
35    sig: Signature,
36    slot: u64,
37    tx_idx: u64,
38    block_us: Option<i64>,
39    grpc_us: i64,
40    filter: Option<&EventTypeFilter>,
41) -> Vec<DexEvent> {
42    let Some(tx) = transaction else { return Vec::new() };
43    let Some(msg) = &tx.message else { return Vec::new() };
44
45    let recent_blockhash = if msg.recent_blockhash.is_empty() {
46        None
47    } else {
48        Some(bs58::encode(&msg.recent_blockhash).into_string())
49    };
50
51    // 提前检查:是否需要解析 instruction(根据 filter)
52    if !should_parse_instructions(filter) {
53        return Vec::new();
54    }
55
56    // 与 log 解析一致:同笔交易内若有 PumpFun create,则本 tx 的 buy 事件标记为 is_created_buy(创建者首次买入)
57    let is_created_buy = crate::logs::optimized_matcher::detect_pumpfun_create(&meta.log_messages);
58
59    // 构建账户查找表
60    let keys_len = msg.account_keys.len();
61    let writable_len = meta.loaded_writable_addresses.len();
62    let get_key = |i: usize| -> Option<&Vec<u8>> {
63        if i < keys_len {
64            msg.account_keys.get(i)
65        } else if i < keys_len + writable_len {
66            meta.loaded_writable_addresses.get(i - keys_len)
67        } else {
68            meta.loaded_readonly_addresses.get(i - keys_len - writable_len)
69        }
70    };
71
72    let mut result = Vec::with_capacity(8);
73    let mut invokes: HashMap<Pubkey, Vec<(i32, i32)>> = HashMap::with_capacity(8);
74
75    // 步骤 1: 解析所有主指令
76    for (i, ix) in msg.instructions.iter().enumerate() {
77        let pid = get_key(ix.program_id_index as usize)
78            .map_or(Pubkey::default(), |k| read_pubkey_fast(k));
79
80        invokes.entry(pid).or_default().push((i as i32, -1));
81
82        // 解析主指令(8字节 discriminator)
83        if let Some(event) = parse_outer_instruction(
84            &ix.data,
85            &pid,
86            sig,
87            slot,
88            tx_idx,
89            block_us,
90            grpc_us,
91            &ix.accounts,
92            &get_key,
93            filter,
94            is_created_buy,
95        ) {
96            result.push((i, None, event)); // (outer_idx, inner_idx, event)
97        }
98    }
99
100    // 步骤 2: 解析所有 inner instructions
101    for inner in &meta.inner_instructions {
102        let outer_idx = inner.index as usize;
103
104        for (j, inner_ix) in inner.instructions.iter().enumerate() {
105            let pid = get_key(inner_ix.program_id_index as usize)
106                .map_or(Pubkey::default(), |k| read_pubkey_fast(k));
107
108            invokes.entry(pid).or_default().push((outer_idx as i32, j as i32));
109
110            // 解析 inner instruction(16字节 discriminator)
111            if let Some(event) = parse_inner_instruction(
112                &inner_ix.data,
113                &pid,
114                sig,
115                slot,
116                tx_idx,
117                block_us,
118                grpc_us,
119                filter,
120                is_created_buy,
121            ) {
122                result.push((outer_idx, Some(j), event)); // (outer_idx, Some(inner_idx), event)
123            }
124        }
125    }
126
127    // 步骤 3: 合并相关事件(instruction + inner instruction)
128    let mut merged = merge_instruction_events(result);
129    enrich_pumpfun_same_tx_post_merge(&mut merged);
130
131    for e in merged.iter_mut() {
132        if let Some(m) = e.metadata_mut() {
133            m.recent_blockhash = recent_blockhash.clone();
134        }
135    }
136
137    // 步骤 4: 填充账户上下文(invokes 与 fill_data 均使用 Pubkey 键,无堆泄漏)
138    let mut final_result = Vec::with_capacity(merged.len());
139    for mut event in merged {
140        crate::core::account_dispatcher::fill_accounts_with_owned_keys(
141            &mut event,
142            meta,
143            transaction,
144            &invokes,
145        );
146        crate::core::common_filler::fill_data(&mut event, meta, transaction, &invokes);
147        final_result.push(event);
148    }
149
150    final_result
151}
152
153// ============================================================================
154// 辅助函数
155// ============================================================================
156
157/// 解析单个主指令(outer instruction)
158///
159/// 主指令使用 8 字节 discriminator
160#[inline(always)]
161fn parse_outer_instruction<'a>(
162    data: &[u8],
163    program_id: &Pubkey,
164    sig: Signature,
165    slot: u64,
166    tx_idx: u64,
167    block_us: Option<i64>,
168    grpc_us: i64,
169    account_indices: &[u8],
170    get_key: &dyn Fn(usize) -> Option<&'a Vec<u8>>,
171    filter: Option<&EventTypeFilter>,
172    _is_created_buy: bool,
173) -> Option<DexEvent> {
174    // 检查指令数据长度(至少8字节 discriminator)
175    if data.len() < 8 {
176        return None;
177    }
178
179    // 常见 DEX 指令账户数远小于 64;栈上缓冲避免每笔 outer 一次 Vec 分配
180    const STACK_CAP: usize = 64;
181    if account_indices.len() <= STACK_CAP {
182        let mut stack = [Pubkey::default(); STACK_CAP];
183        let mut n = 0usize;
184        for &idx in account_indices {
185            let k = get_key(idx as usize)?;
186            stack[n] = read_pubkey_fast(k);
187            n += 1;
188        }
189        crate::instr::parse_instruction_unified(
190            data,
191            &stack[..n],
192            sig,
193            slot,
194            tx_idx,
195            block_us,
196            grpc_us,
197            filter,
198            program_id,
199        )
200    } else {
201        let accounts: Vec<Pubkey> = account_indices
202            .iter()
203            .map(|&idx| get_key(idx as usize).map(|k| read_pubkey_fast(k)))
204            .collect::<Option<_>>()?;
205        crate::instr::parse_instruction_unified(
206            data, &accounts, sig, slot, tx_idx, block_us, grpc_us, filter, program_id,
207        )
208    }
209}
210
211/// 解析单个 inner instruction
212///
213/// Inner instructions 使用 16 字节 discriminator(前8字节是event hash,后8字节是magic)
214#[inline(always)]
215fn parse_inner_instruction(
216    data: &[u8],
217    program_id: &Pubkey,
218    sig: Signature,
219    slot: u64,
220    tx_idx: u64,
221    block_us: Option<i64>,
222    grpc_us: i64,
223    filter: Option<&EventTypeFilter>,
224    is_created_buy: bool,
225) -> Option<DexEvent> {
226    // 检查数据长度(至少16字节 discriminator)
227    if data.len() < 16 {
228        return None;
229    }
230
231    let metadata = EventMetadata {
232        signature: sig,
233        slot,
234        tx_index: tx_idx,
235        block_time_us: block_us.unwrap_or(0),
236        grpc_recv_us: grpc_us,
237        recent_blockhash: None, // set later on merged events in parse_instructions_enhanced
238    };
239
240    // 提取 16 字节 discriminator
241    let mut discriminator = [0u8; 16];
242    discriminator.copy_from_slice(&data[..16]);
243    let inner_data = &data[16..];
244
245    use crate::instr::{all_inner, program_ids, pump_amm_inner, pump_inner, raydium_clmm_inner};
246
247    // 根据 program_id 路由到对应的 inner instruction 解析器
248    if *program_id == program_ids::PUMPFUN_PROGRAM_ID {
249        if let Some(f) = filter {
250            if !f.includes_pumpfun() {
251                return None;
252            }
253        }
254        pump_inner::parse_pumpfun_inner_instruction(
255            &discriminator,
256            inner_data,
257            metadata,
258            is_created_buy,
259        )
260    } else if *program_id == program_ids::PUMPSWAP_PROGRAM_ID {
261        if let Some(f) = filter {
262            if !f.includes_pumpswap() {
263                return None;
264            }
265        }
266        pump_amm_inner::parse_pumpswap_inner_instruction(&discriminator, inner_data, metadata)
267    } else if *program_id == program_ids::RAYDIUM_CLMM_PROGRAM_ID {
268        raydium_clmm_inner::parse_raydium_clmm_inner_instruction(
269            &discriminator,
270            inner_data,
271            metadata,
272        )
273    } else if *program_id == program_ids::RAYDIUM_CPMM_PROGRAM_ID {
274        all_inner::raydium_cpmm::parse(&discriminator, inner_data, metadata)
275    } else if *program_id == program_ids::RAYDIUM_AMM_V4_PROGRAM_ID {
276        all_inner::raydium_amm::parse(&discriminator, inner_data, metadata)
277    } else if *program_id == program_ids::ORCA_WHIRLPOOL_PROGRAM_ID {
278        all_inner::orca::parse(&discriminator, inner_data, metadata)
279    } else if *program_id == program_ids::METEORA_POOLS_PROGRAM_ID {
280        all_inner::meteora_amm::parse(&discriminator, inner_data, metadata)
281    } else if *program_id == program_ids::METEORA_DAMM_V2_PROGRAM_ID {
282        if let Some(f) = filter {
283            if !f.includes_meteora_damm_v2() {
284                return None;
285            }
286        }
287        all_inner::meteora_damm::parse(&discriminator, inner_data, metadata)
288    } else if *program_id == program_ids::BONK_PROGRAM_ID {
289        all_inner::bonk::parse(&discriminator, inner_data, metadata)
290    } else {
291        None
292    }
293}
294
295/// 合并相关的 instruction 和 inner instruction 事件
296///
297/// 合并策略:
298/// 1. 同一个 outer_idx 的 instruction 和 inner instruction 可以合并
299/// 2. Inner instruction 在 outer instruction 之后出现(排序保证主指令在前)
300/// 3. 同一 outer 下若有多个 inner,依次链式合并进同一条事件,再输出
301/// 4. 合并后返回更完整的事件
302#[inline(always)]
303fn merge_instruction_events(events: Vec<(usize, Option<usize>, DexEvent)>) -> Vec<DexEvent> {
304    if events.is_empty() {
305        return Vec::new();
306    }
307
308    // 按 (outer_idx, inner_idx) 排序,确保顺序:同一 outer 下 **主指令在前、inner 在后**
309    // (`None` 若用 MAX 会把 outer 排到 inner 后面,导致无法 merge)
310    let mut events = events;
311    events.sort_by_key(|(outer, inner, _)| (*outer, inner.map_or(0, |i| i + 1)));
312
313    let mut result = Vec::with_capacity(events.len());
314    let mut pending_outer: Option<(usize, DexEvent)> = None;
315
316    for (outer_idx, inner_idx, event) in events {
317        match inner_idx {
318            None => {
319                // 这是一个 outer instruction
320                // 先处理之前的 pending_outer
321                if let Some((_, outer_event)) = pending_outer.take() {
322                    result.push(outer_event);
323                }
324                // 保存当前的 outer instruction,等待可能的 inner instruction
325                pending_outer = Some((outer_idx, event));
326            }
327            Some(_) => {
328                // 这是一个 inner instruction
329                if let Some((pending_outer_idx, mut outer_event)) = pending_outer.take() {
330                    if pending_outer_idx == outer_idx {
331                        // 合并进当前 outer(可多次:多段 inner 链式叠在同一条事件上)
332                        merge_events(&mut outer_event, event);
333                        pending_outer = Some((outer_idx, outer_event));
334                    } else {
335                        // 不匹配,分别保留
336                        result.push(outer_event);
337                        result.push(event);
338                    }
339                } else {
340                    // 没有 pending outer,直接添加 inner event
341                    result.push(event);
342                }
343            }
344        }
345    }
346
347    // 处理最后一个 pending_outer
348    if let Some((_, outer_event)) = pending_outer {
349        result.push(outer_event);
350    }
351
352    result
353}
354
355/// 检查是否需要解析 instructions(根据 filter)
356#[inline(always)]
357fn should_parse_instructions(filter: Option<&EventTypeFilter>) -> bool {
358    // 如果没有 filter,总是解析
359    let Some(filter) = filter else { return true };
360
361    // 如果 filter.include_only 为空,总是解析
362    let Some(ref include_only) = filter.include_only else { return true };
363
364    // PumpFun:外层 BUY/SELL 在 `instr/pump.rs` 不解析,但每笔买 inner 里仍有 Trade CPI;
365    // 仅走 `log_messages` 时,若 RPC 截断日志会 **丢多笔 Trade**。
366    // 打开 instruction+inner 解析,与日志在 `dedupe_log_instruction_events` 中按序去重合并。
367    if filter.includes_pumpfun() {
368        return true;
369    }
370
371    if filter.includes_pump_fees() {
372        return true;
373    }
374
375    // 其它协议:按需解析
376    include_only.iter().any(|t| {
377        use crate::grpc::types::EventType::*;
378        matches!(
379            t,
380            PumpFunMigrate
381                | MeteoraDammV2Swap
382                | MeteoraDammV2AddLiquidity
383                | MeteoraDammV2CreatePosition
384                | MeteoraDammV2ClosePosition
385                | MeteoraDammV2RemoveLiquidity
386        )
387    })
388}
389
#[cfg(test)]
mod tests {
    use super::*;

    /// Fixed metadata shared by the merge tests.
    fn sample_metadata() -> EventMetadata {
        use solana_sdk::signature::Signature;

        EventMetadata {
            signature: Signature::default(),
            slot: 100,
            tx_index: 1,
            block_time_us: 1000,
            grpc_recv_us: 2000,
            recent_blockhash: None,
        }
    }

    #[test]
    fn test_should_parse_instructions() {
        use crate::grpc::types::EventType;

        // No filter at all: always parse.
        assert!(should_parse_instructions(None));

        // Filter present but without an allow-list: always parse.
        let no_allow_list = EventTypeFilter { include_only: None, exclude_types: None };
        assert!(should_parse_instructions(Some(&no_allow_list)));

        // Allow-list naming an event type that needs instruction parsing.
        let migrate_only = EventTypeFilter {
            include_only: Some(vec![EventType::PumpFunMigrate]),
            exclude_types: None,
        };
        assert!(should_parse_instructions(Some(&migrate_only)));

        // PumpFun subscription: instruction + inner parsing is required so that trades are not
        // lost when only truncated logs are available.
        let trade_only = EventTypeFilter {
            include_only: Some(vec![EventType::PumpFunTrade]),
            exclude_types: None,
        };
        assert!(should_parse_instructions(Some(&trade_only)));
    }

    #[test]
    fn test_merge_instruction_events() {
        // One outer instruction plus one inner instruction: they must merge.
        let outer_event = DexEvent::PumpFunTrade(PumpFunTradeEvent {
            metadata: sample_metadata(),
            bonding_curve: Pubkey::new_unique(),
            ..Default::default()
        });
        let inner_event = DexEvent::PumpFunTrade(PumpFunTradeEvent {
            metadata: sample_metadata(),
            sol_amount: 1000,
            token_amount: 2000,
            ..Default::default()
        });

        let merged = merge_instruction_events(vec![
            (0, None, outer_event),    // outer instruction at index 0
            (0, Some(0), inner_event), // its first inner instruction
        ]);

        // Exactly one event comes out.
        assert_eq!(merged.len(), 1);

        // The merged event carries data from both sides.
        let DexEvent::PumpFunTrade(trade) = &merged[0] else {
            panic!("Expected PumpFunTrade event");
        };
        assert_eq!(trade.sol_amount, 1000); // from the inner event
        assert_eq!(trade.token_amount, 2000); // from the inner event
        assert_ne!(trade.bonding_curve, Pubkey::default()); // from the outer event
    }

    #[test]
    fn test_merge_instruction_events_chains_multiple_inners_same_outer() {
        let bc = Pubkey::new_unique();
        let fee = Pubkey::new_unique();

        let outer_event = DexEvent::PumpFunTrade(PumpFunTradeEvent {
            metadata: sample_metadata(),
            bonding_curve: bc,
            ..Default::default()
        });
        let inner_trade = DexEvent::PumpFunTrade(PumpFunTradeEvent {
            metadata: sample_metadata(),
            sol_amount: 1000,
            token_amount: 2000,
            is_buy: true,
            ..Default::default()
        });
        // The second inner event only carries `fee_recipient` and no amounts; merging it must
        // not wipe out the amounts contributed by the first inner event.
        let inner_fee_only = DexEvent::PumpFunTrade(PumpFunTradeEvent {
            metadata: sample_metadata(),
            fee_recipient: fee,
            ..Default::default()
        });

        let merged = merge_instruction_events(vec![
            (0, None, outer_event),
            (0, Some(0), inner_trade),
            (0, Some(1), inner_fee_only),
        ]);

        assert_eq!(merged.len(), 1);
        let DexEvent::PumpFunTrade(trade) = &merged[0] else {
            panic!("Expected PumpFunTrade event");
        };
        assert_eq!(trade.bonding_curve, bc);
        assert_eq!(trade.sol_amount, 1000);
        assert_eq!(trade.token_amount, 2000);
        assert_eq!(trade.fee_recipient, fee);
    }
}