1use core::fmt::Display;
2
3use alloc::string::ToString;
4use alloc::vec::Vec;
5
6use crate::{Allocator, AtomicOp, Bitwise, Comparison, Operator};
7
8use super::{
9    Arithmetic, Branch, CoopMma, ElemType, Instruction, Metadata, Operation, UIntKind, Variable,
10    VariableKind,
11};
12
/// A pass that rewrites a [`ScopeProcessing`].
///
/// Implementors must also implement [`core::fmt::Debug`].
pub trait Processor: core::fmt::Debug {
    /// Consumes `processing` and returns the [`ScopeProcessing`] produced by this pass.
    ///
    /// NOTE(review): `allocator` is presumably provided so the pass can create new
    /// variables — confirm against the implementors.
    fn transform(&self, processing: ScopeProcessing, allocator: Allocator) -> ScopeProcessing;
}
16
/// The variables and instructions of a scope, as consumed and produced by
/// [`Processor::transform`].
pub struct ScopeProcessing {
    /// Variables carried alongside the instructions.
    ///
    /// NOTE(review): presumably the variable declarations of the scope — confirm.
    pub variables: Vec<Variable>,
    /// Instructions of the scope, in order. [`ScopeProcessing::optimize`] rewrites
    /// their constant scalar operands in place.
    pub instructions: Vec<Instruction>,
}
24
25impl Display for ScopeProcessing {
26    fn fmt(&self, f: &mut core::fmt::Formatter<'_>) -> core::fmt::Result {
27        writeln!(f, "{{")?;
28        for instruction in self.instructions.iter() {
29            let instruction_str = instruction.to_string();
30            if !instruction_str.is_empty() {
31                writeln!(f, "    {instruction_str}")?;
32            }
33        }
34        write!(f, "}}")?;
35        Ok(())
36    }
37}
38
39impl ScopeProcessing {
40    pub fn optimize(self) -> Self {
48        self.sanitize_constant_scalars()
49    }
50
51    fn sanitize_constant_scalars(mut self) -> Self {
54        self.instructions
55            .iter_mut()
56            .for_each(|inst| match &mut inst.operation {
57                Operation::Copy(op) => {
58                    sanitize_constant_scalar_ref_var(op, &inst.out.unwrap());
59                }
60                Operation::Arithmetic(op) => match op {
61                    Arithmetic::Add(op) => {
62                        sanitize_constant_scalar_ref_var(&mut op.lhs, &inst.out.unwrap());
63                        sanitize_constant_scalar_ref_var(&mut op.rhs, &inst.out.unwrap());
64                    }
65                    Arithmetic::SaturatingAdd(op) => {
66                        sanitize_constant_scalar_ref_var(&mut op.lhs, &inst.out.unwrap());
67                        sanitize_constant_scalar_ref_var(&mut op.rhs, &inst.out.unwrap());
68                    }
69                    Arithmetic::Fma(op) => {
70                        sanitize_constant_scalar_ref_var(&mut op.a, &inst.out.unwrap());
71                        sanitize_constant_scalar_ref_var(&mut op.b, &inst.out.unwrap());
72                        sanitize_constant_scalar_ref_var(&mut op.c, &inst.out.unwrap());
73                    }
74                    Arithmetic::Sub(op) => {
75                        sanitize_constant_scalar_ref_var(&mut op.lhs, &inst.out.unwrap());
76                        sanitize_constant_scalar_ref_var(&mut op.rhs, &inst.out.unwrap());
77                    }
78                    Arithmetic::SaturatingSub(op) => {
79                        sanitize_constant_scalar_ref_var(&mut op.lhs, &inst.out.unwrap());
80                        sanitize_constant_scalar_ref_var(&mut op.rhs, &inst.out.unwrap());
81                    }
82                    Arithmetic::Mul(op) => {
83                        sanitize_constant_scalar_ref_var(&mut op.lhs, &inst.out.unwrap());
84                        sanitize_constant_scalar_ref_var(&mut op.rhs, &inst.out.unwrap());
85                    }
86                    Arithmetic::Div(op) => {
87                        sanitize_constant_scalar_ref_var(&mut op.lhs, &inst.out.unwrap());
88                        sanitize_constant_scalar_ref_var(&mut op.rhs, &inst.out.unwrap());
89                    }
90                    Arithmetic::MulHi(op) => {
91                        sanitize_constant_scalar_ref_var(&mut op.lhs, &inst.out.unwrap());
92                        sanitize_constant_scalar_ref_var(&mut op.rhs, &inst.out.unwrap());
93                    }
94                    Arithmetic::Abs(op) => {
95                        sanitize_constant_scalar_ref_var(&mut op.input, &inst.out.unwrap());
96                    }
97                    Arithmetic::Exp(op) => {
98                        sanitize_constant_scalar_ref_var(&mut op.input, &inst.out.unwrap());
99                    }
100                    Arithmetic::Log(op) => {
101                        sanitize_constant_scalar_ref_var(&mut op.input, &inst.out.unwrap());
102                    }
103                    Arithmetic::Log1p(op) => {
104                        sanitize_constant_scalar_ref_var(&mut op.input, &inst.out.unwrap());
105                    }
106                    Arithmetic::Cos(op) => {
107                        sanitize_constant_scalar_ref_var(&mut op.input, &inst.out.unwrap());
108                    }
109                    Arithmetic::Sin(op) => {
110                        sanitize_constant_scalar_ref_var(&mut op.input, &inst.out.unwrap());
111                    }
112                    Arithmetic::Tanh(op) => {
113                        sanitize_constant_scalar_ref_var(&mut op.input, &inst.out.unwrap());
114                    }
115                    Arithmetic::Powf(op) => {
116                        sanitize_constant_scalar_ref_var(&mut op.lhs, &inst.out.unwrap());
117                        sanitize_constant_scalar_ref_var(&mut op.rhs, &inst.out.unwrap());
118                    }
119                    Arithmetic::Powi(op) => {
120                        sanitize_constant_scalar_ref_var(&mut op.lhs, &inst.out.unwrap());
121                    }
122                    Arithmetic::Sqrt(op) => {
123                        sanitize_constant_scalar_ref_var(&mut op.input, &inst.out.unwrap());
124                    }
125                    Arithmetic::Round(op) => {
126                        sanitize_constant_scalar_ref_var(&mut op.input, &inst.out.unwrap());
127                    }
128                    Arithmetic::Floor(op) => {
129                        sanitize_constant_scalar_ref_var(&mut op.input, &inst.out.unwrap());
130                    }
131                    Arithmetic::Ceil(op) => {
132                        sanitize_constant_scalar_ref_var(&mut op.input, &inst.out.unwrap());
133                    }
134                    Arithmetic::Trunc(op) => {
135                        sanitize_constant_scalar_ref_var(&mut op.input, &inst.out.unwrap());
136                    }
137                    Arithmetic::Erf(op) => {
138                        sanitize_constant_scalar_ref_var(&mut op.input, &inst.out.unwrap());
139                    }
140                    Arithmetic::Recip(op) => {
141                        sanitize_constant_scalar_ref_var(&mut op.input, &inst.out.unwrap());
142                    }
143                    Arithmetic::Clamp(op) => {
144                        sanitize_constant_scalar_ref_var(&mut op.input, &inst.out.unwrap());
145                        sanitize_constant_scalar_ref_var(&mut op.min_value, &inst.out.unwrap());
146                        sanitize_constant_scalar_ref_var(&mut op.max_value, &inst.out.unwrap());
147                    }
148                    Arithmetic::Modulo(op) => {
149                        sanitize_constant_scalar_ref_var(&mut op.lhs, &inst.out.unwrap());
150                        sanitize_constant_scalar_ref_var(&mut op.rhs, &inst.out.unwrap());
151                    }
152                    Arithmetic::Neg(op) => {
153                        sanitize_constant_scalar_ref_var(&mut op.input, &inst.out.unwrap())
154                    }
155                    Arithmetic::Max(op) => {
156                        sanitize_constant_scalar_ref_var(&mut op.lhs, &inst.out.unwrap());
157                        sanitize_constant_scalar_ref_var(&mut op.rhs, &inst.out.unwrap());
158                    }
159                    Arithmetic::Min(op) => {
160                        sanitize_constant_scalar_ref_var(&mut op.lhs, &inst.out.unwrap());
161                        sanitize_constant_scalar_ref_var(&mut op.rhs, &inst.out.unwrap());
162                    }
163                    Arithmetic::Remainder(op) => {
164                        sanitize_constant_scalar_ref_var(&mut op.lhs, &inst.out.unwrap());
165                        sanitize_constant_scalar_ref_var(&mut op.rhs, &inst.out.unwrap());
166                    }
167                    Arithmetic::Magnitude(op) => {
168                        sanitize_constant_scalar_ref_var(&mut op.input, &inst.out.unwrap());
169                    }
170                    Arithmetic::Normalize(op) => {
171                        sanitize_constant_scalar_ref_var(&mut op.input, &inst.out.unwrap());
172                    }
173                    Arithmetic::Dot(op) => {
174                        sanitize_constant_scalar_ref_var(&mut op.lhs, &inst.out.unwrap());
175                        sanitize_constant_scalar_ref_var(&mut op.rhs, &inst.out.unwrap());
176                    }
177                },
178                Operation::Comparison(op) => match op {
179                    Comparison::Greater(op) => {
180                        sanitize_constant_scalar_ref_var(&mut op.lhs, &op.rhs);
181                        sanitize_constant_scalar_ref_var(&mut op.rhs, &op.lhs);
182                    }
183                    Comparison::LowerEqual(op) => {
184                        sanitize_constant_scalar_ref_var(&mut op.lhs, &op.rhs);
185                        sanitize_constant_scalar_ref_var(&mut op.rhs, &op.lhs);
186                    }
187                    Comparison::GreaterEqual(op) => {
188                        sanitize_constant_scalar_ref_var(&mut op.lhs, &op.rhs);
189                        sanitize_constant_scalar_ref_var(&mut op.rhs, &op.lhs);
190                    }
191                    Comparison::Equal(op) => {
192                        sanitize_constant_scalar_ref_var(&mut op.lhs, &op.rhs);
193                        sanitize_constant_scalar_ref_var(&mut op.rhs, &op.lhs);
194                    }
195                    Comparison::NotEqual(op) => {
196                        sanitize_constant_scalar_ref_var(&mut op.lhs, &op.rhs);
197                        sanitize_constant_scalar_ref_var(&mut op.rhs, &op.lhs);
198                    }
199                    Comparison::Lower(op) => {
200                        sanitize_constant_scalar_ref_var(&mut op.lhs, &op.rhs);
201                        sanitize_constant_scalar_ref_var(&mut op.rhs, &op.lhs);
202                    }
203                    Comparison::IsNan(_op) | Comparison::IsInf(_op) => {
204                        }
206                },
207                Operation::Bitwise(op) => match op {
208                    Bitwise::BitwiseAnd(op) => {
209                        sanitize_constant_scalar_ref_var(&mut op.lhs, &inst.out.unwrap());
210                        sanitize_constant_scalar_ref_var(&mut op.rhs, &inst.out.unwrap());
211                    }
212                    Bitwise::BitwiseOr(op) => {
213                        sanitize_constant_scalar_ref_var(&mut op.lhs, &inst.out.unwrap());
214                        sanitize_constant_scalar_ref_var(&mut op.rhs, &inst.out.unwrap());
215                    }
216                    Bitwise::BitwiseXor(op) => {
217                        sanitize_constant_scalar_ref_var(&mut op.lhs, &inst.out.unwrap());
218                        sanitize_constant_scalar_ref_var(&mut op.rhs, &inst.out.unwrap());
219                    }
220                    Bitwise::CountOnes(_) | Bitwise::LeadingZeros(_) | Bitwise::FindFirstSet(_) => {
221                        }
223                    Bitwise::ReverseBits(op) => {
224                        sanitize_constant_scalar_ref_var(&mut op.input, &inst.out.unwrap());
225                    }
226                    Bitwise::ShiftLeft(op) => {
227                        sanitize_constant_scalar_ref_var(&mut op.lhs, &inst.out.unwrap());
228                        sanitize_constant_scalar_ref_var(&mut op.rhs, &inst.out.unwrap());
229                    }
230                    Bitwise::ShiftRight(op) => {
231                        sanitize_constant_scalar_ref_var(&mut op.lhs, &inst.out.unwrap());
232                        sanitize_constant_scalar_ref_var(&mut op.rhs, &inst.out.unwrap());
233                    }
234                    Bitwise::BitwiseNot(op) => {
235                        sanitize_constant_scalar_ref_var(&mut op.input, &inst.out.unwrap());
236                    }
237                },
238                Operation::Operator(op) => match op {
239                    Operator::Index(op) => {
240                        sanitize_constant_scalar_ref_var(&mut op.list, &inst.out.unwrap());
241                        sanitize_constant_scalar_ref_elem(
242                            &mut op.index,
243                            ElemType::UInt(UIntKind::U32),
244                        );
245                    }
246                    Operator::UncheckedIndex(op) => {
247                        sanitize_constant_scalar_ref_var(&mut op.list, &inst.out.unwrap());
248                        sanitize_constant_scalar_ref_elem(
249                            &mut op.index,
250                            ElemType::UInt(UIntKind::U32),
251                        );
252                    }
253                    Operator::IndexAssign(op) => {
254                        sanitize_constant_scalar_ref_elem(
255                            &mut op.index,
256                            ElemType::UInt(UIntKind::U32),
257                        );
258                        sanitize_constant_scalar_ref_var(&mut op.value, &inst.out.unwrap());
259                    }
260                    Operator::UncheckedIndexAssign(op) => {
261                        sanitize_constant_scalar_ref_elem(
262                            &mut op.index,
263                            ElemType::UInt(UIntKind::U32),
264                        );
265                        sanitize_constant_scalar_ref_var(&mut op.value, &inst.out.unwrap());
266                    }
267                    Operator::And(op) => {
268                        sanitize_constant_scalar_ref_var(&mut op.lhs, &op.rhs);
269                        sanitize_constant_scalar_ref_var(&mut op.rhs, &op.lhs);
270                    }
271                    Operator::Or(op) => {
272                        sanitize_constant_scalar_ref_var(&mut op.lhs, &op.rhs);
273                        sanitize_constant_scalar_ref_var(&mut op.rhs, &op.lhs);
274                    }
275                    Operator::Not(op) => {
276                        sanitize_constant_scalar_ref_elem(&mut op.input, ElemType::Bool);
277                    }
278                    Operator::InitLine(_) => {
279                        }
281                    Operator::CopyMemory(op) => {
282                        sanitize_constant_scalar_ref_var(&mut op.input, &inst.out.unwrap());
283                        sanitize_constant_scalar_ref_elem(
284                            &mut op.in_index,
285                            ElemType::UInt(UIntKind::U32),
286                        );
287                        sanitize_constant_scalar_ref_elem(
288                            &mut op.out_index,
289                            ElemType::UInt(UIntKind::U32),
290                        );
291                    }
292                    Operator::CopyMemoryBulk(op) => {
293                        sanitize_constant_scalar_ref_var(&mut op.input, &inst.out.unwrap());
294                        sanitize_constant_scalar_ref_elem(
295                            &mut op.in_index,
296                            ElemType::UInt(UIntKind::U32),
297                        );
298                        sanitize_constant_scalar_ref_elem(
299                            &mut op.out_index,
300                            ElemType::UInt(UIntKind::U32),
301                        );
302                    }
303                    Operator::Select(op) => {
304                        sanitize_constant_scalar_ref_elem(&mut op.cond, ElemType::Bool);
305                        sanitize_constant_scalar_ref_var(&mut op.then, &inst.out.unwrap());
306                        sanitize_constant_scalar_ref_var(&mut op.or_else, &inst.out.unwrap());
307                    }
308                    Operator::Cast(_) => {}
309                    Operator::Reinterpret(_) => {}
310                },
311                Operation::Atomic(op) => match op {
312                    AtomicOp::Load(_) => {}
313                    AtomicOp::Store(_) => {}
314                    AtomicOp::Swap(op) => {
315                        sanitize_constant_scalar_ref_var(&mut op.rhs, &inst.out.unwrap());
316                    }
317                    AtomicOp::CompareAndSwap(op) => {
318                        sanitize_constant_scalar_ref_var(&mut op.cmp, &inst.out.unwrap());
319                        sanitize_constant_scalar_ref_var(&mut op.val, &inst.out.unwrap());
320                    }
321                    AtomicOp::Add(op) => {
322                        sanitize_constant_scalar_ref_var(&mut op.rhs, &inst.out.unwrap());
323                    }
324                    AtomicOp::Sub(op) => {
325                        sanitize_constant_scalar_ref_var(&mut op.rhs, &inst.out.unwrap());
326                    }
327                    AtomicOp::Max(op) => {
328                        sanitize_constant_scalar_ref_var(&mut op.rhs, &inst.out.unwrap());
329                    }
330                    AtomicOp::Min(op) => {
331                        sanitize_constant_scalar_ref_var(&mut op.rhs, &inst.out.unwrap());
332                    }
333                    AtomicOp::And(op) => {
334                        sanitize_constant_scalar_ref_var(&mut op.rhs, &inst.out.unwrap());
335                    }
336                    AtomicOp::Or(op) => {
337                        sanitize_constant_scalar_ref_var(&mut op.rhs, &inst.out.unwrap());
338                    }
339                    AtomicOp::Xor(op) => {
340                        sanitize_constant_scalar_ref_var(&mut op.rhs, &inst.out.unwrap());
341                    }
342                },
343                Operation::Metadata(op) => match op {
344                    Metadata::Stride { dim, .. } => {
345                        sanitize_constant_scalar_ref_elem(dim, ElemType::UInt(UIntKind::U32));
346                    }
347                    Metadata::Shape { dim, .. } => {
348                        sanitize_constant_scalar_ref_elem(dim, ElemType::UInt(UIntKind::U32));
349                    }
350                    Metadata::Length { .. }
351                    | Metadata::BufferLength { .. }
352                    | Metadata::Rank { .. } => {
353                        }
355                },
356                Operation::Branch(op) => match op {
357                    Branch::If(op) => {
358                        sanitize_constant_scalar_ref_elem(&mut op.cond, ElemType::Bool);
359                    }
360                    Branch::IfElse(op) => {
361                        sanitize_constant_scalar_ref_elem(&mut op.cond, ElemType::Bool);
362                    }
363                    Branch::RangeLoop(op) => {
364                        sanitize_constant_scalar_ref_var(&mut op.end, &op.start);
365                        sanitize_constant_scalar_ref_var(&mut op.i, &op.start);
366                        if let Some(step) = &mut op.step {
367                            sanitize_constant_scalar_ref_elem(step, ElemType::UInt(UIntKind::U32));
368                        }
369                    }
370                    _ => {
371                        }
373                },
374                Operation::Synchronization(_) => {
375                    }
377                Operation::Plane(_) => {
378                    }
380                Operation::CoopMma(op) => match op {
381                    CoopMma::Fill { value } => {
382                        sanitize_constant_scalar_ref_var(value, &inst.out.unwrap());
383                    }
384                    CoopMma::Load { value, stride, .. } => {
385                        sanitize_constant_scalar_ref_var(value, &inst.out.unwrap());
386                        sanitize_constant_scalar_ref_elem(stride, ElemType::UInt(UIntKind::U32));
387                    }
388                    CoopMma::Execute { .. }
389                    | CoopMma::ExecuteManual { .. }
390                    | CoopMma::ExecuteScaled { .. } => {
391                        }
393                    CoopMma::Store { stride, .. } => {
394                        sanitize_constant_scalar_ref_elem(stride, ElemType::UInt(UIntKind::U32));
395                    }
396                    CoopMma::Cast { .. } => {
397                        }
399                    CoopMma::RowIndex { lane_id, i, .. } => {
400                        sanitize_constant_scalar_ref_elem(lane_id, ElemType::UInt(UIntKind::U32));
401                        sanitize_constant_scalar_ref_elem(i, ElemType::UInt(UIntKind::U32));
402                    }
403                    CoopMma::ColIndex { lane_id, i, .. } => {
404                        sanitize_constant_scalar_ref_elem(lane_id, ElemType::UInt(UIntKind::U32));
405                        sanitize_constant_scalar_ref_elem(i, ElemType::UInt(UIntKind::U32));
406                    }
407                },
408                Operation::NonSemantic(_) => {
409                    }
411                Operation::Barrier(_) => {
412                    }
414                Operation::Tma(_) => {
415                    }
417                Operation::Free(_) => {
418                    }
420            });
421        self
422    }
423}
424
425fn sanitize_constant_scalar_ref_var(var: &mut Variable, reference: &Variable) {
426    let elem = reference.ty.elem_type();
427    sanitize_constant_scalar_ref_elem(var, elem);
428}
429
430fn sanitize_constant_scalar_ref_elem(var: &mut Variable, elem: ElemType) {
431    if let VariableKind::ConstantScalar(scalar) = var.kind
432        && scalar.elem_type() != elem
433    {
434        *var = match scalar {
435            super::ConstantScalarValue::Int(val, _) => elem.constant_from_i64(val),
436            super::ConstantScalarValue::Float(val, _) => elem.constant_from_f64(val),
437            super::ConstantScalarValue::UInt(val, _) => elem.constant_from_u64(val),
438            super::ConstantScalarValue::Bool(val) => elem.constant_from_bool(val),
439        };
440    }
441}