diff --git a/deep_gemm/jit/interleave_ffma.py b/deep_gemm/jit/interleave_ffma.py index 74e8358..fcb377e 100644 --- a/deep_gemm/jit/interleave_ffma.py +++ b/deep_gemm/jit/interleave_ffma.py @@ -73,7 +73,7 @@ def parse_registers(line): def modify_segment(m, name, ffma_lines): - num_lines = len(ffma_lines) + num_lines = (len(ffma_lines) * 9 // 16) // 2 * 2 assert num_lines % 2 == 0 le_bytes, new_le_bytes = [], []