Skip to content

Commit 2b89dc2

Browse files
authored
[CI] Add i8->i32 matmul pack-peel-4-level-tiling performance tests (nod-ai#1072)
Adds new Strix performance tests that use 4 levels of tiling, which should result in better performance. Note that these tests could not be added earlier because they depend on the fix from nod-ai#1060.
1 parent b29bd11 commit 2b89dc2

File tree

1 file changed

+30
-0
lines changed
  • build_tools/ci/cpu_comparison

1 file changed

+30
-0
lines changed

build_tools/ci/cpu_comparison/run.py

Lines changed: 30 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -2082,6 +2082,36 @@ def __init__(self):
20822082
"run_on_target": "npu4",
20832083
"skip_numerics": True,
20842084
},
2085+
{
2086+
"M": 512,
2087+
"N": 4096,
2088+
"K": 512,
2089+
"in_dtype": "i8",
2090+
"out_dtype": "i32",
2091+
"use_ukernel": True,
2092+
"peano_opt_level": 3,
2093+
"outline": "all",
2094+
"transpose_a": False,
2095+
"transpose_b": False,
2096+
"tile_pipeline": "pack-peel-4-level-tiling",
2097+
"run_on_target": "npu4",
2098+
},
2099+
{
2100+
"M": 512,
2101+
"N": 4096,
2102+
"K": 512,
2103+
"in_dtype": "i8",
2104+
"out_dtype": "i32",
2105+
"use_ukernel": False,
2106+
"peano_opt_level": 3,
2107+
"outline": "all",
2108+
"outline_to_empty_function": True,
2109+
"transpose_a": False,
2110+
"transpose_b": False,
2111+
"tile_pipeline": "pack-peel-4-level-tiling",
2112+
"run_on_target": "npu4",
2113+
"skip_numerics": True,
2114+
},
20852115
]
20862116

20872117
# Some bf16 Performance tests:

0 commit comments

Comments
 (0)