|
40 | 40 | "type": "IR-GEN",
|
41 | 41 | "benchmark": [ "mlir-gen", "--kernel=const --float-type=f32 --batch=256 --layers=1024,1024,1024,1024 --tiles=32,32,32" ],
|
42 | 42 | "environment": {},
|
43 |
| - "flags": [ "-n", "100", "-run-args='--vector-to-kernels --registerBlocking=8,32 '" ], |
| 43 | + "flags": [ "-n", "100", "-run-args='--vector-to-kernels --registerBlocking=8,32,1 '" ], |
44 | 44 | "extensions": ["avx512.*"]
|
45 | 45 | },
|
46 | 46 | "gemm_fp32_mlir_vector_avx2": {
|
47 | 47 | "type": "IR-GEN",
|
48 | 48 | "benchmark": [ "mlir-gen", "--kernel=const --float-type=f32 --batch=256 --layers=1024,1024,1024,1024 --tiles=32,32,32" ],
|
49 | 49 | "environment": {},
|
50 |
| - "flags": [ "-n", "100", "-run-args='--vector-to-kernels --registerBlocking=4,16 '" ], |
| 50 | + "flags": [ "-n", "100", "-run-args='--vector-to-kernels --registerBlocking=4,16,1 '" ], |
51 | 51 | "extensions": ["avx2"]
|
52 | 52 | },
|
53 | 53 | "gemm_fp32_mlir_vector_sve": {
|
54 | 54 | "type": "IR-GEN",
|
55 | 55 | "benchmark": [ "mlir-gen", "--kernel=const --float-type=f32 --batch=256 --layers=1024,1024,1024,1024 --tiles=32,32,32" ],
|
56 | 56 | "environment": {},
|
57 |
| - "flags": [ "-n", "100", "-run-args='--vector-to-kernels --registerBlocking=4,32 '" ], |
| 57 | + "flags": [ "-n", "100", "-run-args='--vector-to-kernels --registerBlocking=4,32,1 '" ], |
58 | 58 | "extensions": ["asimd"]
|
59 | 59 | },
|
60 | 60 | "gemm_bf16_dp2_mlir": {
|
|
82 | 82 | "type": "IR-GEN",
|
83 | 83 | "benchmark": [ "mlir-gen", "--kernel=const --bias --relu --float-type=f32 --batch=256 --layers=1024,1024,1024,1024 --tiles=32,32,32" ],
|
84 | 84 | "environment": {},
|
85 |
| - "flags": [ "-n", "100", "-run-args='--def-parallel --vector-to-kernels --registerBlocking=8,32 '" ], |
| 85 | + "flags": [ "-n", "100", "-run-args='--def-parallel --vector-to-kernels --registerBlocking=8,32,1 '" ], |
86 | 86 | "extensions": ["avx512.*"]
|
87 | 87 | },
|
88 | 88 | "mlp_fp32_mlir_vector_avx2": {
|
89 | 89 | "type": "IR-GEN",
|
90 | 90 | "benchmark": [ "mlir-gen", "--kernel=const --bias --relu --float-type=f32 --batch=256 --layers=1024,1024,1024,1024 --tiles=32,32,32" ],
|
91 | 91 | "environment": {},
|
92 |
| - "flags": [ "-n", "100", "-run-args='--def-parallel --vector-to-kernels --registerBlocking=4,16 '" ], |
| 92 | + "flags": [ "-n", "100", "-run-args='--def-parallel --vector-to-kernels --registerBlocking=4,16,1 '" ], |
93 | 93 | "extensions": ["avx2" ]
|
94 | 94 | },
|
95 | 95 | "mlp_fp32_mlir_vector_sve": {
|
96 | 96 | "type": "IR-GEN",
|
97 | 97 | "benchmark": [ "mlir-gen", "--kernel=const --bias --relu --float-type=f32 --batch=256 --layers=1024,1024,1024,1024 --tiles=32,32,32" ],
|
98 | 98 | "environment": {},
|
99 |
| - "flags": [ "-n", "100", "-run-args='--def-parallel --vector-to-kernels --registerBlocking=4,32 '" ], |
| 99 | + "flags": [ "-n", "100", "-run-args='--def-parallel --vector-to-kernels --registerBlocking=4,32,1 '" ], |
100 | 100 | "extensions": ["asimd"]
|
101 | 101 | },
|
102 | 102 | "mlp_bf16_dp2_mlir": {
|
|
127 | 127 | "type": "IR-GEN",
|
128 | 128 | "benchmark": [ "mlir-gen", "--kernel=const --float-type=f32 --batch=256 --layers=1024,1024,1024,1024" ],
|
129 | 129 | "environment": {},
|
130 |
| - "flags": [ "-n", "100", "-run-args='--vector-to-kernels --registerBlocking=8,32 '" ], |
| 130 | + "flags": [ "-n", "100", "-run-args='--vector-to-kernels --registerBlocking=8,32,1 '" ], |
131 | 131 | "extensions": [ "avx512.*" ]
|
132 | 132 | },
|
133 | 133 | "fp32_3x1024_args_mlir": {
|
|
141 | 141 | "type": "IR-GEN",
|
142 | 142 | "benchmark": [ "mlir-gen", "--kernel=args --float-type=f32 --batch=256 --layers=1024,1024,1024,1024" ],
|
143 | 143 | "environment": {},
|
144 |
| - "flags": [ "-n", "100", "-run-args='--vector-to-kernels --registerBlocking=8,32 '" ], |
| 144 | + "flags": [ "-n", "100", "-run-args='--vector-to-kernels --registerBlocking=8,32,1 '" ], |
145 | 145 | "extensions": [ "avx512.*" ]
|
146 | 146 | },
|
147 | 147 | "bf16_3x1024_const_mlir": {
|
|
172 | 172 | "type": "IR-GEN",
|
173 | 173 | "benchmark": [ "mlir-gen", "--kernel=const --bias --relu --float-type=f32 --batch=256 --layers=1024,1024,1024,1024" ],
|
174 | 174 | "environment": {},
|
175 |
| - "flags": [ "-n", "100", "-run-args='--def-parallel --vector-to-kernels --registerBlocking=8,32 '" ], |
| 175 | + "flags": [ "-n", "100", "-run-args='--def-parallel --vector-to-kernels --registerBlocking=8,32,1 '" ], |
176 | 176 | "extensions": [ "avx512.*" ]
|
177 | 177 | },
|
178 | 178 | "fp32_3x1024_args_mlir": {
|
|
186 | 186 | "type": "IR-GEN",
|
187 | 187 | "benchmark": [ "mlir-gen", "--kernel=args --bias --relu --float-type=f32 --batch=256 --layers=1024,1024,1024,1024" ],
|
188 | 188 | "environment": {},
|
189 |
| - "flags": [ "-n", "100", "-run-args=' --def-parallel --vector-to-kernels --registerBlocking=8,32 '" ], |
| 189 | + "flags": [ "-n", "100", "-run-args=' --def-parallel --vector-to-kernels --registerBlocking=8,32,1 '" ], |
190 | 190 | "extensions": [ "avx512.*" ]
|
191 | 191 | },
|
192 | 192 | "bf16_3x1024_const_mlir": {
|
|
0 commit comments