diff --git a/benchmarks/config/base/base.json b/benchmarks/config/base/base.json index a1a4e8163..f8495339d 100644 --- a/benchmarks/config/base/base.json +++ b/benchmarks/config/base/base.json @@ -41,7 +41,7 @@ "benchmark": [ "mlir-gen", "--kernel=const --float-type=f32 --batch=256 --layers=1024,1024,1024,1024 --tiles=32,32,32" ], "environment": {}, "flags": [ "-n", "100", "-run-args='--vector-to-kernels --registerBlocking=8,32 '" ], - "extensions": ["avx512f"] + "extensions": ["avx512.*"] }, "gemm_fp32_mlir_vector_avx2": { "type": "IR-GEN", @@ -83,7 +83,7 @@ "benchmark": [ "mlir-gen", "--kernel=const --bias --relu --float-type=f32 --batch=256 --layers=1024,1024,1024,1024 --tiles=32,32,32" ], "environment": {}, "flags": [ "-n", "100", "-run-args='--def-parallel --vector-to-kernels --registerBlocking=8,32 '" ], - "extensions": ["avx512f"] + "extensions": ["avx512.*"] }, "mlp_fp32_mlir_vector_avx2": { "type": "IR-GEN", @@ -128,7 +128,7 @@ "benchmark": [ "mlir-gen", "--kernel=const --float-type=f32 --batch=256 --layers=1024,1024,1024,1024" ], "environment": {}, "flags": [ "-n", "100", "-run-args='--vector-to-kernels --registerBlocking=8,32 '" ], - "extensions": [ "avx512f" ] + "extensions": [ "avx512.*" ] }, "fp32_3x1024_args_mlir": { "type": "IR-GEN", @@ -142,7 +142,7 @@ "benchmark": [ "mlir-gen", "--kernel=args --float-type=f32 --batch=256 --layers=1024,1024,1024,1024" ], "environment": {}, "flags": [ "-n", "100", "-run-args='--vector-to-kernels --registerBlocking=8,32 '" ], - "extensions": [ "avx512f" ] + "extensions": [ "avx512.*" ] }, "bf16_3x1024_const_mlir": { "type": "IR-GEN", @@ -173,7 +173,7 @@ "benchmark": [ "mlir-gen", "--kernel=const --bias --relu --float-type=f32 --batch=256 --layers=1024,1024,1024,1024" ], "environment": {}, "flags": [ "-n", "100", "-run-args='--def-parallel --vector-to-kernels --registerBlocking=8,32 '" ], - "extensions": [ "avx512f" ] + "extensions": [ "avx512.*" ] }, "fp32_3x1024_args_mlir": { "type": "IR-GEN", @@ -187,7 +187,7 @@ "benchmark": [ "mlir-gen", "--kernel=args --bias --relu --float-type=f32 --batch=256 --layers=1024,1024,1024,1024" ], "environment": {}, "flags": [ "-n", "100", "-run-args=' --def-parallel --vector-to-kernels --registerBlocking=8,32 '" ], - "extensions": [ "avx512f" ] + "extensions": [ "avx512.*" ] }, "bf16_3x1024_const_mlir": { "type": "IR-GEN", diff --git a/benchmarks/config/omp/mlir-fp32-vector-to-kernel.json b/benchmarks/config/omp/mlir-fp32-vector-to-kernel.json index e78318fdf..a5f47a4bd 100644 --- a/benchmarks/config/omp/mlir-fp32-vector-to-kernel.json +++ b/benchmarks/config/omp/mlir-fp32-vector-to-kernel.json @@ -6,28 +6,28 @@ "benchmark": [ "mlir-gen", "--kernel=const --float-type=f32 --batch=256 --layers=1024,1024,1024,1024 --tiles=32,32,32" ], "environment": { "OMP_NUM_THREADS": "2", "KMP_AFFINITY": "granularity=fine,verbose,compact,1,0" }, "flags": [ "-n", "100", "-run-args='--def-parallel --parallel-task-grid=8,16 --vector-to-kernels --registerBlocking=8,32 '" ], - "extensions": [ "avx512f" ] + "extensions": [ "avx512.*" ] }, "fp32_3x1024_omp_4_mlir": { "type": "IR-GEN", "benchmark": [ "mlir-gen", "--kernel=const --float-type=f32 --batch=256 --layers=1024,1024,1024,1024 --tiles=32,32,32" ], "environment": { "OMP_NUM_THREADS": "4", "KMP_AFFINITY": "granularity=fine,verbose,compact,1,0" }, "flags": [ "-n", "100", "-run-args='--def-parallel --parallel-task-grid=8,8 --vector-to-kernels --registerBlocking=8,32 '" ], - "extensions": [ "avx512f" ] + "extensions": [ "avx512.*" ] }, "fp32_3x1024_omp_8_mlir": { "type": "IR-GEN", "benchmark": [ "mlir-gen", "--kernel=const --float-type=f32 --batch=256 --layers=1024,1024,1024,1024 --tiles=32,32,32" ], "environment": { "OMP_NUM_THREADS": "8", "KMP_AFFINITY": "granularity=fine,verbose,compact,1,0" }, "flags": [ "-n", "100", "-run-args='--def-parallel --parallel-task-grid=4,8 --vector-to-kernels --registerBlocking=8,32 '" ], - "extensions": [ "avx512f" ] + "extensions": [ "avx512.*" ] }, "fp32_3x1024_omp_16_mlir": { "type": "IR-GEN", "benchmark": [ "mlir-gen", "--kernel=const --float-type=f32 --batch=256 --layers=1024,1024,1024,1024 --tiles=32,32,32" ], "environment": { "OMP_NUM_THREADS": "16", "KMP_AFFINITY": "granularity=fine,verbose,compact,1,0" }, "flags": [ "-n", "100", "-run-args='--def-parallel --parallel-task-grid=2,8 --vector-to-kernels --registerBlocking=8,32 '" ], - "extensions": [ "avx512f" ] + "extensions": [ "avx512.*" ] } }}, { @@ -37,28 +37,28 @@ "benchmark": [ "mlir-gen", "--kernel=const --bias --relu --float-type=f32 --batch=256 --layers=1024,1024,1024,1024 --tiles=32,32,32" ], "environment": { "OMP_NUM_THREADS": "2", "KMP_AFFINITY": "granularity=fine,verbose,compact,1,0" }, "flags": [ "-n", "100", "-run-args='--def-parallel --parallel-task-grid=8,16 --vector-to-kernels --registerBlocking=8,32 '" ], - "extensions": [ "avx512f" ] + "extensions": [ "avx512.*" ] }, "fp32_3x1024_omp_4_mlir": { "type": "IR-GEN", "benchmark": [ "mlir-gen", "--kernel=const --bias --relu --float-type=f32 --batch=256 --layers=1024,1024,1024,1024 --tiles=32,32,32" ], "environment": { "OMP_NUM_THREADS": "4", "KMP_AFFINITY": "granularity=fine,verbose,compact,1,0" }, "flags": [ "-n", "100", "-run-args='--def-parallel --parallel-task-grid=8,8 --vector-to-kernels --registerBlocking=8,32 '" ], - "extensions": [ "avx512f" ] + "extensions": [ "avx512.*" ] }, "fp32_3x1024_omp_8_mlir": { "type": "IR-GEN", "benchmark": [ "mlir-gen", "--kernel=const --bias --relu --float-type=f32 --batch=256 --layers=1024,1024,1024,1024 --tiles=32,32,32" ], "environment": { "OMP_NUM_THREADS": "8", "KMP_AFFINITY": "granularity=fine,verbose,compact,1,0" }, "flags": [ "-n", "100", "-run-args='--def-parallel --parallel-task-grid=4,8 --vector-to-kernels --registerBlocking=8,32 '" ], - "extensions": [ "avx512f" ] + "extensions": [ "avx512.*" ] }, "fp32_3x1024_omp_16_mlir": { "type": "IR-GEN", "benchmark": [ "mlir-gen", "--kernel=const --bias --relu --float-type=f32 --batch=256 --layers=1024,1024,1024,1024 --tiles=32,32,32" ], "environment": { "OMP_NUM_THREADS": "16", "KMP_AFFINITY": "granularity=fine,verbose,compact,1,0" }, "flags": [ "-n", "100", "-run-args='--def-parallel --parallel-task-grid=2,8 --vector-to-kernels --registerBlocking=8,32 '" ], - "extensions": [ "avx512f" ] + "extensions": [ "avx512.*" ] } }}, { @@ -68,28 +68,28 @@ "benchmark": [ "mlir-gen", "--kernel=const --float-type=f32 --batch=256 --layers=1024,1024,1024,1024 --tiles=64,64,64" ], "environment": { "OMP_NUM_THREADS": "2", "KMP_AFFINITY": "granularity=fine,verbose,compact,1,0" }, "flags": [ "-n", "100", "-run-args='--def-parallel --parallel-task-grid=4,8 --vector-to-kernels --registerBlocking=4,64 '" ], - "extensions": [ "avx512f" ] + "extensions": [ "avx512.*" ] }, "fp32_3x1024_omp_4_mlir": { "type": "IR-GEN", "benchmark": [ "mlir-gen", "--kernel=const --float-type=f32 --batch=256 --layers=1024,1024,1024,1024 --tiles=64,64,64" ], "environment": { "OMP_NUM_THREADS": "4", "KMP_AFFINITY": "granularity=fine,verbose,compact,1,0" }, "flags": [ "-n", "100", "-run-args='--def-parallel --parallel-task-grid=4,4 --vector-to-kernels --registerBlocking=4,64 '" ], - "extensions": [ "avx512f" ] + "extensions": [ "avx512.*" ] }, "fp32_3x1024_omp_8_mlir": { "type": "IR-GEN", "benchmark": [ "mlir-gen", "--kernel=const --float-type=f32 --batch=256 --layers=1024,1024,1024,1024 --tiles=64,64,64" ], "environment": { "OMP_NUM_THREADS": "8", "KMP_AFFINITY": "granularity=fine,verbose,compact,1,0" }, "flags": [ "-n", "100", "-run-args='--def-parallel --parallel-task-grid=2,4 --vector-to-kernels --registerBlocking=4,64 '" ], - "extensions": [ "avx512f" ] + "extensions": [ "avx512.*" ] }, "fp32_3x1024_omp_16_mlir": { "type": "IR-GEN", "benchmark": [ "mlir-gen", "--kernel=const --float-type=f32 --batch=256 --layers=1024,1024,1024,1024 --tiles=64,64,64" ], "environment": { "OMP_NUM_THREADS": "16", "KMP_AFFINITY": "granularity=fine,verbose,compact,1,0" }, "flags": [ "-n", "100", "-run-args='--def-parallel --parallel-task-grid=1,4 --vector-to-kernels --registerBlocking=4,64 '" ], - "extensions": [ "avx512f" ] + "extensions": [ "avx512.*" ] } }}, { @@ -99,28 +99,28 @@ "benchmark": [ "mlir-gen", "--kernel=const --bias --relu --float-type=f32 --batch=256 --layers=1024,1024,1024,1024 --tiles=64,64,64" ], "environment": { "OMP_NUM_THREADS": "2", "KMP_AFFINITY": "granularity=fine,verbose,compact,1,0" }, "flags": [ "-n", "100", "-run-args='--def-parallel --parallel-task-grid=4,8 --vector-to-kernels --registerBlocking=4,64 '" ], - "extensions": [ "avx512f" ] + "extensions": [ "avx512.*" ] }, "fp32_3x1024_omp_4_mlir": { "type": "IR-GEN", "benchmark": [ "mlir-gen", "--kernel=const --bias --relu --float-type=f32 --batch=256 --layers=1024,1024,1024,1024 --tiles=64,64,64" ], "environment": { "OMP_NUM_THREADS": "4", "KMP_AFFINITY": "granularity=fine,verbose,compact,1,0" }, "flags": [ "-n", "100", "-run-args='--def-parallel --parallel-task-grid=4,4 --vector-to-kernels --registerBlocking=4,64 '" ], - "extensions": [ "avx512f" ] + "extensions": [ "avx512.*" ] }, "fp32_3x1024_omp_8_mlir": { "type": "IR-GEN", "benchmark": [ "mlir-gen", "--kernel=const --bias --relu --float-type=f32 --batch=256 --layers=1024,1024,1024,1024 --tiles=64,64,64" ], "environment": { "OMP_NUM_THREADS": "8", "KMP_AFFINITY": "granularity=fine,verbose,compact,1,0" }, "flags": [ "-n", "100", "-run-args='--def-parallel --parallel-task-grid=2,4 --vector-to-kernels --registerBlocking=4,64 '" ], - "extensions": [ "avx512f" ] + "extensions": [ "avx512.*" ] }, "fp32_3x1024_omp_16_mlir": { "type": "IR-GEN", "benchmark": [ "mlir-gen", "--kernel=const --bias --relu --float-type=f32 --batch=256 --layers=1024,1024,1024,1024 --tiles=64,64,64" ], "environment": { "OMP_NUM_THREADS": "16", "KMP_AFFINITY": "granularity=fine,verbose,compact,1,0" }, "flags": [ "-n", "100", "-run-args='--def-parallel --parallel-task-grid=1,4 --vector-to-kernels --registerBlocking=4,64 '" ], - "extensions": [ "avx512f" ] + "extensions": [ "avx512.*" ] } }}, {