From 5f82e0d74bec507222fe05d1fc1a84633815822a Mon Sep 17 00:00:00 2001 From: Alexander Heinecke Date: Sat, 8 Feb 2025 00:22:59 -0800 Subject: [PATCH] updated more libxsmm scripts --- benchmarks/config/base/base.json | 8 ++++---- benchmarks/config/fc/1024x1024x512.json | 12 ++++++------ benchmarks/config/fc/1024x2560x1024.json | 12 ++++++------ benchmarks/config/fc/1024x352x512.json | 12 ++++++------ benchmarks/config/fc/1024x512x256.json | 12 ++++++------ benchmarks/config/fc/128x1024x1024.json | 12 ++++++------ benchmarks/config/fc/128x1024x4096.json | 12 ++++++------ benchmarks/config/fc/128x3072x768.json | 12 ++++++------ benchmarks/config/fc/128x4096x1024.json | 12 ++++++------ benchmarks/config/fc/128x768x2304.json | 12 ++++++------ benchmarks/config/fc/128x768x3072.json | 12 ++++++------ benchmarks/config/fc/256x1024x1024.json | 12 ++++++------ benchmarks/config/fc/256x1024x4096.json | 12 ++++++------ benchmarks/config/fc/256x3072x768.json | 12 ++++++------ benchmarks/config/fc/256x4096x1024.json | 12 ++++++------ benchmarks/config/fc/256x768x3072.json | 12 ++++++------ benchmarks/config/fc/256x768x768.json | 12 ++++++------ 17 files changed, 100 insertions(+), 100 deletions(-) diff --git a/benchmarks/config/base/base.json b/benchmarks/config/base/base.json index f8495339d..15e2f3d06 100644 --- a/benchmarks/config/base/base.json +++ b/benchmarks/config/base/base.json @@ -5,28 +5,28 @@ "type": "XSMM-DNN", "benchmark": "xsmm_dnn_mlp", "environment": {}, - "flags": [ "100", "256", "0", "F", "32", "32", "32", "0", "0", "1024", "1024", "1024", "1024" ], + "flags": [ "100", "256", "0", "F", "32", "32", "32", "0", "1", "1024", "1024", "1024", "1024" ], "extensions": [] }, "gemm_bf16_dnn_target": { "type": "XSMM-DNN", "benchmark": "xsmm_dnn_mlp", "environment": {}, - "flags": [ "100", "256", "0", "F", "32", "32", "32", "1", "1", "1024", "1024", "1024", "1024" ], + "flags": [ "100", "256", "0", "F", "32", "32", "32", "1", "2", "1024", "1024", "1024", "1024" ], "extensions": [ "(avx2|asimd)" ] }, "mlp_fp32_dnn_target": { "type": "XSMM-DNN", "benchmark": "xsmm_dnn_mlp", "environment": {}, - "flags": [ "100", "256", "5", "F", "32", "32", "32", "0", "0", "1024", "1024", "1024", "1024" ], + "flags": [ "100", "256", "5", "F", "32", "32", "32", "0", "1", "1024", "1024", "1024", "1024" ], "extensions": [] }, "mlp_bf16_dnn_target": { "type": "XSMM-DNN", "benchmark": "xsmm_dnn_mlp", "environment": {}, - "flags": [ "100", "256", "5", "F", "32", "32", "32", "1", "1", "1024", "1024", "1024", "1024" ], + "flags": [ "100", "256", "5", "F", "32", "32", "32", "1", "2", "1024", "1024", "1024", "1024" ], "extensions": [ "(avx2|asimd)" ] }, "gemm_fp32_mlir": { diff --git a/benchmarks/config/fc/1024x1024x512.json b/benchmarks/config/fc/1024x1024x512.json index a19df9cdb..d98fd17c3 100644 --- a/benchmarks/config/fc/1024x1024x512.json +++ b/benchmarks/config/fc/1024x1024x512.json @@ -5,14 +5,14 @@ "type": "XSMM-DNN", "benchmark": "xsmm_dnn_mlp", "environment": { "OMP_NUM_THREADS": "1" }, - "flags": [ "100", "1024", "3", "F", "64", "64", "64", "0", "0", "512", "1024" ], + "flags": [ "100", "1024", "3", "F", "64", "64", "64", "0", "1", "512", "1024" ], "extensions": [ "(avx2|asimd)" ] }, "fc_fp32_omp_16_dnn": { "type": "XSMM-DNN", "benchmark": "xsmm_dnn_mlp", - "environment": { "OMP_NUM_THREADS": "16", "KMP_AFFINITY": "granularity=fine,verbose,compact,1,0" }, - "flags": [ "100", "1024", "3", "F", "64", "64", "64", "0", "0", "512", "1024" ], + "environment": { "OMP_NUM_THREADS": "16", "KMP_AFFINITY": "granularity=fine,verbose,compact,1,0", "LIBXSMM_DNN_DISABLE_SFC": "1" }, + "flags": [ "100", "1024", "3", "F", "64", "64", "64", "0", "1", "512", "1024" ], "extensions": [ "(avx2|asimd)" ] } }}, @@ -22,14 +22,14 @@ "type": "XSMM-DNN", "benchmark": "xsmm_dnn_mlp", "environment": { "OMP_NUM_THREADS": "1" }, - "flags": [ "100", "1024", "3", "F", "64", "64", "64", "1", "1", "512", "1024" ], + "flags": [ "100", "1024", "3", "F", "64", "64", "64", "1", "2", "512", "1024" ], "extensions": [ "(avx2|asimd)" ] }, "fc_bf16_omp_16_dnn": { "type": "XSMM-DNN", "benchmark": "xsmm_dnn_mlp", - "environment": { "OMP_NUM_THREADS": "16", "KMP_AFFINITY": "granularity=fine,verbose,compact,1,0" }, - "flags": [ "100", "1024", "3", "F", "64", "64", "64", "1", "1", "512", "1024" ], + "environment": { "OMP_NUM_THREADS": "16", "KMP_AFFINITY": "granularity=fine,verbose,compact,1,0", "LIBXSMM_DNN_DISABLE_SFC": "1" }, + "flags": [ "100", "1024", "3", "F", "64", "64", "64", "1", "2", "512", "1024" ], "extensions": [ "(avx2|asimd)" ] } }}, diff --git a/benchmarks/config/fc/1024x2560x1024.json b/benchmarks/config/fc/1024x2560x1024.json index 8db88e17a..67b71ca95 100644 --- a/benchmarks/config/fc/1024x2560x1024.json +++ b/benchmarks/config/fc/1024x2560x1024.json @@ -5,14 +5,14 @@ "type": "XSMM-DNN", "benchmark": "xsmm_dnn_mlp", "environment": { "OMP_NUM_THREADS": "1" }, - "flags": [ "100", "1024", "3", "F", "64", "64", "64", "0", "0", "1024", "2560" ], + "flags": [ "100", "1024", "3", "F", "64", "64", "64", "0", "1", "1024", "2560" ], "extensions": [ "(avx2|asimd)" ] }, "fc_fp32_omp_16_dnn": { "type": "XSMM-DNN", "benchmark": "xsmm_dnn_mlp", - "environment": { "OMP_NUM_THREADS": "16", "KMP_AFFINITY": "granularity=fine,verbose,compact,1,0" }, - "flags": [ "100", "1024", "3", "F", "64", "64", "64", "0", "0", "1024", "2560" ], + "environment": { "OMP_NUM_THREADS": "16", "KMP_AFFINITY": "granularity=fine,verbose,compact,1,0", "LIBXSMM_DNN_DISABLE_SFC": "1" }, + "flags": [ "100", "1024", "3", "F", "64", "64", "64", "0", "1", "1024", "2560" ], "extensions": [ "(avx2|asimd)" ] } }}, @@ -22,14 +22,14 @@ "type": "XSMM-DNN", "benchmark": "xsmm_dnn_mlp", "environment": { "OMP_NUM_THREADS": "1" }, - "flags": [ "100", "1024", "3", "F", "64", "64", "64", "1", "1", "1024", "2560" ], + "flags": [ "100", "1024", "3", "F", "64", "64", "64", "1", "2", "1024", "2560" ], "extensions": [ "(avx2|asimd)" ] }, "fc_bf16_omp_16_dnn": { "type": "XSMM-DNN", "benchmark": "xsmm_dnn_mlp", - "environment": { "OMP_NUM_THREADS": "16", "KMP_AFFINITY": "granularity=fine,verbose,compact,1,0" }, - "flags": [ "100", "1024", "3", "F", "64", "64", "64", "1", "1", "1024", "2560" ], + "environment": { "OMP_NUM_THREADS": "16", "KMP_AFFINITY": "granularity=fine,verbose,compact,1,0", "LIBXSMM_DNN_DISABLE_SFC": "1" }, + "flags": [ "100", "1024", "3", "F", "64", "64", "64", "1", "2", "1024", "2560" ], "extensions": [ "(avx2|asimd)" ] } }}, diff --git a/benchmarks/config/fc/1024x352x512.json b/benchmarks/config/fc/1024x352x512.json index 3502704b1..2afda78e2 100644 --- a/benchmarks/config/fc/1024x352x512.json +++ b/benchmarks/config/fc/1024x352x512.json @@ -5,14 +5,14 @@ "type": "XSMM-DNN", "benchmark": "xsmm_dnn_mlp", "environment": { "OMP_NUM_THREADS": "1" }, - "flags": [ "100", "1024", "3", "F", "32", "32", "32", "0", "0", "512", "352" ], + "flags": [ "100", "1024", "3", "F", "32", "32", "32", "0", "1", "512", "352" ], "extensions": [ "(avx2|asimd)" ] }, "fc_fp32_omp_16_dnn": { "type": "XSMM-DNN", "benchmark": "xsmm_dnn_mlp", - "environment": { "OMP_NUM_THREADS": "16", "KMP_AFFINITY": "granularity=fine,verbose,compact,1,0" }, - "flags": [ "100", "1024", "3", "F", "32", "32", "32", "0", "0", "512", "352" ], + "environment": { "OMP_NUM_THREADS": "16", "KMP_AFFINITY": "granularity=fine,verbose,compact,1,0", "LIBXSMM_DNN_DISABLE_SFC": "1" }, + "flags": [ "100", "1024", "3", "F", "32", "32", "32", "0", "1", "512", "352" ], "extensions": [ "(avx2|asimd)" ] } }}, @@ -22,14 +22,14 @@ "type": "XSMM-DNN", "benchmark": "xsmm_dnn_mlp", "environment": { "OMP_NUM_THREADS": "1" }, - "flags": [ "100", "1024", "3", "F", "32", "32", "32", "1", "1", "512", "352" ], + "flags": [ "100", "1024", "3", "F", "32", "32", "32", "1", "2", "512", "352" ], "extensions": [ "(avx2|asimd)" ] }, "fc_bf16_omp_16_dnn": { "type": "XSMM-DNN", "benchmark": "xsmm_dnn_mlp", - "environment": { "OMP_NUM_THREADS": "16", "KMP_AFFINITY": "granularity=fine,verbose,compact,1,0" }, - "flags": [ "100", "1024", "3", "F", "32", "32", "32", "1", "1", "512", "352" ], + "environment": { "OMP_NUM_THREADS": "16", "KMP_AFFINITY": "granularity=fine,verbose,compact,1,0", "LIBXSMM_DNN_DISABLE_SFC": "1" }, + "flags": [ "100", "1024", "3", "F", "32", "32", "32", "1", "2", "512", "352" ], "extensions": [ "(avx2|asimd)" ] } }}, diff --git a/benchmarks/config/fc/1024x512x256.json b/benchmarks/config/fc/1024x512x256.json index 02526aec2..d6c08a3eb 100644 --- a/benchmarks/config/fc/1024x512x256.json +++ b/benchmarks/config/fc/1024x512x256.json @@ -5,14 +5,14 @@ "type": "XSMM-DNN", "benchmark": "xsmm_dnn_mlp", "environment": { "OMP_NUM_THREADS": "1" }, - "flags": [ "100", "1024", "3", "F", "64", "64", "64", "0", "0", "256", "512" ], + "flags": [ "100", "1024", "3", "F", "64", "64", "64", "0", "1", "256", "512" ], "extensions": [ "(avx2|asimd)" ] }, "fc_fp32_omp_16_dnn": { "type": "XSMM-DNN", "benchmark": "xsmm_dnn_mlp", - "environment": { "OMP_NUM_THREADS": "16", "KMP_AFFINITY": "granularity=fine,verbose,compact,1,0" }, - "flags": [ "100", "1024", "3", "F", "64", "64", "64", "0", "0", "256", "512" ], + "environment": { "OMP_NUM_THREADS": "16", "KMP_AFFINITY": "granularity=fine,verbose,compact,1,0", "LIBXSMM_DNN_DISABLE_SFC": "1" }, + "flags": [ "100", "1024", "3", "F", "64", "64", "64", "0", "1", "256", "512" ], "extensions": [ "(avx2|asimd)" ] } }}, @@ -22,14 +22,14 @@ "type": "XSMM-DNN", "benchmark": "xsmm_dnn_mlp", "environment": { "OMP_NUM_THREADS": "1" }, - "flags": [ "100", "1024", "3", "F", "64", "64", "64", "1", "1", "256", "512" ], + "flags": [ "100", "1024", "3", "F", "64", "64", "64", "1", "2", "256", "512" ], "extensions": [ "(avx2|asimd)" ] }, "fc_bf16_omp_16_dnn": { "type": "XSMM-DNN", "benchmark": "xsmm_dnn_mlp", - "environment": { "OMP_NUM_THREADS": "16", "KMP_AFFINITY": "granularity=fine,verbose,compact,1,0" }, - "flags": [ "100", "1024", "3", "F", "64", "64", "64", "1", "1", "256", "512" ], + "environment": { "OMP_NUM_THREADS": "16", "KMP_AFFINITY": "granularity=fine,verbose,compact,1,0", "LIBXSMM_DNN_DISABLE_SFC": "1" }, + "flags": [ "100", "1024", "3", "F", "64", "64", "64", "1", "2", "256", "512" ], "extensions": [ "(avx2|asimd)" ] } }}, diff --git a/benchmarks/config/fc/128x1024x1024.json b/benchmarks/config/fc/128x1024x1024.json index a39c766e4..32ee065b5 100644 --- a/benchmarks/config/fc/128x1024x1024.json +++ b/benchmarks/config/fc/128x1024x1024.json @@ -5,14 +5,14 @@ "type": "XSMM-DNN", "benchmark": "xsmm_dnn_mlp", "environment": { "OMP_NUM_THREADS": "1" }, - "flags": [ "100", "128", "3", "F", "64", "64", "64", "0", "0", "1024", "1024" ], + "flags": [ "100", "128", "3", "F", "64", "64", "64", "0", "1", "1024", "1024" ], "extensions": [ "(avx2|asimd)" ] }, "fc_fp32_omp_16_dnn": { "type": "XSMM-DNN", "benchmark": "xsmm_dnn_mlp", - "environment": { "OMP_NUM_THREADS": "16", "KMP_AFFINITY": "granularity=fine,verbose,compact,1,0" }, - "flags": [ "100", "128", "3", "F", "64", "64", "64", "0", "0", "1024", "1024" ], + "environment": { "OMP_NUM_THREADS": "16", "KMP_AFFINITY": "granularity=fine,verbose,compact,1,0", "LIBXSMM_DNN_DISABLE_SFC": "1" }, + "flags": [ "100", "128", "3", "F", "64", "64", "64", "0", "1", "1024", "1024" ], "extensions": [ "(avx2|asimd)" ] } }}, @@ -22,14 +22,14 @@ "type": "XSMM-DNN", "benchmark": "xsmm_dnn_mlp", "environment": { "OMP_NUM_THREADS": "1" }, - "flags": [ "100", "128", "3", "F", "64", "64", "64", "1", "1", "1024", "1024" ], + "flags": [ "100", "128", "3", "F", "64", "64", "64", "1", "2", "1024", "1024" ], "extensions": [ "(avx2|asimd)" ] }, "fc_bf16_omp_16_dnn": { "type": "XSMM-DNN", "benchmark": "xsmm_dnn_mlp", - "environment": { "OMP_NUM_THREADS": "16", "KMP_AFFINITY": "granularity=fine,verbose,compact,1,0" }, - "flags": [ "100", "128", "3", "F", "64", "64", "64", "1", "1", "1024", "1024" ], + "environment": { "OMP_NUM_THREADS": "16", "KMP_AFFINITY": "granularity=fine,verbose,compact,1,0", "LIBXSMM_DNN_DISABLE_SFC": "1" }, + "flags": [ "100", "128", "3", "F", "64", "64", "64", "1", "2", "1024", "1024" ], "extensions": [ "(avx2|asimd)" ] } }}, diff --git a/benchmarks/config/fc/128x1024x4096.json b/benchmarks/config/fc/128x1024x4096.json index 91d3d0d3a..5bb7d2fb5 100644 --- a/benchmarks/config/fc/128x1024x4096.json +++ b/benchmarks/config/fc/128x1024x4096.json @@ -5,14 +5,14 @@ "type": "XSMM-DNN", "benchmark": "xsmm_dnn_mlp", "environment": { "OMP_NUM_THREADS": "1" }, - "flags": [ "100", "128", "3", "F", "64", "64", "64", "0", "0", "4096", "1024" ], + "flags": [ "100", "128", "3", "F", "64", "64", "64", "0", "1", "4096", "1024" ], "extensions": [ "(avx2|asimd)" ] }, "fc_fp32_omp_16_dnn": { "type": "XSMM-DNN", "benchmark": "xsmm_dnn_mlp", - "environment": { "OMP_NUM_THREADS": "16", "KMP_AFFINITY": "granularity=fine,verbose,compact,1,0" }, - "flags": [ "100", "128", "3", "F", "64", "64", "64", "0", "0", "4096", "1024" ], + "environment": { "OMP_NUM_THREADS": "16", "KMP_AFFINITY": "granularity=fine,verbose,compact,1,0", "LIBXSMM_DNN_DISABLE_SFC": "1" }, + "flags": [ "100", "128", "3", "F", "64", "64", "64", "0", "1", "4096", "1024" ], "extensions": [ "(avx2|asimd)" ] } }}, @@ -22,14 +22,14 @@ "type": "XSMM-DNN", "benchmark": "xsmm_dnn_mlp", "environment": { "OMP_NUM_THREADS": "1" }, - "flags": [ "100", "128", "3", "F", "64", "64", "64", "1", "1", "4096", "1024" ], + "flags": [ "100", "128", "3", "F", "64", "64", "64", "1", "2", "4096", "1024" ], "extensions": [ "(avx2|asimd)" ] }, "fc_bf16_omp_16_dnn": { "type": "XSMM-DNN", "benchmark": "xsmm_dnn_mlp", - "environment": { "OMP_NUM_THREADS": "16", "KMP_AFFINITY": "granularity=fine,verbose,compact,1,0" }, - "flags": [ "100", "128", "3", "F", "64", "64", "64", "1", "1", "4096", "1024" ], + "environment": { "OMP_NUM_THREADS": "16", "KMP_AFFINITY": "granularity=fine,verbose,compact,1,0", "LIBXSMM_DNN_DISABLE_SFC": "1" }, + "flags": [ "100", "128", "3", "F", "64", "64", "64", "1", "2", "4096", "1024" ], "extensions": [ "(avx2|asimd)" ] } }}, diff --git a/benchmarks/config/fc/128x3072x768.json b/benchmarks/config/fc/128x3072x768.json index 74ef3c736..89f412c03 100644 --- a/benchmarks/config/fc/128x3072x768.json +++ b/benchmarks/config/fc/128x3072x768.json @@ -5,14 +5,14 @@ "type": "XSMM-DNN", "benchmark": "xsmm_dnn_mlp", "environment": { "OMP_NUM_THREADS": "1" }, - "flags": [ "100", "128", "3", "F", "64", "64", "64", "0", "0", "768", "3072" ], + "flags": [ "100", "128", "3", "F", "64", "64", "64", "0", "1", "768", "3072" ], "extensions": [ "(avx2|asimd)" ] }, "fc_fp32_omp_16_dnn": { "type": "XSMM-DNN", "benchmark": "xsmm_dnn_mlp", - "environment": { "OMP_NUM_THREADS": "16", "KMP_AFFINITY": "granularity=fine,verbose,compact,1,0" }, - "flags": [ "100", "128", "3", "F", "64", "64", "64", "0", "0", "768", "3072" ], + "environment": { "OMP_NUM_THREADS": "16", "KMP_AFFINITY": "granularity=fine,verbose,compact,1,0", "LIBXSMM_DNN_DISABLE_SFC": "1" }, + "flags": [ "100", "128", "3", "F", "64", "64", "64", "0", "1", "768", "3072" ], "extensions": [ "(avx2|asimd)" ] } }}, @@ -22,14 +22,14 @@ "type": "XSMM-DNN", "benchmark": "xsmm_dnn_mlp", "environment": { "OMP_NUM_THREADS": "1" }, - "flags": [ "100", "128", "3", "F", "64", "64", "64", "1", "1", "768", "3072" ], + "flags": [ "100", "128", "3", "F", "64", "64", "64", "1", "2", "768", "3072" ], "extensions": [ "(avx2|asimd)" ] }, "fc_bf16_omp_16_dnn": { "type": "XSMM-DNN", "benchmark": "xsmm_dnn_mlp", - "environment": { "OMP_NUM_THREADS": "16", "KMP_AFFINITY": "granularity=fine,verbose,compact,1,0" }, - "flags": [ "100", "128", "3", "F", "64", "64", "64", "1", "1", "768", "3072" ], + "environment": { "OMP_NUM_THREADS": "16", "KMP_AFFINITY": "granularity=fine,verbose,compact,1,0", "LIBXSMM_DNN_DISABLE_SFC": "1" }, + "flags": [ "100", "128", "3", "F", "64", "64", "64", "1", "2", "768", "3072" ], "extensions": [ "(avx2|asimd)" ] } }}, diff --git a/benchmarks/config/fc/128x4096x1024.json b/benchmarks/config/fc/128x4096x1024.json index 78f909abc..4bd8707e0 100644 --- a/benchmarks/config/fc/128x4096x1024.json +++ b/benchmarks/config/fc/128x4096x1024.json @@ -5,14 +5,14 @@ "type": "XSMM-DNN", "benchmark": "xsmm_dnn_mlp", "environment": { "OMP_NUM_THREADS": "1" }, - "flags": [ "100", "128", "3", "F", "64", "64", "64", "0", "0", "1024", "4096" ], + "flags": [ "100", "128", "3", "F", "64", "64", "64", "0", "1", "1024", "4096" ], "extensions": [ "(avx2|asimd)" ] }, "fc_fp32_omp_16_dnn": { "type": "XSMM-DNN", "benchmark": "xsmm_dnn_mlp", - "environment": { "OMP_NUM_THREADS": "16", "KMP_AFFINITY": "granularity=fine,verbose,compact,1,0" }, - "flags": [ "100", "128", "3", "F", "64", "64", "64", "0", "0", "1024", "4096" ], + "environment": { "OMP_NUM_THREADS": "16", "KMP_AFFINITY": "granularity=fine,verbose,compact,1,0", "LIBXSMM_DNN_DISABLE_SFC": "1" }, + "flags": [ "100", "128", "3", "F", "64", "64", "64", "0", "1", "1024", "4096" ], "extensions": [ "(avx2|asimd)" ] } }}, @@ -22,14 +22,14 @@ "type": "XSMM-DNN", "benchmark": "xsmm_dnn_mlp", "environment": { "OMP_NUM_THREADS": "1" }, - "flags": [ "100", "128", "3", "F", "64", "64", "64", "1", "1", "1024", "4096" ], + "flags": [ "100", "128", "3", "F", "64", "64", "64", "1", "2", "1024", "4096" ], "extensions": [ "(avx2|asimd)" ] }, "fc_bf16_omp_16_dnn": { "type": "XSMM-DNN", "benchmark": "xsmm_dnn_mlp", - "environment": { "OMP_NUM_THREADS": "16", "KMP_AFFINITY": "granularity=fine,verbose,compact,1,0" }, - "flags": [ "100", "128", "3", "F", "64", "64", "64", "1", "1", "1024", "4096" ], + "environment": { "OMP_NUM_THREADS": "16", "KMP_AFFINITY": "granularity=fine,verbose,compact,1,0", "LIBXSMM_DNN_DISABLE_SFC": "1" }, + "flags": [ "100", "128", "3", "F", "64", "64", "64", "1", "2", "1024", "4096" ], "extensions": [ "(avx2|asimd)" ] } }}, diff --git a/benchmarks/config/fc/128x768x2304.json b/benchmarks/config/fc/128x768x2304.json index b136d59cb..2735bba1f 100644 --- a/benchmarks/config/fc/128x768x2304.json +++ b/benchmarks/config/fc/128x768x2304.json @@ -5,14 +5,14 @@ "type": "XSMM-DNN", "benchmark": "xsmm_dnn_mlp", "environment": { "OMP_NUM_THREADS": "1" }, - "flags": [ "100", "128", "3", "F", "64", "64", "48", "0", "0", "2304", "768" ], + "flags": [ "100", "128", "3", "F", "64", "64", "48", "0", "1", "2304", "768" ], "extensions": [ "(avx2|asimd)" ] }, "fc_fp32_omp_16_dnn": { "type": "XSMM-DNN", "benchmark": "xsmm_dnn_mlp", - "environment": { "OMP_NUM_THREADS": "16", "KMP_AFFINITY": "granularity=fine,verbose,compact,1,0" }, - "flags": [ "100", "128", "3", "F", "64", "64", "48", "0", "0", "2304", "768" ], + "environment": { "OMP_NUM_THREADS": "16", "KMP_AFFINITY": "granularity=fine,verbose,compact,1,0", "LIBXSMM_DNN_DISABLE_SFC": "1" }, + "flags": [ "100", "128", "3", "F", "64", "64", "48", "0", "1", "2304", "768" ], "extensions": [ "(avx2|asimd)" ] } }}, @@ -22,14 +22,14 @@ "type": "XSMM-DNN", "benchmark": "xsmm_dnn_mlp", "environment": { "OMP_NUM_THREADS": "1" }, - "flags": [ "100", "128", "3", "F", "64", "64", "48", "1", "1", "2304", "768" ], + "flags": [ "100", "128", "3", "F", "64", "64", "48", "1", "2", "2304", "768" ], "extensions": [ "(avx2|asimd)" ] }, "fc_bf16_omp_16_dnn": { "type": "XSMM-DNN", "benchmark": "xsmm_dnn_mlp", - "environment": { "OMP_NUM_THREADS": "16", "KMP_AFFINITY": "granularity=fine,verbose,compact,1,0" }, - "flags": [ "100", "128", "3", "F", "64", "64", "48", "1", "1", "2304", "768" ], + "environment": { "OMP_NUM_THREADS": "16", "KMP_AFFINITY": "granularity=fine,verbose,compact,1,0", "LIBXSMM_DNN_DISABLE_SFC": "1" }, + "flags": [ "100", "128", "3", "F", "64", "64", "48", "1", "2", "2304", "768" ], "extensions": [ "(avx2|asimd)" ] } }}, diff --git a/benchmarks/config/fc/128x768x3072.json b/benchmarks/config/fc/128x768x3072.json index 187f5b9ab..04228c324 100644 --- a/benchmarks/config/fc/128x768x3072.json +++ b/benchmarks/config/fc/128x768x3072.json @@ -5,14 +5,14 @@ "type": "XSMM-DNN", "benchmark": "xsmm_dnn_mlp", "environment": { "OMP_NUM_THREADS": "1" }, - "flags": [ "100", "128", "3", "F", "32", "32", "48", "0", "0", "3072", "768" ], + "flags": [ "100", "128", "3", "F", "32", "32", "48", "0", "1", "3072", "768" ], "extensions": [ "(avx2|asimd)" ] }, "fc_fp32_omp_16_dnn": { "type": "XSMM-DNN", "benchmark": "xsmm_dnn_mlp", - "environment": { "OMP_NUM_THREADS": "16", "KMP_AFFINITY": "granularity=fine,verbose,compact,1,0" }, - "flags": [ "100", "128", "3", "F", "32", "32", "48", "0", "0", "3072", "768" ], + "environment": { "OMP_NUM_THREADS": "16", "KMP_AFFINITY": "granularity=fine,verbose,compact,1,0", "LIBXSMM_DNN_DISABLE_SFC": "1" }, + "flags": [ "100", "128", "3", "F", "32", "32", "48", "0", "1", "3072", "768" ], "extensions": [ "(avx2|asimd)" ] } }}, @@ -22,14 +22,14 @@ "type": "XSMM-DNN", "benchmark": "xsmm_dnn_mlp", "environment": { "OMP_NUM_THREADS": "1" }, - "flags": [ "100", "128", "3", "F", "32", "32", "48", "1", "1", "3072", "768" ], + "flags": [ "100", "128", "3", "F", "32", "32", "48", "1", "2", "3072", "768" ], "extensions": [ "(avx2|asimd)" ] }, "fc_bf16_omp_16_dnn": { "type": "XSMM-DNN", "benchmark": "xsmm_dnn_mlp", - "environment": { "OMP_NUM_THREADS": "16", "KMP_AFFINITY": "granularity=fine,verbose,compact,1,0" }, - "flags": [ "100", "128", "3", "F", "32", "32", "48", "1", "1", "3072", "768" ], + "environment": { "OMP_NUM_THREADS": "16", "KMP_AFFINITY": "granularity=fine,verbose,compact,1,0", "LIBXSMM_DNN_DISABLE_SFC": "1" }, + "flags": [ "100", "128", "3", "F", "32", "32", "48", "1", "2", "3072", "768" ], "extensions": [ "(avx2|asimd)" ] } }}, diff --git a/benchmarks/config/fc/256x1024x1024.json b/benchmarks/config/fc/256x1024x1024.json index 9cae42455..9d86d7d35 100644 --- a/benchmarks/config/fc/256x1024x1024.json +++ b/benchmarks/config/fc/256x1024x1024.json @@ -5,14 +5,14 @@ "type": "XSMM-DNN", "benchmark": "xsmm_dnn_mlp", "environment": { "OMP_NUM_THREADS": "1" }, - "flags": [ "100", "256", "3", "F", "64", "64", "64", "0", "0", "1024", "1024" ], + "flags": [ "100", "256", "3", "F", "64", "64", "64", "0", "1", "1024", "1024" ], "extensions": [ "(avx2|asimd)" ] }, "fc_fp32_omp_16_dnn": { "type": "XSMM-DNN", "benchmark": "xsmm_dnn_mlp", - "environment": { "OMP_NUM_THREADS": "16", "KMP_AFFINITY": "granularity=fine,verbose,compact,1,0" }, - "flags": [ "100", "256", "3", "F", "64", "64", "64", "0", "0", "1024", "1024" ], + "environment": { "OMP_NUM_THREADS": "16", "KMP_AFFINITY": "granularity=fine,verbose,compact,1,0", "LIBXSMM_DNN_DISABLE_SFC": "1" }, + "flags": [ "100", "256", "3", "F", "64", "64", "64", "0", "1", "1024", "1024" ], "extensions": [ "(avx2|asimd)" ] } }}, @@ -22,14 +22,14 @@ "type": "XSMM-DNN", "benchmark": "xsmm_dnn_mlp", "environment": { "OMP_NUM_THREADS": "1" }, - "flags": [ "100", "256", "3", "F", "64", "64", "64", "1", "1", "1024", "1024" ], + "flags": [ "100", "256", "3", "F", "64", "64", "64", "1", "2", "1024", "1024" ], "extensions": [ "(avx2|asimd)" ] }, "fc_bf16_omp_16_dnn": { "type": "XSMM-DNN", "benchmark": "xsmm_dnn_mlp", - "environment": { "OMP_NUM_THREADS": "16", "KMP_AFFINITY": "granularity=fine,verbose,compact,1,0" }, - "flags": [ "100", "256", "3", "F", "64", "64", "64", "1", "1", "1024", "1024" ], + "environment": { "OMP_NUM_THREADS": "16", "KMP_AFFINITY": "granularity=fine,verbose,compact,1,0", "LIBXSMM_DNN_DISABLE_SFC": "1" }, + "flags": [ "100", "256", "3", "F", "64", "64", "64", "1", "2", "1024", "1024" ], "extensions": [ "(avx2|asimd)" ] } }}, diff --git a/benchmarks/config/fc/256x1024x4096.json b/benchmarks/config/fc/256x1024x4096.json index 6f3d16eab..47ec92120 100644 --- a/benchmarks/config/fc/256x1024x4096.json +++ b/benchmarks/config/fc/256x1024x4096.json @@ -5,14 +5,14 @@ "type": "XSMM-DNN", "benchmark": "xsmm_dnn_mlp", "environment": { "OMP_NUM_THREADS": "1" }, - "flags": [ "100", "256", "3", "F", "64", "64", "64", "0", "0", "4096", "1024" ], + "flags": [ "100", "256", "3", "F", "64", "64", "64", "0", "1", "4096", "1024" ], "extensions": [ "(avx2|asimd)" ] }, "fc_fp32_omp_16_dnn": { "type": "XSMM-DNN", "benchmark": "xsmm_dnn_mlp", - "environment": { "OMP_NUM_THREADS": "16", "KMP_AFFINITY": "granularity=fine,verbose,compact,1,0" }, - "flags": [ "100", "256", "3", "F", "64", "64", "64", "0", "0", "4096", "1024" ], + "environment": { "OMP_NUM_THREADS": "16", "KMP_AFFINITY": "granularity=fine,verbose,compact,1,0", "LIBXSMM_DNN_DISABLE_SFC": "1" }, + "flags": [ "100", "256", "3", "F", "64", "64", "64", "0", "1", "4096", "1024" ], "extensions": [ "(avx2|asimd)" ] } }}, @@ -22,14 +22,14 @@ "type": "XSMM-DNN", "benchmark": "xsmm_dnn_mlp", "environment": { "OMP_NUM_THREADS": "1" }, - "flags": [ "100", "256", "3", "F", "64", "64", "64", "1", "1", "4096", "1024" ], + "flags": [ "100", "256", "3", "F", "64", "64", "64", "1", "2", "4096", "1024" ], "extensions": [ "(avx2|asimd)" ] }, "fc_bf16_omp_16_dnn": { "type": "XSMM-DNN", "benchmark": "xsmm_dnn_mlp", - "environment": { "OMP_NUM_THREADS": "16", "KMP_AFFINITY": "granularity=fine,verbose,compact,1,0" }, - "flags": [ "100", "256", "3", "F", "64", "64", "64", "1", "1", "4096", "1024" ], + "environment": { "OMP_NUM_THREADS": "16", "KMP_AFFINITY": "granularity=fine,verbose,compact,1,0", "LIBXSMM_DNN_DISABLE_SFC": "1" }, + "flags": [ "100", "256", "3", "F", "64", "64", "64", "1", "2", "4096", "1024" ], "extensions": [ "(avx2|asimd)" ] } }}, diff --git a/benchmarks/config/fc/256x3072x768.json b/benchmarks/config/fc/256x3072x768.json index 66dfbc06d..725e9b756 100644 --- a/benchmarks/config/fc/256x3072x768.json +++ b/benchmarks/config/fc/256x3072x768.json @@ -5,14 +5,14 @@ "type": "XSMM-DNN", "benchmark": "xsmm_dnn_mlp", "environment": { "OMP_NUM_THREADS": "1" }, - "flags": [ "100", "256", "3", "F", "64", "64", "64", "0", "0", "768", "3072" ], + "flags": [ "100", "256", "3", "F", "64", "64", "64", "0", "1", "768", "3072" ], "extensions": [ "(avx2|asimd)" ] }, "fc_fp32_omp_16_dnn": { "type": "XSMM-DNN", "benchmark": "xsmm_dnn_mlp", - "environment": { "OMP_NUM_THREADS": "16", "KMP_AFFINITY": "granularity=fine,verbose,compact,1,0" }, - "flags": [ "100", "256", "3", "F", "64", "64", "64", "0", "0", "768", "3072" ], + "environment": { "OMP_NUM_THREADS": "16", "KMP_AFFINITY": "granularity=fine,verbose,compact,1,0", "LIBXSMM_DNN_DISABLE_SFC": "1" }, + "flags": [ "100", "256", "3", "F", "64", "64", "64", "0", "1", "768", "3072" ], "extensions": [ "(avx2|asimd)" ] } }}, @@ -22,14 +22,14 @@ "type": "XSMM-DNN", "benchmark": "xsmm_dnn_mlp", "environment": { "OMP_NUM_THREADS": "1" }, - "flags": [ "100", "256", "3", "F", "64", "64", "64", "1", "1", "768", "3072" ], + "flags": [ "100", "256", "3", "F", "64", "64", "64", "1", "2", "768", "3072" ], "extensions": [ "(avx2|asimd)" ] }, "fc_bf16_omp_16_dnn": { "type": "XSMM-DNN", "benchmark": "xsmm_dnn_mlp", - "environment": { "OMP_NUM_THREADS": "16", "KMP_AFFINITY": "granularity=fine,verbose,compact,1,0" }, - "flags": [ "100", "256", "3", "F", "64", "64", "64", "1", "1", "768", "3072" ], + "environment": { "OMP_NUM_THREADS": "16", "KMP_AFFINITY": "granularity=fine,verbose,compact,1,0", "LIBXSMM_DNN_DISABLE_SFC": "1" }, + "flags": [ "100", "256", "3", "F", "64", "64", "64", "1", "2", "768", "3072" ], "extensions": [ "(avx2|asimd)" ] } }}, diff --git a/benchmarks/config/fc/256x4096x1024.json b/benchmarks/config/fc/256x4096x1024.json index 5df4f8dde..72e4a6d93 100644 --- a/benchmarks/config/fc/256x4096x1024.json +++ b/benchmarks/config/fc/256x4096x1024.json @@ -5,14 +5,14 @@ "type": "XSMM-DNN", "benchmark": "xsmm_dnn_mlp", "environment": { "OMP_NUM_THREADS": "1" }, - "flags": [ "100", "256", "3", "F", "64", "64", "64", "0", "0", "1024", "4096" ], + "flags": [ "100", "256", "3", "F", "64", "64", "64", "0", "1", "1024", "4096" ], "extensions": [ "(avx2|asimd)" ] }, "fc_fp32_omp_16_dnn": { "type": "XSMM-DNN", "benchmark": "xsmm_dnn_mlp", - "environment": { "OMP_NUM_THREADS": "16", "KMP_AFFINITY": "granularity=fine,verbose,compact,1,0" }, - "flags": [ "100", "256", "3", "F", "64", "64", "64", "0", "0", "1024", "4096" ], + "environment": { "OMP_NUM_THREADS": "16", "KMP_AFFINITY": "granularity=fine,verbose,compact,1,0", "LIBXSMM_DNN_DISABLE_SFC": "1" }, + "flags": [ "100", "256", "3", "F", "64", "64", "64", "0", "1", "1024", "4096" ], "extensions": [ "(avx2|asimd)" ] } }}, @@ -22,14 +22,14 @@ "type": "XSMM-DNN", "benchmark": "xsmm_dnn_mlp", "environment": { "OMP_NUM_THREADS": "1" }, - "flags": [ "100", "256", "3", "F", "64", "64", "64", "1", "1", "1024", "4096" ], + "flags": [ "100", "256", "3", "F", "64", "64", "64", "1", "2", "1024", "4096" ], "extensions": [ "(avx2|asimd)" ] }, "fc_bf16_omp_16_dnn": { "type": "XSMM-DNN", "benchmark": "xsmm_dnn_mlp", - "environment": { "OMP_NUM_THREADS": "16", "KMP_AFFINITY": "granularity=fine,verbose,compact,1,0" }, - "flags": [ "100", "256", "3", "F", "64", "64", "64", "1", "1", "1024", "4096" ], + "environment": { "OMP_NUM_THREADS": "16", "KMP_AFFINITY": "granularity=fine,verbose,compact,1,0", "LIBXSMM_DNN_DISABLE_SFC": "1" }, + "flags": [ "100", "256", "3", "F", "64", "64", "64", "1", "2", "1024", "4096" ], "extensions": [ "(avx2|asimd)" ] } }}, diff --git a/benchmarks/config/fc/256x768x3072.json b/benchmarks/config/fc/256x768x3072.json index a5bde928a..795b5cee2 100644 --- a/benchmarks/config/fc/256x768x3072.json +++ b/benchmarks/config/fc/256x768x3072.json @@ -5,14 +5,14 @@ "type": "XSMM-DNN", "benchmark": "xsmm_dnn_mlp", "environment": { "OMP_NUM_THREADS": "1" }, - "flags": [ "100", "256", "3", "F", "64", "64", "64", "0", "0", "3072", "768" ], + "flags": [ "100", "256", "3", "F", "64", "64", "64", "0", "1", "3072", "768" ], "extensions": [ "(avx2|asimd)" ] }, "fc_fp32_omp_16_dnn": { "type": "XSMM-DNN", "benchmark": "xsmm_dnn_mlp", - "environment": { "OMP_NUM_THREADS": "16", "KMP_AFFINITY": "granularity=fine,verbose,compact,1,0" }, - "flags": [ "100", "256", "3", "F", "64", "64", "64", "0", "0", "3072", "768" ], + "environment": { "OMP_NUM_THREADS": "16", "KMP_AFFINITY": "granularity=fine,verbose,compact,1,0", "LIBXSMM_DNN_DISABLE_SFC": "1" }, + "flags": [ "100", "256", "3", "F", "64", "64", "64", "0", "1", "3072", "768" ], "extensions": [ "(avx2|asimd)" ] } }}, @@ -22,14 +22,14 @@ "type": "XSMM-DNN", "benchmark": "xsmm_dnn_mlp", "environment": { "OMP_NUM_THREADS": "1" }, - "flags": [ "100", "256", "3", "F", "64", "64", "64", "1", "1", "3072", "768" ], + "flags": [ "100", "256", "3", "F", "64", "64", "64", "1", "2", "3072", "768" ], "extensions": [ "(avx2|asimd)" ] }, "fc_bf16_omp_16_dnn": { "type": "XSMM-DNN", "benchmark": "xsmm_dnn_mlp", - "environment": { "OMP_NUM_THREADS": "16", "KMP_AFFINITY": "granularity=fine,verbose,compact,1,0" }, - "flags": [ "100", "256", "3", "F", "64", "64", "64", "1", "1", "3072", "768" ], + "environment": { "OMP_NUM_THREADS": "16", "KMP_AFFINITY": "granularity=fine,verbose,compact,1,0", "LIBXSMM_DNN_DISABLE_SFC": "1" }, + "flags": [ "100", "256", "3", "F", "64", "64", "64", "1", "2", "3072", "768" ], "extensions": [ "(avx2|asimd)" ] } }}, diff --git a/benchmarks/config/fc/256x768x768.json b/benchmarks/config/fc/256x768x768.json index eea447d19..681ac7b7b 100644 --- a/benchmarks/config/fc/256x768x768.json +++ b/benchmarks/config/fc/256x768x768.json @@ -5,14 +5,14 @@ "type": "XSMM-DNN", "benchmark": "xsmm_dnn_mlp", "environment": { "OMP_NUM_THREADS": "1" }, - "flags": [ "100", "256", "3", "F", "64", "64", "64", "0", "0", "768", "768" ], + "flags": [ "100", "256", "3", "F", "64", "64", "64", "0", "1", "768", "768" ], "extensions": [ "(avx2|asimd)" ] }, "fc_fp32_omp_16_dnn": { "type": "XSMM-DNN", "benchmark": "xsmm_dnn_mlp", - "environment": { "OMP_NUM_THREADS": "16", "KMP_AFFINITY": "granularity=fine,verbose,compact,1,0" }, - "flags": [ "100", "256", "3", "F", "64", "64", "64", "0", "0", "768", "768" ], + "environment": { "OMP_NUM_THREADS": "16", "KMP_AFFINITY": "granularity=fine,verbose,compact,1,0", "LIBXSMM_DNN_DISABLE_SFC": "1" }, + "flags": [ "100", "256", "3", "F", "64", "64", "64", "0", "1", "768", "768" ], "extensions": [ "(avx2|asimd)" ] } }}, @@ -22,14 +22,14 @@ "type": "XSMM-DNN", "benchmark": "xsmm_dnn_mlp", "environment": { "OMP_NUM_THREADS": "1" }, - "flags": [ "100", "256", "3", "F", "64", "64", "64", "1", "1", "768", "768" ], + "flags": [ "100", "256", "3", "F", "64", "64", "64", "1", "2", "768", "768" ], "extensions": [ "(avx2|asimd)" ] }, "fc_bf16_omp_16_dnn": { "type": "XSMM-DNN", "benchmark": "xsmm_dnn_mlp", - "environment": { "OMP_NUM_THREADS": "16", "KMP_AFFINITY": "granularity=fine,verbose,compact,1,0" }, - "flags": [ "100", "256", "3", "F", "64", "64", "64", "1", "1", "768", "768" ], + "environment": { "OMP_NUM_THREADS": "16", "KMP_AFFINITY": "granularity=fine,verbose,compact,1,0", "LIBXSMM_DNN_DISABLE_SFC": "1" }, + "flags": [ "100", "256", "3", "F", "64", "64", "64", "1", "2", "768", "768" ], "extensions": [ "(avx2|asimd)" ] } }},