From ac831a6e28cb8a4f5ecf4b514d34e1a3541d900f Mon Sep 17 00:00:00 2001 From: Rahul Jauhari Date: Fri, 18 Oct 2024 11:44:17 +0530 Subject: [PATCH] Update env scripts for MatMul Algo settings - Remove the assignment of MatMul algo from environment scripts. - Add comment for recommended values. Change-Id: Ib51dd28c75b00a6368364cd2947d04acf7ca71b3 Signed-off-by: Rahul Jauhari Reviewed-on: http://gerrit-git.amd.com/c/amd/ec/ZenDNN_ONNXRuntime/+/1138979 Reviewed-by: Chandra Kumar Ramasamy Tested-by: Pratap Gadi (cherry picked from commit a9523c09242d0a67071256a979c6dc9a96a79d25) Reviewed-on: http://gerrit-git.amd.com/c/amd/ec/ZenDNN_ONNXRuntime/+/1139041 Reviewed-by: Kiriti Pendyala Tested-by: Kiriti Pendyala --- scripts/zendnn_ONNXRT_env_setup.sh | 12 ++++++------ 1 file changed, 6 insertions(+), 6 deletions(-) diff --git a/scripts/zendnn_ONNXRT_env_setup.sh b/scripts/zendnn_ONNXRT_env_setup.sh index 8ff7b84153..470eb6c7f4 100644 --- a/scripts/zendnn_ONNXRT_env_setup.sh +++ b/scripts/zendnn_ONNXRT_env_setup.sh @@ -188,9 +188,12 @@ echo "ZENDNN_INT8_SUPPORT=$ZENDNN_INT8_SUPPORT" export ZENDNN_RELU_UPPERBOUND=0 echo "ZENDNN_RELU_UPPERBOUND=$ZENDNN_RELU_UPPERBOUND" -# ZENDNN_MATMUL_ALGO is set to FP32:3 and BF16:0 by default -export ZENDNN_MATMUL_ALGO=FP32:3,BF16:0 -echo "ZENDNN_MATMUL_ALGO=$ZENDNN_MATMUL_ALGO" +# Matmul Algorithms Settings. By default, it is ZENDNN_MATMUL_ALGO=FP32:4,BF16:3. +# We recommend to override the default settings for NLPs & LLMs models by +# uncommenting the following 'export' and 'echo' commands. Note: Do not +# uncomment for AMP (Auto-Mixed Precision) mode runs of any models. +# export ZENDNN_MATMUL_ALGO=FP32:3,BF16:0 +# echo "ZENDNN_MATMUL_ALGO=$ZENDNN_MATMUL_ALGO" #Use local copy of ZenDNN library source code when building ONNXRT #Default is build from local source for development and verification. 
@@ -296,9 +299,6 @@ echo "ZENDNN_QUANTIZE_CONV_ADD_FUSION_ENABLE: $ZENDNN_QUANTIZE_CONV_ADD_FUSION_E export ZENDNN_QCONV_CLIP_FUSION_ENABLE=0 echo "ZENDNN_QCONV_CLIP_FUSION_ENABLE: $ZENDNN_QCONV_CLIP_FUSION_ENABLE" -export ZENDNN_WEIGHT_CACHING=1 -echo "ZENDNN_WEIGHT_CACHING: $ZENDNN_WEIGHT_CACHING" - # By default build Open sourced ONNXRuntime and ZenDNN export ZENDNN_ONNXRUNTIME_USE_OPENSOURCE=1 echo "ZENDNN_ONNXRUNTIME_USE_OPENSOURCE: $ZENDNN_ONNXRUNTIME_USE_OPENSOURCE"