From: Xianwei Zhang Date: Thu, 28 Jun 2018 06:13:29 +0000 (-0400) Subject: config: fix settings of kernel boundary sync flags X-Git-Tag: v20.1.0.0~562 X-Git-Url: https://git.libre-soc.org/?a=commitdiff_plain;h=f552ab85cb4f8d8256116490d6cc644deb4d55be;p=gem5.git config: fix settings of kernel boundary sync flags Change-Id: I58a8edc5d324bdcaa84e3d715e2712a43e8ede0d Reviewed-on: https://gem5-review.googlesource.com/c/public/gem5/+/29918 Reviewed-by: Anthony Gutierrez Reviewed-by: Matt Sinclair Reviewed-by: Xianwei Zhang Maintainer: Anthony Gutierrez Tested-by: kokoro --- diff --git a/configs/example/apu_se.py b/configs/example/apu_se.py index fee85f09d..0ff80d8e1 100644 --- a/configs/example/apu_se.py +++ b/configs/example/apu_se.py @@ -209,13 +209,23 @@ shader = Shader(n_wf = options.wfs_per_simd, # So, all GPU protocols other than GPU_RfO should make their writes # visible to the global memory and should read from global memory # during kernal boundary. The pipeline initiates(or do not initiate) -# the acquire/release operation depending on this impl_kern_boundary_sync -# flag. This flag=true means pipeline initiates a acquire/release operation -# at kernel boundary. +# the acquire/release operation depending on these impl_kern_launch_rel +# and impl_kern_end_rel flags. The flag=true means pipeline initiates +# a acquire/release operation at kernel launch/end. +# VIPER protocols (GPU_VIPER, GPU_VIPER_Region and GPU_VIPER_Baseline) +# are write-through based, and thus only imple_kern_launch_acq needs to +# set. if buildEnv['PROTOCOL'] == 'GPU_RfO': - shader.impl_kern_boundary_sync = False + shader.impl_kern_launch_acq = False + shader.impl_kern_end_rel = False +elif (buildEnv['PROTOCOL'] != 'GPU_VIPER' or + buildEnv['PROTOCOL'] != 'GPU_VIPER_Region' or + buildEnv['PROTOCOL'] != 'GPU_VIPER_Baseline'): + shader.impl_kern_launch_acq = True + shader.impl_kern_end_rel = False else: - shader.impl_kern_boundary_sync = True + shader.impl_kern_launch_acq = True + shader.impl_kern_end_rel = True # Switching off per-lane TLB by default per_lane = False