From c9e0a5f200a023b0687428561fbcefc9332f93c2 Mon Sep 17 00:00:00 2001 From: Tony Gutierrez Date: Mon, 8 Apr 2019 12:21:53 -0400 Subject: [PATCH] arch: Bump MaxVecRegLenInBytes to 4096 The GPU model uses the generic vector register containers, however the maximum vector register length is fixed at 256, which is an invalid assumption for the GPU model as it can operate on vectors up to 4096B. Change-Id: Id85e0ed45c9a9c1a4bb6e712c44eaeec2d628fce Reviewed-on: https://gem5-review.googlesource.com/c/public/gem5/+/17908 Reviewed-by: Anthony Gutierrez Maintainer: Anthony Gutierrez Tested-by: kokoro --- src/arch/generic/vec_reg.hh | 3 ++- 1 file changed, 2 insertions(+), 1 deletion(-) diff --git a/src/arch/generic/vec_reg.hh b/src/arch/generic/vec_reg.hh index ed2545c64..aab307b42 100644 --- a/src/arch/generic/vec_reg.hh +++ b/src/arch/generic/vec_reg.hh @@ -154,7 +154,7 @@ #include "base/cprintf.hh" #include "base/logging.hh" -constexpr unsigned MaxVecRegLenInBytes = 256; +constexpr unsigned MaxVecRegLenInBytes = 4096; template class VecRegContainer; @@ -523,6 +523,7 @@ class VecLaneT friend class VecRegContainer<32>; friend class VecRegContainer<64>; friend class VecRegContainer<128>; + friend class VecRegContainer<256>; friend class VecRegContainer; /** My type alias. */ -- 2.30.2