From a0195132e8739fdea9cbfcef5d04ab1afcfb17c8 Mon Sep 17 00:00:00 2001
From: moneta <lorenzo.moneta@cern.ch>
Date: Tue, 21 Aug 2018 10:10:43 +0200
Subject: [PATCH] Use fast zero GPU initialisation for Cuda matrices

---
 .../src/DNN/Architectures/Cuda/Initialization.cu | 13 ++-----------
 1 file changed, 2 insertions(+), 11 deletions(-)

diff --git a/tmva/tmva/src/DNN/Architectures/Cuda/Initialization.cu b/tmva/tmva/src/DNN/Architectures/Cuda/Initialization.cu
index 6efd88ddcd2..3acb8afebfd 100644
--- a/tmva/tmva/src/DNN/Architectures/Cuda/Initialization.cu
+++ b/tmva/tmva/src/DNN/Architectures/Cuda/Initialization.cu
@@ -158,17 +158,8 @@ void TCuda<AFloat>::InitializeIdentity(TCudaMatrix<AFloat> & A)
 template<typename AFloat>
 void TCuda<AFloat>::InitializeZero(TCudaMatrix<AFloat> & A)
 {
-   size_t m,n;
-   m = A.GetNrows();
-   n = A.GetNcols();
-   TMatrixT<AFloat> B(m, n);
-
-   for (size_t i = 0; i < m; i++) {
-      for (size_t j = 0; j < n ; j++) {
-         B(i,j) = 0.0;
-      }
-   }
-   A = B;
+   // use fast zero initialization on the device
+   A.Zero();
 }
 
 } // namespace DNN
-- 
GitLab