From 40949e60857fcea8e7b8d9c476c01bca027a2057 Mon Sep 17 00:00:00 2001 From: Olivier Marsden Date: Mon, 17 Jun 2024 08:33:45 +0000 Subject: [PATCH] Improved runtime information on GPU binary. --- src/trans/gpu/external/setup_trans0.F90 | 20 +++++++++++++++++--- 1 file changed, 17 insertions(+), 3 deletions(-) diff --git a/src/trans/gpu/external/setup_trans0.F90 b/src/trans/gpu/external/setup_trans0.F90 index 2c18a35d..b6dedbde 100755 --- a/src/trans/gpu/external/setup_trans0.F90 +++ b/src/trans/gpu/external/setup_trans0.F90 @@ -191,10 +191,24 @@ SUBROUTINE SETUP_TRANS0(KOUT,KERR,KPRINTLEV,KMAX_RESOL,KPROMATR,& WRITE(NOUT,'(A)') WRITE(NOUT,'(A)') "ecTrans at version: " // ECTRANS_VERSION_STR() WRITE(NOUT,'(A)') "commit: " // ECTRANS_GIT_SHA1() -#ifdef USE_CUDA_AWARE_MPI_FT -WRITE(NOUT,'(A)') "GPU version with GPU-aware MPI" +WRITE(NOUT,'(A)') +WRITE(NOUT,'(A)') "GPU version, with following compile-time options : " +#ifdef ACCGPU + WRITE(NOUT,'(A)') " - OpenACC-based offload" #else -WRITE(NOUT,'(A)') "GPU version" + WRITE(NOUT,'(A)') " - OpenMP-based offload" +#endif +#ifdef USE_CUDA_AWARE_MPI_FT + WRITE(NOUT,'(A)') " - GPU-aware MPI" +#endif +#ifdef USE_GRAPHS_GEMM + WRITE(NOUT,'(A)') " - graph-based GEMM scheduling" +#endif +#ifdef USE_CUTLASS + WRITE(NOUT,'(A)') " - Cutlass-based GEMM operations" +#endif +#ifdef USE_3XTF32 + WRITE(NOUT,'(A)') " - tensor-core usage for 32b Cutlass operations" #endif WRITE(NOUT,'(A)')