[libgomp, nvptx] Report launch dimensions in GOMP_OFFLOAD_run

author Tom de Vries <tdevries@suse.de>
Thu, 8 Oct 2020 06:22:39 +0000 (08:22 +0200)
committer Tom de Vries <tdevries@suse.de>
Thu, 8 Oct 2020 09:03:29 +0000 (11:03 +0200)
diff --git a/libgomp/plugin/plugin-nvptx.c b/libgomp/plugin/plugin-nvptx.c
index a63dd1a99fbc58b23e0d7bfd68f22254e4238795..11d4ceeae62e141fa7d63a1772d6dcb50de5d6fb 100644
--- a/libgomp/plugin/plugin-nvptx.c
+++ b/libgomp/plugin/plugin-nvptx.c
@@ -1891,7 +1891,11 @@ nvptx_stacks_free (void *p, int num)
  void
  GOMP_OFFLOAD_run (int ord, void *tgt_fn, void *tgt_vars, void **args)
  {
-  CUfunction function = ((struct targ_fn_descriptor *) tgt_fn)->fn;
+  struct targ_fn_descriptor *tgt_fn_desc
+    = (struct targ_fn_descriptor *) tgt_fn;
+  CUfunction function = tgt_fn_desc->fn;
+  const struct targ_fn_launch *launch = tgt_fn_desc->launch;
+  const char *fn_name = launch->fn;
    CUresult r;
    struct ptx_device *ptx_dev = ptx_devices[ord];
    const char *maybe_abort_msg = "(perhaps abort was called)";
@@ -1926,6 +1930,9 @@ GOMP_OFFLOAD_run (int ord, void *tgt_fn, void *tgt_vars, void **args)
      CU_LAUNCH_PARAM_BUFFER_SIZE, &fn_args_size,
      CU_LAUNCH_PARAM_END
    };
+  GOMP_PLUGIN_debug (0, "  %s: kernel %s: launch"
+                    " [(teams: %u), 1, 1] [(lanes: 32), (threads: %u), 1]\n",
+                    __FUNCTION__, fn_name, teams, threads);
    r = CUDA_CALL_NOCHECK (cuLaunchKernel, function, teams, 1, 1,
                          32, threads, 1, 0, NULL, NULL, config);
    if (r != CUDA_SUCCESS)
author	Tom de Vries <tdevries@suse.de>
	Thu, 8 Oct 2020 06:22:39 +0000 (08:22 +0200)
committer	Tom de Vries <tdevries@suse.de>
	Thu, 8 Oct 2020 09:03:29 +0000 (11:03 +0200)