6c84c8bf9b
Add generic support for the OpenACC 2.6 `acc_get_property' and `acc_get_property_string' routines, as well as full handlers for the host and the NVPTX offload targets and minimal handlers for the HSA, Intel MIC, and AMD GCN offload targets. Included are C/C++ and Fortran tests that, in particular, print the property values for acc_property_vendor, acc_property_memory, acc_property_free_memory, acc_property_name, and acc_property_driver. The output looks as follows: Vendor: GNU Name: GOMP Total memory: 0 Free memory: 0 Driver: 1.0 with the host driver (where the memory related properties are not supported for the host device and yield 0, conforming to the standard) and output like: Vendor: Nvidia Total memory: 12651462656 Free memory: 12202737664 Name: TITAN V Driver: CUDA Driver 9.1 with the NVPTX driver. 2019-12-22 Maciej W. Rozycki <macro@codesourcery.com> Frederik Harwath <frederik@codesourcery.com> Thomas Schwinge <tschwinge@codesourcery.com> include/ * gomp-constants.h (gomp_device_property): New enum. libgomp/ * libgomp.h (gomp_device_descr): Add `get_property_func' member. * libgomp-plugin.h (gomp_device_property_value): New union. (gomp_device_property_value): New prototype. * openacc.h (acc_device_t): Add `acc_device_current' enumeration constant. (acc_device_property_t): New enum. (acc_get_property, acc_get_property_string): New prototypes. * oacc-init.c (acc_get_device_type): Also assert that result is not `acc_device_current'. (get_property_any, acc_get_property, acc_get_property_string): New functions. * openacc.f90 (openacc_kinds): Add `acc_device_current' and `acc_property_memory', `acc_property_free_memory', `acc_property_name', `acc_property_vendor' and `acc_property_driver' constants. Add `acc_device_property' data type. (openacc_internal): Add `acc_get_property' and `acc_get_property_string' interfaces. Add `acc_get_property_h', `acc_get_property_string_h', `acc_get_property_l' and `acc_get_property_string_l'. * oacc-host.c (host_get_property): New function. (host_dispatch): Wire it. * target.c (gomp_load_plugin_for_device): Handle `get_property'. * libgomp.map (OACC_2.6): Add `acc_get_property', `acc_get_property_h_', `acc_get_property_string' and `acc_get_property_string_h_' symbols. * libgomp.texi (OpenACC Runtime Library Routines): Add `acc_get_property'. (acc_get_property): New node. * plugin/plugin-gcn.c (GOMP_OFFLOAD_get_property): New function (stub). * plugin/plugin-hsa.c (GOMP_OFFLOAD_get_property): New function. * plugin/plugin-nvptx.c (CUDA_CALLS): Add `cuDeviceGetName', `cuDeviceTotalMem', `cuDriverGetVersion' and `cuMemGetInfo' calls. (GOMP_OFFLOAD_get_property): New function. (struct ptx_device): Add new field "name". (cuda_driver_version_s): Add new static variable ... (nvptx_init): ... and init from here. * testsuite/libgomp.oacc-c-c++-common/acc_get_property.c: New test. * testsuite/libgomp.oacc-c-c++-common/acc_get_property-2.c: New test. * testsuite/libgomp.oacc-c-c++-common/acc_get_property-3.c: New test. * testsuite/libgomp.oacc-c-c++-common/acc_get_property-aux.c: New file with test helper functions. * testsuite/libgomp.oacc-fortran/acc_get_property.f90: New test. liboffloadmic/ * plugin/libgomp-plugin-intelmic.cpp (GOMP_OFFLOAD_get_property): New function. Reviewed-by: Thomas Schwinge <thomas@codesourcery.com> Co-Authored-By: Frederik Harwath <frederik@codesourcery.com> Co-Authored-By: Thomas Schwinge <tschwinge@codesourcery.com> From-SVN: r279710
322 lines
7.7 KiB
C
322 lines
7.7 KiB
C
/* OpenACC Runtime Library: acc_device_host.
|
|
|
|
Copyright (C) 2013-2019 Free Software Foundation, Inc.
|
|
|
|
Contributed by Mentor Embedded.
|
|
|
|
This file is part of the GNU Offloading and Multi Processing Library
|
|
(libgomp).
|
|
|
|
Libgomp is free software; you can redistribute it and/or modify it
|
|
under the terms of the GNU General Public License as published by
|
|
the Free Software Foundation; either version 3, or (at your option)
|
|
any later version.
|
|
|
|
Libgomp is distributed in the hope that it will be useful, but WITHOUT ANY
|
|
WARRANTY; without even the implied warranty of MERCHANTABILITY or FITNESS
|
|
FOR A PARTICULAR PURPOSE. See the GNU General Public License for
|
|
more details.
|
|
|
|
Under Section 7 of GPL version 3, you are granted additional
|
|
permissions described in the GCC Runtime Library Exception, version
|
|
3.1, as published by the Free Software Foundation.
|
|
|
|
You should have received a copy of the GNU General Public License and
|
|
a copy of the GCC Runtime Library Exception along with this program;
|
|
see the files COPYING3 and COPYING.RUNTIME respectively. If not, see
|
|
<http://www.gnu.org/licenses/>. */
|
|
|
|
#include "libgomp.h"
|
|
#include "oacc-int.h"
|
|
#include "gomp-constants.h"
|
|
|
|
#include <stdbool.h>
|
|
#include <stddef.h>
|
|
|
|
static struct gomp_device_descr host_dispatch;
|
|
|
|
static const char *
|
|
host_get_name (void)
|
|
{
|
|
return host_dispatch.name;
|
|
}
|
|
|
|
static unsigned int
|
|
host_get_caps (void)
|
|
{
|
|
return host_dispatch.capabilities;
|
|
}
|
|
|
|
static int
|
|
host_get_type (void)
|
|
{
|
|
return host_dispatch.type;
|
|
}
|
|
|
|
static int
|
|
host_get_num_devices (void)
|
|
{
|
|
return 1;
|
|
}
|
|
|
|
static union gomp_device_property_value
|
|
host_get_property (int n, int prop)
|
|
{
|
|
union gomp_device_property_value nullval = { .val = 0 };
|
|
|
|
if (n >= host_get_num_devices ())
|
|
return nullval;
|
|
|
|
switch (prop)
|
|
{
|
|
case GOMP_DEVICE_PROPERTY_NAME:
|
|
return (union gomp_device_property_value) { .ptr = "GOMP" };
|
|
case GOMP_DEVICE_PROPERTY_VENDOR:
|
|
return (union gomp_device_property_value) { .ptr = "GNU" };
|
|
case GOMP_DEVICE_PROPERTY_DRIVER:
|
|
return (union gomp_device_property_value) { .ptr = VERSION };
|
|
default:
|
|
return nullval;
|
|
}
|
|
}
|
|
|
|
static bool
|
|
host_init_device (int n __attribute__ ((unused)))
|
|
{
|
|
return true;
|
|
}
|
|
|
|
static bool
|
|
host_fini_device (int n __attribute__ ((unused)))
|
|
{
|
|
return true;
|
|
}
|
|
|
|
static unsigned
|
|
host_version (void)
|
|
{
|
|
return GOMP_VERSION;
|
|
}
|
|
|
|
static int
|
|
host_load_image (int n __attribute__ ((unused)),
|
|
unsigned v __attribute__ ((unused)),
|
|
const void *t __attribute__ ((unused)),
|
|
struct addr_pair **r __attribute__ ((unused)))
|
|
{
|
|
return 0;
|
|
}
|
|
|
|
static bool
|
|
host_unload_image (int n __attribute__ ((unused)),
|
|
unsigned v __attribute__ ((unused)),
|
|
const void *t __attribute__ ((unused)))
|
|
{
|
|
return true;
|
|
}
|
|
|
|
static void *
|
|
host_alloc (int n __attribute__ ((unused)), size_t s)
|
|
{
|
|
return gomp_malloc (s);
|
|
}
|
|
|
|
static bool
|
|
host_free (int n __attribute__ ((unused)), void *p)
|
|
{
|
|
free (p);
|
|
return true;
|
|
}
|
|
|
|
static bool
|
|
host_dev2host (int n __attribute__ ((unused)),
|
|
void *h __attribute__ ((unused)),
|
|
const void *d __attribute__ ((unused)),
|
|
size_t s __attribute__ ((unused)))
|
|
{
|
|
return true;
|
|
}
|
|
|
|
static bool
|
|
host_host2dev (int n __attribute__ ((unused)),
|
|
void *d __attribute__ ((unused)),
|
|
const void *h __attribute__ ((unused)),
|
|
size_t s __attribute__ ((unused)))
|
|
{
|
|
return true;
|
|
}
|
|
|
|
static void
|
|
host_run (int n __attribute__ ((unused)), void *fn_ptr, void *vars,
|
|
void **args __attribute__((unused)))
|
|
{
|
|
void (*fn)(void *) = (void (*)(void *)) fn_ptr;
|
|
|
|
fn (vars);
|
|
}
|
|
|
|
static void
|
|
host_openacc_exec (void (*fn) (void *),
|
|
size_t mapnum __attribute__ ((unused)),
|
|
void **hostaddrs,
|
|
void **devaddrs __attribute__ ((unused)),
|
|
unsigned *dims __attribute__ ((unused)),
|
|
void *targ_mem_desc __attribute__ ((unused)))
|
|
{
|
|
fn (hostaddrs);
|
|
}
|
|
|
|
static void
|
|
host_openacc_async_exec (void (*fn) (void *),
|
|
size_t mapnum __attribute__ ((unused)),
|
|
void **hostaddrs,
|
|
void **devaddrs __attribute__ ((unused)),
|
|
unsigned *dims __attribute__ ((unused)),
|
|
void *targ_mem_desc __attribute__ ((unused)),
|
|
struct goacc_asyncqueue *aq __attribute__ ((unused)))
|
|
{
|
|
fn (hostaddrs);
|
|
}
|
|
|
|
static int
|
|
host_openacc_async_test (struct goacc_asyncqueue *aq __attribute__ ((unused)))
|
|
{
|
|
return 1;
|
|
}
|
|
|
|
static bool
|
|
host_openacc_async_synchronize (struct goacc_asyncqueue *aq
|
|
__attribute__ ((unused)))
|
|
{
|
|
return true;
|
|
}
|
|
|
|
static bool
|
|
host_openacc_async_serialize (struct goacc_asyncqueue *aq1
|
|
__attribute__ ((unused)),
|
|
struct goacc_asyncqueue *aq2
|
|
__attribute__ ((unused)))
|
|
{
|
|
return true;
|
|
}
|
|
|
|
static bool
|
|
host_openacc_async_host2dev (int ord __attribute__ ((unused)),
|
|
void *dst __attribute__ ((unused)),
|
|
const void *src __attribute__ ((unused)),
|
|
size_t n __attribute__ ((unused)),
|
|
struct goacc_asyncqueue *aq
|
|
__attribute__ ((unused)))
|
|
{
|
|
return true;
|
|
}
|
|
|
|
static bool
|
|
host_openacc_async_dev2host (int ord __attribute__ ((unused)),
|
|
void *dst __attribute__ ((unused)),
|
|
const void *src __attribute__ ((unused)),
|
|
size_t n __attribute__ ((unused)),
|
|
struct goacc_asyncqueue *aq
|
|
__attribute__ ((unused)))
|
|
{
|
|
return true;
|
|
}
|
|
|
|
static void
|
|
host_openacc_async_queue_callback (struct goacc_asyncqueue *aq
|
|
__attribute__ ((unused)),
|
|
void (*callback_fn)(void *)
|
|
__attribute__ ((unused)),
|
|
void *userptr __attribute__ ((unused)))
|
|
{
|
|
}
|
|
|
|
static struct goacc_asyncqueue *
|
|
host_openacc_async_construct (int device __attribute__((unused)))
|
|
{
|
|
/* Non-NULL 0xffff... value as opaque dummy. */
|
|
return (struct goacc_asyncqueue *) -1;
|
|
}
|
|
|
|
static bool
|
|
host_openacc_async_destruct (struct goacc_asyncqueue *aq
|
|
__attribute__ ((unused)))
|
|
{
|
|
return true;
|
|
}
|
|
|
|
static void *
|
|
host_openacc_create_thread_data (int ord __attribute__ ((unused)))
|
|
{
|
|
return NULL;
|
|
}
|
|
|
|
static void
|
|
host_openacc_destroy_thread_data (void *tls_data __attribute__ ((unused)))
|
|
{
|
|
}
|
|
|
|
static struct gomp_device_descr host_dispatch =
|
|
{
|
|
.name = "host",
|
|
.capabilities = (GOMP_OFFLOAD_CAP_SHARED_MEM
|
|
| GOMP_OFFLOAD_CAP_NATIVE_EXEC
|
|
| GOMP_OFFLOAD_CAP_OPENACC_200),
|
|
.target_id = 0,
|
|
.type = OFFLOAD_TARGET_TYPE_HOST,
|
|
|
|
.get_name_func = host_get_name,
|
|
.get_caps_func = host_get_caps,
|
|
.get_type_func = host_get_type,
|
|
.get_num_devices_func = host_get_num_devices,
|
|
.get_property_func = host_get_property,
|
|
.init_device_func = host_init_device,
|
|
.fini_device_func = host_fini_device,
|
|
.version_func = host_version,
|
|
.load_image_func = host_load_image,
|
|
.unload_image_func = host_unload_image,
|
|
.alloc_func = host_alloc,
|
|
.free_func = host_free,
|
|
.dev2host_func = host_dev2host,
|
|
.host2dev_func = host_host2dev,
|
|
.run_func = host_run,
|
|
|
|
.mem_map = { NULL },
|
|
/* .lock initialized in goacc_host_init. */
|
|
.state = GOMP_DEVICE_UNINITIALIZED,
|
|
|
|
.openacc = {
|
|
.exec_func = host_openacc_exec,
|
|
|
|
.create_thread_data_func = host_openacc_create_thread_data,
|
|
.destroy_thread_data_func = host_openacc_destroy_thread_data,
|
|
|
|
.async = {
|
|
.construct_func = host_openacc_async_construct,
|
|
.destruct_func = host_openacc_async_destruct,
|
|
.test_func = host_openacc_async_test,
|
|
.synchronize_func = host_openacc_async_synchronize,
|
|
.serialize_func = host_openacc_async_serialize,
|
|
.queue_callback_func = host_openacc_async_queue_callback,
|
|
.exec_func = host_openacc_async_exec,
|
|
.dev2host_func = host_openacc_async_dev2host,
|
|
.host2dev_func = host_openacc_async_host2dev,
|
|
},
|
|
|
|
.cuda = {
|
|
.get_current_device_func = NULL,
|
|
.get_current_context_func = NULL,
|
|
.get_stream_func = NULL,
|
|
.set_stream_func = NULL,
|
|
}
|
|
}
|
|
};
|
|
|
|
/* Initialize and register this device type. */
|
|
void
|
|
goacc_host_init (void)
|
|
{
|
|
gomp_mutex_init (&host_dispatch.lock);
|
|
goacc_register (&host_dispatch);
|
|
}
|