| /* Copyright (C) 2013-2021 Free Software Foundation, Inc. |
| |
| Contributed by Mentor Embedded. |
| |
| This file is part of the GNU Offloading and Multi Processing Library |
| (libgomp). |
| |
| Libgomp is free software; you can redistribute it and/or modify it |
| under the terms of the GNU General Public License as published by |
| the Free Software Foundation; either version 3, or (at your option) |
| any later version. |
| |
| Libgomp is distributed in the hope that it will be useful, but WITHOUT ANY |
| WARRANTY; without even the implied warranty of MERCHANTABILITY or FITNESS |
| FOR A PARTICULAR PURPOSE. See the GNU General Public License for |
| more details. |
| |
| Under Section 7 of GPL version 3, you are granted additional |
| permissions described in the GCC Runtime Library Exception, version |
| 3.1, as published by the Free Software Foundation. |
| |
| You should have received a copy of the GNU General Public License and |
| a copy of the GCC Runtime Library Exception along with this program; |
| see the files COPYING3 and COPYING.RUNTIME respectively. If not, see |
| <http://www.gnu.org/licenses/>. */ |
| |
| /* This file handles OpenACC constructs. */ |
| |
| #include "openacc.h" |
| #include "libgomp.h" |
| #include "gomp-constants.h" |
| #include "oacc-int.h" |
| #ifdef HAVE_INTTYPES_H |
| # include <inttypes.h> /* For PRIu64. */ |
| #endif |
| #include <string.h> |
| #include <stdarg.h> |
| #include <assert.h> |
| |
| |
| /* In the ABI, the GOACC_FLAGs are encoded as an inverted bitmask, so that we |
| continue to support the following two legacy values. */ |
| _Static_assert (GOACC_FLAGS_UNMARSHAL (GOMP_DEVICE_ICV) == 0, |
| "legacy GOMP_DEVICE_ICV broken"); |
| _Static_assert (GOACC_FLAGS_UNMARSHAL (GOMP_DEVICE_HOST_FALLBACK) |
| == GOACC_FLAG_HOST_FALLBACK, |
| "legacy GOMP_DEVICE_HOST_FALLBACK broken"); |
| |
| |
| /* Handle the mapping pair that are presented when a |
| deviceptr clause is used with Fortran. */ |
| |
| static void |
| handle_ftn_pointers (size_t mapnum, void **hostaddrs, size_t *sizes, |
| unsigned short *kinds) |
| { |
| int i; |
| |
| for (i = 0; i < mapnum; i++) |
| { |
| unsigned short kind1 = kinds[i] & 0xff; |
| |
| /* Handle Fortran deviceptr clause. */ |
| if (kind1 == GOMP_MAP_FORCE_DEVICEPTR) |
| { |
| unsigned short kind2; |
| |
| if (i < (signed)mapnum - 1) |
| kind2 = kinds[i + 1] & 0xff; |
| else |
| kind2 = 0xffff; |
| |
| if (sizes[i] == sizeof (void *)) |
| continue; |
| |
| /* At this point, we're dealing with a Fortran deviceptr. |
| If the next element is not what we're expecting, then |
| this is an instance of where the deviceptr variable was |
| not used within the region and the pointer was removed |
| by the gimplifier. */ |
| if (kind2 == GOMP_MAP_POINTER |
| && sizes[i + 1] == 0 |
| && hostaddrs[i] == *(void **)hostaddrs[i + 1]) |
| { |
| kinds[i+1] = kinds[i]; |
| sizes[i+1] = sizeof (void *); |
| } |
| |
| /* Invalidate the entry. */ |
| hostaddrs[i] = NULL; |
| } |
| } |
| } |
| |
| |
| /* Launch a possibly offloaded function with FLAGS. FN is the host fn |
| address. MAPNUM, HOSTADDRS, SIZES & KINDS describe the memory |
| blocks to be copied to/from the device. Varadic arguments are |
| keyed optional parameters terminated with a zero. */ |
| |
| void |
| GOACC_parallel_keyed (int flags_m, void (*fn) (void *), |
| size_t mapnum, void **hostaddrs, size_t *sizes, |
| unsigned short *kinds, ...) |
| { |
| int flags = GOACC_FLAGS_UNMARSHAL (flags_m); |
| |
| va_list ap; |
| struct goacc_thread *thr; |
| struct gomp_device_descr *acc_dev; |
| struct target_mem_desc *tgt; |
| void **devaddrs; |
| unsigned int i; |
| struct splay_tree_key_s k; |
| splay_tree_key tgt_fn_key; |
| void (*tgt_fn); |
| int async = GOMP_ASYNC_SYNC; |
| unsigned dims[GOMP_DIM_MAX]; |
| unsigned tag; |
| |
| #ifdef HAVE_INTTYPES_H |
| gomp_debug (0, "%s: mapnum=%"PRIu64", hostaddrs=%p, size=%p, kinds=%p\n", |
| __FUNCTION__, (uint64_t) mapnum, hostaddrs, sizes, kinds); |
| #else |
| gomp_debug (0, "%s: mapnum=%lu, hostaddrs=%p, sizes=%p, kinds=%p\n", |
| __FUNCTION__, (unsigned long) mapnum, hostaddrs, sizes, kinds); |
| #endif |
| goacc_lazy_initialize (); |
| |
| thr = goacc_thread (); |
| acc_dev = thr->dev; |
| |
| bool profiling_p = GOACC_PROFILING_DISPATCH_P (true); |
| |
| acc_prof_info prof_info; |
| if (profiling_p) |
| { |
| thr->prof_info = &prof_info; |
| |
| prof_info.event_type = acc_ev_compute_construct_start; |
| prof_info.valid_bytes = _ACC_PROF_INFO_VALID_BYTES; |
| prof_info.version = _ACC_PROF_INFO_VERSION; |
| prof_info.device_type = acc_device_type (acc_dev->type); |
| prof_info.device_number = acc_dev->target_id; |
| prof_info.thread_id = -1; |
| prof_info.async = async; |
| prof_info.async_queue = prof_info.async; |
| prof_info.src_file = NULL; |
| prof_info.func_name = NULL; |
| prof_info.line_no = -1; |
| prof_info.end_line_no = -1; |
| prof_info.func_line_no = -1; |
| prof_info.func_end_line_no = -1; |
| } |
| acc_event_info compute_construct_event_info; |
| if (profiling_p) |
| { |
| compute_construct_event_info.other_event.event_type |
| = prof_info.event_type; |
| compute_construct_event_info.other_event.valid_bytes |
| = _ACC_OTHER_EVENT_INFO_VALID_BYTES; |
| compute_construct_event_info.other_event.parent_construct |
| = acc_construct_parallel; |
| compute_construct_event_info.other_event.implicit = 0; |
| compute_construct_event_info.other_event.tool_info = NULL; |
| } |
| acc_api_info api_info; |
| if (profiling_p) |
| { |
| thr->api_info = &api_info; |
| |
| api_info.device_api = acc_device_api_none; |
| api_info.valid_bytes = _ACC_API_INFO_VALID_BYTES; |
| api_info.device_type = prof_info.device_type; |
| api_info.vendor = -1; |
| api_info.device_handle = NULL; |
| api_info.context_handle = NULL; |
| api_info.async_handle = NULL; |
| } |
| |
| if (profiling_p) |
| goacc_profiling_dispatch (&prof_info, &compute_construct_event_info, |
| &api_info); |
| |
| handle_ftn_pointers (mapnum, hostaddrs, sizes, kinds); |
| |
| /* Host fallback if "if" clause is false or if the current device is set to |
| the host. */ |
| if (flags & GOACC_FLAG_HOST_FALLBACK) |
| { |
| prof_info.device_type = acc_device_host; |
| api_info.device_type = prof_info.device_type; |
| goacc_save_and_set_bind (acc_device_host); |
| fn (hostaddrs); |
| goacc_restore_bind (); |
| goto out_prof; |
| } |
| else if (acc_device_type (acc_dev->type) == acc_device_host) |
| { |
| fn (hostaddrs); |
| goto out_prof; |
| } |
| |
| /* Default: let the runtime choose. */ |
| for (i = 0; i != GOMP_DIM_MAX; i++) |
| dims[i] = 0; |
| |
| va_start (ap, kinds); |
| /* TODO: This will need amending when device_type is implemented. */ |
| while ((tag = va_arg (ap, unsigned)) != 0) |
| { |
| if (GOMP_LAUNCH_DEVICE (tag)) |
| gomp_fatal ("device_type '%d' offload parameters, libgomp is too old", |
| GOMP_LAUNCH_DEVICE (tag)); |
| |
| switch (GOMP_LAUNCH_CODE (tag)) |
| { |
| case GOMP_LAUNCH_DIM: |
| { |
| unsigned mask = GOMP_LAUNCH_OP (tag); |
| |
| for (i = 0; i != GOMP_DIM_MAX; i++) |
| if (mask & GOMP_DIM_MASK (i)) |
| dims[i] = va_arg (ap, unsigned); |
| } |
| break; |
| |
| case GOMP_LAUNCH_ASYNC: |
| { |
| /* Small constant values are encoded in the operand. */ |
| async = GOMP_LAUNCH_OP (tag); |
| |
| if (async == GOMP_LAUNCH_OP_MAX) |
| async = va_arg (ap, unsigned); |
| |
| if (profiling_p) |
| { |
| prof_info.async = async; |
| prof_info.async_queue = prof_info.async; |
| } |
| |
| break; |
| } |
| |
| case GOMP_LAUNCH_WAIT: |
| { |
| unsigned num_waits = GOMP_LAUNCH_OP (tag); |
| goacc_wait (async, num_waits, &ap); |
| break; |
| } |
| |
| default: |
| gomp_fatal ("unrecognized offload code '%d'," |
| " libgomp is too old", GOMP_LAUNCH_CODE (tag)); |
| } |
| } |
| va_end (ap); |
| |
| if (!(acc_dev->capabilities & GOMP_OFFLOAD_CAP_NATIVE_EXEC)) |
| { |
| k.host_start = (uintptr_t) fn; |
| k.host_end = k.host_start + 1; |
| gomp_mutex_lock (&acc_dev->lock); |
| tgt_fn_key = splay_tree_lookup (&acc_dev->mem_map, &k); |
| gomp_mutex_unlock (&acc_dev->lock); |
| |
| if (tgt_fn_key == NULL) |
| gomp_fatal ("target function wasn't mapped"); |
| |
| tgt_fn = (void (*)) tgt_fn_key->tgt_offset; |
| } |
| else |
| tgt_fn = (void (*)) fn; |
| |
| acc_event_info enter_exit_data_event_info; |
| if (profiling_p) |
| { |
| prof_info.event_type = acc_ev_enter_data_start; |
| enter_exit_data_event_info.other_event.event_type |
| = prof_info.event_type; |
| enter_exit_data_event_info.other_event.valid_bytes |
| = _ACC_OTHER_EVENT_INFO_VALID_BYTES; |
| enter_exit_data_event_info.other_event.parent_construct |
| = compute_construct_event_info.other_event.parent_construct; |
| enter_exit_data_event_info.other_event.implicit = 1; |
| enter_exit_data_event_info.other_event.tool_info = NULL; |
| goacc_profiling_dispatch (&prof_info, &enter_exit_data_event_info, |
| &api_info); |
| } |
| |
| goacc_aq aq = get_goacc_asyncqueue (async); |
| |
| tgt = gomp_map_vars_async (acc_dev, aq, mapnum, hostaddrs, NULL, sizes, kinds, |
| true, GOMP_MAP_VARS_OPENACC); |
| if (profiling_p) |
| { |
| prof_info.event_type = acc_ev_enter_data_end; |
| enter_exit_data_event_info.other_event.event_type |
| = prof_info.event_type; |
| goacc_profiling_dispatch (&prof_info, &enter_exit_data_event_info, |
| &api_info); |
| } |
| |
| devaddrs = gomp_alloca (sizeof (void *) * mapnum); |
| for (i = 0; i < mapnum; i++) |
| devaddrs[i] = (void *) gomp_map_val (tgt, hostaddrs, i); |
| |
| if (aq == NULL) |
| acc_dev->openacc.exec_func (tgt_fn, mapnum, hostaddrs, devaddrs, dims, |
| tgt); |
| else |
| acc_dev->openacc.async.exec_func (tgt_fn, mapnum, hostaddrs, devaddrs, |
| dims, tgt, aq); |
| |
| if (profiling_p) |
| { |
| prof_info.event_type = acc_ev_exit_data_start; |
| enter_exit_data_event_info.other_event.event_type = prof_info.event_type; |
| enter_exit_data_event_info.other_event.tool_info = NULL; |
| goacc_profiling_dispatch (&prof_info, &enter_exit_data_event_info, |
| &api_info); |
| } |
| |
| /* If running synchronously, unmap immediately. */ |
| if (aq == NULL) |
| gomp_unmap_vars (tgt, true); |
| else |
| gomp_unmap_vars_async (tgt, true, aq); |
| |
| if (profiling_p) |
| { |
| prof_info.event_type = acc_ev_exit_data_end; |
| enter_exit_data_event_info.other_event.event_type = prof_info.event_type; |
| goacc_profiling_dispatch (&prof_info, &enter_exit_data_event_info, |
| &api_info); |
| } |
| |
| out_prof: |
| if (profiling_p) |
| { |
| prof_info.event_type = acc_ev_compute_construct_end; |
| compute_construct_event_info.other_event.event_type |
| = prof_info.event_type; |
| goacc_profiling_dispatch (&prof_info, &compute_construct_event_info, |
| &api_info); |
| |
| thr->prof_info = NULL; |
| thr->api_info = NULL; |
| } |
| } |
| |
| /* Legacy entry point (GCC 5). Only provide host fallback execution. */ |
| |
| void |
| GOACC_parallel (int flags_m, void (*fn) (void *), |
| size_t mapnum, void **hostaddrs, size_t *sizes, |
| unsigned short *kinds, |
| int num_gangs, int num_workers, int vector_length, |
| int async, int num_waits, ...) |
| { |
| goacc_save_and_set_bind (acc_device_host); |
| fn (hostaddrs); |
| goacc_restore_bind (); |
| } |
| |
| void |
| GOACC_data_start (int flags_m, size_t mapnum, |
| void **hostaddrs, size_t *sizes, unsigned short *kinds) |
| { |
| int flags = GOACC_FLAGS_UNMARSHAL (flags_m); |
| |
| struct target_mem_desc *tgt; |
| |
| #ifdef HAVE_INTTYPES_H |
| gomp_debug (0, "%s: mapnum=%"PRIu64", hostaddrs=%p, size=%p, kinds=%p\n", |
| __FUNCTION__, (uint64_t) mapnum, hostaddrs, sizes, kinds); |
| #else |
| gomp_debug (0, "%s: mapnum=%lu, hostaddrs=%p, sizes=%p, kinds=%p\n", |
| __FUNCTION__, (unsigned long) mapnum, hostaddrs, sizes, kinds); |
| #endif |
| |
| goacc_lazy_initialize (); |
| |
| struct goacc_thread *thr = goacc_thread (); |
| struct gomp_device_descr *acc_dev = thr->dev; |
| |
| bool profiling_p = GOACC_PROFILING_DISPATCH_P (true); |
| |
| acc_prof_info prof_info; |
| if (profiling_p) |
| { |
| thr->prof_info = &prof_info; |
| |
| prof_info.event_type = acc_ev_enter_data_start; |
| prof_info.valid_bytes = _ACC_PROF_INFO_VALID_BYTES; |
| prof_info.version = _ACC_PROF_INFO_VERSION; |
| prof_info.device_type = acc_device_type (acc_dev->type); |
| prof_info.device_number = acc_dev->target_id; |
| prof_info.thread_id = -1; |
| prof_info.async = acc_async_sync; /* Always synchronous. */ |
| prof_info.async_queue = prof_info.async; |
| prof_info.src_file = NULL; |
| prof_info.func_name = NULL; |
| prof_info.line_no = -1; |
| prof_info.end_line_no = -1; |
| prof_info.func_line_no = -1; |
| prof_info.func_end_line_no = -1; |
| } |
| acc_event_info enter_data_event_info; |
| if (profiling_p) |
| { |
| enter_data_event_info.other_event.event_type |
| = prof_info.event_type; |
| enter_data_event_info.other_event.valid_bytes |
| = _ACC_OTHER_EVENT_INFO_VALID_BYTES; |
| enter_data_event_info.other_event.parent_construct = acc_construct_data; |
| for (int i = 0; i < mapnum; ++i) |
| if ((kinds[i] & 0xff) == GOMP_MAP_USE_DEVICE_PTR |
| || (kinds[i] & 0xff) == GOMP_MAP_USE_DEVICE_PTR_IF_PRESENT) |
| { |
| /* If there is one such data mapping kind, then this is actually an |
| OpenACC 'host_data' construct. (GCC maps the OpenACC |
| 'host_data' construct to the OpenACC 'data' construct.) Apart |
| from artificial test cases (such as an OpenACC 'host_data' |
| construct's (implicit) device initialization when there hasn't |
| been any device data be set up before...), there can't really |
| any meaningful events be generated from OpenACC 'host_data' |
| constructs, though. */ |
| enter_data_event_info.other_event.parent_construct |
| = acc_construct_host_data; |
| break; |
| } |
| enter_data_event_info.other_event.implicit = 0; |
| enter_data_event_info.other_event.tool_info = NULL; |
| } |
| acc_api_info api_info; |
| if (profiling_p) |
| { |
| thr->api_info = &api_info; |
| |
| api_info.device_api = acc_device_api_none; |
| api_info.valid_bytes = _ACC_API_INFO_VALID_BYTES; |
| api_info.device_type = prof_info.device_type; |
| api_info.vendor = -1; |
| api_info.device_handle = NULL; |
| api_info.context_handle = NULL; |
| api_info.async_handle = NULL; |
| } |
| |
| if (profiling_p) |
| goacc_profiling_dispatch (&prof_info, &enter_data_event_info, &api_info); |
| |
| /* Host fallback or 'do nothing'. */ |
| if ((acc_dev->capabilities & GOMP_OFFLOAD_CAP_SHARED_MEM) |
| || (flags & GOACC_FLAG_HOST_FALLBACK)) |
| { |
| prof_info.device_type = acc_device_host; |
| api_info.device_type = prof_info.device_type; |
| tgt = gomp_map_vars (NULL, 0, NULL, NULL, NULL, NULL, true, |
| GOMP_MAP_VARS_OPENACC); |
| tgt->prev = thr->mapped_data; |
| thr->mapped_data = tgt; |
| |
| goto out_prof; |
| } |
| |
| gomp_debug (0, " %s: prepare mappings\n", __FUNCTION__); |
| tgt = gomp_map_vars (acc_dev, mapnum, hostaddrs, NULL, sizes, kinds, true, |
| GOMP_MAP_VARS_OPENACC); |
| gomp_debug (0, " %s: mappings prepared\n", __FUNCTION__); |
| tgt->prev = thr->mapped_data; |
| thr->mapped_data = tgt; |
| |
| out_prof: |
| if (profiling_p) |
| { |
| prof_info.event_type = acc_ev_enter_data_end; |
| enter_data_event_info.other_event.event_type = prof_info.event_type; |
| goacc_profiling_dispatch (&prof_info, &enter_data_event_info, &api_info); |
| |
| thr->prof_info = NULL; |
| thr->api_info = NULL; |
| } |
| } |
| |
| void |
| GOACC_data_end (void) |
| { |
| struct goacc_thread *thr = goacc_thread (); |
| struct gomp_device_descr *acc_dev = thr->dev; |
| struct target_mem_desc *tgt = thr->mapped_data; |
| |
| bool profiling_p = GOACC_PROFILING_DISPATCH_P (true); |
| |
| acc_prof_info prof_info; |
| if (profiling_p) |
| { |
| thr->prof_info = &prof_info; |
| |
| prof_info.event_type = acc_ev_exit_data_start; |
| prof_info.valid_bytes = _ACC_PROF_INFO_VALID_BYTES; |
| prof_info.version = _ACC_PROF_INFO_VERSION; |
| prof_info.device_type = acc_device_type (acc_dev->type); |
| prof_info.device_number = acc_dev->target_id; |
| prof_info.thread_id = -1; |
| prof_info.async = acc_async_sync; /* Always synchronous. */ |
| prof_info.async_queue = prof_info.async; |
| prof_info.src_file = NULL; |
| prof_info.func_name = NULL; |
| prof_info.line_no = -1; |
| prof_info.end_line_no = -1; |
| prof_info.func_line_no = -1; |
| prof_info.func_end_line_no = -1; |
| } |
| acc_event_info exit_data_event_info; |
| if (profiling_p) |
| { |
| exit_data_event_info.other_event.event_type |
| = prof_info.event_type; |
| exit_data_event_info.other_event.valid_bytes |
| = _ACC_OTHER_EVENT_INFO_VALID_BYTES; |
| exit_data_event_info.other_event.parent_construct = acc_construct_data; |
| exit_data_event_info.other_event.implicit = 0; |
| exit_data_event_info.other_event.tool_info = NULL; |
| } |
| acc_api_info api_info; |
| if (profiling_p) |
| { |
| thr->api_info = &api_info; |
| |
| api_info.device_api = acc_device_api_none; |
| api_info.valid_bytes = _ACC_API_INFO_VALID_BYTES; |
| api_info.device_type = prof_info.device_type; |
| api_info.vendor = -1; |
| api_info.device_handle = NULL; |
| api_info.context_handle = NULL; |
| api_info.async_handle = NULL; |
| } |
| |
| if (profiling_p) |
| goacc_profiling_dispatch (&prof_info, &exit_data_event_info, &api_info); |
| |
| gomp_debug (0, " %s: restore mappings\n", __FUNCTION__); |
| thr->mapped_data = tgt->prev; |
| gomp_unmap_vars (tgt, true); |
| gomp_debug (0, " %s: mappings restored\n", __FUNCTION__); |
| |
| if (profiling_p) |
| { |
| prof_info.event_type = acc_ev_exit_data_end; |
| exit_data_event_info.other_event.event_type = prof_info.event_type; |
| goacc_profiling_dispatch (&prof_info, &exit_data_event_info, &api_info); |
| |
| thr->prof_info = NULL; |
| thr->api_info = NULL; |
| } |
| } |
| |
| void |
| GOACC_update (int flags_m, size_t mapnum, |
| void **hostaddrs, size_t *sizes, unsigned short *kinds, |
| int async, int num_waits, ...) |
| { |
| int flags = GOACC_FLAGS_UNMARSHAL (flags_m); |
| |
| size_t i; |
| |
| goacc_lazy_initialize (); |
| |
| struct goacc_thread *thr = goacc_thread (); |
| struct gomp_device_descr *acc_dev = thr->dev; |
| |
| bool profiling_p = GOACC_PROFILING_DISPATCH_P (true); |
| |
| acc_prof_info prof_info; |
| if (profiling_p) |
| { |
| thr->prof_info = &prof_info; |
| |
| prof_info.event_type = acc_ev_update_start; |
| prof_info.valid_bytes = _ACC_PROF_INFO_VALID_BYTES; |
| prof_info.version = _ACC_PROF_INFO_VERSION; |
| prof_info.device_type = acc_device_type (acc_dev->type); |
| prof_info.device_number = acc_dev->target_id; |
| prof_info.thread_id = -1; |
| prof_info.async = async; |
| prof_info.async_queue = prof_info.async; |
| prof_info.src_file = NULL; |
| prof_info.func_name = NULL; |
| prof_info.line_no = -1; |
| prof_info.end_line_no = -1; |
| prof_info.func_line_no = -1; |
| prof_info.func_end_line_no = -1; |
| } |
| acc_event_info update_event_info; |
| if (profiling_p) |
| { |
| update_event_info.other_event.event_type |
| = prof_info.event_type; |
| update_event_info.other_event.valid_bytes |
| = _ACC_OTHER_EVENT_INFO_VALID_BYTES; |
| update_event_info.other_event.parent_construct = acc_construct_update; |
| update_event_info.other_event.implicit = 0; |
| update_event_info.other_event.tool_info = NULL; |
| } |
| acc_api_info api_info; |
| if (profiling_p) |
| { |
| thr->api_info = &api_info; |
| |
| api_info.device_api = acc_device_api_none; |
| api_info.valid_bytes = _ACC_API_INFO_VALID_BYTES; |
| api_info.device_type = prof_info.device_type; |
| api_info.vendor = -1; |
| api_info.device_handle = NULL; |
| api_info.context_handle = NULL; |
| api_info.async_handle = NULL; |
| } |
| |
| if (profiling_p) |
| goacc_profiling_dispatch (&prof_info, &update_event_info, &api_info); |
| |
| if ((acc_dev->capabilities & GOMP_OFFLOAD_CAP_SHARED_MEM) |
| || (flags & GOACC_FLAG_HOST_FALLBACK)) |
| { |
| prof_info.device_type = acc_device_host; |
| api_info.device_type = prof_info.device_type; |
| |
| goto out_prof; |
| } |
| |
| if (num_waits) |
| { |
| va_list ap; |
| |
| va_start (ap, num_waits); |
| goacc_wait (async, num_waits, &ap); |
| va_end (ap); |
| } |
| |
| bool update_device = false; |
| for (i = 0; i < mapnum; ++i) |
| { |
| unsigned char kind = kinds[i] & 0xff; |
| |
| switch (kind) |
| { |
| case GOMP_MAP_POINTER: |
| case GOMP_MAP_TO_PSET: |
| break; |
| |
| case GOMP_MAP_ALWAYS_POINTER: |
| if (update_device) |
| { |
| /* Save the contents of the host pointer. */ |
| void *dptr = acc_deviceptr (hostaddrs[i-1]); |
| uintptr_t t = *(uintptr_t *) hostaddrs[i]; |
| |
| /* Update the contents of the host pointer to reflect |
| the value of the allocated device memory in the |
| previous pointer. */ |
| *(uintptr_t *) hostaddrs[i] = (uintptr_t)dptr; |
| /* TODO: verify that we really cannot use acc_update_device_async |
| here. */ |
| acc_update_device (hostaddrs[i], sizeof (uintptr_t)); |
| |
| /* Restore the host pointer. */ |
| *(uintptr_t *) hostaddrs[i] = t; |
| update_device = false; |
| } |
| break; |
| |
| case GOMP_MAP_TO: |
| if (!acc_is_present (hostaddrs[i], sizes[i])) |
| { |
| update_device = false; |
| break; |
| } |
| /* Fallthru */ |
| case GOMP_MAP_FORCE_TO: |
| update_device = true; |
| acc_update_device_async (hostaddrs[i], sizes[i], async); |
| break; |
| |
| case GOMP_MAP_FROM: |
| if (!acc_is_present (hostaddrs[i], sizes[i])) |
| { |
| update_device = false; |
| break; |
| } |
| /* Fallthru */ |
| case GOMP_MAP_FORCE_FROM: |
| update_device = false; |
| acc_update_self_async (hostaddrs[i], sizes[i], async); |
| break; |
| |
| default: |
| gomp_fatal (">>>> GOACC_update UNHANDLED kind 0x%.2x", kind); |
| break; |
| } |
| } |
| |
| out_prof: |
| if (profiling_p) |
| { |
| prof_info.event_type = acc_ev_update_end; |
| update_event_info.other_event.event_type = prof_info.event_type; |
| goacc_profiling_dispatch (&prof_info, &update_event_info, &api_info); |
| |
| thr->prof_info = NULL; |
| thr->api_info = NULL; |
| } |
| } |
| |
| |
/* Legacy entry point (GCC 5).  Always reports a single thread.  */

int
GOACC_get_num_threads (void)
{
  const int legacy_num_threads = 1;

  return legacy_num_threads;
}
| |
/* Legacy entry point (GCC 5).  Always reports thread number zero.  */

int
GOACC_get_thread_num (void)
{
  const int legacy_thread_num = 0;

  return legacy_thread_num;
}
| |
| void |
| GOACC_declare (int flags_m, size_t mapnum, |
| void **hostaddrs, size_t *sizes, unsigned short *kinds) |
| { |
| int i; |
| |
| for (i = 0; i < mapnum; i++) |
| { |
| unsigned char kind = kinds[i] & 0xff; |
| |
| if (kind == GOMP_MAP_POINTER || kind == GOMP_MAP_TO_PSET) |
| continue; |
| |
| switch (kind) |
| { |
| case GOMP_MAP_FORCE_ALLOC: |
| case GOMP_MAP_FORCE_FROM: |
| case GOMP_MAP_FORCE_TO: |
| case GOMP_MAP_POINTER: |
| case GOMP_MAP_RELEASE: |
| case GOMP_MAP_DELETE: |
| GOACC_enter_exit_data (flags_m, 1, &hostaddrs[i], &sizes[i], |
| &kinds[i], GOMP_ASYNC_SYNC, 0); |
| break; |
| |
| case GOMP_MAP_FORCE_DEVICEPTR: |
| break; |
| |
| case GOMP_MAP_ALLOC: |
| if (!acc_is_present (hostaddrs[i], sizes[i])) |
| GOACC_enter_exit_data (flags_m, 1, &hostaddrs[i], &sizes[i], |
| &kinds[i], GOMP_ASYNC_SYNC, 0); |
| break; |
| |
| case GOMP_MAP_TO: |
| GOACC_enter_exit_data (flags_m, 1, &hostaddrs[i], &sizes[i], |
| &kinds[i], GOMP_ASYNC_SYNC, 0); |
| |
| break; |
| |
| case GOMP_MAP_FROM: |
| GOACC_enter_exit_data (flags_m, 1, &hostaddrs[i], &sizes[i], |
| &kinds[i], GOMP_ASYNC_SYNC, 0); |
| break; |
| |
| case GOMP_MAP_FORCE_PRESENT: |
| if (!acc_is_present (hostaddrs[i], sizes[i])) |
| gomp_fatal ("[%p,%ld] is not mapped", hostaddrs[i], |
| (unsigned long) sizes[i]); |
| break; |
| |
| default: |
| assert (0); |
| break; |
| } |
| } |
| } |