mirror of
https://gcc.gnu.org/git/gcc.git
synced 2024-11-24 11:24:05 +08:00
9f2fca5659
This patch considers the environment variable syntax extension for device-specific variants of environment variables from OpenMP 5.1 (see OpenMP 5.1 specification, p. 75 and p. 639). An environment variable (e.g. OMP_NUM_TEAMS) can have different suffixes: _DEV (e.g. OMP_NUM_TEAMS_DEV): affects all devices but not the host. _DEV_<device> (e.g. OMP_NUM_TEAMS_DEV_42): affects only device with number <device>. no suffix (e.g. OMP_NUM_TEAMS): affects only the host. In future OpenMP versions also suffix _ALL will be introduced (see discussion https://github.com/OpenMP/spec/issues/3179). This is also considered in this patch: _ALL (e.g. OMP_NUM_TEAMS_ALL): affects all devices and the host. The precedence is as follows (descending). For the host: 1. no suffix 2. _ALL For devices: 1. _DEV_<device> 2. _DEV 3. _ALL That means, _DEV_<device> is used whenever available. Otherwise _DEV is used if available, and at last _ALL. If there is no value for any of the variable variants, default values are used as already implemented before. This patch concerns parsing (a), storing (b), output (c) and transmission to the device (d): (a) The actual number of devices and the numbering are not known when parsing the environment variables. Thus all environment variables are iterated and searched for device-specific ones. (b) Only configured device-specific variables are stored. Thus, a linked list is used. (c) The output is done in omp_display_env (see specification p. 468f). Global ICVs are tagged with [all], see https://github.com/OpenMP/spec/issues/3179. ICVs which are not global but aren't handled device-specific yet are tagged with [host]. omp_display_env outputs the initial values of the ICVs. That is why a dedicated data structure is introduced for the initial values only (gomp_initial_icv_list). (d) Device-specific ICVs are transmitted to the device via GOMP_ADDITIONAL_ICVS. libgomp/ChangeLog: * config/gcn/icv-device.c (omp_get_default_device): Return device-specific ICV. 
(omp_get_max_teams): Added for GCN devices. (omp_set_num_teams): Likewise. (ialias): Likewise. * config/nvptx/icv-device.c (omp_get_default_device): Return device- specific ICV. (omp_get_max_teams): Added for NVPTX devices. (omp_set_num_teams): Likewise. (ialias): Likewise. * env.c (struct gomp_icv_list): New struct to store entries of initial ICV values. (struct gomp_offload_icv_list): New struct to store entries of device- specific ICV values that are copied to the device and back. (struct gomp_default_icv_values): New struct to store default values of ICVs according to the OpenMP standard. (parse_schedule): Generalized for different variants of OMP_SCHEDULE. (print_env_var_error): Function that prints an error for invalid values for ICVs. (parse_unsigned_long_1): Removed getenv. Generalized. (parse_unsigned_long): Likewise. (parse_int_1): Likewise. (parse_int): Likewise. (parse_int_secure): Likewise. (parse_unsigned_long_list): Likewise. (parse_target_offload): Likewise. (parse_bind_var): Likewise. (parse_stacksize): Likewise. (parse_boolean): Likewise. (parse_wait_policy): Likewise. (parse_allocator): Likewise. (omp_display_env): Extended to output different variants of environment variables. (print_schedule): New helper function for omp_display_env which prints the values of run_sched_var. (print_proc_bind): New helper function for omp_display_env which prints the values of proc_bind_var. (enum gomp_parse_type): Collection of types used for parsing environment variables. (ENTRY): Preprocess string lengths of environment variables. (OMP_VAR_CNT): Preprocess table size. (OMP_HOST_VAR_CNT): Likewise. (INT_MAX_STR_LEN): Constant for the maximal number of digits of a device number. (gomp_get_icv_flag): Returns if a flag for a particular ICV is set. (gomp_set_icv_flag): Sets a flag for a particular ICV. (print_device_specific_icvs): New helper function for omp_display_env to print device specific ICV values. 
(get_device_num): New helper function for parse_device_specific. Extracts the device number from an environment variable name. (get_icv_member_addr): Gets the memory address for a particular member of an ICV struct. (gomp_get_initial_icv_item): Get a list item of gomp_initial_icv_list. (initialize_icvs): New function to initialize a gomp_initial_icvs struct. (add_initial_icv_to_list): Adds an ICV struct to gomp_initial_icv_list. (startswith): Checks if a string starts with a given prefix. (initialize_env): Extended to parse the new syntax of environment variables. * icv-device.c (omp_get_max_teams): Added. (ialias): Likewise. (omp_set_num_teams): Likewise. * icv.c (omp_set_num_teams): Moved to icv-device.c. (omp_get_max_teams): Likewise. (ialias): Likewise. * libgomp-plugin.h (GOMP_DEVICE_NUM_VAR): Removed. (GOMP_ADDITIONAL_ICVS): New target-side struct that holds the designated ICVs of the target device. * libgomp.h (enum gomp_icvs): Collection of ICVs. (enum gomp_device_num): Definition of device numbers for _ALL, _DEV, and no suffix. (enum gomp_env_suffix): Collection of possible suffixes of environment variables. (struct gomp_initial_icvs): Contains all ICVs for which we need to store initial values. (struct gomp_default_icv):New struct to hold ICVs for which we need to store initial values. (struct gomp_icv_list): Definition of a linked list that is used for storing ICVs for the devices and also for _DEV, _ALL, and without suffix. (struct gomp_offload_icvs): New struct to hold ICVs that are copied to a device. (struct gomp_offload_icv_list): Definition of a linked list that holds device-specific ICVs that are copied to devices. (gomp_get_initial_icv_item): Get a list item of gomp_initial_icv_list. (gomp_get_icv_flag): Returns if a flag for a particular ICV is set. * libgomp.texi: Updated. * plugin/plugin-gcn.c (GOMP_OFFLOAD_load_image): Extended to read further ICVs from the offload image. * plugin/plugin-nvptx.c (GOMP_OFFLOAD_load_image): Likewise. 
* target.c (gomp_get_offload_icv_item): Get a list item of gomp_offload_icv_list. (get_gomp_offload_icvs): New. Returns the ICV values depending on the device num and the variable hierarchy. (gomp_load_image_to_device): Extended to copy further ICVs to a device. * testsuite/libgomp.c-c++-common/icv-5.c: New test. * testsuite/libgomp.c-c++-common/icv-6.c: New test. * testsuite/libgomp.c-c++-common/icv-7.c: New test. * testsuite/libgomp.c-c++-common/icv-8.c: New test. * testsuite/libgomp.c-c++-common/omp-display-env-1.c: New test. * testsuite/libgomp.c-c++-common/omp-display-env-2.c: New test.
275 lines
6.2 KiB
C
275 lines
6.2 KiB
C
/* Copyright (C) 2005-2022 Free Software Foundation, Inc.
|
|
Contributed by Richard Henderson <rth@redhat.com>.
|
|
|
|
This file is part of the GNU Offloading and Multi Processing Library
|
|
(libgomp).
|
|
|
|
Libgomp is free software; you can redistribute it and/or modify it
|
|
under the terms of the GNU General Public License as published by
|
|
the Free Software Foundation; either version 3, or (at your option)
|
|
any later version.
|
|
|
|
Libgomp is distributed in the hope that it will be useful, but WITHOUT ANY
|
|
WARRANTY; without even the implied warranty of MERCHANTABILITY or FITNESS
|
|
FOR A PARTICULAR PURPOSE. See the GNU General Public License for
|
|
more details.
|
|
|
|
Under Section 7 of GPL version 3, you are granted additional
|
|
permissions described in the GCC Runtime Library Exception, version
|
|
3.1, as published by the Free Software Foundation.
|
|
|
|
You should have received a copy of the GNU General Public License and
|
|
a copy of the GCC Runtime Library Exception along with this program;
|
|
see the files COPYING3 and COPYING.RUNTIME respectively. If not, see
|
|
<http://www.gnu.org/licenses/>. */
|
|
|
|
/* This file defines the OpenMP API entry points that operate on internal
|
|
control variables. */
|
|
|
|
#include "libgomp.h"
|
|
#include "gomp-constants.h"
|
|
#include <limits.h>
|
|
|
|
/* NOTE(review): ialias_redirect is a macro defined outside this file
   (presumably in libgomp.h).  It is applied here to omp_get_active_level,
   which this file calls from omp_get_nested but does not define; confirm
   the exact redirection semantics against the macro definition.  */
ialias_redirect (omp_get_active_level)
|
|
|
|
void
|
|
omp_set_num_threads (int n)
|
|
{
|
|
struct gomp_task_icv *icv = gomp_icv (true);
|
|
icv->nthreads_var = (n > 0 ? n : 1);
|
|
}
|
|
|
|
void
|
|
omp_set_dynamic (int val)
|
|
{
|
|
struct gomp_task_icv *icv = gomp_icv (true);
|
|
icv->dyn_var = val;
|
|
}
|
|
|
|
int
|
|
omp_get_dynamic (void)
|
|
{
|
|
struct gomp_task_icv *icv = gomp_icv (false);
|
|
return icv->dyn_var;
|
|
}
|
|
|
|
#pragma GCC diagnostic push
|
|
#pragma GCC diagnostic ignored "-Wdeprecated-declarations"
|
|
void
|
|
omp_set_nested (int val)
|
|
{
|
|
struct gomp_task_icv *icv = gomp_icv (true);
|
|
if (val)
|
|
icv->max_active_levels_var = gomp_supported_active_levels;
|
|
else if (icv->max_active_levels_var > 1)
|
|
icv->max_active_levels_var = 1;
|
|
}
|
|
|
|
int
|
|
omp_get_nested (void)
|
|
{
|
|
struct gomp_task_icv *icv = gomp_icv (false);
|
|
return (icv->max_active_levels_var > 1
|
|
&& icv->max_active_levels_var > omp_get_active_level ());
|
|
}
|
|
#pragma GCC diagnostic pop
|
|
|
|
void
|
|
omp_set_schedule (omp_sched_t kind, int chunk_size)
|
|
{
|
|
struct gomp_task_icv *icv = gomp_icv (true);
|
|
switch (kind & ~omp_sched_monotonic)
|
|
{
|
|
case omp_sched_static:
|
|
if (chunk_size < 1)
|
|
chunk_size = 0;
|
|
icv->run_sched_chunk_size = chunk_size;
|
|
break;
|
|
case omp_sched_dynamic:
|
|
case omp_sched_guided:
|
|
if (chunk_size < 1)
|
|
chunk_size = 1;
|
|
icv->run_sched_chunk_size = chunk_size;
|
|
break;
|
|
case omp_sched_auto:
|
|
break;
|
|
default:
|
|
return;
|
|
}
|
|
icv->run_sched_var = kind;
|
|
}
|
|
|
|
void
|
|
omp_get_schedule (omp_sched_t *kind, int *chunk_size)
|
|
{
|
|
struct gomp_task_icv *icv = gomp_icv (false);
|
|
*kind = icv->run_sched_var;
|
|
*chunk_size = icv->run_sched_chunk_size;
|
|
}
|
|
|
|
int
|
|
omp_get_max_threads (void)
|
|
{
|
|
struct gomp_task_icv *icv = gomp_icv (false);
|
|
return icv->nthreads_var;
|
|
}
|
|
|
|
int
|
|
omp_get_thread_limit (void)
|
|
{
|
|
struct gomp_task_icv *icv = gomp_icv (false);
|
|
return icv->thread_limit_var > INT_MAX ? INT_MAX : icv->thread_limit_var;
|
|
}
|
|
|
|
void
|
|
omp_set_max_active_levels (int max_levels)
|
|
{
|
|
if (max_levels >= 0)
|
|
{
|
|
struct gomp_task_icv *icv = gomp_icv (true);
|
|
|
|
if (max_levels <= gomp_supported_active_levels)
|
|
icv->max_active_levels_var = max_levels;
|
|
else
|
|
icv->max_active_levels_var = gomp_supported_active_levels;
|
|
}
|
|
}
|
|
|
|
int
|
|
omp_get_max_active_levels (void)
|
|
{
|
|
struct gomp_task_icv *icv = gomp_icv (false);
|
|
return icv->max_active_levels_var;
|
|
}
|
|
|
|
int
|
|
omp_get_supported_active_levels (void)
|
|
{
|
|
return gomp_supported_active_levels;
|
|
}
|
|
|
|
void
|
|
omp_set_teams_thread_limit (int thread_limit)
|
|
{
|
|
if (thread_limit >= 0)
|
|
gomp_teams_thread_limit_var = thread_limit;
|
|
}
|
|
|
|
int
|
|
omp_get_teams_thread_limit (void)
|
|
{
|
|
return gomp_teams_thread_limit_var;
|
|
}
|
|
|
|
int
|
|
omp_get_cancellation (void)
|
|
{
|
|
return gomp_cancel_var;
|
|
}
|
|
|
|
int
|
|
omp_get_max_task_priority (void)
|
|
{
|
|
return gomp_max_task_priority_var;
|
|
}
|
|
|
|
omp_proc_bind_t
|
|
omp_get_proc_bind (void)
|
|
{
|
|
struct gomp_task_icv *icv = gomp_icv (false);
|
|
return icv->bind_var;
|
|
}
|
|
|
|
int
|
|
omp_get_num_places (void)
|
|
{
|
|
return gomp_places_list_len;
|
|
}
|
|
|
|
int
|
|
omp_get_place_num (void)
|
|
{
|
|
if (gomp_places_list == NULL)
|
|
return -1;
|
|
|
|
struct gomp_thread *thr = gomp_thread ();
|
|
if (thr->place == 0)
|
|
gomp_init_affinity ();
|
|
|
|
return (int) thr->place - 1;
|
|
}
|
|
|
|
int
|
|
omp_get_partition_num_places (void)
|
|
{
|
|
if (gomp_places_list == NULL)
|
|
return 0;
|
|
|
|
struct gomp_thread *thr = gomp_thread ();
|
|
if (thr->place == 0)
|
|
gomp_init_affinity ();
|
|
|
|
return thr->ts.place_partition_len;
|
|
}
|
|
|
|
void
|
|
omp_get_partition_place_nums (int *place_nums)
|
|
{
|
|
if (gomp_places_list == NULL)
|
|
return;
|
|
|
|
struct gomp_thread *thr = gomp_thread ();
|
|
if (thr->place == 0)
|
|
gomp_init_affinity ();
|
|
|
|
unsigned int i;
|
|
for (i = 0; i < thr->ts.place_partition_len; i++)
|
|
*place_nums++ = thr->ts.place_partition_off + i;
|
|
}
|
|
|
|
void
|
|
omp_set_default_allocator (omp_allocator_handle_t allocator)
|
|
{
|
|
struct gomp_thread *thr = gomp_thread ();
|
|
if (allocator == omp_null_allocator)
|
|
allocator = omp_default_mem_alloc;
|
|
thr->ts.def_allocator = (uintptr_t) allocator;
|
|
}
|
|
|
|
omp_allocator_handle_t
|
|
omp_get_default_allocator (void)
|
|
{
|
|
struct gomp_thread *thr = gomp_thread ();
|
|
if (thr->ts.def_allocator == omp_null_allocator)
|
|
return (omp_allocator_handle_t) gomp_def_allocator;
|
|
else
|
|
return (omp_allocator_handle_t) thr->ts.def_allocator;
|
|
}
|
|
|
|
ialias (omp_set_dynamic)
|
|
ialias (omp_get_dynamic)
|
|
#pragma GCC diagnostic push
|
|
#pragma GCC diagnostic ignored "-Wdeprecated-declarations"
|
|
ialias (omp_set_nested)
|
|
ialias (omp_get_nested)
|
|
#pragma GCC diagnostic pop
|
|
ialias (omp_set_num_threads)
|
|
ialias (omp_set_schedule)
|
|
ialias (omp_get_schedule)
|
|
ialias (omp_get_max_threads)
|
|
ialias (omp_get_thread_limit)
|
|
ialias (omp_set_max_active_levels)
|
|
ialias (omp_get_max_active_levels)
|
|
ialias (omp_get_supported_active_levels)
|
|
ialias (omp_set_teams_thread_limit)
|
|
ialias (omp_get_teams_thread_limit)
|
|
ialias (omp_get_cancellation)
|
|
ialias (omp_get_proc_bind)
|
|
ialias (omp_get_max_task_priority)
|
|
ialias (omp_get_num_places)
|
|
ialias (omp_get_place_num)
|
|
ialias (omp_get_partition_num_places)
|
|
ialias (omp_get_partition_place_nums)
|
|
ialias (omp_set_default_allocator)
|
|
ialias (omp_get_default_allocator)
|