7d6da11fce
The following patch implements what I've been talking about earlier, honor that for explicit num_teams clause we create at least the lower-bound (if not specified, upper-bound) teams in the league. For host fallback, it still means we only have one thread doing all the teams, sequentially one after another. For PTX and GCN, I think the new teams-2.c test and maybe teams-4.c too will or might fail. For these offloads, I think it is ok to remove symbols no longer used from libgomp.a. If num_teams_lower is bigger than the provided num_blocks or num_workgroups, we should arrange for gomp_num_teams_var to be num_teams_lower - 1, stop using the %ctaid.x or __builtin_gcn_dim_pos (0) for omp_get_team_num () and instead use for it some .shared var that GOMP_teams4 initializes to %ctaid.x or __builtin_gcn_dim_pos (0) when first and for !first increment that by num_blocks or num_workgroups each time and only return false when we are above num_teams_lower. Any help with actually implementing this for the 2 architectures highly appreciated. 2021-11-12 Jakub Jelinek <jakub@redhat.com> gcc/ * omp-builtins.def (BUILT_IN_GOMP_TEAMS): Remove. (BUILT_IN_GOMP_TEAMS4): New. * builtin-types.def (BT_FN_VOID_UINT_UINT): Remove. (BT_FN_BOOL_UINT_UINT_UINT_BOOL): New. * omp-low.c (lower_omp_teams): Use GOMP_teams4 instead of GOMP_teams, pass to it also num_teams lower-bound expression or a dup of upper-bound if it is missing and a flag whether it is the first call or not. gcc/fortran/ * types.def (BT_FN_VOID_UINT_UINT): Remove. (BT_FN_BOOL_UINT_UINT_UINT_BOOL): New. libgomp/ * libgomp_g.h (GOMP_teams4): Declare. * libgomp.map (GOMP_5.1): Export GOMP_teams4. * target.c (GOMP_teams4): New function. * config/nvptx/target.c (GOMP_teams): Remove. (GOMP_teams4): New function. * config/gcn/target.c (GOMP_teams): Remove. (GOMP_teams4): New function. * testsuite/libgomp.c/teams-4.c (main): Expect exactly 2 teams instead of <= 2. * testsuite/libgomp.c-c++-common/teams-2.c: New test.
404 lines
15 KiB
C
404 lines
15 KiB
C
/* Copyright (C) 2005-2021 Free Software Foundation, Inc.
|
|
Contributed by Richard Henderson <rth@redhat.com>.
|
|
|
|
This file is part of the GNU Offloading and Multi Processing Library
|
|
(libgomp).
|
|
|
|
Libgomp is free software; you can redistribute it and/or modify it
|
|
under the terms of the GNU General Public License as published by
|
|
the Free Software Foundation; either version 3, or (at your option)
|
|
any later version.
|
|
|
|
Libgomp is distributed in the hope that it will be useful, but WITHOUT ANY
|
|
WARRANTY; without even the implied warranty of MERCHANTABILITY or FITNESS
|
|
FOR A PARTICULAR PURPOSE. See the GNU General Public License for
|
|
more details.
|
|
|
|
Under Section 7 of GPL version 3, you are granted additional
|
|
permissions described in the GCC Runtime Library Exception, version
|
|
3.1, as published by the Free Software Foundation.
|
|
|
|
You should have received a copy of the GNU General Public License and
|
|
a copy of the GCC Runtime Library Exception along with this program;
|
|
see the files COPYING3 and COPYING.RUNTIME respectively. If not, see
|
|
<http://www.gnu.org/licenses/>. */
|
|
|
|
/* This file contains prototypes of functions in the external ABI.
|
|
This file is included by files in the testsuite. */
|
|
|
|
#ifndef LIBGOMP_G_H
|
|
#define LIBGOMP_G_H 1
|
|
|
|
#include <stdbool.h>
|
|
#include <stddef.h>
|
|
#include <stdint.h>
|
|
|
|
/* barrier.c */
|
|
|
|
extern void GOMP_barrier (void);
|
|
extern bool GOMP_barrier_cancel (void);
|
|
|
|
/* critical.c */
|
|
|
|
extern void GOMP_critical_start (void);
|
|
extern void GOMP_critical_end (void);
|
|
extern void GOMP_critical_name_start (void **);
|
|
extern void GOMP_critical_name_end (void **);
|
|
extern void GOMP_atomic_start (void);
|
|
extern void GOMP_atomic_end (void);
|
|
|
|
/* loop.c */
|
|
|
|
extern bool GOMP_loop_static_start (long, long, long, long, long *, long *);
|
|
extern bool GOMP_loop_dynamic_start (long, long, long, long, long *, long *);
|
|
extern bool GOMP_loop_guided_start (long, long, long, long, long *, long *);
|
|
extern bool GOMP_loop_runtime_start (long, long, long, long *, long *);
|
|
extern bool GOMP_loop_nonmonotonic_dynamic_start (long, long, long, long,
|
|
long *, long *);
|
|
extern bool GOMP_loop_nonmonotonic_guided_start (long, long, long, long,
|
|
long *, long *);
|
|
extern bool GOMP_loop_nonmonotonic_runtime_start (long, long, long,
|
|
long *, long *);
|
|
extern bool GOMP_loop_maybe_nonmonotonic_runtime_start (long, long, long,
|
|
long *, long *);
|
|
extern bool GOMP_loop_start (long, long, long, long, long, long *, long *,
|
|
uintptr_t *, void **);
|
|
|
|
extern bool GOMP_loop_ordered_static_start (long, long, long, long,
|
|
long *, long *);
|
|
extern bool GOMP_loop_ordered_dynamic_start (long, long, long, long,
|
|
long *, long *);
|
|
extern bool GOMP_loop_ordered_guided_start (long, long, long, long,
|
|
long *, long *);
|
|
extern bool GOMP_loop_ordered_runtime_start (long, long, long, long *, long *);
|
|
extern bool GOMP_loop_ordered_start (long, long, long, long, long, long *,
|
|
long *, uintptr_t *, void **);
|
|
|
|
extern bool GOMP_loop_static_next (long *, long *);
|
|
extern bool GOMP_loop_dynamic_next (long *, long *);
|
|
extern bool GOMP_loop_guided_next (long *, long *);
|
|
extern bool GOMP_loop_runtime_next (long *, long *);
|
|
extern bool GOMP_loop_nonmonotonic_dynamic_next (long *, long *);
|
|
extern bool GOMP_loop_nonmonotonic_guided_next (long *, long *);
|
|
extern bool GOMP_loop_nonmonotonic_runtime_next (long *, long *);
|
|
extern bool GOMP_loop_maybe_nonmonotonic_runtime_next (long *, long *);
|
|
|
|
extern bool GOMP_loop_ordered_static_next (long *, long *);
|
|
extern bool GOMP_loop_ordered_dynamic_next (long *, long *);
|
|
extern bool GOMP_loop_ordered_guided_next (long *, long *);
|
|
extern bool GOMP_loop_ordered_runtime_next (long *, long *);
|
|
|
|
extern bool GOMP_loop_doacross_static_start (unsigned, long *, long, long *,
|
|
long *);
|
|
extern bool GOMP_loop_doacross_dynamic_start (unsigned, long *, long, long *,
|
|
long *);
|
|
extern bool GOMP_loop_doacross_guided_start (unsigned, long *, long, long *,
|
|
long *);
|
|
extern bool GOMP_loop_doacross_runtime_start (unsigned, long *, long *,
|
|
long *);
|
|
extern bool GOMP_loop_doacross_start (unsigned, long *, long, long, long *,
|
|
long *, uintptr_t *, void **);
|
|
|
|
extern void GOMP_parallel_loop_static_start (void (*)(void *), void *,
|
|
unsigned, long, long, long, long);
|
|
extern void GOMP_parallel_loop_dynamic_start (void (*)(void *), void *,
|
|
unsigned, long, long, long, long);
|
|
extern void GOMP_parallel_loop_guided_start (void (*)(void *), void *,
|
|
unsigned, long, long, long, long);
|
|
extern void GOMP_parallel_loop_runtime_start (void (*)(void *), void *,
|
|
unsigned, long, long, long);
|
|
extern void GOMP_parallel_loop_static (void (*)(void *), void *,
|
|
unsigned, long, long, long, long,
|
|
unsigned);
|
|
extern void GOMP_parallel_loop_dynamic (void (*)(void *), void *,
|
|
unsigned, long, long, long, long,
|
|
unsigned);
|
|
extern void GOMP_parallel_loop_guided (void (*)(void *), void *,
|
|
unsigned, long, long, long, long,
|
|
unsigned);
|
|
extern void GOMP_parallel_loop_runtime (void (*)(void *), void *,
|
|
unsigned, long, long, long,
|
|
unsigned);
|
|
extern void GOMP_parallel_loop_nonmonotonic_dynamic (void (*)(void *), void *,
|
|
unsigned, long, long,
|
|
long, long, unsigned);
|
|
extern void GOMP_parallel_loop_nonmonotonic_guided (void (*)(void *), void *,
|
|
unsigned, long, long,
|
|
long, long, unsigned);
|
|
extern void GOMP_parallel_loop_nonmonotonic_runtime (void (*)(void *), void *,
|
|
unsigned, long, long,
|
|
long, unsigned);
|
|
extern void GOMP_parallel_loop_maybe_nonmonotonic_runtime (void (*)(void *),
|
|
void *, unsigned,
|
|
long, long,
|
|
long, unsigned);
|
|
|
|
extern void GOMP_loop_end (void);
|
|
extern void GOMP_loop_end_nowait (void);
|
|
extern bool GOMP_loop_end_cancel (void);
|
|
|
|
/* loop_ull.c */
|
|
|
|
extern bool GOMP_loop_ull_static_start (bool, unsigned long long,
|
|
unsigned long long,
|
|
unsigned long long,
|
|
unsigned long long,
|
|
unsigned long long *,
|
|
unsigned long long *);
|
|
extern bool GOMP_loop_ull_dynamic_start (bool, unsigned long long,
|
|
unsigned long long,
|
|
unsigned long long,
|
|
unsigned long long,
|
|
unsigned long long *,
|
|
unsigned long long *);
|
|
extern bool GOMP_loop_ull_guided_start (bool, unsigned long long,
|
|
unsigned long long,
|
|
unsigned long long,
|
|
unsigned long long,
|
|
unsigned long long *,
|
|
unsigned long long *);
|
|
extern bool GOMP_loop_ull_runtime_start (bool, unsigned long long,
|
|
unsigned long long,
|
|
unsigned long long,
|
|
unsigned long long *,
|
|
unsigned long long *);
|
|
extern bool GOMP_loop_ull_nonmonotonic_dynamic_start (bool, unsigned long long,
|
|
unsigned long long,
|
|
unsigned long long,
|
|
unsigned long long,
|
|
unsigned long long *,
|
|
unsigned long long *);
|
|
extern bool GOMP_loop_ull_nonmonotonic_guided_start (bool, unsigned long long,
|
|
unsigned long long,
|
|
unsigned long long,
|
|
unsigned long long,
|
|
unsigned long long *,
|
|
unsigned long long *);
|
|
extern bool GOMP_loop_ull_nonmonotonic_runtime_start (bool, unsigned long long,
|
|
unsigned long long,
|
|
unsigned long long,
|
|
unsigned long long *,
|
|
unsigned long long *);
|
|
extern bool GOMP_loop_ull_maybe_nonmonotonic_runtime_start (bool,
|
|
unsigned long long,
|
|
unsigned long long,
|
|
unsigned long long,
|
|
unsigned long long *,
|
|
unsigned long long *);
|
|
extern bool GOMP_loop_ull_start (bool, unsigned long long, unsigned long long,
|
|
unsigned long long, long, unsigned long long,
|
|
unsigned long long *, unsigned long long *,
|
|
uintptr_t *, void **);
|
|
|
|
extern bool GOMP_loop_ull_ordered_static_start (bool, unsigned long long,
|
|
unsigned long long,
|
|
unsigned long long,
|
|
unsigned long long,
|
|
unsigned long long *,
|
|
unsigned long long *);
|
|
extern bool GOMP_loop_ull_ordered_dynamic_start (bool, unsigned long long,
|
|
unsigned long long,
|
|
unsigned long long,
|
|
unsigned long long,
|
|
unsigned long long *,
|
|
unsigned long long *);
|
|
extern bool GOMP_loop_ull_ordered_guided_start (bool, unsigned long long,
|
|
unsigned long long,
|
|
unsigned long long,
|
|
unsigned long long,
|
|
unsigned long long *,
|
|
unsigned long long *);
|
|
extern bool GOMP_loop_ull_ordered_runtime_start (bool, unsigned long long,
|
|
unsigned long long,
|
|
unsigned long long,
|
|
unsigned long long *,
|
|
unsigned long long *);
|
|
extern bool GOMP_loop_ull_ordered_start (bool, unsigned long long,
|
|
unsigned long long,
|
|
unsigned long long, long,
|
|
unsigned long long,
|
|
unsigned long long *,
|
|
unsigned long long *,
|
|
uintptr_t *, void **);
|
|
|
|
extern bool GOMP_loop_ull_static_next (unsigned long long *,
|
|
unsigned long long *);
|
|
extern bool GOMP_loop_ull_dynamic_next (unsigned long long *,
|
|
unsigned long long *);
|
|
extern bool GOMP_loop_ull_guided_next (unsigned long long *,
|
|
unsigned long long *);
|
|
extern bool GOMP_loop_ull_runtime_next (unsigned long long *,
|
|
unsigned long long *);
|
|
extern bool GOMP_loop_ull_nonmonotonic_dynamic_next (unsigned long long *,
|
|
unsigned long long *);
|
|
extern bool GOMP_loop_ull_nonmonotonic_guided_next (unsigned long long *,
|
|
unsigned long long *);
|
|
extern bool GOMP_loop_ull_nonmonotonic_runtime_next (unsigned long long *,
|
|
unsigned long long *);
|
|
extern bool GOMP_loop_ull_maybe_nonmonotonic_runtime_next (unsigned long long *,
|
|
unsigned long long *);
|
|
|
|
extern bool GOMP_loop_ull_ordered_static_next (unsigned long long *,
|
|
unsigned long long *);
|
|
extern bool GOMP_loop_ull_ordered_dynamic_next (unsigned long long *,
|
|
unsigned long long *);
|
|
extern bool GOMP_loop_ull_ordered_guided_next (unsigned long long *,
|
|
unsigned long long *);
|
|
extern bool GOMP_loop_ull_ordered_runtime_next (unsigned long long *,
|
|
unsigned long long *);
|
|
|
|
extern bool GOMP_loop_ull_doacross_static_start (unsigned,
|
|
unsigned long long *,
|
|
unsigned long long,
|
|
unsigned long long *,
|
|
unsigned long long *);
|
|
extern bool GOMP_loop_ull_doacross_dynamic_start (unsigned,
|
|
unsigned long long *,
|
|
unsigned long long,
|
|
unsigned long long *,
|
|
unsigned long long *);
|
|
extern bool GOMP_loop_ull_doacross_guided_start (unsigned,
|
|
unsigned long long *,
|
|
unsigned long long,
|
|
unsigned long long *,
|
|
unsigned long long *);
|
|
extern bool GOMP_loop_ull_doacross_runtime_start (unsigned,
|
|
unsigned long long *,
|
|
unsigned long long *,
|
|
unsigned long long *);
|
|
extern bool GOMP_loop_ull_doacross_start (unsigned, unsigned long long *,
|
|
long, unsigned long long,
|
|
unsigned long long *,
|
|
unsigned long long *,
|
|
uintptr_t *, void **);
|
|
|
|
/* ordered.c */
|
|
|
|
extern void GOMP_ordered_start (void);
|
|
extern void GOMP_ordered_end (void);
|
|
extern void GOMP_doacross_post (long *);
|
|
extern void GOMP_doacross_wait (long, ...);
|
|
extern void GOMP_doacross_ull_post (unsigned long long *);
|
|
extern void GOMP_doacross_ull_wait (unsigned long long, ...);
|
|
|
|
/* parallel.c */
|
|
|
|
extern void GOMP_parallel_start (void (*) (void *), void *, unsigned);
|
|
extern void GOMP_parallel_end (void);
|
|
extern void GOMP_parallel (void (*) (void *), void *, unsigned, unsigned);
|
|
extern unsigned GOMP_parallel_reductions (void (*) (void *), void *, unsigned,
|
|
unsigned);
|
|
extern bool GOMP_cancel (int, bool);
|
|
extern bool GOMP_cancellation_point (int);
|
|
|
|
/* task.c */
|
|
|
|
extern void GOMP_task (void (*) (void *), void *, void (*) (void *, void *),
|
|
long, long, bool, unsigned, void **, int, void *);
|
|
extern void GOMP_taskloop (void (*) (void *), void *,
|
|
void (*) (void *, void *), long, long, unsigned,
|
|
unsigned long, int, long, long, long);
|
|
extern void GOMP_taskloop_ull (void (*) (void *), void *,
|
|
void (*) (void *, void *), long, long,
|
|
unsigned, unsigned long, int,
|
|
unsigned long long, unsigned long long,
|
|
unsigned long long);
|
|
extern void GOMP_taskwait (void);
|
|
extern void GOMP_taskwait_depend (void **);
|
|
extern void GOMP_taskyield (void);
|
|
extern void GOMP_taskgroup_start (void);
|
|
extern void GOMP_taskgroup_end (void);
|
|
extern void GOMP_taskgroup_reduction_register (uintptr_t *);
|
|
extern void GOMP_taskgroup_reduction_unregister (uintptr_t *);
|
|
extern void GOMP_task_reduction_remap (size_t, size_t, void **);
|
|
extern void GOMP_workshare_task_reduction_unregister (bool);
|
|
|
|
/* sections.c */
|
|
|
|
extern unsigned GOMP_sections_start (unsigned);
|
|
extern unsigned GOMP_sections2_start (unsigned, uintptr_t *, void **);
|
|
extern unsigned GOMP_sections_next (void);
|
|
extern void GOMP_parallel_sections_start (void (*) (void *), void *,
|
|
unsigned, unsigned);
|
|
extern void GOMP_parallel_sections (void (*) (void *), void *,
|
|
unsigned, unsigned, unsigned);
|
|
extern void GOMP_sections_end (void);
|
|
extern void GOMP_sections_end_nowait (void);
|
|
extern bool GOMP_sections_end_cancel (void);
|
|
|
|
/* single.c */
|
|
|
|
extern bool GOMP_single_start (void);
|
|
extern void *GOMP_single_copy_start (void);
|
|
extern void GOMP_single_copy_end (void *);
|
|
|
|
/* scope.c */
|
|
|
|
extern void GOMP_scope_start (uintptr_t *);
|
|
|
|
/* target.c */
|
|
|
|
extern void GOMP_target (int, void (*) (void *), const void *,
|
|
size_t, void **, size_t *, unsigned char *);
|
|
extern void GOMP_target_ext (int, void (*) (void *), size_t, void **, size_t *,
|
|
unsigned short *, unsigned int, void **, void **);
|
|
extern void GOMP_target_data (int, const void *,
|
|
size_t, void **, size_t *, unsigned char *);
|
|
extern void GOMP_target_data_ext (int, size_t, void **, size_t *,
|
|
unsigned short *);
|
|
extern void GOMP_target_end_data (void);
|
|
extern void GOMP_target_update (int, const void *,
|
|
size_t, void **, size_t *, unsigned char *);
|
|
extern void GOMP_target_update_ext (int, size_t, void **, size_t *,
|
|
unsigned short *, unsigned int, void **);
|
|
extern void GOMP_target_enter_exit_data (int, size_t, void **, size_t *,
|
|
unsigned short *, unsigned int,
|
|
void **);
|
|
extern void GOMP_teams (unsigned int, unsigned int);
|
|
extern bool GOMP_teams4 (unsigned int, unsigned int, unsigned int, bool);
|
|
|
|
/* teams.c */
|
|
|
|
extern void GOMP_teams_reg (void (*) (void *), void *, unsigned, unsigned,
|
|
unsigned);
|
|
|
|
/* allocator.c */
|
|
|
|
extern void *GOMP_alloc (size_t, size_t, uintptr_t);
|
|
extern void GOMP_free (void *, uintptr_t);
|
|
|
|
/* error.c */
|
|
|
|
extern void GOMP_warning (const char *, size_t);
|
|
extern void GOMP_error (const char *, size_t);
|
|
|
|
/* oacc-async.c */
|
|
|
|
extern void GOACC_wait (int, int, ...);
|
|
|
|
/* oacc-mem.c */
|
|
|
|
extern void GOACC_enter_exit_data (int, size_t, void **, size_t *,
|
|
unsigned short *, int, int, ...);
|
|
extern void GOACC_enter_data (int, size_t, void **, size_t *,
|
|
unsigned short *, int, int, ...);
|
|
extern void GOACC_exit_data (int, size_t, void **, size_t *,
|
|
unsigned short *, int, int, ...);
|
|
extern void GOACC_declare (int, size_t, void **, size_t *, unsigned short *);
|
|
|
|
/* oacc-parallel.c */
|
|
|
|
extern void GOACC_parallel_keyed (int, void (*) (void *), size_t,
|
|
void **, size_t *, unsigned short *, ...);
|
|
extern void GOACC_parallel (int, void (*) (void *), size_t, void **, size_t *,
|
|
unsigned short *, int, int, int, int, int, ...);
|
|
extern void GOACC_data_start (int, size_t, void **, size_t *,
|
|
unsigned short *);
|
|
extern void GOACC_data_end (void);
|
|
extern void GOACC_update (int, size_t, void **, size_t *,
|
|
unsigned short *, int, int, ...);
|
|
extern int GOACC_get_num_threads (void);
|
|
extern int GOACC_get_thread_num (void);
|
|
|
|
#endif /* LIBGOMP_G_H */
|