|  | /* Copyright (C) 2005-2014 Free Software Foundation, Inc. | 
|  | Contributed by Richard Henderson <rth@redhat.com>. | 
|  |  | 
|  | This file is part of the GNU OpenMP Library (libgomp). | 
|  |  | 
|  | Libgomp is free software; you can redistribute it and/or modify it | 
|  | under the terms of the GNU General Public License as published by | 
|  | the Free Software Foundation; either version 3, or (at your option) | 
|  | any later version. | 
|  |  | 
|  | Libgomp is distributed in the hope that it will be useful, but WITHOUT ANY | 
|  | WARRANTY; without even the implied warranty of MERCHANTABILITY or FITNESS | 
|  | FOR A PARTICULAR PURPOSE.  See the GNU General Public License for | 
|  | more details. | 
|  |  | 
|  | Under Section 7 of GPL version 3, you are granted additional | 
|  | permissions described in the GCC Runtime Library Exception, version | 
|  | 3.1, as published by the Free Software Foundation. | 
|  |  | 
|  | You should have received a copy of the GNU General Public License and | 
|  | a copy of the GCC Runtime Library Exception along with this program; | 
|  | see the files COPYING3 and COPYING.RUNTIME respectively.  If not, see | 
|  | <http://www.gnu.org/licenses/>.  */ | 
|  |  | 
|  | /* This is a Linux specific implementation of a barrier synchronization | 
|  | mechanism for libgomp.  This type is private to the library.  This | 
|  | implementation uses atomic instructions and the futex syscall.  */ | 
|  |  | 
|  | #ifndef GOMP_BARRIER_H | 
|  | #define GOMP_BARRIER_H 1 | 
|  |  | 
|  | #include "mutex.h" | 
|  |  | 
|  | typedef struct | 
|  | { | 
|  | /* Make sure total/generation is in a mostly read cacheline, while | 
|  | awaited in a separate cacheline.  */ | 
|  | unsigned total __attribute__((aligned (64))); | 
|  | unsigned generation; | 
|  | unsigned awaited __attribute__((aligned (64))); | 
|  | unsigned awaited_final; | 
|  | } gomp_barrier_t; | 
|  |  | 
|  | typedef unsigned int gomp_barrier_state_t; | 
|  |  | 
|  | /* The generation field contains a counter in the high bits, with a few | 
|  | low bits dedicated to flags.  Note that TASK_PENDING and WAS_LAST can | 
|  | share space because WAS_LAST is never stored back to generation.  */ | 
|  | #define BAR_TASK_PENDING	1 | 
|  | #define BAR_WAS_LAST		1 | 
|  | #define BAR_WAITING_FOR_TASK	2 | 
|  | #define BAR_CANCELLED		4 | 
|  | #define BAR_INCR		8 | 
|  |  | 
|  | static inline void gomp_barrier_init (gomp_barrier_t *bar, unsigned count) | 
|  | { | 
|  | bar->total = count; | 
|  | bar->awaited = count; | 
|  | bar->awaited_final = count; | 
|  | bar->generation = 0; | 
|  | } | 
|  |  | 
|  | static inline void gomp_barrier_reinit (gomp_barrier_t *bar, unsigned count) | 
|  | { | 
|  | __atomic_add_fetch (&bar->awaited, count - bar->total, MEMMODEL_ACQ_REL); | 
|  | bar->total = count; | 
|  | } | 
|  |  | 
|  | static inline void gomp_barrier_destroy (gomp_barrier_t *bar) | 
|  | { | 
|  | } | 
|  |  | 
|  | extern void gomp_barrier_wait (gomp_barrier_t *); | 
|  | extern void gomp_barrier_wait_last (gomp_barrier_t *); | 
|  | extern void gomp_barrier_wait_end (gomp_barrier_t *, gomp_barrier_state_t); | 
|  | extern void gomp_team_barrier_wait (gomp_barrier_t *); | 
|  | extern void gomp_team_barrier_wait_final (gomp_barrier_t *); | 
|  | extern void gomp_team_barrier_wait_end (gomp_barrier_t *, | 
|  | gomp_barrier_state_t); | 
|  | extern bool gomp_team_barrier_wait_cancel (gomp_barrier_t *); | 
|  | extern bool gomp_team_barrier_wait_cancel_end (gomp_barrier_t *, | 
|  | gomp_barrier_state_t); | 
|  | extern void gomp_team_barrier_wake (gomp_barrier_t *, int); | 
|  | struct gomp_team; | 
|  | extern void gomp_team_barrier_cancel (struct gomp_team *); | 
|  |  | 
|  | static inline gomp_barrier_state_t | 
|  | gomp_barrier_wait_start (gomp_barrier_t *bar) | 
|  | { | 
|  | unsigned int ret = __atomic_load_n (&bar->generation, MEMMODEL_ACQUIRE); | 
|  | ret &= -BAR_INCR | BAR_CANCELLED; | 
|  | /* A memory barrier is needed before exiting from the various forms | 
|  | of gomp_barrier_wait, to satisfy OpenMP API version 3.1 section | 
|  | 2.8.6 flush Construct, which says there is an implicit flush during | 
|  | a barrier region.  This is a convenient place to add the barrier, | 
|  | so we use MEMMODEL_ACQ_REL here rather than MEMMODEL_ACQUIRE.  */ | 
|  | if (__atomic_add_fetch (&bar->awaited, -1, MEMMODEL_ACQ_REL) == 0) | 
|  | ret |= BAR_WAS_LAST; | 
|  | return ret; | 
|  | } | 
|  |  | 
|  | static inline gomp_barrier_state_t | 
|  | gomp_barrier_wait_cancel_start (gomp_barrier_t *bar) | 
|  | { | 
|  | return gomp_barrier_wait_start (bar); | 
|  | } | 
|  |  | 
|  | /* This is like gomp_barrier_wait_start, except it decrements | 
|  | bar->awaited_final rather than bar->awaited and should be used | 
|  | for the gomp_team_end barrier only.  */ | 
|  | static inline gomp_barrier_state_t | 
|  | gomp_barrier_wait_final_start (gomp_barrier_t *bar) | 
|  | { | 
|  | unsigned int ret = __atomic_load_n (&bar->generation, MEMMODEL_ACQUIRE); | 
|  | ret &= -BAR_INCR | BAR_CANCELLED; | 
|  | /* See above gomp_barrier_wait_start comment.  */ | 
|  | if (__atomic_add_fetch (&bar->awaited_final, -1, MEMMODEL_ACQ_REL) == 0) | 
|  | ret |= BAR_WAS_LAST; | 
|  | return ret; | 
|  | } | 
|  |  | 
|  | static inline bool | 
|  | gomp_barrier_last_thread (gomp_barrier_state_t state) | 
|  | { | 
|  | return state & BAR_WAS_LAST; | 
|  | } | 
|  |  | 
|  | /* All the inlines below must be called with team->task_lock | 
|  | held.  */ | 
|  |  | 
|  | static inline void | 
|  | gomp_team_barrier_set_task_pending (gomp_barrier_t *bar) | 
|  | { | 
|  | bar->generation |= BAR_TASK_PENDING; | 
|  | } | 
|  |  | 
|  | static inline void | 
|  | gomp_team_barrier_clear_task_pending (gomp_barrier_t *bar) | 
|  | { | 
|  | bar->generation &= ~BAR_TASK_PENDING; | 
|  | } | 
|  |  | 
|  | static inline void | 
|  | gomp_team_barrier_set_waiting_for_tasks (gomp_barrier_t *bar) | 
|  | { | 
|  | bar->generation |= BAR_WAITING_FOR_TASK; | 
|  | } | 
|  |  | 
|  | static inline bool | 
|  | gomp_team_barrier_waiting_for_tasks (gomp_barrier_t *bar) | 
|  | { | 
|  | return (bar->generation & BAR_WAITING_FOR_TASK) != 0; | 
|  | } | 
|  |  | 
|  | static inline bool | 
|  | gomp_team_barrier_cancelled (gomp_barrier_t *bar) | 
|  | { | 
|  | return __builtin_expect ((bar->generation & BAR_CANCELLED) != 0, 0); | 
|  | } | 
|  |  | 
|  | static inline void | 
|  | gomp_team_barrier_done (gomp_barrier_t *bar, gomp_barrier_state_t state) | 
|  | { | 
|  | bar->generation = (state & -BAR_INCR) + BAR_INCR; | 
|  | } | 
|  |  | 
|  | #endif /* GOMP_BARRIER_H */ |