/* Copyright (C) 2005-2019 Free Software Foundation, Inc.
   Contributed by Richard Henderson <rth@redhat.com>.

   This file is part of the GNU Offloading and Multi Processing Library
   (libgomp).

   Libgomp is free software; you can redistribute it and/or modify it
   under the terms of the GNU General Public License as published by
   the Free Software Foundation; either version 3, or (at your option)
   any later version.

   Libgomp is distributed in the hope that it will be useful, but WITHOUT ANY
   WARRANTY; without even the implied warranty of MERCHANTABILITY or FITNESS
   FOR A PARTICULAR PURPOSE.  See the GNU General Public License for
   more details.

   Under Section 7 of GPL version 3, you are granted additional
   permissions described in the GCC Runtime Library Exception, version
   3.1, as published by the Free Software Foundation.

   You should have received a copy of the GNU General Public License and
   a copy of the GCC Runtime Library Exception along with this program;
   see the files COPYING3 and COPYING.RUNTIME respectively.  If not, see
   <http://www.gnu.org/licenses/>.  */

/* This is a Linux specific implementation of a barrier synchronization
   mechanism for libgomp.  This type is private to the library.  This
   implementation uses atomic instructions and the futex syscall.  */

#include <limits.h>
#include "wait.h"

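/* The functions below all follow one pattern: a generation-counted
   futex barrier.  Each arriving thread decrements bar->awaited; the
   last arrival advances bar->generation and wakes all sleepers, while
   every other thread sleeps on the futex until the generation word
   changes.  The compiled-out sketch below shows the same idea as a
   self-contained toy using raw futex syscalls instead of libgomp's
   wait.h helpers; the "toy_" names are hypothetical and not part of
   libgomp.  */
#if 0
#include <linux/futex.h>
#include <sys/syscall.h>
#include <unistd.h>

struct toy_barrier { int generation; int awaited; int total; };

static void
toy_barrier_wait (struct toy_barrier *b)
{
  int gen = __atomic_load_n (&b->generation, __ATOMIC_ACQUIRE);
  if (__atomic_add_fetch (&b->awaited, -1, __ATOMIC_ACQ_REL) == 0)
    {
      /* Last arrival: reset the count for the next round, advance the
         generation, and wake every sleeper.  */
      b->awaited = b->total;
      __atomic_store_n (&b->generation, gen + 1, __ATOMIC_RELEASE);
      syscall (SYS_futex, &b->generation, FUTEX_WAKE_PRIVATE, INT_MAX,
               NULL, NULL, 0);
    }
  else
    /* FUTEX_WAIT returns immediately if the word no longer equals GEN,
       so a stale value or a spurious wakeup just re-checks and
       retries.  */
    while (__atomic_load_n (&b->generation, __ATOMIC_ACQUIRE) == gen)
      syscall (SYS_futex, &b->generation, FUTEX_WAIT_PRIVATE, gen,
               NULL, NULL, 0);
}
#endif
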
void
gomp_barrier_wait_end (gomp_barrier_t *bar, gomp_barrier_state_t state)
{
  if (__builtin_expect (state & BAR_WAS_LAST, 0))
    {
      /* Next time we'll be awaiting TOTAL threads again.  */
      bar->awaited = bar->total;
      __atomic_store_n (&bar->generation, bar->generation + BAR_INCR,
                        MEMMODEL_RELEASE);
      futex_wake ((int *) &bar->generation, INT_MAX);
    }
  else
    {
      do
        do_wait ((int *) &bar->generation, state);
      while (__atomic_load_n (&bar->generation, MEMMODEL_ACQUIRE) == state);
    }
}

void
gomp_barrier_wait (gomp_barrier_t *bar)
{
  gomp_barrier_wait_end (bar, gomp_barrier_wait_start (bar));
}

/* Like gomp_barrier_wait, except that if the encountering thread
   is not the last one to hit the barrier, it returns immediately.
   The intended usage is that a thread which intends to gomp_barrier_destroy
   this barrier calls gomp_barrier_wait, while all other threads
   call gomp_barrier_wait_last.  When gomp_barrier_wait returns,
   the barrier can be safely destroyed.  */

void
gomp_barrier_wait_last (gomp_barrier_t *bar)
{
  gomp_barrier_state_t state = gomp_barrier_wait_start (bar);
  if (state & BAR_WAS_LAST)
    gomp_barrier_wait_end (bar, state);
}
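
/* An illustrative use of the destroy protocol described in the comment
   above (a hedged sketch with hypothetical roles, not libgomp code):

     thread that will destroy the barrier:   every other thread:
       gomp_barrier_wait (&bar);               gomp_barrier_wait_last (&bar);
       gomp_barrier_destroy (&bar);            (never touches bar again)

   The destroying thread is released only once all TOTAL threads have
   arrived, and the non-last arrivals return without sleeping on the
   futex, so per the comment above the barrier may be destroyed as soon
   as gomp_barrier_wait returns.  */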

void
gomp_team_barrier_wake (gomp_barrier_t *bar, int count)
{
  futex_wake ((int *) &bar->generation, count == 0 ? INT_MAX : count);
}
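
/* Implementation note (see bar.h for the definitions): the team
   barrier multiplexes several flag bits (BAR_TASK_PENDING,
   BAR_WAS_LAST, BAR_WAITING_FOR_TASK, BAR_CANCELLED) into the low
   bits of bar->generation, and BAR_INCR is the per-generation
   increment, so the generation count proper advances above the flag
   bits.  That is why completion is detected below as
   gen == state + BAR_INCR rather than by simple equality.  */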

void
gomp_team_barrier_wait_end (gomp_barrier_t *bar, gomp_barrier_state_t state)
{
  unsigned int generation, gen;

  if (__builtin_expect (state & BAR_WAS_LAST, 0))
    {
      /* Next time we'll be awaiting TOTAL threads again.  */
      struct gomp_thread *thr = gomp_thread ();
      struct gomp_team *team = thr->ts.team;

      bar->awaited = bar->total;
      team->work_share_cancelled = 0;
      if (__builtin_expect (team->task_count, 0))
        {
          gomp_barrier_handle_tasks (state);
          state &= ~BAR_WAS_LAST;
        }
      else
        {
          state &= ~BAR_CANCELLED;
          state += BAR_INCR - BAR_WAS_LAST;
          __atomic_store_n (&bar->generation, state, MEMMODEL_RELEASE);
          futex_wake ((int *) &bar->generation, INT_MAX);
          return;
        }
    }

  generation = state;
  state &= ~BAR_CANCELLED;
  do
    {
      do_wait ((int *) &bar->generation, generation);
      gen = __atomic_load_n (&bar->generation, MEMMODEL_ACQUIRE);
      if (__builtin_expect (gen & BAR_TASK_PENDING, 0))
        {
          gomp_barrier_handle_tasks (state);
          gen = __atomic_load_n (&bar->generation, MEMMODEL_ACQUIRE);
        }
      generation |= gen & BAR_WAITING_FOR_TASK;
    }
  while (gen != state + BAR_INCR);
}
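
/* Note on the wait loop above: a sleeping thread can be woken for
   reasons other than barrier completion, e.g. gomp_team_barrier_wake
   advertising newly queued tasks, so every wakeup re-reads
   bar->generation.  When BAR_TASK_PENDING is set the waiter helps
   execute queued tasks via gomp_barrier_handle_tasks before sleeping
   again, and it only leaves the loop once the generation count itself
   has advanced past this barrier (gen == state + BAR_INCR).  */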

void
gomp_team_barrier_wait (gomp_barrier_t *bar)
{
  gomp_team_barrier_wait_end (bar, gomp_barrier_wait_start (bar));
}

void
gomp_team_barrier_wait_final (gomp_barrier_t *bar)
{
  gomp_barrier_state_t state = gomp_barrier_wait_final_start (bar);
  if (__builtin_expect (state & BAR_WAS_LAST, 0))
    bar->awaited_final = bar->total;
  gomp_team_barrier_wait_end (bar, state);
}

bool
gomp_team_barrier_wait_cancel_end (gomp_barrier_t *bar,
                                   gomp_barrier_state_t state)
{
  unsigned int generation, gen;

  if (__builtin_expect (state & BAR_WAS_LAST, 0))
    {
      /* Next time we'll be awaiting TOTAL threads again.  */
      /* BAR_CANCELLED should never be set in STATE here, because
         cancellation means that at least one of the threads has been
         cancelled, thus on a cancellable barrier we should never see
         all threads arrive.  */
      struct gomp_thread *thr = gomp_thread ();
      struct gomp_team *team = thr->ts.team;

      bar->awaited = bar->total;
      team->work_share_cancelled = 0;
      if (__builtin_expect (team->task_count, 0))
        {
          gomp_barrier_handle_tasks (state);
          state &= ~BAR_WAS_LAST;
        }
      else
        {
          state += BAR_INCR - BAR_WAS_LAST;
          __atomic_store_n (&bar->generation, state, MEMMODEL_RELEASE);
          futex_wake ((int *) &bar->generation, INT_MAX);
          return false;
        }
    }

  if (__builtin_expect (state & BAR_CANCELLED, 0))
    return true;

  generation = state;
  do
    {
      do_wait ((int *) &bar->generation, generation);
      gen = __atomic_load_n (&bar->generation, MEMMODEL_ACQUIRE);
      if (__builtin_expect (gen & BAR_CANCELLED, 0))
        return true;
      if (__builtin_expect (gen & BAR_TASK_PENDING, 0))
        {
          gomp_barrier_handle_tasks (state);
          gen = __atomic_load_n (&bar->generation, MEMMODEL_ACQUIRE);
        }
      generation |= gen & BAR_WAITING_FOR_TASK;
    }
  while (gen != state + BAR_INCR);

  return false;
}

bool
gomp_team_barrier_wait_cancel (gomp_barrier_t *bar)
{
  return gomp_team_barrier_wait_cancel_end (bar, gomp_barrier_wait_start (bar));
}
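
/* Illustrative caller-side pattern for the cancellable barrier (a
   hypothetical sketch, not actual libgomp caller code): a thread
   reaching a cancellation point waits with

     if (gomp_team_barrier_wait_cancel (&team->barrier))
       return;

   treating a true return (BAR_CANCELLED observed, either on entry or
   after being woken) as "this construct was cancelled, unwind", while
   false means the barrier completed normally.  */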

void
gomp_team_barrier_cancel (struct gomp_team *team)
{
  gomp_mutex_lock (&team->task_lock);
  if (team->barrier.generation & BAR_CANCELLED)
    {
      gomp_mutex_unlock (&team->task_lock);
      return;
    }
  team->barrier.generation |= BAR_CANCELLED;
  gomp_mutex_unlock (&team->task_lock);
  futex_wake ((int *) &team->barrier.generation, INT_MAX);
}
2122224Sctornqvi