6041f70ae3
* beginend.cc (GTM::gtm_thread::serial_lock): Put on cacheline boundary. (htm_fastpath): Remove. (gtm_thread::begin_transaction): Fix HTM fastpath. (_ITM_commitTransaction): Adapt. (_ITM_commitTransactionEH): Adapt. * libitm/config/linux/rwlock.h (gtm_rwlock): Add htm_fastpath member and accessors. * libitm/config/posix/rwlock.h (gtm_rwlock): Likewise. * libitm/config/posix/rwlock.cc (gtm_rwlock::gtm_rwlock): Adapt. * libitm/config/x86/sjlj.S (_ITM_beginTransaction): Fix HTM fastpath. * libitm/libitm_i.h (htm_fastpath): Remove declaration. * libitm/method-serial.cc (htm_mg): Adapt. (gtm_thread::serialirr_mode): Adapt. * libitm/query.cc (_ITM_inTransaction, _ITM_getTransactionId): Adapt. From-SVN: r232735
329 lines
12 KiB
C++
329 lines
12 KiB
C++
/* Copyright (C) 2008-2016 Free Software Foundation, Inc.
|
|
Contributed by Richard Henderson <rth@redhat.com>.
|
|
|
|
This file is part of the GNU Transactional Memory Library (libitm).
|
|
|
|
Libitm is free software; you can redistribute it and/or modify it
|
|
under the terms of the GNU General Public License as published by
|
|
the Free Software Foundation; either version 3 of the License, or
|
|
(at your option) any later version.
|
|
|
|
Libitm is distributed in the hope that it will be useful, but WITHOUT ANY
|
|
WARRANTY; without even the implied warranty of MERCHANTABILITY or FITNESS
|
|
FOR A PARTICULAR PURPOSE. See the GNU General Public License for
|
|
more details.
|
|
|
|
Under Section 7 of GPL version 3, you are granted additional
|
|
permissions described in the GCC Runtime Library Exception, version
|
|
3.1, as published by the Free Software Foundation.
|
|
|
|
You should have received a copy of the GNU General Public License and
|
|
a copy of the GCC Runtime Library Exception along with this program;
|
|
see the files COPYING3 and COPYING.RUNTIME respectively. If not, see
|
|
<http://www.gnu.org/licenses/>. */
|
|
|
|
#include "libitm_i.h"
|
|
|
|
namespace GTM HIDDEN {
|
|
|
|
// Initialize a new RW lock.
|
|
// ??? Move this back to the header file when constexpr is implemented.
|
|
|
|
gtm_rwlock::gtm_rwlock()
|
|
: summary (0),
|
|
htm_fastpath (0),
|
|
mutex (PTHREAD_MUTEX_INITIALIZER),
|
|
c_readers (PTHREAD_COND_INITIALIZER),
|
|
c_writers (PTHREAD_COND_INITIALIZER),
|
|
c_confirmed_writers (PTHREAD_COND_INITIALIZER),
|
|
a_readers (0),
|
|
w_readers (0),
|
|
w_writers (0)
|
|
{ }
|
|
|
|
gtm_rwlock::~gtm_rwlock()
|
|
{
|
|
pthread_mutex_destroy (&this->mutex);
|
|
pthread_cond_destroy (&this->c_readers);
|
|
pthread_cond_destroy (&this->c_writers);
|
|
}
|
|
|
|
// Acquire a RW lock for reading.
|
|
|
|
void
|
|
gtm_rwlock::read_lock (gtm_thread *tx)
|
|
{
|
|
// Fast path: first announce our intent to read, then check for conflicting
|
|
// intents to write. The fence ensure that this happens in exactly this
|
|
// order.
|
|
tx->shared_state.store (0, memory_order_relaxed);
|
|
atomic_thread_fence (memory_order_seq_cst);
|
|
unsigned int sum = this->summary.load (memory_order_relaxed);
|
|
if (likely(!(sum & (a_writer | w_writer))))
|
|
return;
|
|
|
|
// There seems to be an active, waiting, or confirmed writer, so enter the
|
|
// mutex-based slow path. To try to keep the number of readers small that
|
|
// the writer will see, we clear our read flag right away before entering
|
|
// the critical section. Otherwise, the writer would have to wait for us to
|
|
// get into the critical section. (Note that for correctness, this only has
|
|
// to happen before we leave the slow path and before we wait for any
|
|
// writer).
|
|
// ??? Add a barrier to enforce early visibility of this?
|
|
tx->shared_state.store(-1, memory_order_relaxed);
|
|
|
|
pthread_mutex_lock (&this->mutex);
|
|
|
|
// Read summary again after acquiring the mutex because it might have
|
|
// changed during waiting for the mutex to become free.
|
|
sum = this->summary.load (memory_order_relaxed);
|
|
|
|
// If there is a writer waiting for readers, wake it up. Only do that if we
|
|
// might be the last reader that could do the wake-up, otherwise skip the
|
|
// wake-up but decrease a_readers to show that we have entered the slow path.
|
|
// This has to happen before we wait for any writers or upgraders.
|
|
// See write_lock_generic() for further explanations.
|
|
if (this->a_readers > 0)
|
|
{
|
|
this->a_readers--;
|
|
if (this->a_readers == 0)
|
|
pthread_cond_signal(&this->c_confirmed_writers);
|
|
}
|
|
|
|
// If there is an active or waiting writer, we must wait.
|
|
while (sum & (a_writer | w_writer))
|
|
{
|
|
this->summary.store (sum | w_reader, memory_order_relaxed);
|
|
this->w_readers++;
|
|
pthread_cond_wait (&this->c_readers, &this->mutex);
|
|
sum = this->summary.load (memory_order_relaxed);
|
|
if (--this->w_readers == 0)
|
|
sum &= ~w_reader;
|
|
}
|
|
|
|
// Otherwise we can acquire the lock for read.
|
|
tx->shared_state.store(0, memory_order_relaxed);
|
|
|
|
pthread_mutex_unlock(&this->mutex);
|
|
}
|
|
|
|
|
|
// Acquire a RW lock for writing. Generic version that also works for
|
|
// upgrades.
|
|
// Note that an upgrade might fail (and thus waste previous work done during
|
|
// this transaction) if there is another thread that tried to go into serial
|
|
// mode earlier (i.e., upgrades do not have higher priority than pure writers).
|
|
// However, this seems rare enough to not consider it further as we need both
|
|
// a non-upgrade writer and a writer to happen to switch to serial mode
|
|
// concurrently. If we'd want to handle this, a writer waiting for readers
|
|
// would have to coordinate with later arriving upgrades and hand over the
|
|
// lock to them, including the the reader-waiting state. We can try to support
|
|
// this if this will actually happen often enough in real workloads.
|
|
|
|
bool
|
|
gtm_rwlock::write_lock_generic (gtm_thread *tx)
|
|
{
|
|
pthread_mutex_lock (&this->mutex);
|
|
|
|
unsigned int sum = this->summary.load (memory_order_relaxed);
|
|
|
|
// If there is an active writer, wait.
|
|
while (sum & a_writer)
|
|
{
|
|
if (tx != 0)
|
|
{
|
|
// If this is an upgrade, we must not wait for other writers or
|
|
// upgrades that already have gone in
|
|
pthread_mutex_unlock (&this->mutex);
|
|
return false;
|
|
}
|
|
|
|
this->summary.store (sum | w_writer, memory_order_relaxed);
|
|
this->w_writers++;
|
|
pthread_cond_wait (&this->c_writers, &this->mutex);
|
|
sum = this->summary.load (memory_order_relaxed);
|
|
if (--this->w_writers == 0)
|
|
sum &= ~w_writer;
|
|
}
|
|
|
|
// Otherwise we can acquire the lock for write. As a writer, we have
|
|
// priority, so we don't need to take this back.
|
|
this->summary.store (sum | a_writer, memory_order_relaxed);
|
|
|
|
// We still need to wait for active readers to finish. The barrier makes
|
|
// sure that we first set our write intent and check for active readers
|
|
// after that, in strictly this order (similar to the barrier in the fast
|
|
// path of read_lock()).
|
|
atomic_thread_fence(memory_order_seq_cst);
|
|
|
|
// Count the number of active readers to be able to decrease the number of
|
|
// wake-ups and wait calls that are necessary.
|
|
//
|
|
// This number is an upper bound of the number of readers that actually
|
|
// are still active and which we need to wait for:
|
|
// - We set our write flag before checking the reader flags, and readers
|
|
// check our write flag after clearing their read flags in read_unlock().
|
|
// Therefore, they will enter the slow path whenever we have seen them.
|
|
// - Readers will have cleared their read flags before leaving the slow
|
|
// path in read_lock() (prevents lost wake-ups), and before waiting for
|
|
// any writer (prevents deadlocks).
|
|
//
|
|
// However, this number is also just a lower bound of the number of readers
|
|
// that will actually enter the slow path in read_unlock() or read_lock():
|
|
// - Because the read flag is cleared outside of a critical section, writers
|
|
// can see it as cleared while the reader still goes into the slow path.
|
|
//
|
|
// Therefore, readers can skip (lower bound - 1) wake-ups, but we do need
|
|
// the following loop to check that the readers that we wanted to wait for
|
|
// are actually those that entered the slow path so far (and either skipped
|
|
// or sent a wake-up).
|
|
//
|
|
// ??? Do we need to optimize further? (The writer could publish a list of
|
|
// readers that it suspects to be active. Readers could check this list and
|
|
// only decrement a_readers if they are in this list.)
|
|
for (;;)
|
|
{
|
|
// ??? Keep a list of active readers that we saw and update it on the
|
|
// next retry instead? This might reduce the number of cache misses that
|
|
// we get when checking reader flags.
|
|
int readers = 0;
|
|
for (gtm_thread *it = gtm_thread::list_of_threads; it != 0;
|
|
it = it->next_thread)
|
|
{
|
|
// Don't count ourself if this is an upgrade.
|
|
if (it == tx)
|
|
continue;
|
|
if (it->shared_state.load(memory_order_relaxed) != (gtm_word)-1)
|
|
readers++;
|
|
}
|
|
|
|
// If we have not seen any readers, we will not wait.
|
|
if (readers == 0)
|
|
break;
|
|
|
|
// If this is an upgrade, we have to break deadlocks with
|
|
// privatization safety. This may fail on our side, in which
|
|
// case we need to cancel our attempt to upgrade. Also, we do not
|
|
// block using the convdar but just spin so that we never have to be
|
|
// woken.
|
|
// FIXME This is horribly inefficient -- but so is not being able
|
|
// to use futexes in this case.
|
|
if (tx != 0)
|
|
{
|
|
pthread_mutex_unlock (&this->mutex);
|
|
if (!abi_disp ()->snapshot_most_recent ())
|
|
{
|
|
write_unlock ();
|
|
return false;
|
|
}
|
|
pthread_mutex_lock (&this->mutex);
|
|
continue;
|
|
}
|
|
|
|
|
|
// We've seen a number of readers, so we publish this number and wait.
|
|
this->a_readers = readers;
|
|
pthread_cond_wait (&this->c_confirmed_writers, &this->mutex);
|
|
}
|
|
|
|
pthread_mutex_unlock (&this->mutex);
|
|
return true;
|
|
}
|
|
|
|
// Acquire a RW lock for writing.
|
|
|
|
void
|
|
gtm_rwlock::write_lock ()
|
|
{
|
|
write_lock_generic (0);
|
|
}
|
|
|
|
|
|
// Upgrade a RW lock that has been locked for reading to a writing lock.
|
|
// Do this without possibility of another writer incoming. Return false
|
|
// if this attempt fails (i.e. another thread also upgraded).
|
|
|
|
bool
|
|
gtm_rwlock::write_upgrade (gtm_thread *tx)
|
|
{
|
|
return write_lock_generic (tx);
|
|
}
|
|
|
|
|
|
// Has to be called iff the previous upgrade was successful and after it is
|
|
// safe for the transaction to not be marked as a reader anymore.
|
|
|
|
void
|
|
gtm_rwlock::write_upgrade_finish (gtm_thread *tx)
|
|
{
|
|
// We are not a reader anymore. This is only safe to do after we have
|
|
// acquired the writer lock.
|
|
tx->shared_state.store (-1, memory_order_release);
|
|
}
|
|
|
|
|
|
// Release a RW lock from reading.
|
|
|
|
void
|
|
gtm_rwlock::read_unlock (gtm_thread *tx)
|
|
{
|
|
// We only need release memory order here because of privatization safety
|
|
// (this ensures that marking the transaction as inactive happens after
|
|
// any prior data accesses by this transaction, and that neither the
|
|
// compiler nor the hardware order this store earlier).
|
|
// ??? We might be able to avoid this release here if the compiler can't
|
|
// merge the release fence with the subsequent seq_cst fence.
|
|
tx->shared_state.store (-1, memory_order_release);
|
|
// We need this seq_cst fence here to avoid lost wake-ups. Furthermore,
|
|
// the privatization safety implementation in gtm_thread::try_commit()
|
|
// relies on the existence of this seq_cst fence.
|
|
atomic_thread_fence (memory_order_seq_cst);
|
|
unsigned int sum = this->summary.load (memory_order_relaxed);
|
|
if (likely(!(sum & (a_writer | w_writer))))
|
|
return;
|
|
|
|
// There is a writer, either active or waiting for other readers or writers.
|
|
// Thus, enter the mutex-based slow path.
|
|
pthread_mutex_lock (&this->mutex);
|
|
|
|
// If there is a writer waiting for readers, wake it up. Only do that if we
|
|
// might be the last reader that could do the wake-up, otherwise skip the
|
|
// wake-up and decrease a_readers to publish that we have entered the slow
|
|
// path but skipped the wake-up.
|
|
if (this->a_readers > 0)
|
|
{
|
|
this->a_readers--;
|
|
if (this->a_readers == 0)
|
|
pthread_cond_signal(&this->c_confirmed_writers);
|
|
}
|
|
|
|
// We don't need to wake up any writers waiting for other writers. Active
|
|
// writers will take care of that.
|
|
|
|
pthread_mutex_unlock (&this->mutex);
|
|
}
|
|
|
|
|
|
// Release a RW lock from writing.
|
|
|
|
void
|
|
gtm_rwlock::write_unlock ()
|
|
{
|
|
pthread_mutex_lock (&this->mutex);
|
|
|
|
unsigned int sum = this->summary.load (memory_order_relaxed);
|
|
this->summary.store (sum & ~a_writer, memory_order_relaxed);
|
|
|
|
// If there is a waiting writer, wake it.
|
|
if (unlikely (sum & w_writer))
|
|
pthread_cond_signal (&this->c_writers);
|
|
|
|
// If there are waiting readers, wake them.
|
|
else if (unlikely (sum & w_reader))
|
|
pthread_cond_broadcast (&this->c_readers);
|
|
|
|
pthread_mutex_unlock (&this->mutex);
|
|
}
|
|
|
|
} // namespace GTM
|