382 lines
14 KiB
C#
Raw Normal View History

//------------------------------------------------------------------------------
// <copyright file="ReadWriteSpinLock.cs" company="Microsoft">
// Copyright (c) Microsoft Corporation. All rights reserved.
// </copyright>
//------------------------------------------------------------------------------
namespace System.Web.Util {
using System.Threading;
using System.Collections;
using System.Globalization;
using Microsoft.Win32;
/// <summary>
/// A small reader/writer spin lock. The lock state is packed into a single
/// int (<c>_bits</c>) that is updated with interlocked operations; the id of
/// the thread holding the write lock is kept in <c>_id</c>. The thread that
/// holds the write lock may re-acquire it and may also take read locks.
/// </summary>
struct ReadWriteSpinLock {
    //
    // Fields
    //

    // _bits is laid out as follows:
    //
    //   3 3 2 2 2 2 2 2 2 2 2 2 1 1 1 1 1 1 1 1 1 1
    //   1 0 9 8 7 6 5 4 3 2 1 0 9 8 7 6 5 4 3 2 1 0 9 8 7 6 5 4 3 2 1 0
    //  +-+-+---------------------------+--------------------------------+
    //  |S|W|      WriteLockCount       |         ReadLockCount          |
    //  +-+-+---------------------------+--------------------------------+
    //
    // where
    //
    //  S - sign bit (always zero) - By having a sign bit, operations
    //      on the ReadLockCount can use InterlockedIncrement/Decrement
    //
    //  W - writer waiting bit - set by threads attempting write lock, preventing
    //      any further threads from acquiring read locks. This attempts to hint
    //      that updates have priority, but doesn't guarantee priority.
    //
    //  WriteLockCount - Write lock recursion count
    //
    //  ReadLockCount - Read lock recursion count
    //
    int _bits;

    // Id (Thread.GetHashCode()) of the thread that holds the write lock,
    // or 0 when no thread holds it.
    int _id;

    //
    // Statics
    //

    // True when only one CPU is available to the process; busy-waiting is
    // then pointless and _Spin sleeps instead.
    static readonly bool s_disableBusyWaiting = (SystemInfo.GetNumProcessCPUs() == 1);

    //
    // Constants
    //

    const int BACK_OFF_FACTORS_LENGTH = 13;

    // Per-thread multipliers applied to the default spin count so that
    // contending threads do not all retry in lock step.
    static readonly double[] s_backOffFactors = new double[BACK_OFF_FACTORS_LENGTH] {
        1.020, 0.965, 0.890, 1.065,
        1.025, 1.115, 0.940, 0.995,
        1.050, 1.080, 0.915, 0.980,
        1.010
    };

    const int WRITER_WAITING_MASK = 0x40000000;
    const int WRITE_COUNT_MASK = 0x3FFF0000;
    const int READ_COUNT_MASK = 0x0000FFFF;
    const int WRITER_WAITING_SHIFT = 30;
    const int WRITE_COUNT_SHIFT = 16;

    //
    // Decoders for a snapshot of _bits
    //

    static bool WriterWaiting(int bits) { return ((bits & WRITER_WAITING_MASK) != 0); }
    static int WriteLockCount(int bits) { return ((bits & WRITE_COUNT_MASK) >> WRITE_COUNT_SHIFT); }
    static int ReadLockCount(int bits) { return (bits & READ_COUNT_MASK); }
    static bool NoWriters(int bits) { return ((bits & WRITE_COUNT_MASK) == 0); }
    static bool NoWritersOrWaitingWriters(int bits) { return ((bits & (WRITE_COUNT_MASK | WRITER_WAITING_MASK)) == 0); }
    // True when both lock counts are zero; the writer-waiting bit is ignored.
    static bool NoLocks(int bits) { return ((bits & ~WRITER_WAITING_MASK) == 0); }

    //
    // Same decoders applied to the current value of _bits
    //

    bool WriterWaiting() { return WriterWaiting(_bits); }
    int WriteLockCount() { return WriteLockCount(_bits); }
    int ReadLockCount() { return ReadLockCount(_bits); }
    bool NoWriters() { return NoWriters(_bits); }
    bool NoWritersOrWaitingWriters() { return NoWritersOrWaitingWriters(_bits); }
    bool NoLocks() { return NoLocks(_bits); }

    /// <summary>
    /// Packs the writer-waiting flag and the two lock counts into a value
    /// with the layout of <c>_bits</c>.
    /// </summary>
    static int CreateNewBits(bool writerWaiting, int writeCount, int readCount) {
        int bits = ((writeCount << WRITE_COUNT_SHIFT) | readCount);
        if (writerWaiting) {
            bits |= WRITER_WAITING_MASK;
        }

        return bits;
    }

    /// <summary>
    /// Acquires a read lock, spinning (or sleeping) until it is available.
    /// </summary>
    internal /*public*/ void AcquireReaderLock() {
        // This lock supports Writelock then Readlock
        // from the same thread (possibly from different functions).
        int threadId = Thread.CurrentThread.GetHashCode();

        // Optimize for the common case by trying once before spinning.
        if (_TryAcquireReaderLock(threadId))
            return;

        _Spin(true, threadId);

        Debug.Trace("Spinlock", "AcquireReaderLock: _bits=" + _bits.ToString("x8", CultureInfo.InvariantCulture)
                    + " _id= " + _id.ToString("x8", CultureInfo.InvariantCulture));
    }

    /// <summary>
    /// Acquires the write lock, spinning (or sleeping) until it is available.
    /// The thread that already holds the write lock may acquire it again.
    /// </summary>
    internal /*public*/ void AcquireWriterLock() {
        int threadId = Thread.CurrentThread.GetHashCode();

        // Optimize for the common case by trying once before spinning.
        if (_TryAcquireWriterLock(threadId))
            return;

        _Spin(false, threadId);

        Debug.Trace("Spinlock", "AcquireWriterLock: _bits=" + _bits.ToString("x8", CultureInfo.InvariantCulture)
                    + " _id= " + _id.ToString("x8", CultureInfo.InvariantCulture));
    }

    /// <summary>
    /// Releases one read lock by decrementing the read count in <c>_bits</c>.
    /// </summary>
    internal /*public*/ void ReleaseReaderLock() {
#if DBG
        int id = _id;
        Debug.Assert(id == 0 || id == Thread.CurrentThread.GetHashCode(), "id == 0 || id == Thread.CurrentThread.GetHashCode()");
#endif

        // The read count lives in the low bits, so a plain decrement of
        // the whole word releases exactly one read lock.
        int n = Interlocked.Decrement(ref _bits);

        Debug.Assert(n >= 0, "n >= 0");
        Debug.Trace("Spinlock", "ReleaseReaderLock: _bits=" + _bits.ToString("x8", CultureInfo.InvariantCulture)
                    + " _id= " + _id.ToString("x8", CultureInfo.InvariantCulture));
    }

    /// <summary>
    /// Adds <paramref name="delta"/> to the write lock recursion count.
    /// Must only be called by the thread that holds the write lock.
    /// </summary>
    /// <param name="oldBits">A snapshot of <c>_bits</c> taken by the caller.</param>
    /// <param name="delta">Amount to add to the write count (+1 or -1 in this file).</param>
    void AlterWriteCountHoldingWriterLock(int oldBits, int delta) {
        int readLockCount = ReadLockCount(oldBits);
        int oldWriteLockCount = WriteLockCount(oldBits);
        int newWriteLockCount = oldWriteLockCount + delta;
        Debug.Assert(newWriteLockCount >= 0, "newWriteLockCount >= 0");
        int newBits;
        int test;

        for (;;) {
            //
            // Since we own the lock, the only change that can be
            // made by another thread to _bits is to add the writer-waiting bit.
            //
            Debug.Assert(WriteLockCount(oldBits) == oldWriteLockCount, "WriteLockCount(oldBits) == oldWriteLockCount");
            Debug.Assert(ReadLockCount(oldBits) == readLockCount, "ReadLockCount(oldBits) == readLockCount");

            // Carry over whatever writer-waiting state the latest snapshot has.
            newBits = CreateNewBits(WriterWaiting(oldBits), newWriteLockCount, readLockCount);
            test = Interlocked.CompareExchange(ref _bits, newBits, oldBits);
            if (test == oldBits) {
                break;
            }

            // Lost the race; retry against the value actually observed.
            oldBits = test;
        }
    }

    /// <summary>
    /// Releases one level of the write lock. When the last level is released
    /// the owner id is cleared first.
    /// </summary>
    internal /*public*/ void ReleaseWriterLock() {
#if DBG
        int id = _id;
        Debug.Assert(id == Thread.CurrentThread.GetHashCode(), "id == Thread.CurrentThread.GetHashCode()");
#endif

        int oldBits = _bits;
        int writeLockCount = WriteLockCount(oldBits);
        Debug.Assert(writeLockCount > 0, "writeLockCount > 0");

        if (writeLockCount == 1) {
            // Reset the id before releasing count so that
            // AcquireRead works correctly.
            _id = 0;
        }

        AlterWriteCountHoldingWriterLock(oldBits, -1);

        Debug.Trace("Spinlock", "ReleaseWriterLock: _bits=" + _bits.ToString("x8", CultureInfo.InvariantCulture)
                    + " _id= " + _id.ToString("x8", CultureInfo.InvariantCulture));
    }

    /// <summary>
    /// Makes a single attempt to take the write lock.
    /// </summary>
    /// <param name="threadId">Id of the calling thread.</param>
    /// <returns>
    /// true if the lock was taken (or re-entered); false otherwise, in which
    /// case the writer-waiting bit has been set in <c>_bits</c>.
    /// </returns>
    bool _TryAcquireWriterLock(int threadId) {
        int id = _id;
        int oldBits = _bits;
        int newBits;
        int test;

        if (id == threadId) {
            // Re-entrant acquire: we already own the lock, so
            // we can just pound in the correct value.
            AlterWriteCountHoldingWriterLock(oldBits, +1);
            return true;
        }

        if (id == 0 && NoLocks(oldBits)) {
            // Nobody holds the lock: claim it with write count 1, no readers,
            // and the writer-waiting bit cleared.
            newBits = CreateNewBits(false, 1, 0);
            test = Interlocked.CompareExchange(ref _bits, newBits, oldBits);
            if (test == oldBits) {
                id = _id;
                Debug.Assert(id == 0);
                _id = threadId;
                return true;
            }

            oldBits = test;
        }

        // If there is contention, make sure the WRITER_WAITING bit is set.
        // Note: this blocks readers from using a value that is about to be changed
        if (!WriterWaiting(oldBits)) {
            // hammer on _bits until the bit is set
            for (;;) {
                newBits = (oldBits | WRITER_WAITING_MASK);
                test = Interlocked.CompareExchange(ref _bits, newBits, oldBits);
                if (test == oldBits)
                    break;

                oldBits = test;
            }
        }

        return false;
    }

    /// <summary>
    /// Makes a single attempt to take a read lock.
    /// </summary>
    /// <param name="threadId">Id of the calling thread.</param>
    /// <returns>true if the read count was incremented; false otherwise.</returns>
    bool _TryAcquireReaderLock(int threadId) {
        int oldBits = _bits;
        int id = _id;

        if (id == 0) {
            // No recorded write owner: fail only if the snapshot still
            // shows a non-zero write count.
            if (!NoWriters(oldBits)) {
                return false;
            }
        }
        else if (id != threadId) {
            // Another thread holds the write lock.
            return false;
        }

        // Either there is no writer or the writer is this thread; bump the
        // read count if _bits has not changed since the snapshot.
        if (Interlocked.CompareExchange(ref _bits, oldBits + 1, oldBits) == oldBits) {
            return true;
        }

        return false;
    }

    /// <internalonly/>
    /// <summary>
    /// Retries the requested acquire until it succeeds, busy-waiting between
    /// attempts (or sleeping when busy-waiting is disabled).
    /// </summary>
    /// <param name="isReaderLock">true to acquire a read lock, false for the write lock.</param>
    /// <param name="threadId">Id of the calling thread.</param>
    void _Spin(bool isReaderLock, int threadId) {
        const int LOCK_MAXIMUM_SPINS = 10000;    // maximum allowable spin count
        const int LOCK_DEFAULT_SPINS = 4000;     // default spin count
        const int LOCK_MINIMUM_SPINS = 100;      // minimum allowable spin count

        int sleepTime = 0;
        int baseSpins;

        {   // limit scope of temp. stack vars to calculation of baseSpins
            // Alternatives for threadId include a static counter
            // or the low DWORD of QueryPerformanceCounter().
            //
            // Widen to long before taking the absolute value: Math.Abs(int)
            // throws OverflowException for int.MinValue.
            int factorIndex = (int)(Math.Abs((long)threadId) % BACK_OFF_FACTORS_LENGTH);
            double randomBackoffFactor = s_backOffFactors[factorIndex];
            baseSpins = (int)(LOCK_DEFAULT_SPINS * randomBackoffFactor);
            baseSpins = Math.Min(LOCK_MAXIMUM_SPINS, baseSpins);
            baseSpins = Math.Max(baseSpins, LOCK_MINIMUM_SPINS);
        }

        // hand-optimize loop: Increase locality by copying static variables
        // onto the stack (this will reduce cache misses after a context
        // switch induced by Sleep()).
        bool disableBusyWaiting = s_disableBusyWaiting;

        for (;;) {
            if (isReaderLock) {
                if (_TryAcquireReaderLock(threadId)) {
                    break;
                }
            }
            else {
                if (_TryAcquireWriterLock(threadId)) {
                    break;
                }
            }

            // if 1 cpu, or cpu affinity is set to 1, spinning is a waste of time
            if (disableBusyWaiting) {
                Thread.Sleep(sleepTime);

                // Avoid priority inversion: 0, 1, 0, 1,...
                sleepTime ^= 1;
            }
            else {
                int spinCount = baseSpins;

                // Check no more than baseSpins times then yield.
                // It is important not to use the InterlockedExchange in the
                // inner loop in order to minimize system memory bus traffic.
                for (;;) {
                    //
                    // If the lock is available break spinning and
                    // try to obtain it.
                    //
                    if (isReaderLock) {
                        if (NoWritersOrWaitingWriters()) {
                            break;
                        }
                    }
                    else {
                        if (NoLocks()) {
                            break;
                        }
                    }

                    if (--spinCount < 0) {
                        Thread.Sleep(sleepTime);

                        // Backoff algorithm: reduce busy wait time, but never
                        // below LOCK_MINIMUM_SPINS.
                        baseSpins /= 2;
                        baseSpins = Math.Max(baseSpins, LOCK_MINIMUM_SPINS);
                        spinCount = baseSpins;

                        // Using Sleep(0) leads to the possibility of priority
                        // inversion. Sleep(0) only yields the processor if
                        // there's another thread of the same priority that's
                        // ready to run. If a high-priority thread is trying to
                        // acquire the lock, which is held by a low-priority
                        // thread, then the low-priority thread may never get
                        // scheduled and hence never free the lock. NT attempts
                        // to avoid priority inversions by temporarily boosting
                        // the priority of low-priority runnable threads, but the
                        // problem can still occur if there's a medium-priority
                        // thread that's always runnable. If Sleep(1) is used,
                        // then the thread unconditionally yields the CPU. We
                        // only do this for the second and subsequent even
                        // iterations, since a millisecond is a long time to wait
                        // if the thread can be scheduled in again sooner
                        // (~100,000 instructions).
                        // Avoid priority inversion: 0, 1, 0, 1,...
                        sleepTime ^= 1;
                    }
                    else {
                        // kill about 20 clock cycles on this proc
                        Thread.SpinWait(10);
                    }
                }
            }
        }// while
    }// _Spin
} // ReadWriteSpinLock
} // namespace System.Web.Util
// NOTES:
//
// This ReaderWriterSpinlock is a combination of the
// original lightweight (4 byte) System.Web.Util.ReadWriteSpinLock
// and the lightweight (4 byte) exclusive lock (SmallSpinLock) used
// in George Reilly's LKRHash (see http://georgere/work/lkrhash).
//
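// In an effort to support reentrancy during writes we are squirreling
// away the thread id of the thread holding the write lock into the upper
// 16 bits of the lock count. This is possible as long as thread ids stay
// smaller than 0x7FFF. Anything higher than that would flip the sign bit
// and we'd no longer be able to do signed comparisons to check
// for read vs. write.
//
// NOTE: this paragraph and the table below appear to describe an earlier
// layout. The struct above keeps the owning thread id in the separate _id
// field and uses the upper bits of _bits for the writer-waiting flag and
// the write lock recursion count.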
//
// read write
// lower #read locks #write locks (from same thread)
// higher 0x0000 thread id of thread holding lock
//
// Adapted from LKRHash's lock.cpp, from GeorgeRe
// The original implementation is due to PALarson.