base/condition_variable_win.cc - platform/external/chromium - Git at Google

 // Copyright (c) 2006-2008 The Chromium Authors. All rights reserved.
 // Use of this source code is governed by a BSD-style license that can be
 // found in the LICENSE file.

 #include "base/condition_variable.h"

 #include <stack>

 #include "base/lock.h"
 #include "base/logging.h"
 #include "base/time.h"

 using base::TimeDelta;

 ConditionVariable::ConditionVariable(Lock* user_lock)
   : user_lock_(*user_lock),
     run_state_(RUNNING),
     allocation_counter_(0),
     recycling_list_size_(0) {
   DCHECK(user_lock);
 }

 ConditionVariable::~ConditionVariable() {
   AutoLock auto_lock(internal_lock_);
   run_state_ = SHUTDOWN;  // Prevent any more waiting.

   DCHECK_EQ(recycling_list_size_, allocation_counter_);
   if (recycling_list_size_ != allocation_counter_) {  // Rare shutdown problem.
     // There are threads of execution still in this->TimedWait() and yet the
     // caller has instigated the destruction of this instance :-/.
     // A common reason for such "overly hasty" destruction is that the caller
     // was not willing to wait for all the threads to terminate.  Such hasty
     // actions are a violation of our usage contract, but we'll give the
     // waiting thread(s) one last chance to exit gracefully (prior to our
     // destruction).
     // Note: waiting_list_ *might* be empty, but recycling is still pending.
     AutoUnlock auto_unlock(internal_lock_);
     Broadcast();  // Make sure all waiting threads have been signaled.
     Sleep(10);  // Give threads a chance to grab internal_lock_.
     // All contained threads should be blocked on user_lock_ by now :-).
   }  // Reacquire internal_lock_.

   DCHECK_EQ(recycling_list_size_, allocation_counter_);
 }

 void ConditionVariable::Wait() {
   // Default to "wait forever" timing, which means have to get a Signal()
   // or Broadcast() to come out of this wait state.
   TimedWait(TimeDelta::FromMilliseconds(INFINITE));
 }

 void ConditionVariable::TimedWait(const TimeDelta& max_time) {
   Event* waiting_event;
   HANDLE handle;
   {
     AutoLock auto_lock(internal_lock_);
     if (RUNNING != run_state_) return;  // Destruction in progress.
     waiting_event = GetEventForWaiting();
     handle = waiting_event->handle();
     DCHECK(handle);
   }  // Release internal_lock.

   {
     AutoUnlock unlock(user_lock_);  // Release caller's lock
     WaitForSingleObject(handle, static_cast<DWORD>(max_time.InMilliseconds()));
     // Minimize spurious signal creation window by recycling asap.
     AutoLock auto_lock(internal_lock_);
     RecycleEvent(waiting_event);
     // Release internal_lock_
   }  // Reacquire callers lock to depth at entry.
 }

 // Broadcast() is guaranteed to signal all threads that were waiting (i.e., had
 // a cv_event internally allocated for them) before Broadcast() was called.
 void ConditionVariable::Broadcast() {
   std::stack<HANDLE> handles;  // See FAQ-question-10.
   {
     AutoLock auto_lock(internal_lock_);
     if (waiting_list_.IsEmpty())
       return;
     while (!waiting_list_.IsEmpty())
       // This is not a leak from waiting_list_.  See FAQ-question 12.
       handles.push(waiting_list_.PopBack()->handle());
   }  // Release internal_lock_.
   while (!handles.empty()) {
     SetEvent(handles.top());
     handles.pop();
   }
 }

 // Signal() will select one of the waiting threads, and signal it (signal its
 // cv_event).  For better performance we signal the thread that went to sleep
 // most recently (LIFO).  If we want fairness, then we wake the thread that has
 // been sleeping the longest (FIFO).
 void ConditionVariable::Signal() {
   HANDLE handle;
   {
     AutoLock auto_lock(internal_lock_);
     if (waiting_list_.IsEmpty())
       return;  // No one to signal.
     // Only performance option should be used.
     // This is not a leak from waiting_list.  See FAQ-question 12.
      handle = waiting_list_.PopBack()->handle();  // LIFO.
   }  // Release internal_lock_.
   SetEvent(handle);
 }

 // GetEventForWaiting() provides a unique cv_event for any caller that needs to
 // wait.  This means that (worst case) we may over time create as many cv_event
 // objects as there are threads simultaneously using this instance's Wait()
 // functionality.
 ConditionVariable::Event* ConditionVariable::GetEventForWaiting() {
   // We hold internal_lock, courtesy of Wait().
   Event* cv_event;
   if (0 == recycling_list_size_) {
     DCHECK(recycling_list_.IsEmpty());
     cv_event = new Event();
     cv_event->InitListElement();
     allocation_counter_++;
     CHECK(cv_event->handle());
   } else {
     cv_event = recycling_list_.PopFront();
     recycling_list_size_--;
   }
   waiting_list_.PushBack(cv_event);
   return cv_event;
 }

 // RecycleEvent() takes a cv_event that was previously used for Wait()ing, and
 // recycles it for use in future Wait() calls for this or other threads.
 // Note that there is a tiny chance that the cv_event is still signaled when we
 // obtain it, and that can cause spurious signals (if/when we re-use the
 // cv_event), but such is quite rare (see FAQ-question-5).
 void ConditionVariable::RecycleEvent(Event* used_event) {
   // We hold internal_lock, courtesy of Wait().
   // If the cv_event timed out, then it is necessary to remove it from
   // waiting_list_.  If it was selected by Broadcast() or Signal(), then it is
   // already gone.
   used_event->Extract();  // Possibly redundant
   recycling_list_.PushBack(used_event);
   recycling_list_size_++;
 }
 //------------------------------------------------------------------------------
 // The next section provides the implementation for the private Event class.
 //------------------------------------------------------------------------------

 // Event provides a doubly-linked-list of events for use exclusively by the
 // ConditionVariable class.

 // This custom container was crafted because no simple combination of STL
 // classes appeared to support the functionality required.  The specific
 // unusual requirement for a linked-list-class is support for the Extract()
 // method, which can remove an element from a list, potentially for insertion
 // into a second list.  Most critically, the Extract() method is idempotent,
 // turning the indicated element into an extracted singleton whether it was
 // contained in a list or not.  This functionality allows one (or more) of
 // threads to do the extraction.  The iterator that identifies this extractable
 // element (in this case, a pointer to the list element) can be used after
 // arbitrary manipulation of the (possibly) enclosing list container.  In
 // general, STL containers do not provide iterators that can be used across
 // modifications (insertions/extractions) of the enclosing containers, and
 // certainly don't provide iterators that can be used if the identified
 // element is *deleted* (removed) from the container.

 // It is possible to use multiple redundant containers, such as an STL list,
 // and an STL map, to achieve similar container semantics.  This container has
 // only O(1) methods, while the corresponding (multiple) STL container approach
 // would have more complex O(log(N)) methods (yeah... N isn't that large).
 // Multiple containers also makes correctness more difficult to assert, as
 // data is redundantly stored and maintained, which is generally evil.

 ConditionVariable::Event::Event() : handle_(0) {
   next_ = prev_ = this;  // Self referencing circular.
 }

 ConditionVariable::Event::~Event() {
   if (0 == handle_) {
     // This is the list holder
     while (!IsEmpty()) {
       Event* cv_event = PopFront();
       DCHECK(cv_event->ValidateAsItem());
       delete cv_event;
     }
   }
   DCHECK(IsSingleton());
   if (0 != handle_) {
     int ret_val = CloseHandle(handle_);
     DCHECK(ret_val);
   }
 }

 // Change a container instance permanently into an element of a list.
 void ConditionVariable::Event::InitListElement() {
   DCHECK(!handle_);
   handle_ = CreateEvent(NULL, false, false, NULL);
   CHECK(handle_);
 }

 // Methods for use on lists.
 bool ConditionVariable::Event::IsEmpty() const {
   DCHECK(ValidateAsList());
   return IsSingleton();
 }

 void ConditionVariable::Event::PushBack(Event* other) {
   DCHECK(ValidateAsList());
   DCHECK(other->ValidateAsItem());
   DCHECK(other->IsSingleton());
   // Prepare other for insertion.
   other->prev_ = prev_;
   other->next_ = this;
   // Cut into list.
   prev_->next_ = other;
   prev_ = other;
   DCHECK(ValidateAsDistinct(other));
 }

 ConditionVariable::Event* ConditionVariable::Event::PopFront() {
   DCHECK(ValidateAsList());
   DCHECK(!IsSingleton());
   return next_->Extract();
 }

 ConditionVariable::Event* ConditionVariable::Event::PopBack() {
   DCHECK(ValidateAsList());
   DCHECK(!IsSingleton());
   return prev_->Extract();
 }

 // Methods for use on list elements.
 // Accessor method.
 HANDLE ConditionVariable::Event::handle() const {
   DCHECK(ValidateAsItem());
   return handle_;
 }

 // Pull an element from a list (if it's in one).
 ConditionVariable::Event* ConditionVariable::Event::Extract() {
   DCHECK(ValidateAsItem());
   if (!IsSingleton()) {
     // Stitch neighbors together.
     next_->prev_ = prev_;
     prev_->next_ = next_;
     // Make extractee into a singleton.
     prev_ = next_ = this;
   }
   DCHECK(IsSingleton());
   return this;
 }

 // Method for use on a list element or on a list.
 bool ConditionVariable::Event::IsSingleton() const {
   DCHECK(ValidateLinks());
   return next_ == this;
 }

 // Provide pre/post conditions to validate correct manipulations.
 bool ConditionVariable::Event::ValidateAsDistinct(Event* other) const {
   return ValidateLinks() && other->ValidateLinks() && (this != other);
 }

 bool ConditionVariable::Event::ValidateAsItem() const {
   return (0 != handle_) && ValidateLinks();
 }

 bool ConditionVariable::Event::ValidateAsList() const {
   return (0 == handle_) && ValidateLinks();
 }

 bool ConditionVariable::Event::ValidateLinks() const {
   // Make sure both of our neighbors have links that point back to us.
   // We don't do the O(n) check and traverse the whole loop, and instead only
   // do a local check to (and returning from) our immediate neighbors.
   return (next_->prev_ == this) && (prev_->next_ == this);
 }


 /*
 FAQ On subtle implementation details:

 1) What makes this problem subtle?  Please take a look at "Strategies
 for Implementing POSIX Condition Variables on Win32" by Douglas
 C. Schmidt and Irfan Pyarali.
 http://www.cs.wustl.edu/~schmidt/win32-cv-1.html It includes
 discussions of numerous flawed strategies for implementing this
 functionality.  I'm not convinced that even the final proposed
 implementation has semantics that are as nice as this implementation
 (especially with regard to Broadcast() and the impact on threads that
 try to Wait() after a Broadcast() has been called, but before all the
 original waiting threads have been signaled).

 2) Why can't you use a single wait_event for all threads that call
 Wait()?  See FAQ-question-1, or consider the following: If a single
 event were used, then numerous threads calling Wait() could release
 their cs locks, and be preempted just before calling
 WaitForSingleObject().  If a call to Broadcast() was then presented on
 a second thread, it would be impossible to actually signal all
 waiting(?) threads.  Some number of SetEvent() calls *could* be made,
 but there could be no guarantee that those led to to more than one
 signaled thread (SetEvent()'s may be discarded after the first!), and
 there could be no guarantee that the SetEvent() calls didn't just
 awaken "other" threads that hadn't even started waiting yet (oops).
 Without any limit on the number of requisite SetEvent() calls, the
 system would be forced to do many such calls, allowing many new waits
 to receive spurious signals.

 3) How does this implementation cause spurious signal events?  The
 cause in this implementation involves a race between a signal via
 time-out and a signal via Signal() or Broadcast().  The series of
 actions leading to this are:

 a) Timer fires, and a waiting thread exits the line of code:

     WaitForSingleObject(waiting_event, max_time.InMilliseconds());

 b) That thread (in (a)) is randomly pre-empted after the above line,
 leaving the waiting_event reset (unsignaled) and still in the
 waiting_list_.

 c) A call to Signal() (or Broadcast()) on a second thread proceeds, and
 selects the waiting cv_event (identified in step (b)) as the event to revive
 via a call to SetEvent().

 d) The Signal() method (step c) calls SetEvent() on waiting_event (step b).

 e) The waiting cv_event (step b) is now signaled, but no thread is
 waiting on it.

 f) When that waiting_event (step b) is reused, it will immediately
 be signaled (spuriously).


 4) Why do you recycle events, and cause spurious signals?  First off,
 the spurious events are very rare.  They can only (I think) appear
 when the race described in FAQ-question-3 takes place.  This should be
 very rare.  Most(?)  uses will involve only timer expiration, or only
 Signal/Broadcast() actions.  When both are used, it will be rare that
 the race will appear, and it would require MANY Wait() and signaling
 activities.  If this implementation did not recycle events, then it
 would have to create and destroy events for every call to Wait().
 That allocation/deallocation and associated construction/destruction
 would be costly (per wait), and would only be a rare benefit (when the
 race was "lost" and a spurious signal took place). That would be bad
 (IMO) optimization trade-off.  Finally, such spurious events are
 allowed by the specification of condition variables (such as
 implemented in Vista), and hence it is better if any user accommodates
 such spurious events (see usage note in condition_variable.h).

 5) Why don't you reset events when you are about to recycle them, or
 about to reuse them, so that the spurious signals don't take place?
 The thread described in FAQ-question-3 step c may be pre-empted for an
 arbitrary length of time before proceeding to step d.  As a result,
 the wait_event may actually be re-used *before* step (e) is reached.
 As a result, calling reset would not help significantly.

 6) How is it that the callers lock is released atomically with the
 entry into a wait state?  We commit to the wait activity when we
 allocate the wait_event for use in a given call to Wait().  This
 allocation takes place before the caller's lock is released (and
 actually before our internal_lock_ is released).  That allocation is
 the defining moment when "the wait state has been entered," as that
 thread *can* now be signaled by a call to Broadcast() or Signal().
 Hence we actually "commit to wait" before releasing the lock, making
 the pair effectively atomic.

 8) Why do you need to lock your data structures during waiting, as the
 caller is already in possession of a lock?  We need to Acquire() and
 Release() our internal lock during Signal() and Broadcast().  If we tried
 to use a callers lock for this purpose, we might conflict with their
 external use of the lock.  For example, the caller may use to consistently
 hold a lock on one thread while calling Signal() on another, and that would
 block Signal().

 9) Couldn't a more efficient implementation be provided if you
 preclude using more than one external lock in conjunction with a
 single ConditionVariable instance?  Yes, at least it could be viewed
 as a simpler API (since you don't have to reiterate the lock argument
 in each Wait() call).  One of the constructors now takes a specific
 lock as an argument, and a there are corresponding Wait() calls that
 don't specify a lock now.  It turns that the resulting implmentation
 can't be made more efficient, as the internal lock needs to be used by
 Signal() and Broadcast(), to access internal data structures.  As a
 result, I was not able to utilize the user supplied lock (which is
 being used by the user elsewhere presumably) to protect the private
 member access.

 9) Since you have a second lock, how can be be sure that there is no
 possible deadlock scenario?  Our internal_lock_ is always the last
 lock acquired, and the first one released, and hence a deadlock (due
 to critical section problems) is impossible as a consequence of our
 lock.

 10) When doing a Broadcast(), why did you copy all the events into
 an STL queue, rather than making a linked-loop, and iterating over it?
 The iterating during Broadcast() is done so outside the protection
 of the internal lock. As a result, other threads, such as the thread
 wherein a related event is waiting, could asynchronously manipulate
 the links around a cv_event.  As a result, the link structure cannot
 be used outside a lock.  Broadcast() could iterate over waiting
 events by cycling in-and-out of the protection of the internal_lock,
 but that appears more expensive than copying the list into an STL
 stack.

 11) Why did the lock.h file need to be modified so much for this
 change?  Central to a Condition Variable is the atomic release of a
 lock during a Wait().  This places Wait() functionality exactly
 mid-way between the two classes, Lock and Condition Variable.  Given
 that there can be nested Acquire()'s of locks, and Wait() had to
 Release() completely a held lock, it was necessary to augment the Lock
 class with a recursion counter. Even more subtle is the fact that the
 recursion counter (in a Lock) must be protected, as many threads can
 access it asynchronously.  As a positive fallout of this, there are
 now some DCHECKS to be sure no one Release()s a Lock more than they
 Acquire()ed it, and there is ifdef'ed functionality that can detect
 nested locks (legal under windows, but not under Posix).

 12) Why is it that the cv_events removed from list in Broadcast() and Signal()
 are not leaked?  How are they recovered??  The cv_events that appear to leak are
 taken from the waiting_list_.  For each element in that list, there is currently
 a thread in or around the WaitForSingleObject() call of Wait(), and those
 threads have references to these otherwise leaked events. They are passed as
 arguments to be recycled just aftre returning from WaitForSingleObject().

 13) Why did you use a custom container class (the linked list), when STL has
 perfectly good containers, such as an STL list?  The STL list, as with any
 container, does not guarantee the utility of an iterator across manipulation
 (such as insertions and deletions) of the underlying container.  The custom
 double-linked-list container provided that assurance.  I don't believe any
 combination of STL containers provided the services that were needed at the same
 O(1) efficiency as the custom linked list.  The unusual requirement
 for the container class is that a reference to an item within a container (an
 iterator) needed to be maintained across an arbitrary manipulation of the
 container.  This requirement exposes itself in the Wait() method, where a
 waiting_event must be selected prior to the WaitForSingleObject(), and then it
 must be used as part of recycling to remove the related instance from the
 waiting_list.  A hash table (STL map) could be used, but I was embarrased to
 use a complex and relatively low efficiency container when a doubly linked list
 provided O(1) performance in all required operations.  Since other operations
 to provide performance-and/or-fairness required queue (FIFO) and list (LIFO)
 containers, I would also have needed to use an STL list/queue as well as an STL
 map.  In the end I decided it would be "fun" to just do it right, and I
 put so many assertions (DCHECKs) into the container class that it is trivial to
 code review and validate its correctness.

 */
	// Copyright (c) 2006-2008 The Chromium Authors. All rights reserved.
	// Use of this source code is governed by a BSD-style license that can be
	// found in the LICENSE file.

	#include "base/condition_variable.h"

	#include <stack>

	#include "base/lock.h"
	#include "base/logging.h"
	#include "base/time.h"

	using base::TimeDelta;

	ConditionVariable::ConditionVariable(Lock* user_lock)
	: user_lock_(*user_lock),
	run_state_(RUNNING),
	allocation_counter_(0),
	recycling_list_size_(0) {
	DCHECK(user_lock);
	}

	ConditionVariable::~ConditionVariable() {
	AutoLock auto_lock(internal_lock_);
	run_state_ = SHUTDOWN; // Prevent any more waiting.

	DCHECK_EQ(recycling_list_size_, allocation_counter_);
	if (recycling_list_size_ != allocation_counter_) { // Rare shutdown problem.
	// There are threads of execution still in this->TimedWait() and yet the
	// caller has instigated the destruction of this instance :-/.
	// A common reason for such "overly hasty" destruction is that the caller
	// was not willing to wait for all the threads to terminate. Such hasty
	// actions are a violation of our usage contract, but we'll give the
	// waiting thread(s) one last chance to exit gracefully (prior to our
	// destruction).
	// Note: waiting_list_ might be empty, but recycling is still pending.
	AutoUnlock auto_unlock(internal_lock_);
	Broadcast(); // Make sure all waiting threads have been signaled.
	Sleep(10); // Give threads a chance to grab internal_lock_.
	// All contained threads should be blocked on user_lock_ by now :-).
	} // Reacquire internal_lock_.

	DCHECK_EQ(recycling_list_size_, allocation_counter_);
	}

	void ConditionVariable::Wait() {
	// Default to "wait forever" timing, which means have to get a Signal()
	// or Broadcast() to come out of this wait state.
	TimedWait(TimeDelta::FromMilliseconds(INFINITE));
	}

	void ConditionVariable::TimedWait(const TimeDelta& max_time) {
	Event* waiting_event;
	HANDLE handle;
	{
	AutoLock auto_lock(internal_lock_);
	if (RUNNING != run_state_) return; // Destruction in progress.
	waiting_event = GetEventForWaiting();
	handle = waiting_event->handle();
	DCHECK(handle);
	} // Release internal_lock.

	{
	AutoUnlock unlock(user_lock_); // Release caller's lock
	WaitForSingleObject(handle, static_cast<DWORD>(max_time.InMilliseconds()));
	// Minimize spurious signal creation window by recycling asap.
	AutoLock auto_lock(internal_lock_);
	RecycleEvent(waiting_event);
	// Release internal_lock_
	} // Reacquire callers lock to depth at entry.
	}

	// Broadcast() is guaranteed to signal all threads that were waiting (i.e., had
	// a cv_event internally allocated for them) before Broadcast() was called.
	void ConditionVariable::Broadcast() {
	std::stack<HANDLE> handles; // See FAQ-question-10.
	{
	AutoLock auto_lock(internal_lock_);
	if (waiting_list_.IsEmpty())
	return;
	while (!waiting_list_.IsEmpty())
	// This is not a leak from waiting_list_. See FAQ-question 12.
	handles.push(waiting_list_.PopBack()->handle());
	} // Release internal_lock_.
	while (!handles.empty()) {
	SetEvent(handles.top());
	handles.pop();
	}
	}

	// Signal() will select one of the waiting threads, and signal it (signal its
	// cv_event). For better performance we signal the thread that went to sleep
	// most recently (LIFO). If we want fairness, then we wake the thread that has
	// been sleeping the longest (FIFO).
	void ConditionVariable::Signal() {
	HANDLE handle;
	{
	AutoLock auto_lock(internal_lock_);
	if (waiting_list_.IsEmpty())
	return; // No one to signal.
	// Only performance option should be used.
	// This is not a leak from waiting_list. See FAQ-question 12.
	handle = waiting_list_.PopBack()->handle(); // LIFO.
	} // Release internal_lock_.
	SetEvent(handle);
	}

	// GetEventForWaiting() provides a unique cv_event for any caller that needs to
	// wait. This means that (worst case) we may over time create as many cv_event
	// objects as there are threads simultaneously using this instance's Wait()
	// functionality.
	ConditionVariable::Event* ConditionVariable::GetEventForWaiting() {
	// We hold internal_lock, courtesy of Wait().
	Event* cv_event;
	if (0 == recycling_list_size_) {
	DCHECK(recycling_list_.IsEmpty());
	cv_event = new Event();
	cv_event->InitListElement();
	allocation_counter_++;
	CHECK(cv_event->handle());
	} else {
	cv_event = recycling_list_.PopFront();
	recycling_list_size_--;
	}
	waiting_list_.PushBack(cv_event);
	return cv_event;
	}

	// RecycleEvent() takes a cv_event that was previously used for Wait()ing, and
	// recycles it for use in future Wait() calls for this or other threads.
	// Note that there is a tiny chance that the cv_event is still signaled when we
	// obtain it, and that can cause spurious signals (if/when we re-use the
	// cv_event), but such is quite rare (see FAQ-question-5).
	void ConditionVariable::RecycleEvent(Event* used_event) {
	// We hold internal_lock, courtesy of Wait().
	// If the cv_event timed out, then it is necessary to remove it from
	// waiting_list_. If it was selected by Broadcast() or Signal(), then it is
	// already gone.
	used_event->Extract(); // Possibly redundant
	recycling_list_.PushBack(used_event);
	recycling_list_size_++;
	}
	//------------------------------------------------------------------------------
	// The next section provides the implementation for the private Event class.
	//------------------------------------------------------------------------------

	// Event provides a doubly-linked-list of events for use exclusively by the
	// ConditionVariable class.

	// This custom container was crafted because no simple combination of STL
	// classes appeared to support the functionality required. The specific
	// unusual requirement for a linked-list-class is support for the Extract()
	// method, which can remove an element from a list, potentially for insertion
	// into a second list. Most critically, the Extract() method is idempotent,
	// turning the indicated element into an extracted singleton whether it was
	// contained in a list or not. This functionality allows one (or more) of
	// threads to do the extraction. The iterator that identifies this extractable
	// element (in this case, a pointer to the list element) can be used after
	// arbitrary manipulation of the (possibly) enclosing list container. In
	// general, STL containers do not provide iterators that can be used across
	// modifications (insertions/extractions) of the enclosing containers, and
	// certainly don't provide iterators that can be used if the identified
	// element is deleted (removed) from the container.

	// It is possible to use multiple redundant containers, such as an STL list,
	// and an STL map, to achieve similar container semantics. This container has
	// only O(1) methods, while the corresponding (multiple) STL container approach
	// would have more complex O(log(N)) methods (yeah... N isn't that large).
	// Multiple containers also makes correctness more difficult to assert, as
	// data is redundantly stored and maintained, which is generally evil.

	ConditionVariable::Event::Event() : handle_(0) {
	next_ = prev_ = this; // Self referencing circular.
	}

	ConditionVariable::Event::~Event() {
	if (0 == handle_) {
	// This is the list holder
	while (!IsEmpty()) {
	Event* cv_event = PopFront();
	DCHECK(cv_event->ValidateAsItem());
	delete cv_event;
	}
	}
	DCHECK(IsSingleton());
	if (0 != handle_) {
	int ret_val = CloseHandle(handle_);
	DCHECK(ret_val);
	}
	}

	// Change a container instance permanently into an element of a list.
	void ConditionVariable::Event::InitListElement() {
	DCHECK(!handle_);
	handle_ = CreateEvent(NULL, false, false, NULL);
	CHECK(handle_);
	}

	// Methods for use on lists.
	bool ConditionVariable::Event::IsEmpty() const {
	DCHECK(ValidateAsList());
	return IsSingleton();
	}

	void ConditionVariable::Event::PushBack(Event* other) {
	DCHECK(ValidateAsList());
	DCHECK(other->ValidateAsItem());
	DCHECK(other->IsSingleton());
	// Prepare other for insertion.
	other->prev_ = prev_;
	other->next_ = this;
	// Cut into list.
	prev_->next_ = other;
	prev_ = other;
	DCHECK(ValidateAsDistinct(other));
	}

	ConditionVariable::Event* ConditionVariable::Event::PopFront() {
	DCHECK(ValidateAsList());
	DCHECK(!IsSingleton());
	return next_->Extract();
	}

	ConditionVariable::Event* ConditionVariable::Event::PopBack() {
	DCHECK(ValidateAsList());
	DCHECK(!IsSingleton());
	return prev_->Extract();
	}

	// Methods for use on list elements.
	// Accessor method.
	HANDLE ConditionVariable::Event::handle() const {
	DCHECK(ValidateAsItem());
	return handle_;
	}

	// Pull an element from a list (if it's in one).
	ConditionVariable::Event* ConditionVariable::Event::Extract() {
	DCHECK(ValidateAsItem());
	if (!IsSingleton()) {
	// Stitch neighbors together.
	next_->prev_ = prev_;
	prev_->next_ = next_;
	// Make extractee into a singleton.
	prev_ = next_ = this;
	}
	DCHECK(IsSingleton());
	return this;
	}

	// Method for use on a list element or on a list.
	bool ConditionVariable::Event::IsSingleton() const {
	DCHECK(ValidateLinks());
	return next_ == this;
	}

	// Provide pre/post conditions to validate correct manipulations.
	bool ConditionVariable::Event::ValidateAsDistinct(Event* other) const {
	return ValidateLinks() && other->ValidateLinks() && (this != other);
	}

	bool ConditionVariable::Event::ValidateAsItem() const {
	return (0 != handle_) && ValidateLinks();
	}

	bool ConditionVariable::Event::ValidateAsList() const {
	return (0 == handle_) && ValidateLinks();
	}

	bool ConditionVariable::Event::ValidateLinks() const {
	// Make sure both of our neighbors have links that point back to us.
	// We don't do the O(n) check and traverse the whole loop, and instead only
	// do a local check to (and returning from) our immediate neighbors.
	return (next_->prev_ == this) && (prev_->next_ == this);
	}


	/*
	FAQ On subtle implementation details:

	1) What makes this problem subtle? Please take a look at "Strategies
	for Implementing POSIX Condition Variables on Win32" by Douglas
	C. Schmidt and Irfan Pyarali.
	http://www.cs.wustl.edu/~schmidt/win32-cv-1.html It includes
	discussions of numerous flawed strategies for implementing this
	functionality. I'm not convinced that even the final proposed
	implementation has semantics that are as nice as this implementation
	(especially with regard to Broadcast() and the impact on threads that
	try to Wait() after a Broadcast() has been called, but before all the
	original waiting threads have been signaled).

	2) Why can't you use a single wait_event for all threads that call
	Wait()? See FAQ-question-1, or consider the following: If a single
	event were used, then numerous threads calling Wait() could release
	their cs locks, and be preempted just before calling
	WaitForSingleObject(). If a call to Broadcast() was then presented on
	a second thread, it would be impossible to actually signal all
	waiting(?) threads. Some number of SetEvent() calls could be made,
	but there could be no guarantee that those led to to more than one
	signaled thread (SetEvent()'s may be discarded after the first!), and
	there could be no guarantee that the SetEvent() calls didn't just
	awaken "other" threads that hadn't even started waiting yet (oops).
	Without any limit on the number of requisite SetEvent() calls, the
	system would be forced to do many such calls, allowing many new waits
	to receive spurious signals.

	3) How does this implementation cause spurious signal events? The
	cause in this implementation involves a race between a signal via
	time-out and a signal via Signal() or Broadcast(). The series of
	actions leading to this are:

	a) Timer fires, and a waiting thread exits the line of code:

	WaitForSingleObject(waiting_event, max_time.InMilliseconds());

	b) That thread (in (a)) is randomly pre-empted after the above line,
	leaving the waiting_event reset (unsignaled) and still in the
	waiting_list_.

	c) A call to Signal() (or Broadcast()) on a second thread proceeds, and
	selects the waiting cv_event (identified in step (b)) as the event to revive
	via a call to SetEvent().

	d) The Signal() method (step c) calls SetEvent() on waiting_event (step b).

	e) The waiting cv_event (step b) is now signaled, but no thread is
	waiting on it.

	f) When that waiting_event (step b) is reused, it will immediately
	be signaled (spuriously).


	4) Why do you recycle events, and cause spurious signals? First off,
	the spurious events are very rare. They can only (I think) appear
	when the race described in FAQ-question-3 takes place. This should be
	very rare. Most(?) uses will involve only timer expiration, or only
	Signal/Broadcast() actions. When both are used, it will be rare that
	the race will appear, and it would require MANY Wait() and signaling
	activities. If this implementation did not recycle events, then it
	would have to create and destroy events for every call to Wait().
	That allocation/deallocation and associated construction/destruction
	would be costly (per wait), and would only be a rare benefit (when the
	race was "lost" and a spurious signal took place). That would be bad
	(IMO) optimization trade-off. Finally, such spurious events are
	allowed by the specification of condition variables (such as
	implemented in Vista), and hence it is better if any user accommodates
	such spurious events (see usage note in condition_variable.h).

	5) Why don't you reset events when you are about to recycle them, or
	about to reuse them, so that the spurious signals don't take place?
	The thread described in FAQ-question-3 step c may be pre-empted for an
	arbitrary length of time before proceeding to step d. As a result,
	the wait_event may actually be re-used before step (e) is reached.
	As a result, calling reset would not help significantly.

	6) How is it that the callers lock is released atomically with the
	entry into a wait state? We commit to the wait activity when we
	allocate the wait_event for use in a given call to Wait(). This
	allocation takes place before the caller's lock is released (and
	actually before our internal_lock_ is released). That allocation is
	the defining moment when "the wait state has been entered," as that
	thread can now be signaled by a call to Broadcast() or Signal().
	Hence we actually "commit to wait" before releasing the lock, making
	the pair effectively atomic.

	8) Why do you need to lock your data structures during waiting, as the
	caller is already in possession of a lock? We need to Acquire() and
	Release() our internal lock during Signal() and Broadcast(). If we tried
	to use a callers lock for this purpose, we might conflict with their
	external use of the lock. For example, the caller may use to consistently
	hold a lock on one thread while calling Signal() on another, and that would
	block Signal().

	9) Couldn't a more efficient implementation be provided if you
	preclude using more than one external lock in conjunction with a
	single ConditionVariable instance? Yes, at least it could be viewed
	as a simpler API (since you don't have to reiterate the lock argument
	in each Wait() call). One of the constructors now takes a specific
	lock as an argument, and a there are corresponding Wait() calls that
	don't specify a lock now. It turns that the resulting implmentation
	can't be made more efficient, as the internal lock needs to be used by
	Signal() and Broadcast(), to access internal data structures. As a
	result, I was not able to utilize the user supplied lock (which is
	being used by the user elsewhere presumably) to protect the private
	member access.

	9) Since you have a second lock, how can be be sure that there is no
	possible deadlock scenario? Our internal_lock_ is always the last
	lock acquired, and the first one released, and hence a deadlock (due
	to critical section problems) is impossible as a consequence of our
	lock.

	10) When doing a Broadcast(), why did you copy all the events into
	an STL queue, rather than making a linked-loop, and iterating over it?
	The iterating during Broadcast() is done so outside the protection
	of the internal lock. As a result, other threads, such as the thread
	wherein a related event is waiting, could asynchronously manipulate
	the links around a cv_event. As a result, the link structure cannot
	be used outside a lock. Broadcast() could iterate over waiting
	events by cycling in-and-out of the protection of the internal_lock,
	but that appears more expensive than copying the list into an STL
	stack.

	11) Why did the lock.h file need to be modified so much for this
	change? Central to a Condition Variable is the atomic release of a
	lock during a Wait(). This places Wait() functionality exactly
	mid-way between the two classes, Lock and Condition Variable. Given
	that there can be nested Acquire()'s of locks, and Wait() had to
	Release() completely a held lock, it was necessary to augment the Lock
	class with a recursion counter. Even more subtle is the fact that the
	recursion counter (in a Lock) must be protected, as many threads can
	access it asynchronously. As a positive fallout of this, there are
	now some DCHECKS to be sure no one Release()s a Lock more than they
	Acquire()ed it, and there is ifdef'ed functionality that can detect
	nested locks (legal under windows, but not under Posix).

	12) Why is it that the cv_events removed from list in Broadcast() and Signal()
	are not leaked? How are they recovered?? The cv_events that appear to leak are
	taken from the waiting_list_. For each element in that list, there is currently
	a thread in or around the WaitForSingleObject() call of Wait(), and those
	threads have references to these otherwise leaked events. They are passed as
	arguments to be recycled just aftre returning from WaitForSingleObject().

	13) Why did you use a custom container class (the linked list), when STL has
	perfectly good containers, such as an STL list? The STL list, as with any
	container, does not guarantee the utility of an iterator across manipulation
	(such as insertions and deletions) of the underlying container. The custom
	double-linked-list container provided that assurance. I don't believe any
	combination of STL containers provided the services that were needed at the same
	O(1) efficiency as the custom linked list. The unusual requirement
	for the container class is that a reference to an item within a container (an
	iterator) needed to be maintained across an arbitrary manipulation of the
	container. This requirement exposes itself in the Wait() method, where a
	waiting_event must be selected prior to the WaitForSingleObject(), and then it
	must be used as part of recycling to remove the related instance from the
	waiting_list. A hash table (STL map) could be used, but I was embarrased to
	use a complex and relatively low efficiency container when a doubly linked list
	provided O(1) performance in all required operations. Since other operations
	to provide performance-and/or-fairness required queue (FIFO) and list (LIFO)
	containers, I would also have needed to use an STL list/queue as well as an STL
	map. In the end I decided it would be "fun" to just do it right, and I
	put so many assertions (DCHECKs) into the container class that it is trivial to
	code review and validate its correctness.

	*/