From ef1e2ab328087c61a6878c1e84f4fc5d710aebce Mon Sep 17 00:00:00 2001
From: dotnet-bot <dotnet-bot@microsoft.com>
Date: Fri, 30 Jan 2015 14:14:42 -0800
Subject: Initial commit to populate CoreCLR repo

[tfs-changeset: 1407945]
---
 src/vm/win32threadpool.cpp | 5597 ++++++++++++++++++++++++++++++++++++++++++++
 1 file changed, 5597 insertions(+)
 create mode 100644 src/vm/win32threadpool.cpp

(limited to 'src/vm/win32threadpool.cpp')
diff --git a/src/vm/win32threadpool.cpp b/src/vm/win32threadpool.cpp
new file mode 100644
index 0000000000..3e80eb1e67
--- /dev/null
+++ b/src/vm/win32threadpool.cpp
@@ -0,0 +1,5597 @@
+//
+// Copyright (c) Microsoft. All rights reserved.
+// Licensed under the MIT license. See LICENSE file in the project root for full license information.
+//
+
+
+/*++
+
+Module Name:
+
+    Win32ThreadPool.cpp
+
+Abstract:
+
+    This module implements Threadpool support using Win32 APIs
+
+
+Revision History:
+    December 1999 - Created
+
+--*/
+
+#include "common.h"
+#include "log.h"
+#include "threadpoolrequest.h"
+#include "win32threadpool.h"
+#include "delegateinfo.h"
+#include "eeconfig.h"
+#include "dbginterface.h"
+#include "corhost.h"
+#include "eventtrace.h"
+#include "threads.h"
+#include "appdomain.inl"
+#include "nativeoverlapped.h"
+#include "hillclimbing.h"
+
+
+#ifndef FEATURE_PAL
+#ifndef DACCESS_COMPILE
+
+// APIs that must be accessed through dynamic linking.
+// Each typedef below gives the signature of one such API, and the g_pufn* global that
+// follows it holds the resolved entry point. The pointers start out NULL and are filled
+// in by ThreadpoolMgr::InitPlatformVariables() through GetProcAddress.
+
+// Looked up in ntdll.dll under the export name "NtQueryInformationThread".
+typedef int (WINAPI *NtQueryInformationThreadProc) (
+    HANDLE ThreadHandle,
+    THREADINFOCLASS ThreadInformationClass,
+    PVOID ThreadInformation,
+    ULONG ThreadInformationLength,
+    PULONG ReturnLength);
+NtQueryInformationThreadProc g_pufnNtQueryInformationThread = NULL;
+
+// Looked up in ntdll.dll under the export name "NtQuerySystemInformation".
+typedef int (WINAPI *NtQuerySystemInformationProc) ( 
+    SYSTEM_INFORMATION_CLASS SystemInformationClass,
+    PVOID SystemInformation,
+    ULONG SystemInformationLength,
+    PULONG ReturnLength OPTIONAL);
+NtQuerySystemInformationProc g_pufnNtQuerySystemInformation = NULL;
+
+// Looked up under the export name "CreateWaitableTimerExW"; stays NULL when the
+// export is not present.
+typedef HANDLE (WINAPI * CreateWaitableTimerExProc) (
+    LPSECURITY_ATTRIBUTES lpTimerAttributes,
+    LPCTSTR lpTimerName,
+    DWORD dwFlags,
+    DWORD dwDesiredAccess);
+CreateWaitableTimerExProc g_pufnCreateWaitableTimerEx = NULL;
+
+// Looked up under the export name "SetWaitableTimerEx"; stays NULL when the
+// export is not present.
+typedef BOOL (WINAPI * SetWaitableTimerExProc) (
+    HANDLE hTimer,
+    const LARGE_INTEGER *lpDueTime,
+    LONG lPeriod,
+    PTIMERAPCROUTINE pfnCompletionRoutine,
+    LPVOID lpArgToCompletionRoutine,
+    void* WakeContext, //should be PREASON_CONTEXT, but it's not defined for us (and we don't use it)
+    ULONG TolerableDelay);
+SetWaitableTimerExProc g_pufnSetWaitableTimerEx = NULL;
+
+#endif // !DACCESS_COMPILE
+#endif // !FEATURE_PAL
+
+// Storage for ThreadpoolMgr's static members: completion port (CP) thread state,
+// worker thread state, CPU utilization and hill climbing bookkeeping.
+BOOL ThreadpoolMgr::InitCompletionPortThreadpool = FALSE;
+HANDLE ThreadpoolMgr::GlobalCompletionPort;                 // used for binding io completions on file handles
+
+SVAL_IMPL(ThreadpoolMgr::ThreadCounter,ThreadpoolMgr,CPThreadCounter);
+
+SVAL_IMPL_INIT(LONG,ThreadpoolMgr,MaxLimitTotalCPThreads,1000);   // starts at 1000; replaced by SetMaxThreadsHelper()
+SVAL_IMPL(LONG,ThreadpoolMgr,MinLimitTotalCPThreads);             // set to NumberOfProcessors by Initialize()
+SVAL_IMPL(LONG,ThreadpoolMgr,MaxFreeCPThreads);                   // = MaxFreeCPThreadsPerCPU * Number of CPUS
+
+Volatile<LONG> ThreadpoolMgr::NumCPInfrastructureThreads = 0;      // number of threads currently busy handling draining cycle
+
+SVAL_IMPL(ThreadpoolMgr::ThreadCounter, ThreadpoolMgr, WorkerCounter);
+
+SVAL_IMPL(LONG,ThreadpoolMgr,MinLimitTotalWorkerThreads);          // Initialize(): ThreadPool_ForceMinWorkerThreads if non-zero, else NumberOfProcessors
+SVAL_IMPL(LONG,ThreadpoolMgr,MaxLimitTotalWorkerThreads);        // Initialize(): ThreadPool_ForceMaxWorkerThreads if non-zero, else GetDefaultMaxLimitWorkerThreads()
+
+SVAL_IMPL(LONG,ThreadpoolMgr,cpuUtilization);
+LONG    ThreadpoolMgr::cpuUtilizationAverage = 0;
+
+HillClimbing ThreadpoolMgr::HillClimbingInstance;
+
+Volatile<LONG> ThreadpoolMgr::PriorCompletedWorkRequests = 0;
+Volatile<DWORD> ThreadpoolMgr::PriorCompletedWorkRequestsTime;
+Volatile<DWORD> ThreadpoolMgr::NextCompletedWorkRequestsTime;
+LARGE_INTEGER ThreadpoolMgr::CurrentSampleStartTime;
+
+int ThreadpoolMgr::ThreadAdjustmentInterval;                       // read from the HillClimbing_SampleIntervalLow config value in Initialize()
+
+// Tuning constants for the thread pool. Times are in milliseconds.
+#define INVALID_HANDLE ((HANDLE) -1)
+#define NEW_THREAD_THRESHOLD            7       // Number of requests outstanding before we start a new thread
+#define CP_THREAD_PENDINGIO_WAIT 5000           // polling interval when thread is retired but has a pending io
+#define GATE_THREAD_DELAY 500 /*milliseconds*/
+#define GATE_THREAD_DELAY_TOLERANCE 50 /*milliseconds*/
+// The two sums below are parenthesized so that they keep their value when the macro is
+// used inside a larger expression (for example next to '*', '/' or a unary '-').
+#define DELAY_BETWEEN_SUSPENDS (5000 + GATE_THREAD_DELAY) // time to delay between suspensions
+#define SUSPEND_TIME (GATE_THREAD_DELAY + 100)  // milliseconds to suspend during SuspendProcessing
+
+// Storage for the remaining ThreadpoolMgr static members: initialization state, work
+// request queue, timer queue, synchronization objects and gate/wait thread state.
+LONG ThreadpoolMgr::Initialization=0;           // indicator of whether the threadpool is initialized.
+Volatile<unsigned int> ThreadpoolMgr::LastDequeueTime; // used to determine if work items are getting thread starved
+int ThreadpoolMgr::offset_counter = 0;
+
+SPTR_IMPL(WorkRequest,ThreadpoolMgr,WorkRequestHead);        // Head of work request queue
+SPTR_IMPL(WorkRequest,ThreadpoolMgr,WorkRequestTail);        // Tail of work request queue
+
+SVAL_IMPL(ThreadpoolMgr::LIST_ENTRY,ThreadpoolMgr,TimerQueue);  // queue of timers
+
+//unsigned int ThreadpoolMgr::LastCpuSamplingTime=0;      //  last time cpu utilization was sampled by gate thread
+unsigned int ThreadpoolMgr::LastCPThreadCreation=0;     //  last time a completion port thread was created
+unsigned int ThreadpoolMgr::NumberOfProcessors; // processor count the limits are derived from; assigned in Initialize()
+
+
+CrstStatic ThreadpoolMgr::WorkerCriticalSection;
+CLREvent * ThreadpoolMgr::RetiredCPWakeupEvent;       // wakeup event for completion port threads
+CrstStatic ThreadpoolMgr::WaitThreadsCriticalSection;
+ThreadpoolMgr::LIST_ENTRY ThreadpoolMgr::WaitThreadsHead;
+
+ThreadpoolMgr::UnfairSemaphore* ThreadpoolMgr::WorkerSemaphore;
+CLRSemaphore* ThreadpoolMgr::RetiredWorkerSemaphore;
+
+CrstStatic ThreadpoolMgr::TimerQueueCriticalSection;
+HANDLE ThreadpoolMgr::TimerThread=NULL;
+Thread *ThreadpoolMgr::pTimerThread=NULL;
+DWORD ThreadpoolMgr::LastTickCount;
+
+#ifdef _DEBUG
+DWORD ThreadpoolMgr::TickCountAdjustment=0;     // debug only; read from the ThreadpoolTickCountAdjustment config value in Initialize()
+#endif
+
+LONG  ThreadpoolMgr::GateThreadStatus=GATE_THREAD_STATUS_NOT_RUNNING;
+
+ThreadpoolMgr::RecycledListsWrapper ThreadpoolMgr::RecycledLists;
+
+ThreadpoolMgr::TimerInfo *ThreadpoolMgr::TimerInfosToBeRecycled = NULL;
+
+BOOL ThreadpoolMgr::IsApcPendingOnWaitThread = FALSE;
+
+#ifndef DACCESS_COMPILE
+
+// Macros for inserting/deleting from doubly linked list
+//
+// Every statement-like macro below expands to ONE braced compound statement, so it
+// behaves as a unit when it is the body of an unbraced if/for/while.
+
+// Makes ListHead an empty list: both links point back at the head itself.
+#define InitializeListHead(ListHead) (\
+    (ListHead)->Flink = (ListHead)->Blink = (ListHead))
+
+//
+// these are named the same as slightly different macros in the NT headers
+//
+#undef RemoveHeadList
+#undef RemoveEntryList
+#undef InsertTailList
+#undef InsertHeadList
+
+// Unlinks the first entry of the list and stores it in FirstEntry.
+#define RemoveHeadList(ListHead,FirstEntry) \
+    {\
+    FirstEntry = (LIST_ENTRY*) (ListHead)->Flink;\
+    ((LIST_ENTRY*)FirstEntry->Flink)->Blink = (ListHead);\
+    (ListHead)->Flink = FirstEntry->Flink;\
+    }
+
+// Unlinks Entry from whatever list it is on. Entry is evaluated once.
+#define RemoveEntryList(Entry) {\
+    LIST_ENTRY* _EX_Entry;\
+        _EX_Entry = (Entry);\
+        ((LIST_ENTRY*) _EX_Entry->Blink)->Flink = _EX_Entry->Flink;\
+        ((LIST_ENTRY*) _EX_Entry->Flink)->Blink = _EX_Entry->Blink;\
+    }
+
+// Links Entry in as the last element of the list.
+// Wrapped in braces like the sibling macros: as four bare statements, only the first
+// one would have been controlled by an enclosing unbraced 'if'.
+#define InsertTailList(ListHead,Entry) {\
+    (Entry)->Flink = (ListHead);\
+    (Entry)->Blink = (ListHead)->Blink;\
+    ((LIST_ENTRY*)(ListHead)->Blink)->Flink = (Entry);\
+    (ListHead)->Blink = (Entry);\
+    }
+
+// Links Entry in as the first element of the list. ListHead is evaluated once.
+#define InsertHeadList(ListHead,Entry) {\
+    LIST_ENTRY* _EX_Flink;\
+    LIST_ENTRY* _EX_ListHead;\
+    _EX_ListHead = (LIST_ENTRY*)(ListHead);\
+    _EX_Flink = (LIST_ENTRY*) _EX_ListHead->Flink;\
+    (Entry)->Flink = _EX_Flink;\
+    (Entry)->Blink = _EX_ListHead;\
+    _EX_Flink->Blink = (Entry);\
+    _EX_ListHead->Flink = (Entry);\
+    }
+
+// TRUE when the list has no entries (the head links to itself).
+#define IsListEmpty(ListHead) \
+    ((ListHead)->Flink == (ListHead))
+
+// Translates an HRESULT into the thread's last-error value: the embedded Win32 code
+// when the HRESULT has FACILITY_WIN32, ERROR_INVALID_DATA for anything else.
+// Braced so the if/else cannot pair up with a surrounding 'if', and no longer ends in
+// a line continuation that pulls the following source line into the macro.
+#define SetLastHRError(hr) {\
+    if (HRESULT_FACILITY(hr) == FACILITY_WIN32)\
+        SetLastError(HRESULT_CODE(hr));\
+    else \
+        SetLastError(ERROR_INVALID_DATA);\
+    }
+
+/************************************************************************/
+
+// Allocates the table of recycled-memory lists: numProcs rows, each holding
+// MEMTYPE_COUNT RecycledListInfo entries, and stores it in pRecycledListPerProcessor.
+//
+// Parameters:
+//   numProcs - number of rows to allocate; ThreadpoolMgr::Initialize() passes a
+//              processor count.
+//
+// Declared THROWS; presumably the array allocation is what can throw - TODO confirm.
+void ThreadpoolMgr::RecycledListsWrapper::Initialize( unsigned int numProcs )
+{
+    CONTRACTL
+    {
+        THROWS;
+        MODE_ANY;
+        GC_NOTRIGGER;
+    }
+    CONTRACTL_END;
+
+    pRecycledListPerProcessor = new RecycledListInfo[numProcs][MEMTYPE_COUNT];
+}
+
+//--//
+
+// Returns only once the thread pool's one-time initialization has completed.
+//
+// Initialization is used as a three-state flag: 0 = not started, 1 = an attempt is in
+// progress, -1 = finished. The caller that wins the 0 -> 1 transition runs Initialize().
+// Every other caller yields and tries again until it either sees -1 or wins the
+// transition itself (which can happen after a failed attempt reset the flag to 0).
+//
+// Throws through COMPlusThrowOM() when this thread's Initialize() call returns FALSE.
+void ThreadpoolMgr::EnsureInitialized()
+{
+    CONTRACTL
+    {
+        THROWS;         // Initialize can throw
+        MODE_ANY;
+        GC_NOTRIGGER;
+    }
+    CONTRACTL_END;
+
+    if (IsInitialized())
+        return;
+
+    DWORD yieldCount = 0;
+
+    for (;;)
+    {
+        if (InterlockedCompareExchange(&Initialization, 1, 0) == 0)
+        {
+            // This thread owns the initialization attempt.
+            if (Initialize())
+            {
+                Initialization = -1;
+            }
+            else
+            {
+                // Release the claim so that a later caller can retry, then report failure.
+                Initialization = 0;
+                COMPlusThrowOM();
+            }
+            return;
+        }
+
+        // Somebody else has already begun initializing.
+        if (Initialization == -1)
+            return;
+
+        // Not finished yet: give up the processor and look again.
+        __SwitchToThread(0, ++yieldCount);
+    }
+}
+
+// Computes the default upper limit for the number of worker threads.
+//
+// Parameters:
+//   minLimit - the minimum worker thread count; the result is raised to at least this
+//              value before the final cap is applied.
+//
+// Returns the limit, which never exceeds ThreadpoolMgr::ThreadCounter::MaxPossibleCount.
+DWORD GetDefaultMaxLimitWorkerThreads(DWORD minLimit)
+{
+    CONTRACTL
+    {
+        MODE_ANY;
+        GC_NOTRIGGER;
+        NOTHROW;
+    }
+    CONTRACTL_END;
+
+    //
+    // We determine the max limit for worker threads as follows:
+    //
+    //  1) It must be at least MinLimitTotalWorkerThreads
+    //  2) It must be no greater than (half the virtual address space)/(thread stack size)
+    //  3) It must be <= MaxPossibleWorkerThreads
+    //
+    // TODO: what about CP threads?  Can they follow a similar plan?  How do we allocate
+    // thread counts between the two kinds of threads?
+    //
+    SIZE_T stackReserveSize = 0;
+    Thread::GetProcessDefaultStackSize(&stackReserveSize, NULL);
+
+    if (stackReserveSize == 0)
+    {
+        // The outcome of the query above is not checked, so the reserve size can still
+        // be the 0 it was initialized with. It is used as a divisor below; fall back to
+        // the Windows default stack reservation of 1 MB rather than dividing by zero.
+        stackReserveSize = 1024 * 1024;
+    }
+
+    ULONGLONG halfVirtualAddressSpace;
+
+    MEMORYSTATUSEX memStats;
+    memStats.dwLength = sizeof(memStats);
+    if (GlobalMemoryStatusEx(&memStats))
+    {
+        halfVirtualAddressSpace = memStats.ullTotalVirtual / 2;
+    }
+    else
+    {
+        //assume the normal Win32 32-bit virtual address space
+        halfVirtualAddressSpace = 0x000000007FFE0000ull / 2;
+    }
+
+    // Rule 2, then rule 1, then rule 3. Rule 3 is applied last and therefore wins when
+    // minLimit itself is above MaxPossibleCount.
+    ULONGLONG limit = halfVirtualAddressSpace / stackReserveSize;
+    limit = max(limit, (ULONGLONG)minLimit);
+    limit = min(limit, (ULONGLONG)ThreadpoolMgr::ThreadCounter::MaxPossibleCount);
+
+    _ASSERTE(FitsIn<DWORD>(limit));
+    return (DWORD)limit;
+}
+
+// Performs the one-time setup of the thread pool: processor count, dynamically bound
+// OS entry points, locks, events and semaphores, recycled-memory lists, the worker and
+// completion port thread limits and counters, the global IO completion port, and hill
+// climbing.
+//
+// Returns TRUE on success. Returns FALSE when an exception was caught while creating
+// the synchronization resources, or (hosted builds) when the host failed to create the
+// IO completion port.
+//
+// This function does not touch the Initialization flag; callers own that protocol.
+BOOL ThreadpoolMgr::Initialize()
+{
+    CONTRACTL
+    {
+        THROWS;
+        MODE_ANY;
+        GC_NOTRIGGER;
+        INJECT_FAULT(COMPlusThrowOM());
+    }
+    CONTRACTL_END;
+
+    BOOL bRet = FALSE;
+    BOOL bExceptionCaught = FALSE;
+
+    UnManagedPerAppDomainTPCount* pADTPCount;
+    pADTPCount = PerAppDomainTPCountList::GetUnmanagedTPCount();
+
+    //ThreadPool_CPUGroup
+    CPUGroupInfo::EnsureInitialized();
+    if (CPUGroupInfo::CanEnableGCCPUGroups() && CPUGroupInfo::CanEnableThreadUseAllCpuGroups())
+        NumberOfProcessors = CPUGroupInfo::GetNumActiveProcessors();
+    else
+        NumberOfProcessors = GetCurrentProcessCpuCount();
+    InitPlatformVariables();
+
+    // Everything inside the EX_TRY may throw; the EX_CATCH below undoes part of it and
+    // turns the exception into a FALSE return value.
+    EX_TRY
+    {
+        ThreadAdjustmentInterval = CLRConfig::GetConfigValue(CLRConfig::INTERNAL_HillClimbing_SampleIntervalLow);
+        
+        pADTPCount->InitResources();
+        WorkerCriticalSection.Init(CrstThreadpoolWorker);
+        WaitThreadsCriticalSection.Init(CrstThreadpoolWaitThreads);
+        TimerQueueCriticalSection.Init(CrstThreadpoolTimerQueue);
+
+        // initialize WaitThreadsHead
+        InitializeListHead(&WaitThreadsHead);
+
+        // initialize TimerQueue
+        InitializeListHead(&TimerQueue);
+
+        RetiredCPWakeupEvent = new CLREvent();
+        RetiredCPWakeupEvent->CreateAutoEvent(FALSE);
+        _ASSERTE(RetiredCPWakeupEvent->IsValid());
+
+        WorkerSemaphore = new UnfairSemaphore(ThreadCounter::MaxPossibleCount);
+
+        RetiredWorkerSemaphore = new CLRSemaphore();
+        RetiredWorkerSemaphore->Create(0, ThreadCounter::MaxPossibleCount);
+
+    // The recycled lists are sized from the active processor count across CPU groups,
+    // or otherwise from g_SystemInfo.dwNumberOfProcessors (not from NumberOfProcessors).
+    // NOTE: the indentation of the next five lines is misleading; the if/else is part
+    // of the EX_TRY body.
+    //ThreadPool_CPUGroup
+    if (CPUGroupInfo::CanEnableGCCPUGroups() && CPUGroupInfo::CanEnableThreadUseAllCpuGroups())
+            RecycledLists.Initialize( CPUGroupInfo::GetNumActiveProcessors() );
+        else
+        RecycledLists.Initialize( g_SystemInfo.dwNumberOfProcessors );
+    /*
+        {
+            SYSTEM_INFO sysInfo;
+
+            ::GetSystemInfo( &sysInfo );
+
+            RecycledLists.Initialize( sysInfo.dwNumberOfProcessors );
+        }
+    */
+    }
+    EX_CATCH
+    {
+        pADTPCount->CleanupResources();
+
+        if (RetiredCPWakeupEvent)
+        {
+            delete RetiredCPWakeupEvent;
+            RetiredCPWakeupEvent = NULL;
+        }
+
+        // NOTE(review): WorkerSemaphore and RetiredWorkerSemaphore are not released on
+        // this path even though they may already have been allocated - confirm whether
+        // that is intentional.
+
+        // Note: It is fine to call Destroy on uninitialized critical sections
+        WorkerCriticalSection.Destroy();
+        WaitThreadsCriticalSection.Destroy();
+        TimerQueueCriticalSection.Destroy();
+
+        bExceptionCaught = TRUE;
+    }
+    EX_END_CATCH(SwallowAllExceptions);
+
+    if (bExceptionCaught)
+    {
+        goto end;
+    }
+
+    // The locals below are declared without initializers and assigned on a separate
+    // line, presumably because the 'goto end' above jumps over them.
+
+    // initialize Worker and CP thread settings
+    DWORD forceMin;
+    forceMin = CLRConfig::GetConfigValue(CLRConfig::INTERNAL_ThreadPool_ForceMinWorkerThreads);
+    MinLimitTotalWorkerThreads = forceMin > 0 ? (LONG)forceMin : (LONG)NumberOfProcessors;
+
+    DWORD forceMax;
+    forceMax = CLRConfig::GetConfigValue(CLRConfig::INTERNAL_ThreadPool_ForceMaxWorkerThreads);
+    MaxLimitTotalWorkerThreads = forceMax > 0 ? (LONG)forceMax : (LONG)GetDefaultMaxLimitWorkerThreads(MinLimitTotalWorkerThreads);
+
+    // Worker counter starts with no threads and a working-thread goal equal to the minimum.
+    ThreadCounter::Counts counts;
+    counts.NumActive = 0;
+    counts.NumWorking = 0;
+    counts.NumRetired = 0;
+    counts.MaxWorking = MinLimitTotalWorkerThreads;
+    WorkerCounter.counts.AsLongLong = counts.AsLongLong;
+
+#ifdef _DEBUG
+    TickCountAdjustment = CLRConfig::GetConfigValue(CLRConfig::INTERNAL_ThreadpoolTickCountAdjustment);
+#endif
+
+    // initialize CP thread settings
+    MinLimitTotalCPThreads = NumberOfProcessors;
+
+    MaxFreeCPThreads = NumberOfProcessors*MaxFreeCPThreadsPerCPU;
+
+    // Completion port counter is seeded the same way as the worker counter.
+    counts.NumActive = 0;
+    counts.NumWorking = 0;
+    counts.NumRetired = 0;
+    counts.MaxWorking = MinLimitTotalCPThreads;
+    CPThreadCounter.counts.AsLongLong = counts.AsLongLong;
+
+#ifndef FEATURE_PAL    
+#ifdef FEATURE_INCLUDE_ALL_INTERFACES
+    if (CLRIoCompletionHosted())
+    {
+        // The host supplies the completion port; a failure here fails initialization.
+        HANDLE hPort;
+        HRESULT hr;
+        BEGIN_SO_TOLERANT_CODE_CALLING_HOST(GetThread());
+        hr = CorHost2::GetHostIoCompletionManager()->CreateIoCompletionPort(&hPort);
+        END_SO_TOLERANT_CODE_CALLING_HOST;
+        if (FAILED(hr))
+            goto end;
+
+        GlobalCompletionPort = hPort;
+    }
+    else
+#endif // FEATURE_INCLUDE_ALL_INTERFACES
+    {
+        // NOTE(review): the result of CreateIoCompletionPort is stored without being
+        // checked here - confirm that consumers of GlobalCompletionPort handle NULL.
+        GlobalCompletionPort = CreateIoCompletionPort(INVALID_HANDLE_VALUE,
+                                                      NULL,
+                                                      0,        /*ignored for invalid handle value*/
+                                                      NumberOfProcessors);
+    }
+#endif // !FEATURE_PAL    
+
+    HillClimbingInstance.Initialize();
+
+    bRet = TRUE;
+end:
+    return bRet;
+}
+
+// Resolves the OS entry points that the thread pool reaches through the g_pufn*
+// function pointers. A pointer receives whatever GetProcAddress returns, so it is NULL
+// when the export cannot be found. On FEATURE_PAL builds the function body is empty.
+void ThreadpoolMgr::InitPlatformVariables()
+{
+    CONTRACTL
+    {
+        NOTHROW;
+        MODE_ANY;
+        GC_NOTRIGGER;
+    }
+    CONTRACTL_END;
+
+#ifndef FEATURE_PAL
+    HINSTANCE ntdllModule;
+    HINSTANCE synchModule;
+
+    {
+        // Scope of the contract violation is limited to the two library loads.
+        CONTRACT_VIOLATION(GCViolation|FaultViolation);
+
+        ntdllModule = CLRLoadLibrary(W("ntdll.dll"));
+        _ASSERTE(ntdllModule);
+
+        // The waitable timer APIs come from the core synch API set on CoreSystem builds
+        // and from kernel32 everywhere else.
+#ifdef FEATURE_CORESYSTEM
+        synchModule = CLRLoadLibrary(W("api-ms-win-core-synch-l1-1-0.dll"));
+#else
+        synchModule = CLRLoadLibrary(W("kernel32.dll"));
+#endif
+        _ASSERTE(synchModule);
+    }
+
+    // These APIs must be accessed via dynamic binding since they may be removed in future
+    // OS versions.
+    g_pufnNtQueryInformationThread =
+        (NtQueryInformationThreadProc)GetProcAddress(ntdllModule, "NtQueryInformationThread");
+    g_pufnNtQuerySystemInformation =
+        (NtQuerySystemInformationProc)GetProcAddress(ntdllModule, "NtQuerySystemInformation");
+
+    // These APIs are only supported on newer Windows versions
+    g_pufnCreateWaitableTimerEx =
+        (CreateWaitableTimerExProc)GetProcAddress(synchModule, "CreateWaitableTimerExW");
+    g_pufnSetWaitableTimerEx =
+        (SetWaitableTimerExProc)GetProcAddress(synchModule, "SetWaitableTimerEx");
+#endif
+}
+
+// Applies new upper limits for worker threads and IO completion threads.
+//
+// Parameters:
+//   MaxWorkerThreads       - requested worker thread limit
+//   MaxIOCompletionThreads - requested IO completion thread limit
+//
+// Returns FALSE, changing nothing, when either request is below the corresponding
+// current minimum. Otherwise stores the limits (each capped at
+// ThreadCounter::MaxPossibleCount) and returns TRUE. The worker limit is left alone
+// when the ThreadPool_ForceMaxWorkerThreads config value is non-zero.
+BOOL ThreadpoolMgr::SetMaxThreadsHelper(DWORD MaxWorkerThreads,
+                                        DWORD MaxIOCompletionThreads)
+{
+    CONTRACTL
+    {
+        THROWS;     // Crst can throw and toggle GC mode
+        MODE_ANY;
+        GC_TRIGGERS;
+    }
+    CONTRACTL_END;
+
+    // doesn't need to be WorkerCS, but using it to avoid race condition between setting min and max, and didn't want to create a new CS.
+    CrstHolder csh(&WorkerCriticalSection);
+
+    // A maximum below the current minimum is rejected outright.
+    if (MaxWorkerThreads < (DWORD)MinLimitTotalWorkerThreads ||
+        MaxIOCompletionThreads < (DWORD)MinLimitTotalCPThreads)
+    {
+        return FALSE;
+    }
+
+    BEGIN_SO_INTOLERANT_CODE(GetThread());
+
+    if (CLRConfig::GetConfigValue(CLRConfig::INTERNAL_ThreadPool_ForceMaxWorkerThreads) == 0)
+    {
+        MaxLimitTotalWorkerThreads = min(MaxWorkerThreads, (DWORD)ThreadCounter::MaxPossibleCount);
+
+        // Lower the counter's MaxWorking value to the new limit, retrying for as long
+        // as another thread changes the counter underneath us.
+        ThreadCounter::Counts observed = WorkerCounter.GetCleanCounts();
+        while (observed.MaxWorking > MaxLimitTotalWorkerThreads)
+        {
+            ThreadCounter::Counts desired = observed;
+            desired.MaxWorking = MaxLimitTotalWorkerThreads;
+
+            ThreadCounter::Counts previous = WorkerCounter.CompareExchangeCounts(desired, observed);
+            if (previous == observed)
+            {
+                observed = desired;     // our value went in
+            }
+            else
+            {
+                observed = previous;    // lost the race; re-evaluate against the fresh value
+            }
+        }
+    }
+
+    END_SO_INTOLERANT_CODE;
+
+    MaxLimitTotalCPThreads = min(MaxIOCompletionThreads, (DWORD)ThreadCounter::MaxPossibleCount);
+
+    return TRUE;
+}
+
+/************************************************************************/
+// Sets the upper limits for worker threads and IO completion threads.
+//
+// Parameters:
+//   MaxWorkerThreads       - requested worker thread limit
+//   MaxIOCompletionThreads - requested IO completion thread limit
+//
+// Hosted builds forward each value to the matching host manager when there is one; a
+// failing host call sets the last error and returns FALSE, and when both managers
+// exist the function returns TRUE without touching the pool's own limits.
+//
+// Otherwise:
+//   - pool already initialized: returns the result of SetMaxThreadsHelper();
+//   - pool not started: this call initializes it, applies the limits and only then
+//     publishes the pool as initialized; returns FALSE if initialization fails;
+//   - another thread is in the middle of initializing: returns FALSE.
+BOOL ThreadpoolMgr::SetMaxThreads(DWORD MaxWorkerThreads,
+                                     DWORD MaxIOCompletionThreads)
+{
+    CONTRACTL
+    {
+        THROWS;     // SetMaxThreadsHelper can throw and toggle GC mode
+        MODE_ANY;
+        GC_TRIGGERS;
+    }
+    CONTRACTL_END;
+
+#ifdef FEATURE_INCLUDE_ALL_INTERFACES
+    IHostThreadpoolManager *threadpoolProvider = CorHost2::GetHostThreadpoolManager();
+    if (threadpoolProvider) {
+        HRESULT hr;
+        BEGIN_SO_TOLERANT_CODE_CALLING_HOST(GetThread());
+        hr = threadpoolProvider->SetMaxThreads(MaxWorkerThreads);
+        END_SO_TOLERANT_CODE_CALLING_HOST;
+        if (FAILED(hr))
+        {
+            SetLastHRError(hr);
+            return FALSE;
+        }
+    }
+
+    IHostIoCompletionManager *ioCompletionProvider = CorHost2::GetHostIoCompletionManager();
+    if (ioCompletionProvider) {
+        HRESULT hr;
+        BEGIN_SO_TOLERANT_CODE_CALLING_HOST(GetThread());
+        hr = ioCompletionProvider->SetMaxThreads(MaxIOCompletionThreads);
+        END_SO_TOLERANT_CODE_CALLING_HOST;
+        if (FAILED(hr))
+        {
+            SetLastHRError(hr);
+            return FALSE;
+        }
+    }
+
+    if (threadpoolProvider && ioCompletionProvider) {
+        return TRUE;
+    }
+#endif // FEATURE_INCLUDE_ALL_INTERFACES
+
+    if (IsInitialized())
+    {
+        return SetMaxThreadsHelper(MaxWorkerThreads, MaxIOCompletionThreads);
+    }
+
+    if (InterlockedCompareExchange(&Initialization, 1, 0) == 0)
+    {
+        if (!Initialize())
+        {
+            // Initialization failed, so the critical section SetMaxThreadsHelper takes
+            // may have been destroyed again by Initialize(). Do not publish the pool as
+            // initialized; release the claim so a later caller can retry.
+            Initialization = 0;
+            return FALSE;
+        }
+
+        // The limits are applied before the flag flips to -1, so no other thread sees
+        // an initialized pool that still has the default maximums.
+        BOOL helper_result = SetMaxThreadsHelper(MaxWorkerThreads, MaxIOCompletionThreads);
+
+        Initialization = -1;
+        return helper_result;
+    }
+
+    // someone else is initializing. Too late, return false
+    return FALSE;
+}
+
+// Reports the upper limits for worker threads and IO completion threads.
+//
+// Parameters:
+//   MaxWorkerThreads       - receives the worker thread limit
+//   MaxIOCompletionThreads - receives the IO completion thread limit
+//
+// Returns TRUE on success. Returns FALSE after setting the last error when a host
+// manager call fails, or when either pointer is NULL and the answer was not supplied
+// entirely by the two host managers.
+//
+// While the pool is still uninitialized the worker limit is derived the way
+// Initialize() derives it; NumberOfProcessors is refreshed as a side effect.
+BOOL ThreadpoolMgr::GetMaxThreads(DWORD* MaxWorkerThreads,
+                                     DWORD* MaxIOCompletionThreads)
+{
+    LIMITED_METHOD_CONTRACT;
+
+#ifdef FEATURE_INCLUDE_ALL_INTERFACES
+    HRESULT hostResult = S_OK;
+
+    IHostThreadpoolManager *hostWorkerPool = CorHost2::GetHostThreadpoolManager();
+    if (hostWorkerPool != NULL)
+    {
+        BEGIN_SO_TOLERANT_CODE_CALLING_HOST(GetThread());
+        hostResult = hostWorkerPool->GetMaxThreads(MaxWorkerThreads);
+        END_SO_TOLERANT_CODE_CALLING_HOST;
+        if (FAILED(hostResult))
+        {
+            SetLastHRError(hostResult);
+            return FALSE;
+        }
+    }
+
+    IHostIoCompletionManager *hostIoPool = CorHost2::GetHostIoCompletionManager();
+    if (hostIoPool != NULL)
+    {
+        BEGIN_SO_TOLERANT_CODE_CALLING_HOST(GetThread());
+        hostResult = hostIoPool->GetMaxThreads(MaxIOCompletionThreads);
+        END_SO_TOLERANT_CODE_CALLING_HOST;
+        if (FAILED(hostResult))
+        {
+            SetLastHRError(hostResult);
+            return FALSE;
+        }
+    }
+
+    // Both values came from the host; nothing left to compute.
+    if (hostWorkerPool != NULL && hostIoPool != NULL)
+    {
+        return TRUE;
+    }
+#endif // FEATURE_INCLUDE_ALL_INTERFACES
+
+    if (MaxWorkerThreads == NULL || MaxIOCompletionThreads == NULL)
+    {
+        SetLastHRError(ERROR_INVALID_DATA);
+        return FALSE;
+    }
+
+    if (IsInitialized())
+    {
+        *MaxWorkerThreads = (DWORD)MaxLimitTotalWorkerThreads;
+        *MaxIOCompletionThreads = MaxLimitTotalCPThreads;
+        return TRUE;
+    }
+
+    // Not initialized yet: work out what the worker limit would be.
+    BEGIN_SO_INTOLERANT_CODE_NOTHROW(GetThread(), *MaxWorkerThreads = 1024);
+
+    //ThreadPool_CPUGroup
+    CPUGroupInfo::EnsureInitialized();
+    if (CPUGroupInfo::CanEnableGCCPUGroups() && CPUGroupInfo::CanEnableThreadUseAllCpuGroups())
+    {
+        NumberOfProcessors = CPUGroupInfo::GetNumActiveProcessors();
+    }
+    else
+    {
+        NumberOfProcessors = GetCurrentProcessCpuCount();
+    }
+
+    DWORD minWorkers = CLRConfig::GetConfigValue(CLRConfig::INTERNAL_ThreadPool_ForceMinWorkerThreads);
+    if (minWorkers == 0)
+    {
+        minWorkers = NumberOfProcessors;
+    }
+
+    // A forced maximum from configuration wins over the computed default.
+    DWORD forcedMax = CLRConfig::GetConfigValue(CLRConfig::INTERNAL_ThreadPool_ForceMaxWorkerThreads);
+    *MaxWorkerThreads = (forcedMax > 0) ? forcedMax : GetDefaultMaxLimitWorkerThreads(minWorkers);
+
+    END_SO_INTOLERANT_CODE;
+
+    *MaxIOCompletionThreads = MaxLimitTotalCPThreads;
+    return TRUE;
+}
+
+// Sets the lower limits for worker threads and IO completion threads.
+//
+// Parameters:
+//   MinWorkerThreads       - requested minimum number of worker threads
+//   MinIOCompletionThreads - requested minimum number of IO completion threads
+//
+// Hosted builds forward each value to the matching host manager when there is one; a
+// failing host call sets the last error and returns FALSE, and when both managers
+// exist the function returns TRUE without touching the pool's own limits.
+//
+// Otherwise the pool is initialized on demand. Returns FALSE when that initialization
+// fails, when another thread is still initializing, or when either request exceeds the
+// corresponding current maximum. Returns TRUE once the limits are stored. The worker
+// minimum is left alone when the ThreadPool_ForceMinWorkerThreads config value is
+// non-zero.
+BOOL ThreadpoolMgr::SetMinThreads(DWORD MinWorkerThreads,
+                                     DWORD MinIOCompletionThreads)
+{
+    CONTRACTL
+    {
+        THROWS;     // Crst can throw and toggle GC mode
+        MODE_ANY;
+        GC_TRIGGERS;
+    }
+    CONTRACTL_END;
+
+#ifdef FEATURE_INCLUDE_ALL_INTERFACES
+    HRESULT hr = S_OK;
+
+    IHostThreadpoolManager *threadpoolProvider = CorHost2::GetHostThreadpoolManager();
+    if (threadpoolProvider) {
+        BEGIN_SO_TOLERANT_CODE_CALLING_HOST(GetThread());
+        hr = threadpoolProvider->SetMinThreads(MinWorkerThreads);
+        END_SO_TOLERANT_CODE_CALLING_HOST;
+        if (FAILED(hr))
+        {
+            SetLastHRError(hr);
+            return FALSE;
+        }
+    }
+
+    IHostIoCompletionManager *ioCompletionProvider = CorHost2::GetHostIoCompletionManager();
+    if (ioCompletionProvider) {
+        BEGIN_SO_TOLERANT_CODE_CALLING_HOST(GetThread());
+        hr = ioCompletionProvider->SetMinThreads(MinIOCompletionThreads);
+        END_SO_TOLERANT_CODE_CALLING_HOST;
+        if (FAILED(hr))
+        {
+            SetLastHRError(hr);
+            return FALSE;
+        }
+    }
+    if (threadpoolProvider && ioCompletionProvider) {
+        return TRUE;
+    }
+#endif // FEATURE_INCLUDE_ALL_INTERFACES
+
+    if (!IsInitialized())
+    {
+        if (InterlockedCompareExchange(&Initialization, 1, 0) == 0)
+        {
+            if (!Initialize())
+            {
+                // Initialization failed, so the critical section taken below may have
+                // been destroyed again by Initialize(). Do not publish the pool as
+                // initialized; release the claim so a later caller can retry.
+                Initialization = 0;
+                return FALSE;
+            }
+            Initialization = -1;
+        }
+    }
+
+    if (IsInitialized())
+    {
+        // doesn't need to be WorkerCS, but using it to avoid race condition between setting min and max, and didn't want to create a new CS.
+        CrstHolder csh(&WorkerCriticalSection);
+
+        BOOL init_result = FALSE;
+
+        // Both arguments are unsigned, so only the upper bounds need checking.
+        if (MinWorkerThreads <= (DWORD) MaxLimitTotalWorkerThreads &&
+            MinIOCompletionThreads <= (DWORD) MaxLimitTotalCPThreads)
+        {
+            BEGIN_SO_INTOLERANT_CODE(GetThread());
+
+            if (CLRConfig::GetConfigValue(CLRConfig::INTERNAL_ThreadPool_ForceMinWorkerThreads) == 0)
+            {
+                MinLimitTotalWorkerThreads = min(MinWorkerThreads, (DWORD)ThreadCounter::MaxPossibleCount);
+
+                // Raise the counter's MaxWorking value to the new minimum, retrying for
+                // as long as another thread changes the counter underneath us.
+                ThreadCounter::Counts counts = WorkerCounter.GetCleanCounts();
+                while (counts.MaxWorking < MinLimitTotalWorkerThreads)
+                {
+                    ThreadCounter::Counts newCounts = counts;
+                    newCounts.MaxWorking = MinLimitTotalWorkerThreads;
+
+                    ThreadCounter::Counts oldCounts = WorkerCounter.CompareExchangeCounts(newCounts, counts);
+                    if (oldCounts == counts)
+                    {
+                        counts = newCounts;
+
+                        // if we increased the limit, and there are pending workitems, we need
+                        // to dispatch a thread to process the work.
+                        if (newCounts.MaxWorking > oldCounts.MaxWorking &&
+                            PerAppDomainTPCountList::AreRequestsPendingInAnyAppDomains())
+                        {
+                            MaybeAddWorkingWorker();
+                        }
+                    }
+                    else
+                    {
+                        counts = oldCounts;
+                    }
+                }
+            }
+
+            END_SO_INTOLERANT_CODE;
+
+            MinLimitTotalCPThreads = min(MinIOCompletionThreads, (DWORD)ThreadCounter::MaxPossibleCount);
+
+            init_result = TRUE;
+        }
+
+        return init_result;
+    }
+    // someone else is initializing. Too late, return false
+    return FALSE;
+
+}
+
+// Reports the lower limits for worker threads and IO completion threads.
+//
+// Parameters:
+//   MinWorkerThreads       - receives the minimum number of worker threads
+//   MinIOCompletionThreads - receives the minimum number of IO completion threads
+//
+// Returns TRUE on success. Returns FALSE after setting the last error when a host
+// manager call fails, or when either pointer is NULL and the answer was not supplied
+// entirely by the two host managers.
+//
+// While the pool is still uninitialized the values are derived the way Initialize()
+// derives them; NumberOfProcessors is refreshed as a side effect.
+BOOL ThreadpoolMgr::GetMinThreads(DWORD* MinWorkerThreads,
+                                     DWORD* MinIOCompletionThreads)
+{
+    LIMITED_METHOD_CONTRACT;
+
+#ifdef FEATURE_INCLUDE_ALL_INTERFACES
+    HRESULT hostResult = S_OK;
+
+    IHostThreadpoolManager *hostWorkerPool = CorHost2::GetHostThreadpoolManager();
+    if (hostWorkerPool != NULL)
+    {
+        BEGIN_SO_TOLERANT_CODE_CALLING_HOST(GetThread());
+        hostResult = hostWorkerPool->GetMinThreads(MinWorkerThreads);
+        END_SO_TOLERANT_CODE_CALLING_HOST;
+        if (FAILED(hostResult))
+        {
+            SetLastHRError(hostResult);
+            return FALSE;
+        }
+    }
+
+    IHostIoCompletionManager *hostIoPool = CorHost2::GetHostIoCompletionManager();
+    if (hostIoPool != NULL)
+    {
+        BEGIN_SO_TOLERANT_CODE_CALLING_HOST(GetThread());
+        hostResult = hostIoPool->GetMinThreads(MinIOCompletionThreads);
+        END_SO_TOLERANT_CODE_CALLING_HOST;
+        if (FAILED(hostResult))
+        {
+            SetLastHRError(hostResult);
+            return FALSE;
+        }
+    }
+
+    // Both values came from the host; nothing left to compute.
+    if (hostWorkerPool != NULL && hostIoPool != NULL)
+    {
+        return TRUE;
+    }
+#endif // FEATURE_INCLUDE_ALL_INTERFACES
+
+    if (MinWorkerThreads == NULL || MinIOCompletionThreads == NULL)
+    {
+        SetLastHRError(ERROR_INVALID_DATA);
+        return FALSE;
+    }
+
+    if (IsInitialized())
+    {
+        *MinWorkerThreads = (DWORD)MinLimitTotalWorkerThreads;
+        *MinIOCompletionThreads = MinLimitTotalCPThreads;
+        return TRUE;
+    }
+
+    // Not initialized yet: derive the values from the processor count and configuration.
+    CPUGroupInfo::EnsureInitialized();
+    if (CPUGroupInfo::CanEnableGCCPUGroups() && CPUGroupInfo::CanEnableThreadUseAllCpuGroups())
+    {
+        NumberOfProcessors = CPUGroupInfo::GetNumActiveProcessors();
+    }
+    else
+    {
+        NumberOfProcessors = GetCurrentProcessCpuCount();
+    }
+
+    DWORD configuredMin;
+    BEGIN_SO_INTOLERANT_CODE_NOTHROW(GetThread(), configuredMin=0);
+    configuredMin = CLRConfig::GetConfigValue(CLRConfig::INTERNAL_ThreadPool_ForceMinWorkerThreads);
+    END_SO_INTOLERANT_CODE;
+
+    // A forced minimum from configuration wins over the processor count.
+    if (configuredMin > 0)
+    {
+        *MinWorkerThreads = configuredMin;
+    }
+    else
+    {
+        *MinWorkerThreads = NumberOfProcessors;
+    }
+    *MinIOCompletionThreads = NumberOfProcessors;
+
+    return TRUE;
+}
+
+// Reports how many more worker threads and IO completion threads could be put to work.
+//
+// Parameters:
+//   AvailableWorkerThreads       - receives the available worker thread count
+//   AvailableIOCompletionThreads - receives the available IO completion thread count
+//
+// Returns TRUE on success, FALSE (with the last error set) on failure.
+//
+// Initialized pool: hosted builds ask the host managers first and return TRUE when both
+// exist. Otherwise the values are computed from the thread counters:
+//   worker: 0 when the limit is below NumActive, else limit - NumWorking
+//   IO:     NumActive - NumWorking when the limit is below NumActive, else
+//           limit - NumWorking
+//
+// Uninitialized pool: every thread is still available, so the answer is whatever
+// GetMaxThreads() reports, including its failure result.
+BOOL ThreadpoolMgr::GetAvailableThreads(DWORD* AvailableWorkerThreads,
+                                        DWORD* AvailableIOCompletionThreads)
+{
+    LIMITED_METHOD_CONTRACT;
+
+    if (IsInitialized())
+    {
+#ifdef FEATURE_INCLUDE_ALL_INTERFACES
+        HRESULT hr = S_OK;
+
+        IHostThreadpoolManager *threadpoolProvider = CorHost2::GetHostThreadpoolManager();
+        if (threadpoolProvider) {
+            BEGIN_SO_TOLERANT_CODE_CALLING_HOST(GetThread());
+            hr = threadpoolProvider->GetAvailableThreads(AvailableWorkerThreads);
+            END_SO_TOLERANT_CODE_CALLING_HOST;
+            if (FAILED(hr))
+            {
+                SetLastHRError(hr);
+                return FALSE;
+            }
+        }
+
+        IHostIoCompletionManager *ioCompletionProvider = CorHost2::GetHostIoCompletionManager();
+        if (ioCompletionProvider) {
+            BEGIN_SO_TOLERANT_CODE_CALLING_HOST(GetThread());
+            hr = ioCompletionProvider->GetAvailableThreads(AvailableIOCompletionThreads);
+            END_SO_TOLERANT_CODE_CALLING_HOST;
+            if (FAILED(hr))
+            {
+                SetLastHRError(hr);
+                return FALSE;
+            }
+        }
+
+        if (threadpoolProvider && ioCompletionProvider) {
+            return TRUE;
+        }
+#endif // FEATURE_INCLUDE_ALL_INTERFACES
+
+        if (!AvailableWorkerThreads || !AvailableIOCompletionThreads)
+        {
+            SetLastHRError(ERROR_INVALID_DATA);
+            return FALSE;
+        }
+
+        ThreadCounter::Counts counts = WorkerCounter.GetCleanCounts();
+
+        if (MaxLimitTotalWorkerThreads < counts.NumActive)
+            *AvailableWorkerThreads = 0;
+        else
+            *AvailableWorkerThreads = MaxLimitTotalWorkerThreads - counts.NumWorking;
+
+        counts = CPThreadCounter.GetCleanCounts();
+        if (MaxLimitTotalCPThreads < counts.NumActive)
+            *AvailableIOCompletionThreads = counts.NumActive - counts.NumWorking;
+        else
+            *AvailableIOCompletionThreads = MaxLimitTotalCPThreads - counts.NumWorking;
+
+        return TRUE;
+    }
+
+    // Propagate GetMaxThreads' result: it fails (and sets the last error) for NULL out
+    // pointers or a failing host call, and that must not be reported as success.
+    return GetMaxThreads(AvailableWorkerThreads, AvailableIOCompletionThreads);
+}
+
+// Runs one work item callback and afterwards cleans up the calling thread: if the
+// thread has a managed Thread object, a requested abort is reset and InternalReset is
+// called on it.
+//
+// Parameters:
+//   Function - the callback to invoke
+//   Context  - the argument handed to the callback
+void QueueUserWorkItemHelp(LPTHREAD_START_ROUTINE Function, PVOID Context)
+{
+    STATIC_CONTRACT_THROWS;
+    STATIC_CONTRACT_GC_TRIGGERS;
+    STATIC_CONTRACT_MODE_ANY;
+    // A regular CONTRACTL block (THROWS / GC_TRIGGERS / MODE_ANY) cannot be used here
+    // because of SEH, hence the static contract annotations above.
+
+    Function(Context);
+
+    Thread *pCurrentThread = GetThread();
+    if (pCurrentThread == NULL)
+    {
+        return;
+    }
+
+    if (pCurrentThread->IsAbortRequested())
+    {
+        pCurrentThread->EEResetAbort(Thread::TAR_ALL);
+    }
+    pCurrentThread->InternalReset(FALSE);
+}
+
+//
+// WorkingThreadCounts tracks the number of worker threads currently doing user work, and the maximum number of such threads
+// since the last time TakeMaxWorkingThreadCount was called.  This information is for diagnostic purposes only,
+// and is tracked only if the CLR config value INTERNAL_ThreadPool_EnableWorkerTracking is non-zero (this feature is off
+// by default).
+//
+// Both counters are 16-bit bit-fields that share storage with asLong, so the pair can be read and replaced as a
+// single LONG with an interlocked compare-exchange.
+//
+union WorkingThreadCounts
+{
+    struct
+    {
+        int currentWorking : 16;    // threads executing a work item right now
+        int maxWorking : 16;        // high-water mark of currentWorking since the last reset
+    };
+
+    LONG asLong;                    // both fields viewed as one value for atomic updates
+};
+
+// The single process-wide instance updated by ThreadpoolMgr::ReportThreadStatus.
+WorkingThreadCounts g_workingThreadCounts;
+
+//
+// Worker-tracking hook (see WorkingThreadCounts): invoked with isWorking == true right before a worker thread
+// runs a work item and with isWorking == false right after.  Atomically adjusts currentWorking and raises
+// maxWorking whenever currentWorking exceeds it.
+//
+void ThreadpoolMgr::ReportThreadStatus(bool isWorking)
+{
+    CONTRACTL
+    {
+        NOTHROW;
+        GC_NOTRIGGER;
+        SO_TOLERANT;
+        MODE_ANY;
+    }
+    CONTRACTL_END;
+    _ASSERTE(CLRConfig::GetConfigValue(CLRConfig::INTERNAL_ThreadPool_EnableWorkerTracking));
+
+    for (;;)
+    {
+        WorkingThreadCounts observed;
+        observed.asLong = VolatileLoad(&g_workingThreadCounts.asLong);
+
+        WorkingThreadCounts updated = observed;
+
+        if (isWorking)
+        {
+            // Starting work: count this thread first, then refresh the high-water mark.
+            updated.currentWorking++;
+            if (updated.currentWorking > updated.maxWorking)
+                updated.maxWorking = updated.currentWorking;
+        }
+        else
+        {
+            // Finishing work: refresh the high-water mark while this thread still counts, then drop it.
+            if (updated.currentWorking > updated.maxWorking)
+                updated.maxWorking = updated.currentWorking;
+            updated.currentWorking--;
+        }
+
+        // Publish only if nobody changed the counts since we read them; otherwise start over.
+        LONG witnessed = InterlockedCompareExchange(&g_workingThreadCounts.asLong, updated.asLong, observed.asLong);
+        if (witnessed == observed.asLong)
+            return;
+    }
+}
+
+//
+// Atomically resets WorkingThreadCounts.maxWorking to zero and returns the maximum working count observed
+// since the previous call to TakeMaxWorkingThreadCount.
+//
+int TakeMaxWorkingThreadCount()
+{
+    CONTRACTL
+    {
+        NOTHROW;
+        GC_NOTRIGGER;
+        SO_TOLERANT;
+        MODE_ANY;
+    }
+    CONTRACTL_END;
+    _ASSERTE(CLRConfig::GetConfigValue(CLRConfig::INTERNAL_ThreadPool_EnableWorkerTracking));
+
+    for (;;)
+    {
+        WorkingThreadCounts snapshot;
+        snapshot.asLong = VolatileLoad(&g_workingThreadCounts.asLong);
+
+        WorkingThreadCounts cleared = snapshot;
+        cleared.maxWorking = 0;
+
+        // Retry from a fresh snapshot if another thread changed the counts in the meantime.
+        if (InterlockedCompareExchange(&g_workingThreadCounts.asLong, cleared.asLong, snapshot.asLong) != snapshot.asLong)
+            continue;
+
+        // A zero maxWorking means the counts were not updated since the last reset, so the number of
+        // working threads for the whole period is simply the current number of working threads.
+        if (snapshot.maxWorking == 0)
+            return snapshot.currentWorking;
+
+        return snapshot.maxWorking;
+    }
+}
+
+
+/************************************************************************/
+
+//
+// Queues a work item, or (for CALL_OR_QUEUE) possibly runs it inline on the calling thread.
+//
+//   Function           - callback to run.
+//   Context            - argument passed to Function.
+//   Flags              - CALL_OR_QUEUE permits inline execution when enough completion-port
+//                        thread headroom remains; the value is also forwarded to a host provider.
+//   UnmanagedTPRequest - TRUE to queue Function on the unmanaged thread-pool queue.  When FALSE,
+//                        nothing is queued by this function (see the final else branch).
+//
+// Returns TRUE on every non-hosted path.  On the hosted path (FEATURE_INCLUDE_ALL_INTERFACES with a
+// host thread-pool manager) returns FALSE after SetLastHRError(hr) if the host call fails.
+//
+BOOL ThreadpoolMgr::QueueUserWorkItem(LPTHREAD_START_ROUTINE Function,
+                                      PVOID Context,
+                                      DWORD Flags,
+                                      BOOL UnmanagedTPRequest)
+{
+    CONTRACTL
+    {
+        THROWS;     // EnsureInitialized, EnqueueWorkRequest can throw OOM
+        GC_TRIGGERS;
+        MODE_ANY;
+    }
+    CONTRACTL_END;
+
+    EnsureInitialized();
+
+#ifdef FEATURE_INCLUDE_ALL_INTERFACES
+    HRESULT hr = S_OK;
+
+    // If a host supplies the thread pool, hand the request to it and return without touching our own queues.
+    IHostThreadpoolManager *provider = CorHost2::GetHostThreadpoolManager();
+    if (provider) {
+        BEGIN_SO_TOLERANT_CODE_CALLING_HOST(GetThread());
+
+        if(UnmanagedTPRequest)
+        {
+            hr = provider->QueueUserWorkItem(Function, Context, Flags);
+        }
+        else
+        {
+            // Managed requests are dispatched through ExecuteHostRequest rather than Function.
+            hr = provider->QueueUserWorkItem(ExecuteHostRequest, Context, Flags);
+        }
+        END_SO_TOLERANT_CODE_CALLING_HOST;
+        if (FAILED(hr))
+        {
+            SetLastHRError(hr);
+            return FALSE;
+        }
+        else
+        {
+            return TRUE;
+        }
+    }
+#endif // FEATURE_INCLUDE_ALL_INTERFACES
+
+    if (Flags == CALL_OR_QUEUE)
+    {
+        // we've been asked to call this directly if the thread pressure is not too high
+
+        // Required headroom: at least 3, or the processor count if that is larger.
+        int MinimumAvailableCPThreads = (NumberOfProcessors < 3) ? 3 : NumberOfProcessors;
+
+        ThreadCounter::Counts counts = CPThreadCounter.GetCleanCounts();
+        if ((MaxLimitTotalCPThreads - counts.NumActive) >= MinimumAvailableCPThreads )
+        {
+            ThreadLocaleHolder localeHolder;
+
+            // Run the item synchronously on this thread instead of queueing it.
+            QueueUserWorkItemHelp(Function, Context);
+            return TRUE;
+        }
+
+    }
+
+    if (UnmanagedTPRequest) 
+    {
+        UnManagedPerAppDomainTPCount* pADTPCount;
+        pADTPCount = PerAppDomainTPCountList::GetUnmanagedTPCount(); 
+        pADTPCount->QueueUnmanagedWorkRequest(Function, Context);
+    }
+    else
+    {
+        // caller has already registered its TPCount; this call is just to adjust the thread count
+        // NOTE(review): no thread-count adjustment is visible in this branch - confirm where it happens.
+    }
+
+    return TRUE;
+}
+
+
+// Decides whether the calling worker thread should keep running or retire.
+// Returns true to keep running.  Returns false after the worker counts have been atomically
+// updated to move this thread from working/active to retired.
+bool ThreadpoolMgr::ShouldWorkerKeepRunning()
+{
+    WRAPPER_NO_CONTRACT;
+    if (CLRThreadpoolHosted())
+        return true;
+
+    // Starting from a dirty read is fine: the worst case is that we do not retire this time.
+    // Retiring requires a successful CompareExchange, which validates the value we read.
+    ThreadCounter::Counts observed = WorkerCounter.DangerousGetDirtyCounts();
+    for (;;)
+    {
+        // No more active threads than the current maximum: nothing to retire.
+        if (observed.NumActive <= observed.MaxWorking)
+            return true;
+
+        ThreadCounter::Counts retired = observed;
+        retired.NumWorking--;
+        retired.NumActive--;
+        retired.NumRetired++;
+
+        ThreadCounter::Counts previous = WorkerCounter.CompareExchangeCounts(retired, observed);
+        if (previous == observed)
+            return false;
+
+        // Someone else changed the counts first; re-evaluate against what is there now.
+        observed = previous;
+    }
+}
+
+// Definition of the static lock that must be held while calling AdjustMaxWorkersActive
+// (that method asserts ThreadAdjustmentLock.IsHeld()).
+DangerousNonHostedSpinLock ThreadpoolMgr::ThreadAdjustmentLock;
+
+
+//
+// Feeds the sample that just ended (completion count and elapsed time) to HillClimbingInstance.Update
+// and publishes the MaxWorking value it returns into WorkerCounter.
+//
+// This method must only be called if ShouldAdjustMaxWorkersActive has returned true, *and*
+// ThreadAdjustmentLock is held.
+//
+void ThreadpoolMgr::AdjustMaxWorkersActive()
+{
+    CONTRACTL
+    {
+        NOTHROW;
+        if (GetThread()) { GC_TRIGGERS;} else {DISABLED(GC_NOTRIGGER);}
+        MODE_ANY;
+    }
+    CONTRACTL_END;
+
+    _ASSERTE(!CLRThreadpoolHosted());
+    _ASSERTE(ThreadAdjustmentLock.IsHeld());
+
+    // Completions since the previous adjustment.
+    DWORD currentTicks = GetTickCount();
+    LONG totalNumCompletions = Thread::GetTotalThreadPoolCompletionCount();
+    LONG numCompletions = totalNumCompletions - PriorCompletedWorkRequests;
+
+    LARGE_INTEGER startTime = CurrentSampleStartTime;
+    LARGE_INTEGER endTime;
+    QueryPerformanceCounter(&endTime);
+
+    // Performance-counter frequency, queried the first time through and cached in a function-local static.
+    static LARGE_INTEGER freq;
+    if (freq.QuadPart == 0)
+        QueryPerformanceFrequency(&freq);
+
+    // Length of the sample in seconds (counter ticks divided by ticks per second).
+    double elapsed = (double)(endTime.QuadPart - startTime.QuadPart) / freq.QuadPart;
+
+    //
+    // It's possible for the current sample to be reset while we're holding 
+    // ThreadAdjustmentLock.  This will result in a very short sample, possibly
+    // with completely bogus counts.  We'll try to detect this by checking the sample
+    // interval; if it's very short, then we try again later.
+    //
+    if (elapsed*1000.0 >= (ThreadAdjustmentInterval/2))
+    {
+        ThreadCounter::Counts currentCounts = WorkerCounter.GetCleanCounts();
+
+        // Update may also change ThreadAdjustmentInterval, which is passed by address.
+        int newMax = HillClimbingInstance.Update(
+            currentCounts.MaxWorking, 
+            elapsed, 
+            numCompletions,
+            &ThreadAdjustmentInterval);
+
+        // Compare-exchange loop that installs newMax as MaxWorking, unless a concurrent
+        // update already raised the maximum at least that far.
+        while (newMax != currentCounts.MaxWorking)
+        {
+            ThreadCounter::Counts newCounts = currentCounts;
+            newCounts.MaxWorking = newMax;
+
+            ThreadCounter::Counts oldCounts = WorkerCounter.CompareExchangeCounts(newCounts, currentCounts);
+            if (oldCounts == currentCounts)
+            {
+                //
+                // If we're increasing the max, inject a thread.  If that thread finds work, it will inject
+                // another thread, etc., until nobody finds work or we reach the new maximum.
+                //
+                // If we're reducing the max, whichever threads notice this first will retire themselves.
+                //
+                if (newMax > oldCounts.MaxWorking)
+                    MaybeAddWorkingWorker();
+
+                break;
+            }
+            else
+            {
+                // we failed - maybe try again
+                if (oldCounts.MaxWorking > currentCounts.MaxWorking &&
+                    oldCounts.MaxWorking >= newMax)
+                {
+                    // someone (probably the gate thread) increased the thread count more than
+                    // we are about to do.  Don't interfere.
+                    break;
+                }
+
+                currentCounts = oldCounts;
+            }
+        }
+
+        // Start the next sample from here.
+        PriorCompletedWorkRequests = totalNumCompletions;
+        PriorCompletedWorkRequestsTime = currentTicks;
+        NextCompletedWorkRequestsTime = PriorCompletedWorkRequestsTime + ThreadAdjustmentInterval;
+        CurrentSampleStartTime = endTime;
+    }
+}
+
+
+//
+// Tries to raise the number of working worker threads by one, without exceeding MaxWorking.
+// The counts are updated first with a compare-exchange; the difference between the old and new
+// counts then determines whether to release a retired thread, release a waiting thread, or create a
+// new one.  If thread creation fails, the counts are rolled back.
+//
+void ThreadpoolMgr::MaybeAddWorkingWorker()
+{
+    CONTRACTL
+    {
+        NOTHROW;
+        if (GetThread()) { GC_TRIGGERS;} else {DISABLED(GC_NOTRIGGER);}
+        MODE_ANY;
+    }
+    CONTRACTL_END;
+
+    _ASSERTE(!CLRThreadpoolHosted());
+
+    ThreadCounter::Counts counts = WorkerCounter.GetCleanCounts();
+    ThreadCounter::Counts newCounts;
+    while (true)
+    {
+        newCounts = counts;
+        // NumWorking grows by at most one, never beyond MaxWorking, and never shrinks here.
+        newCounts.NumWorking = max(counts.NumWorking, min(counts.NumWorking + 1, counts.MaxWorking));
+        // NumActive must be at least NumWorking.
+        newCounts.NumActive = max(counts.NumActive, newCounts.NumWorking);
+        // Any increase in NumActive is taken from the retired threads first.
+        newCounts.NumRetired = max(0, counts.NumRetired - (newCounts.NumActive - counts.NumActive));
+
+        // Nothing would change (already at the maximum), so there is nothing to do.
+        if (newCounts == counts)
+            return;
+
+        ThreadCounter::Counts oldCounts = WorkerCounter.CompareExchangeCounts(newCounts, counts);
+
+        if (oldCounts == counts)
+            break;
+
+        counts = oldCounts;
+    }
+
+    // Translate the count deltas into actions: wake a retired thread, create a thread,
+    // or release an already-active thread waiting on WorkerSemaphore.
+    int toUnretire = counts.NumRetired - newCounts.NumRetired;
+    int toCreate = (newCounts.NumActive - counts.NumActive) - toUnretire;
+    int toRelease = (newCounts.NumWorking - counts.NumWorking) - (toUnretire + toCreate);
+
+    _ASSERTE(toUnretire >= 0);
+    _ASSERTE(toCreate >= 0);
+    _ASSERTE(toRelease >= 0);
+    _ASSERTE(toUnretire + toCreate + toRelease <= 1);
+
+    if (toUnretire > 0)
+    {
+        LONG previousCount;
+        // The result is captured only in debug builds, for the assert below.
+        INDEBUG(BOOL success =) RetiredWorkerSemaphore->Release((LONG)toUnretire, &previousCount);            
+        _ASSERTE(success);
+    }
+
+    if (toRelease > 0)
+        WorkerSemaphore->Release(toRelease);
+
+    while (toCreate > 0)
+    {
+        if (CreateWorkerThread())
+        {
+            toCreate--;
+        }
+        else
+        {
+            //
+            // Uh-oh, we promised to create a new thread, but the creation failed.  We have to renege on our
+            // promise.  This may possibly result in no work getting done for a while, but the gate thread will
+            // eventually notice that no completions are happening and force the creation of a new thread.
+            // Of course, there's no guarantee *that* will work - but hopefully enough time will have passed
+            // to allow whoever's using all the memory right now to release some.
+            //
+            counts = WorkerCounter.GetCleanCounts();
+            while (true)
+            {
+                //
+                // If we said we would create a thread, we also said it would be working.  So we need to
+                // decrement both NumWorking and NumActive by the number of threads we will no longer be creating.
+                //
+                newCounts = counts;
+                newCounts.NumWorking -= toCreate;
+                newCounts.NumActive -= toCreate;
+
+                ThreadCounter::Counts oldCounts = WorkerCounter.CompareExchangeCounts(newCounts, counts);
+
+                if (oldCounts == counts)
+                    break;
+
+                counts = oldCounts;
+            }
+
+            // Give up on the remaining creations; the counts have been rolled back.
+            toCreate = 0;
+        }
+    }
+}
+
+//
+// Posts a completion packet so that Function is later invoked for lpOverlapped.
+//
+// When I/O completion is hosted, the request is wrapped in a PostRequest and queued to a worker
+// thread (QUWIPostCompletion).  Otherwise it is posted to GlobalCompletionPort with Function as the
+// completion key.  Returns TRUE on success and FALSE on failure.  When built with FEATURE_PAL this
+// always fails with ERROR_CALL_NOT_IMPLEMENTED.
+//
+BOOL ThreadpoolMgr::PostQueuedCompletionStatus(LPOVERLAPPED lpOverlapped,
+                                      LPOVERLAPPED_COMPLETION_ROUTINE Function)
+{
+    CONTRACTL
+    {
+        THROWS;     // EnsureInitialized can throw OOM
+        GC_TRIGGERS;
+        MODE_ANY;
+    }
+    CONTRACTL_END;
+
+#ifndef FEATURE_PAL
+    EnsureInitialized();
+
+    // if hosted then we need to queue to worker thread, since hosting API doesn't include this method
+    if (CLRIoCompletionHosted())
+    {
+        PostRequestHolder postRequest = MakePostRequest(Function, lpOverlapped);
+        if (postRequest)
+        {
+            // Will execute in the Default AppDomain
+            if (FALSE == QueueUserWorkItem(QUWIPostCompletion, postRequest, QUEUE_ONLY))
+            {
+                // The holder still owns the request on this path (SuppressRelease was not called).
+                return FALSE;
+            }
+            else
+            {
+                // Queued successfully: the request now belongs to QUWIPostCompletion.
+                postRequest.SuppressRelease();    
+                return TRUE;
+            }
+        }
+        else
+            return FALSE;
+    }
+
+    _ASSERTE(GlobalCompletionPort != NULL);
+
+    // Record that the completion-port pool is in use.
+    if (!InitCompletionPortThreadpool)
+        InitCompletionPortThreadpool = TRUE;
+
+    GrowCompletionPortThreadpoolIfNeeded();
+
+    // In order to allow external ETW listeners to correlate activities that use our IO completion port 
+    // as a dispatch mechanism, we have to ensure the runtime's calls to ::PostQueuedCompletionStatus
+    // and ::GetQueuedCompletionStatus are "annotated" with ETW events representing the operations 
+    // performed.
+    // There are currently 4 codepaths that post to the GlobalCompletionPort:
+    // 1. and 2. - the Overlapped drainage events. Those are uninteresting to ETW listeners and 
+    //    currently call the global ::PostQueuedCompletionStatus directly.
+    // 3. the managed API ThreadPool.UnsafeQueueNativeOverlapped(), calling CorPostQueuedCompletionStatus()
+    //    which already fires the ETW event as needed
+    // 4. the managed API ThreadPool.RegisterWaitForSingleObject which needs to fire the ETW event
+    //    at the time the managed API is called (on the original user thread), and not when the ::PQCS
+    //    is called (from the dedicated wait thread).
+    // If additional codepaths appear they need to either fire the ETW event before calling this or ensure
+    // we do not fire an unmatched "dequeue" event in ThreadpoolMgr::CompletionPortThreadStart
+    // The current possible values for Function:
+    //  - CallbackForInitiateDrainageOfCompletionPortQueue and 
+    //    CallbackForContinueDrainageOfCompletionPortQueue for Drainage
+    //  - BindIoCompletionCallbackStub for ThreadPool.UnsafeQueueNativeOverlapped
+    //  - WaitIOCompletionCallback for ThreadPool.RegisterWaitForSingleObject
+
+    // Function travels as the completion key; zero bytes are reported as transferred.
+    return ::PostQueuedCompletionStatus(GlobalCompletionPort,
+                                        0,
+                                        (ULONG_PTR) Function,
+                                        lpOverlapped);
+#else  
+    SetLastError(ERROR_CALL_NOT_IMPLEMENTED);
+    return FALSE;
+#endif // !FEATURE_PAL
+}
+
+
+//
+// Completion routine used for wait callbacks posted through the completion port.
+//
+//   dwErrorCode         - completion status; the callback runs only for ERROR_SUCCESS.
+//   numBytesTransferred - not used.
+//   lpOverlapped        - passed to AsyncCallbackCompletion as its PVOID argument.
+//
+void ThreadpoolMgr::WaitIOCompletionCallback(
+    DWORD dwErrorCode,
+    DWORD numBytesTransferred,
+    LPOVERLAPPED lpOverlapped)
+{
+    CONTRACTL
+    {
+        THROWS;
+        MODE_ANY;
+    }
+    CONTRACTL_END;
+
+    // The return value of AsyncCallbackCompletion is intentionally not used here.
+    if (dwErrorCode == ERROR_SUCCESS)
+        AsyncCallbackCompletion((PVOID)lpOverlapped);
+}
+
+#ifndef FEATURE_PAL
+// We need to make sure that the next job picked up by each completion port thread was
+// inserted into the queue after we started cleanup.  The cleanup starts when a completion
+// port thread processes a special overlapped (overlappedForInitiateCleanup).
+// To do this, we loop through all completion port threads.
+// 1. If a thread is in cooperative mode, it is processing a job now, and the next job
+//    it picks up will be after we start cleanup.
+// 2. A completion port thread may be waiting for a job, or may be about to dispatch a job.
+//    We cannot distinguish these two cases, so we queue a dummy job (overlappedForContinueCleanup)
+//    to the queue after the starting job.
+OVERLAPPED overlappedForInitiateCleanup;
+OVERLAPPED overlappedForContinueCleanup;
+#endif  // !FEATURE_PAL
+
+// Non-zero while a drainage round is in progress: set by
+// CallbackForInitiateDrainageOfCompletionPortQueue and cleared again before that function returns.
+Volatile<ULONG> g_fCompletionPortDrainNeeded = FALSE;
+
+//
+// Completion callback for the "continue drainage" marker packet (overlappedForContinueCleanup).
+// Marks the calling completion-port thread as drained and, while a drainage round is still in
+// progress, re-posts the marker so that another thread can pick it up.
+//
+// None of the three parameters is used; they exist to match the completion-routine signature.
+//
+VOID ThreadpoolMgr::CallbackForContinueDrainageOfCompletionPortQueue(
+    DWORD dwErrorCode,
+    DWORD dwNumberOfBytesTransfered,
+    LPOVERLAPPED lpOverlapped
+    )
+{
+    CONTRACTL
+    {
+        NOTHROW;
+        GC_NOTRIGGER;
+        MODE_PREEMPTIVE;
+    }
+    CONTRACTL_END;
+
+#ifndef FEATURE_PAL
+    CounterHolder hldNumCPIT(&NumCPInfrastructureThreads);
+
+    // It is OK if this overlapped is from a previous round.
+    // We have started a new round.  The next job picked by this thread is
+    // going to be after the marker.
+    Thread* pThread = GetThread();
+    if (pThread && !pThread->IsCompletionPortDrained())
+    {
+        pThread->MarkCompletionPortDrained();
+    }
+    if (g_fCompletionPortDrainNeeded)
+    {
+        ::PostQueuedCompletionStatus(GlobalCompletionPort,
+                                             0,
+                                             (ULONG_PTR)CallbackForContinueDrainageOfCompletionPortQueue,
+                                             &overlappedForContinueCleanup);
+        // IO Completion port thread is LIFO queue.  We want our special packet to be picked up by a different thread.
+        // GetThread() may have returned NULL (it is null-checked above), so the drained flag can only
+        // be polled when a Thread object exists; without one there is nothing to wait on.
+        while (g_fCompletionPortDrainNeeded && pThread != NULL && pThread->IsCompletionPortDrained())
+        {
+            __SwitchToThread(100, CALLER_LIMITS_SPINNING);
+        }
+    }
+#endif // !FEATURE_PAL    
+}
+
+
+//
+// Completion callback for the "initiate drainage" marker packet (overlappedForInitiateCleanup).
+// Starts a drainage round: clears the drained mark on every completion-port thread, raises
+// g_fCompletionPortDrainNeeded, then polls until every other live completion-port thread is marked
+// drained or the retry budget runs out.  Finally clears the flag and reports the outcome to
+// OverlappedDataObject::FinishCleanup.
+//
+// None of the three parameters is used; they exist to match the completion-routine signature.
+//
+VOID
+ThreadpoolMgr::CallbackForInitiateDrainageOfCompletionPortQueue(
+    DWORD dwErrorCode,
+    DWORD dwNumberOfBytesTransfered,
+    LPOVERLAPPED lpOverlapped
+    )
+{
+ #ifndef FEATURE_PAL
+    CONTRACTL
+    {
+        NOTHROW;
+        MODE_ANY;
+    }
+    CONTRACTL_END;
+
+    CounterHolder hldNumCPIT(&NumCPInfrastructureThreads);
+    {
+        // New round: under the thread store lock, reset the drained mark on all completion-port threads.
+        ThreadStoreLockHolder tsl;
+        Thread *pThread = NULL;
+        while ((pThread = ThreadStore::GetAllThreadList(pThread, Thread::TS_CompletionPortThread, Thread::TS_CompletionPortThread)) != NULL)
+        {
+            pThread->UnmarkCompletionPortDrained();
+        }
+    }
+
+    FastInterlockOr(&g_fCompletionPortDrainNeeded, 1);
+
+    // Wake up retiring CP Threads so it can mark its status.
+    ThreadCounter::Counts counts = CPThreadCounter.GetCleanCounts();
+    if (counts.NumRetired > 0)
+        RetiredCPWakeupEvent->Set();
+
+    DWORD nTry = 0;                 // number of polling passes that found undrained threads
+    BOOL fTryNextTime = FALSE;      // TRUE if we gave up before every thread was drained
+    BOOL fMore = TRUE;              // TRUE while some thread is still not marked drained
+    BOOL fFirstTime = TRUE;         // marker packets are posted only during the first pass
+    while (fMore)
+    {
+        fMore = FALSE;
+        Thread *pCurThread = GetThread();
+        Thread *pThread = NULL;
+        {
+
+            ThreadStoreLockHolder tsl;
+
+            ::FlushProcessWriteBuffers();
+
+            while ((pThread = ThreadStore::GetAllThreadList(pThread, Thread::TS_CompletionPortThread, Thread::TS_CompletionPortThread)) != NULL)
+            {
+                // Skip ourselves, dead threads, and threads already marked drained.
+                if (pThread == pCurThread || pThread->IsDead() || pThread->IsCompletionPortDrained())
+                {
+                    continue;
+                }
+
+                if (pThread->PreemptiveGCDisabledOther() || pThread->GetFrame() != FRAME_TOP)
+                {
+                    // The thread is processing an IO job now.  When it picks up next job, the job
+                    // will be after the marker.
+                    pThread->MarkCompletionPortDrained();
+                }
+                else
+                {
+                    // The thread may be idle or about to dispatch; post one marker packet per such
+                    // thread on the first pass and keep polling until it is marked drained.
+                    if (fFirstTime)
+                    {
+                        ::PostQueuedCompletionStatus(GlobalCompletionPort,
+                                                             0,
+                                                             (ULONG_PTR)CallbackForContinueDrainageOfCompletionPortQueue,
+                                                             &overlappedForContinueCleanup);
+                    }
+                    fMore = TRUE;
+                }
+            }
+        }
+        if (fMore)
+        {
+            __SwitchToThread(10, CALLER_LIMITS_SPINNING);
+            nTry ++;
+            // Give up after more than 1000 passes; the incomplete round is reported to FinishCleanup below.
+            if (nTry > 1000)
+            {
+                fTryNextTime = TRUE;
+                break;
+            }
+        }
+        fFirstTime = FALSE;
+    }
+
+    // Round is over (successfully or not): stop the continue-callbacks from re-posting and waiting.
+    FastInterlockAnd(&g_fCompletionPortDrainNeeded, 0);
+    OverlappedDataObject::FinishCleanup(!fTryNextTime);
+#endif // !FEATURE_PAL
+}
+
+// Defined elsewhere; receives every completion that is not one of the drainage markers.
+extern void WINAPI BindIoCompletionCallbackStub(DWORD ErrorCode,
+                                            DWORD numBytesTransferred,
+                                            LPOVERLAPPED lpOverlapped);
+
+// Routes a completion to the right handler based on the identity of lpOverlapped:
+// the two drainage marker overlappeds go to the matching ThreadpoolMgr drainage callback,
+// anything else goes to BindIoCompletionCallbackStub.  Does nothing when built with FEATURE_PAL.
+void HostIOCompletionCallback(
+    DWORD ErrorCode,
+    DWORD numBytesTransferred,
+    LPOVERLAPPED lpOverlapped)
+{
+#ifndef FEATURE_PAL
+    if (lpOverlapped == &overlappedForInitiateCleanup)
+    {
+        ThreadpoolMgr::CallbackForInitiateDrainageOfCompletionPortQueue(ErrorCode, numBytesTransferred, lpOverlapped);
+        return;
+    }
+
+    if (lpOverlapped == &overlappedForContinueCleanup)
+    {
+        ThreadpoolMgr::CallbackForContinueDrainageOfCompletionPortQueue(ErrorCode, numBytesTransferred, lpOverlapped);
+        return;
+    }
+
+    // Ordinary completion.
+    BindIoCompletionCallbackStub(ErrorCode, numBytesTransferred, lpOverlapped);
+#endif // !FEATURE_PAL
+}
+
+// Starts a drainage round by posting the "initiate drainage" marker packet to GlobalCompletionPort.
+// Returns the result of ::PostQueuedCompletionStatus, or FALSE when there is no completion port
+// (or when built with FEATURE_PAL).
+BOOL ThreadpoolMgr::DrainCompletionPortQueue()
+{
+#ifndef FEATURE_PAL
+    CONTRACTL
+    {
+        NOTHROW;
+        GC_TRIGGERS;
+        MODE_ANY;
+    }
+    CONTRACTL_END;
+
+    if (GlobalCompletionPort != 0)
+    {
+        return ::PostQueuedCompletionStatus(GlobalCompletionPort,
+                                            0,
+                                            (ULONG_PTR)CallbackForInitiateDrainageOfCompletionPortQueue,
+                                            &overlappedForInitiateCleanup);
+    }
+#endif // !FEATURE_PAL
+
+    // No completion port to drain.
+    return FALSE;
+}
+
+
+//
+// Work-item entry point used by PostQueuedCompletionStatus when I/O completion is hosted.
+//
+//   pArgs - a PostRequest* whose ownership was handed over by the queuing code.
+//
+// Invokes the stored completion routine with the stored arguments, returns the PostRequest to
+// the recycle list, and returns ERROR_SUCCESS.  An exception from the routine is swallowed or
+// rethrown according to SwallowUnhandledExceptions().
+//
+DWORD __stdcall ThreadpoolMgr::QUWIPostCompletion(PVOID pArgs)
+{
+    CONTRACTL
+    {
+        THROWS;
+        GC_TRIGGERS;
+        MODE_ANY;
+        SO_INTOLERANT;
+    }
+    CONTRACTL_END;
+
+    PostRequest* postRequest = (PostRequest*) pArgs;
+
+    EX_TRY
+    {
+        (postRequest->Function)(postRequest->errorCode, postRequest->numBytesTransferred, postRequest->lpOverlapped);
+    }
+    EX_CATCH
+    {
+        RecycleMemory( postRequest, MEMTYPE_PostRequest );
+        postRequest = NULL;     // already recycled; must not be recycled again below
+        if (!SwallowUnhandledExceptions())
+            EX_RETHROW;
+    }
+    EX_END_CATCH(SwallowAllExceptions);
+
+    // This function owns the request, so it must also be recycled when the callback completes
+    // normally; previously only the exception path released it.
+    if (postRequest != NULL)
+        RecycleMemory( postRequest, MEMTYPE_PostRequest );
+
+    return ERROR_SUCCESS;
+
+}
+
+
+// Makes sure the gate thread is running, or has a pending request to keep running.
+// Takes no parameters.  Loops on GateThreadStatus until one of these holds:
+//  - the status is already REQUESTED (nothing to do), or
+//  - this thread moved the status from NOT_RUNNING to REQUESTED and attempted to create the gate thread.
+// A WAITING_FOR_REQUEST status is flipped to REQUESTED and then re-examined on the next iteration.
+void ThreadpoolMgr::EnsureGateThreadRunning()
+{
+    LIMITED_METHOD_CONTRACT;
+
+    // The gate thread is only needed if the CLR is providing part of the ThreadPool implementation.
+    _ASSERTE(!CLRThreadpoolHosted() || !CLRIoCompletionHosted());
+
+    while (true)
+    {
+        switch (GateThreadStatus)
+        {
+        case GATE_THREAD_STATUS_REQUESTED:
+            //
+            // No action needed; the gate thread is running, and someone else has already registered a request
+            // for it to stay.
+            //
+            return;
+
+        case GATE_THREAD_STATUS_WAITING_FOR_REQUEST:
+            //
+            // Prevent the gate thread from exiting, if it hasn't already done so.  If it has, we'll create it on the next iteration of
+            // this loop.
+            //
+            FastInterlockCompareExchange(&GateThreadStatus, GATE_THREAD_STATUS_REQUESTED, GATE_THREAD_STATUS_WAITING_FOR_REQUEST);
+            break;
+
+        case GATE_THREAD_STATUS_NOT_RUNNING:
+            //
+            // We need to create a new gate thread
+            //
+            // Only the thread that wins this compare-exchange creates the gate thread; losers loop again.
+            if (FastInterlockCompareExchange(&GateThreadStatus, GATE_THREAD_STATUS_REQUESTED, GATE_THREAD_STATUS_NOT_RUNNING) == GATE_THREAD_STATUS_NOT_RUNNING)
+            {
+                if (!CreateGateThread()) 
+                {
+                    //
+                    // If we failed to create the gate thread, someone else will need to try again later.
+                    //
+                    GateThreadStatus = GATE_THREAD_STATUS_NOT_RUNNING;
+                }
+                return;
+            }
+            break;
+
+        default:
+            // NOTE(review): if _ASSERTE compiles to nothing in some builds, an unexpected status value
+            // would make this loop spin without exiting - confirm.
+            _ASSERTE(!"Invalid value of ThreadpoolMgr::GateThreadStatus");
+        }
+    }
+
+    return;
+}
+
+
+//
+// Decides whether the gate thread should keep running.
+// Returns false only after GateThreadStatus has been moved to GATE_THREAD_STATUS_NOT_RUNNING.
+// Returns true otherwise, leaving the status as WAITING_FOR_REQUEST or REQUESTED.
+//
+bool ThreadpoolMgr::ShouldGateThreadKeepRunning()
+{
+    LIMITED_METHOD_CONTRACT;
+
+    // The gate thread is only needed if the CLR is providing part of the ThreadPool implementation.
+    _ASSERTE(!CLRThreadpoolHosted() || !CLRIoCompletionHosted());
+
+    _ASSERTE(GateThreadStatus == GATE_THREAD_STATUS_WAITING_FOR_REQUEST ||
+             GateThreadStatus == GATE_THREAD_STATUS_REQUESTED);
+
+    //
+    // Switch to WAITING_FOR_REQUEST, and see if we had a request since the last check.
+    //
+    LONG previousStatus = FastInterlockExchange(&GateThreadStatus, GATE_THREAD_STATUS_WAITING_FOR_REQUEST);
+
+    if (previousStatus == GATE_THREAD_STATUS_WAITING_FOR_REQUEST)
+    {
+        //
+        // No recent requests for the gate thread.  Check to see if we're still needed.
+        //
+
+        //
+        // Are there any free threads in the I/O completion pool?  If there are, we don't need a gate thread.
+        // This implies that whenever we decrement NumFreeCPThreads to 0, we need to call EnsureGateThreadRunning().
+        //
+        ThreadCounter::Counts counts = CPThreadCounter.GetCleanCounts();
+        bool needGateThreadForCompletionPort = 
+            InitCompletionPortThreadpool &&
+            (counts.NumActive - counts.NumWorking) <= 0;
+
+        //
+        // Are there any work requests in any worker queue?  If so, we need a gate thread.
+        // This implies that whenever a work queue goes from empty to non-empty, we need to call EnsureGateThreadRunning().
+        //
+        bool needGateThreadForWorkerThreads = 
+            !CLRThreadpoolHosted() &&
+            PerAppDomainTPCountList::AreRequestsPendingInAnyAppDomains();
+
+        //
+        // If worker tracking is enabled, we need to fire periodic ETW events with active worker counts.  This is
+        // done by the gate thread.
+        // We don't have to do anything special with EnsureGateThreadRunning() here, because this is only needed
+        // once work has been added to the queue for the first time (which is covered above).
+        //
+        bool needGateThreadForWorkerTracking = 
+            0 != CLRConfig::GetConfigValue(CLRConfig::INTERNAL_ThreadPool_EnableWorkerTracking);
+
+        if (!(needGateThreadForCompletionPort || 
+              needGateThreadForWorkerThreads ||
+              needGateThreadForWorkerTracking))
+        {
+            //
+            // It looks like we shouldn't be running.  But another thread may now tell us to run.  If so, they will set GateThreadStatus
+            // back to GATE_THREAD_STATUS_REQUESTED.
+            //
+            // The compare-exchange succeeds only if nobody requested the gate thread in the meantime.
+            previousStatus = FastInterlockCompareExchange(&GateThreadStatus, GATE_THREAD_STATUS_NOT_RUNNING, GATE_THREAD_STATUS_WAITING_FOR_REQUEST);
+            if (previousStatus == GATE_THREAD_STATUS_WAITING_FOR_REQUEST)
+                return false;
+        }
+    }
+
+
+    _ASSERTE(GateThreadStatus == GATE_THREAD_STATUS_WAITING_FOR_REQUEST ||
+             GateThreadStatus == GATE_THREAD_STATUS_REQUESTED);
+    return true;
+}
+
+
+
+//************************************************************************
+// Forwards workRequest to AppendWorkRequest.  Declared NOTHROW / GC_NOTRIGGER.
+void ThreadpoolMgr::EnqueueWorkRequest(WorkRequest* workRequest)
+{
+    CONTRACTL
+    {
+        NOTHROW;
+        MODE_ANY;
+        GC_NOTRIGGER;
+    }
+    CONTRACTL_END;
+
+    AppendWorkRequest(workRequest);
+}
+
+// Returns the result of RemoveWorkRequest.  The contract's postcondition allows a NULL result (NULL_OK).
+WorkRequest* ThreadpoolMgr::DequeueWorkRequest()
+{
+    // Declared before the contract because the POSTCONDITION below refers to it.
+    WorkRequest* entry = NULL;
+    CONTRACT(WorkRequest*)
+    {
+        NOTHROW;
+        GC_NOTRIGGER;
+        MODE_PREEMPTIVE;
+
+        POSTCONDITION(CheckPointer(entry, NULL_OK));
+    } CONTRACT_END;
+
+    entry = RemoveWorkRequest();
+
+    RETURN entry;
+}
+
+// Work-item entry point that QueueUserWorkItem hands to a host thread-pool provider for
+// managed (non-unmanaged) requests.  Runs one ExecuteWorkRequest pass under a ThreadLocaleHolder.
+// pArg is not used.  Always returns ERROR_SUCCESS; the foundWork / wasNotRecalled results are ignored.
+DWORD WINAPI ThreadpoolMgr::ExecuteHostRequest(PVOID pArg)
+{
+    CONTRACTL
+    {
+        THROWS;
+        GC_TRIGGERS;
+        MODE_ANY;
+    }
+    CONTRACTL_END;
+
+    ThreadLocaleHolder localeHolder;
+
+    // Out-parameters required by ExecuteWorkRequest; their values are not consumed here.
+    bool foundWork, wasNotRecalled;
+    ExecuteWorkRequest(&foundWork, &wasNotRecalled);
+    return ERROR_SUCCESS;
+}
+
+// Picks the work source that should be serviced next and dispatches one work item from it.
+//
+//   foundWork      - [out] false when no source was selected; otherwise set by DispatchWorkItem.
+//   wasNotRecalled - [out] true when no source was selected; otherwise set by DispatchWorkItem.
+void ThreadpoolMgr::ExecuteWorkRequest(bool* foundWork, bool* wasNotRecalled)
+{
+    CONTRACTL
+    {
+        THROWS;     // QueueUserWorkItem can throw
+        GC_TRIGGERS;
+        MODE_ANY;
+    }
+    CONTRACTL_END;
+
+    LONG index = PerAppDomainTPCountList::GetAppDomainIndexForThreadpoolDispatch();
+
+    // Index 0: there is nothing to dispatch.
+    if (index == 0)
+    {
+        *foundWork = false;
+        *wasNotRecalled = true;
+        return;
+    }
+
+    // Only managed callbacks come this way under a host.  Since we got here, at least one
+    // managed request was created, which means at least one app domain exists; so the
+    // unmanaged index (-1) is redirected to index 1.
+    if (IsThreadPoolHosted() && index == -1)
+    {
+        index = 1;
+    }
+
+    IPerAppDomainTPCount* pAdCount;
+    if (index != -1)
+    {
+        pAdCount = PerAppDomainTPCountList::GetPerAppdomainCount(TPIndex((DWORD)index));
+        _ASSERTE(pAdCount);
+    }
+    else
+    {
+        // -1 selects the unmanaged thread-pool queue.
+        pAdCount = PerAppDomainTPCountList::GetUnmanagedTPCount();
+    }
+
+    pAdCount->DispatchWorkItem(foundWork, wasNotRecalled);
+}
+
+//--------------------------------------------------------------------------
+// Informs the thread scheduler that the first request has been queued on an
+// appdomain, or that this is the first unmanaged TP request.
+// Arguments:
+//         UnmanagedTP: TRUE if the request comes from the unmanaged part of
+//                      the thread pool; FALSE to use the current thread's
+//                      appdomain.
+// Return value:
+//         Always FALSE.
+// Assumptions:
+//         This function must be called under a per-appdomain lock or the
+//         correct lock under unmanaged TP queue.
+//
+BOOL ThreadpoolMgr::SetAppDomainRequestsActive(BOOL UnmanagedTP)
+{
+    CONTRACTL
+    {
+        NOTHROW;
+        MODE_ANY;
+        GC_TRIGGERS;
+        SO_INTOLERANT;
+    }
+    CONTRACTL_END;
+
+    IPerAppDomainTPCount* pAdCount;
+
+    if (!UnmanagedTP)
+    {
+        // Managed request: look up the counter of the current thread's appdomain.
+        Thread* pCurThread = GetThread();
+        _ASSERTE( pCurThread);
+
+        AppDomain* pAppDomain = pCurThread->GetDomain();
+        _ASSERTE(pAppDomain);
+
+        TPIndex tpindex = pAppDomain->GetTPIndex();
+        pAdCount = PerAppDomainTPCountList::GetPerAppdomainCount(tpindex);
+    }
+    else
+    {
+        pAdCount = PerAppDomainTPCountList::GetUnmanagedTPCount();
+    }
+
+    _ASSERTE(pAdCount);
+
+    pAdCount->SetAppDomainRequestsActive();
+
+    // No event ever needs to be signalled by the caller.
+    return FALSE;
+}
+
+//--------------------------------------------------------------------------
+// Informs the thread scheduler that the last request has been dequeued on an
+// appdomain, or that this was the last unmanaged TP request.
+// Arguments:
+//         UnmanagedTP: TRUE if the request comes from the unmanaged part of
+//                      the thread pool.
+//         AdUnloading: when TRUE (and UnmanagedTP is FALSE), the appdomain is
+//                      identified by id instead of by the current thread.
+//         id:          the id of the appdomain.  The id is needed as this
+//                      function can be called (indirectly) from the appdomain
+//                      unload thread from unmanaged code to clear
+//                      per-appdomain state during rude unload.
+// Assumptions:
+//         This function must be called under a per-appdomain lock or the
+//         correct lock under unmanaged TP queue.
+//
+void ThreadpoolMgr::ClearAppDomainRequestsActive(BOOL UnmanagedTP, BOOL AdUnloading, LONG id)
+{
+    CONTRACTL
+    {
+        NOTHROW;
+        MODE_ANY;
+        GC_TRIGGERS;
+        SO_INTOLERANT;
+    }
+    CONTRACTL_END;
+
+    IPerAppDomainTPCount* pAdCount;
+
+    if (UnmanagedTP)
+    {
+        pAdCount = PerAppDomainTPCountList::GetUnmanagedTPCount();
+    }
+    else if (AdUnloading)
+    {
+        // The current thread may not be in the target appdomain, so use the supplied id.
+        pAdCount = PerAppDomainTPCountList::GetPerAppdomainCount(TPIndex(id));
+    }
+    else
+    {
+        Thread* pCurThread = GetThread();
+        _ASSERTE( pCurThread);
+
+        AppDomain* pAppDomain = pCurThread->GetDomain();
+        _ASSERTE(pAppDomain);
+
+        TPIndex tpindex = pAppDomain->GetTPIndex();
+
+        pAdCount = PerAppDomainTPCountList::GetPerAppdomainCount(tpindex);
+    }
+
+    _ASSERTE(pAdCount);
+
+    pAdCount->ClearAppDomainRequestsActive();
+}
+
+
+// Hands out a block for the requested memory type. A block from the matching
+// recycle list is preferred; if the lists are not initialized or the list has
+// nothing to give, a fresh object of that type is allocated with new.
+LPVOID ThreadpoolMgr::GetRecycledMemory(enum MemType memType)
+{
+    LPVOID result = NULL;
+    CONTRACT(LPVOID)
+    {
+        THROWS;
+        GC_NOTRIGGER;
+        MODE_ANY;
+        INJECT_FAULT(COMPlusThrowOM());
+        POSTCONDITION(CheckPointer(result));
+    } CONTRACT_END;
+
+    // First choice: reuse a previously recycled block.
+    if (RecycledLists.IsInitialized())
+    {
+        result = RecycledLists.GetRecycleMemoryInfo( memType ).Remove();
+    }
+
+    if (result != NULL)
+    {
+        RETURN result;
+    }
+
+    // Nothing to reuse, so allocate a new object of the requested type.
+    switch (memType)
+    {
+        case MEMTYPE_DelegateInfo:
+            result = new DelegateInfo;
+            break;
+
+        case MEMTYPE_AsyncCallback:
+            result = new AsyncCallback;
+            break;
+
+        case MEMTYPE_WorkRequest:
+            result = new WorkRequest;
+            break;
+
+        case MEMTYPE_PostRequest:
+            result = new PostRequest;
+            break;
+
+        default:
+            // result stays NULL for an unrecognized type
+            _ASSERTE(!"Unknown Memtype");
+            break;
+    }
+
+    RETURN result;
+}
+
+// Gives a block back. It is placed on the recycle list for its type when the
+// lists are initialized and that list accepts another entry; otherwise the
+// block is deleted as an object of the type named by memType.
+void ThreadpoolMgr::RecycleMemory(LPVOID mem, enum MemType memType)
+{
+    CONTRACTL
+    {
+        NOTHROW;
+        GC_NOTRIGGER;
+        SO_TOLERANT;
+        MODE_ANY;
+    }
+    CONTRACTL_END;
+
+    if (RecycledLists.IsInitialized())
+    {
+        RecycledListInfo& recycleList = RecycledLists.GetRecycleMemoryInfo( memType );
+
+        if (recycleList.CanInsert())
+        {
+            recycleList.Insert( mem );
+            return;
+        }
+    }
+
+    // Could not recycle: delete through the concrete type.
+    if (memType == MEMTYPE_DelegateInfo)
+    {
+        delete (DelegateInfo*) mem;
+    }
+    else if (memType == MEMTYPE_AsyncCallback)
+    {
+        delete (AsyncCallback*) mem;
+    }
+    else if (memType == MEMTYPE_WorkRequest)
+    {
+        delete (WorkRequest*) mem;
+    }
+    else if (memType == MEMTYPE_PostRequest)
+    {
+        delete (PostRequest*) mem;
+    }
+    else
+    {
+        _ASSERTE(!"Unknown Memtype");
+    }
+}
+
+#define THROTTLE_RATE  0.10 /* rate by which the delay is increased as the number of threads increases */
+
+// Thread entry-point shim: it moves the stack by a varying amount and then
+// calls the real thread routine. This is to avoid the 64KB/1MB aliasing
+// problem present on Pentium 4 processors, which can significantly impact
+// performance with HyperThreading enabled.
+//   arg: an intermediateThreadParam allocated with new; it is deleted here.
+//   Returns whatever the real thread routine returns.
+DWORD __stdcall ThreadpoolMgr::intermediateThreadProc(PVOID arg)
+{
+    WRAPPER_NO_CONTRACT;
+    STATIC_CONTRACT_SO_INTOLERANT;
+
+    // Step the offset counter, starting over once the offset would exceed a page.
+    offset_counter++;
+    if (offset_counter * offset_multiplier > PAGE_SIZE)
+        offset_counter = 0;
+
+    // The allocation is never used; it only displaces the rest of this thread's stack.
+    (void)_alloca(offset_counter * offset_multiplier);
+
+    // Copy out the real start routine and its argument before freeing the parameter block.
+    intermediateThreadParam* pShimParam = (intermediateThreadParam*)arg;
+    LPTHREAD_START_ROUTINE pfnRealStart = pShimParam->lpThreadFunction;
+    PVOID pRealArg = pShimParam->lpArg;
+    delete pShimParam;
+
+    return pfnRealStart(pRealArg);
+}
+
+// Creates a thread that will run lpStartAddress(lpArgs), making sure the new
+// thread is not created under the caller's impersonation.
+//   pIsCLRThread: receives TRUE if the EE has started (the result is then a
+//                 Thread*), FALSE otherwise (the result is then really an OS
+//                 thread HANDLE, created suspended, cast to Thread*).
+//   Returns NULL on failure.
+Thread* ThreadpoolMgr::CreateUnimpersonatedThread(LPTHREAD_START_ROUTINE lpStartAddress, LPVOID lpArgs, BOOL *pIsCLRThread)
+{
+    STATIC_CONTRACT_NOTHROW;
+    if (GetThread()) { STATIC_CONTRACT_GC_TRIGGERS;} else {DISABLED(STATIC_CONTRACT_GC_NOTRIGGER);}
+    STATIC_CONTRACT_MODE_ANY;
+    /* cannot use contract because of SEH
+    CONTRACTL
+    {
+        NOTHROW;
+        GC_NOTRIGGER;
+        MODE_ANY;
+    }
+    CONTRACTL_END;*/
+
+    *pIsCLRThread = g_fEEStarted ? TRUE : FALSE;
+
+    if (*pIsCLRThread)
+    {
+        // EE is running: go through a Thread object.
+        Thread* pNewThread = NULL;
+
+        EX_TRY
+        {
+            pNewThread = SetupUnstartedThread();
+        }
+        EX_CATCH
+        {
+            pNewThread = NULL;
+        }
+        EX_END_CATCH(SwallowAllExceptions);
+
+        if (pNewThread == NULL)
+            return NULL;
+
+        // CreateNewThread takes care of reverting any impersonation - so dont do anything here.
+        BOOL fCreated = pNewThread->CreateNewThread(0,              // default stack size
+                                                    lpStartAddress,
+                                                    lpArgs);        // arguments
+        if (!fCreated)
+        {
+            pNewThread->DecExternalCount(FALSE);
+            return NULL;
+        }
+
+        return pNewThread;
+    }
+
+    // EE not started: create a raw OS thread that enters through intermediateThreadProc.
+    HANDLE hNewThread = NULL;
+    {
+#ifndef FEATURE_PAL
+        ThreadAffinityHolder affinityHolder(FALSE);
+        HandleHolder token;
+        BOOL bReverted = FALSE;
+        if (RevertIfImpersonated(&bReverted, &token, &affinityHolder) != TRUE)
+            return NULL;
+#endif // !FEATURE_PAL 
+        NewHolder<intermediateThreadParam> pShimArgs(new (nothrow) intermediateThreadParam);
+        if (pShimArgs != NULL)
+        {
+            DWORD threadId;
+
+            pShimArgs->lpThreadFunction = lpStartAddress;
+            pShimArgs->lpArg = lpArgs;
+            hNewThread = CreateThread(NULL,               // security descriptor
+                                      0,                  // default stack size
+                                      intermediateThreadProc,
+                                      pShimArgs,          // arguments
+                                      CREATE_SUSPENDED,
+                                      &threadId);
+
+            // Once the thread exists, intermediateThreadProc is the one that deletes the block.
+            if (hNewThread != NULL)
+                pShimArgs.SuppressRelease();
+        }
+#ifndef FEATURE_PAL
+        UndoRevert(bReverted, token);
+#endif // !FEATURE_PAL 
+    }
+
+    return (Thread*)hNewThread;
+}
+
+
+// Creates one worker thread running WorkerThreadStart and sets it going.
+// Returns TRUE if the thread was created, FALSE otherwise.
+BOOL ThreadpoolMgr::CreateWorkerThread()
+{
+    CONTRACTL
+    {
+        if (GetThread()) { GC_TRIGGERS;} else {DISABLED(GC_NOTRIGGER);}
+        NOTHROW;
+        MODE_ANY;   // We may try to add a worker thread while queuing a work item thru an fcall
+    }
+    CONTRACTL_END;
+
+    BOOL fIsCLRThread;
+    Thread *pNewThread = CreateUnimpersonatedThread(WorkerThreadStart, NULL, &fIsCLRThread);
+
+    if (pNewThread == NULL)
+        return FALSE;
+
+    if (!fIsCLRThread)
+    {
+        // In this case the "Thread*" is really an OS thread handle that was created suspended.
+        HANDLE hNewThread = (HANDLE)pNewThread;
+        DWORD resumeResult;
+        resumeResult = ResumeThread(hNewThread);
+        _ASSERTE(resumeResult != (DWORD) (-1));
+        CloseHandle(hNewThread);          // we don't need this anymore
+    }
+    else
+    {
+        pNewThread->ChooseThreadCPUGroupAffinity();
+        pNewThread->StartThread();
+    }
+
+    return TRUE;
+}
+
+
+DWORD __stdcall ThreadpoolMgr::WorkerThreadStart(LPVOID lpArgs) // Entry point of a thread pool worker thread; lpArgs is not used in this function. Always returns ERROR_SUCCESS.
+{
+    ClrFlsSetThreadType (ThreadType_Threadpool_Worker);
+    // Overall flow: Work (execute requests) -> Retire or WaitForWork (block on a semaphore) -> back to Work when signalled, or Exit after a timeout with no I/O pending.
+    CONTRACTL
+    {
+        THROWS;
+        GC_TRIGGERS;
+        MODE_PREEMPTIVE;
+        SO_INTOLERANT;
+    }
+    CONTRACTL_END;
+
+    _ASSERTE(!CLRThreadpoolHosted());
+
+    Thread *pThread = NULL;
+    DWORD dwSwitchCount = 0;
+    BOOL fThreadInit = FALSE; // becomes TRUE once the managed Thread has been set up (only possible after g_fEEStarted)
+
+    ThreadCounter::Counts counts, oldCounts, newCounts;
+    bool foundWork = true, wasNotRecalled = true; // both are written by ExecuteWorkRequest; foundWork starts out true so the first pass tries to execute work
+
+    counts = WorkerCounter.GetCleanCounts();
+    FireEtwThreadPoolWorkerThreadStart(counts.NumActive, counts.NumRetired, GetClrInstanceId());
+
+#ifdef FEATURE_COMINTEROP
+    BOOL fCoInited = FALSE;
+    // Threadpool threads should be initialized as MTA. If we are unable to do so,
+    // return failure.
+    {
+        fCoInited = SUCCEEDED(::CoInitializeEx(NULL, COINIT_MULTITHREADED));
+        if (!fCoInited)
+        {
+            goto Exit; // NOTE(review): unlike the SetApartment failure path below, this exit does not decrement NumActive/NumWorking in WorkerCounter - confirm this is intended
+        }
+    }
+#endif // FEATURE_COMINTEROP
+Work:
+
+    if (!fThreadInit) {
+        if (g_fEEStarted) {
+            pThread = SetupThreadNoThrow();
+            if (pThread == NULL) {
+                __SwitchToThread(0, ++dwSwitchCount); // setup failed: yield and try again (there is no retry limit)
+                goto Work;
+            }
+
+            // converted to CLRThread and added to ThreadStore, pick a group affinity for this thread
+            pThread->ChooseThreadCPUGroupAffinity(); 
+
+            #ifdef FEATURE_COMINTEROP
+            if (pThread->SetApartment(Thread::AS_InMTA, TRUE) != Thread::AS_InMTA)
+            {
+                counts = WorkerCounter.GetCleanCounts(); // could not become MTA: remove this thread from the active/working counts, then exit
+                while (true) // compare-exchange retry loop: repeat until the update is applied to the counts it was computed from
+                {
+                    newCounts = counts;
+                    newCounts.NumActive--;
+                    newCounts.NumWorking--;
+                    oldCounts = WorkerCounter.CompareExchangeCounts(newCounts, counts);
+                    if (oldCounts == counts)
+                        break;
+                    counts = oldCounts;
+                }
+                goto Exit;
+            }
+            #endif // FEATURE_COMINTEROP
+
+            pThread->SetBackground(TRUE);
+            fThreadInit = TRUE;
+        }
+    }
+
+    GCX_PREEMP_NO_DTOR();
+    _ASSERTE(pThread == NULL || !pThread->PreemptiveGCDisabled());
+
+    // make sure there's really work.  If not, go back to sleep
+
+    counts = WorkerCounter.GetCleanCounts();
+    while (true) // compare-exchange retry loop; left via break (go execute work) or goto (Retire / WaitForWork)
+    {
+        _ASSERTE(counts.NumActive > 0);
+        _ASSERTE(counts.NumWorking > 0);
+
+        newCounts = counts;
+
+        bool retired;
+
+        if (counts.NumActive > counts.MaxWorking) // more active threads than MaxWorking allows: this thread retires
+        {
+            newCounts.NumActive--;
+            newCounts.NumRetired++;
+            retired = true;
+        }
+        else
+        {
+            retired = false;
+
+            if (foundWork)
+                break; // stay counted as working; no counter update is needed
+        }
+
+        newCounts.NumWorking--; // reached when retiring, or when the previous pass found no work
+
+        oldCounts = WorkerCounter.CompareExchangeCounts(newCounts, counts);
+
+        if (oldCounts == counts)
+        {
+            if (retired)
+                goto Retire;
+            else
+                goto WaitForWork;
+        }
+
+        counts = oldCounts; // lost the race with another update: recompute from the current counts
+    }
+
+    if (GCHeap::IsGCInProgress(TRUE))
+    {
+        // GC is imminent, so wait until GC is complete before executing next request.
+        // this reduces in-flight objects allocated right before GC, easing the GC's work
+        GCHeap::WaitForGCCompletion(TRUE);
+    }
+
+    {
+        ThreadLocaleHolder localeHolder;
+
+        ThreadpoolMgr::UpdateLastDequeueTime();
+        ThreadpoolMgr::ExecuteWorkRequest(&foundWork, &wasNotRecalled);
+    }
+
+    if (foundWork)
+    {
+        // Reset TLS etc. for next WorkRequest.
+        if (pThread == NULL)
+            pThread = GetThread();
+
+        if (pThread) 
+        {
+            if (pThread->IsAbortRequested())
+                pThread->EEResetAbort(Thread::TAR_ALL);
+            pThread->InternalReset(FALSE);
+        }
+    }
+
+    if (wasNotRecalled)
+        goto Work; // otherwise control falls through into Retire
+
+Retire:
+
+    counts = WorkerCounter.GetCleanCounts();
+    FireEtwThreadPoolWorkerThreadRetirementStart(counts.NumActive, counts.NumRetired, GetClrInstanceId());
+
+    // It's possible that some work came in just before we decremented the active thread count, in which 
+    // case whoever queued that work may be expecting us to pick it up - so they would not have signalled
+    // the worker semaphore.  If there are other threads waiting, they will never be woken up, because 
+    // whoever queued the work expects that it's already been picked up.  The solution is to signal the semaphore
+    // if there's any work available.
+    if (PerAppDomainTPCountList::AreRequestsPendingInAnyAppDomains())
+        MaybeAddWorkingWorker();
+
+    while (true)
+    {
+RetryRetire:
+        DWORD result = RetiredWorkerSemaphore->Wait(AppX::IsAppXProcess() ? WorkerTimeoutAppX : WorkerTimeout, FALSE);
+        _ASSERTE(WAIT_OBJECT_0 == result || WAIT_TIMEOUT == result);
+
+        if (WAIT_OBJECT_0 == result)
+        {
+            foundWork = true; // signalled out of retirement: go back to work
+            counts = WorkerCounter.GetCleanCounts();
+            FireEtwThreadPoolWorkerThreadRetirementStop(counts.NumActive, counts.NumRetired, GetClrInstanceId());
+            goto Work;
+        }
+
+        if (!IsIoPending()) // timed out; with I/O still pending the thread keeps waiting instead of exiting
+        {
+            //
+            // We're going to exit.  There's a nasty race here.  We're about to decrement NumRetired,
+            // since we're going to exit.  Once we've done that, nobody will expect this thread
+            // to be waiting for RetiredWorkerSemaphore.  But between now and then, other threads still
+            // think we're waiting on the semaphore, and they will happily do the following to try to
+            // wake us up:
+            //
+            // 1) Decrement NumRetired
+            // 2) Increment NumActive
+            // 3) Increment NumWorking
+            // 4) Signal RetiredWorkerSemaphore
+            //
+            // We will not receive that signal.  If we don't do something special here,
+            // we will decrement NumRetired an extra time, and leave the world thinking there
+            // are fewer retired threads, and more working threads than reality.
+            //
+            // What can we do about this?  First, we *need* to decrement NumRetired.  If someone did it before us,
+            // it might go negative.  This is the easiest way to tell that we've encountered this race.  In that case,
+            // we will simply not commit the decrement, swallow the signal that was sent, and proceed as if we
+            // got WAIT_OBJECT_0 in the wait above.
+            //
+            // If we don't hit zero while decrementing NumRetired, we still may have encountered this race.  But 
+            // if we don't hit zero, then there's another retired thread that will pick up this signal.  So it's ok
+            // to exit.
+            //
+            counts = WorkerCounter.GetCleanCounts();
+            while (true)
+            {
+                if (counts.NumRetired == 0)
+                    goto RetryRetire; // the race described above was hit: wait again to consume the signal
+
+                newCounts = counts;
+                newCounts.NumRetired--;
+
+                oldCounts = WorkerCounter.CompareExchangeCounts(newCounts, counts);
+                if (oldCounts == counts)
+                {
+                    counts = newCounts; // report the post-decrement counts in the ETW event below
+                    break;
+                }
+                counts = oldCounts;
+            }
+
+            FireEtwThreadPoolWorkerThreadRetirementStop(counts.NumActive, counts.NumRetired, GetClrInstanceId());
+            goto Exit;
+        }
+    }
+
+WaitForWork:
+
+    // It's possible that we decided we had no work just before some work came in, 
+    // but reduced the worker count *after* the work came in.  In this case, we might
+    // miss the notification of available work.  So we make a sweep through the ADs here,
+    // and wake up a thread (maybe this one!) if there is work to do.
+    if (PerAppDomainTPCountList::AreRequestsPendingInAnyAppDomains())
+    {
+        foundWork = true;
+        MaybeAddWorkingWorker();
+    }
+
+    FireEtwThreadPoolWorkerThreadWait(counts.NumActive, counts.NumRetired, GetClrInstanceId()); // counts still holds the values read before the successful CompareExchange that led here
+
+RetryWaitForWork:
+    if (!WorkerSemaphore->Wait(AppX::IsAppXProcess() ? WorkerTimeoutAppX : WorkerTimeout))
+    {
+        if (!IsIoPending())
+        {
+            //
+            // We timed out, and are about to exit.  This puts us in a very similar situation to the
+            // retirement case above - someone may think we're still waiting, and go ahead and:
+            //
+            // 1) Increment NumWorking
+            // 2) Signal WorkerSemaphore
+            //
+            // The solution is much like retirement; when we're decrementing NumActive, we need to make
+            // sure it doesn't drop below NumWorking.  If it would, then we need to go back and wait 
+            // again.
+            //
+
+            DangerousNonHostedSpinLockHolder tal(&ThreadAdjustmentLock);
+
+            counts = WorkerCounter.GetCleanCounts();
+            while (true)
+            {
+                if (counts.NumActive == counts.NumWorking) // decrementing NumActive would take it below NumWorking
+                {
+                    goto RetryWaitForWork;
+                }
+
+                newCounts = counts;
+                newCounts.NumActive--;
+
+                // if we timed out while active, then Hill Climbing needs to be told that we need fewer threads
+                newCounts.MaxWorking = max(MinLimitTotalWorkerThreads, min(newCounts.NumActive, newCounts.MaxWorking));
+
+                oldCounts = WorkerCounter.CompareExchangeCounts(newCounts, counts);
+
+                if (oldCounts == counts)
+                {
+                    HillClimbingInstance.ForceChange(newCounts.MaxWorking, ThreadTimedOut);
+                    goto Exit;
+                }
+
+                counts = oldCounts;
+            }
+        }
+        else
+        {
+            goto RetryWaitForWork; // I/O is still pending, so this thread must not exit yet
+        }
+    }
+    else
+    {
+        foundWork = true; // the semaphore was signalled
+        goto Work;
+    }
+
+Exit:
+
+#ifdef FEATURE_COMINTEROP
+    if (pThread) {
+        pThread->SetApartment(Thread::AS_Unknown, TRUE);
+        pThread->CoUninitialize();
+    }
+
+    // Couninit the worker thread (balances the CoInitializeEx call made at the top of this function)
+    if (fCoInited)
+    {
+        CoUninitialize();
+    }
+#endif
+
+    if (pThread) {
+        pThread->ClearThreadCPUGroupAffinity();
+
+        DestroyThread(pThread);
+    }
+
+    _ASSERTE(!IsIoPending());
+
+    counts = WorkerCounter.GetCleanCounts();
+    FireEtwThreadPoolWorkerThreadStop(counts.NumActive, counts.NumRetired, GetClrInstanceId());
+
+    return ERROR_SUCCESS;
+}
+
+
+#ifdef _MSC_VER
+#pragma warning(default:4702)
+#endif
+// Calls __SwitchToThread once with SUSPEND_TIME and then reports whether the
+// caller should still retire: FALSE if cpuUtilization has dropped by 4 or
+// more since entry, TRUE otherwise.
+BOOL ThreadpoolMgr::SuspendProcessing()
+{
+    CONTRACTL
+    {
+        NOTHROW;
+        GC_NOTRIGGER;
+        MODE_PREEMPTIVE;
+    }
+    CONTRACTL_END;
+
+    DWORD suspendInterval = SUSPEND_TIME;
+    int utilizationAtEntry = cpuUtilization;
+
+    // A single pause, followed by a single look at the utilization.
+    __SwitchToThread(suspendInterval, CALLER_LIMITS_SPINNING);
+
+    if (cpuUtilization <= (utilizationAtEntry - 4))
+    {
+        // if cpu util. dips by 4% or more, then put it back in circulation
+        return FALSE;
+    }
+
+    return TRUE;
+}
+
+
+// Waits on ev for up to sleepTime and returns the wait status. Any exception
+// raised by the wait is swallowed, in which case WAIT_TIMEOUT is returned.
+// Note that the alertable argument is not used: the wait is always made
+// with FALSE.
+// this should only be called by unmanaged thread (i.e. there should be no mgd
+// caller on the stack) since we are swallowing terminal exceptions
+DWORD ThreadpoolMgr::SafeWait(CLREvent * ev, DWORD sleepTime, BOOL alertable)
+{
+    STATIC_CONTRACT_NOTHROW;
+    STATIC_CONTRACT_GC_NOTRIGGER;
+    STATIC_CONTRACT_MODE_PREEMPTIVE;
+    /* cannot use contract because of SEH
+    CONTRACTL
+    {
+        NOTHROW;
+        GC_NOTRIGGER;
+        MODE_PREEMPTIVE;
+    }
+    CONTRACTL_END;*/
+
+    DWORD waitResult = WAIT_TIMEOUT;
+
+    EX_TRY
+    {
+        waitResult = ev->Wait(sleepTime,FALSE);
+    }
+    EX_CATCH
+    {
+        // nothing to do: waitResult keeps its WAIT_TIMEOUT default
+    }
+    EX_END_CATCH(SwallowAllExceptions)
+
+    return waitResult;
+}
+
+/************************************************************************/
+
+// Registers a wait on hWaitObject with one of the dedicated wait threads.
+// Arguments:
+//   phNewWaitObject: receives the new WaitInfo (as an opaque handle) on
+//                    success, NULL on failure.
+//   hWaitObject:     the handle to wait on.
+//   Callback/Context: stored in the WaitInfo for the wait thread to use.
+//   timeout:         timeout for the wait, stored as both the timeout and the
+//                    initial remaining time.
+//   dwFlag:          wait flags (e.g. WAIT_SINGLE_EXECUTION).
+// Returns TRUE if the wait was handed to a wait thread, FALSE if no wait
+// thread was available, the WaitInfo could not be allocated, or the APC
+// could not be queued. EnsureInitialized and FindWaitThread may throw.
+BOOL ThreadpoolMgr::RegisterWaitForSingleObject(PHANDLE phNewWaitObject,
+                                                HANDLE hWaitObject,
+                                                WAITORTIMERCALLBACK Callback,
+                                                PVOID Context,
+                                                ULONG timeout,
+                                                DWORD dwFlag )
+{
+    CONTRACTL
+    {
+        THROWS;
+        MODE_ANY;
+        if (GetThread()) { GC_TRIGGERS;} else {DISABLED(GC_NOTRIGGER);}
+    }
+    CONTRACTL_END;
+    EnsureInitialized();
+
+    ThreadCB* threadCB;
+    {
+        CrstHolder csh(&WaitThreadsCriticalSection);
+
+        // On success this also reserves a slot on the returned wait thread
+        // by incrementing its NumWaitHandles.
+        threadCB = FindWaitThread();
+    }
+
+    *phNewWaitObject = NULL;
+
+    if (threadCB)
+    {
+        WaitInfo* waitInfo = new (nothrow) WaitInfo;
+
+        if (waitInfo == NULL)
+        {
+            // No wait will be inserted, so give back the slot reserved by
+            // FindWaitThread; otherwise the thread's capacity shrinks for good.
+            InterlockedDecrement(&threadCB->NumWaitHandles);
+            return FALSE;
+        }
+
+        waitInfo->waitHandle = hWaitObject;
+        waitInfo->Callback = Callback;
+        waitInfo->Context = Context;
+        waitInfo->timeout = timeout;
+        waitInfo->flag = dwFlag;
+        waitInfo->threadCB = threadCB;
+        waitInfo->state = 0;
+        waitInfo->refCount = 1;     // safe to do this since no wait has yet been queued, so no other thread could be modifying this
+        waitInfo->ExternalCompletionEvent = INVALID_HANDLE;
+        waitInfo->ExternalEventSafeHandle = NULL;
+        waitInfo->handleOwningAD = (ADID) 0;
+
+        waitInfo->timer.startTime = GetTickCount();
+        waitInfo->timer.remainingTime = timeout;
+
+        *phNewWaitObject = waitInfo;
+
+        // We fire the "enqueue" ETW event here, to "mark" the thread that had called the API, rather than the
+        // thread that will PostQueuedCompletionStatus (the dedicated WaitThread).
+        // This event correlates with ThreadPoolIODequeue in ThreadpoolMgr::AsyncCallbackCompletion
+        if (ETW_EVENT_ENABLED(MICROSOFT_WINDOWS_DOTNETRUNTIME_PROVIDER_Context, ThreadPoolIOEnqueue))
+            FireEtwThreadPoolIOEnqueue((LPOVERLAPPED)waitInfo, Callback, (dwFlag & WAIT_SINGLE_EXECUTION) == 0, GetClrInstanceId());
+    
+        // The wait thread inserts the wait itself when it runs this APC.
+        BOOL status = QueueUserAPC((PAPCFUNC)InsertNewWaitForSelf, threadCB->threadHandle, (size_t) waitInfo);
+
+        if (status == FALSE)
+        {
+            // The APC will never run, so InsertNewWaitForSelf cannot account
+            // for the reserved slot; release it here along with the WaitInfo.
+            InterlockedDecrement(&threadCB->NumWaitHandles);
+            *phNewWaitObject = NULL;
+            delete waitInfo;
+        }
+
+        return status;
+    }
+
+    return FALSE;
+}
+
+
+// Returns a wait thread that can accommodate another wait request, and
+// reserves a slot on it by incrementing its NumWaitHandles. If every existing
+// wait thread is full, a new one is created and the search is repeated.
+// Returns NULL if a new wait thread is needed but could not be created.
+// The caller is responsible for synchronizing access to the WaitThreadsHead.
+ThreadpoolMgr::ThreadCB* ThreadpoolMgr::FindWaitThread()
+{
+    CONTRACTL
+    {
+        THROWS;     // CreateWaitThread can throw
+        MODE_ANY;
+        GC_TRIGGERS;
+    }
+    CONTRACTL_END;
+
+    for (;;)
+    {
+        LIST_ENTRY* pEntry = (LIST_ENTRY*) WaitThreadsHead.Flink;
+
+        while (pEntry != &WaitThreadsHead)
+        {
+            // The cast below relies on the link being the first member.
+            _ASSERTE(offsetof(WaitThreadInfo,link) == 0);
+
+            ThreadCB* pCandidate = ((WaitThreadInfo*) pEntry)->threadCB;
+
+            // This test and the increment that follows are protected by
+            // WaitThreadsCriticalSection, but there might be a concurrent
+            // decrement in DeactivateWait or InsertNewWaitForSelf, hence
+            // the interlock.
+            if (pCandidate->NumWaitHandles < MAX_WAITHANDLES)
+            {
+                InterlockedIncrement(&pCandidate->NumWaitHandles);
+                return pCandidate;
+            }
+
+            pEntry = (LIST_ENTRY*) pEntry->Flink;
+        }
+
+        // No wait thread has room, so a new one is needed.
+        if (!CreateWaitThread())
+            return NULL;
+
+        // Search again; the list now includes the new thread.
+    }
+}
+
+BOOL ThreadpoolMgr::CreateWaitThread() // Creates a wait thread running WaitThreadStart, waits for it to start, and links it into WaitThreadsHead. Returns FALSE on failure or during shutdown.
+{
+    CONTRACTL
+    {
+        THROWS; // CLREvent::CreateAutoEvent can throw OOM
+        GC_TRIGGERS;
+        MODE_ANY;
+        INJECT_FAULT(COMPlusThrowOM());
+    }
+    CONTRACTL_END;
+    DWORD threadId;
+
+    if (g_fEEShutDown & ShutDown_Finalize2){
+        // The process is shutting down.  Shutdown thread has ThreadStore lock,
+        // wait thread is blocked on the lock.
+        return FALSE;
+    }
+
+    NewHolder<WaitThreadInfo> waitThreadInfo(new (nothrow) WaitThreadInfo);
+    if (waitThreadInfo == NULL)
+        return FALSE;
+
+    NewHolder<ThreadCB> threadCB(new (nothrow) ThreadCB);
+
+    if (threadCB == NULL)
+    {
+        return FALSE;
+    }
+
+    threadCB->startEvent.CreateAutoEvent(FALSE); // set by WaitThreadStart once it has attempted its thread setup
+    HANDLE threadHandle = Thread::CreateUtilityThread(Thread::StackSize_Small, WaitThreadStart, (LPVOID)threadCB, CREATE_SUSPENDED, &threadId);
+
+    if (threadHandle == NULL)
+    {
+        threadCB->startEvent.CloseEvent();
+        return FALSE; // the two holders are still armed here, so presumably both allocations are freed
+    }
+
+    waitThreadInfo.SuppressRelease(); // from here on neither allocation is released by its holder
+    threadCB.SuppressRelease();
+    threadCB->threadHandle = threadHandle; // all of threadCB is filled in before ResumeThread, since the thread was created suspended
+    threadCB->threadId = threadId;              // may be useful for debugging otherwise not used
+    threadCB->NumWaitHandles = 0;
+    threadCB->NumActiveWaits = 0;
+    for (int i=0; i< MAX_WAITHANDLES; i++)
+    {
+        InitializeListHead(&(threadCB->waitPointer[i]));
+    }
+
+    waitThreadInfo->threadCB = threadCB;
+
+    DWORD status = ResumeThread(threadHandle); // NOTE(review): status is only examined at the end; if the resume failed, the loop below can only end through the shutdown check - confirm
+
+    {
+        // We will QueueUserAPC on the newly created thread.
+        // Let us wait until the thread starts running.
+        GCX_PREEMP();
+        DWORD timeout=500;
+        while (TRUE) {
+            if (g_fEEShutDown & ShutDown_Finalize2){
+                // The process is shutting down.  Shutdown thread has ThreadStore lock,
+                // wait thread is blocked on the lock.
+                return FALSE; // NOTE(review): waitThreadInfo, threadCB, the start event and threadHandle are not released on this path - presumably deliberate because the new thread may still use threadCB; confirm
+            }
+            DWORD wait_status = threadCB->startEvent.Wait(timeout, FALSE);
+            if (wait_status == WAIT_OBJECT_0) {
+                break;
+            }
+        }
+    }
+    threadCB->startEvent.CloseEvent();
+
+    // check to see if setup succeeded (WaitThreadStart sets threadHandle to NULL when SetupThreadNoThrow fails)
+    if (threadCB->threadHandle == NULL)
+        return FALSE; // NOTE(review): threadCB, waitThreadInfo and the OS thread handle do not appear to be released on this path - confirm
+
+    InsertHeadList(&WaitThreadsHead,&waitThreadInfo->link);
+
+    _ASSERTE(status != (DWORD) (-1));
+
+    return (status != (DWORD) (-1));
+
+}
+
+// Executed as an APC on a WaitThread. Adds the wait described by pArgs to the
+// set of objects that thread is waiting on, unless the wait has already been
+// marked for deletion, in which case it is deleted instead.
+void ThreadpoolMgr::InsertNewWaitForSelf(WaitInfo* pArgs)
+{
+    WRAPPER_NO_CONTRACT;
+    STATIC_CONTRACT_SO_INTOLERANT;
+
+    WaitInfo* pWait = pArgs;
+
+    // Reading and writing the state here is safe since only this thread is allowed to change it.
+    if (pWait->state & WAIT_DELETE)
+    {
+        // some thread unregistered the wait before it could be inserted
+        DeleteWait(pWait);
+        return;
+    }
+
+    pWait->state = (WAIT_REGISTERED | WAIT_ACTIVE);
+
+    ThreadCB* pOwner = pWait->threadCB;
+
+    _ASSERTE(pOwner->NumActiveWaits <= pOwner->NumWaitHandles);
+
+    // Either the slot already holding this handle, or the next free slot.
+    int slot = FindWaitIndex(pOwner, pWait->waitHandle);
+    _ASSERTE(slot >= 0 && slot <= pOwner->NumActiveWaits);
+
+    if (slot != pOwner->NumActiveWaits)
+    {
+        // this is a duplicate waithandle, so the increment in FindWaitThread
+        // wasn't strictly necessary.  This will avoid unnecessary thread creation.
+        InterlockedDecrement(&pOwner->NumWaitHandles);
+    }
+    else
+    {
+        // First wait on this handle: it takes the next free slot.
+        pOwner->waitHandle[slot] = pWait->waitHandle;
+        pOwner->NumActiveWaits++;
+    }
+
+    // The WaitInfo is linked through its first member.
+    _ASSERTE(offsetof(WaitInfo, link) == 0);
+    InsertTailList(&(pOwner->waitPointer[slot]), (&pWait->link));
+}
+
+// Looks for waitHandle among the active wait handles of threadCB.
+// Returns the index of the matching entry, or NumActiveWaits (the next free
+// entry) if the handle is not present.
+int ThreadpoolMgr::FindWaitIndex(const ThreadCB* threadCB, const HANDLE waitHandle)
+{
+    LIMITED_METHOD_CONTRACT;
+
+    int slot = 0;
+
+    while (slot < threadCB->NumActiveWaits)
+    {
+        if (threadCB->waitHandle[slot] == waitHandle)
+        {
+            return slot;
+        }
+
+        slot++;
+    }
+
+    // no match: report the next free entry
+    return threadCB->NumActiveWaits;
+}
+
+
+// TimeExpired: if no wraparound occurred (last <= now), the timer has expired if duetime lies between last and now, inclusive;
+// if wraparound occurred, then the timer expired if duetime is greater than or equal to last, or duetime is less than or equal to now
+#define TimeExpired(last,now,duetime) (last <= now ? \
+                                       (duetime <= now && duetime >= last): \
+                                       (duetime >= last || duetime <= now))
+// TimeInterval: ticks elapsed from start to end, allowing for one wraparound past 0xffffffff. NOTE(review): the arguments of both macros are not parenthesized, so pass simple expressions only.
+#define TimeInterval(end,start) ( end > start ? (end - start) : ((0xffffffff - start) + end + 1)   )
+
+// Walks the wait lists in the first numWaits entries of waitInfo. For every
+// wait with a finite timeout, the remaining time is recomputed from the
+// current tick count and stored back in the wait. Returns the smallest
+// remaining time seen, or (unsigned int) -1 if no wait has a finite timeout.
+DWORD ThreadpoolMgr::MinimumRemainingWait(LIST_ENTRY* waitInfo, unsigned int numWaits)
+{
+    LIMITED_METHOD_CONTRACT;
+
+    unsigned int shortest = (unsigned int) -1;
+    DWORD now = GetTickCount();
+
+    for (unsigned slot = 0; slot < numWaits; slot++)
+    {
+        LIST_ENTRY* pListHead = &(waitInfo[slot]);
+        WaitInfo* pWait = (WaitInfo*) (pListHead->Flink);
+
+        // The first entry is processed before the end-of-list check is made.
+        do
+        {
+            if (pWait->timeout != INFINITE)
+            {
+                // time gone by since the wait was started
+                DWORD elapsed = TimeInterval(now, pWait->timer.startTime);
+
+                __int64 remaining = (__int64) (pWait->timeout) - (__int64) elapsed;
+
+                // store the remaining time, never going below zero
+                if (remaining > 0)
+                {
+                    pWait->timer.remainingTime = (int) remaining;
+                }
+                else
+                {
+                    pWait->timer.remainingTime = 0;
+                }
+
+                // keep track of the smallest value
+                if (pWait->timer.remainingTime < shortest)
+                {
+                    shortest = pWait->timer.remainingTime;
+                }
+            }
+
+            pWait = (WaitInfo*) (pWait->link.Flink);
+
+        } while ((PVOID) pWait != (PVOID) pListHead);
+    }
+
+    return shortest;
+}
+
+#ifdef _MSC_VER
+#ifdef _WIN64
+#pragma warning (disable : 4716)
+#else
+#pragma warning (disable : 4715)
+#endif
+#endif
+#ifdef _PREFAST_
+#pragma warning(push)
+#pragma warning(disable:22008) // "Prefast integer overflow check on (0 + lval) is bogus.  Tried local disable without luck, doing whole method."
+#endif
+
+// Entry point for a wait thread. lpArgs is the ThreadCB that holds this thread's
+// wait tables (waitHandle / waitPointer / NumActiveWaits).
+//
+// The thread first tries to set itself up as a runtime Thread. startEvent is set
+// whether or not that succeeds; on failure threadHandle is cleared beforehand and
+// the function returns 0. On success the thread loops forever, waiting alertably
+// on the active handles and handing each signaled or timed-out wait to
+// ProcessWaitCompletion.
+DWORD __stdcall ThreadpoolMgr::WaitThreadStart(LPVOID lpArgs)
+{
+    CONTRACTL
+    {
+        THROWS;
+        GC_TRIGGERS;
+        MODE_PREEMPTIVE;
+        SO_TOLERANT;
+    }
+    CONTRACTL_END;
+
+    ClrFlsSetThreadType (ThreadType_Wait);
+
+    ThreadCB* threadCB = (ThreadCB*) lpArgs;
+    Thread* pThread = SetupThreadNoThrow();
+
+    // Thread setup failed: clear threadHandle before signaling startEvent below.
+    if (pThread == NULL)
+    {
+        _ASSERTE(threadCB->threadHandle != NULL);
+        threadCB->threadHandle = NULL;
+    }
+
+    // Signaled on both the success and the failure path.
+    threadCB->startEvent.Set();
+
+    if (pThread == NULL)
+    {
+        return 0;
+    }
+
+    BEGIN_SO_INTOLERANT_CODE(pThread);  // we probe at the top of the thread so we can safely call anything below here.
+    {
+        // wait threads never die. (Why?)
+        for (;;)
+        {
+            DWORD status;
+            DWORD timeout = 0;
+
+            // Nothing to wait on: sleep alertably until an APC arrives.
+            if (threadCB->NumActiveWaits == 0)
+            {
+
+#undef SleepEx
+                // <TODO>@TODO Consider doing a sleep for an idle period and terminating the thread if no activity</TODO>
+        //We use SleepEx instead of CLRSleepEx because CLRSleepEx calls into SQL(or other hosts) in hosted
+        //scenarios. SQL does not deliver APC's, and the wait thread wait insertion/deletion logic depends on
+        //APC's being delivered.
+                status = SleepEx(INFINITE,TRUE);
+#define SleepEx(a,b) Dont_Use_SleepEx(a,b)
+
+                _ASSERTE(status == WAIT_IO_COMPLETION);
+            }
+            else if (IsWaitThreadAPCPending())
+            {
+                //Do a sleep if an APC is pending, This was done to solve the corner case where the wait is signaled,
+                //and APC to deregister the wait never fires. That scenario leads to an infinite loop. This check would
+                //allow the thread to enter alertable wait and thus cause the APC to fire.
+
+                ResetWaitThreadAPCPending(); 
+
+                //We use SleepEx instead of CLRSleepEx because CLRSleepEx calls into SQL(or other hosts) in hosted
+                //scenarios. SQL does not deliver APC's, and the wait thread wait insertion/deletion logic depends on
+                //APC's being delivered.
+
+                #undef SleepEx
+                status = SleepEx(0,TRUE);    
+                #define SleepEx(a,b) Dont_Use_SleepEx(a,b)
+
+                // Restart the loop; the result of the zero-length sleep is not examined.
+                continue;
+            }
+            else
+            {
+                // compute minimum timeout. this call also updates the remainingTime field for each wait
+                timeout = MinimumRemainingWait(threadCB->waitPointer,threadCB->NumActiveWaits);
+
+                status = WaitForMultipleObjectsEx(  threadCB->NumActiveWaits,
+                                                    threadCB->waitHandle,
+                                                    FALSE,                      // waitall
+                                                    timeout,
+                                                    TRUE  );                    // alertable
+
+                _ASSERTE( (status == WAIT_TIMEOUT) ||
+                          (status == WAIT_IO_COMPLETION) ||
+                          //It could be that there are no waiters at this point,
+                          //as the APC to deregister the wait may have run.
+                          (status == WAIT_OBJECT_0) ||
+                          (status >= WAIT_OBJECT_0 && status < (DWORD)(WAIT_OBJECT_0 + threadCB->NumActiveWaits))  ||
+                          (status == WAIT_FAILED));
+
+                //It could be that the last waiter also got deregistered.
+                if (threadCB->NumActiveWaits == 0)
+                {
+                    continue;
+                }
+            }
+
+            // An APC ran during the alertable wait/sleep; go around again.
+            if (status == WAIT_IO_COMPLETION)
+                continue;
+
+            if (status == WAIT_TIMEOUT)
+            {
+                // Walk every handle's wait list and complete (as timed out) each wait whose
+                // remainingTime equals the timeout that was just used.
+                // NOTE(review): ProcessWaitCompletion can call DeactivateNthWait, which may shift
+                // later slots down into position i and decrement NumActiveWaits; the i++ would then
+                // step over the shifted-in slot for this pass - confirm this is acceptable.
+                for (int i=0; i< threadCB->NumActiveWaits; i++)
+                {
+                    WaitInfo* waitInfo = (WaitInfo*) (threadCB->waitPointer[i]).Flink;
+                    PVOID waitInfoHead = &(threadCB->waitPointer[i]);
+
+                    do
+                    {
+                        _ASSERTE(waitInfo->timer.remainingTime >= timeout);
+
+                        // Capture the successor first: processing may unlink waitInfo.
+                        WaitInfo* wTemp = (WaitInfo*) waitInfo->link.Flink;
+
+                        if (waitInfo->timer.remainingTime == timeout)
+                        {
+                            ProcessWaitCompletion(waitInfo,i,TRUE);
+                        }
+
+                        waitInfo = wTemp;
+
+                    } while ((PVOID) waitInfo != waitInfoHead);
+                }
+            }
+            else if (status >= WAIT_OBJECT_0 && status < (DWORD)(WAIT_OBJECT_0 + threadCB->NumActiveWaits))
+            {
+                // One of the handles was signaled; index selects its wait list.
+                unsigned index = status - WAIT_OBJECT_0;
+                WaitInfo* waitInfo = (WaitInfo*) (threadCB->waitPointer[index]).Flink;
+                PVOID waitInfoHead = &(threadCB->waitPointer[index]);
+                BOOL isAutoReset;
+
+                // Setting to unconditional TRUE is inefficient since we will re-enter the wait and release
+                // the next waiter, but short of using undocumented NT apis is the only solution.
+                // Querying the state with a WaitForSingleObject is not an option as it will reset an
+                // auto reset event if it has been signalled since the previous wait.
+                isAutoReset = TRUE;
+
+                // Because isAutoReset is always TRUE, this loop body runs exactly once:
+                // only the first wait in the list is completed per wake-up.
+                do
+                {
+                    WaitInfo* wTemp = (WaitInfo*) waitInfo->link.Flink;
+                    ProcessWaitCompletion(waitInfo,index,FALSE);
+
+                    waitInfo = wTemp;
+
+                } while (((PVOID) waitInfo != waitInfoHead) && !isAutoReset);
+
+                // If an app registers a recurring wait for an event that is always signalled (!),
+                // then no apc's will be executed since the thread never enters the alertable state.
+                // This can be fixed by doing the following:
+                //     SleepEx(0,TRUE);
+                // However, it causes an unnecessary context switch. It is not worth penalizing well
+                // behaved apps to protect poorly written apps.
+
+
+            }
+            else
+            {
+                _ASSERTE(status == WAIT_FAILED);
+                // wait failed: application error
+                // find out which wait handle caused the wait to fail
+                for (int i = 0; i < threadCB->NumActiveWaits; i++)
+                {
+                    // Zero-timeout probe of a single handle.
+                    DWORD subRet = WaitForSingleObject(threadCB->waitHandle[i], 0);
+
+                    if (subRet != WAIT_FAILED)
+                        continue;
+
+                    // remove all waits associated with this wait handle
+
+                    WaitInfo* waitInfo = (WaitInfo*) (threadCB->waitPointer[i]).Flink;
+                    PVOID waitInfoHead = &(threadCB->waitPointer[i]);
+
+                    do
+                    {
+                        // Capture the successor before the wait is unlinked.
+                        WaitInfo* temp  = (WaitInfo*) waitInfo->link.Flink;
+
+                        DeactivateNthWait(waitInfo,i);
+
+
+                // Note, we cannot cleanup here since there is no way to suppress finalization
+                // we will just leak, and rely on the finalizer to clean up the memory
+                        //if (InterlockedDecrement(&waitInfo->refCount) == 0)
+                        //    DeleteWait(waitInfo);
+
+
+                        waitInfo = temp;
+
+                    } while ((PVOID) waitInfo != waitInfoHead);
+
+                    // Only the first failing handle is handled per WAIT_FAILED result.
+                    break;
+                }
+            }
+        }
+    }
+    END_SO_INTOLERANT_CODE;
+
+    //This is unreachable...so no return required.
+}
+#ifdef _PREFAST_
+#pragma warning(pop)
+#endif
+
+#ifdef _MSC_VER
+#ifdef _WIN64
+#pragma warning (default : 4716)
+#else
+#pragma warning (default : 4715)
+#endif
+#endif
+
+// Handles one completed wait (signaled, or timed out when waitTimedOut is TRUE).
+//
+//   waitInfo     - the wait that completed
+//   index        - slot of the wait's handle in the owning thread's wait array
+//   waitTimedOut - value recorded on the AsyncCallback for the user callback
+//
+// A single-execution wait is deactivated; any other wait has its timer start
+// time reset. An AsyncCallback is then allocated, a reference is taken on the
+// wait, and the callback is queued. If queuing fails, or an exception escapes,
+// the AsyncCallback is released again.
+void ThreadpoolMgr::ProcessWaitCompletion(WaitInfo* waitInfo,
+                                          unsigned index,
+                                          BOOL waitTimedOut
+                                         )
+{
+    STATIC_CONTRACT_THROWS;
+    STATIC_CONTRACT_GC_TRIGGERS;
+    STATIC_CONTRACT_MODE_PREEMPTIVE;
+    // A CONTRACTL block cannot be used in this function because of SEH.
+
+    AsyncCallback* pCallback = NULL;
+    EX_TRY
+    {
+        if (!(waitInfo->flag & WAIT_SINGLE_EXECUTION))
+        {
+            // recurring wait: reactivate it by resetting the timer
+            waitInfo->timer.startTime = GetTickCount();
+        }
+        else
+        {
+            DeactivateNthWait(waitInfo, index);
+        }
+
+        pCallback = MakeAsyncCallback();
+        if (pCallback)
+        {
+            pCallback->wait = waitInfo;
+            pCallback->waitTimedOut = waitTimedOut;
+
+            // The queued callback holds its own reference on the wait.
+            InterlockedIncrement(&waitInfo->refCount);
+
+            BOOL fQueued;
+#ifndef FEATURE_PAL
+            fQueued = PostQueuedCompletionStatus((LPOVERLAPPED)pCallback, (LPOVERLAPPED_COMPLETION_ROUTINE)WaitIOCompletionCallback);
+#else  // FEATURE_PAL
+            fQueued = QueueUserWorkItem(AsyncCallbackCompletion, pCallback, QUEUE_ONLY);
+#endif // !FEATURE_PAL
+
+            if (fQueued == FALSE)
+            {
+                ReleaseAsyncCallback(pCallback);
+            }
+        }
+    }
+    EX_CATCH
+    {
+        if (pCallback)
+        {
+            ReleaseAsyncCallback(pCallback);
+        }
+
+        // Rethrow unless unhandled exceptions are configured to be swallowed.
+        if (!SwallowUnhandledExceptions())
+        {
+            EX_RETHROW;
+        }
+    }
+    EX_END_CATCH(SwallowAllExceptions);
+}
+
+
+// Invokes the user callback of a completed wait.
+//
+//   pArgs - the AsyncCallback describing the completion (wait + waitTimedOut)
+//
+// Returns ERROR_SUCCESS after the callback has run, the value produced by
+// SetupThreadNoThrow if the current thread could not be set up, or
+// ERROR_STACK_OVERFLOW if the stack probe fails.
+DWORD __stdcall ThreadpoolMgr::AsyncCallbackCompletion(PVOID pArgs)
+{
+    CONTRACTL
+    {
+        THROWS;
+        MODE_PREEMPTIVE;
+        GC_TRIGGERS;
+        SO_TOLERANT;
+    }
+    CONTRACTL_END;
+
+    Thread * pCurThread = GetThread();
+
+    if (NULL == pCurThread)
+    {
+        // No Thread object for this thread yet: create one as a threadpool worker.
+        HRESULT hrSetup = ERROR_SUCCESS;
+
+        ClrFlsSetThreadType(ThreadType_Threadpool_Worker);
+        pCurThread = SetupThreadNoThrow(&hrSetup);
+
+        if (NULL == pCurThread)
+        {
+            return hrSetup;
+        }
+    }
+
+    BEGIN_SO_INTOLERANT_CODE_NOTHROW(pCurThread, return ERROR_STACK_OVERFLOW);
+    {
+        AsyncCallback * pCallback = (AsyncCallback*) pArgs;
+        WaitInfo * pWait = pCallback->wait;
+
+        // The holder takes over the AsyncCallback for the rest of this scope.
+        AsyncCallbackHolder callbackHolder;
+        callbackHolder.Assign(pCallback);
+
+        // We fire the "dequeue" ETW event here, before executing the user code, to enable correlation with
+        // the ThreadPoolIOEnqueue fired in ThreadpoolMgr::RegisterWaitForSingleObject
+        if (ETW_EVENT_ENABLED(MICROSOFT_WINDOWS_DOTNETRUNTIME_PROVIDER_Context, ThreadPoolIODequeue))
+        {
+            FireEtwThreadPoolIODequeue(pWait, pWait->Callback, GetClrInstanceId());
+        }
+
+        // the user callback can throw, the host must be prepared to handle it.
+        // SQL is ok, since they have a top-level SEH handler. However, there's
+        // no easy way to verify it
+        WAITORTIMERCALLBACKFUNC pfnUserCallback = (WAITORTIMERCALLBACKFUNC) pWait->Callback;
+        pfnUserCallback(pWait->Context, pCallback->waitTimedOut != FALSE);
+    }
+    END_SO_INTOLERANT_CODE;
+
+    return ERROR_SUCCESS;
+}
+
+// Finds the slot of the owning thread's wait array whose list contains waitInfo
+// and deactivates the wait from that slot via DeactivateNthWait.
+//
+// If the thread has no active waits, or waitInfo is not linked into any of the
+// active lists, the function asserts (checked builds) and returns without
+// touching the wait tables. Without these guards the unsigned "count - 1"
+// would wrap around, or DeactivateNthWait would be handed an out-of-range slot.
+void ThreadpoolMgr::DeactivateWait(WaitInfo* waitInfo)
+{
+    LIMITED_METHOD_CONTRACT;
+
+    ThreadCB* threadCB = waitInfo->threadCB;
+    const DWORD numActiveWaits = threadCB->NumActiveWaits;
+
+    // Nothing to search when there are no active waits.
+    _ASSERTE(numActiveWaits != 0);
+    if (numActiveWaits == 0)
+    {
+        return;
+    }
+
+    for (DWORD index = 0; index < numActiveWaits; index++)
+    {
+        LIST_ENTRY* head = &(threadCB->waitPointer[index]);
+        LIST_ENTRY* current = head;
+
+        // Walk the circular list starting at its head, looking for the entry
+        // whose forward link is waitInfo.
+        do {
+            if (current->Flink == (PVOID) waitInfo)
+            {
+                DeactivateNthWait(waitInfo, index);
+                return;
+            }
+
+            current = (LIST_ENTRY*) current->Flink;
+
+        } while (current != head);
+    }
+
+    // The wait was not found in any active list; do not call DeactivateNthWait
+    // with an invalid index.
+    _ASSERTE(!"DeactivateWait: wait not found in any active wait list");
+}
+
+
+// Removes waitInfo from the wait list stored at slot `index` of its owning
+// thread and clears the wait's WAIT_ACTIVE state bit.
+//
+// When other waits share the list, waitInfo is simply unlinked. When it is the
+// only entry (its Flink and Blink are equal), the slot itself is retired: the
+// following slots are shifted down by one, the moved lists are re-pointed at
+// their new heads, the vacated last slot is re-initialized, and the active-wait
+// and wait-handle counts are decremented.
+void ThreadpoolMgr::DeactivateNthWait(WaitInfo* waitInfo, DWORD index)
+{
+    LIMITED_METHOD_CONTRACT;
+
+    ThreadCB* pOwner = waitInfo->threadCB;
+
+    if (waitInfo->link.Flink == waitInfo->link.Blink)
+    {
+        // waitInfo is the only wait on this handle, so the whole slot goes away.
+        ULONG lastSlot = pOwner->NumActiveWaits -1;
+        ULONG slotsToMove = lastSlot - index;
+
+        // Close the gap by moving the remaining slots one position left.
+        ShiftWaitArray( pOwner, index+1, index, slotsToMove ) ;
+
+        // The list heads changed address; fix the back link of each first
+        // element and the forward link of each last element.
+        for (unsigned int moved = 0; moved < slotsToMove; moved++)
+        {
+            LIST_ENTRY* pHead = &(pOwner->waitPointer[index+moved]);
+            WaitInfo* pFirst = (WaitInfo*) pHead->Flink;
+            WaitInfo* pLast = (WaitInfo*) pHead->Blink;
+
+            pFirst->link.Blink = pHead;
+            pLast->link.Flink = pHead;
+        }
+
+        // The last slot is now unused; reset its list head.
+        InitializeListHead(&(pOwner->waitPointer[lastSlot]));
+
+        pOwner->NumActiveWaits-- ;
+        InterlockedDecrement(&pOwner->NumWaitHandles);
+    }
+    else
+    {
+        RemoveEntryList(&(waitInfo->link));
+    }
+
+    waitInfo->state &= ~WAIT_ACTIVE ;
+
+}
+
+// Final teardown of a wait.
+//
+// Releases and recycles the DelegateInfo context when the wait is flagged
+// WAIT_FREE_CONTEXT. Then:
+//   - WAIT_INTERNAL_COMPLETION set: signal InternalCompletionEvent and return;
+//     the thread waiting on that event deletes waitInfo.
+//   - otherwise signal ExternalCompletionEvent if one was supplied, or else
+//     release the external safe handle if present, and delete waitInfo here.
+void ThreadpoolMgr::DeleteWait(WaitInfo* waitInfo)
+{
+    CONTRACTL
+    {
+        if (waitInfo->ExternalEventSafeHandle != NULL) { THROWS;} else { NOTHROW; }
+        MODE_ANY;
+        if (GetThread()) {GC_TRIGGERS;} else {DISABLED(GC_NOTRIGGER);}
+    }
+    CONTRACTL_END;
+
+    const bool fOwnsContext = waitInfo->Context && (waitInfo->flag & WAIT_FREE_CONTEXT);
+
+    if (fOwnsContext)
+    {
+        DelegateInfo* pDelegateInfo = (DelegateInfo*) waitInfo->Context;
+
+        // Since the delegate release destroys a handle, we need to be in
+        // co-operative mode
+        {
+            GCX_COOP();
+            pDelegateInfo->Release();
+        }
+
+        RecycleMemory( pDelegateInfo, MEMTYPE_DelegateInfo );
+    }
+
+    if (waitInfo->flag & WAIT_INTERNAL_COMPLETION)
+    {
+        // waitInfo will be deleted by the thread that's waiting on this event
+        waitInfo->InternalCompletionEvent.Set();
+        return;
+    }
+
+    if (waitInfo->ExternalCompletionEvent != INVALID_HANDLE)
+    {
+        UnsafeSetEvent(waitInfo->ExternalCompletionEvent);
+    }
+    else if (waitInfo->ExternalEventSafeHandle != NULL)
+    {
+        // Release the safe handle and the GC handle holding it
+        ReleaseWaitInfo(waitInfo);
+    }
+
+    delete waitInfo;
+}
+
+
+
+/************************************************************************/
+// Unregisters a previously registered wait.
+//
+//   hWaitObject - the wait to unregister (a WaitInfo*); NULL returns FALSE
+//   Event       - (HANDLE)-1 requests a blocking unregister that returns once
+//                 the wait has been torn down; any other value is recorded as
+//                 the external completion event (NULL meaning "none") and the
+//                 call only blocks until the wait has been deactivated.
+//
+// Returns TRUE on success, FALSE if hWaitObject is NULL or the deregistration
+// request could not be queued to the wait thread. On that failure every change
+// made to the wait here (completion flag, external event, temporary event) is
+// rolled back, so that a later cleanup of the still-registered wait does not
+// signal an event that was already closed or one the caller no longer expects
+// to be signaled.
+BOOL ThreadpoolMgr::UnregisterWaitEx(HANDLE hWaitObject,HANDLE Event)
+{
+    CONTRACTL
+    {
+        THROWS; //NOTHROW;
+        if (GetThread()) {GC_TRIGGERS;} else {DISABLED(GC_NOTRIGGER);}
+        MODE_ANY;
+    }
+    CONTRACTL_END;
+
+    _ASSERTE(IsInitialized());              // cannot call unregister before first registering
+
+    const BOOL Blocking = (Event == (HANDLE) -1);
+    WaitInfo* waitInfo = (WaitInfo*) hWaitObject;
+
+    if (!hWaitObject)
+    {
+        return FALSE;
+    }
+
+    // we do not allow callbacks to run in the wait thread, hence the assert
+    _ASSERTE(GetCurrentThreadId() != waitInfo->threadCB->threadId);
+
+    // Remembered so the field can be restored if queuing the request fails.
+    HANDLE previousExternalEvent = waitInfo->ExternalCompletionEvent;
+
+    if (Blocking)
+    {
+        waitInfo->InternalCompletionEvent.CreateAutoEvent(FALSE);
+        waitInfo->flag |= WAIT_INTERNAL_COMPLETION;
+
+    }
+    else
+    {
+        waitInfo->ExternalCompletionEvent = (Event ? Event : INVALID_HANDLE);
+        _ASSERTE((waitInfo->flag & WAIT_INTERNAL_COMPLETION) == 0);
+        // we still want to block until the wait has been deactivated
+        waitInfo->PartialCompletionEvent.CreateAutoEvent(FALSE);
+    }
+
+    BOOL status = QueueDeregisterWait(waitInfo->threadCB->threadHandle, waitInfo);
+
+
+    if (status == 0)
+    {
+        STRESS_LOG1(LF_THREADPOOL, LL_ERROR, "Queue APC failed in UnregisterWaitEx %x", status);
+
+        // The wait is still registered. Undo what was set up above so that
+        // DeleteWait, whenever it eventually runs, does not take the
+        // internal-completion path with a closed event or signal the
+        // caller's event for an unregister that reported failure.
+        if (Blocking)
+        {
+            waitInfo->InternalCompletionEvent.CloseEvent();
+            waitInfo->flag &= ~WAIT_INTERNAL_COMPLETION;
+        }
+        else
+        {
+            waitInfo->PartialCompletionEvent.CloseEvent();
+            waitInfo->ExternalCompletionEvent = previousExternalEvent;
+        }
+        return FALSE;
+    }
+
+    if (!Blocking)
+    {
+        waitInfo->PartialCompletionEvent.Wait(INFINITE,TRUE);
+        waitInfo->PartialCompletionEvent.CloseEvent();
+        // we cannot do DeleteWait in DeregisterWait, since the DeleteWait could happen before
+        // we close the event. So, the code has been moved here.
+        if (InterlockedDecrement(&waitInfo->refCount) == 0)
+        {
+            DeleteWait(waitInfo);
+        }
+    }
+
+    else        // i.e. blocking
+    {
+        _ASSERTE(waitInfo->flag & WAIT_INTERNAL_COMPLETION);
+        _ASSERTE(waitInfo->ExternalEventSafeHandle == NULL);
+
+        waitInfo->InternalCompletionEvent.Wait(INFINITE,TRUE);
+        waitInfo->InternalCompletionEvent.CloseEvent();
+        delete waitInfo;  // if WAIT_INTERNAL_COMPLETION is not set, waitInfo will be deleted in DeleteWait
+    }
+    return TRUE;
+}
+
+
+// Processes a deregistration request for a wait.
+//
+// A wait that was never registered is marked WAIT_DELETE, loses one reference
+// and, if a PartialCompletionEvent exists, has it signaled. A registered wait
+// is deactivated if still active; then either the PartialCompletionEvent is
+// signaled (its waiter finishes the cleanup) or the reference count is dropped
+// and the wait deleted when it reaches zero, unless shutdown suspension is in
+// progress.
+void ThreadpoolMgr::DeregisterWait(WaitInfo* pArgs)
+{
+
+    WRAPPER_NO_CONTRACT;
+    STATIC_CONTRACT_SO_INTOLERANT;
+
+    WaitInfo* pWait = pArgs;
+    const bool fRegistered = (pWait->state & WAIT_REGISTERED) != 0;
+
+    if (!fRegistered)
+    {
+        // set state to deleted, so that it does not get registered
+        pWait->state |= WAIT_DELETE ;
+
+        // since the wait has not even been registered, we dont need an interlock to decrease the RefCount
+        pWait->refCount--;
+
+        if (pWait->PartialCompletionEvent.IsValid())
+        {
+            pWait->PartialCompletionEvent.Set();
+        }
+        return;
+    }
+
+    if (pWait->state & WAIT_ACTIVE)
+    {
+        DeactivateWait(pWait);
+    }
+
+    if (pWait->PartialCompletionEvent.IsValid())
+    {
+        // we cannot delete the wait here since the PartialCompletionEvent
+        // may not have been closed yet. so, we return and rely on the waiter of PartialCompletionEvent
+        // to do the close
+        pWait->PartialCompletionEvent.Set();
+        return;
+    }
+
+    // After we suspend EE during shutdown, a thread may be blocked in WaitForEndOfShutdown in alertable state.
+    // We don't allow a thread reenter runtime while processing APC or pumping message.
+    if (InterlockedDecrement(&pWait->refCount) == 0 && !g_fSuspendOnShutdown)
+    {
+        DeleteWait(pWait);
+    }
+}
+
+
+/* Called on a finalizer thread ONLY IF an app does not deregister the wait.
+   The registeredWaitHandle having been collected by the GC does not by itself
+   make it safe to delete the wait; the refcount tells us when it is safe.
+   This routine therefore only queues a deregistration request to the wait
+   thread and logs if that request could not be queued.
+*/
+void ThreadpoolMgr::WaitHandleCleanup(HANDLE hWaitObject)
+{
+    LIMITED_METHOD_CONTRACT;
+
+    WaitInfo* pWait = (WaitInfo*) hWaitObject;
+    _ASSERTE(pWait->refCount > 0);
+
+    DWORD queued = QueueDeregisterWait(pWait->threadCB->threadHandle, pWait);
+
+    if (queued == 0)
+    {
+        STRESS_LOG1(LF_THREADPOOL, LL_ERROR, "Queue APC failed in WaitHandleCleanup %x", queued);
+    }
+
+}
+
+// Starts the gate thread as a small-stack utility thread running
+// GateThreadStart. Returns TRUE if the thread was created, FALSE otherwise.
+// The creation handle is closed immediately because it is not needed afterwards.
+BOOL ThreadpoolMgr::CreateGateThread()
+{
+    LIMITED_METHOD_CONTRACT;
+
+    // The gate thread is only needed if the CLR is providing part of the ThreadPool implementation.
+    _ASSERTE(!CLRThreadpoolHosted() || !CLRIoCompletionHosted());
+
+    HANDLE hGateThread = Thread::CreateUtilityThread(Thread::StackSize_Small, GateThreadStart, NULL);
+
+    if (hGateThread == NULL)
+    {
+        return FALSE;
+    }
+
+    CloseHandle(hGateThread);  //we don't need this anymore
+    return TRUE;
+}
+
+
+
+/************************************************************************/
+
+// Associates FileHandle with the thread pool's global I/O completion port so
+// that completions on the handle are dispatched to Function.
+//
+//   FileHandle - handle to bind
+//   Function   - completion routine; stored as the completion key
+//   Flags      - not used by this implementation
+//   errCode    - [out] 0 on success, otherwise the failure code. It is the
+//                host's HRESULT when a host I/O completion manager performs
+//                the bind, and a Win32 error code otherwise.
+//
+// Returns TRUE on success and FALSE on failure. On platforms built with
+// FEATURE_PAL the operation is not implemented: the function fails with
+// ERROR_CALL_NOT_IMPLEMENTED, reported both through errCode and the thread's
+// last error, so callers that inspect errCode see the real reason.
+BOOL ThreadpoolMgr::BindIoCompletionCallback(HANDLE FileHandle,
+                                            LPOVERLAPPED_COMPLETION_ROUTINE Function,
+                                            ULONG Flags,
+                                            DWORD& errCode)
+{
+
+    CONTRACTL
+    {
+        THROWS;     // EnsureInitialized can throw
+        if (GetThread()) { GC_TRIGGERS;} else {DISABLED(GC_NOTRIGGER);}
+        MODE_ANY;
+    }
+    CONTRACTL_END;
+
+#ifndef FEATURE_PAL
+    
+    errCode = S_OK;
+
+    EnsureInitialized();
+
+#ifdef FEATURE_INCLUDE_ALL_INTERFACES
+    // When a host supplies an I/O completion manager, the bind is delegated to it.
+    IHostIoCompletionManager *provider = CorHost2::GetHostIoCompletionManager();
+    if (provider) {
+        BEGIN_SO_TOLERANT_CODE_CALLING_HOST(GetThread());
+        errCode = provider->Bind(GlobalCompletionPort, FileHandle);
+        END_SO_TOLERANT_CODE_CALLING_HOST;
+        if (FAILED(errCode))
+        {
+            SetLastHRError(errCode);
+            return FALSE;
+        }
+        else
+        {
+            return TRUE;
+        }
+    }
+#endif // FEATURE_INCLUDE_ALL_INTERFACES
+
+    _ASSERTE(GlobalCompletionPort != NULL);
+
+    if (!InitCompletionPortThreadpool)
+        InitCompletionPortThreadpool = TRUE;
+
+    GrowCompletionPortThreadpoolIfNeeded();
+
+    // Bind the handle to the existing global port; the routine is the completion key.
+    HANDLE h = CreateIoCompletionPort(FileHandle,
+                                      GlobalCompletionPort,
+                                      (ULONG_PTR) Function,
+                                      NumberOfProcessors);
+    if (h == NULL)
+    {
+        errCode = GetLastError();
+        return FALSE;
+    }
+
+    _ASSERTE(h == GlobalCompletionPort);
+
+    return TRUE;
+#else // FEATURE_PAL
+    // Not implemented on this platform. Fill in the out-parameter as well as
+    // the last error so the failure reason is not left unset for the caller.
+    errCode = ERROR_CALL_NOT_IMPLEMENTED;
+    SetLastError(ERROR_CALL_NOT_IMPLEMENTED);
+    return FALSE;
+#endif // !FEATURE_PAL
+}
+
+#ifndef FEATURE_PAL
+// Creates and starts one completion port thread running
+// CompletionPortThreadStart with lpArgs as its argument.
+//
+// CreateUnimpersonatedThread reports through fIsCLRThread whether the returned
+// value is a Thread object or a raw thread handle; a Thread is started through
+// its own methods, while a raw handle is resumed and then closed.
+// Returns TRUE if a thread was created, FALSE otherwise.
+BOOL ThreadpoolMgr::CreateCompletionPortThread(LPVOID lpArgs)
+{
+    CONTRACTL
+    {
+        NOTHROW;
+        if (GetThread()) { GC_TRIGGERS;} else {DISABLED(GC_NOTRIGGER);}
+        MODE_ANY;
+    }
+    CONTRACTL_END;
+
+    BOOL fIsCLRThread;
+    Thread *pNewThread = CreateUnimpersonatedThread(CompletionPortThreadStart, lpArgs, &fIsCLRThread);
+
+    if (pNewThread == NULL)
+    {
+        return FALSE;
+    }
+
+    LastCPThreadCreation = GetTickCount();          // record this for use by logic to spawn additional threads
+
+    if (!fIsCLRThread)
+    {
+        // pNewThread is really a thread handle in this case.
+        HANDLE hNewThread = (HANDLE)pNewThread;
+        DWORD resumeResult;
+        resumeResult = ResumeThread(hNewThread);
+        _ASSERTE(resumeResult != (DWORD) (-1));
+        CloseHandle(hNewThread);          // we don't need this anymore
+    }
+    else
+    {
+        pNewThread->ChooseThreadCPUGroupAffinity();
+        pNewThread->StartThread();
+    }
+
+    ThreadCounter::Counts counts = CPThreadCounter.GetCleanCounts();
+    FireEtwIOThreadCreate_V1(counts.NumActive + counts.NumRetired, counts.NumRetired, GetClrInstanceId());
+
+    return TRUE;
+}
+
+DWORD __stdcall ThreadpoolMgr::CompletionPortThreadStart(LPVOID lpArgs)
+{
+    ClrFlsSetThreadType (ThreadType_Threadpool_IOCompletion);
+
+    CONTRACTL
+    {
+        THROWS;
+        if (GetThread()) { MODE_PREEMPTIVE;} else { DISABLED(MODE_ANY);}
+        if (GetThread()) { GC_TRIGGERS;} else {DISABLED(GC_NOTRIGGER);}
+        SO_INTOLERANT;
+    }
+    CONTRACTL_END;
+
+    _ASSERTE (!CLRIoCompletionHosted());
+
+    DWORD numBytes=0;
+    size_t key=0;
+
+    LPOVERLAPPED pOverlapped = NULL;
+    DWORD errorCode;
+    PIOCompletionContext context;
+    BOOL fIsCompletionContext;
+
+    const DWORD CP_THREAD_WAIT = AppX::IsAppXProcess() ? 5000 : 15000; /* milliseconds */
+
+    _ASSERTE(GlobalCompletionPort != NULL);
+
+    BOOL fThreadInit = FALSE;
+    Thread *pThread = NULL;
+
+    if (g_fEEStarted) {
+        pThread = SetupThreadNoThrow();
+        if (pThread == NULL) {
+            return 0;
+        }
+
+        // converted to CLRThread and added to ThreadStore, pick an group affinity for this thread
+        pThread->ChooseThreadCPUGroupAffinity(); 
+
+        fThreadInit = TRUE;
+    }
+
+#ifdef FEATURE_COMINTEROP
+    // Threadpool threads should be initialized as MTA. If we are unable to do so,
+    // return failure.
+    BOOL fCoInited = FALSE;
+    {
+        fCoInited = SUCCEEDED(::CoInitializeEx(NULL, COINIT_MULTITHREADED));
+        if (!fCoInited)
+        {
+            goto Exit;
+        }
+    }
+
+    if (pThread && pThread->SetApartment(Thread::AS_InMTA, TRUE) != Thread::AS_InMTA)
+    {
+        // @todo: should we log the failure
+        goto Exit;
+    }
+#endif // FEATURE_COMINTEROP
+
+    ThreadCounter::Counts oldCounts;
+    ThreadCounter::Counts newCounts;
+
+    DWORD cpThreadWait = CP_THREAD_WAIT;
+    for (;; )
+    {
+Top:
+        if (!fThreadInit) {
+            if (g_fEEStarted) {
+                pThread = SetupThreadNoThrow();
+                if (pThread == NULL) {
+                    break;
+                }
+
+                // converted to CLRThread and added to ThreadStore, pick an group affinity for this thread
+                pThread->ChooseThreadCPUGroupAffinity(); 
+
+#ifdef FEATURE_COMINTEROP
+                if (pThread->SetApartment(Thread::AS_InMTA, TRUE) != Thread::AS_InMTA)
+                {
+                    // @todo: should we log the failure
+                    goto Exit;
+                }
+#endif // FEATURE_COMINTEROP
+
+                fThreadInit = TRUE;
+            }
+        }
+
+        GCX_PREEMP_NO_DTOR();
+
+        //
+        // We're about to wait on the IOCP; mark ourselves as no longer "working."
+        //
+        while (true)
+        {
+            ThreadCounter::Counts oldCounts = CPThreadCounter.DangerousGetDirtyCounts();
+            ThreadCounter::Counts newCounts = oldCounts;
+            newCounts.NumWorking--;
+
+            //
+            // If we've only got one thread left, it won't be allowed to exit, because we need to keep
+            // one thread listening for completions.  So there's no point in having a timeout; it will
+            // only use power unnecessarily.
+            //
+            cpThreadWait = (newCounts.NumActive == 1) ? INFINITE : CP_THREAD_WAIT;
+
+            if (oldCounts == CPThreadCounter.CompareExchangeCounts(newCounts, oldCounts))
+                break;
+        }
+
+        errorCode = S_OK;
+
+        if (lpArgs == NULL)
+        {
+            CONTRACT_VIOLATION(ThrowsViolation);
+
+            if (g_fCompletionPortDrainNeeded && pThread)
+            {
+                // We have started draining completion port.
+                // The next job picked up by this thread is going to be after our special marker.
+                if (!pThread->IsCompletionPortDrained())
+                {
+                    pThread->MarkCompletionPortDrained();
+                }
+            }
+
+            context = NULL;
+            fIsCompletionContext = FALSE;
+        
+            if (pThread == NULL) 
+            {    
+                pThread = GetThread();
+            }
+
+            if (pThread) 
+            {
+ 
+                context = (PIOCompletionContext) pThread->GetIOCompletionContext();
+            
+                if (context->lpOverlapped != NULL) 
+                {
+                    errorCode = context->ErrorCode;
+                    numBytes = context->numBytesTransferred;
+                    pOverlapped = context->lpOverlapped;
+                    key = context->key;
+                    
+                    context->lpOverlapped = NULL;
+                    fIsCompletionContext = TRUE;
+                }
+            }
+
+            if((context == NULL) || (!fIsCompletionContext))
+            {
+                _ASSERTE (context == NULL || context->lpOverlapped == NULL);
+
+                LeaveRuntimeHolder holder((size_t)GetQueuedCompletionStatus);
+
+                BOOL status = GetQueuedCompletionStatus(
+                    GlobalCompletionPort,
+                    &numBytes,
+                    (PULONG_PTR)&key,
+                    &pOverlapped,
+                    cpThreadWait
+                    );
+
+                if (status == 0)
+                    errorCode = GetLastError();
+            }
+        }
+        else
+        {
+            QueuedStatus *CompletionStatus = (QueuedStatus*)lpArgs;
+            numBytes = CompletionStatus->numBytes;
+            key = (size_t)CompletionStatus->key;
+            pOverlapped = CompletionStatus->pOverlapped;
+            errorCode = CompletionStatus->errorCode;
+            delete CompletionStatus;
+            lpArgs = NULL;  // one-time deal for initial CP packet
+        }
+
+        // We fire IODequeue events whether the IO completion was retrieved in the above call to
+        // GetQueuedCompletionStatus or during an earlier call (e.g. in GateThreadStart, and passed here in lpArgs, 
+        // or in CompletionPortDispatchWorkWithinAppDomain, and passed here through StoreOverlappedInfoInThread)
+
+        // For the purposes of activity correlation we only fire ETW events here, if needed OR if not fired at a higher
+        // abstration level (e.g. ThreadpoolMgr::RegisterWaitForSingleObject)
+        // Note: we still fire the event for managed async IO, despite the fact we don't have a paired IOEnqueue event
+        // for this case. We do this to "mark" the end of the previous workitem. When we provide full support at the higher
+        // abstraction level for managed IO we can remove the IODequeues fired here
+        if (ETW_EVENT_ENABLED(MICROSOFT_WINDOWS_DOTNETRUNTIME_PROVIDER_Context, ThreadPoolIODequeue)
+                && !AreEtwIOQueueEventsSpeciallyHandled((LPOVERLAPPED_COMPLETION_ROUTINE)key) && pOverlapped != NULL)
+            FireEtwThreadPoolIODequeue(pOverlapped, (BYTE*)pOverlapped - offsetof(OverlappedDataObject, Internal), GetClrInstanceId());
+
+        bool enterRetirement;
+
+        while (true)
+        {
+            //
+            // When we reach this point, this thread is "active" but not "working."  Depending on the result of the call to GetQueuedCompletionStatus, 
+            // and the state of the rest of the IOCP threads, we need to figure out whether to de-activate (exit) this thread, retire this thread,
+            // or transition to "working."
+            //
+            oldCounts = CPThreadCounter.GetCleanCounts();
+            newCounts = oldCounts;
+            enterRetirement = false;
+
+            if (errorCode == WAIT_TIMEOUT)
+            {
+                //
+                // We timed out, and are going to try to exit or retire.
+                //
+                newCounts.NumActive--;
+
+                //
+                // We need at least one free thread, or we have no way of knowing if completions are being queued.
+                // 
+                if (newCounts.NumWorking == newCounts.NumActive)
+                {
+                    newCounts = oldCounts;
+                    newCounts.NumWorking++; //not really working, but we'll decremented it at the top
+                    if (oldCounts == CPThreadCounter.CompareExchangeCounts(newCounts, oldCounts))
+                        goto Top;
+                    else
+                        continue;
+                }
+
+                //
+                // We can't exit a thread that has pending I/O - we'll "retire" it instead.
+                //
+                if (IsIoPending())
+                {
+                    enterRetirement = true;
+                    newCounts.NumRetired++;
+                }
+            }
+            else
+            {
+                //
+                // We have work to do
+                //
+                newCounts.NumWorking++;
+            }
+
+            if (oldCounts == CPThreadCounter.CompareExchangeCounts(newCounts, oldCounts))
+                break;
+        }
+
+        if (errorCode == WAIT_TIMEOUT)
+        {
+            if (!enterRetirement)
+            {
+                goto Exit;
+            }
+            else
+            {
+                // now in "retired mode" waiting for pending io to complete
+                FireEtwIOThreadRetire_V1(newCounts.NumActive + newCounts.NumRetired, newCounts.NumRetired, GetClrInstanceId());
+
+                for (;;)
+                {
+#ifndef FEATURE_PAL
+                    if (g_fCompletionPortDrainNeeded && pThread)
+                    {
+                        // The thread is not going to process IO job now.
+                        if (!pThread->IsCompletionPortDrained())
+                        {
+                            pThread->MarkCompletionPortDrained();
+                        }
+                    }
+#endif // !FEATURE_PAL
+
+                    DWORD status = SafeWait(RetiredCPWakeupEvent,CP_THREAD_PENDINGIO_WAIT,FALSE);
+                    _ASSERTE(status == WAIT_TIMEOUT || status == WAIT_OBJECT_0);
+
+                    if (status == WAIT_TIMEOUT)
+                    {
+                        if (IsIoPending())
+                        {
+                            continue;
+                        }
+                        else
+                        {
+                            // We can now exit; decrement the retired count.
+                            while (true)
+                            {
+                                oldCounts = CPThreadCounter.GetCleanCounts();
+                                newCounts = oldCounts;
+                                newCounts.NumRetired--;
+                                if (oldCounts == CPThreadCounter.CompareExchangeCounts(newCounts, oldCounts))
+                                    break;
+                            }
+                            goto Exit;
+                        }
+                    }
+                    else
+                    {
+                        // put back into rotation -- we need a thread
+                        while (true)
+                        {
+                            oldCounts = CPThreadCounter.GetCleanCounts();
+                            newCounts = oldCounts;
+                            newCounts.NumRetired--;
+                            newCounts.NumActive++;
+                            newCounts.NumWorking++; //we're not really working, but we'll decrement this before waiting for work.
+                            if (oldCounts == CPThreadCounter.CompareExchangeCounts(newCounts, oldCounts))
+                                break;
+                        }
+                        FireEtwIOThreadUnretire_V1(newCounts.NumActive + newCounts.NumRetired, newCounts.NumRetired, GetClrInstanceId());
+                        goto Top;
+                    }
+                }
+            }
+        }
+
+        // we should not reach this point unless we have work to do
+        _ASSERTE(errorCode != WAIT_TIMEOUT && !enterRetirement);
+
+        // if we have no more free threads, start the gate thread
+        if (newCounts.NumWorking >= newCounts.NumActive)
+            EnsureGateThreadRunning();
+
+
+        // We can not assert here.  If stdin/stdout/stderr of child process are redirected based on
+        // async io, GetQueuedCompletionStatus returns when child process operates on its stdin/stdout/stderr.
+        // Parent process does not issue any ReadFile/WriteFile, and hence pOverlapped is going to be NULL.
+        //_ASSERTE(pOverlapped != NULL);
+
+        if (pOverlapped != NULL)
+        {
+            _ASSERTE(key != 0);  // should be a valid function address
+
+            if (key != 0)
+            {
+                if (GCHeap::IsGCInProgress(TRUE))
+                {
+                    //Indicate that this thread is free, and waiting on GC, not doing any user work.
+                    //This helps in threads not getting injected when some threads have woken up from the
+                    //GC event, and some have not.
+                    while (true)
+                    {
+                        oldCounts = CPThreadCounter.GetCleanCounts();
+                        newCounts = oldCounts;
+                        newCounts.NumWorking--;
+                        if (oldCounts == CPThreadCounter.CompareExchangeCounts(newCounts, oldCounts))
+                            break;
+                    }
+
+                    // GC is imminent, so wait until GC is complete before executing next request.
+                    // this reduces in-flight objects allocated right before GC, easing the GC's work
+                    GCHeap::WaitForGCCompletion(TRUE);
+
+                    while (true)
+                    {
+                        oldCounts = CPThreadCounter.GetCleanCounts();
+                        newCounts = oldCounts;
+                        newCounts.NumWorking++;
+                        if (oldCounts == CPThreadCounter.CompareExchangeCounts(newCounts, oldCounts))
+                            break;
+                    }
+
+                    if (newCounts.NumWorking >= newCounts.NumActive)
+                        EnsureGateThreadRunning();
+                }
+                else
+                {
+                    GrowCompletionPortThreadpoolIfNeeded();
+                }
+
+                {
+                    CONTRACT_VIOLATION(ThrowsViolation);
+
+                    ThreadLocaleHolder localeHolder;
+
+                    ((LPOVERLAPPED_COMPLETION_ROUTINE) key)(errorCode, numBytes, pOverlapped);
+                }
+
+                if (pThread == NULL) {
+                    pThread = GetThread();
+                }
+                if (pThread) {
+                    if (pThread->IsAbortRequested())
+                        pThread->EEResetAbort(Thread::TAR_ALL);
+                    pThread->InternalReset(FALSE);
+                }
+            }
+            else
+            {
+                // Application bug - can't do much, just ignore it
+            }
+
+        }
+
+    }   // for (;;)
+
+Exit:
+
+    oldCounts = CPThreadCounter.GetCleanCounts();
+
+    // we should never destroy or retire all IOCP threads, because then we won't have any threads to notice incoming completions.
+    _ASSERTE(oldCounts.NumActive > 0);
+
+    FireEtwIOThreadTerminate_V1(oldCounts.NumActive + oldCounts.NumRetired, oldCounts.NumRetired, GetClrInstanceId());
+
+#ifdef FEATURE_COMINTEROP
+    if (pThread) {
+        pThread->SetApartment(Thread::AS_Unknown, TRUE);
+        pThread->CoUninitialize();
+    }
+    // Couninit the worker thread
+    if (fCoInited)
+    {
+        CoUninitialize();
+    }
+#endif
+
+    if (pThread) {
+        pThread->ClearThreadCPUGroupAffinity();
+
+        DestroyThread(pThread);
+    }
+
+    return 0;
+}
+
+LPOVERLAPPED ThreadpoolMgr::CompletionPortDispatchWorkWithinAppDomain(
+    Thread* pThread,
+    DWORD* pErrorCode, 
+    DWORD* pNumBytes,
+    size_t* pKey,
+    DWORD adid)
+//
+// This function is called just after dispatching the previous BindIO callback
+// to managed code. This is a perf optimization to do a quick call to
+// GetQueuedCompletionStatus with a timeout of 0 ms. If there is work in the
+// same appdomain, dispatch it back immediately. If not, stick it in a well known
+// place, and reenter the target domain. The timeout of zero is chosen so as to
+// not delay appdomain unloads.
+//
+// Parameters:
+//   pThread    - thread whose IO completion context receives a packet that
+//                cannot be dispatched here (asserted non-NULL on that path).
+//   pErrorCode - out: S_OK, or GetLastError() when a packet for a failed IO
+//                was dequeued.
+//   pNumBytes  - out: byte count reported by GetQueuedCompletionStatus.
+//   pKey       - out: completion key reported by GetQueuedCompletionStatus.
+//   adid       - appdomain id the caller is currently running in.
+//
+// Returns the dequeued OVERLAPPED when its key is BindIoCompletionCallbackStub
+// and its overlapped data belongs to appdomain 'adid'. Returns NULL when IO
+// completion is hosted, when no packet was dequeued, or when the packet was
+// stashed in pThread via StoreOverlappedInfoInThread for later processing.
+//
+{
+    STATIC_CONTRACT_THROWS;
+    STATIC_CONTRACT_GC_NOTRIGGER;
+    STATIC_CONTRACT_MODE_ANY;
+    STATIC_CONTRACT_SO_TOLERANT;
+
+    LPOVERLAPPED lpOverlapped=NULL;
+
+    BOOL status=FALSE;
+    OVERLAPPEDDATAREF overlapped=NULL;
+    BOOL ManagedCallback=FALSE;
+
+    // Nothing to poll here when IO completion is hosted.
+    if (CLRIoCompletionHosted()) 
+    {
+        return NULL;
+    }
+
+    *pErrorCode = S_OK;
+
+    LeaveRuntimeHolder holder((size_t)GetQueuedCompletionStatus);
+
+
+    //Very Very Important!
+    //Do not change the timeout for GetQueuedCompletionStatus to a non-zero value.
+    //Selecting a non-zero value can cause the thread to block, and lead to expensive context switches.
+    //In real life scenarios, we have noticed a packet to be not available immediately, but very shortly
+    //(after few 100's of instructions), and falling back to the VM is good in that case as compared to
+    //taking a context switch. Changing the timeout to non-zero can lead to perf degrades, that are very
+    //hard to diagnose.
+
+    status = ::GetQueuedCompletionStatus(
+                 GlobalCompletionPort,
+                 pNumBytes,
+                 (PULONG_PTR)pKey,
+                 &lpOverlapped,
+                 0);
+
+    // Capture the error immediately, before any other call can overwrite it.
+    DWORD lastError = GetLastError();
+
+    if (status == 0) 
+    {          
+        if (lpOverlapped != NULL) 
+        {
+            // A packet was dequeued, but it describes a failed IO operation.
+            *pErrorCode = lastError;
+        } 
+        else 
+        {
+            // No packet was dequeued (lpOverlapped is still NULL).
+            return NULL;
+        }
+    } 
+
+    if (((LPOVERLAPPED_COMPLETION_ROUTINE) *pKey) != BindIoCompletionCallbackStub)
+    {
+        // Not a managed BindIO callback: ManagedCallback stays FALSE, so the
+        // packet is stored in the thread below.
+        //_ASSERTE(FALSE);
+    } 
+    else 
+    {
+        ManagedCallback = TRUE;
+        overlapped = ObjectToOVERLAPPEDDATAREF(OverlappedDataObject::GetOverlapped(lpOverlapped));
+    }  
+
+    if (ManagedCallback && (overlapped->GetAppDomainId() == adid)) 
+    {           
+        _ASSERTE(*pKey != 0);  // should be a valid function address
+        
+        if (*pKey ==0) 
+        {
+            //Application Bug.
+            return NULL;
+        }
+    
+    } 
+    else 
+    {
+        //Just returned back from managed code, a Thread structure should exist.
+        _ASSERTE (pThread);
+        
+        //Oops, this is an overlapped from a different appdomain (or not a managed
+        //callback at all). Stick it in the thread. We will process it later.
+
+        StoreOverlappedInfoInThread(pThread, *pErrorCode, *pNumBytes, *pKey, lpOverlapped);
+
+        lpOverlapped = NULL;        
+    }
+
+#ifndef DACCESS_COMPILE    
+    return lpOverlapped;
+#endif
+}
+
+void ThreadpoolMgr::StoreOverlappedInfoInThread(Thread* pThread, DWORD dwErrorCode, DWORD dwNumBytes, size_t key, LPOVERLAPPED lpOverlapped)
+{
+    STATIC_CONTRACT_NOTHROW;
+    STATIC_CONTRACT_GC_NOTRIGGER;
+    STATIC_CONTRACT_MODE_ANY;
+    STATIC_CONTRACT_SO_TOLERANT;
+
+    _ASSERTE(pThread);
+
+    PIOCompletionContext context;
+
+    context = (PIOCompletionContext) pThread->GetIOCompletionContext();
+
+    _ASSERTE(context);
+
+    context->ErrorCode = dwErrorCode;
+    context->numBytesTransferred = dwNumBytes;
+    context->lpOverlapped = lpOverlapped;
+    context->key = key;
+}
+
+// Decides, from a snapshot of the completion port thread counts, whether the
+// pool should gain a thread (either a new one or a woken retired one).
+// Returns TRUE only when every active thread is working, there are no
+// infrastructure threads, and no GC is in progress (the GC check is skipped
+// when there are no active threads at all). Given that:
+//   - retired threads exist            -> TRUE
+//   - no retired threads               -> TRUE if below the max limit and either
+//                                         below the min limit, or CPU utilization
+//                                         is low and enough time has passed since
+//                                         the last CP thread creation.
+BOOL ThreadpoolMgr::ShouldGrowCompletionPortThreadpool(ThreadCounter::Counts counts)
+{
+    CONTRACTL
+    {
+        GC_NOTRIGGER;
+        NOTHROW;
+        MODE_ANY;
+        SO_TOLERANT;
+    }
+    CONTRACTL_END;
+
+    // There is still an idle active thread: nothing to do.
+    if (counts.NumWorking < counts.NumActive)
+        return FALSE;
+
+    if (NumCPInfrastructureThreads != 0)
+        return FALSE;
+
+    if (counts.NumActive != 0 && GCHeap::IsGCInProgress(TRUE))
+        return FALSE;
+
+    // A retired thread can be put back into rotation.
+    if (counts.NumRetired > 0)
+        return TRUE;
+
+    if (counts.NumRetired != 0)
+        return FALSE;
+
+    // adjust limit if needed
+    if (counts.NumActive + counts.NumRetired >= MaxLimitTotalCPThreads)
+        return FALSE;
+
+    // Below the MinLimit (2*number of cpus) we grow without consulting the
+    // cpu utilization or the time of the last thread creation.
+    if (counts.NumActive < MinLimitTotalCPThreads)
+        return TRUE;
+
+    // Otherwise require low cpu utilization, and make sure that we haven't
+    // fired off a new thread since the last time we checked it.
+    if (cpuUtilization < CpuUtilizationLow &&
+        SufficientDelaySinceLastSample(LastCPThreadCreation,counts.NumActive))
+    {
+        return TRUE;
+    }
+
+    return FALSE;
+}
+
+// Adds capacity to the completion port thread pool when
+// ShouldGrowCompletionPortThreadpool says so: a retired thread is woken if
+// one exists, otherwise the counts are bumped with a compare-exchange and a
+// new completion port thread is created. If thread creation fails the counts
+// are rolled back.
+void ThreadpoolMgr::GrowCompletionPortThreadpoolIfNeeded()
+{
+    CONTRACTL
+    {
+        if (GetThread()) { GC_TRIGGERS;} else {DISABLED(GC_NOTRIGGER);}
+        NOTHROW;
+        MODE_ANY;
+    }
+    CONTRACTL_END;
+
+    for (;;)
+    {
+        ThreadCounter::Counts observed = CPThreadCounter.GetCleanCounts();
+
+        if (!ShouldGrowCompletionPortThreadpool(observed))
+            return;
+
+        if (observed.NumRetired > 0)
+        {
+            // wakeup retired thread instead
+            RetiredCPWakeupEvent->Set();
+            return;
+        }
+
+        // create a new thread.  New IOCP threads start as "active" and "working"
+        ThreadCounter::Counts desired = observed;
+        desired.NumActive++;
+        desired.NumWorking++;
+
+        // Lost the race against another update: take a fresh snapshot and re-evaluate.
+        if (!(observed == CPThreadCounter.CompareExchangeCounts(desired, observed)))
+            continue;
+
+        if (CreateCompletionPortThread(NULL))
+            return;
+
+        // if thread creation failed, we have to adjust the counts back down.
+        for (;;)
+        {
+            observed = CPThreadCounter.GetCleanCounts();
+            desired = observed;
+            desired.NumActive--;
+            desired.NumWorking--;
+            if (observed == CPThreadCounter.CompareExchangeCounts(desired, observed))
+                return;
+        }
+    }
+}
+#endif // !FEATURE_PAL
+
+// Reports whether the calling thread has IO pending.
+// On non-PAL builds this asks NtQueryInformationThread (ThreadIsIoPending) and
+// answers TRUE when the query fails, when the API could not be resolved, or
+// when the query says IO is pending. On PAL builds it always answers FALSE.
+BOOL ThreadpoolMgr::IsIoPending()
+{
+    CONTRACTL
+    {
+        NOTHROW;
+        MODE_ANY;
+        GC_NOTRIGGER;
+    }
+    CONTRACTL_END;
+
+#ifndef FEATURE_PAL
+    // Without the API we cannot tell, so assume IO is pending.
+    if (!g_pufnNtQueryInformationThread)
+        return TRUE;
+
+    ULONG pendingFlag;
+    int queryStatus = (int) g_pufnNtQueryInformationThread(GetCurrentThread(),
+                                                           ThreadIsIoPending,
+                                                           &pendingFlag,
+                                                           sizeof(pendingFlag),
+                                                           NULL);
+
+    // A failed query is treated the same as "IO pending"; pendingFlag is only
+    // examined when the query succeeded.
+    if (queryStatus < 0)
+        return TRUE;
+
+    return pendingFlag ? TRUE : FALSE;
+#else
+    return FALSE;
+#endif // !FEATURE_PAL
+}
+
+#ifndef FEATURE_PAL
+
+#ifdef _WIN64
+#pragma warning (disable : 4716)
+#else
+#pragma warning (disable : 4715)
+#endif
+
+// Takes a new sample of the idle/kernel/user CPU times and returns the busy
+// percentage (0 when no time has elapsed) relative to the previous sample held
+// in pOldInfo. pOldInfo's three time fields are overwritten with the new
+// sample, so successive calls measure successive intervals.
+//
+// When both CPU-group switches are enabled the times come from
+// CPUGroupInfo::GetSystemTimes (compiled out under FEATURE_CORECLR, leaving
+// the sample at zero); otherwise they are summed from the per-processor data
+// returned by NtQuerySystemInformation for each processor set in
+// pOldInfo->affinityMask.
+int ThreadpoolMgr::GetCPUBusyTime_NT(PROCESS_CPU_INFORMATION* pOldInfo)
+{
+    LIMITED_METHOD_CONTRACT;
+
+    // Only the three time fields of this scratch structure are used.
+    PROCESS_CPU_INFORMATION sample;
+    sample.idleTime.QuadPart   = 0;
+    sample.kernelTime.QuadPart = 0;
+    sample.userTime.QuadPart   = 0;
+
+    const bool useAllCpuGroups = CPUGroupInfo::CanEnableGCCPUGroups() && CPUGroupInfo::CanEnableThreadUseAllCpuGroups();
+
+    if (!useAllCpuGroups)
+    {
+        g_pufnNtQuerySystemInformation(SystemProcessorPerformanceInformation,
+                                       pOldInfo->usageBuffer,
+                                       pOldInfo->usageBufferSize,
+                                       NULL);
+
+        SYSTEM_PROCESSOR_PERFORMANCE_INFORMATION* perProcessor = pOldInfo->usageBuffer;
+
+        // Walk the affinity mask bit by bit; bit i selects perProcessor[i].
+        int procIndex = 0;
+        for (DWORD_PTR remainingMask = pOldInfo->affinityMask; remainingMask != 0; remainingMask >>= 1, procIndex++)
+        {
+            if ((remainingMask & 1) == 0)
+                continue;
+
+            //should be good: 1CPU 28823 years, 256CPUs 100+years
+            sample.idleTime.QuadPart   += perProcessor[procIndex].IdleTime.QuadPart;
+            sample.kernelTime.QuadPart += perProcessor[procIndex].KernelTime.QuadPart;
+            sample.userTime.QuadPart   += perProcessor[procIndex].UserTime.QuadPart;
+        }
+    }
+#if !defined(FEATURE_CORECLR)
+    else
+    {
+        FILETIME idleFileTime, kernelFileTime, userFileTime;
+
+        CPUGroupInfo::GetSystemTimes(&idleFileTime, &kernelFileTime, &userFileTime);
+        sample.idleTime.u.LowPart    = idleFileTime.dwLowDateTime;
+        sample.idleTime.u.HighPart   = idleFileTime.dwHighDateTime;
+        sample.kernelTime.u.LowPart  = kernelFileTime.dwLowDateTime;
+        sample.kernelTime.u.HighPart = kernelFileTime.dwHighDateTime;
+        sample.userTime.u.LowPart    = userFileTime.dwLowDateTime;
+        sample.userTime.u.HighPart   = userFileTime.dwHighDateTime;
+    }
+#endif
+
+    // Differences against the previous sample.
+    const __int64 userDelta   = sample.userTime.QuadPart   - pOldInfo->userTime.QuadPart;
+    const __int64 kernelDelta = sample.kernelTime.QuadPart - pOldInfo->kernelTime.QuadPart;
+    const __int64 idleDelta   = sample.idleTime.QuadPart   - pOldInfo->idleTime.QuadPart;
+
+    const __int64 totalDelta = userDelta + kernelDelta;
+    const __int64 busyDelta  = totalDelta - idleDelta;
+
+    // Preserve reading
+    pOldInfo->idleTime   = sample.idleTime;
+    pOldInfo->kernelTime = sample.kernelTime;
+    pOldInfo->userTime   = sample.userTime;
+
+    __int64 reading = (totalDelta > 0) ? ((busyDelta * 100) / totalDelta) : 0;
+
+    _ASSERTE(FitsIn<int>(reading));
+    return (int)reading;
+}
+
+#else // !FEATURE_PAL
+
+// PAL build: the measurement is delegated entirely to PAL_GetCPUBusyTime,
+// which receives the caller's previous-sample structure.
+int ThreadpoolMgr::GetCPUBusyTime_NT(PAL_IOCP_CPU_INFORMATION* pOldInfo)
+{
+    int busyReading = PAL_GetCPUBusyTime(pOldInfo);
+    return busyReading;
+}
+
+#endif // !FEATURE_PAL
+
+//
+// A timer that ticks every GATE_THREAD_DELAY milliseconds.  
+// On platforms that support it, we use a coalescable waitable timer object.
+// For other platforms, we use Sleep, via __SwitchToThread.
+//
+// On non-PAL builds an instance owns the waitable timer handle it creates and
+// closes it in its destructor, so instances must not be copied (a copy would
+// close the same handle twice). Copying is therefore disabled.
+//
+class GateThreadTimer
+{
+#ifndef FEATURE_PAL
+    // Waitable timer handle, or NULL when the waitable timer APIs are not
+    // available or the timer could not be created/armed.
+    HANDLE m_hTimer;
+
+    // Declared but intentionally not implemented: the handle has a single owner.
+    GateThreadTimer(const GateThreadTimer&);
+    GateThreadTimer& operator=(const GateThreadTimer&);
+
+public:
+    // Tries to create and arm a periodic waitable timer. On any failure
+    // m_hTimer is left NULL and Wait() falls back to sleeping.
+    GateThreadTimer()
+        : m_hTimer(NULL)
+    {
+        CONTRACTL
+        {
+            NOTHROW;
+            MODE_PREEMPTIVE;
+        }
+        CONTRACTL_END;
+
+        if (g_pufnCreateWaitableTimerEx && g_pufnSetWaitableTimerEx)
+        {
+            m_hTimer = g_pufnCreateWaitableTimerEx(NULL, NULL, 0, TIMER_ALL_ACCESS);
+            if (m_hTimer)
+            {
+                //
+                // Set the timer to fire GATE_THREAD_DELAY milliseconds from now, then every GATE_THREAD_DELAY milliseconds thereafter.
+                // We also set the tolerance to GATE_THREAD_DELAY_TOLERANCE, allowing the OS to coalesce this timer.
+                //
+                LARGE_INTEGER dueTime;
+                dueTime.QuadPart = MILLI_TO_100NANO(-(LONGLONG)GATE_THREAD_DELAY); //negative value indicates relative time
+                if (!g_pufnSetWaitableTimerEx(m_hTimer, &dueTime, GATE_THREAD_DELAY, NULL, NULL, NULL, GATE_THREAD_DELAY_TOLERANCE))
+                {
+                    // Could not arm the timer: release it and use the sleep fallback.
+                    CloseHandle(m_hTimer);
+                    m_hTimer = NULL;
+                }
+            }
+        }
+    }
+
+    // Releases the waitable timer, if one was created.
+    ~GateThreadTimer()
+    {
+        CONTRACTL
+        {
+            NOTHROW;
+            MODE_PREEMPTIVE;
+        }
+        CONTRACTL_END;
+
+        if (m_hTimer)
+        {
+            CloseHandle(m_hTimer);
+            m_hTimer = NULL;
+        }
+    }
+
+#endif // !FEATURE_PAL
+
+public:
+    // Blocks until the next tick: waits on the waitable timer when there is
+    // one, otherwise sleeps for GATE_THREAD_DELAY via __SwitchToThread.
+    void Wait()
+    {
+        CONTRACTL
+        {
+            NOTHROW;
+            MODE_PREEMPTIVE;
+        }
+        CONTRACTL_END;
+
+#ifndef FEATURE_PAL
+        if (m_hTimer)
+            WaitForSingleObject(m_hTimer, INFINITE);
+        else
+#endif // !FEATURE_PAL
+            __SwitchToThread(GATE_THREAD_DELAY, CALLER_LIMITS_SPINNING);
+    }
+};
+
+
+// Thread procedure of the gate thread. Once per GateThreadTimer tick it:
+//   1. samples CPU utilization into 'cpuUtilization';
+//   2. (non-PAL) if every active completion port thread is working, polls the
+//      completion port and, when a packet is waiting, creates a new completion
+//      port thread to handle it; or wakes a retired thread when CPU is low;
+//   3. if worker starvation detection is enabled and requests have been
+//      pending too long, raises the worker MaxWorking goal by one.
+// The loop runs until ShouldGateThreadKeepRunning() returns false.
+// lpArgs is not used. Always returns 0.
+DWORD __stdcall ThreadpoolMgr::GateThreadStart(LPVOID lpArgs)
+{
+    ClrFlsSetThreadType (ThreadType_Gate);
+
+    CONTRACTL
+    {
+        NOTHROW;
+        GC_TRIGGERS;
+        MODE_PREEMPTIVE;
+        SO_INTOLERANT;
+    }
+    CONTRACTL_END;
+
+    // The gate thread is only needed if the CLR is providing part of the ThreadPool implementation.
+    _ASSERTE(!CLRThreadpoolHosted() || !CLRIoCompletionHosted());
+
+    _ASSERTE(GateThreadStatus == GATE_THREAD_STATUS_REQUESTED);
+
+    GateThreadTimer timer;
+
+    // TODO: do we need to do this?
+    timer.Wait(); // delay getting initial CPU reading
+
+#ifndef FEATURE_PAL
+    PROCESS_CPU_INFORMATION prevCPUInfo;
+
+    // CPU sampling below goes through NtQuerySystemInformation; give up if it is missing.
+    if (!g_pufnNtQuerySystemInformation)
+    {
+        _ASSERT(!"NtQuerySystemInformation API not available!");
+        return 0;
+    }
+
+    //GateThread can start before EESetup, so ensure CPU group information is initialized;
+    CPUGroupInfo::EnsureInitialized();
+
+    // initialize CPU usage information structure;
+    prevCPUInfo.idleTime.QuadPart   = 0;
+    prevCPUInfo.kernelTime.QuadPart = 0;
+    prevCPUInfo.userTime.QuadPart   = 0;
+
+    PREFIX_ASSUME(NumberOfProcessors < 65536);
+    prevCPUInfo.numberOfProcessors = NumberOfProcessors;
+
+    /* In following cases, affinity mask can be zero
+     * 1. hosted, the hosted process already uses multiple cpu groups.
+     *    thus, during CLR initialization, GetCurrentProcessCpuCount() returns 64, and GC threads
+     *    are created to fill up the initial CPU group. ==> use g_SystemInfo.dwNumberOfProcessors
+     * 2. GCCpuGroups=1, CLR creates GC threads for all processors in all CPU groups
+     *    thus, the threadpool thread would use a whole CPU group (if Thread_UseAllCpuGroups is not set).
+     *    ==> use g_SystemInfo.dwNumberOfProcessors.
+     * 3. !defined(FEATURE_PAL) but defined(FEATURE_CORESYSTEM), GetCurrentProcessCpuCount()
+     *    returns g_SystemInfo.dwNumberOfProcessors ==> use g_SystemInfo.dwNumberOfProcessors;
+     * Other cases:
+     * 1. Normal case: the mask is all or a subset of all processors in a CPU group;
+     * 2. GCCpuGroups=1 && Thread_UseAllCpuGroups = 1, the mask is not used
+     */
+    prevCPUInfo.affinityMask = GetCurrentProcessCpuMask();
+    if (prevCPUInfo.affinityMask == 0) 
+    {   // create a mask that has g_SystemInfo.dwNumberOfProcessors low bits set
+        DWORD_PTR mask = 0, maskpos = 1;
+        for (unsigned int i=0; i < g_SystemInfo.dwNumberOfProcessors; i++)
+        {
+             mask |= maskpos;
+             maskpos <<= 1;
+        }
+        prevCPUInfo.affinityMask = mask;
+    }
+
+    // in some cases GetCurrentProcessCpuCount() returns a number larger than
+    // g_SystemInfo.dwNumberOfProcessor when there are CPU groups, use the larger
+    // one to create buffer. This buffer must be cleared with 0's to get correct
+    // CPU usage statistics
+    int elementsNeeded = NumberOfProcessors > g_SystemInfo.dwNumberOfProcessors ?
+                                                  NumberOfProcessors : g_SystemInfo.dwNumberOfProcessors;
+    // Overflow-checked computation of the buffer size in bytes.
+    if (!ClrSafeInt<int>::multiply(elementsNeeded, sizeof(SYSTEM_PROCESSOR_PERFORMANCE_INFORMATION), 
+                                                  prevCPUInfo.usageBufferSize))
+        return 0;
+
+    // The buffer is stack-allocated, so it stays valid for the rest of this function.
+    prevCPUInfo.usageBuffer = (SYSTEM_PROCESSOR_PERFORMANCE_INFORMATION *)alloca(prevCPUInfo.usageBufferSize);
+    if (prevCPUInfo.usageBuffer == NULL)
+        return 0;
+
+    memset((void *)prevCPUInfo.usageBuffer, 0, prevCPUInfo.usageBufferSize); //must clear it with 0s
+
+    // Prime prevCPUInfo with a first sample; the return value is ignored.
+    GetCPUBusyTime_NT(&prevCPUInfo);
+#else // !FEATURE_PAL
+    PAL_IOCP_CPU_INFORMATION prevCPUInfo;
+    GetCPUBusyTime_NT(&prevCPUInfo);                  // ignore return value the first time
+#endif // !FEATURE_PAL
+    
+    // Set after a sample taken while a GC was in progress; makes the following
+    // sample subject to the same low-utilization floor.
+    BOOL IgnoreNextSample = FALSE;
+
+    do
+    {
+        timer.Wait();
+
+        if(CLRConfig::GetConfigValue(CLRConfig::INTERNAL_ThreadPool_EnableWorkerTracking))
+            FireEtwThreadPoolWorkingThreadCount(TakeMaxWorkingThreadCount(), GetClrInstanceId());
+
+#ifdef DEBUGGING_SUPPORTED
+        // if we are stopped at a debug breakpoint, go back to sleep
+        // ('continue' in a do/while jumps to the loop condition below)
+        if (CORDebuggerAttached() && g_pDebugInterface->IsStopped())
+            continue;
+#endif // DEBUGGING_SUPPORTED
+
+        // While the runtime is paused, block until the resume event is signaled.
+        if(g_IsPaused)
+        {
+            _ASSERTE(g_ClrResumeEvent.IsValid());
+            EX_TRY {
+                g_ClrResumeEvent.Wait(INFINITE, TRUE);
+            }
+            EX_CATCH {
+                // Assert on debug builds 
+                _ASSERTE(FALSE);
+            }
+            EX_END_CATCH(SwallowAllExceptions);
+        }
+
+        // Sample CPU utilization. A sample taken during a GC, and the one right
+        // after it, is never allowed to report a value at or below CpuUtilizationLow.
+        if (!GCHeap::IsGCInProgress(FALSE) )
+        {
+            if (IgnoreNextSample)
+            {
+                IgnoreNextSample = FALSE;
+                int cpuUtilizationTemp = GetCPUBusyTime_NT(&prevCPUInfo);            // updates prevCPUInfo as side effect
+                // don't artificially drive down average if cpu is high
+                if (cpuUtilizationTemp <= CpuUtilizationLow)
+                    cpuUtilization = CpuUtilizationLow + 1;
+                else
+                    cpuUtilization = cpuUtilizationTemp;
+            }
+            else
+            {
+                cpuUtilization = GetCPUBusyTime_NT(&prevCPUInfo);            // updates prevCPUInfo as side effect
+            }
+        }
+        else
+        {
+            int cpuUtilizationTemp = GetCPUBusyTime_NT(&prevCPUInfo);            // updates prevCPUInfo as side effect
+            // don't artificially drive down average if cpu is high
+            if (cpuUtilizationTemp <= CpuUtilizationLow)
+                cpuUtilization = CpuUtilizationLow + 1;
+            else
+                cpuUtilization = cpuUtilizationTemp;
+            IgnoreNextSample = TRUE;
+        }
+
+#ifndef FEATURE_PAL
+        // don't mess with CP thread pool settings if not initialized yet
+        if (InitCompletionPortThreadpool)
+        {
+            _ASSERTE (!CLRIoCompletionHosted());
+
+            ThreadCounter::Counts oldCounts, newCounts;
+            oldCounts = CPThreadCounter.GetCleanCounts();
+
+            // Every active thread is working, none are retired and there is room
+            // to grow: check whether a completion packet is waiting unserviced.
+            if (oldCounts.NumActive == oldCounts.NumWorking &&
+                oldCounts.NumRetired == 0 &&
+                oldCounts.NumActive < MaxLimitTotalCPThreads &&
+                !g_fCompletionPortDrainNeeded &&
+                NumCPInfrastructureThreads == 0 &&       // infrastructure threads count as "to be free as needed"
+                !GCHeap::IsGCInProgress(TRUE))
+
+            {
+                BOOL status;
+                DWORD numBytes;
+                size_t key;
+                LPOVERLAPPED pOverlapped;
+                DWORD errorCode;
+
+                errorCode = S_OK;
+
+                status = GetQueuedCompletionStatus(
+                            GlobalCompletionPort,
+                            &numBytes,
+                            (PULONG_PTR)&key,
+                            &pOverlapped,
+                            0 // immediate return
+                            );
+
+                if (status == 0)
+                {
+                    errorCode = GetLastError();
+                }
+
+                if(pOverlapped == &overlappedForContinueCleanup)
+                {
+                    // if we picked up a "Continue Drainage" notification DO NOT create a new CP thread
+                }
+                else 
+                if (errorCode != WAIT_TIMEOUT)
+                {
+                    // The poll did not time out: hand the dequeued packet to a
+                    // newly created completion port thread.
+                    QueuedStatus *CompletionStatus = NULL;
+
+                    // loop, retrying until memory is allocated.  Under such conditions the gate
+                    // thread is not useful anyway, so I feel comfortable with this behavior
+                    do
+                    {
+                        // make sure to free mem later in thread
+                        CompletionStatus = new (nothrow) QueuedStatus;
+                        if (CompletionStatus == NULL)
+                        {
+                            __SwitchToThread(GATE_THREAD_DELAY, CALLER_LIMITS_SPINNING);
+                        }
+                    }
+                    while (CompletionStatus == NULL);
+
+                    CompletionStatus->numBytes = numBytes;
+                    CompletionStatus->key = (PULONG_PTR)key;
+                    CompletionStatus->pOverlapped = pOverlapped;
+                    CompletionStatus->errorCode = errorCode;
+
+                    // IOCP threads are created as "active" and "working"
+                    while (true)
+                    {
+                        oldCounts = CPThreadCounter.GetCleanCounts();
+                        newCounts = oldCounts;
+                        newCounts.NumActive++;
+                        newCounts.NumWorking++;
+                        if (oldCounts == CPThreadCounter.CompareExchangeCounts(newCounts, oldCounts))
+                            break;
+                    }
+
+                    // loop, retrying until thread is created.
+                    while (!CreateCompletionPortThread((LPVOID)CompletionStatus))
+                    {
+                        __SwitchToThread(GATE_THREAD_DELAY, CALLER_LIMITS_SPINNING);
+                    }
+                }
+            }
+            else if (cpuUtilization < CpuUtilizationLow)
+            {
+                // this could be an indication that threads might be getting blocked or there is no work
+                if (oldCounts.NumWorking == oldCounts.NumActive &&                // don't bump the limit if there are already free threads
+                    oldCounts.NumRetired > 0) 
+                {
+                    RetiredCPWakeupEvent->Set();
+                }
+            }
+        }
+#endif // !FEATURE_PAL
+
+        // Worker thread starvation detection (skipped when the thread pool is
+        // hosted or the detection is disabled through configuration).
+        if (!CLRThreadpoolHosted() &&
+            (0 == CLRConfig::GetConfigValue(CLRConfig::INTERNAL_ThreadPool_DisableStarvationDetection)))
+        {
+            if (PerAppDomainTPCountList::AreRequestsPendingInAnyAppDomains() && SufficientDelaySinceLastDequeue())
+            {
+                DangerousNonHostedSpinLockHolder tal(&ThreadAdjustmentLock);
+
+                ThreadCounter::Counts counts = WorkerCounter.GetCleanCounts();
+                while (counts.NumActive < MaxLimitTotalWorkerThreads && //don't add a thread if we're at the max
+                       counts.NumActive >= counts.MaxWorking)            //don't add a thread if we're already in the process of adding threads
+                {
+                    bool breakIntoDebugger = (0 != CLRConfig::GetConfigValue(CLRConfig::INTERNAL_ThreadPool_DebugBreakOnWorkerStarvation));
+                    if (breakIntoDebugger)
+                    {
+                        OutputDebugStringW(W("The CLR ThreadPool detected work queue starvation!"));
+                        DebugBreak();
+                    }
+
+                    // Raise the working-thread goal to one more than the current active count.
+                    ThreadCounter::Counts newCounts = counts;
+                    newCounts.MaxWorking = newCounts.NumActive + 1;
+
+                    ThreadCounter::Counts oldCounts = WorkerCounter.CompareExchangeCounts(newCounts, counts);
+                    if (oldCounts == counts)
+                    {
+                        HillClimbingInstance.ForceChange(newCounts.MaxWorking, Starvation);
+                        MaybeAddWorkingWorker();
+                        break;
+                    }
+                    else
+                    {
+                        // The counts changed underneath us; retry with the values just observed.
+                        counts = oldCounts;
+                    }
+                }
+            }
+        }
+    }
+    while (ShouldGateThreadKeepRunning());
+
+    return 0;
+}
+
+// called by logic to spawn a new completion port thread.
+// return false if not enough time has elapsed since the last
+// time we sampled the cpu utilization.
+//
+// The required delay is GATE_THREAD_DELAY milliseconds. When throttleRate is
+// positive, the delay is multiplied by (1 + throttleRate) for every thread
+// beyond NumberOfProcessors, and saturates at the largest unsigned value
+// rather than overflowing.
+//
+// Returns TRUE when strictly more than the required delay has elapsed since
+// LastThreadCreationTime (a GetTickCount value; wrap-around is handled by
+// unsigned subtraction).
+BOOL ThreadpoolMgr::SufficientDelaySinceLastSample(unsigned int LastThreadCreationTime,
+                                                   unsigned NumThreads,   // total number of threads of that type (worker or CP)
+                                                   double    throttleRate // the delay is increased by this percentage for each extra thread
+                                                   )
+{
+    LIMITED_METHOD_CONTRACT;
+
+    unsigned dwCurrentTickCount =  GetTickCount();
+
+    unsigned delaySinceLastThreadCreation = dwCurrentTickCount - LastThreadCreationTime;
+
+    unsigned minWaitBetweenThreadCreation =  GATE_THREAD_DELAY;
+
+    if (throttleRate > 0.0)
+    {
+        _ASSERTE(throttleRate <= 1.0);
+
+        unsigned adjustedThreadCount = NumThreads > NumberOfProcessors ? (NumThreads - NumberOfProcessors) : 0;
+
+        // the amount of time to wait should grow up as the number of threads is increased
+        double scaledWait = GATE_THREAD_DELAY * pow((1.0 + throttleRate),(double)adjustedThreadCount);
+
+        // Converting a double that does not fit in 'unsigned' is undefined
+        // behavior, and the exponential above can exceed that range with a
+        // large thread count, so saturate instead.
+        const unsigned maxWait = ~0u;
+        if (scaledWait >= (double)maxWait)
+            minWaitBetweenThreadCreation = maxWait;
+        else
+            minWaitBetweenThreadCreation = (unsigned) scaledWait;
+    }
+
+    return (delaySinceLastThreadCreation > minWaitBetweenThreadCreation);
+
+}
+
+
+// Used when deciding whether to spawn new worker threads: returns true when
+// the time since the last dequeue (LastDequeueTime) exceeds a threshold.
+// With low cpu utilization the threshold is GATE_THREAD_DELAY; otherwise it is
+// DEQUEUE_DELAY_THRESHOLD multiplied by the worker counter's MaxWorking value.
+BOOL ThreadpoolMgr::SufficientDelaySinceLastDequeue()
+{
+    LIMITED_METHOD_CONTRACT;
+
+    #define DEQUEUE_DELAY_THRESHOLD (GATE_THREAD_DELAY * 2)
+
+    const unsigned elapsedSinceDequeue = GetTickCount() - LastDequeueTime;
+
+    // Low-utilization default; replaced below when the cpu is busier.
+    unsigned threshold = GATE_THREAD_DELAY;
+
+    if (cpuUtilization >= CpuUtilizationLow)
+    {
+        ThreadCounter::Counts workerCounts = WorkerCounter.GetCleanCounts();
+        unsigned workingGoal = workerCounts.MaxWorking;
+        threshold = workingGoal * DEQUEUE_DELAY_THRESHOLD;
+    }
+
+    return (elapsedSinceDequeue > threshold);
+}
+
+
+#ifdef _MSC_VER
+#ifdef _WIN64
+#pragma warning (default : 4716)
+#else
+#pragma warning (default : 4715)
+#endif
+#endif
+
+/************************************************************************/
+
+// Startup parameters that CreateTimerQueueTimer passes (by address) to
+// TimerThreadStart when it creates the timer thread.
+struct CreateTimerThreadParams {
+    CLREvent    event;            // auto event the creating thread waits on after starting the timer thread
+    BOOL        setupSucceeded;   // set to FALSE by the creator, read back after the wait; presumably set by TimerThreadStart - confirm there
+};
+
+// Creates a timer and hands it to the timer thread, starting that thread on
+// first use.
+//
+// Parameters:
+//   phNewTimer - out: receives the new timer (a TimerInfo pointer cast to
+//                HANDLE). Set to NULL if the timer could not be queued.
+//   Callback   - function stored in the timer's 'Function' field.
+//   Parameter  - stored in the timer's 'Context' field.
+//   DueTime    - stored in the timer's 'FiringTime' field.
+//   Period     - stored in the timer's 'Period' field.
+//   Flag       - stored in the timer's 'flag' field.
+//
+// Returns TRUE when the timer was queued to the timer thread. Returns FALSE
+// when the timer thread reported a failed setup or QueueUserAPC failed.
+// Throws out-of-memory when the timer thread or the TimerInfo cannot be
+// created.
+BOOL ThreadpoolMgr::CreateTimerQueueTimer(PHANDLE phNewTimer,
+                                          WAITORTIMERCALLBACK Callback,
+                                          PVOID Parameter,
+                                          DWORD DueTime,
+                                          DWORD Period,
+                                          ULONG Flag)
+{
+    CONTRACTL
+    {
+        THROWS;     // EnsureInitialized, CreateAutoEvent can throw
+        if (GetThread()) {GC_TRIGGERS;} else {DISABLED(GC_NOTRIGGER);}  // There can be calls thru ICorThreadpool
+        MODE_ANY;
+        INJECT_FAULT(COMPlusThrowOM());
+    }
+    CONTRACTL_END;
+
+    EnsureInitialized();
+
+    // For now we use just one timer thread. Consider using multiple timer threads if
+    // number of timers in the queue exceeds a certain threshold. The logic and code
+    // would be similar to the one for creating wait threads.
+    if (NULL == TimerThread)
+    {
+        CrstHolder csh(&TimerQueueCriticalSection);
+
+        // check again
+        if (NULL == TimerThread)
+        {
+            CreateTimerThreadParams params;
+            params.event.CreateAutoEvent(FALSE);
+            params.setupSucceeded = FALSE;
+
+            HANDLE TimerThreadHandle = Thread::CreateUtilityThread(Thread::StackSize_Small, TimerThreadStart, &params);
+
+            if (TimerThreadHandle == NULL)
+            {
+                params.event.CloseEvent();
+                ThrowOutOfMemory();
+            }
+
+            // Wait for the new thread to signal the event; 'params' lives on
+            // this stack frame, so we must not leave before it has done so.
+            {
+                GCX_PREEMP();
+                for(;;)
+                {
+                    // if a host throws because it couldnt allocate another thread,
+                    // just retry the wait.
+                    if (SafeWait(&params.event,INFINITE, FALSE) != WAIT_TIMEOUT)
+                        break;
+                }
+            }
+            params.event.CloseEvent();
+
+            if (!params.setupSucceeded)
+            {
+                CloseHandle(TimerThreadHandle);
+                return FALSE;
+            }
+
+            TimerThread = TimerThreadHandle;
+        }
+
+    }
+
+
+    NewHolder<TimerInfo> timerInfoHolder;
+    TimerInfo * timerInfo = new (nothrow) TimerInfo;
+    *phNewTimer = (HANDLE) timerInfo;
+
+    if (NULL == timerInfo)
+        ThrowOutOfMemory();
+
+    timerInfoHolder.Assign(timerInfo);
+
+    timerInfo->FiringTime = DueTime;
+    timerInfo->Function = Callback;
+    timerInfo->Context = Parameter;
+    timerInfo->Period = Period;
+    timerInfo->state = 0;
+    timerInfo->flag = Flag;
+    timerInfo->ExternalCompletionEvent = INVALID_HANDLE;
+    timerInfo->ExternalEventSafeHandle = NULL;
+    timerInfo->handleOwningAD = (ADID) 0;
+
+    BOOL status = QueueUserAPC((PAPCFUNC)InsertNewTimer,TimerThread,(size_t)timerInfo);
+    if (FALSE == status)
+    {
+        // The holder frees timerInfo on return, so do not leave the caller
+        // with a handle that points at freed memory.
+        *phNewTimer = NULL;
+        return FALSE;
+    }
+
+    // The timer thread now owns timerInfo.
+    timerInfoHolder.SuppressRelease();
+    return TRUE;
+}
+
+#ifdef _MSC_VER
+#ifdef _WIN64
+#pragma warning (disable : 4716)
+#else
+#pragma warning (disable : 4715)
+#endif
+#endif
+DWORD __stdcall ThreadpoolMgr::TimerThreadStart(LPVOID p)   // timer thread entry point; p is a CreateTimerThreadParams*
+{
+    ClrFlsSetThreadType (ThreadType_Timer);
+
+    STATIC_CONTRACT_THROWS;
+    STATIC_CONTRACT_GC_TRIGGERS;        // due to SetApartment
+    STATIC_CONTRACT_MODE_PREEMPTIVE;
+    STATIC_CONTRACT_SO_INTOLERANT;
+    /* cannot use contract because of SEH
+    CONTRACTL
+    {
+        NOTHROW;
+        GC_NOTRIGGER;
+        MODE_PREEMPTIVE;
+    }
+    CONTRACTL_END;*/
+
+    CreateTimerThreadParams* params = (CreateTimerThreadParams*)p;
+
+    Thread* pThread = SetupThreadNoThrow();
+    // Publish the setup result first, then wake the creator waiting on params->event.
+    params->setupSucceeded = (pThread == NULL) ? 0 : 1;
+    params->event.Set();
+    // params is not used past this point; it is a local of CreateTimerQueueTimer.
+    if (pThread == NULL)
+        return 0;
+
+    pTimerThread = pThread;
+    // Timer threads never die
+
+    LastTickCount = GetTickCount();     // baseline for the first FireTimers sweep
+
+#ifdef FEATURE_COMINTEROP
+    if (pThread->SetApartment(Thread::AS_InMTA, TRUE) != Thread::AS_InMTA)
+    {
+        // @todo: should we log the failure
+        goto Exit;
+    }
+#endif // FEATURE_COMINTEROP
+
+    for (;;)    // never exits: each pass fires the due timers, then sleeps alertably
+    {
+         // moved to its own function since EX_TRY consumes stack
+#ifdef _MSC_VER
+#pragma inline_depth (0) // the function containing EX_TRY can't be inlined here
+#endif
+        TimerThreadFire();
+#ifdef _MSC_VER
+#pragma inline_depth (20)
+#endif
+    }
+
+#ifdef FEATURE_COMINTEROP
+// unreachable code
+//    if (pThread) {
+//        pThread->SetApartment(Thread::AS_Unknown, TRUE);
+//    }
+Exit:
+    // Reached only through the "goto Exit" taken when SetApartment did not yield AS_InMTA.
+    // @todo: replace with host provided ExitThread
+    return 0;
+#endif
+}
+
+void ThreadpoolMgr::TimerThreadFire()   // one pass of the timer thread loop: fire due timers, then sleep
+{
+    CONTRACTL
+    {
+        THROWS;
+        GC_TRIGGERS;
+        MODE_PREEMPTIVE;
+    }
+    CONTRACTL_END;
+
+    EX_TRY {
+        DWORD timeout = FireTimers();   // interval to the next firing time; (DWORD) -1 if FireTimers found none
+        // SleepEx is redefined to Dont_Use_SleepEx right below; the real API is exposed for this call only.
+#undef SleepEx
+        SleepEx(timeout, TRUE);         // TRUE = alertable, so APCs queued to this thread run here
+#define SleepEx(a,b) Dont_Use_SleepEx(a,b)
+
+        // the thread could wake up either because an APC completed or the sleep timeout
+        // in both case, we need to sweep the timer queue, firing timers, and readjusting
+        // the next firing time
+
+    }
+    EX_CATCH {
+        // Assert on debug builds since a dead timer thread is a fatal error
+        _ASSERTE(FALSE);
+        if (SwallowUnhandledExceptions())
+        {
+            // Do nothing to swallow the exception
+        }
+        else
+        {
+            EX_RETHROW;
+        }
+    }
+    EX_END_CATCH(SwallowAllExceptions);
+}
+
+#ifdef _MSC_VER
+#ifdef _WIN64
+#pragma warning (default : 4716)
+#else
+#pragma warning (default : 4715)
+#endif
+#endif
+
+// APC routine run on the timer thread: completes the registration of a timer
+// that CreateTimerQueueTimer queued.
+void ThreadpoolMgr::InsertNewTimer(TimerInfo* pArg)
+{
+    CONTRACTL
+    {
+        NOTHROW;
+        GC_TRIGGERS;
+        MODE_ANY;
+    }
+    CONTRACTL_END;
+    STATIC_CONTRACT_SO_INTOLERANT;
+
+    _ASSERTE(pArg);
+    TimerInfo * pNewTimer = pArg;
+
+    // The timer was already marked deleted before it got registered: dispose
+    // of it instead of registering it.
+    if ((pNewTimer->state & TIMER_DELETE) != 0)
+    {
+        DeleteTimer(pNewTimer);
+        return;
+    }
+
+    DWORD tickNow = GetTickCount();
+
+    // A due time of (ULONG) -1 registers the timer without putting it in the queue.
+    const bool hasDueTime = (pNewTimer->FiringTime != (ULONG) -1);
+
+    if (hasDueTime)
+    {
+        // FiringTime arrives holding the relative due time; make it absolute.
+        pNewTimer->FiringTime += tickNow;
+    }
+
+    pNewTimer->state = hasDueTime ? (TIMER_REGISTERED | TIMER_ACTIVE) : TIMER_REGISTERED;
+    pNewTimer->refCount = 1;
+
+    if (hasDueTime)
+    {
+        // insert the timer in the queue
+        InsertTailList(&TimerQueue,(&pNewTimer->link));
+    }
+}
+
+
+// Executed by the timer thread.
+// Sweeps the timer queue: for every expired timer an AsyncTimerCallbackCompletion
+// work item is queued and the next firing time is set (one-shot timers are taken
+// off the queue). Returns the shortest interval until a timer is due again, or
+// (DWORD) -1 if the sweep found nothing to wait for.
+// Anything QueueUserWorkItem throws is rethrown, except out-of-memory, which is
+// swallowed; the affected timer stays expired and is retried on the next sweep.
+DWORD ThreadpoolMgr::FireTimers()
+{
+    CONTRACTL
+    {
+        THROWS;     // QueueUserWorkItem can throw
+        if (GetThread()) { GC_TRIGGERS;} else {DISABLED(GC_NOTRIGGER);}
+        if (GetThread()) { MODE_PREEMPTIVE;} else { DISABLED(MODE_ANY);}
+    }
+    CONTRACTL_END;
+
+    DWORD currentTime = GetTickCount();
+    DWORD nextFiringInterval = (DWORD) -1;
+    TimerInfo* timerInfo = NULL;
+    
+    EX_TRY 
+    {
+        for (LIST_ENTRY* node = (LIST_ENTRY*) TimerQueue.Flink;
+             node != &TimerQueue;
+            )
+        {
+            timerInfo = (TimerInfo*) node;
+            // advance before the current entry can be unlinked by DeactivateTimer
+            node = (LIST_ENTRY*) node->Flink;
+
+            if (TimeExpired(LastTickCount, currentTime, timerInfo->FiringTime))
+            {
+                // one-shot timers (period 0 or -1) leave the queue once they fire
+                if (timerInfo->Period == 0 || timerInfo->Period == (ULONG) -1)
+                {
+                    DeactivateTimer(timerInfo);
+                }
+
+                // reference held on behalf of the work item queued below
+                InterlockedIncrement(&timerInfo->refCount);
+
+                QueueUserWorkItem(AsyncTimerCallbackCompletion,
+                                  timerInfo,
+                                  QUEUE_ONLY /* TimerInfo take care of deleting*/);
+
+                timerInfo->FiringTime = currentTime+timerInfo->Period;
+
+                if ((timerInfo->Period != 0) && (timerInfo->Period != (ULONG) -1) && (nextFiringInterval > timerInfo->Period))
+                    nextFiringInterval = timerInfo->Period;
+            }
+
+            else
+            {
+                DWORD firingInterval = TimeInterval(timerInfo->FiringTime,currentTime);
+                if (firingInterval < nextFiringInterval)
+                    nextFiringInterval = firingInterval;
+            }
+        }
+    } 
+    EX_CATCH 
+    {
+        // If QueueUserWorkItem throws OOM, swallow the exception and retry on
+        // the next call to FireTimers(), otherwise rethrow.
+        Exception *ex = GET_EXCEPTION();
+
+        if (timerInfo != NULL)
+        {
+            // drop the reference taken for the work item that was never queued
+            InterlockedDecrement(&timerInfo->refCount);
+
+            // Undo DeactivateTimer(), but only if it actually ran for this timer.
+            // A periodic timer is still linked in the queue; inserting it a second
+            // time would corrupt the list. All other state bits (TIMER_REGISTERED
+            // in particular) must survive the undo.
+            if (!(timerInfo->state & TIMER_ACTIVE))
+            {
+                timerInfo->state |= TIMER_ACTIVE;
+                InsertTailList(&TimerQueue, (&timerInfo->link));
+            }
+        }
+
+        if (ex->GetHR() != E_OUTOFMEMORY)
+        {
+           EX_RETHROW;
+        }
+    }
+    EX_END_CATCH(RethrowTerminalExceptions);
+
+    LastTickCount = currentTime;
+
+    return nextFiringInterval;
+}
+
+// Work item queued by FireTimers for an expired timer. pArgs is the TimerInfo;
+// the timer's callback is invoked and the reference FireTimers took is released.
+// Returns ERROR_SUCCESS, or the HRESULT from SetupThreadNoThrow if no Thread
+// could be set up for the calling thread.
+DWORD __stdcall ThreadpoolMgr::AsyncTimerCallbackCompletion(PVOID pArgs)
+{
+    CONTRACTL
+    {
+        THROWS;
+        GC_TRIGGERS;
+        MODE_PREEMPTIVE;
+        SO_TOLERANT;
+    }
+    CONTRACTL_END;
+
+    Thread* pThread = GetThread();
+
+    // A thread that has no Thread object yet is set up as a threadpool worker.
+    if (NULL == pThread)
+    {
+        HRESULT hrSetup = ERROR_SUCCESS;
+
+        ClrFlsSetThreadType(ThreadType_Threadpool_Worker);
+        pThread = SetupThreadNoThrow(&hrSetup);
+
+        if (NULL == pThread)
+            return hrSetup;
+    }
+
+    BEGIN_SO_INTOLERANT_CODE(pThread);
+    {
+        TimerInfo* pFiredTimer = (TimerInfo*) pArgs;
+
+        WAITORTIMERCALLBACKFUNC pfnCallback = (WAITORTIMERCALLBACKFUNC) pFiredTimer->Function;
+        pfnCallback(pFiredTimer->Context, TRUE);
+
+        // Whoever drops the last reference is responsible for deleting the timer.
+        if (0 == InterlockedDecrement(&pFiredTimer->refCount))
+        {
+            DeleteTimer(pFiredTimer);
+        }
+    }
+    END_SO_INTOLERANT_CODE;
+
+    return ERROR_SUCCESS;
+}
+
+
+// Cancels a timer by unlinking it from the timer queue and clearing its
+// TIMER_ACTIVE bit. Callbacks queued earlier may still be outstanding.
+void ThreadpoolMgr::DeactivateTimer(TimerInfo* timerInfo)
+{
+    LIMITED_METHOD_CONTRACT;
+
+    LIST_ENTRY* pEntry = (LIST_ENTRY*) timerInfo;
+    RemoveEntryList(pEntry);
+
+    // Reset the link to a self-referencing state: the TimerInfo may later be
+    // chained onto another list of timer infos waiting to be released.
+    InitializeListHead(&timerInfo->link);
+    timerInfo->state &= ~TIMER_ACTIVE;
+}
+
+// Work item that DeleteTimer queues from the timer thread so the deletion is
+// finished by another thread. pArgs is the TimerInfo to delete.
+// Returns ERROR_SUCCESS, or the HRESULT from SetupThreadNoThrow if no Thread
+// could be set up for the calling thread.
+DWORD __stdcall ThreadpoolMgr::AsyncDeleteTimer(PVOID pArgs)
+{
+    CONTRACTL
+    {
+        THROWS;
+        MODE_PREEMPTIVE;
+        GC_TRIGGERS;
+    }
+    CONTRACTL_END;
+
+    Thread * pThread = GetThread();
+
+    // A thread that has no Thread object yet is set up as a threadpool worker.
+    if (NULL == pThread)
+    {
+        HRESULT hrSetup = ERROR_SUCCESS;
+
+        ClrFlsSetThreadType(ThreadType_Threadpool_Worker);
+        pThread = SetupThreadNoThrow(&hrSetup);
+
+        if (NULL == pThread)
+            return hrSetup;
+    }
+
+    TimerInfo* pDoomedTimer = (TimerInfo*) pArgs;
+    DeleteTimer(pDoomedTimer);
+
+    return ERROR_SUCCESS;
+}
+
+void ThreadpoolMgr::DeleteTimer(TimerInfo* timerInfo)   // final teardown of a timer that is no longer active
+{
+    CONTRACTL
+    {
+        if (GetThread() == pTimerThread) { NOTHROW; } else { THROWS; }
+        GC_TRIGGERS;
+        MODE_ANY;
+    }
+    CONTRACTL_END;
+    // Signals the completion event (if any), releases what the timer holds and frees it; on the timer thread that work is handed off.
+    _ASSERTE((timerInfo->state & TIMER_ACTIVE) == 0);
+
+    _ASSERTE(!(timerInfo->flag & WAIT_FREE_CONTEXT));
+
+    if (timerInfo->flag & WAIT_INTERNAL_COMPLETION)     // flag is set by DeleteTimerQueueTimer for a blocking delete
+    {
+        timerInfo->InternalCompletionEvent.Set();
+        return; // the timerInfo will be deleted by the thread that's waiting on InternalCompletionEvent
+    }
+
+    // ExternalCompletionEvent comes from Host, ExternalEventSafeHandle from managed code.
+    // They are mutually exclusive.
+    _ASSERTE(!(timerInfo->ExternalCompletionEvent != INVALID_HANDLE && 
+                        timerInfo->ExternalEventSafeHandle != NULL));
+
+    if (timerInfo->ExternalCompletionEvent != INVALID_HANDLE)
+    {
+        UnsafeSetEvent(timerInfo->ExternalCompletionEvent);
+        timerInfo->ExternalCompletionEvent = INVALID_HANDLE;    // signalled once; forget the handle
+    }
+
+    // We cannot block the timer thread, so some cleanup is deferred to other threads.
+    if (GetThread() == pTimerThread)
+    {
+        // Notify the ExternalEventSafeHandle with an user work item 
+        if (timerInfo->ExternalEventSafeHandle != NULL)
+        {
+            BOOL success = FALSE;
+            EX_TRY
+            {
+                if (QueueUserWorkItem(AsyncDeleteTimer,     // AsyncDeleteTimer calls DeleteTimer again from the worker
+                          timerInfo,
+                          QUEUE_ONLY) != FALSE)
+                {
+                    success = TRUE;
+                }
+            }
+            EX_CATCH
+            {   // deliberately empty: a failure is handled through 'success' below
+            }
+            EX_END_CATCH(SwallowAllExceptions);
+
+            // If unable to queue a user work item, fall back to queueing timer for release
+            // which will happen *sometime* in the future.
+            if (success == FALSE)
+            {
+                QueueTimerInfoForRelease(timerInfo);
+            }    
+            
+            return;
+        }
+
+        // Releasing GC handles can block. So we wont do this on the timer thread.
+        // We'll put it in a list which will be processed by a worker thread
+        if (timerInfo->Context != NULL)
+        {
+            QueueTimerInfoForRelease(timerInfo);
+            return;
+        }
+    }
+
+    // To get here we are either not the Timer thread or there is no blocking work to be done
+    
+    if (timerInfo->Context != NULL)
+    {
+        GCX_COOP();
+        DelegateInfo *pDelInfo = (DelegateInfo *)timerInfo->Context;    // Context is treated as a DelegateInfo here
+        pDelInfo->Release();
+        RecycleMemory( pDelInfo, MEMTYPE_DelegateInfo );
+    }
+
+    if (timerInfo->ExternalEventSafeHandle != NULL)
+    {
+        ReleaseTimerInfo(timerInfo);
+    }
+
+    delete timerInfo;
+    
+}
+
+// We add TimerInfos from deleted timers into a linked list published through
+// TimerInfosToBeRecycled. A worker thread will later release the handles held by the
+// TimerInfo and recycle them if possible (See DelegateInfo::MakeDelegateInfo, FlushQueueOfTimerInfos)
+void ThreadpoolMgr::QueueTimerInfoForRelease(TimerInfo *pTimerInfo)
+{
+    CONTRACTL
+    {
+        NOTHROW;
+        GC_NOTRIGGER;
+        MODE_ANY;
+    }
+    CONTRACTL_END;
+
+    // The synchronization in this method depends on the fact that
+    //  - There is only one timer thread
+    //  - The one and only timer thread is executing this method.
+    //  - This function wont go into an alertable state. That could trigger another APC.
+    // Else two threads can be queueing timerinfos and a race could
+    // lead to leaked memory and handles
+    _ASSERTE(GetThread());
+    _ASSERTE(pTimerThread == GetThread());
+    TimerInfo *pHead = NULL;
+
+    // Make sure this timer info has been deactivated and removed from any other lists
+    _ASSERTE((pTimerInfo->state & TIMER_ACTIVE) == 0);
+    //_ASSERTE(pTimerInfo->link.Blink == &(pTimerInfo->link) &&
+    //    pTimerInfo->link.Flink == &(pTimerInfo->link));
+    // Make sure "link" is the first field in TimerInfo
+    _ASSERTE(pTimerInfo == (PVOID)&pTimerInfo->link);
+
+    // Grab any previously published list (taking it leaves NULL behind, so a flusher sees nothing meanwhile)
+    if ((pHead = InterlockedExchangeT(&TimerInfosToBeRecycled, NULL)) != NULL)
+    {
+        // If there already is a list, just append
+        InsertTailList((LIST_ENTRY *)pHead, &pTimerInfo->link);
+        pTimerInfo = pHead;     // the existing head is what gets published again
+    }
+    else
+        // If this is the head, make its next and previous ptrs point to itself
+        InitializeListHead((LIST_ENTRY*)&pTimerInfo->link);
+
+    // Publish the list
+    (void) InterlockedExchangeT(&TimerInfosToBeRecycled, pTimerInfo);
+
+}
+
+void ThreadpoolMgr::FlushQueueOfTimerInfos()    // frees every TimerInfo queued by QueueTimerInfoForRelease
+{
+    CONTRACTL
+    {
+        THROWS;
+        GC_TRIGGERS;
+        MODE_ANY;
+    }
+    CONTRACTL_END;
+    // Takes the whole published list in one exchange, then releases and deletes its entries one by one.
+    TimerInfo *pHeadTimerInfo = NULL, *pCurrTimerInfo = NULL;
+    LIST_ENTRY *pNextInfo = NULL;
+
+    if ((pHeadTimerInfo = InterlockedExchangeT(&TimerInfosToBeRecycled, NULL)) == NULL)
+        return;     // nothing is waiting to be released
+    // NOTE(review): presumably RemoveHeadList yields the head itself once the ring is empty, making the head the last entry freed - confirm against the macro.
+    do
+    {
+        RemoveHeadList((LIST_ENTRY *)pHeadTimerInfo, pNextInfo);
+        _ASSERTE(pNextInfo != NULL);
+
+        pCurrTimerInfo = (TimerInfo *) pNextInfo;
+
+        GCX_COOP();
+        if (pCurrTimerInfo->Context != NULL)
+        {
+            DelegateInfo *pCurrDelInfo = (DelegateInfo *) pCurrTimerInfo->Context;
+            pCurrDelInfo->Release();
+
+            RecycleMemory( pCurrDelInfo, MEMTYPE_DelegateInfo );
+        }
+
+        if (pCurrTimerInfo->ExternalEventSafeHandle != NULL)
+        {
+            ReleaseTimerInfo(pCurrTimerInfo);
+        }
+
+        delete pCurrTimerInfo;
+
+    }
+    while ((TimerInfo *)pNextInfo != pHeadTimerInfo);   // compares pointer values only; the entry just freed is not dereferenced
+}
+
+/************************************************************************/
+// Requests a new due time and period for an existing timer. The change itself
+// is applied on the timer thread by UpdateTimer, which is queued here as an APC.
+//   Timer   - handle of the timer (a TimerInfo*)
+//   DueTime - new due time, handed to UpdateTimer unchanged
+//   Period  - new period, handed to UpdateTimer unchanged
+// Returns the result of QueueUserAPC.
+BOOL ThreadpoolMgr::ChangeTimerQueueTimer(
+                                        HANDLE Timer,
+                                        ULONG DueTime,
+                                        ULONG Period)
+{
+    CONTRACTL
+    {
+        THROWS;
+        MODE_ANY;
+        GC_NOTRIGGER;
+        INJECT_FAULT(COMPlusThrowOM());
+    }
+    CONTRACTL_END;
+
+    _ASSERTE(IsInitialized());
+    _ASSERTE(Timer);                    // not possible to give invalid handle in managed code
+
+    // The holder frees the request unless the timer thread takes it over below.
+    NewHolder<TimerUpdateInfo> requestHolder;
+    TimerUpdateInfo *pRequest = new TimerUpdateInfo;
+    requestHolder.Assign(pRequest);
+
+    pRequest->Timer = (TimerInfo*) Timer;
+    pRequest->DueTime = DueTime;
+    pRequest->Period = Period;
+
+    BOOL queued = QueueUserAPC((PAPCFUNC)UpdateTimer,
+                               TimerThread,
+                               (size_t) pRequest);
+
+    if (!queued)
+        return(queued);
+
+    // UpdateTimer deletes the request once it has processed it.
+    requestHolder.SuppressRelease();
+    return(queued);
+}
+
+// APC routine queued by ChangeTimerQueueTimer: applies a new period and due
+// time to a timer, then deletes the request object it was handed.
+void ThreadpoolMgr::UpdateTimer(TimerUpdateInfo* pArgs)
+{
+    CONTRACTL
+    {
+        NOTHROW;
+        GC_NOTRIGGER;
+        MODE_ANY;
+    }
+    CONTRACTL_END;
+
+    TimerUpdateInfo* pRequest = pArgs;
+    TimerInfo* pTimer = pRequest->Timer;
+
+    pTimer->Period = pRequest->Period;
+
+    if (pRequest->DueTime != (ULONG) -1)
+    {
+        // A real due time: compute the absolute firing time from now.
+        DWORD tickNow = GetTickCount();
+        pTimer->FiringTime = tickNow + pRequest->DueTime;
+
+        delete pRequest;
+
+        if ((pTimer->state & TIMER_ACTIVE) == 0)
+        {
+            // timer not active (probably a one shot timer that has expired), so activate it
+            pTimer->state |= TIMER_ACTIVE;
+            _ASSERTE(pTimer->refCount >= 1);
+            // insert the timer in the queue
+            InsertTailList(&TimerQueue,(&pTimer->link));
+        }
+
+        return;
+    }
+
+    // A due time of (ULONG) -1 takes the timer off the queue if it is on it;
+    // an already inactive timer is left as it is.
+    if (pTimer->state & TIMER_ACTIVE)
+    {
+        DeactivateTimer(pTimer);
+    }
+    _ASSERTE((pTimer->state & TIMER_ACTIVE) == 0);
+
+    delete pRequest;
+}
+
+/************************************************************************/
+// Requests deletion of a timer. The deregistration itself runs on the timer
+// thread (DeregisterTimer, queued here as an APC).
+//   Timer - handle of the timer (a TimerInfo*)
+//   Event - (HANDLE) -1: block until the timer can be deleted, then delete it
+//                        on the calling thread;
+//           other non-NULL value: stored as the timer's ExternalCompletionEvent,
+//                        which DeleteTimer signals;
+//           NULL: no completion notification.
+// Returns the result of QueueUserAPC; on FALSE the timer is left registered.
+BOOL ThreadpoolMgr::DeleteTimerQueueTimer(
+                                        HANDLE Timer,
+                                        HANDLE Event)
+{
+    CONTRACTL
+    {
+        THROWS;
+        MODE_ANY;
+        GC_TRIGGERS;
+    }
+    CONTRACTL_END;
+
+    _ASSERTE(IsInitialized());          // cannot call delete before creating timer
+    _ASSERTE(Timer);                    // not possible to give invalid handle in managed code
+
+    // make volatile to avoid compiler reordering check after async call.
+    // otherwise, DeregisterTimer could delete timerInfo before the comparison.
+    VolatilePtr<TimerInfo> timerInfo = (TimerInfo*) Timer;
+
+    if (Event == (HANDLE) -1)
+    {
+        //CONTRACT_VIOLATION(ThrowsViolation);
+        timerInfo->InternalCompletionEvent.CreateAutoEvent(FALSE);
+        timerInfo->flag |= WAIT_INTERNAL_COMPLETION;
+    }
+    else if (Event)
+    {
+        timerInfo->ExternalCompletionEvent = Event;
+    }
+#ifdef _DEBUG
+    else /* Event == NULL */
+    {
+        _ASSERTE(timerInfo->ExternalCompletionEvent == INVALID_HANDLE);
+    }
+#endif
+
+    // Read the flag before queueing the APC: afterwards the timer thread may
+    // already be working on (or have deleted) a non-blocking timerInfo.
+    BOOL isBlocking = timerInfo->flag & WAIT_INTERNAL_COMPLETION;
+
+    BOOL status = QueueUserAPC((PAPCFUNC)DeregisterTimer,
+                               TimerThread,
+                               (size_t)(TimerInfo*)timerInfo);
+
+    if (FALSE == status)
+    {
+        if (isBlocking)
+        {
+            // The timer thread never saw this request and the timer stays alive.
+            // Take the flag back together with the event, otherwise a later
+            // DeleteTimer would signal, or a retry would wait on, a closed event.
+            timerInfo->InternalCompletionEvent.CloseEvent();
+            timerInfo->flag &= ~WAIT_INTERNAL_COMPLETION;
+        }
+        return FALSE;
+    }
+
+    if (isBlocking)
+    {
+        _ASSERTE(timerInfo->ExternalEventSafeHandle == NULL);
+        _ASSERTE(timerInfo->ExternalCompletionEvent == INVALID_HANDLE);
+        _ASSERTE(GetThread() != pTimerThread);
+
+        // DeleteTimer sets this event instead of freeing the timer while the
+        // WAIT_INTERNAL_COMPLETION flag is set.
+        timerInfo->InternalCompletionEvent.Wait(INFINITE,TRUE /*alertable*/);
+        timerInfo->InternalCompletionEvent.CloseEvent();
+        // Release handles and delete TimerInfo
+        _ASSERTE(timerInfo->refCount == 0);
+        // if WAIT_INTERNAL_COMPLETION flag is not set, timerInfo will be deleted in DeleteTimer.
+        timerInfo->flag &= ~WAIT_INTERNAL_COMPLETION;
+        DeleteTimer(timerInfo);
+    }
+    return status;
+}
+
+// APC routine queued by DeleteTimerQueueTimer: takes the timer out of service
+// and deletes it once no reference to it remains.
+void ThreadpoolMgr::DeregisterTimer(TimerInfo* pArgs)
+{
+    CONTRACTL
+    {
+        NOTHROW;
+        GC_TRIGGERS;
+        MODE_PREEMPTIVE;
+        SO_INTOLERANT;
+    }
+    CONTRACTL_END;
+
+    TimerInfo* pTimer = pArgs;
+
+    if ((pTimer->state & TIMER_REGISTERED) == 0)
+    {
+        // Not registered yet: mark it deleted so that InsertNewTimer disposes
+        // of it instead of registering it.
+        pTimer->state |= TIMER_DELETE ;
+
+        // since the timer has not even been registered, we dont need an interlock to decrease the RefCount
+        pTimer->refCount--;
+
+        return;
+    }
+
+    // Take an active timer off the queue first.
+    if (pTimer->state & TIMER_ACTIVE)
+    {
+        DeactivateTimer(pTimer);
+    }
+
+    // Drop the registration reference; pending callbacks may still hold theirs.
+    if (0 == InterlockedDecrement(&pTimer->refCount))
+    {
+        DeleteTimer(pTimer);
+    }
+}
+
+#endif // !DACCESS_COMPILE
-- 
cgit v1.2.3