1056 lines
31 KiB
C
1056 lines
31 KiB
C
/*++
|
||
|
||
Copyright (c) 1990 Microsoft Corporation
|
||
|
||
Module Name:
|
||
|
||
lazyrite.c
|
||
|
||
Abstract:
|
||
|
||
This module implements the lazy writer for the Cache subsystem.
|
||
|
||
Author:
|
||
|
||
Tom Miller [TomM] 22-July-1990
|
||
|
||
Revision History:
|
||
|
||
--*/
|
||
|
||
#include "cc.h"
|
||
|
||
//
|
||
// The Bug check file id for this module
|
||
//
|
||
|
||
#define BugCheckFileId (CACHE_BUG_CHECK_LAZYRITE)
|
||
|
||
//
|
||
// Define our debug constant
|
||
//
|
||
|
||
#define me 0x00000020
|
||
|
||
//
|
||
// Local support routines
|
||
//
|
||
|
||
PWORK_QUEUE_ENTRY
|
||
CcReadWorkQueue (
|
||
);
|
||
|
||
VOID
|
||
CcLazyWriteScan (
|
||
);
|
||
|
||
|
||
VOID
|
||
CcScheduleLazyWriteScan (
|
||
IN BOOLEAN FastScan
|
||
)
|
||
|
||
/*++
|
||
|
||
Routine Description:
|
||
|
||
This routine may be called to schedule the next lazy writer scan,
|
||
during which lazy write and lazy close activity is posted to other
|
||
worker threads. Callers should acquire the lazy writer spin lock
|
||
to see if the scan is currently active, and then call this routine
|
||
still holding the spin lock if not. One special call is used at
|
||
the end of the lazy write scan to propagate lazy write active once
|
||
we go active. This call is "the" scan thread, and it can therefore
|
||
safely schedule the next scan without taking out the spin lock.
|
||
|
||
Arguments:
|
||
|
||
FastScan - if set, make the scan happen immediately
|
||
|
||
Return Value:
|
||
|
||
None.
|
||
|
||
--*/
|
||
|
||
{
|
||
//
|
||
// It is important to set the active flag TRUE first for the propagate
|
||
// case, because it is conceivable that once the timer is set, another
|
||
// thread could actually run and make the scan go idle before we then
|
||
// jam the flag TRUE.
|
||
//
|
||
// When going from idle to active, we delay a little longer to let the
|
||
// app finish saving its file.
|
||
//
|
||
|
||
if (FastScan) {
|
||
|
||
LazyWriter.ScanActive = TRUE;
|
||
KeSetTimer( &LazyWriter.ScanTimer, CcNoDelay, &LazyWriter.ScanDpc );
|
||
|
||
} else if (LazyWriter.ScanActive) {
|
||
|
||
KeSetTimer( &LazyWriter.ScanTimer, CcIdleDelay, &LazyWriter.ScanDpc );
|
||
|
||
} else {
|
||
|
||
LazyWriter.ScanActive = TRUE;
|
||
KeSetTimer( &LazyWriter.ScanTimer, CcFirstDelay, &LazyWriter.ScanDpc );
|
||
}
|
||
}
|
||
|
||
|
||
VOID
|
||
CcScanDpc (
|
||
IN PKDPC Dpc,
|
||
IN PVOID DeferredContext,
|
||
IN PVOID SystemArgument1,
|
||
IN PVOID SystemArgument2
|
||
)
|
||
|
||
/*++
|
||
|
||
Routine Description:
|
||
|
||
This is the Dpc routine which runs when the scan timer goes off. It
|
||
simply posts an element for an Ex Worker thread to do the scan.
|
||
|
||
Arguments:
|
||
|
||
(All are ignored)
|
||
|
||
Return Value:
|
||
|
||
None.
|
||
|
||
--*/
|
||
|
||
{
|
||
PWORK_QUEUE_ENTRY WorkQueueEntry;
|
||
|
||
UNREFERENCED_PARAMETER(Dpc);
|
||
UNREFERENCED_PARAMETER(DeferredContext);
|
||
UNREFERENCED_PARAMETER(SystemArgument1);
|
||
UNREFERENCED_PARAMETER(SystemArgument2);
|
||
|
||
WorkQueueEntry = CcAllocateWorkQueueEntry();
|
||
|
||
//
|
||
// If we failed to allocate a WorkQueueEntry, things must
|
||
// be in pretty bad shape. However, all we have to do is
|
||
// say we are not active, and wait for another event to
|
||
// wake things up again.
|
||
//
|
||
|
||
if (WorkQueueEntry == NULL) {
|
||
|
||
LazyWriter.ScanActive = FALSE;
|
||
|
||
} else {
|
||
|
||
//
|
||
// Otherwise post a work queue entry to do the scan.
|
||
//
|
||
|
||
WorkQueueEntry->Function = (UCHAR)LazyWriteScan;
|
||
|
||
CcPostWorkQueue( WorkQueueEntry, &CcRegularWorkQueue );
|
||
}
|
||
}
|
||
|
||
|
||
NTSTATUS
|
||
CcWaitForCurrentLazyWriterActivity (
|
||
)
|
||
|
||
/*++
|
||
|
||
Routine Description:
|
||
|
||
This routine allows a thread to receive notification when the current tick
|
||
of lazy writer work has completed. It must not be called within a lazy
|
||
writer workitem! The caller must not be holding synchronization that could
|
||
block a Cc workitem!
|
||
|
||
In particular, this lets a caller insure that all available lazy closes at
|
||
the time of the call have completed.
|
||
|
||
Arguments:
|
||
|
||
None.
|
||
|
||
Return Value:
|
||
|
||
Final result of the wait.
|
||
|
||
--*/
|
||
|
||
{
|
||
KIRQL OldIrql;
|
||
KEVENT Event;
|
||
PWORK_QUEUE_ENTRY WorkQueueEntry;
|
||
|
||
WorkQueueEntry = CcAllocateWorkQueueEntry();
|
||
|
||
if (WorkQueueEntry == NULL) {
|
||
return STATUS_INSUFFICIENT_RESOURCES;
|
||
}
|
||
|
||
WorkQueueEntry->Function = (UCHAR)EventSet;
|
||
KeInitializeEvent( &Event, NotificationEvent, FALSE );
|
||
WorkQueueEntry->Parameters.Event.Event = &Event;
|
||
|
||
//
|
||
// Add this to the post-tick work queue and wake the lazy writer for it.
|
||
// The lazy writer will add this to the end of the next batch of work
|
||
// he issues.
|
||
//
|
||
|
||
CcAcquireMasterLock( &OldIrql );
|
||
|
||
InsertTailList( &CcPostTickWorkQueue, &WorkQueueEntry->WorkQueueLinks );
|
||
|
||
LazyWriter.OtherWork = TRUE;
|
||
if (!LazyWriter.ScanActive) {
|
||
CcScheduleLazyWriteScan( TRUE );
|
||
}
|
||
|
||
CcReleaseMasterLock( OldIrql );
|
||
|
||
return KeWaitForSingleObject( &Event, Executive, KernelMode, FALSE, NULL );
|
||
}
|
||
|
||
|
||
|
||
VOID
|
||
CcLazyWriteScan (
|
||
)
|
||
|
||
/*++
|
||
|
||
Routine Description:
|
||
|
||
This routine implements the Lazy Writer scan for dirty data to flush
|
||
or any other work to do (lazy close). This routine is scheduled by
|
||
calling CcScheduleLazyWriteScan.
|
||
|
||
Arguments:
|
||
|
||
None.
|
||
|
||
Return Value:
|
||
|
||
None.
|
||
|
||
--*/
|
||
|
||
{
|
||
ULONG PagesToWrite, ForegroundRate, EstimatedDirtyNextInterval;
|
||
PSHARED_CACHE_MAP SharedCacheMap, FirstVisited, NextSharedCacheMap;
|
||
KIRQL OldIrql;
|
||
ULONG LoopsWithLockHeld = 0;
|
||
BOOLEAN AlreadyMoved = FALSE;
|
||
BOOLEAN MoveBehindCursor = FALSE;
|
||
|
||
LIST_ENTRY PostTickWorkQueue;
|
||
|
||
//
|
||
// Top of Lazy Writer scan.
|
||
//
|
||
|
||
try {
|
||
|
||
//
|
||
// If there is no work to do, then we will go inactive, and return.
|
||
//
|
||
|
||
CcAcquireMasterLock( &OldIrql );
|
||
|
||
if ((CcTotalDirtyPages == 0) && !LazyWriter.OtherWork) {
|
||
|
||
//
|
||
// Sleep if there are no deferred writes. It is important to check
|
||
// proactively because writes may be blocked for reasons external
|
||
// to the cache manager. The lazy writer must keep poking since it
|
||
// may have no bytes to write itself.
|
||
//
|
||
|
||
#if DBG
|
||
//
|
||
// In DBG builds, make sure that the CcDirtySharedCacheMapList
|
||
// is really empty (except for the cursor) if we are going to sleep
|
||
// because we think there is no more work to do.
|
||
//
|
||
|
||
{
|
||
PLIST_ENTRY CurrentEntry = CcDirtySharedCacheMapList.SharedCacheMapLinks.Flink;
|
||
PSHARED_CACHE_MAP CurrentScm;
|
||
ULONG Count = 0;
|
||
|
||
while( CurrentEntry != &CcDirtySharedCacheMapList.SharedCacheMapLinks ) {
|
||
|
||
CurrentScm = CONTAINING_RECORD( CurrentEntry,
|
||
SHARED_CACHE_MAP,
|
||
SharedCacheMapLinks );
|
||
|
||
if (FlagOn(CurrentScm->Flags, WAITING_FOR_TEARDOWN)) {
|
||
Count++;
|
||
}
|
||
CurrentEntry = CurrentEntry->Flink;
|
||
}
|
||
|
||
ASSERTMSG( "CcLazyWriteScan stopped scan while SCM with the flag WAITING_FOR_TEARDOWN are still in the dirty list!\n",
|
||
Count == 0 );
|
||
}
|
||
#endif
|
||
|
||
if (IsListEmpty(&CcDeferredWrites)) {
|
||
|
||
LazyWriter.ScanActive = FALSE;
|
||
CcReleaseMasterLock( OldIrql );
|
||
|
||
} else {
|
||
|
||
CcReleaseMasterLock( OldIrql );
|
||
|
||
//
|
||
// Check for writes and schedule the next scan.
|
||
//
|
||
|
||
CcPostDeferredWrites();
|
||
CcScheduleLazyWriteScan( FALSE );
|
||
}
|
||
|
||
return;
|
||
}
|
||
|
||
//
|
||
// Pull out the post tick workitems for this pass. It is important that
|
||
// we are doing this at the top since more could be queued as we rummage
|
||
// for work to do. Post tick workitems are guaranteed to occur after all
|
||
// work generated in a complete scan.
|
||
//
|
||
|
||
InitializeListHead( &PostTickWorkQueue );
|
||
while (!IsListEmpty( &CcPostTickWorkQueue )) {
|
||
|
||
PLIST_ENTRY Entry = RemoveHeadList( &CcPostTickWorkQueue );
|
||
InsertTailList( &PostTickWorkQueue, Entry );
|
||
}
|
||
|
||
//
|
||
// Calculate the next sweep time stamp, then update all relevant fields for
|
||
// the next time around. Also we can clear the OtherWork flag.
|
||
//
|
||
|
||
LazyWriter.OtherWork = FALSE;
|
||
|
||
//
|
||
// Assume we will write our usual fraction of dirty pages. Do not do the
|
||
// divide if there is not enough dirty pages, or else we will never write
|
||
// the last few pages.
|
||
//
|
||
|
||
PagesToWrite = CcTotalDirtyPages;
|
||
if (PagesToWrite > LAZY_WRITER_MAX_AGE_TARGET) {
|
||
PagesToWrite /= LAZY_WRITER_MAX_AGE_TARGET;
|
||
}
|
||
|
||
//
|
||
// Estimate the rate of dirty pages being produced in the foreground.
|
||
// This is the total number of dirty pages now plus the number of dirty
|
||
// pages we scheduled to write last time, minus the number of dirty
|
||
// pages we have now. Throw out any cases which would not produce a
|
||
// positive rate.
|
||
//
|
||
|
||
ForegroundRate = 0;
|
||
|
||
if ((CcTotalDirtyPages + CcPagesWrittenLastTime) > CcDirtyPagesLastScan) {
|
||
ForegroundRate = (CcTotalDirtyPages + CcPagesWrittenLastTime) -
|
||
CcDirtyPagesLastScan;
|
||
}
|
||
|
||
//
|
||
// If we estimate that we will exceed our dirty page target by the end
|
||
// of this interval, then we must write more. Try to arrive on target.
|
||
//
|
||
|
||
EstimatedDirtyNextInterval = CcTotalDirtyPages - PagesToWrite + ForegroundRate;
|
||
|
||
if (EstimatedDirtyNextInterval > CcDirtyPageTarget) {
|
||
|
||
PagesToWrite += EstimatedDirtyNextInterval - CcDirtyPageTarget;
|
||
}
|
||
|
||
//
|
||
// Now save away the number of dirty pages and the number of pages we
|
||
// just calculated to write.
|
||
//
|
||
|
||
CcDirtyPagesLastScan = CcTotalDirtyPages;
|
||
CcPagesYetToWrite = CcPagesWrittenLastTime = PagesToWrite;
|
||
|
||
//
|
||
// Loop to flush enough Shared Cache Maps to write the number of pages
|
||
// we just calculated.
|
||
//
|
||
|
||
SharedCacheMap = CONTAINING_RECORD( CcLazyWriterCursor.SharedCacheMapLinks.Flink,
|
||
SHARED_CACHE_MAP,
|
||
SharedCacheMapLinks );
|
||
|
||
DebugTrace( 0, me, "Start of Lazy Writer Scan\n", 0 );
|
||
|
||
//
|
||
// Normally we would just like to visit every Cache Map once on each scan,
|
||
// so the scan will terminate normally when we return to FirstVisited. But
|
||
// in the off chance that FirstVisited gets deleted, we are guaranteed to stop
|
||
// when we get back to our own listhead.
|
||
//
|
||
|
||
FirstVisited = NULL;
|
||
while ((SharedCacheMap != FirstVisited) &&
|
||
(&SharedCacheMap->SharedCacheMapLinks != &CcLazyWriterCursor.SharedCacheMapLinks)) {
|
||
|
||
if (FirstVisited == NULL) {
|
||
FirstVisited = SharedCacheMap;
|
||
}
|
||
|
||
//
|
||
// Skip the SharedCacheMap if a write behind request is
|
||
// already queued, write behind has been disabled, or
|
||
// if there is no work to do (either dirty data to be written
|
||
// or a delete is required).
|
||
//
|
||
// Note that for streams where modified writing is disabled, we
|
||
// need to take out Bcbs exclusive, which serializes with foreground
|
||
// activity. Therefore we use a special counter in the SharedCacheMap
|
||
// to only service these once every n intervals.
|
||
//
|
||
// Skip temporary files unless we currently could not write as many
|
||
// bytes as we might charge some hapless thread for throttling, unless
|
||
// it has been closed. We assume that the "tick" of the lazy writer,
|
||
// delayed temporarily by the passcount check, will permit the common
|
||
// open/write/close/delete action on temporary files to sneak in and
|
||
// truncate the file before we really write the data, if the file was
|
||
// not opened delete-on-close to begin with.
|
||
//
|
||
// Since we will write closed files with dirty pages as part of the
|
||
// regular pass (even temporary ones), only do lazy close on files
|
||
// with no dirty pages.
|
||
//
|
||
|
||
if (!FlagOn(SharedCacheMap->Flags, WRITE_QUEUED | IS_CURSOR)
|
||
|
||
&&
|
||
|
||
(((SharedCacheMap->DirtyPages != 0)
|
||
&&
|
||
(FlagOn(SharedCacheMap->Flags, WAITING_FOR_TEARDOWN)
|
||
||
|
||
((PagesToWrite != 0)
|
||
&&
|
||
(((++SharedCacheMap->LazyWritePassCount & 0xF) == 0) ||
|
||
!FlagOn(SharedCacheMap->Flags, MODIFIED_WRITE_DISABLED) ||
|
||
(CcCapturedSystemSize == MmSmallSystem) ||
|
||
(SharedCacheMap->DirtyPages >= (4 * (MAX_WRITE_BEHIND / PAGE_SIZE))))
|
||
&&
|
||
(!FlagOn(SharedCacheMap->FileObject->Flags, FO_TEMPORARY_FILE) ||
|
||
(SharedCacheMap->OpenCount == 0) ||
|
||
!CcCanIWrite(SharedCacheMap->FileObject, WRITE_CHARGE_THRESHOLD, FALSE, MAXUCHAR)))))
|
||
|
||
||
|
||
|
||
((SharedCacheMap->OpenCount == 0) &&
|
||
(SharedCacheMap->DirtyPages == 0) ||
|
||
(SharedCacheMap->FileSize.QuadPart == 0)))) {
|
||
|
||
PWORK_QUEUE_ENTRY WorkQueueEntry;
|
||
|
||
//
|
||
// If this is a metadata stream with at least 4 times
|
||
// the maximum write behind I/O size, then let's tell
|
||
// this guy to write 1/8 of his dirty data on this pass
|
||
// so it doesn't build up.
|
||
//
|
||
// Else assume we can write everything (PagesToWrite only affects
|
||
// metadata streams - otherwise writing is controlled by the Mbcb -
|
||
// this throttle is engaged in CcWriteBehind).
|
||
//
|
||
|
||
SharedCacheMap->PagesToWrite = SharedCacheMap->DirtyPages;
|
||
|
||
if (FlagOn(SharedCacheMap->Flags, MODIFIED_WRITE_DISABLED) &&
|
||
(SharedCacheMap->PagesToWrite >= (4 * (MAX_WRITE_BEHIND / PAGE_SIZE))) &&
|
||
(CcCapturedSystemSize != MmSmallSystem)) {
|
||
|
||
SharedCacheMap->PagesToWrite /= 8;
|
||
}
|
||
|
||
//
|
||
// If still searching for pages to write, adjust our targets.
|
||
//
|
||
|
||
if (!AlreadyMoved) {
|
||
|
||
//
|
||
// See if he exhausts the number of pages to write. (We
|
||
// keep going in case there are any closes to do.)
|
||
//
|
||
|
||
if (SharedCacheMap->PagesToWrite >= PagesToWrite) {
|
||
|
||
//
|
||
// Here is where we should move the cursor to. Figure
|
||
// out if we should resume on this stream or the next one.
|
||
//
|
||
|
||
//
|
||
// For Metadata streams, set up to resume on the next stream on the
|
||
// next scan. Also force a push forward every n intervals if all of
|
||
// the pages came from this stream, so we don't get preoccupied with
|
||
// one stream at the expense of others (which may be waiting for a
|
||
// lazy close). Normally we would like to avoid seek overhead and
|
||
// take the common case of a large sequential series of writes.
|
||
//
|
||
// This is similar to hotspot detection.
|
||
//
|
||
// Note, to ensure that we iterate through the entire
|
||
// CcDirtySharedCacheMap list, we cannot move this shared
|
||
// cache map behind the cursor now. We will just
|
||
// remember that we want to move this to the end of the
|
||
// list and do the actual move when we are ready to read
|
||
// the next entry.
|
||
//
|
||
|
||
if (FlagOn(SharedCacheMap->Flags, MODIFIED_WRITE_DISABLED) ||
|
||
((FirstVisited == SharedCacheMap) &&
|
||
((SharedCacheMap->LazyWritePassCount & 0xF) == 0))) {
|
||
|
||
MoveBehindCursor = TRUE;
|
||
|
||
//
|
||
// For other streams, set up to resume on the same stream on the
|
||
// next scan.
|
||
//
|
||
|
||
} else {
|
||
|
||
RemoveEntryList( &CcLazyWriterCursor.SharedCacheMapLinks );
|
||
InsertTailList( &SharedCacheMap->SharedCacheMapLinks, &CcLazyWriterCursor.SharedCacheMapLinks );
|
||
}
|
||
|
||
PagesToWrite = 0;
|
||
AlreadyMoved = TRUE;
|
||
|
||
} else {
|
||
|
||
PagesToWrite -= SharedCacheMap->PagesToWrite;
|
||
}
|
||
}
|
||
|
||
//
|
||
// Otherwise show we are actively writing, and keep it in the dirty
|
||
// list.
|
||
//
|
||
|
||
SetFlag(SharedCacheMap->Flags, WRITE_QUEUED);
|
||
SharedCacheMap->DirtyPages += 1;
|
||
|
||
CcReleaseMasterLock( OldIrql );
|
||
|
||
//
|
||
// Queue the request to do the work to a worker thread.
|
||
//
|
||
|
||
WorkQueueEntry = CcAllocateWorkQueueEntry();
|
||
|
||
//
|
||
// If we failed to allocate a WorkQueueEntry, things must
|
||
// be in pretty bad shape. However, all we have to do is
|
||
// break out of our current loop, and try to go back and
|
||
// delay a while. Even if the current guy should have gone
|
||
// away when we clear WRITE_QUEUED, we will find him again
|
||
// in the LW scan.
|
||
//
|
||
|
||
if (WorkQueueEntry == NULL) {
|
||
|
||
CcAcquireMasterLock( &OldIrql );
|
||
ClearFlag(SharedCacheMap->Flags, WRITE_QUEUED);
|
||
SharedCacheMap->DirtyPages -= 1;
|
||
break;
|
||
}
|
||
|
||
WorkQueueEntry->Function = (UCHAR)WriteBehind;
|
||
WorkQueueEntry->Parameters.Write.SharedCacheMap = SharedCacheMap;
|
||
|
||
//
|
||
// Post it to the regular work queue.
|
||
//
|
||
|
||
CcAcquireMasterLock( &OldIrql );
|
||
SharedCacheMap->DirtyPages -= 1;
|
||
|
||
if (FlagOn( SharedCacheMap->Flags, WAITING_FOR_TEARDOWN )) {
|
||
|
||
//
|
||
// If we are waiting for this shared cache map to be torn
|
||
// down, put it at the head of the express work queue so
|
||
// that it gets processed right away.
|
||
//
|
||
|
||
CcPostWorkQueue( WorkQueueEntry, &CcExpressWorkQueue );
|
||
|
||
} else {
|
||
|
||
//
|
||
// We aren't anxiously awaiting for this shared cached map
|
||
// to go away, so just process this work item via the
|
||
// regular work queue.
|
||
//
|
||
|
||
CcPostWorkQueue( WorkQueueEntry, &CcRegularWorkQueue );
|
||
}
|
||
|
||
LoopsWithLockHeld = 0;
|
||
|
||
//
|
||
// Make sure we occasionally drop the lock. Set WRITE_QUEUED
|
||
// to keep the guy from going away.
|
||
//
|
||
|
||
} else if ((++LoopsWithLockHeld >= 20) &&
|
||
!FlagOn(SharedCacheMap->Flags, WRITE_QUEUED | IS_CURSOR)) {
|
||
|
||
SetFlag(SharedCacheMap->Flags, WRITE_QUEUED);
|
||
SharedCacheMap->DirtyPages += 1;
|
||
CcReleaseMasterLock( OldIrql );
|
||
LoopsWithLockHeld = 0;
|
||
CcAcquireMasterLock( &OldIrql );
|
||
ClearFlag(SharedCacheMap->Flags, WRITE_QUEUED);
|
||
SharedCacheMap->DirtyPages -= 1;
|
||
}
|
||
|
||
//
|
||
// Now loop back.
|
||
//
|
||
// If we want to put this shared cache map at the end of the
|
||
// dirty list, we will do it AFTER we determine the next shared
|
||
// cache map to go to. This ensures that we loop through the entire
|
||
// list during this scan tick.
|
||
//
|
||
|
||
NextSharedCacheMap =
|
||
CONTAINING_RECORD( SharedCacheMap->SharedCacheMapLinks.Flink,
|
||
SHARED_CACHE_MAP,
|
||
SharedCacheMapLinks );
|
||
|
||
if (MoveBehindCursor) {
|
||
|
||
RemoveEntryList( &CcLazyWriterCursor.SharedCacheMapLinks );
|
||
InsertHeadList( &SharedCacheMap->SharedCacheMapLinks, &CcLazyWriterCursor.SharedCacheMapLinks );
|
||
MoveBehindCursor = FALSE;
|
||
}
|
||
|
||
SharedCacheMap = NextSharedCacheMap;
|
||
}
|
||
|
||
DebugTrace( 0, me, "End of Lazy Writer Scan\n", 0 );
|
||
|
||
//
|
||
// Queue up our post tick workitems for this pass.
|
||
//
|
||
|
||
while (!IsListEmpty( &PostTickWorkQueue )) {
|
||
|
||
PLIST_ENTRY Entry = RemoveHeadList( &PostTickWorkQueue );
|
||
CcPostWorkQueue( CONTAINING_RECORD( Entry, WORK_QUEUE_ENTRY, WorkQueueLinks ),
|
||
&CcRegularWorkQueue );
|
||
}
|
||
|
||
//
|
||
// Now we can release the global list and loop back, per chance to sleep.
|
||
//
|
||
|
||
CcReleaseMasterLock( OldIrql );
|
||
|
||
//
|
||
// Once again we need to give the deferred writes a poke. We can have all dirty
|
||
// pages on disable_write_behind files but also have an external condition that
|
||
// caused the cached IO to be deferred. If so, this serves as our only chance to
|
||
// issue it when the condition clears.
|
||
//
|
||
// Case hit on ForrestF's 5gb Alpha, 1/12/99.
|
||
//
|
||
|
||
if (!IsListEmpty(&CcDeferredWrites)) {
|
||
|
||
CcPostDeferredWrites();
|
||
}
|
||
|
||
//
|
||
// Now go ahead and schedule the next scan.
|
||
//
|
||
|
||
CcScheduleLazyWriteScan( FALSE );
|
||
|
||
//
|
||
// Basically, the Lazy Writer thread should never get an exception,
|
||
// so we put a try-except around it that bug checks one way or the other.
|
||
// Better we bug check here than worry about what happens if we let one
|
||
// get by.
|
||
//
|
||
|
||
} except( CcExceptionFilter( GetExceptionCode() )) {
|
||
|
||
CcBugCheck( GetExceptionCode(), 0, 0 );
|
||
}
|
||
}
|
||
|
||
|
||
//
|
||
// Internal support routine
|
||
//
|
||
|
||
LONG
|
||
CcExceptionFilter (
|
||
IN NTSTATUS ExceptionCode
|
||
)
|
||
|
||
/*++
|
||
|
||
Routine Description:
|
||
|
||
This is the standard exception filter for worker threads which simply
|
||
calls an FsRtl routine to see if an expected status is being raised.
|
||
If so, the exception is handled, else we bug check.
|
||
|
||
Arguments:
|
||
|
||
ExceptionCode - the exception code which was raised.
|
||
|
||
Return Value:
|
||
|
||
EXCEPTION_EXECUTE_HANDLER if expected, else a Bug Check occurs.
|
||
|
||
--*/
|
||
|
||
{
|
||
DebugTrace(0, 0, "CcExceptionFilter %08lx\n", ExceptionCode);
|
||
|
||
if (FsRtlIsNtstatusExpected( ExceptionCode )) {
|
||
|
||
return EXCEPTION_EXECUTE_HANDLER;
|
||
|
||
} else {
|
||
|
||
return EXCEPTION_CONTINUE_SEARCH;
|
||
}
|
||
}
|
||
|
||
|
||
|
||
//
|
||
// Internal support routine
|
||
//
|
||
|
||
VOID
|
||
FASTCALL
|
||
CcPostWorkQueue (
|
||
IN PWORK_QUEUE_ENTRY WorkQueueEntry,
|
||
IN PLIST_ENTRY WorkQueue
|
||
)
|
||
|
||
/*++
|
||
|
||
Routine Description:
|
||
|
||
This routine queues a WorkQueueEntry, which has been allocated and
|
||
initialized by the caller, to the WorkQueue for FIFO processing by
|
||
the work threads.
|
||
|
||
Arguments:
|
||
|
||
WorkQueueEntry - supplies a pointer to the entry to queue
|
||
|
||
Return Value:
|
||
|
||
None
|
||
|
||
--*/
|
||
|
||
{
|
||
KIRQL OldIrql;
|
||
PLIST_ENTRY WorkerThreadEntry = NULL;
|
||
|
||
ASSERT(FIELD_OFFSET(WORK_QUEUE_ITEM, List) == 0);
|
||
|
||
DebugTrace(+1, me, "CcPostWorkQueue:\n", 0 );
|
||
DebugTrace( 0, me, " WorkQueueEntry = %08lx\n", WorkQueueEntry );
|
||
|
||
//
|
||
// Queue the entry to the respective work queue.
|
||
//
|
||
|
||
CcAcquireWorkQueueLock( &OldIrql );
|
||
InsertTailList( WorkQueue, &WorkQueueEntry->WorkQueueLinks );
|
||
|
||
//
|
||
// Now, if we aren't throttled and have any more idle threads we can
|
||
// use, activate one.
|
||
//
|
||
|
||
if (!CcQueueThrottle && !IsListEmpty(&CcIdleWorkerThreadList)) {
|
||
WorkerThreadEntry = RemoveHeadList( &CcIdleWorkerThreadList );
|
||
CcNumberActiveWorkerThreads += 1;
|
||
}
|
||
CcReleaseWorkQueueLock( OldIrql );
|
||
|
||
if (WorkerThreadEntry != NULL) {
|
||
|
||
//
|
||
// I had to peak in the sources to verify that this routine
|
||
// is a noop if the Flink is not NULL. Sheeeeit!
|
||
//
|
||
|
||
((PWORK_QUEUE_ITEM)WorkerThreadEntry)->List.Flink = NULL;
|
||
ExQueueWorkItem( (PWORK_QUEUE_ITEM)WorkerThreadEntry, CriticalWorkQueue );
|
||
}
|
||
|
||
//
|
||
// And return to our caller
|
||
//
|
||
|
||
DebugTrace(-1, me, "CcPostWorkQueue -> VOID\n", 0 );
|
||
|
||
return;
|
||
}
|
||
|
||
|
||
//
|
||
// Internal support routine
|
||
//
|
||
|
||
VOID
|
||
CcWorkerThread (
|
||
PVOID ExWorkQueueItem
|
||
)
|
||
|
||
/*++
|
||
|
||
Routine Description:
|
||
|
||
This is worker thread routine for processing cache manager work queue
|
||
entries.
|
||
|
||
Arguments:
|
||
|
||
ExWorkQueueItem - The work item used for this thread
|
||
|
||
Return Value:
|
||
|
||
None
|
||
|
||
--*/
|
||
|
||
{
|
||
KIRQL OldIrql;
|
||
PLIST_ENTRY WorkQueue;
|
||
PWORK_QUEUE_ENTRY WorkQueueEntry;
|
||
BOOLEAN RescanOk = FALSE;
|
||
BOOLEAN DropThrottle = FALSE;
|
||
IO_STATUS_BLOCK IoStatus;
|
||
|
||
IoStatus.Status = STATUS_SUCCESS;
|
||
IoStatus.Information = 0;
|
||
|
||
ASSERT(FIELD_OFFSET(WORK_QUEUE_ENTRY, WorkQueueLinks) == 0);
|
||
|
||
while (TRUE) {
|
||
|
||
CcAcquireWorkQueueLock( &OldIrql );
|
||
|
||
//
|
||
// If we just processed a throttled operation, drop the flag.
|
||
//
|
||
|
||
if (DropThrottle) {
|
||
|
||
DropThrottle = CcQueueThrottle = FALSE;
|
||
}
|
||
|
||
//
|
||
// On requeue, push at end of the source queue and clear hint.
|
||
//
|
||
|
||
if (IoStatus.Information == CC_REQUEUE) {
|
||
|
||
InsertTailList( WorkQueue, &WorkQueueEntry->WorkQueueLinks );
|
||
IoStatus.Information = 0;
|
||
}
|
||
|
||
//
|
||
// First see if there is something in the express queue.
|
||
//
|
||
|
||
if (!IsListEmpty(&CcExpressWorkQueue)) {
|
||
WorkQueue = &CcExpressWorkQueue;
|
||
|
||
//
|
||
// If there was nothing there, then try the regular queue.
|
||
//
|
||
|
||
} else if (!IsListEmpty(&CcRegularWorkQueue)) {
|
||
WorkQueue = &CcRegularWorkQueue;
|
||
|
||
//
|
||
// Else we can break and go idle.
|
||
//
|
||
|
||
} else {
|
||
|
||
break;
|
||
}
|
||
|
||
WorkQueueEntry = CONTAINING_RECORD( WorkQueue->Flink, WORK_QUEUE_ENTRY, WorkQueueLinks );
|
||
|
||
//
|
||
// If this is an EventSet, throttle down to a single thread to be sure
|
||
// that this event fires after all preceeding workitems have completed.
|
||
//
|
||
|
||
if (WorkQueueEntry->Function == EventSet && CcNumberActiveWorkerThreads > 1) {
|
||
|
||
CcQueueThrottle = TRUE;
|
||
break;
|
||
}
|
||
|
||
//
|
||
// Pop the workitem off: we will execute it now.
|
||
//
|
||
|
||
RemoveHeadList( WorkQueue );
|
||
|
||
CcReleaseWorkQueueLock( OldIrql );
|
||
|
||
//
|
||
// Process the entry within a try-except clause, so that any errors
|
||
// will cause us to continue after the called routine has unwound.
|
||
//
|
||
|
||
try {
|
||
|
||
switch (WorkQueueEntry->Function) {
|
||
|
||
//
|
||
// Perform read ahead
|
||
//
|
||
|
||
case ReadAhead:
|
||
|
||
DebugTrace( 0, me, "CcWorkerThread Read Ahead FileObject = %08lx\n",
|
||
WorkQueueEntry->Parameters.Read.FileObject );
|
||
|
||
CcPerformReadAhead( WorkQueueEntry->Parameters.Read.FileObject );
|
||
|
||
break;
|
||
|
||
//
|
||
// Perform write behind
|
||
//
|
||
|
||
case WriteBehind:
|
||
|
||
DebugTrace( 0, me, "CcWorkerThread WriteBehind SharedCacheMap = %08lx\n",
|
||
WorkQueueEntry->Parameters.Write.SharedCacheMap );
|
||
|
||
//
|
||
// While CcWriteBehind is running, we mark this thread as a
|
||
// MemoryMaker so that Mm will allow pool allocations to
|
||
// succeed when we are getting into low-resource situations.
|
||
// This helps avoid loss delayed write error in low-resource
|
||
// scenarios.
|
||
//
|
||
|
||
PsGetCurrentThread()->MemoryMaker = 1;
|
||
|
||
CcWriteBehind( WorkQueueEntry->Parameters.Write.SharedCacheMap, &IoStatus );
|
||
RescanOk = (BOOLEAN)NT_SUCCESS(IoStatus.Status);
|
||
|
||
PsGetCurrentThread()->MemoryMaker = 0;
|
||
break;
|
||
|
||
|
||
//
|
||
// Perform set event
|
||
//
|
||
|
||
case EventSet:
|
||
|
||
DebugTrace( 0, me, "CcWorkerThread SetEvent Event = %08lx\n",
|
||
WorkQueueEntry->Parameters.Event.Event );
|
||
|
||
KeSetEvent( WorkQueueEntry->Parameters.Event.Event, 0, FALSE );
|
||
DropThrottle = TRUE;
|
||
break;
|
||
|
||
//
|
||
// Perform Lazy Write Scan
|
||
//
|
||
|
||
case LazyWriteScan:
|
||
|
||
DebugTrace( 0, me, "CcWorkerThread Lazy Write Scan\n", 0 );
|
||
|
||
CcLazyWriteScan();
|
||
break;
|
||
}
|
||
|
||
}
|
||
except( CcExceptionFilter( GetExceptionCode() )) {
|
||
|
||
//
|
||
// If we hit an exception in this thread, we need to make sure
|
||
// that if we had made this thread a memory maker that flag is
|
||
// cleared in the thread structure because this thread will be
|
||
// reused by arbitrary system worker threads that should not have
|
||
// this designation.
|
||
//
|
||
|
||
if (WorkQueueEntry->Function == WriteBehind) {
|
||
|
||
PsGetCurrentThread()->MemoryMaker = 0;
|
||
}
|
||
}
|
||
|
||
//
|
||
// If not a requeue request, free the workitem.
|
||
//
|
||
|
||
if (IoStatus.Information != CC_REQUEUE) {
|
||
|
||
CcFreeWorkQueueEntry( WorkQueueEntry );
|
||
}
|
||
}
|
||
|
||
//
|
||
// No more work. Requeue our worker thread entry and get out.
|
||
//
|
||
|
||
InsertTailList( &CcIdleWorkerThreadList,
|
||
&((PWORK_QUEUE_ITEM)ExWorkQueueItem)->List );
|
||
CcNumberActiveWorkerThreads -= 1;
|
||
|
||
CcReleaseWorkQueueLock( OldIrql );
|
||
|
||
if (!IsListEmpty(&CcDeferredWrites) && (CcTotalDirtyPages >= 20) && RescanOk) {
|
||
CcLazyWriteScan();
|
||
}
|
||
|
||
return;
|
||
}
|
||
|