Windows2003-3790/admin/pchealth/sr/kernel/hash.h
2020-09-30 16:53:55 +02:00

297 lines
5.6 KiB
C

/*++
Copyright (c) 1998-1999 Microsoft Corporation
Module Name:
hash.h
Abstract:
contains prototypes for functions in hash.c
Author:
Paul McDaniel (paulmcd) 28-Apr-2000
Revision History:
--*/
#ifndef _HASH_H_
#define _HASH_H_
//
// The hash key is the file name, but we need to track both the file
// component of the name in addition to the stream component of the name (if
// there is one). The buffer in the FileName UNICODE_STRING contains the
// full name with stream information, but the length is set to just designate
// the file portion of the name.
//
// Note: The keys will be hashed based on the FileName only, not the stream
// portion of the name. This is done so that we can easily find all the
// entries related to a given file if that file has multiple data streams.
//
typedef struct _HASH_KEY
{
UNICODE_STRING FileName;
USHORT StreamNameLength;
USHORT Reserved;
} HASH_KEY, *PHASH_KEY;
//
// a hash list entry .
//
typedef struct _HASH_ENTRY
{
//
// the hash value
//
ULONG HashValue;
//
// the key
//
HASH_KEY Key;
//
// a context stored with this hash entry
//
PVOID pContext;
} HASH_ENTRY, *PHASH_ENTRY;
//
// a hash bucket, which is basically an array of hash entries
// sorted by (HashValue, Key.Length, Key.Buffer) .
//
#define IS_VALID_HASH_BUCKET(pObject) \
(((pObject) != NULL) && ((pObject)->Signature == HASH_BUCKET_TAG))
typedef struct _HASH_BUCKET
{
//
// = HASH_BUCKET_TAG
//
ULONG Signature;
ULONG AllocCount;
ULONG UsedCount;
HASH_ENTRY Entries[0];
} HASH_BUCKET, *PHASH_BUCKET;
#define HASH_ENTRY_DEFAULT_WIDTH 10
//
// a destructor for hash entries
//
typedef
VOID
(*PHASH_ENTRY_DESTRUCTOR) (
IN PHASH_KEY pKey,
IN PVOID pContext
);
typedef
PVOID
(*PHASH_ENTRY_CALLBACK) (
IN PHASH_KEY pKey,
IN PVOID pEntryContext,
IN PVOID pCallbackContext
);
//
// and a hash header, an array of buckets which is hashed into.
//
#define IS_VALID_HASH_HEADER(pObject) \
(((pObject) != NULL) && ((pObject)->Signature == HASH_HEADER_TAG))
typedef struct _HASH_HEADER
{
//
// NonPagedPool
//
//
// = HASH_HEADER_TAG
//
ULONG Signature;
//
// the count of buckets the hash table has
//
ULONG BucketCount;
//
// the memory this hash table is taking
//
ULONG UsedLength;
//
// the memory this hash table is allowed to use
//
ULONG AllowedLength;
//
// how many times we've trimmed due to memory
//
ULONG TrimCount;
//
// the last time we trim'd
//
LARGE_INTEGER LastTrimTime;
//
// OPTIONAL the length in bytes of the duplicate prefix (if any)
// all keys share in this lists. This will be skipped for all manual
// comparisons as an optimization. this can be 0
//
ULONG PrefixLength;
//
// the lock for this list
//
ERESOURCE Lock;
//
// OPTIONAL destructor
//
PHASH_ENTRY_DESTRUCTOR pDestructor;
//
// and the actual buckets
//
PHASH_BUCKET Buckets[0];
} HASH_HEADER, *PHASH_HEADER;
//
// Function Prototypes.
//
NTSTATUS
HashCreateList (
IN ULONG BucketCount,
IN ULONG AllowedLength,
IN ULONG PrefixLength OPTIONAL,
IN PHASH_ENTRY_DESTRUCTOR pDestructor OPTIONAL,
OUT PHASH_HEADER * ppHashList
);
VOID
HashDestroyList (
IN PHASH_HEADER pHashList
);
NTSTATUS
HashAddEntry (
IN PHASH_HEADER pHashList,
IN PHASH_KEY pKey,
IN PVOID pContext
);
NTSTATUS
HashFindEntry (
IN PHASH_HEADER pHashList,
IN PHASH_KEY pKey,
OUT PVOID * ppContext
);
VOID
HashClearEntries (
IN PHASH_HEADER pHashList
);
NTSTATUS
HashClearAllFileEntries (
IN PHASH_HEADER pHeader,
IN PUNICODE_STRING pFileName
);
VOID
HashProcessEntries (
IN PHASH_HEADER pHeader,
IN PHASH_ENTRY_CALLBACK pfnCallback,
IN PVOID pCallbackContext
);
#if 0
#define HashCompute(Key) HashScramble(HashUnicodeString((Key)))
__inline ULONG
HashUnicodeString(
PUNICODE_STRING pKey
)
{
ULONG Hash = 0;
ULONG Index;
ULONG CharCount;
CharCount = pKey->Length/sizeof(WCHAR);
for (Index = 0 ; Index < CharCount; ++Index)
{
Hash = 37 * Hash + (pKey->Buffer[Index] & 0xFFDF);
}
return Hash;
}
// Produce a scrambled, randomish number in the range 0 to RANDOM_PRIME-1.
// Applying this to the results of the other hash functions is likely to
// produce a much better distribution, especially for the identity hash
// functions such as Hash(char c), where records will tend to cluster at
// the low end of the hashtable otherwise. LKHash applies this internally
// to all hash signatures for exactly this reason.
__inline ULONG
HashScramble(ULONG dwHash)
{
// Here are 10 primes slightly greater than 10^9
// 1000000007, 1000000009, 1000000021, 1000000033, 1000000087,
// 1000000093, 1000000097, 1000000103, 1000000123, 1000000181.
// default value for "scrambling constant"
const ULONG RANDOM_CONSTANT = 314159269UL;
// large prime number, also used for scrambling
const ULONG RANDOM_PRIME = 1000000007UL;
return (RANDOM_CONSTANT * dwHash) % RANDOM_PRIME ;
}
#endif // 0
#endif // _HASH_H_