Leaked source code of windows server 2003
You can not select more than 25 topics Topics must start with a letter or number, can include dashes ('-') and can be up to 35 characters long.
 
 
 
 
 
 

877 lines
24 KiB

/*++
Copyright (c) 1997-2000 Microsoft Corporation
Module Name:
ftrie.c
Abstract:
This module contains routines that manipulate
an F-trie data stucture, that forms the fast
path in a fast IP route lookup implementation.
Author:
Chaitanya Kodeboyina (chaitk) 26-Nov-1997
Revision History:
--*/
#include "precomp.h"
#include "ftrie.h"
UINT
CALLCONV
InitFTrie(IN FTrie * pFTrie,
IN ULONG levels,
IN ULONG maxMemory)
/*++
Routine Description:
Initialises an F-trie. This should be done prior to
any other trie operations.
Arguments:
pFTrie - Pointer to the trie to be initialized
levels - Bitmap [ 32 bits ] of expanded levels
maxMemory - Limit on memory taken by the F-Trie
For example, levels = 0xF0F0F0F0 [8,16,24,32 bits]
means -> all prefixes are expanded to these levels
and only these trie levels have any dests at all
Num of Levels + 2 memory accesses are needed in the
worst case to get to the dest corresponding to a
prefix - Num of Levels + 1 accesses including the
zero level access, and 1 access to read the dest.
Return Value:
TRIE_SUCCESS or ERROR_TRIE_*
--*/
{
UINT prevLevel;
UINT currLevel;
UINT nBytes, i;
TRY_BLOCK
{
if (levels == 0) {
Error("NewFTrie: No levels specified", (UINT) ERROR_TRIE_BAD_PARAM);
}
// Zero all the memory for the trie header
RtlZeroMemory(pFTrie, sizeof(FTrie));
// Set a limit on the memory for trie/nodes
pFTrie->availMemory = maxMemory;
// Initialize list of trienodes allocated
InitializeListHead(&pFTrie->listofNodes);
// Initialize root node with a NULL dest
pFTrie->trieRoot = StoreDestPtr(NULL);
// Initialize the number of bits in each level
nBytes = (MAXLEVEL + 1) * sizeof(UINT);
AllocMemory2(pFTrie->bitsInLevel,
nBytes,
pFTrie->availMemory);
RtlZeroMemory(pFTrie->bitsInLevel, nBytes);
// Get the number of index bits at each level
prevLevel = 0;
i = 0;
for (currLevel = 1; currLevel <= MAXLEVEL; currLevel++) {
if (levels & 1) {
pFTrie->bitsInLevel[i++] = currLevel - prevLevel;
prevLevel = currLevel;
}
levels >>= 1;
}
pFTrie->numLevels = i;
// Make sure that the last level is MAXLEVEL
pFTrie->bitsInLevel[i] = MAXLEVEL - prevLevel;
if (pFTrie->bitsInLevel[i]) {
pFTrie->numLevels++;
}
#if DBG
Print("Num of levels: %d\n", pFTrie->numLevels);
Print("Bits In Level:\n");
for (i = 0; i < pFTrie->numLevels; i++) {
Print("\t%d", pFTrie->bitsInLevel[i]);
if (i % 8 == 7)
Print("\n");
}
Print("\n\n");
#endif
// Allocate and Zero all the statistics variables
nBytes = (MAXLEVEL + 1) * sizeof(UINT);
AllocMemory2(pFTrie->numDestsInOrigLevel,
nBytes,
pFTrie->availMemory);
RtlZeroMemory(pFTrie->numDestsInOrigLevel, nBytes);
nBytes = pFTrie->numLevels * sizeof(UINT);
AllocMemory2(pFTrie->numNodesInExpnLevel,
nBytes,
pFTrie->availMemory);
RtlZeroMemory(pFTrie->numNodesInExpnLevel, nBytes);
nBytes = pFTrie->numLevels * sizeof(UINT);
AllocMemory2(pFTrie->numDestsInExpnLevel,
nBytes,
pFTrie->availMemory);
RtlZeroMemory(pFTrie->numDestsInExpnLevel, nBytes);
return TRIE_SUCCESS;
}
ERR_BLOCK
{
// Not enough resources to create an FTrie
CleanupFTrie(pFTrie);
}
END_BLOCK
}
UINT
CALLCONV
InsertIntoFTrie(IN FTrie * pFTrie,
IN Route * pInsRoute,
IN Dest * pInsDest,
IN Dest * pOldDest)
/*++
Routine Description:
Inserts a dest corresponding to an address
prefix into a F-trie. It actually replaces
all pointers to OldDest by that of InsDest.
Arguments:
pFTrie - Pointer to the F-Trie to insert into
pInsRoute - Pointer to best route on new dest
pInsDest - Pointer to the dest being inserted
pOldDest - Pointer to the dest being replaced
Return Value:
TRIE_SUCCESS or ERROR_TRIE_*
--*/
{
FTrieNode **ppCurrNode;
FTrieNode *pCurrNode;
Dest *pBestDest;
Dest *pComDest;
UINT startIndex;
UINT stopIndex;
UINT nextIndex;
UINT shiftIndex;
UINT addrBits;
UINT numBits;
UINT bitsLeft;
UINT i;
#if DBG
// Make sure the trie is initialized
if (!pFTrie || !pFTrie->trieRoot) {
Fatal("Insert Dest: FTrie not initialized",
ERROR_TRIE_NOT_INITED);
}
// Make sure input dest is valid
if (NULL_DEST(pInsDest)) {
Fatal("Insert Dest: NULL or invalid dest",
ERROR_TRIE_BAD_PARAM);
}
// Make sure input route is valid
if (NULL_ROUTE(pInsRoute)) {
Fatal("Insert Dest: NULL or invalid route",
ERROR_TRIE_BAD_PARAM);
}
if (LEN(pInsRoute) > ADDRSIZE) {
Fatal("Insert Dest: Invalid mask length",
ERROR_TRIE_BAD_PARAM);
}
#endif
Assert(pInsDest != pOldDest);
// Use addr bits to index the trie
addrBits = RtlConvertEndianLong(DEST(pInsRoute));
bitsLeft = LEN(pInsRoute);
#if DBG
// Make sure addr and mask agree
if (ShowMostSigNBits(addrBits, bitsLeft) != addrBits) {
Fatal("Insert Dest: Addr & mask don't agree",
ERROR_TRIE_BAD_PARAM);
}
#endif
TRY_BLOCK
{
// Special case: Default Prefix
if (LEN(pInsRoute) == 0) {
// Do we have a subtree in the trie's root node ?
if (IsPtrADestPtr(pFTrie->trieRoot)) {
// Make sure you are replacing right dest
Assert(pFTrie->trieRoot == StoreDestPtr(pOldDest));
// Make the root to point to the new default
pFTrie->trieRoot = StoreDestPtr(pInsDest);
} else {
// Make sure you are replacing right dest
Assert(pFTrie->trieRoot->comDest == pOldDest);
// Make new dest the common subtrie dest
pFTrie->trieRoot->comDest = pInsDest;
}
return TRIE_SUCCESS;
}
// Start going down the trie using addr bits
pBestDest = NULL;
ppCurrNode = &pFTrie->trieRoot;
for (i = 0; /* NOTHING */ ; i++) {
pCurrNode = *ppCurrNode;
if (IsPtrADestPtr(pCurrNode)) {
// Creating a new subtree for the current level
// This pointer actually points to a dest node
pComDest = RestoreDestPtr(pCurrNode);
// Create, initialize a new FTrie node (grow it)
NewFTrieNode(pFTrie,
pCurrNode,
pFTrie->bitsInLevel[i],
pComDest);
// Attach it to the FTrie
*ppCurrNode = pCurrNode;
// Update FTrie Statistics
pFTrie->numNodesInExpnLevel[i]++;
}
// Update the best dest seen so far - used later
pComDest = pCurrNode->comDest;
if (pComDest) {
pBestDest = pComDest;
}
// Increment the number of dests in this subtrie
pCurrNode->numDests++;
// Can I pass this level with remaining bits ?
if (bitsLeft <= pFTrie->bitsInLevel[i]) {
break;
}
// Get the next index from the IP addr
numBits = pCurrNode->numBits;
nextIndex = PickMostSigNBits(addrBits, numBits);
ppCurrNode = &pCurrNode->child[nextIndex];
// Throw away the used bits
addrBits <<= numBits;
bitsLeft -= numBits;
}
// Update FTrie stats before expanding
// Update if this isn't a dest change
pFTrie->numDestsInExpnLevel[i]++;
pFTrie->numDestsInOrigLevel[LEN(pInsRoute)]++;
// At this level, expand and add the dest
nextIndex = PickMostSigNBits(addrBits, bitsLeft);
shiftIndex = pFTrie->bitsInLevel[i] - bitsLeft;
startIndex = nextIndex << shiftIndex;
stopIndex = (nextIndex + 1) << shiftIndex;
// Have you seen the old dest already ?
if (pBestDest == pOldDest) {
pOldDest = NULL;
}
// These dests cannot be the same here
Assert(pInsDest != pOldDest);
// Fill the expanded range with the dest
for (i = startIndex; i < stopIndex; i++) {
if (IsPtrADestPtr(pCurrNode->child[i])) {
// A dest pointer - replace with new one
ReplaceDestPtr(StoreDestPtr(pInsDest),
StoreDestPtr(pOldDest),
&pCurrNode->child[i]);
} else {
// Node pointer - update subtree's dest
ReplaceDestPtr(pInsDest,
pOldDest,
&pCurrNode->child[i]->comDest);
}
}
return TRIE_SUCCESS;
}
ERR_BLOCK
{
// Not enough resources - rollback to original state
DeleteFromFTrie(pFTrie, pInsRoute, pInsDest, pOldDest, PARTIAL);
}
END_BLOCK
}
UINT
CALLCONV
DeleteFromFTrie(IN FTrie * pFTrie,
IN Route * pDelRoute,
IN Dest * pDelDest,
IN Dest * pNewDest,
IN BOOLEAN trieState)
/*++
Routine Description:
Deletes a dest corresponding to an address
prefix from a F-trie. It actually replaces
all pointers to DelDest by that of NewDest.
Arguments:
pFTrie - Pointer to the F-Trie to delete from
pDelRoute - Pointer to last route on old dest
pDelDest - Pointer to the dest being deleted
pNewDest - Pointer to the dest replacing above
trieState - NORMAL - deleting from a consistent FTrie
PARTIAL - cleaning up an incomplete insert
Return Value:
TRIE_SUCCESS or ERROR_TRIE_*
--*/
{
FTrieNode **ppCurrNode;
FTrieNode *pCurrNode;
FTrieNode *pPrevNode;
FTrieNode *pNextNode;
Dest *pBestDest;
Dest *pComDest;
UINT startIndex;
UINT stopIndex;
UINT nextIndex;
UINT shiftIndex;
UINT addrBits;
UINT numBits;
UINT bitsLeft;
UINT i, j;
DBG_UNREFERENCED_PARAMETER(trieState);
j = 1;
#if DBG
// Make sure the trie is initialized
if (!pFTrie || !pFTrie->trieRoot) {
Fatal("Delete Dest: FTrie not initialized",
ERROR_TRIE_NOT_INITED);
}
// Make sure input dest is valid
if (NULL_DEST(pDelDest)) {
Fatal("Delete Dest: NULL or invalid dest",
ERROR_TRIE_BAD_PARAM);
}
// Make sure input route is valid
if (NULL_ROUTE(pDelRoute)) {
Fatal("Delete Dest: NULL or invalid route",
ERROR_TRIE_BAD_PARAM);
}
if (LEN(pDelRoute) > ADDRSIZE) {
Fatal("Delete Dest: Invalid mask length",
ERROR_TRIE_BAD_PARAM);
}
#endif
// Use addr bits to index the trie
addrBits = RtlConvertEndianLong(DEST(pDelRoute));
bitsLeft = LEN(pDelRoute);
#if DBG
// Make sure addr and mask agree
if (ShowMostSigNBits(addrBits, bitsLeft) != addrBits) {
Fatal("Delete Dest: Addr & mask don't agree",
ERROR_TRIE_BAD_PARAM);
}
#endif
Assert(pDelDest != pNewDest);
// Special case: Default Prefix
if (LEN(pDelRoute) == 0) {
// Do we have a subtree in the trie's root node ?
if (IsPtrADestPtr(pFTrie->trieRoot)) {
// Make sure you are replacing right dest
Assert(pFTrie->trieRoot == StoreDestPtr(pDelDest));
// Make the root to point to the new default
pFTrie->trieRoot = StoreDestPtr(pNewDest);
} else {
// Make sure you are replacing right dest
Assert(pFTrie->trieRoot->comDest == pDelDest);
// Make new dest the common subtrie dest
pFTrie->trieRoot->comDest = pNewDest;
}
return TRIE_SUCCESS;
}
// Start going down the trie using addr bits
pBestDest = NULL;
ppCurrNode = &pFTrie->trieRoot;
pPrevNode = pCurrNode = *ppCurrNode;
for (i = 0; /* NOTHING */ ; i++) {
// We still have bits left, so we go down the trie
// Do we have a valid subtree at the current node
if (IsPtrADestPtr(pCurrNode)) {
// We are cleaning a partial (failed) insert
Assert(trieState == PARTIAL);
// We have cleaned up the trie - return now
return TRIE_SUCCESS;
}
// We have a valid subtree, so we go down the trie
// Update the best dest seen so far - used later
pComDest = pCurrNode->comDest;
if (pComDest) {
pBestDest = pComDest;
}
// Decrement the number of dests in this subtrie
pCurrNode->numDests--;
// Is the number of dests in curr subtree zero ?
if (pCurrNode->numDests == 0) {
#if DBG
int k = 0;
// Just make sure that only one dest exists
for (j = 1; j < (UINT) 1 << pCurrNode->numBits; j++) {
if (pCurrNode->child[j - 1] != pCurrNode->child[j]) {
Assert((pCurrNode->child[j] == StoreDestPtr(NULL)) ||
(pCurrNode->child[j - 1] == StoreDestPtr(NULL)));
k++;
}
}
if (trieState == NORMAL) {
if ((k != 1) && (k != 2)) {
Print("k = %d\n", k);
Assert(FALSE);
}
} else {
if ((k != 0) && (k != 1) && (k != 2)) {
Print("k = %d\n", k);
Assert(FALSE);
}
}
#endif
// Remove link from its parent (if it exists)
if (pPrevNode) {
*ppCurrNode = StoreDestPtr(pCurrNode->comDest);
}
}
// Can I pass this level with remaining bits ?
if (bitsLeft <= pFTrie->bitsInLevel[i]) {
break;
}
// Get the next index from the IP addr
numBits = pCurrNode->numBits;
nextIndex = PickMostSigNBits(addrBits, numBits);
ppCurrNode = &pCurrNode->child[nextIndex];
pNextNode = *ppCurrNode;
// Throw away the used bits
addrBits <<= numBits;
bitsLeft -= numBits;
// Is the number of dests in subtree zero ?
if (pCurrNode->numDests == 0) {
// Deallocate it (shrink FTrie)
FreeFTrieNode(pFTrie, pCurrNode);
// Update FTrie Statistics
pFTrie->numNodesInExpnLevel[i]--;
}
pPrevNode = pCurrNode;
pCurrNode = pNextNode;
}
// Update F-Trie stats before deleting
pFTrie->numDestsInExpnLevel[i]--;
pFTrie->numDestsInOrigLevel[LEN(pDelRoute)]--;
// Is the number of dests in curr subtree zero ?
if (pCurrNode->numDests == 0) {
// Deallocate it (shrink FTrie)
FreeFTrieNode(pFTrie, pCurrNode);
// Update FTrie Statistics
pFTrie->numNodesInExpnLevel[i]--;
} else {
// At this level, expand and add the dest
nextIndex = PickMostSigNBits(addrBits, bitsLeft);
shiftIndex = pFTrie->bitsInLevel[i] - bitsLeft;
startIndex = nextIndex << shiftIndex;
stopIndex = (nextIndex + 1) << shiftIndex;
// Have you seen the new dest already ?
if (pBestDest == pNewDest) {
pNewDest = NULL;
}
// These dests cannot be the same here
Assert(pDelDest != pNewDest);
// Fill the expanded range with the dest
for (i = startIndex; i < stopIndex; i++) {
if (IsPtrADestPtr(pCurrNode->child[i])) {
// A dest pointer - replace with new one
ReplaceDestPtr(StoreDestPtr(pNewDest),
StoreDestPtr(pDelDest),
&pCurrNode->child[i]);
} else {
// Node pointer - update subtree's dest
ReplaceDestPtr(pNewDest,
pDelDest,
&pCurrNode->child[i]->comDest);
}
}
}
return TRIE_SUCCESS;
}
UINT
CALLCONV
SearchDestInFTrie(IN FTrie * pFTrie,
IN Dest * pSerDest,
OUT UINT * pNumPtrs,
OUT Dest ** pStartPtr)
/*++
Routine Description:
Search for a specific dest in an F-trie,
returns the expanded range for the dest
Arguments:
pFTrie - Pointer to the F-trie to search
pSerDest - Pointer to dest being searched
pStartPtr - Start of dest's expanded range
pNumPtrs - Number of pointers in the range
Return Value:
TRIE_SUCCESS or ERROR_TRIE_*
--*/
{
UNREFERENCED_PARAMETER(pFTrie);
UNREFERENCED_PARAMETER(pSerDest);
UNREFERENCED_PARAMETER(pNumPtrs);
UNREFERENCED_PARAMETER(pStartPtr);
return (UINT) ERROR_TRIE_BAD_PARAM;
}
Dest *
CALLCONV
SearchAddrInFTrie(IN FTrie * pFTrie,
IN ULONG Addr)
/*++
Routine Description:
Search for an address in an F-trie
Arguments:
pFTrie - Pointer to the trie to search
Addr - Pointer to addr being queried
Return Value:
Return best dest match for this address
--*/
{
FTrieNode *pCurrNode;
Dest *pBestDest;
Dest *pDest;
ULONG addrBits;
UINT numBits;
UINT nextIndex;
#if DBG
if (!pFTrie || !pFTrie->trieRoot) {
Fatal("Searching into an uninitialized FTrie",
ERROR_TRIE_NOT_INITED);
}
#endif
addrBits = RtlConvertEndianLong(Addr);
pBestDest = NULL;
pCurrNode = pFTrie->trieRoot;
for (;;) {
// Have we reached the end of this search ?
if (IsPtrADestPtr(pCurrNode)) {
// Get the best matching dest until now
pDest = RestoreDestPtr(pCurrNode);
if (!NULL_DEST(pDest)) {
pBestDest = pDest;
}
return pBestDest;
} else {
// Get the best matching dest until now
pDest = pCurrNode->comDest;
if (!NULL_DEST(pDest)) {
pBestDest = pDest;
}
}
// Number of bits to use in this FTrie level
numBits = pCurrNode->numBits;
// Get the next index from IP address bits
nextIndex = PickMostSigNBits(addrBits, numBits);
// And go down the tree with the new index
pCurrNode = pCurrNode->child[nextIndex];
// Throw away the used bits for this iteration
addrBits <<= numBits;
}
}
UINT
CALLCONV
CleanupFTrie(IN FTrie * pFTrie)
/*++
Routine Description:
Deletes an F-trie if it is empty
Arguments:
ppFTrie - Ptr to the F-trie
Return Value:
TRIE_SUCCESS or ERROR_TRIE_*
--*/
{
FTrieNode *pCurrNode;
LIST_ENTRY *p;
// Free all trie nodes and corresponding memory
while (!IsListEmpty(&pFTrie->listofNodes)) {
p = RemoveHeadList(&pFTrie->listofNodes);
pCurrNode = CONTAINING_RECORD(p, FTrieNode, linkage);
FreeFTrieNode(pFTrie, pCurrNode);
}
// Free the memory for the arr of levels
if (pFTrie->bitsInLevel) {
FreeMemory1(pFTrie->bitsInLevel,
(MAXLEVEL + 1) * sizeof(UINT),
pFTrie->availMemory);
}
// Free memory allocated for statistics
if (pFTrie->numDestsInOrigLevel) {
FreeMemory1(pFTrie->numDestsInOrigLevel,
(MAXLEVEL + 1) * sizeof(UINT),
pFTrie->availMemory);
}
if (pFTrie->numNodesInExpnLevel) {
FreeMemory1(pFTrie->numNodesInExpnLevel,
pFTrie->numLevels * sizeof(UINT),
pFTrie->availMemory);
}
if (pFTrie->numDestsInExpnLevel) {
FreeMemory1(pFTrie->numDestsInExpnLevel,
pFTrie->numLevels * sizeof(UINT),
pFTrie->availMemory);
}
// Reset other fields in trie structure
pFTrie->trieRoot = NULL;
pFTrie->numLevels = 0;
return TRIE_SUCCESS;
}
#if DBG
VOID
CALLCONV
PrintFTrie(IN FTrie * pFTrie,
IN UINT printFlags)
/*++
Routine Description:
Print an F-Trie
Arguments:
pFTrie - Pointer to the F-Trie
printFlags - Information to print
Return Value:
None
--*/
{
UINT i;
if (pFTrie == NULL) {
Print("%s", "Uninitialized FTrie\n\n");
return;
}
if ((printFlags & SUMM) == SUMM) {
Print("\n\n/***Fast-Trie------------------------------------------------");
Print("\n/***---------------------------------------------------------\n");
}
if (printFlags & POOL) {
Print("Available Memory: %10lu\n\n", pFTrie->availMemory);
}
if (printFlags & STAT) {
Print("Statistics:\n\n");
Print("Num of levels: %d\n", pFTrie->numLevels);
Print("Bits In Level:\n");
for (i = 0; i < pFTrie->numLevels; i++) {
Print("\t%d", pFTrie->bitsInLevel[i]);
if (i % 8 == 7)
Print("\n");
}
Print("\n\n");
Print("Num of Nodes in Expanded Levels:\n");
for (i = 0; i < pFTrie->numLevels; i++) {
Print("\t%d", pFTrie->numNodesInExpnLevel[i]);
if (i % 8 == 7)
Print("\n");
}
Print("\n\n");
Print("Num of Dests in Original Levels:\n");
for (i = 0; i < MAXLEVEL + 1; i++) {
Print("\t%d", pFTrie->numDestsInOrigLevel[i]);
if (i % 8 == 0)
Print("\n");
}
Print("\n\n");
Print("Num of Dests in Expanded Levels:\n");
for (i = 0; i < pFTrie->numLevels; i++) {
Print("\t%d", pFTrie->numDestsInExpnLevel[i]);
if (i % 8 == 7)
Print("\n");
}
Print("\n\n");
}
if (printFlags & TRIE) {
if (!IsPtrADestPtr(pFTrie->trieRoot)) {
PrintFTrieNode(pFTrie->trieRoot, 0);
} else {
PrintDest(RestoreDestPtr(pFTrie->trieRoot));
}
}
if ((printFlags & SUMM) == SUMM) {
Print("\n---------------------------------------------------------***/\n");
Print("---------------------------------------------------------***/\n\n");
}
}
VOID
CALLCONV
PrintFTrieNode(IN FTrieNode * pFTrieNode,
IN UINT levelNumber)
/*++
Routine Description:
Print an F-Trie node
Arguments:
pFTrieNode - Pointer to the FTrie node
Return Value:
None
--*/
{
FTrieNode *pCurrNode;
UINT numElmts;
UINT i;
Print("\n/*-----------------------------------------------------------\n");
Print("Num of bits at level %3d : %d\n", levelNumber, pFTrieNode->numBits);
Print("Number of Subtrie Dests : %d\n", pFTrieNode->numDests);
Print("Common SubTree Dest : ");
PrintDest(pFTrieNode->comDest);
Print("\n");
numElmts = 1 << pFTrieNode->numBits;
pCurrNode = StoreDestPtr(NULL);
Print("Child Ptrs:\n\n");
for (i = 0; i < numElmts; i++) {
if (pFTrieNode->child[i] != pCurrNode) {
pCurrNode = pFTrieNode->child[i];
Print("Child Index: %8lu ", i);
if (IsPtrADestPtr(pCurrNode)) {
PrintDest(RestoreDestPtr(pCurrNode));
} else {
PrintFTrieNode(pCurrNode, levelNumber + 1);
}
}
}
Print("-----------------------------------------------------------*/\n\n");
}
#endif // DBG