windows-nt-4.0/private/windows/win4help/ftsrch/tokens.cpp


								// Tokens.cpp -- Created 2/9/93 by Ron Murray


								// Implementation for the CTokenList class


								#include   "stdafx.h"

								#include   "Tokens.h"

								#include    "MemEx.h"

								#include  "TxDBase.h"

								#include   <malloc.h>

								#include   "ftslex.h"

								#include "AbrtSrch.h"


								#define INC_LAST_CHAR_SIZE 0x10000L

								#define WORKBUF_SIZE       0x200

								#define BASE_WEIGHT        0x02             // basic character weight (no case or no diacritic)


								UINT SortKeyText(PWCHAR pwText, UINT cwText, PWCHAR pwOut, UINT cwOut);

								BOOL AllLowerCase(PWCHAR pwText, UINT cwText);


								/////////////////////////////////////////////////////////////////////////////

								// Worker functions


								// Tests whether the key at pwL (cwL WCHARs) matches the front of the key
								// at pwR (cwR WCHARs).
								//
								// The keys are walked two WCHARs at a time (an odd trailing WCHAR in the
								// left key is ignored). The first WCHAR of each pair must be identical.
								// In the second WCHAR each byte of the left key is only required to match
								// when it is greater than BASE_WEIGHT -- presumably so that an unaccented
								// lower-case pattern matches any accent/case variant; confirm against the
								// sort key producer.
								//
								// Returns TRUE on a match, FALSE otherwise (including cwL > cwR).
								BOOL HasAPrefix(PWCHAR pwL, UINT cwL, PWCHAR pwR, UINT cwR)
								{
								    if (cwL > cwR)
								        return FALSE;

								    UINT cPairs = cwL >> 1;
								    UINT iPair;

								    for (iPair = 0; iPair < cPairs; ++iPair)
								    {
								        PWCHAR pwPairL = pwL + 2 * iPair;
								        PWCHAR pwPairR = pwR + 2 * iPair;

								        // Leading WCHAR of the pair: exact comparison.
								        if (pwPairL[0] != pwPairR[0])
								            return FALSE;

								        // Trailing WCHAR of the pair: a byte of the left key is a
								        // wildcard unless it is above the base weight.
								        if (HIBYTE(pwPairL[1]) > BASE_WEIGHT)
								            if (HIBYTE(pwPairL[1]) != HIBYTE(pwPairR[1]))
								                return FALSE;

								        if (LOBYTE(pwPairL[1]) > BASE_WEIGHT)
								            if (LOBYTE(pwPairL[1]) != LOBYTE(pwPairR[1]))
								                return FALSE;
								    }

								    return TRUE;
								}


								// Tests whether the key at pwL (cwL WCHARs) matches the tail of the key
								// at pwR (cwR WCHARs).
								//
								// The comparison starts cwR - cwL WCHARs into the right key and then
								// proceeds pair by pair: the first WCHAR of each pair must be identical,
								// while each byte of the second WCHAR of the left key only has to match
								// when it is greater than BASE_WEIGHT.
								//
								// Returns TRUE on a match, FALSE otherwise (including cwL > cwR).
								BOOL HasASuffix(PWCHAR pwL, UINT cwL, PWCHAR pwR, UINT cwR)
								{
								    if (cwL > cwR)
								        return FALSE;

								    // Line the left key up with the last cwL WCHARs of the right key.
								    PWCHAR pwTail = pwR + (cwR - cwL);

								    UINT cPairs = cwL >> 1;
								    UINT iPair;

								    for (iPair = 0; iPair < cPairs; ++iPair)
								    {
								        PWCHAR pwPairL = pwL    + 2 * iPair;
								        PWCHAR pwPairR = pwTail + 2 * iPair;

								        if (pwPairL[0] != pwPairR[0])
								            return FALSE;

								        if (HIBYTE(pwPairL[1]) > BASE_WEIGHT)
								            if (HIBYTE(pwPairL[1]) != HIBYTE(pwPairR[1]))
								                return FALSE;

								        if (LOBYTE(pwPairL[1]) > BASE_WEIGHT)
								            if (LOBYTE(pwPairL[1]) != LOBYTE(pwPairR[1]))
								                return FALSE;
								    }

								    return TRUE;
								}


								// Tests whether the key at pwL (cwL WCHARs) matches anywhere inside the
								// key at pwR (cwR WCHARs).
								//
								// Every start position from 0 through cwR - cwL is tried in turn, one
								// WCHAR at a time, by asking HasAPrefix whether the left key matches the
								// remainder of the right key from that position.
								//
								// Returns TRUE at the first matching position, FALSE if none matches or
								// if cwL > cwR.
								BOOL HasASubstring(PWCHAR pwL, UINT cwL, PWCHAR pwR, UINT cwR)
								{
								    if (cwL > cwR)
								        return FALSE;

								    UINT cPositions = 1 + cwR - cwL;
								    UINT iStart;

								    for (iStart = 0; iStart < cPositions; ++iStart)
								    {
								        if (HasAPrefix(pwL, cwL, pwR + iStart, cwR - iStart))
								            return TRUE;
								    }

								    return FALSE;
								}


								// End of Worker functions

								/////////////////////////////////////////////////////////////////////////////


								// Constructs an empty token list in the From_Nothing state. Every pointer
								// member starts out NULL and every count starts at zero; one of the
								// InitialTokenList / ConnectImage routines fills the object in later.
								//
								//   fFromFile   -- recorded in m_fFromFileImage; the destructor consults
								//                  it before freeing m_pafClassifications.
								//   pszTypeName -- (debug builds only) passed through to CTextMatrix.
								#ifdef _DEBUG
								CTokenList::CTokenList(BOOL fFromFile, PSZ pszTypeName) : CTextMatrix WithType(pszTypeName)
								#else // _DEBUG
								CTokenList::CTokenList(BOOL fFromFile) : CTextMatrix()
								#endif // _DEBUG
								{
								    m_fFromFileImage     = fFromFile;
								    m_How_Constructed    = From_Nothing;

								    m_cbMaxLength        = 0;

								    // CompleteTokenList compares against m_cwDispMaxLength before anything
								    // on the NewTokenList(images) path has stored a value in it, so it
								    // must start from a known value.
								    m_cwDispMaxLength    = 0;

								    m_pbImages           = NULL;
								    m_pwDispImages       = NULL;
								    m_cbImages           = 0;
								    m_cwDispImages       = 0;
								    m_pd                 = NULL;
								    m_cd                 = 0;
								    m_lcidSorting        = LCID(-1);     // No sorting locale chosen yet
								    m_ppdSorted          = NULL;
								    m_ppdTailSorted      = NULL;
								    m_ptdb               = NULL;
								    m_ptklSource         = NULL;
								    m_pafClassifications = NULL;
								    m_fLeadingElipsis    = FALSE;
								    m_fTrailingElipsis   = FALSE;
								    m_pLRRanking         = NULL;
								    m_pRLRanking         = NULL;
								}


								// Factory: builds a token list from caller-supplied display images,
								// descriptors and (optionally) sort keys and sort orders.
								//
								// The arguments are handed unchanged to InitialTokenList. If an exception
								// unwinds through this routine after the object has been allocated, the
								// partially built object is deleted before the unwind continues.
								//
								// Returns the new token list.
								CTokenList *CTokenList::NewTokenList(PWCHAR pwcDisplay, UINT cwcDisplay,
								                                     PDESCRIPTOR pd, int cd, LCID lcid,
								                                     PWCHAR pwSortKeys, UINT cwSortKeys,
								                                     PDESCRIPTOR *papdLRSorting,
								                                     PDESCRIPTOR *papdRLSorting
								                                    )
								{
								    CTokenList *ptklNew = NULL;

								    __try
								    {
								        ptklNew = New CTokenList(FALSE);

								        ptklNew->InitialTokenList(pwcDisplay, cwcDisplay, pd, cd, lcid,
								                                  pwSortKeys, cwSortKeys,
								                                  papdLRSorting, papdRLSorting
								                                 );
								    }
								    __finally
								    {
								        // Only clean up when we are leaving because of an exception.
								        if (_abnormal_termination())
								        {
								            if (ptklNew)
								                delete ptklNew;

								            ptklNew = NULL;
								        }
								    }

								    return ptklNew;
								}


								// Initializes this list in the From_Images state from caller-supplied
								// buffers and then calls CompleteTokenList to finish the job.
								//
								// The buffer pointers are stored directly in the object (nothing is
								// copied); the destructor's From_Images case releases them with VFree.
								//
								//   pwcDisplay / cwcDisplay       -- display images and their WCHAR count
								//   pd / cd                       -- descriptor array and descriptor count
								//   lcid                          -- locale the sort keys were built for
								//   pwSortKeys / cwSortKeys       -- sort key images and their WCHAR count
								//   papdLRSorting / papdRLSorting -- stored as m_ppdSorted and
								//                                    m_ppdTailSorted
								void CTokenList::InitialTokenList(PWCHAR pwcDisplay, UINT cwcDisplay,
								                                  PDESCRIPTOR pd, int cd, LCID lcid,
								                                  PWCHAR pwSortKeys, UINT cwSortKeys,
								                                  PDESCRIPTOR *papdLRSorting,
								                                  PDESCRIPTOR *papdRLSorting
								                                 )
								{
								    // No __try/__finally bracket is needed in this routine: every buffer
								    // is attached to the object itself, and the caller is expected to
								    // delete the object if an exception goes unhandled.

								    m_How_Constructed  = From_Images;
								    m_lcidSorting      = lcid;
								    m_ptdb             = NULL;

								    m_fLeadingElipsis  = FALSE;
								    m_fTrailingElipsis = FALSE;
								    m_pLRRanking       = NULL;
								    m_pRLRanking       = NULL;

								    // Attach each buffer to the object, then clear the local copy of the
								    // pointer so it is obvious that this routine no longer uses it.

								    m_pwDispImages  = pwcDisplay;
								    m_cwDispImages  = cwcDisplay;
								    pwcDisplay      = NULL;

								    m_pbImages      = pwSortKeys;
								    m_cbImages      = cwSortKeys;
								    pwSortKeys      = NULL;

								    m_pd            = pd;
								    m_cd            = cd;
								    pd              = NULL;

								    m_ppdSorted     = papdLRSorting;
								    papdLRSorting   = NULL;

								    m_ppdTailSorted = papdRLSorting;
								    papdRLSorting   = NULL;

								    CompleteTokenList();
								}


								// Finishes the construction of a From_Images token list.
								//
								// 1. If the low byte of the user's default LCID differs from the low byte
								//    of m_lcidSorting, the existing sort keys and both sort orders are
								//    discarded, m_lcidSorting becomes the user's LCID, and
								//    fIgnoreSortKeys is overridden to FALSE.
								// 2. Sort keys are constructed when there are none and they are wanted.
								// 3. The classifier is initialized and scans the sort key images.
								// 4. If there is no left-to-right sort order, one is built with qsort.
								// 5. Each token (in sorted order) is classified, and the widest display
								//    image seen is folded into m_cwDispMaxLength.
								//
								//   fIgnoreSortKeys -- TRUE to skip building sort keys when none exist.
								void CTokenList::CompleteTokenList(BOOL fIgnoreSortKeys)
								{
								    const LCID lcidCurrent = GetUserDefaultLCID();

								    BOOL fSameLanguage = (lcidCurrent & 0x0FF) == (m_lcidSorting & 0x0FF);

								    if (!fSameLanguage)
								    {
								        // Anything derived from the old locale is stale.

								        fIgnoreSortKeys = FALSE;

								        if (m_pbImages)
								        {
								            VFree(m_pbImages);
								            m_pbImages = NULL;
								            m_cbImages = 0;
								        }

								        if (m_ppdSorted)
								        {
								            VFree(m_ppdSorted);
								            m_ppdSorted = NULL;
								        }

								        if (m_ppdTailSorted)
								        {
								            VFree(m_ppdTailSorted);
								            m_ppdTailSorted = NULL;
								        }

								        m_lcidSorting = lcidCurrent;
								    }

								    if (!(m_pbImages || fIgnoreSortKeys))
								        ConstructSortKeys(m_lcidSorting);

								    m_clsf.Initial();
								    m_clsf.ScanAndRankData(m_pbImages, m_cbImages);

								    ASSERT(m_ppdSorted || m_pbImages);

								    UINT cdTotal;
								    UINT iToken;

								    if (!m_ppdSorted)
								    {
								        m_ppdSorted = (PDESCRIPTOR *) VAlloc(FALSE, m_cd * sizeof(PDESCRIPTOR *));

								        // Start from descriptor order, then sort by image.

								        PDESCRIPTOR *papdFresh = m_ppdSorted;
								        PDESCRIPTOR  pdBase    = m_pd;

								        cdTotal = m_cd;

								        for (iToken = 0; iToken < cdTotal; ++iToken)
								            papdFresh[iToken] = pdBase + iToken;

								        qsort(m_ppdSorted, m_cd, sizeof(PDESCRIPTOR *), CompareImagesLR);
								    }

								    m_pafClassifications = (PUINT) VAlloc(FALSE, m_cd * sizeof(UINT));

								    PUINT        pafClass   = m_pafClassifications;
								    PDESCRIPTOR *papdSorted = m_ppdSorted;

								    m_cbMaxLength = 0;              // Computed on demand elsewhere

								    cdTotal = m_cd;

								    for (iToken = 0; iToken < cdTotal; ++iToken)
								    {
								        PDESCRIPTOR pdToken = papdSorted[iToken];

								        INT cwToken = CwDisplay(pdToken);

								        ASSERT(cwToken >= 0);

								        if (cwToken > m_cwDispMaxLength)
								            m_cwDispMaxLength = cwToken;

								        pafClass[iToken] = m_clsf.ClassifyData(pdToken->pbImage, CbImage(pdToken));
								    }
								}


								// Factory: builds a token list that refers to the tokens of a text
								// database.
								//
								// If an exception unwinds through this routine after the object has been
								// allocated, the partially built object is deleted before the unwind
								// continues.
								//
								// Returns the new token list.
								CTokenList *CTokenList::NewTokenList(CTextDatabase *ptdb)
								{
								    CTokenList *ptklNew = NULL;

								    __try
								    {
								        ptklNew = New CTokenList(FALSE);

								        ptklNew->InitialTokenList(ptdb);
								    }
								    __finally
								    {
								        // Only clean up when we are leaving because of an exception.
								        if (_abnormal_termination())
								        {
								            if (ptklNew)
								                delete ptklNew;

								            ptklNew = NULL;
								        }
								    }

								    return ptklNew;
								}


								// Initializes this list in the TDB_FULL_REF state: the list takes a
								// reference on the text database and points at the database's own image,
								// descriptor, sort order and classification arrays.
								//
								//   ptdb -- the text database to mirror; must not be NULL.
								void CTokenList::InitialTokenList(CTextDatabase *ptdb)
								{
								    ASSERT(ptdb);

								    m_fFromFileImage  = FALSE;
								    m_How_Constructed = TDB_FULL_REF;

								    m_ptdb = NULL;
								    AttachRef(m_ptdb, ptdb);

								    // Sorting is always relative to the current user's locale here.
								    m_lcidSorting = GetUserDefaultLCID();

								    // Borrow the database's arrays.
								    m_pbImages           = ptdb->ImageBase();
								    m_pd                 = ptdb->DescriptorBase();
								    m_cd                 = ptdb->m_pdNextGlobal - m_pd;
								    m_ppdSorted          = ptdb->m_ppdSorted;
								    m_ppdTailSorted      = ptdb->m_ppdTailSorted;
								    m_pafClassifications = ptdb->m_pafClassifications;

								    m_fLeadingElipsis  = FALSE;
								    m_fTrailingElipsis = FALSE;
								    m_pLRRanking       = NULL;
								    m_pRLRanking       = NULL;

								    // The database's width figure is taken only when its sort order
								    // covers exactly the descriptors we just counted.
								    if (m_ppdSorted)
								        if (m_cd == ptdb->m_cdSorted)
								            m_cbMaxLength = ptdb->MaxTokenWidth();

								    SynchronizeDatabase();

								#if 0

								    long cRefs= 0, iLimit= (m_cd < 59984)? m_cd : 59984, i;

								    // Reference Statistics:

								    for (i= 0; i < iLimit; ++i) cRefs += m_pd[i].cReferences;

								    for (cRefs= 0; i < m_cd; ++i) cRefs += m_pd[i].cReferences;

								#endif

								}


								// Builds sort key images for every token from its display image.
								//
								// The keys are first generated back to back in a scratch virtual buffer,
								// each descriptor's pbImage being pointed at its key as it is produced.
								// The result is then copied into a VAlloc'ed block of exactly the size
								// used (stored in m_pbImages / m_cbImages), and every pbImage -- including
								// the one in the extra descriptor at index m_cd -- is shifted to point
								// into that block. The scratch buffer is always released on the way out.
								//
								//   lcid -- locale passed to LCSortKeyW.
								//
								// Must only be called while m_pbImages is NULL.
								void CTokenList::ConstructSortKeys(LCID lcid)
								{
								    ASSERT(!m_pbImages);

								    MY_VIRTUAL_BUFFER mvb;

								    mvb.Base = NULL;

								    CreateVirtualBuffer(&mvb, m_cwDispImages, MaxSortKeyBytes(m_cwDispImages));

								    __try
								    {
								        PWCHAR      pwScratch  = PWCHAR(mvb.Base);
								        PWCHAR      pwNext     = pwScratch;
								        PWCHAR      pwLimit    = pwNext + MaxSortKeyBytes(m_cwDispImages);
								        PDESCRIPTOR pdToken    = m_pd;
								        UINT        cRemaining = m_cd;

								        __try
								        {
								            while (cRemaining--)
								            {
								                pdToken->pbImage = pwNext;

								                pwNext += LCSortKeyW(lcid, 0, pdToken->pwDisplay, CwDisplay(pdToken), pwNext, pwLimit - pwNext);

								                ++pdToken;
								            }
								        }
								        __except(VirtualBufferExceptionFilter(GetExceptionCode(), GetExceptionInformation(), &mvb))
								        {
								            // The filter declined to resume execution; report the
								            // failure as an out-of-memory condition.
								            RaiseException(STATUS_NO_MEMORY, EXCEPTION_NONCONTINUABLE, 0, NULL);
								        }

								        // pdToken now addresses the descriptor one past the last token;
								        // its pbImage marks the end of the final key.
								        pdToken->pbImage = pwNext;

								        UINT cwKeys = pwNext - pwScratch;

								        m_cbImages = cwKeys;

								        ASSERT(!m_pbImages);

								        m_pbImages = PWCHAR(VAlloc(FALSE, sizeof(WCHAR) * cwKeys));

								        CopyMemory(m_pbImages, pwScratch, sizeof(WCHAR) * cwKeys);

								        // Re-aim every pbImage (m_cd tokens plus the end marker) from
								        // the scratch buffer to the permanent block.
								        INT cwShift = m_pbImages - pwScratch;

								        pdToken    = m_pd;
								        cRemaining = m_cd+1;

								        while (cRemaining--)
								        {
								            pdToken->pbImage += cwShift;

								            ++pdToken;
								        }
								    }
								    __finally
								    {
								        if (mvb.Base)
								            FreeVirtualBuffer(&mvb);
								    }
								}


								// Factory: builds a new token list containing a subset of this list's
								// tokens.
								//
								//   paiSubset       -- indices into this list's sorted order; the array is
								//                      handed to InitialTokenList, which converts it in
								//                      place and keeps it.
								//   cTokensInSubset -- number of entries in paiSubset.
								//
								// If an exception unwinds through this routine after the object has been
								// allocated, the partially built object is deleted before the unwind
								// continues.
								//
								// Returns the new token list.
								CTokenList *CTokenList::TokenSubset(PUINT paiSubset, UINT cTokensInSubset)
								{
								    CTokenList *ptklSubset = NULL;

								    __try
								    {
								        ptklSubset = New CTokenList;

								        ptklSubset->InitialTokenList(this, paiSubset, cTokensInSubset);
								    }
								    __finally
								    {
								        // Only clean up when we are leaving because of an exception.
								        if (_abnormal_termination())
								        {
								            if (ptklSubset)
								                delete ptklSubset;

								            ptklSubset = NULL;
								        }
								    }

								    return ptklSubset;
								}


								// Initializes this list in the TKL_SUBSET state as a subset of another
								// token list.
								//
								// The image buffers and the descriptor array are shared with the source
								// list, on which a reference is taken. The index array passed in is
								// rewritten in place into an array of descriptor pointers and becomes
								// this list's m_ppdSorted, which is why UINT and PDESCRIPTOR must be the
								// same size.
								//
								//   ptklSource      -- list whose tokens are being selected
								//   paiSubset       -- indices into ptklSource->m_ppdSorted
								//   cTokensInSubset -- number of entries in paiSubset
								void CTokenList::InitialTokenList(CTokenList *ptklSource, PUINT paiSubset, UINT cTokensInSubset)
								{
								    AttachRef(m_ptklSource, ptklSource);

								    m_How_Constructed = TKL_SUBSET;
								    m_cd              = cTokensInSubset;
								    m_ppdTailSorted   = NULL;

								    // Shared with the source list.
								    m_pd              = ptklSource->m_pd;
								    m_pbImages        = ptklSource->m_pbImages;
								    m_cbImages        = ptklSource->m_cbImages;
								    m_pwDispImages    = ptklSource->m_pwDispImages;
								    m_cwDispImages    = ptklSource->m_cwDispImages;
								    m_cbMaxLength     = ptklSource->m_cbMaxLength;

								    ASSERT(sizeof(UINT) == sizeof(PDESCRIPTOR));

								    PDESCRIPTOR *papdSubset = (PDESCRIPTOR *) paiSubset;
								    PDESCRIPTOR *papdAll    = ptklSource->m_ppdSorted;

								    m_ppdSorted = papdSubset;

								    // Each slot is read as an index and then overwritten with the
								    // descriptor pointer that the index selects.
								    UINT iSlot;

								    for (iSlot = 0; iSlot < cTokensInSubset; ++iSlot)
								        papdSubset[iSlot] = papdAll[paiSubset[iSlot]];
								}


								// Header record written by CTokenList::StoreImage and read back by
								// CTokenList::ConnectImage. The "off" fields hold the value returned by
								// CPersist::NextOffset() just before the corresponding data was written.
								// The field order and sizes define the stored layout; do not rearrange.
								typedef struct _TokenListHeader

								        {

								            UINT cbMaxLength;            // m_cbMaxLength at store time

								            UINT cbImages;               // m_cbImages at store time

								          //  UINT offImages;

											UINT cwDispMaxLength;        // m_cwDispMaxLength at store time

											UINT cwDispImages;           // m_cwDispImages: WCHAR count of the display images

											UINT offwDispImages;         // Offset of the encoded display images

								            UINT cDescriptors;           // m_cd; m_cd + 1 descriptors are actually stored

								            UINT offDescriptors;         // Offset of the raw DESCRIPTOR array

								            UINT offppdSorted;           // Offset of the stored m_ppdSorted pointers

								            UINT offppdTailSorted;       // Offset of the stored tail-sorted pointers

								            UINT offpafClassifications;  // Offset of the classification flags

								            UINT offClassifier;          // Offset of the raw m_clsf image

											UINT cnTokenSortKeys;        // Not written by the current StoreImage (its assignment is commented out)

											UINT cnDispSortKeys;         // Value returned by Encode() for the display images

								            UINT lcid;                   // GetUserDefaultLCID() at store time


								            PDESCRIPTOR pdOld;           // m_pd at store time; ConnectImage uses it to relocate stored pointers


								        } TokenListHeader;


								// Header record written by CTokenList::StoreImage2 and read back by
								// CTokenList::ConnectImage2. The "off" fields hold the value returned by
								// CPersist::NextOffset() just before the corresponding data was written.
								// The field order and sizes define the stored layout; do not rearrange.
								typedef struct _TokenListHeader2

								        {

											UINT cwDispMaxLength;        // MaxWidthToken() at store time

											UINT cwDispImages;           // m_cwDispImages: WCHAR count of the display images

											UINT offwDispImages;         // Offset of the encoded display images

											UINT cnDispSortKeys;         // Value returned by Encode() for the display images

								            UINT cwSortKeyImages;        // m_cbImages: WCHAR count of the sort key images

								            UINT offwSortKeyImages;      // Offset of the encoded sort keys; 0 when stored with fIgnoreSortKeys

								            UINT cnSortKeyImages;        // Value returned by Encode() for the sort keys

								            UINT cDescriptors;           // m_cd

								            UINT offReferenceCounts;     // Offset of one DWORD reference count per descriptor

								            UINT offDescriptorFlags;     // Offset of two bytes per descriptor: bCharset, fImageFlags

								            UINT offppdSorted;           // Offset returned by StoreSortOrder for m_ppdSorted

								            UINT offppdTailSorted;       // Offset returned by StoreSortOrder for the tail sort order

								            UINT lcidSorting;            // GetUserDefaultLCID() at store time


								        } TokenListHeader2;


								// Save/Load Interface --


								// Writes this token list to a persistent image in the TokenListHeader2
								// format. Only valid for lists in the From_Images state.
								//
								// Written, in order:
								//   - the header (reserved first, filled in as the pieces are written)
								//   - the encoded display images
								//   - the encoded sort key images        (unless fIgnoreSortKeys)
								//   - one DWORD reference count per descriptor
								//   - two flag bytes per descriptor (bCharset, fImageFlags)
								//   - a compressed set of display image offsets
								//   - a compressed set of sort key offsets (unless fIgnoreSortKeys)
								//   - the left-to-right and tail sort orders
								//
								//   pDiskImage      -- destination image
								//   fIgnoreSortKeys -- TRUE to leave the sort keys out of the image
								void CTokenList::StoreImage2(CPersist *pDiskImage, BOOL fIgnoreSortKeys)
								{
								    ASSERT(m_How_Constructed == From_Images);

								    TokenListHeader2 *ptlh= (TokenListHeader2 *) pDiskImage->ReserveTableSpace(sizeof(TokenListHeader2));

								    ptlh->cwDispMaxLength = MaxWidthToken();
								    ptlh->cwDispImages    = m_cwDispImages;
								    ptlh->cDescriptors    = m_cd;
								    ptlh->lcidSorting     = GetUserDefaultLCID();

								    ptlh->offwDispImages  = pDiskImage->NextOffset();
								    ptlh->cnDispSortKeys  = pDiskImage->Encode(PBYTE(m_pwDispImages), m_cwDispImages * sizeof(WCHAR));

								    ptlh->cwSortKeyImages = m_cbImages;

								    // Both the offset and the Encode call belong to the "keep the sort
								    // keys" branch. Previously the Encode call sat after an unbraced
								    // else and so ran even when the caller asked for the sort keys to
								    // be left out.
								    if (fIgnoreSortKeys)
								    {
								        ptlh->offwSortKeyImages = 0;
								        ptlh->cnSortKeyImages   = 0;
								    }
								    else
								    {
								        ptlh->offwSortKeyImages = pDiskImage->NextOffset();
								        ptlh->cnSortKeyImages   = pDiskImage->Encode(PBYTE(m_pbImages), m_cbImages * sizeof(WCHAR));
								    }

								    PUINT           pcRefs     = NULL;     // Scratch array, reused for each table
								    CCompressedSet* pcsOffsets = NULL;

								    __try
								    {
								        pcRefs= PUINT(VAlloc(FALSE, sizeof(UINT) * m_cd));

								        PUINT       pui;
								        PDESCRIPTOR pd;
								        PWCHAR      pwcBase= m_pwDispImages;
								        PBYTE       pb;
								        UINT        c;

								        // Reference counts, one DWORD per descriptor.

								        for (pd= m_pd, c= m_cd, pui= pcRefs; c--; ) *pui++ = (pd++)->cReferences;

								        ptlh->offReferenceCounts = pDiskImage->NextOffset();
								        pDiskImage->WriteDWords(pcRefs, m_cd);

								        // Descriptor flags, two bytes per descriptor. The scratch
								        // array holds four bytes per descriptor, so they fit.

								        for (pd= m_pd, c= m_cd, pb= PBYTE(pcRefs); c--; pd++)
								        {
								            *pb++ = pd->bCharset;
								            *pb++ = pd->fImageFlags;
								        }

								        ptlh->offDescriptorFlags = pDiskImage->NextOffset();
								        pDiskImage->WriteBytes(PBYTE(pcRefs), m_cd * 2);

								        // Display image offsets (in WCHARs from m_pwDispImages).

								        for (pwcBase= m_pwDispImages, pd= m_pd, c= m_cd, pui= pcRefs; c--; )
								            *pui++ = (pd++)->pwDisplay - pwcBase;

								        pcsOffsets= CCompressedSet::NewCompressedSet(pcRefs, m_cd, m_cwDispImages);

								        pcsOffsets->StoreImage(pDiskImage);

								        delete pcsOffsets;  pcsOffsets= NULL;

								        if (!fIgnoreSortKeys)
								        {
								            // Sort key offsets (in WCHARs from m_pbImages).

								            for (pwcBase= m_pbImages, pd= m_pd, c= m_cd, pui= pcRefs; c--; )
								                *pui++ = (pd++)->pbImage - pwcBase;

								            pcsOffsets= CCompressedSet::NewCompressedSet(pcRefs, m_cd, m_cbImages);

								            pcsOffsets->StoreImage(pDiskImage);
								        }
								    }
								    __finally
								    {
								        if (pcRefs    ) { VFree(pcRefs);      pcRefs     = NULL; }
								        if (pcsOffsets) { delete pcsOffsets;  pcsOffsets = NULL; }
								    }

								    ptlh->offppdSorted     = StoreSortOrder(pDiskImage, m_ppdSorted);
								    ptlh->offppdTailSorted = StoreSortOrder(pDiskImage, PPDTailSorting());
								}


								// Writes a sort order to the image as descriptor indices split into byte
								// planes.
								//
								// Each descriptor pointer is converted to its index relative to m_pd.
								// The indices are then written one byte plane at a time, most significant
								// plane first; a high plane is written only when m_cd exceeds the
								// matching threshold, and the low plane is always written. Every plane
								// occupies m_cd bytes rounded up to a multiple of four.
								//
								//   pDiskImage   -- destination image
								//   ppdSortOrder -- m_cd descriptor pointers in the order to be stored
								//
								// Returns the image offset at which the first plane was written.
								UINT CTokenList::StoreSortOrder(CPersist *pDiskImage, PDESCRIPTOR *ppdSortOrder)
								{
								    // Upper planes: written only when m_cd is above the threshold.
								    static const int  acdThreshold[3] = { 0x1000000, 0x10000, 0x0100 };
								    static const UINT acBitsShift [3] = {        24,      16,      8 };

								    PUINT paiOrdinal = NULL;
								    PBYTE pbPlane    = NULL;

								    UINT offStart = pDiskImage->NextOffset();

								    __try
								    {
								        paiOrdinal = PUINT(VAlloc(FALSE, m_cd * sizeof(UINT)));

								        UINT cdTotal = m_cd;
								        UINT iToken;
								        UINT iPlane;

								        for (iToken = 0; iToken < cdTotal; ++iToken)
								            paiOrdinal[iToken] = ppdSortOrder[iToken] - m_pd;

								        UINT cbPlane = ((m_cd + 3) >> 2) << 2;

								        pbPlane = PBYTE(VAlloc(FALSE, cbPlane * sizeof(BYTE)));

								        for (iPlane = 0; iPlane < 3; ++iPlane)
								        {
								            if (!(m_cd > acdThreshold[iPlane]))
								                continue;

								            for (iToken = 0; iToken < cdTotal; ++iToken)
								                pbPlane[iToken] = paiOrdinal[iToken] >> acBitsShift[iPlane];

								            pDiskImage->WriteBytes(pbPlane, cbPlane);
								        }

								        // The low-order plane is always present.

								        for (iToken = 0; iToken < cdTotal; ++iToken)
								            pbPlane[iToken] = paiOrdinal[iToken];

								        pDiskImage->WriteBytes(pbPlane, cbPlane);
								    }
								    __finally
								    {
								        if (paiOrdinal)
								        {
								            VFree(paiOrdinal);
								            paiOrdinal = NULL;
								        }

								        if (pbPlane)
								        {
								            VFree(pbPlane);
								            pbPlane = NULL;
								        }
								    }

								    return offStart;
								}


								// Reads back a sort order written by StoreSortOrder.
								//
								// The byte planes found at the given offset are OR-ed together into an
								// array of descriptor indices (the array is allocated with VAlloc(TRUE,
								// ...) and is OR-ed into directly, so it is expected to start zeroed).
								// The indices are then converted in place into pointers into m_pd. The
								// same m_cd thresholds as in StoreSortOrder decide which high planes are
								// present.
								//
								//   pDiskImage -- source image
								//   offset     -- image offset of the first plane
								//
								// Returns a VAlloc'ed array of m_cd descriptor pointers. If an exception
								// unwinds through this routine the array is freed first.
								PDESCRIPTOR *CTokenList::LoadSortOrder(CPersist *pDiskImage, UINT offset)
								{
								    // Upper planes: present only when m_cd is above the threshold.
								    static const int  acdThreshold[3] = { 0x1000000, 0x10000, 0x100 };
								    static const UINT acBitsShift [3] = {        24,      16,     8 };

								    PUINT paiOrdinal = NULL;

								    __try
								    {
								        paiOrdinal = PUINT(VAlloc(TRUE, m_cd * sizeof(UINT)));

								        UINT cbPlane = ((m_cd + 3) >> 2) << 2;

								        PBYTE pbPlane = PBYTE(pDiskImage->LocationOf(offset));

								        UINT cdTotal = m_cd;
								        UINT iToken;
								        UINT iPlane;

								        for (iPlane = 0; iPlane < 3; ++iPlane)
								        {
								            if (!(m_cd > acdThreshold[iPlane]))
								                continue;

								            for (iToken = 0; iToken < cdTotal; ++iToken)
								                paiOrdinal[iToken] |= UINT(pbPlane[iToken]) << acBitsShift[iPlane];

								            pbPlane += cbPlane;
								        }

								        // The low-order plane is always present.

								        for (iToken = 0; iToken < cdTotal; ++iToken)
								            paiOrdinal[iToken] |= UINT(pbPlane[iToken]);

								        // Turn each index into a descriptor pointer, reusing the slot.

								        PDESCRIPTOR *papdOrder = (PDESCRIPTOR *) paiOrdinal;

								        for (iToken = 0; iToken < cdTotal; ++iToken)
								            papdOrder[iToken] = m_pd + paiOrdinal[iToken];
								    }
								    __finally
								    {
								        if (_abnormal_termination())
								        {
								            if (paiOrdinal)
								                VFree(paiOrdinal);

								            paiOrdinal = NULL;
								        }
								    }

								    return (PDESCRIPTOR *) paiOrdinal;
								}


								// Steps over a token list stored in the TokenListHeader2 format without
								// loading it: the header's table space is reserved and two compressed
								// set images are skipped.
								//
								//   pDiskImage -- image positioned at a stored token list
								void CTokenList::SkipImage2(CPersist *pDiskImage)
								{
								    // The header contents are not needed; the call is made only to
								    // advance past the header.
								    (void) pDiskImage->ReserveTableSpace(sizeof(TokenListHeader2));

								    UINT cSetsLeft = 2;

								    while (cSetsLeft--)
								        CCompressedSet::SkipImage(pDiskImage);
								}


								// Loads a token list stored in the TokenListHeader2 format and puts this
								// object into the From_Images state.
								//
								//   pDiskImage      -- image positioned at the stored token list
								//   fIgnoreSortKeys -- TRUE to leave the stored sort keys unread
								//
								// Returns TRUE when the low byte of the stored sorting LCID differs from
								// the low byte of the user's default LCID (i.e. !fLcidUnchanged), FALSE
								// otherwise.
								BOOL CTokenList::ConnectImage2(CPersist *pDiskImage, BOOL fIgnoreSortKeys)

								{

								    TokenListHeader2 *ptlh= (TokenListHeader2 *) pDiskImage->ReserveTableSpace(sizeof(TokenListHeader2));


								    m_cd              = ptlh->cDescriptors;

								    m_How_Constructed = From_Images;

									m_cwDispMaxLength = ptlh->cwDispMaxLength;

									m_cwDispImages	  = ptlh->cwDispImages;

								    m_lcidSorting     = ptlh->lcidSorting;


								    // For minimum-version FTS/FTG files the stored LCID is replaced by the
								    // complement of the user's LCID, which can never match it below.
								    if (   (pDiskImage->IsFTSFile() && pDiskImage->VersionIndex() == FTSVERSION_MIN)

								        || (pDiskImage->IsFTGFile() && pDiskImage->VersionIndex() == FTGVERSION_MIN)

								       ) m_lcidSorting = ~GetUserDefaultLCID(); // To force resorting


								    m_pwDispImages = (PWCHAR)VAlloc(FALSE, ptlh->cwDispImages * sizeof(WCHAR));


								    Decode((PUINT)pDiskImage->LocationOf(ptlh->offwDispImages), ptlh->cnDispSortKeys,  (PBYTE)m_pwDispImages);


								    // Only the low byte of each LCID takes part in the comparison.
								    BOOL fLcidUnchanged= (m_lcidSorting  & 0x0FF) == (GetUserDefaultLCID()  & 0x0FF);


								    // The stored sort keys are decoded only when they are both still
								    // valid for the user's locale and wanted by the caller.
								    if (fLcidUnchanged && !fIgnoreSortKeys)

									{

								        m_cbImages= ptlh->cwSortKeyImages;

								        m_pbImages= (PWCHAR)VAlloc(FALSE, m_cbImages * sizeof(WCHAR));


								        Decode((PUINT)pDiskImage->LocationOf(ptlh->offwSortKeyImages), ptlh->cnSortKeyImages, (PBYTE)m_pbImages);

									}


								    // One extra descriptor is allocated; its pointers mark the end of the
								    // image buffers.
								    m_pd= (PDESCRIPTOR) VAlloc(FALSE, sizeof(DESCRIPTOR) * (m_cd + 1));


								    m_pd[m_cd].pwDisplay = m_pwDispImages + m_cwDispImages;


								    if (fLcidUnchanged) m_pd[m_cd].pbImage = m_pbImages + m_cbImages;


								    PUINT pcRefs = PUINT(pDiskImage->LocationOf(ptlh->offReferenceCounts));

								    PUINT pui;


								    PDESCRIPTOR pd;

								    UINT        c;


								    for (pd= m_pd, pui= pcRefs, c= m_cd; c--; ) (pd++)->cReferences = *pui++;


								    // Two flag bytes were stored per descriptor: bCharset, fImageFlags.
								    PBYTE pbFlags= PBYTE(pDiskImage->LocationOf(ptlh->offDescriptorFlags));


								    for (pd= m_pd, c= m_cd; c--; pd++)

								    {

								        pd->bCharset    = *pbFlags++;

								        pd->fImageFlags = *pbFlags++;

								    }


								    CCompressedSet* pcsOffsets  = NULL;

								    CCmpEnumerator* pEnumerator = NULL;


								    __try

								    {

								        // First compressed set: display image offsets relative to
								        // m_pwDispImages.
								        AttachRef(pcsOffsets, CCompressedSet::CreateImage(pDiskImage));


								        pEnumerator= CCmpEnumerator::NewEnumerator(pcsOffsets);


								        for (pd= m_pd, c= m_cd; c; )

								        {

								            // cChunk goes in as the number of offsets still wanted and
								            // is subtracted from c afterwards -- presumably it comes
								            // back as the number actually delivered; confirm against
								            // CCmpEnumerator::NextDWordsIn.
								            UINT cChunk= c;


								            // NOTE: this pui hides the outer pui declared above.
								            const UINT *pui= pEnumerator->NextDWordsIn(&cChunk);


								            c -= cChunk;


								            for (; cChunk--; pd++)

								                pd->pwDisplay = m_pwDispImages + *pui++;

								        }


								        delete pEnumerator;  pEnumerator = NULL;

								        DetachRef(pcsOffsets);


								        // The caller does not want sort keys: stop here.
										if (fIgnoreSortKeys) __leave;


								        // The stored sort keys are for another language: step over the
								        // second compressed set instead of loading it.
										if (!fLcidUnchanged)

										{

										 	CCompressedSet::SkipImage(pDiskImage);


											__leave;

										}


								        // Second compressed set: sort key offsets relative to m_pbImages.
								        AttachRef(pcsOffsets, CCompressedSet::CreateImage(pDiskImage));


								        pEnumerator= CCmpEnumerator::NewEnumerator(pcsOffsets);


								        for (pd= m_pd, c= m_cd; c; )

								        {

								            UINT cChunk= c;


								            const UINT *pui= pEnumerator->NextDWordsIn(&cChunk);


								            c -= cChunk;


								            for (; cChunk--; pd++)

								                pd->pbImage = m_pbImages + *pui++;

								        }

								    }

								    __finally

								    {

								        // Runs on normal exit, on __leave and on an exception unwind.
								        if (pEnumerator) { delete pEnumerator;  pEnumerator = NULL; }

								        if (pcsOffsets ) DetachRef(pcsOffsets);

								    }


								    // Each display length is the distance to the next descriptor's display
								    // image; the extra descriptor at m_pd[m_cd] supplies the end for the
								    // last token.
								    for (pd= m_pd, c= m_cd; c--; pd++)

								        pd->cwDisplay = (pd+1)->pwDisplay - pd->pwDisplay;


								    m_ppdSorted     = LoadSortOrder(pDiskImage, ptlh->offppdSorted    );

								    m_ppdTailSorted = LoadSortOrder(pDiskImage, ptlh->offppdTailSorted);


								    CompleteTokenList(fIgnoreSortKeys);


								    return !fLcidUnchanged;

								}


								// Writes this token list to a persistent image in the TokenListHeader
								// format. Only valid for lists in the From_Images state.
								//
								// The header is reserved first; each "off" field records the image offset
								// in effect immediately before the matching piece of data is written.
								// Sort key images are not written (see the commented-out line below).
								//
								//   pDiskImage -- destination image
								void CTokenList::StoreImage(CPersist *pDiskImage)
								{
								    ASSERT(m_How_Constructed == From_Images);

								    TokenListHeader *ptlh = (TokenListHeader *) pDiskImage->ReserveTableSpace(sizeof(TokenListHeader));

								    // Scalar fields.

								    ptlh->cbMaxLength     = m_cbMaxLength;
								    ptlh->cbImages        = m_cbImages;
								    ptlh->cwDispMaxLength = m_cwDispMaxLength;
								    ptlh->cwDispImages    = m_cwDispImages;
								    ptlh->cDescriptors    = m_cd;
								    ptlh->pdOld           = m_pd;       // Lets the loader relocate stored pointers
								    ptlh->lcid            = GetUserDefaultLCID();

								  //  ptlh->offImages             = pDiskImage->NextOffset();  ptlh->cnTokenSortKeys = pDiskImage->Encode(PBYTE(m_pbImages), m_cbImages * sizeof(WCHAR));

								    // Display images.

								    ptlh->offwDispImages = pDiskImage->NextOffset();
								    ptlh->cnDispSortKeys = pDiskImage->Encode(PBYTE(m_pwDispImages), m_cwDispImages * sizeof(WCHAR));

								    // Descriptors, including the extra one at index m_cd.

								    ptlh->offDescriptors = pDiskImage->NextOffset();
								    pDiskImage->SaveData(PBYTE(m_pd), sizeof(DESCRIPTOR) * (m_cd + 1));

								    // Sort orders, stored as raw pointer values.

								    ptlh->offppdSorted = pDiskImage->NextOffset();
								    pDiskImage->WriteDWords(PUINT(m_ppdSorted), m_cd);

								    ASSERT(sizeof(PDESCRIPTOR) == sizeof(UINT));

								    ptlh->offppdTailSorted = pDiskImage->NextOffset();
								    pDiskImage->WriteDWords(PUINT(PPDTailSorting()), m_cd);

								    // Classification flags and the classifier itself.

								    ptlh->offpafClassifications = pDiskImage->NextOffset();
								    pDiskImage->WriteDWords(m_pafClassifications, m_cd);

								    ptlh->offClassifier = pDiskImage->NextOffset();
								    pDiskImage->SaveData(PBYTE(&m_clsf), sizeof(m_clsf));
								}


								// Factory: builds a token list from a persistent image in the
								// TokenListHeader format. The object is constructed with the
								// "from file" flag set and then connected to the image.
								//
								// If an exception unwinds through this routine after the object has been
								// allocated, the partially built object is deleted before the unwind
								// continues.
								//
								// Returns the new token list.
								CTokenList *CTokenList::CreateImage(CPersist *pDiskImage)
								{
								    CTokenList *ptklLoaded = NULL;

								    __try
								    {
								        ptklLoaded = New CTokenList(TRUE);

								        ptklLoaded->ConnectImage(pDiskImage);
								    }
								    __finally
								    {
								        // Only clean up when we are leaving because of an exception.
								        if (_abnormal_termination())
								        {
								            if (ptklLoaded)
								                delete ptklLoaded;

								            ptklLoaded = NULL;
								        }
								    }

								    return ptklLoaded;
								}


								// Steps over a token list stored in the TokenListHeader format by
								// reserving the header's table space; nothing is loaded.
								//
								//   pDiskImage -- image positioned at a stored token list
								void CTokenList::SkipImage(CPersist *pDiskImage)
								{
								    // The header contents are not needed; the call is made only to
								    // advance past the header.
								    (void) pDiskImage->ReserveTableSpace(sizeof(TokenListHeader));
								}


								// Loads a token list stored in the TokenListHeader format and puts this
								// object into the From_Images state.
								//
								// The stored descriptors are copied and their display pointers shifted to
								// the freshly decoded display images. Sort keys are always rebuilt for
								// the user's current locale. The stored sort orders are reused (with
								// their pointers relocated) only when the file is not a minimum-version
								// FTS/FTG file and the low byte of the stored LCID matches the user's;
								// otherwise the tokens are sorted again. The classification flags are
								// used directly from the image and the classifier is copied out of it.
								//
								//   pDiskImage -- image positioned at the stored token list
								void CTokenList::ConnectImage(CPersist *pDiskImage)
								{
								    UINT iToken;

								    LCID lcidUser = GetUserDefaultLCID();

								    TokenListHeader *ptlh = (TokenListHeader *) pDiskImage->ReserveTableSpace(sizeof(TokenListHeader));

								    m_cd              = ptlh->cDescriptors;
								    m_How_Constructed = From_Images;
								    m_cbMaxLength     = ptlh->cbMaxLength;
								    m_cbImages        = ptlh->cbImages;
								    m_cwDispMaxLength = ptlh->cwDispMaxLength;
								    m_cwDispImages    = ptlh->cwDispImages;

								    // Private copy of the descriptors (m_cd tokens plus the extra one).

								    PDESCRIPTOR pdStored = PDESCRIPTOR(pDiskImage->LocationOf(ptlh->offDescriptors));

								    m_pd = (PDESCRIPTOR) VAlloc(FALSE, sizeof(DESCRIPTOR) * (m_cd + 1));

								    CopyMemory(m_pd, pdStored, sizeof(DESCRIPTOR) * (m_cd + 1));

								    ValidateHeap();

								    m_pwDispImages = (PWCHAR)VAlloc(FALSE, ptlh->cwDispImages * sizeof(WCHAR));

								    // The stored display pointers are shifted by the distance between the
								    // first descriptor's stored pointer and the new buffer.
								    int cwcShift = m_pwDispImages - m_pd->pwDisplay;

								    ValidateHeap();

								    UINT cdWithEnd = m_cd + 1;

								    for (iToken = 0; iToken < cdWithEnd; ++iToken)
								        m_pd[iToken].pwDisplay += cwcShift;

								    ValidateHeap();

								    Decode((PUINT)pDiskImage->LocationOf(ptlh->offwDispImages), ptlh->cnDispSortKeys,  (PBYTE)m_pwDispImages);

								    ValidateHeap();

								    ConstructSortKeys(lcidUser);

								    // Minimum-version files never have a usable stored sort order.

								    BOOL fOldestFormat = pDiskImage->IsFTSFile()
								                            ? (pDiskImage->VersionIndex() == FTSVERSION_MIN)
								                            : (pDiskImage->IsFTGFile() && pDiskImage->VersionIndex() == FTGVERSION_MIN);

								    BOOL fValidSortOrder = !fOldestFormat;

								    if (fValidSortOrder && (ptlh->lcid & 0x0FF) == (lcidUser & 0x0FF))
								    {
								        // The stored arrays hold descriptor addresses from the process
								        // that wrote the file; move each one by the distance between
								        // the old and new descriptor arrays.

								        int  cbShift = PBYTE(m_pd) - PBYTE(ptlh->pdOld);
								        UINT cdTotal = m_cd;

								        PDESCRIPTOR *papdStored;

								        m_ppdSorted = (PDESCRIPTOR *) VAlloc(FALSE, m_cd * sizeof(PDESCRIPTOR));

								        papdStored = (PDESCRIPTOR *) (pDiskImage->LocationOf(ptlh->offppdSorted));

								        for (iToken = 0; iToken < cdTotal; ++iToken)
								            m_ppdSorted[iToken] = (PDESCRIPTOR) (PBYTE(papdStored[iToken]) + cbShift);

								        m_ppdTailSorted = (PDESCRIPTOR *) VAlloc(FALSE, m_cd * sizeof(PDESCRIPTOR));

								        papdStored = (PDESCRIPTOR *) (pDiskImage->LocationOf(ptlh->offppdTailSorted));

								        for (iToken = 0; iToken < cdTotal; ++iToken)
								            m_ppdTailSorted[iToken] = (PDESCRIPTOR) (PBYTE(papdStored[iToken]) + cbShift);
								    }
								    else
								    {
								        // The major language of the stored sort keys does not match the
								        // user's LCID (or the file is too old), so the stored ordering
								        // is probably wrong. Sort again.

								        UINT cdSorted = 0;

								        SortTokenImages(m_pd, &m_ppdSorted,  &m_ppdTailSorted, &cdSorted, m_cd);
								    }

								    // BugBug! The classification code below is broken when the sort keys
								    //         have changed!

								    m_pafClassifications = PUINT(pDiskImage->LocationOf(ptlh->offpafClassifications));

								    CopyMemory(&m_clsf, PBYTE(pDiskImage->LocationOf(ptlh->offClassifier)), sizeof(m_clsf));
								}


								void CTokenList::SynchronizeDatabase()

								{

								    ASSERT(m_How_Constructed == TDB_FULL_REF);


								    if (m_ptdb->m_pulstate->pld) m_ptdb->SyncForQueries();


								    m_cbImages  = m_ptdb->m_pbNextGalactic - m_pbImages;

								    m_ppdSorted = m_ptdb->m_ppdSorted;


								    m_cwDispImages  = m_ptdb->m_pwDispNextGalactic - m_pwDispImages;


								    UINT cd= m_ptdb->m_pdNextGalactic - m_pd;


								    if (m_cd != cd)

								    {

								        m_cd          = cd;  // NB: MaxWidthToken depends on m_ppdSorted

								                             //     and m_cd being set correctly!

								        m_cbMaxLength= m_ptdb->MaxTokenWidth();

								    }


								    m_ppdTailSorted      = m_ptdb->m_ppdTailSorted;

								    m_pafClassifications = m_ptdb->m_pafClassifications;


								#if 0

								    // Some measurement code...


								    int cTokens= ptdb->TokenCount();


								    int cRefThreshhold= (cTokens+31)/32, cRefs;


								    int cIndexSets= 0, cIndices= 0, cBitSets= 0, cActiveBits= 0, cSingletons= 0,

								        cMaxRefs= 0;


								    int acLogClassEntries[33] = { 0 },

								        acLogClassSums   [33] = { 0 };


								    int iClass;


								    PDESCRIPTOR pd      = ptdb->DescriptorBase(),

								                pdLimit = ptdb->m_pdNextGalactic;


								    for (; pd < pdLimit; ++pd)

								    {

								        cRefs= pd->cReferences;


								        iClass= CBitsToRepresent(cRefs);


								        ++acLogClassEntries[iClass];

								          acLogClassSums   [iClass] += cRefs;


								        if (cRefs > cMaxRefs) cMaxRefs= cRefs;


								        if (cRefs > cRefThreshhold)

								        {

								            ++cBitSets; cActiveBits+= cRefs;

								        }

								        else

								        {

								            ++cIndexSets; cIndices+= cRefs;


								            if (cRefs == 1) ++cSingletons;

								        }

								    }


								#endif


								}


								// Releases whatever this list holds.  The two ranking vectors are freed in
								// every case; the remaining cleanup depends on how the list was constructed.
								CTokenList::~CTokenList()
								{
								    if (m_pLRRanking) VFree(m_pLRRanking);
								    if (m_pRLRanking) VFree(m_pRLRanking);

								    switch (m_How_Constructed)
								    {
								    case From_Nothing:

								        // Nothing beyond the ranking vectors to release.
								        break;

								    case TDB_FULL_REF:

								        // Only the database reference is dropped here; none of the vectors
								        // are freed in this mode.
								        ASSERT(m_ptdb);

								        DetachRef(m_ptdb);

								        break;

								    case TDB_PARTIAL_REF:

								        // The two sort vectors are freed, then the database reference (if any)
								        // is dropped.
								        if (m_ppdSorted    ) VFree(m_ppdSorted);
								        if (m_ppdTailSorted) VFree(m_ppdTailSorted);

								        if (m_ptdb) DetachRef(m_ptdb);

								        // The classification vector is freed only when the list did not come
								        // from a file image.
								        if (!m_fFromFileImage && m_pafClassifications) VFree(m_pafClassifications);

								        break;

								    case From_Images:

								        // Image buffers, descriptors and both sort vectors are all freed.
								        if (m_pbImages     ) VFree(m_pbImages     );
								        if (m_pwDispImages ) VFree(m_pwDispImages );
								        if (m_pd           ) VFree(m_pd           );
								        if (m_ppdSorted    ) VFree(m_ppdSorted    );
								        if (m_ppdTailSorted) VFree(m_ppdTailSorted);

								        if (!m_fFromFileImage && m_pafClassifications) VFree(m_pafClassifications);

								        break;

								    case TKL_SUBSET:

								        // Only the sort vector is freed; the source list is just dereferenced.
								        if (m_ppdSorted) VFree(m_ppdSorted);

								        if (m_ptklSource) DetachRef(m_ptklSource);

								        break;
								    }
								}


								int CTokenList::MaxWidthToken()

								{

								    if (m_cwDispMaxLength) return m_cwDispMaxLength;


								    PDESCRIPTOR *ppd= m_ppdSorted;


								    int c= m_cd;


								    int cwDispMaxLength= 0;


								    for (; c--; )

								    {

								        int cbWidth;


								        PDESCRIPTOR pd= *ppd++;


								      	cbWidth= CwDisplay(pd);


								        if (cwDispMaxLength < cbWidth) cwDispMaxLength= cbWidth;

								    }


								    m_cwDispMaxLength= cwDispMaxLength;


								    return m_cwDispMaxLength;

								}


								// Combines the tokens in this list with those in *ptl.
								//
								// The two sorted descriptor vectors are merged (ordered by CompareImagesLR)
								// into a freshly allocated descriptor array, pointer vector and image buffer.
								// Every merged token is then re-classified, the storage held under the
								// previous construction mode is released, and this list becomes a
								// From_Images list.
								//
								// If *ptl was constructed From_Nothing this list is left untouched.  If the
								// __try block is left abnormally, the partially built buffers are freed.
								//
								// NOTE(review): the merged descriptors are struct copies, so their pwDisplay
								//               members still point at the display text of the lists they
								//               were copied from -- confirm who keeps that text alive.
								// NOTE(review): for TDB_FULL_REF / TDB_PARTIAL_REF / TKL_SUBSET lists the
								//               references (m_ptdb, m_ptklSource) are not detached here even
								//               though the destructor would have detached them -- verify
								//               whether that is intentional.
								void CTokenList::AddTokens(CTokenList *ptl)
								{
								    PDESCRIPTOR   pdResult          = NULL;
								    PDESCRIPTOR *ppdResult          = NULL;
								    PWCHAR       pbImages           = NULL;
								    PUINT        pafClassifications = NULL;

								    __try
								    {
								        if (m_How_Constructed == TDB_FULL_REF) SynchronizeDatabase();

								        // Nothing to merge.  __leave (rather than return) keeps this a
								        // normal termination of the __try block.
								        if (ptl->m_How_Constructed == From_Nothing) __leave;

								        int cdResult= m_cd + ptl->m_cd;

								        // One extra descriptor is allocated; it is filled in after the copy
								        // loop with the address just past the last image.
								        pdResult  = (PDESCRIPTOR  ) ExAlloc(LPTR, sizeof( DESCRIPTOR) *(cdResult+1));
								        ppdResult = (PDESCRIPTOR *) ExAlloc(LPTR, sizeof(PDESCRIPTOR) * cdResult);

								        MergeImageRefSets((PVOID *)        ppdResult,  cdResult,
								                          (PVOID *)      m_ppdSorted,      m_cd,
								                          (PVOID *) ptl->m_ppdSorted, ptl->m_cd,
								                          CompareImagesLR
								                         );

								        PDESCRIPTOR pdDest, *ppdDest;

								        int c, cbImages= 0;

								        // Pass 1: total image length (in WCHARs) of the merged set.
								        for (ppdDest= ppdResult,  c= cdResult;  c-- ;)
								            cbImages += CbImage(*ppdDest++);

								        pbImages= (PWCHAR) ExAlloc(LPTR, cbImages * sizeof(WCHAR));

								        PWCHAR pbDest= pbImages;

								        // Pass 2: copy each descriptor and its image into the new arrays,
								        // retargeting the sort vector and pbImage at the copies.
								        for (c= cdResult, pdDest= pdResult, ppdDest= ppdResult; c--; ++pdDest)
								        {
								            *pdDest= **ppdDest;

								            UINT  cb= CbImage(*ppdDest);    // measured on the source descriptor

								            *ppdDest++ = pdDest;

								            wcsncpy(pbDest, pdDest->pbImage, cb);

								            pdDest->pbImage= pbDest;

								            pbDest += cb;
								        }

								        // Trailing descriptor: records where the image data ends.
								        pdDest->pbImage   = pbDest;
								        pdDest->pwDisplay = pbDest;

								        m_clsf.Initial();
								        m_clsf.ScanAndRankData(pbImages, cbImages);

								        // One classification word per merged token.  (Was sizeof(BOOL *),
								        // which only matches the UINT element size where pointers are 32 bits.)
								        pafClassifications= (PUINT ) VAlloc(FALSE, cdResult * sizeof(UINT));

								        PUINT  pf;

								        for (pf= pafClassifications, c=cdResult, ppdDest= ppdResult; c--; )
								        {
								            pdDest= *ppdDest++;
								            *pf++ = m_clsf.ClassifyData(pdDest->pbImage, CbImage(pdDest));
								        }

								        // Everything has been built; now release what the old construction
								        // mode held.  Each free is NULL-guarded, as in the destructor:
								        // m_pwDispImages in particular is NULL after an earlier AddTokens.
								        // The classification vector is freed only when it is not part of a
								        // file image, which is the same test the destructor applies.
								        switch (m_How_Constructed)
								        {
								        case TDB_FULL_REF:
								        case From_Nothing:

								            break;

								        case TDB_PARTIAL_REF:

								            if (m_ppdSorted    ) VFree(m_ppdSorted);
								            if (m_ppdTailSorted) VFree(m_ppdTailSorted);

								            if (!m_fFromFileImage && m_pafClassifications) VFree(m_pafClassifications);

								            break;

								        case From_Images:

								            if (m_pbImages     ) VFree(m_pbImages     );
								            if (m_pwDispImages ) VFree(m_pwDispImages );
								            if (m_pd           ) VFree(m_pd           );
								            if (m_ppdSorted    ) VFree(m_ppdSorted    );
								            if (m_ppdTailSorted) VFree(m_ppdTailSorted);

								            if (!m_fFromFileImage && m_pafClassifications) VFree(m_pafClassifications);

								            break;
								        }

								        // The cached rankings and maximum display width describe the old
								        // token set (old m_pd / m_cd); drop them so they are rebuilt on demand.
								        if (m_pLRRanking) { VFree(m_pLRRanking);  m_pLRRanking = NULL; }
								        if (m_pRLRanking) { VFree(m_pRLRanking);  m_pRLRanking = NULL; }

								        m_cwDispMaxLength    = 0;

								        m_How_Constructed    = From_Images;
								        m_fFromFileImage     = FALSE;       // new classification vector is ours to free
								        m_pbImages           = pbImages;    pbImages= NULL;
								        m_pwDispImages       = NULL;        // as before: no separate display buffer is owned
								        m_cbImages           = cbImages;
								        m_cwDispImages       = cbImages;
								        m_pd                 = pdResult;    pdResult= NULL;
								        m_cd                 = cdResult;
								        m_ppdSorted          = ppdResult;  ppdResult= NULL;
								        m_ppdTailSorted      = NULL;  // This will be computed on demand.
								        m_ptdb               = NULL;
								        m_cbMaxLength        = 0;     // This will be computed on demand.
								        m_pafClassifications = pafClassifications;  pafClassifications= NULL;
								    }
								    __finally
								    {
								        if (_abnormal_termination())
								        {
								            if (pdResult          ) { VFree(pdResult          );  pdResult           = NULL; }
								            if (ppdResult         ) { VFree(ppdResult         );  ppdResult          = NULL; }
								            if (pbImages          ) { VFree(pbImages          );  pbImages           = NULL; }
								            if (pafClassifications) { VFree(pafClassifications);  pafClassifications = NULL; }
								        }
								    }
								}


								// Sets up incTail according to the algorithm given by Wojciech Rytter in

								// his paper, CORRECT PREPROCESSING ALGORITHM FOR BOYER-MOORE STRING SEARCHING,

								// Society for Industrial and Applied Mathematics, Vol. 9, No. 3, Aug 1980.

								// The labels given below correspond roughly to those given in Rytter's paper.


								/* Let incTail[n] be an array of WORDs, where n=patlen.  Then we have four

								 * possible values for each incTail[j], 1 <= j <= n.  We have for 1 <= j <= n

								 *

								 *    incTail[j] = 2*n-j       for the case of *pat[j]...*pat[n] not

								 *                appearing elsewhere in the pattern

								 *    incTail[j] < n           where incTail[j]=n-l, l=max{i | *pat[i+1]...

								 *                *pat[n] appears elsewhere in the pattern and

								 *                *pat[l] != *pat[j]}

								 *    n <= incTail[j] < 2*n-j  j <= SHIFT(*pat), where SHIFT(*pat) is the

								 *                smallest shift of the pattern on itself s.t.

								 *                the two sections of the pattern match.  In

								 *                other words, if SHIFT(*pat)=i, then *pat[1]...

								 *                *pat[n-i]=*pat[i+1]...*pat[n].  For example,

								 *                consider abbaaab.  The smallest shift on itself

								 *                is 5, giving us

								 *

								 *                    abbaaab

								 *                    --->>abbaaab

								 *

								 *                Note:  if the pattern cannot be shifted on

								 *                itself and still have a prefix match a suffix,

								 *                then SHIFT(*pat)=patlen; for example, consider

								 *                string:

								 *

								 *                    string

								 *                    ---->>string

								 *    n <  incTail[j] < 2*n-j  j >  SHIFT(*pat).

								 */


								#define MIN(a,b) (((a) <= (b))? (a) : (b))

								// Builds the Boyer-Moore shift tables for the n-character pattern pat.
								//
								//   incLastChar -- indexed by WCHAR value, INC_LAST_CHAR_SIZE entries.  After
								//                  the call an entry holds n for a character that is not in
								//                  the pattern, otherwise the distance from that character's
								//                  last occurrence to the end of the pattern (0 for the
								//                  final pattern character).
								//   incVar      -- scratch array used while the tail shifts are computed.
								//   incTail     -- the tail-shift table described in the comment above,
								//                  indexed from 0.
								//
								// incVar and incTail are indexed by pattern position, so the caller must
								// supply at least n entries for each.
								void SetUpTables(WORD n, PWCHAR pat, WORD *incLastChar, WORD *incVar, WORD *incTail)
								{
								    WORD k, j, j1, t, t1, q, q1;  /* n   = patlen      */
								    WORD i;
								    WORD *pit;

								    PWCHAR pb;

								    // Default shift for every possible WCHAR value is the whole pattern
								    // length.  All INC_LAST_CHAR_SIZE entries must be written: a 16-bit
								    // down-counter starting at INC_LAST_CHAR_SIZE-1 stops one short and
								    // leaves the entry for 0xFFFF uninitialised.
								    {
								        WORD *piFill  = incLastChar;
								        WORD *piLimit = incLastChar + INC_LAST_CHAR_SIZE;

								        while (piFill < piLimit) *piFill++ = n;
								    }

								    // Later occurrences overwrite earlier ones, so each pattern character
								    // ends up with the distance from its last occurrence to the pattern end.
								    for (t= n, pb= pat; t--; ) incLastChar[*pb++]= t;

								/* Case 1: incTail[j] = 2*n-j */

								// A1:

								    for (i= 2*n, j= n, pit= incTail; j--;) *pit++ = --i;

								//  for (k=n; k>0; k--) incTail[k-1] = 2*n-k;

								/* Case 2: incTail[j] < n, *pat[l] != *pat[j], where l=n-incTail[j] */

								// A2:

								    for (j= n, t= n; j--; --t)
								        for (incVar[j]= t; t < n && pat[j] != pat[t]; t= incVar[t])
								            incTail[t]= MIN(incTail[t],n-j-1);

								//  for (j= n, t= n+1; j>0; --t, --j)
								//  for (incVar[j-1]= t; t <= n && pat[j-1] != pat[t-1]; t= incVar[t-1])
								//      incTail[t-1]= MIN(incTail[t-1],n-j);

								    q = t;
								    t = n-q;

								// B1:

								    // (WORD)-1 serves as the "no position" value in this pass.
								    for (j1= 0, t1= (WORD)-1; j1 < t; ++t1, ++j1)
								        for (incVar[j1]= t1; t1 != (WORD)-1 && pat[j1] != pat[t1]; )
								            t1= incVar[t1];

								/* Case 3: n <= incTail[j] < 2*n-j, j <= SHIFT(*pat) = incVar[0] = t,
								   AND
								   Case 4: n <  incTail[j] < 2*n-j, j >  SHIFT(*pat),
								   where SHIFT = minimum non-zero shift of pattern itself
								 */

								// B2:

								    // NB: the updates of q and t rely on WORD (16-bit) wrap-around when
								    //     incVar[t-1] holds the (WORD)-1 value.
								    for (q1= 0; q < n-1; q1++, q=q+t-incVar[t-1]-1, t= incVar[t-1]+1)
								        for (k=q1; k <= q; k++) incTail[k] = MIN(incTail[k],n+q-k);
								}


								/* Strategic Goal: How to make the TokensContaining function fast for very

								                   Large Token Sets


								   The time required for an invocation of TokensContaining is a function of

								   the total string lengths for the token set and the length of the target

								   string. For a constant target the search operation will be a linear

								   function of the total string length and the number of partial and

								   complete string matches. For a given token set the time for a search is

								   inversely proportional to the length of the target string.


								   This leads to two very good cases:


								       * a short or medium list of token strings to search

								       * a long target string


								   and one very poor case:


								       * a long list of token strings to search and a short target string

								         [Searching for a single character is the worst situation.]


								>> First Idea: Tag each token with letter set flags.


								   This will be implemented as a vector of DWords corresponding to each

								   token. We'll group the set of 256 characters (65,536 glyphs when we

								   move to Unicode) into 32 sets based on the count of their use within

								   the token set. Letters such as "E"and "T" with very high frequencies

								   will be treated as separate classes while less frequently used characters

								   (0x255, for example) will be aggregated into classes.


								   When we search for a target string, we will first construct a 32-bit mask

								   which defines the classes of characters contained in the target. Then

								   we'll strobe the masks for each token looking for a class set match:


								        if ( (afClassMasks[iToken] & fTarget) == fTarget) ...


								   When we find a class match, then we'll invoke the string search code to

								   determine whether we have an actual hit or just a class collision. For a

								   single character target, no string search is necessary.


								>> Second Idea: Maintain "Not-Used" Flags for each Character Value


								   Then when a target string contains a character known to never occur

								   in the token string set, we can immediately abandon the search.


								** Aside: How to Partition the Set of Characters in Use?


								   The partitioning algorithm must be bounded linearly in the number of

								   unique characters actually used in the token set, and it must meet these

								   goals:


								   -- The partition sets must be partially ordered. That is, if aRefs is

								      a vector of reference counts for the code points in each partition,

								      then acRefs[i] >= acRefs[i+1].


								   -- The count of members in each partition is also partially ordered. That is,

								      acMembers[i] <= acMembers[i+1].


								   -- The number of partitions will be maximized.


								   -- The count of members in each partition will be minimized given

								      that the above conditions are satisfied.


								   An Algorithm:


								   Assume -- aiSortByCRefs is a permutation vector for the set of unique

								                character values such that acRefChar[aiSortByCRefs] is

								                partially ordered.


								             aiPartitionBase is a 33 element array which will contain

								                index values defining the characters contained in each

								                partition. In particular partition j will consist of the

								                characters


								                   aiSortByCRefs[aiPartitionBase[j]] through

								                   aiSortByCRefs[aiPartitionBase[j+1]-1]


								    cPartitions= (cCharClasses <= 32)? cCharClasses : 32;


								    for (j=0; j < cPartitions; ++j) aiPartitionBase[j]=j;


								    aiPartitionBase[j]= cCharClasses;


								    if (cCharClasses > 32)

								    {

								        for (i= 0; i < 32; ++i)

								        {

								            cRefs= 0


								            for (j= aiPartitionBase[i], limit= aiPartitionBase[i+1];

								                 j < limit;

								                 ++j

								                ) cRefs+= acRefChar[aiSortByCRefs[j]];


								            acRefsPartition[i]= cRefs;

								        }


								        do

								            for (fChanges= FALSE, i= 32; --i;)

								                while (    acRefsPartition[i  ] > acRefsPartition[i-1]

								                       && (aiPartitionBase[i+1] - aiPartitionBase  [i  ]) > 1

								                      )

								                {

								                   cRefs= acRefChar[aiSortByCRefs[aiPartitionBase[i]++]];

								                   acRefsPartition[i  ] -= cRefs;

								                   acRefsPartition[i-1] += cRefs;


								                   fChanges= TRUE;

								                }

								        while (fChanges);

								    }


								>> Third Idea: Maintain Search Histories


								   The browser uses incremental searches most of the time. That is, the next

								   search request is usually the same as the previous search with either a

								   character added or a character deleted.


								   Consider the case where each successive target adds a letter to the right

								   end of the string. Each search result will always be a subset of the

								   preceding searches. The basic idea here is to keep an array of WORD or

								   DWORD flags corresponding to each token, along with the most recently

								   used target string. Each character in the target will correspond to one

								   bit in the WORD or DWORD tag. When we add a new trailing character, we'll

								   examine only the tokens corresponding to the most recent bit flag, and

								   we'll add a new bit for the new search subset, shifting the previous

								   bits left by one position.


								   Of course this procedure can only continue for 16 or 32 iterations.

								   However a target longer than 16 characters will always have very few

								   instances among the token set [except in contrived cases].


								   Usually we'll have a complete set of flags for the predecessor sets.

								   However for those odd cases where we don't, we can keep the string

								   corresponding to each bit flag. In general this will allow for rapid

								   incremental searches and will also make backspace operations very swift.


								>> Fourth Idea: Maintain Multiple Sort Mappings


								   For the "Begin With" case the matching tokens will always be contiguously

								   located within the sorted list of tokens. Thus we can use a simple binary

								   search to locate the end points of the matching token subset. In a

								   similar fashion we can make "End With" matches very fast by constructing

								   a sorting map based on the reverse byte ordering of each token.

								 */


								// Returns an indicator set for the tokens which contain the string denoted by
								// pszSubstring. If fStarting is TRUE, the string must occur at the beginning
								// of the token. If fEnding   is TRUE, the string must occur at the end of token.
								//
								// pisFilter, when supplied, must cover the same number of items as this list
								// (asserted); the result is ANDed with it.
								//
								// The first character of pszSubstring is skipped as a prefix before the
								// pattern is examined in the general (neither starting nor ending) case.
								CIndicatorSet *CTokenList::TokensContaining(PWCHAR pszSubstring, BOOL fStarting,
								                                         BOOL fEnding, CIndicatorSet *pisFilter)
								{
								    ASSERT(!pisFilter || m_cd == pisFilter->ItemCount());

								    if (m_How_Constructed == TDB_FULL_REF) SynchronizeDatabase();

								    CIndicatorSet *pisResult= NULL;

								    if (fStarting || fEnding)
								    {
								        // Anchored searches are delegated to the sorted-span routines.  The
								        // abort check and the filter step are bracketed like the rest of
								        // this file's search code so that the attached result is released
								        // if one of them leaves abnormally (presumably by raising).
								        __try
								        {
								            if (fStarting)
								                 AttachRef(pisResult, TokensStartingWith(pszSubstring, fEnding));
								            else AttachRef(pisResult, TokensEndingWith  (pszSubstring         ));

								            CAbortSearch::CheckContinueState();

								            if (pisFilter) pisResult->ANDWith(pisFilter);
								        }
								        __finally
								        {
								            if (_abnormal_termination())
								            {
								                if (pisResult) DetachRef(pisResult);
								            }
								        }

								        ForgetRef(pisResult);

								        return pisResult;
								    }

								    CIndicatorSet *pisCandidates = NULL;
								    int           *paiCandidates = NULL;
								    PWORD          pIncLastChar  = NULL;

								    __try
								    {
								        PWCHAR workL = PWCHAR(_alloca(WORKBUF_SIZE * sizeof(WCHAR)));

								        if (!workL) RaiseException(STATUS_NO_MEMORY, EXCEPTION_NONCONTINUABLE, 0, NULL);

								        PWCHAR workR = PWCHAR(_alloca(WORKBUF_SIZE * sizeof(WCHAR)));

								        if (!workR) RaiseException(STATUS_NO_MEMORY, EXCEPTION_NONCONTINUABLE, 0, NULL);

								        pszSubstring++;     							    // skip over alpha-num-punc prefix

								        UINT cwL = SortKeyText(pszSubstring, wcslen(pszSubstring), workL, WORKBUF_SIZE);

								        if (cwL > 2*MAX_PATTERN_LENGTH) cwL = 2*MAX_PATTERN_LENGTH;

								        UINT cwPattern = cwL / 2;   // pattern length is taken as half the sort-key length

								        CClassifier *pclsf = (m_How_Constructed == TDB_FULL_REF) ? &(m_ptdb->m_clsfTokens) : &m_clsf;

								        UINT fClass= pclsf->ClassifyData(pszSubstring, cwPattern);

								        // The classifier flagged the pattern with UNUSED_GLYPH: return a
								        // freshly created set without searching.
								        if (fClass & CClassifier::UNUSED_GLYPH)
								        {
								            AttachRef(pisResult, CIndicatorSet::NewIndicatorSet(m_cd));

								            __leave;
								        }

								        CAbortSearch::CheckContinueState();

								        // Candidate set is built from the per-token classification flags and fClass.
								        AttachRef(pisCandidates, CIndicatorSet::NewIndicatorSet(m_cd, m_pafClassifications, fClass, fClass));

								        if (pisFilter) pisCandidates->ANDWith(pisFilter);

								        UINT cCandidates= pisCandidates->SelectionCount();
								        UINT cProcessed;
								        UINT c, cwR, cCandidatesChunk;

								        int  *pi, iRank;

								        CAbortSearch::CheckContinueState();

								        paiCandidates = (int *) VAlloc(FALSE, CDW_CANDIDATE_BUFFER * sizeof(int));

								        ASSERT(paiCandidates);

								        if (cwL == 2)
								        {
								            // Single-character pattern: compare sort keys for every candidate.
								            AttachRef(pisResult, CIndicatorSet::NewIndicatorSet(m_cd));

								            for (cProcessed = 0; cProcessed < cCandidates; cProcessed += cCandidatesChunk)
								            {
								                CAbortSearch::CheckContinueState();

								                cCandidatesChunk = pisCandidates->MarkedItems(cProcessed, paiCandidates, CDW_CANDIDATE_BUFFER);

								                for (c = cCandidatesChunk, pi = paiCandidates; c--; )
								                {
								                    iRank= *pi++;

								                    PDESCRIPTOR pdCandidate = m_ppdSorted[iRank];

								                    cwR = SortKeyText(pdCandidate->pbImage+1, CbImage(pdCandidate)-1, workR, WORKBUF_SIZE);

								                    if (HasASubstring(workL, cwL, workR, cwR))
								                        pisResult->RawSetBit(iRank);
								                }
								            }

								            // Clear the pointer once freed so the __finally cleanup cannot
								            // free it a second time if a later call leaves abnormally.
								            VFree(paiCandidates);     paiCandidates = NULL;

								            DetachRef(pisCandidates);

								            pisResult->InvalidateCache();

								            __leave;
								        }

								        AttachRef(pisResult, CIndicatorSet::NewIndicatorSet(m_cd));

								        pIncLastChar = New WORD[INC_LAST_CHAR_SIZE];

								        WORD  incVar[MAX_PATTERN_LENGTH], incTail[MAX_PATTERN_LENGTH];

								        SetUpTables(cwPattern, pszSubstring, pIncLastChar, incVar, incTail);

								        BOOL fAllLowerCase= AllLowerCase(pszSubstring, wcslen(pszSubstring));

								        for (cProcessed = 0; cProcessed < cCandidates; cProcessed += cCandidatesChunk)
								        {
								            CAbortSearch::CheckContinueState();

								            cCandidatesChunk = pisCandidates->MarkedItems(cProcessed, paiCandidates, CDW_CANDIDATE_BUFFER);

								            for (c = cCandidatesChunk, pi = paiCandidates; c--; )
								            {
								                iRank= *pi++;

								                PDESCRIPTOR pdCandidate = m_ppdSorted[iRank];

								                UINT inc;

								                PWCHAR pwBase  = pdCandidate->pbImage+1;    // skip the token's prefix character
								                PWCHAR pwStart = pwBase;
								                PWCHAR pwLimit = pwBase;

								                // The scan stops at the first character whose high byte is
								                // SORT_KEY_SEPARATOR.
								                while (HIBYTE(*pwLimit) != SORT_KEY_SEPARATOR)
								                    pwLimit++;

								                // Boyer-Moore scan, driven by the tables from SetUpTables.
								                for (pwBase += cwPattern-1; pwBase < pwLimit; pwBase += inc)
								                {
								                    inc = *(pIncLastChar + *pwBase);

								                    if (inc)
								                        continue;

								                    // Last pattern character matched; compare the rest backwards.
								                    int cwUnmatched = cwPattern-1;

								                    PWCHAR pwTarget = pszSubstring + cwUnmatched;

								                    for ( ; cwUnmatched && *--pwTarget == *--pwBase; --cwUnmatched) {};

								                    if (cwUnmatched)
								                    {
								                        inc = incTail[cwUnmatched-1];
								                        continue;
								                    }

								                    // When AllLowerCase reports TRUE for the pattern the raw
								                    // match is accepted as is.
								                    if (fAllLowerCase)
								                    {
								                        pisResult->RawSetBit(iRank);

								                        break;
								                    }

								                    // Otherwise confirm the hit by comparing sort keys.
								                    cwR = SortKeyText(pwStart, CbImage(pdCandidate)-1, workR, WORKBUF_SIZE);

								                    if (HasASubstring(workL, cwL, workR, cwR))
								                        pisResult->RawSetBit(iRank);

								                    break;
								                }
								            }
								        }

								        // Allocated with New WORD[...], so it must be released with delete [].
								        delete [] pIncLastChar;   pIncLastChar  = NULL;

								        VFree(paiCandidates);     paiCandidates = NULL;

								        DetachRef(pisCandidates);

								        pisResult->InvalidateCache();

								        __leave;
								    }
								    __finally
								    {
								        if (_abnormal_termination())
								        {
								            if (pIncLastChar ) { delete [] pIncLastChar;  pIncLastChar  = NULL; }
								            if (paiCandidates) { VFree(paiCandidates);    paiCandidates = NULL; }
								            if (pisResult    ) DetachRef(pisResult    );
								            if (pisCandidates) DetachRef(pisCandidates);
								        }
								    }

								    ForgetRef(pisResult);

								    return pisResult;
								}


								// Returns a pair of numbers, *piSpanBase and *piSpanLimit, which define a span
								// within the supplied token sorting vector, ppdSorted. The tokens in that span
								// match the supplied pszSubstring in the sense that either the leading or
								// trailing characters match the substring. The comparison function,
								// pCompareImages, determines whether leading or trailing characters are
								// significant.
								//
								// The explicit result will be FALSE if the span is empty (both outputs are then
								// set to 0), and TRUE otherwise.
								//
								// Side Effect: The string is modified in place while the search runs and is
								//              put back before returning.
								//
								// NOTE(review): when the effective pattern length is zero, the left-to-right
								//               path steps pb back to pszSubstring-1 before incrementing *pb --
								//               confirm callers never pass such a pattern.
								BOOL CTokenList::TokenSpan(PDESCRIPTOR *ppdSorted, PWCHAR pszSubstring, PCompareImages pCompareImages,
								                           PUINT  piSpanBase, PUINT  piSpanLimit)
								{
								    // An empty list has no ppdSorted[0] to compare against.
								    if (!m_cd)
								    {
								        *piSpanBase  = 0;
								        *piSpanLimit = 0;

								        return FALSE;
								    }

								    int cbPattern = wcslen(pszSubstring);

								    if (cbPattern > MAX_PATTERN_LENGTH) cbPattern= MAX_PATTERN_LENGTH;

								    int    cb = cbPattern;
								    PWCHAR pb = pszSubstring;

								    BOOL  fLeftToRight = pCompareImages == &CompareImagesLR;

								    // Start with the character currently at [cb]; if no separator is found
								    // below, writing wSaved back to pszSubstring[cb] is then a no-op instead
								    // of storing an uninitialised value.
								    WCHAR wSaved = pszSubstring[cb];

								    DESCRIPTOR  tki[2];
								    DESCRIPTOR *ptki= &tki[0];

								    // tki[0] stands in for the pattern; tki[1] supplies the address just past it.
								    tki[0].pbImage = pszSubstring;
								    tki[1].pbImage = pszSubstring + cbPattern;

								    UINT  iMatchBase, iMatchLimit, iMatchMiddle, cDiff, iBracketBase, iBracketLimit;

								    if (fLeftToRight)
								        for (int i = 0; i < cb; i++)                            // scan the pattern
								            if (HIBYTE(pszSubstring[i]) == SORT_KEY_SEPARATOR)  // search for first weight separator
								            {
								                wSaved = pszSubstring[i];
								                pszSubstring[i] = 0;
								                cb = i;                                         // return character length
								                break;
								            }

								    // Now we're going to use a binary search algorithm to find
								    // the lowest index iBracketBase where tki <= ppdSorted[iBracketBase]

								    if (0 >= pCompareImages(&ptki, &ppdSorted[0]) ) iBracketBase= 0;
								    else
								    {
								        // Here the loop invariants are:
								        //
								        //  for i in [0 .. iMatchBase], ppdSorted[i] < tki
								        //
								        //  for j in [iMatchLimit .. m_cd-1], ppdSorted[j] >= tki

								        for (iMatchBase = 0, iMatchLimit = m_cd; 1 < (cDiff = iMatchLimit - iMatchBase); )
								        {
								            iMatchMiddle = iMatchBase + cDiff/2;

								            CAbortSearch::CheckContinueState();

								            if (0 < pCompareImages(&ptki, &ppdSorted[iMatchMiddle]) )
								                 iMatchBase  = iMatchMiddle;
								            else iMatchLimit = iMatchMiddle;
								        }

								        iBracketBase= iMatchLimit;
								    }

								    if (iBracketBase == m_cd)
								    {
								        // Every token sorts below the pattern: empty span.
								        *piSpanBase  = 0;
								        *piSpanLimit = 0;

								        if (fLeftToRight) pszSubstring[cb] = wSaved;
								        return FALSE;
								    }

								    iBracketLimit= m_cd;

								    BOOL  fReturn = TRUE;

								    if (fLeftToRight)
								        pb = pszSubstring + cb;
								    else
								        pb = pszSubstring;

								    // Left-to-right: the pattern now ends at the separator position and pb
								    // steps back to its last character.  Otherwise pb steps forward to the
								    // character after the first one.
								    if (fLeftToRight) tki[1].pbImage = pb--;
								    else              tki[0].pbImage = pb++;

								    // Bump that character by one so the adjusted pattern can serve as the
								    // upper bound of the span; it is decremented again before returning.
								    (*pb)++;

								    if (0 >= pCompareImages(&ptki, &ppdSorted[iBracketBase]))
								    {
								        // Even the bumped pattern does not sort above ppdSorted[iBracketBase],
								        // so nothing matches.
								        *piSpanBase  = 0;
								        *piSpanLimit = 0;

								        fReturn = FALSE;
								    }
								    else
								    {
								        // Second binary search: first index at or above the bumped pattern.
								        for (iMatchBase= iBracketBase, iMatchLimit= m_cd; 1 < (cDiff= iMatchLimit - iMatchBase); )
								        {
								            iMatchMiddle= iMatchBase + cDiff/2;

								            CAbortSearch::CheckContinueState();

								            if (0 < pCompareImages(&ptki, &ppdSorted[iMatchMiddle]))
								                 iMatchBase  = iMatchMiddle;
								            else iMatchLimit = iMatchMiddle;
								        }

								        iBracketLimit= iMatchLimit;

								        *piSpanBase  = iBracketBase;
								        *piSpanLimit = iBracketLimit;
								    }

								    // Undo the in-place edits to the caller's string.
								    (*pb)--;
								    if (fLeftToRight) pszSubstring[cb] = wSaved;
								    return fReturn;
								}


								// Returns an indicator set for the tokens which begin with the string denoted by
								// pszSubstring. If fMatching is TRUE, the string must exactly match the token.
								//
								// The first character of pszSubstring is treated as a prefix and is skipped
								// when the text is case-checked and converted to a sort key.
								CIndicatorSet *CTokenList::TokensStartingWith(PWCHAR pszSubstring, BOOL fMatching)
								{
								    CIndicatorSet *pisResult = NULL;

								    __try
								    {
								        if (m_How_Constructed == TDB_FULL_REF) SynchronizeDatabase();

								        UINT  iBracketBase, iBracketLimit;

								        // Locate the contiguous run of sorted tokens that share the prefix.
								        if (!TokenSpan(m_ppdSorted, pszSubstring, CompareImagesLR, &iBracketBase, &iBracketLimit))
								        {
								            CAbortSearch::CheckContinueState();

								            AttachRef(pisResult, CIndicatorSet::NewIndicatorSet(m_cd));

								            __leave;
								        }

								        // Length of the text that follows the one-character prefix.  The
								        // case check used to be handed the full wcslen() together with
								        // pszSubstring + 1, so it also examined the terminating NUL; both
								        // uses below now share the same length.
								        UINT cwText = (UINT) wcslen(pszSubstring);

								        if (cwText) --cwText;

								        // Not an exact-match request and AllLowerCase reports TRUE: the whole
								        // span is the answer.
								        if (!fMatching && AllLowerCase(pszSubstring + 1, cwText))
								        {
								            AttachRef(pisResult, CIndicatorSet::NewIndicatorSet(m_cd, iBracketBase, iBracketLimit - iBracketBase));

								            __leave;
								        }

								        AttachRef(pisResult, CIndicatorSet::NewIndicatorSet(m_cd));

								        PWCHAR workL = PWCHAR(_alloca(WORKBUF_SIZE * sizeof(WCHAR)));
								        PWCHAR workR = PWCHAR(_alloca(WORKBUF_SIZE * sizeof(WCHAR)));

								        UINT cwL = SortKeyText(pszSubstring+1, cwText, workL, WORKBUF_SIZE);
								        UINT cwR;
								        PDESCRIPTOR pdNew;

								        // Otherwise every token in the span is confirmed against the sort key.
								        for ( ; iBracketBase < iBracketLimit; iBracketBase++)
								        {
								            CAbortSearch::CheckContinueState();

								            pdNew  = m_ppdSorted[iBracketBase];

								            cwR = SortKeyText(pdNew->pbImage+1, CbImage(pdNew)-1, workR, WORKBUF_SIZE);

								            // For an exact match the two sort keys must also be the same length.
								            if (!fMatching || cwL == cwR)
								                if (HasAPrefix(workL, cwL, workR, cwR))
								                    pisResult->RawSetBit(iBracketBase);
								        }

								        pisResult->InvalidateCache();

								        __leave;
								    }
								    __finally
								    {
								        if (_abnormal_termination())
								        {
								            if (pisResult) DetachRef(pisResult);
								        }
								    }

								    ForgetRef(pisResult);

								    return pisResult;
								}


								const UINT *CTokenList::LRRanking()
								{
								    // Lazily builds and caches the left-to-right ranking table.  For each
								    // descriptor referenced by m_ppdSorted, the table slot at that
								    // descriptor's offset from m_pd receives the descriptor's position
								    // within m_ppdSorted.
								    //
								    // No __try/__finally bracket is needed here: there is exactly one
								    // allocation, and nothing called after it can allocate memory.
								    //
								    // NOTE(review): the table holds m_cd entries but is indexed by
								    // (descriptor - m_pd); presumably every sorted descriptor lies within
								    // the first m_cd entries of m_pd -- confirm for partial-reference lists.

								    if (!m_pLRRanking)
								    {
								        m_pLRRanking = (PUINT) VAlloc(FALSE, m_cd * sizeof(UINT));

								        // Visit the sorted vector from its last slot down to its first.
								        for (UINT iSorted = m_cd; iSorted-- > 0; )
								            m_pLRRanking[m_ppdSorted[iSorted] - m_pd] = iSorted;
								    }

								    return m_pLRRanking;
								}


								const UINT *CTokenList::RLRanking()
								{
								    // Lazily builds and caches the right-to-left ranking table: entry i is
								    // the left-to-right rank (see LRRanking) of the descriptor found at
								    // position i of the tail-sorted vector returned by PPDTailSorting().
								    //
								    // If anything raises an exception while the table is being built, the
								    // partially built table is released and the cache pointer is reset.

								    if (m_pRLRanking) return m_pRLRanking;

								    __try
								    {
								        m_pRLRanking = (PUINT) VAlloc(FALSE, m_cd * sizeof(UINT));

								        PDESCRIPTOR *ppdTail  = PPDTailSorting();
								        const UINT  *pLRRanks = LRRanking();

								        // Fill from the last tail-sorted slot down to the first.
								        for (UINT iTail = m_cd; iTail-- > 0; )
								            m_pRLRanking[iTail] = pLRRanks[ppdTail[iTail] - m_pd];
								    }
								    __finally
								    {
								        if (_abnormal_termination() && m_pRLRanking)
								        {
								            VFree(m_pRLRanking);
								            m_pRLRanking = NULL;
								        }
								    }

								    return m_pRLRanking;
								}


								CIndicatorSet *CTokenList::TokensEndingWith(PWCHAR pszSubstring)
								{
								    // Builds an indicator set (m_cd items) marking the tokens which end with
								    // the string denoted by pszSubstring.
								    //
								    // TokenSpan() brackets the candidates within the tail-sorted vector.  Each
								    // candidate position is translated through the RLRanking() table to get
								    // the bit to set.  When AllLowerCase() accepts the pattern every candidate
								    // is marked outright; otherwise each candidate's sort key is compared
								    // against the pattern's sort key with HasASuffix().
								    //
								    // The text handed to SortKeyText() starts one character past
								    // pszSubstring and past pbImage, i.e. the first character of both the
								    // pattern and each token image is skipped.
								    //
								    // On abnormal termination the partially built result is detached.

								    CIndicatorSet *pisResult = NULL;

								    __try
								    {
								        if (m_How_Constructed == TDB_FULL_REF) SynchronizeDatabase();

								        UINT iFirst, iLimit;

								        PDESCRIPTOR *ppdTail = PPDTailSorting();

								        if (TokenSpan(ppdTail, pszSubstring, CompareImagesRL, &iFirst, &iLimit))
								        {
								            const UINT *pRanks = RLRanking();

								            AttachRef(pisResult,  CIndicatorSet::NewIndicatorSet(m_cd));

								            // NOTE(review): the length passed here is wcslen(pszSubstring) although
								            // the text starts at pszSubstring + 1, so the terminating NUL is
								            // included; the SortKeyText call below uses wcslen - 1.  Confirm intent.
								            if (AllLowerCase(pszSubstring + 1, wcslen(pszSubstring)))
								            {
								                // Every bracketed token qualifies.
								                for ( ; iFirst < iLimit; iFirst++)
								                {
								                    pisResult->RawSetBit(pRanks[iFirst]);
								                }
								            }
								            else
								            {
								                // Compare sort keys candidate by candidate.
								                PWCHAR pwKeyPattern = PWCHAR(_alloca(WORKBUF_SIZE * sizeof(WCHAR)));
								                PWCHAR pwKeyToken   = PWCHAR(_alloca(WORKBUF_SIZE * sizeof(WCHAR)));

								                UINT cwPattern = SortKeyText(pszSubstring+1, wcslen(pszSubstring)-1, pwKeyPattern, WORKBUF_SIZE);
								                UINT cwToken;

								                while (iFirst < iLimit)
								                {
								                    CAbortSearch::CheckContinueState();

								                    PDESCRIPTOR pdCandidate = ppdTail[iFirst];

								                    cwToken = SortKeyText(pdCandidate->pbImage+1, CbImage(pdCandidate)-1, pwKeyToken, WORKBUF_SIZE);

								                    if (HasASuffix(pwKeyPattern, cwPattern, pwKeyToken, cwToken))
								                        pisResult->RawSetBit(pRanks[iFirst]);

								                    iFirst++;
								                }
								            }

								            pisResult->InvalidateCache();
								        }
								        else
								        {
								            // Nothing is bracketed: the result is a new set with no bits set by us.
								            CAbortSearch::CheckContinueState();

								            AttachRef(pisResult, CIndicatorSet::NewIndicatorSet(m_cd));
								        }
								    }
								    __finally
								    {
								        if (_abnormal_termination())
								        {
								            if (pisResult) DetachRef(pisResult);
								        }
								    }

								    ForgetRef(pisResult);

								    return pisResult;
								}


								PDESCRIPTOR *CTokenList::PPDTailSorting()
								{
								    // Lazily builds and caches m_ppdTailSorted: a copy of the m_ppdSorted
								    // vector re-sorted with the CompareImagesRL comparison.
								    //
								    // No __try/__finally bracket is needed here: there is exactly one
								    // allocation, and nothing called after it can allocate memory.  The
								    // member is only set once the copy has been sorted.

								    if (!m_ppdTailSorted)
								    {
								        PDESCRIPTOR *ppdCopy = (PDESCRIPTOR *) VAlloc(FALSE, m_cd * sizeof(PDESCRIPTOR *));

								        memcpy(ppdCopy, m_ppdSorted, m_cd * sizeof(PDESCRIPTOR *));
								        qsort (ppdCopy, m_cd, sizeof(PDESCRIPTOR *), CompareImagesRL);

								        m_ppdTailSorted = ppdCopy;
								    }

								    return m_ppdTailSorted;
								}


								CTokenList *CTokenList::IndicatedTokens(CIndicatorSet *pis, BOOL fFullCopy)

								{

								// Returns a list of the tokens denoted by the indicator set *pis. A NULL

								// pis is considered to be equivalent to an all-1's selection. That is,

								// it selects the entirety of the token list.

								//

								// Setting fFullCopy TRUE usually forces a complete result structure to be

								// constructed.  The exception to that rule is when pis is all 1's and this

								// token list is simply an indirect reference to the token set for a text

								// database.

								//

								// When fFullCopy is false we construct only the m_ppdSorted vector and

								// leave references to the rest of the data structures which are presumed

								// to reside within a text database.

								//

								// For token lists that aren't connected to a text database, we always

								// create a complete set of data arrays.
								//
								// An empty selection returns the newly constructed CTokenList untouched.
								// On abnormal termination the temporary buffers still owned by this
								// routine are freed and the partially built result is detached.


								    CTokenList *ptlResult         = NULL;

								    int        *piResult          = NULL;

								    PUINT       pfClassifications = NULL;


								    __try

								    {

								        if (m_How_Constructed == TDB_FULL_REF) SynchronizeDatabase();


								        // A list built from images has no database to refer back to,
								        // so it always gets a full copy.
								        if (m_How_Constructed == From_Images) fFullCopy= TRUE;


								        ASSERT(!pis || pis->ItemCount() == m_cd);


								        UINT  cMarks= pis? pis->SelectionCount() : m_cd;


								        AttachRef(ptlResult, New CTokenList);


								        if (!cMarks) __leave;


								        // Case 1: full database reference with everything selected.  The
								        // result shares every array with this list, including the sorted
								        // and tail-sorted vectors.
								        // NOTE(review): m_pafClassifications and m_clsf are not copied on
								        // this path, unlike the paths below -- confirm that is intended.
								        if (m_How_Constructed == TDB_FULL_REF && cMarks == m_cd)

								        {

								            ptlResult->m_How_Constructed = m_How_Constructed;

								            ptlResult->m_cbMaxLength     = m_cbMaxLength;

								            ptlResult->m_pbImages        = m_pbImages;

								            ptlResult->m_pwDispImages    = m_pwDispImages;

								            ptlResult->m_cbImages        = m_cbImages;

								            ptlResult->m_cwDispImages    = m_cwDispImages;

								            ptlResult->m_pd              = m_pd;

								            ptlResult->m_cd              = m_cd;

								            ptlResult->m_ppdSorted       = m_ppdSorted;

								            ptlResult->m_ppdTailSorted   = m_ppdTailSorted;

								            ptlResult->m_ptdb            = NULL;


								            ClsAttachRef(ptlResult, m_ptdb, m_ptdb);


								            __leave;

								        }


								        // NOTE(review): piResult comes from ExAlloc but is released with
								        // VFree in the failure path below, while pfClassifications uses
								        // the VAlloc/VFree pair -- confirm the two allocators are compatible.
								        piResult= (int *) ExAlloc(LPTR, cMarks * sizeof(int));


								        pfClassifications= (PUINT ) VAlloc(FALSE, cMarks * sizeof(UINT));


								        PUINT  pfDest;


								        int c, *pi;


								        // piResult receives cMarks indices into m_ppdSorted: presumably the
								        // positions of the marked items when pis is given, otherwise
								        // simply 0 .. cMarks-1.
								        if (pis)

								            pis->MarkedItems(0, piResult, cMarks);

								        else

								            for (c= cMarks; c-- ; ) piResult[c]= c;


								        // Gather the classification word of each selected token, walking
								        // both arrays from the back.
								        for (pfDest= pfClassifications+cMarks, c= cMarks, pi= piResult+cMarks; c--; )

								            *--pfDest = m_pafClassifications[*--pi];


								        // Ownership of the classification array passes to the result here;
								        // the local is cleared so the failure path will not free it.
								        ptlResult->m_pafClassifications= pfClassifications;  pfClassifications= NULL;


								        memcpy(&ptlResult->m_clsf, &m_clsf, sizeof(m_clsf));


								        // The index buffer is converted in place into the result's sorted
								        // descriptor-pointer vector: each int index is replaced by the
								        // descriptor pointer it selects.
								        // NOTE(review): this relies on an int and a PDESCRIPTOR having the
								        // same size -- confirm for the target platform.
								        PDESCRIPTOR *ppdResult= (PDESCRIPTOR *)piResult;

								        PDESCRIPTOR *ppd;


								        // piResult is advanced by cMarks and then stepped back cMarks times,
								        // so it ends the loop at the start of the buffer again.
								        for (c= cMarks, ppd= ppdResult+cMarks, piResult+= cMarks; c--; )

								            *--ppd = m_ppdSorted[*--piResult];


								        // Ownership of the vector passes to the result; clear the local.
								        ptlResult->m_ppdSorted   = ppdResult;  piResult= NULL;

								        ptlResult->m_cd          = cMarks;

								        ptlResult->m_cbMaxLength  = 0;  // This will be computed on demand.


								        // Case 2: partial reference.  Only the sorted vector and the
								        // classifications are private to the result; images and descriptors
								        // are shared with this list.
								        if (!fFullCopy)

								        {

								            ptlResult->m_How_Constructed = TDB_PARTIAL_REF;

								            ptlResult->m_pbImages        = m_pbImages;

								            ptlResult->m_pwDispImages    = m_pwDispImages;

								            ptlResult->m_cbImages        = m_cbImages;

								            ptlResult->m_cwDispImages    = m_cwDispImages;

								            ptlResult->m_pd              = m_pd;

								            ptlResult->m_ptdb            = NULL;

								            ptlResult->m_cbMaxLength     = m_cbMaxLength;


								            ClsAttachRef(ptlResult, m_ptdb, m_ptdb);


								            ptlResult->m_ppdTailSorted= NULL;  // Will be computed on demand


								            __leave;

								        }


								        // Case 3: full copy.  Build private descriptor, image and display
								        // image arrays holding just the selected tokens.
								        ptlResult->m_How_Constructed = From_Images;


								        // One descriptor more than cMarks is allocated; the extra one is
								        // filled in after the copy loop with the end-of-data pointers.
								        PDESCRIPTOR pd= ptlResult->m_pd= (PDESCRIPTOR) ExAlloc(LPTR, sizeof(DESCRIPTOR) * (cMarks+1));


								        int cbImages= 0;

								    	int cwDispImages = 0;


								        // First pass: total up the image and display-image sizes.
								        for (c= cMarks, ppd= ptlResult->m_ppdSorted; c--; )

								    	{

								    		cwDispImages += CwDisplay(*ppd);

								            cbImages += CbImage(*ppd++);

								    	}


								        ptlResult->m_cbImages= cbImages;

								    	ptlResult->m_cwDispImages = cwDispImages;


								        PWCHAR pb= ptlResult->m_pbImages= (PWCHAR) ExAlloc(LPTR, cbImages * sizeof(WCHAR));

								        PWCHAR pwDisp = ptlResult->m_pwDispImages= (PWCHAR) ExAlloc(LPTR, cwDispImages * sizeof(WCHAR));


								        // Second pass: copy each selected descriptor and its text into the
								        // new arrays, then retarget the sorted vector entry at the copy.
								        // Lengths are taken from the source descriptor (*ppd) before that
								        // entry is overwritten at the bottom of the loop.
								        for (c= cMarks, pd= ptlResult->m_pd, ppd= ptlResult->m_ppdSorted; c--; )

								        {

								            int cbImage= CbImage(*ppd);


								            *pd = **ppd;


								            wcsncpy(pb, pd->pbImage, cbImage);


								            pd->pbImage= pb;


								            pb+= cbImage;


								            int cwDispImage = CwDisplay(*ppd);


								            wcsncpy(pwDisp, pd->pwDisplay, cwDispImage);


								            pd->pwDisplay = pwDisp;


								            pwDisp += cwDispImage;


								            *ppd++ = pd++;

								        }


								        // The trailing descriptor records where the image data ends.
								        pd->pbImage= pb;

								    	pd->pwDisplay = pwDisp;


								        ptlResult->m_ppdTailSorted= NULL;  // Will be computed on demand.


								        __leave;

								    }

								    __finally

								    {

								        // Only buffers not yet handed over to ptlResult are freed here.
								        if (_abnormal_termination())

								        {

								            if (pfClassifications) { VFree(pfClassifications);  pfClassifications = NULL; }

								            if (piResult         ) { VFree(piResult         );  piResult          = NULL; }

								            if (ptlResult        ) DetachRef(ptlResult);

								        }

								    }


								    ForgetRef(ptlResult);


								    return(ptlResult);

								}


								int CTokenList::Data_cRows()
								{
								    // Row count of the text matrix: one row per token (m_cd).  A full
								    // database reference is synchronized first.

								    if (m_How_Constructed == TDB_FULL_REF)
								    {
								        SynchronizeDatabase();
								    }

								    return m_cd;
								}


								int CTokenList::Data_cCols()
								{
								    // Column count of the text matrix: the widest token as reported by
								    // MaxWidthToken(), plus cbElipsis + 1 columns for each of the leading
								    // and trailing ellipses that is enabled.

								    if (m_How_Constructed == TDB_FULL_REF)
								    {
								        SynchronizeDatabase();
								    }

								    int cchWidth = MaxWidthToken();

								    if (m_fLeadingElipsis)
								    {
								        cchWidth += cbElipsis + 1;
								    }

								    if (m_fTrailingElipsis)
								    {
								        cchWidth += cbElipsis + 1;
								    }

								    return cchWidth;
								}


								void CTokenList::Data_GetTextMatrix(int rowTop, int colLeft,

								                                    int rows, int cols, PWCHAR lpb, PUINT charsets)

								{

									int i;


								    if (m_How_Constructed == TDB_FULL_REF) SynchronizeDatabase();


									for (i = 0; i < rows*cols; i++)

										lpb[i] = UNICODE_SPACE_CHAR;


								    if (rowTop >= (int) m_cd) return;


								    if (rowTop+rows > (int) m_cd) rows= m_cd-rowTop;


								    int cbLimit= colLeft + cols;


								    for (i = 0; rows--; ++rowTop, i++, lpb+= cols)

								    {

								        int cbOffset= 0;


								        if (m_fLeadingElipsis)

								        {

								            cbOffset= cbElipsis + 1;


								            if (colLeft < cbElipsis)

								                CopyMemory(lpb+colLeft, pszElipsis + colLeft, (cbElipsis - colLeft) * sizeof(WCHAR));

								        }


										charsets[i] = m_ppdSorted[rowTop]->bCharset;


								        cbOffset= FormatAToken(m_ppdSorted[rowTop], cbOffset, colLeft, cbLimit, lpb);


								        if (m_fTrailingElipsis && ++cbOffset < cbLimit)

								        {

								            UINT cb= cbLimit - cbOffset;


								            if (cb > cbElipsis) cb= cbElipsis;


								            CopyMemory(lpb + cbOffset, pszElipsis, cb * sizeof(WCHAR));

								        }

								    }

								}


								int CTokenList::GetTokenI(int iToken, PWCHAR pb, UINT  cbMax, BOOL fSortedOrder)

								{

								    ASSERT(iToken >= 0 && iToken < (int) m_cd);


								    ASSERT(fSortedOrder || m_How_Constructed == From_Images); // Otherwise the token set isn't dense.


								    PDESCRIPTOR pd= fSortedOrder? m_ppdSorted[iToken] : m_pd + iToken;


								    if (!cbMax || !pb) return CbImage(pd);


								    if (--cbMax > CbImage(pd)) cbMax= CbImage(pd);


								    wcsncpy(pb, pd->pbImage, cbMax);


								    *(pb+cbMax)= 0;


								    return(CbImage(pd));

								}


								BYTE CTokenList::GetCharSetI(int iToken, BOOL fSortedOrder)
								{
								    // Returns the bCharset value of token iToken.  iToken is a position in
								    // m_ppdSorted when fSortedOrder is set, otherwise an index into m_pd.

								    ASSERT(iToken >= 0 && iToken < (int) m_cd);

								    ASSERT(fSortedOrder || m_How_Constructed == From_Images); // Otherwise the token set isn't dense.

								    PDESCRIPTOR pd;

								    if (fSortedOrder) pd = m_ppdSorted[iToken];
								    else              pd = m_pd + iToken;

								    return pd->bCharset;
								}


								int CTokenList::GetWTokenI(int iToken, PWCHAR pb, UINT  cbMax, BOOL fSortedOrder)

								{

								    ASSERT(iToken >= 0 && iToken < (int) m_cd);


								    ASSERT(fSortedOrder || m_How_Constructed == From_Images); // Otherwise the token set isn't dense.


								    PDESCRIPTOR pd= fSortedOrder? m_ppdSorted[iToken] : m_pd + iToken;


								    if (!cbMax || !pb) return CwDisplay(pd);


								    if (--cbMax > CwDisplay(pd)) cbMax= CwDisplay(pd);


								    wcsncpy(pb, pd->pwDisplay, cbMax);


								    *(pb+cbMax)= 0;


								    return(CwDisplay(pd));

								}


								CMaskedTokenList::CMaskedTokenList()  : CTextMatrix WithType("MaskedTokenList")
								{
								    // Start with no selector and no token list attached; both are set up
								    // later by InitialMaskedTokenList().

								    m_psel = NULL;
								    m_ptl  = NULL;
								}


								CMaskedTokenList *CMaskedTokenList::NewMaskedTokenList(CTokenList *ptl, CIndicatorSet *pis)
								{
								    // Creation routine: allocates a CMaskedTokenList and initializes it
								    // with the token list ptl and the indicator set pis.  If initialization
								    // terminates abnormally the new object is deleted before the exception
								    // propagates.

								    CMaskedTokenList *pmtlNew = NULL;

								    __try
								    {
								        pmtlNew = New CMaskedTokenList;

								        pmtlNew->InitialMaskedTokenList(ptl, pis);
								    }
								    __finally
								    {
								        if (_abnormal_termination() && pmtlNew)
								        {
								            delete pmtlNew;

								            pmtlNew = NULL;
								        }
								    }

								    return pmtlNew;
								}


								void CMaskedTokenList::InitialMaskedTokenList(CTokenList *ptl, CIndicatorSet *pis)

								{

								    // Second-phase initialization, called from NewMaskedTokenList():
								    // attaches the token list ptl, creates and installs a multiple-selection
								    // selector for this matrix, and applies pis as the substring filter.

								    NullFilterShowsAll(TRUE);


								    // Clear the member before attaching so AttachRef starts from NULL.
								    m_ptl= NULL;


								    AttachRef(m_ptl, ptl);


								    // The selector is created against this object; the destructor deletes it.
								    m_psel= CTMMultipleSelect::NewTMMultipleSelect(this);


								    SetSelector(m_psel);


								    SetSubstringFilter(pis);

								}


								CMaskedTokenList::~CMaskedTokenList()

								{

								    // Drop our reference on the token list, if one is attached.
								    if (m_ptl) DetachRef(m_ptl);


								    // The selector created in InitialMaskedTokenList() is deleted here;
								    // deleting a NULL m_psel is harmless.
								    delete m_psel;

								}


								void CMaskedTokenList::SetTokenList(CTokenList *ptl)
								{
								    // Replaces the token list shown by this masked list.
								    //
								    // A NULL ptl detaches the current list (if any) and clears the substring
								    // filter.  Otherwise the reference is switched to ptl and the substring
								    // filter is replaced by a new indicator set sized to Data_cRows().

								    if (!ptl)
								    {
								        if (m_ptl) DetachRef(m_ptl);

								        SetSubstringFilter(NULL);

								        return;
								    }

								    ChangeRef(m_ptl, ptl);

								    SetSubstringFilter(CIndicatorSet::NewIndicatorSet(Data_cRows()));
								}


								long CMaskedTokenList::SelectionCount()

								{

								    return (m_psel->GetSelection())->SelectionCount();

								}


								CTokenList *CMaskedTokenList::SelectedTokens()
								{
								    // Returns a token list built from the currently selected tokens, or
								    // NULL when no token list is attached.

								    if (!m_ptl) return NULL;

								    return m_ptl->IndicatedTokens(m_psel->GetSelection());
								}


								CIndicatorSet *CMaskedTokenList::GetIndicators()
								{
								    // Returns the selector's current selection, or NULL when no token list
								    // is attached.

								    if (!m_ptl) return NULL;

								    return m_psel->GetSelection();
								}


								void CMaskedTokenList::SetSelection(CIndicatorSet *pis)

								{

								    // Forwards pis to the selector as the new selection.  The selector must
								    // already exist.

								    ASSERT(m_psel);


								    m_psel->SetSelection(pis);

								}


								void CMaskedTokenList::ClearSelection()

								{

								    // Asks the selector to clear its selection.  Both a token list and a
								    // selector are expected to be present.

								    ASSERT(m_ptl);

								    ASSERT(m_psel);


								    m_psel->ClearSelection();

								}


								//////////////////////////////////  Hiliter support  //////////////////////////


								void AddSerial2(UINT iValue, PVOID pvTag, PVOID pvEnvironment)
								{
								    // Callback handed to CSegHashTable::Assimilate by GetFilledHashTable():
								    // stores iValue in the UINT that pvTag points to.  pvEnvironment is
								    // not used.

								    PUINT puiTag = PUINT(pvTag);

								    *puiTag = iValue;
								}


								CSegHashTable *CTokenList::GetFilledHashTable()
								{
								    // Creates a segmented hash table and fills it with the token list.
								    //
								    // Returns the new table, or NULL when an exception accepted by
								    // FilterFTExceptions is raised while the table is being built.  The
								    // temporary value-reference set is always released before returning.

								    CSegHashTable *pHash = NULL;

								    // Must start out NULL: the cleanup after the handler runs even when an
								    // exception is raised before DescriptorList() has returned, and would
								    // otherwise test and delete an indeterminate pointer.
								    CAValRef      *pavr  = NULL;

								    __try
								    {
								        // We need to create a new hash table
								        pHash = CSegHashTable::NewSegHashTable(sizeof(UINT), sizeof(UINT));

								        // Get the list of tokens as a pointer to a set of value references.
								        // BugBug! m_ptdb is non-functional.  Probably should
								        // ..move Descriptor list to a better home
								        pavr = m_ptdb->DescriptorList(m_pd, m_cd);

								        // Add them to the table; AddSerial2 stores the value it is handed
								        // for each entry (its index, per the original note) in that
								        // entry's tag.
								        pHash->Assimilate(pavr, NULL, NULL, AddSerial2);
								    }
								    __except(FilterFTExceptions(_exception_code()))
								    {
								        if (pHash) { delete pHash;  pHash = NULL; }
								    }

								    if (pavr) delete pavr;

								    return pHash;
								}