windows-xp/Source/XPSP1/NT/sdktools/mep/help/enginlib/helpdec.c


								/*************************************************************************

								 * helpdec - HelpDecomp routine and Other ASM code

								 *

								 *       Copyright <C> 1988, Microsoft Corporation

								 *

								 * Purpose:

								 *

								 * Revision History:

								 *

								 *       08-Oct-1990     RJSA    Converted to C

								 *       22-Dec-1988     LN      Removed MASM High Level Lang support (Need

								 *                               to control segments better than that will

								 *                               let me)

								 *       08-Dec-1988     LN      CSEG

								 *       16-Feb-1988     LN      Rewrite for (some) speed

								 *  []   17-Jan-1988     LN      Created

								 *

								 **************************************************************************/


								#include <stdio.h>

								#include <string.h>

								#include <ctype.h>

								#if defined (OS2)

								#define INCL_BASE

								#include <os2.h>

								#else

								#include <windows.h>

								#endif


								#include <help.h>

								#include <helpfile.h>


								#pragma function( memset, memcpy, memcmp, strcpy, strcmp, strcat )


								//  In order to increase performance, and because of the functions

								//  decomp and NextChar being tightly coupled, global variables are

								//  used instead of passing parameters.

								//


								PBYTE	pHuffmanRoot;	//	Root of Huffman tree; set by decomp, read by NextChar

								PBYTE	pCompTopic;			//	Next byte of (possibly compressed) topic text; advanced by NextChar

								BYTE    BitMask;        //  Rotating bit mask: selects the current bit of the last byte read

								BOOL    IsCompressed;   //  True if text is huffman compressed (set by decomp)


								// Forward declarations for routines defined later in this file.
								BYTE NextChar (void);

								BOOL pascal HelpCmp (PCHAR   fpsz1, PCHAR   fpsz2, USHORT  cbCmp, BOOL  fCase, BOOL  fTerm);


								/**************************************************************************

								 *

								 * Decomp - Decompress Topic Text

								 * f near pascal Decomp(fpHuffmanRoot, fpKeyphrase, fpTopic, fpDest)

								 * uchar far *fpHuffmanRoot

								 * uchar far *fpKeyphrase

								 * uchar far *fpTopic

								 * uchar far *fpDest

								 *

								 * Purpose:

								 *  Fully decompress topic text. Decompresses based on current file, from one

								 *  buffer to another.

								 *

								 * Entry:

								 *  fpHuffmanRoot - Pointer to root of huffman tree (or NULL if no huffman)

								 *  fpKeyphrase - Pointer to keyphrase table (or NULL if no keyphrase)

								 *  fpTopic     - Pointer to compressed topic text

								 *  fpDest      - Pointer to destination buffer

								 *

								 * Exit:

								 *  FALSE on successful completion

								 *

								 * Exceptions:

								 *  Documented contract: returns TRUE on any error. Note that this C version

								 *  has no error path and always returns FALSE.

								 *

								 **************************************************************************/

								// decomp: expand one topic from fpTopic into fpDest, undoing the optional
								// huffman coding (via NextChar) and then the "cookie" encoding (keyphrases,
								// runs, quoted characters). The output is null terminated.
								// Always returns FALSE.
								BOOL  pascal decomp (

								        PCHAR  fpHuffmanRoot,

								        PCHAR  fpKeyphrase,

								        PCHAR  fpTopic,

								        PCHAR  fpDest

								        ){


									int		cDecomp;		/* decompressed bytes still to be produced	*/

									BYTE	c;				/* character returned by NextChar			*/


								#ifdef BIGDEBUG

									char	DbgB[128];

									char	*DbgP = fpDest;

								#endif


								    // Initialize the globals shared with NextChar.
								    // The topic starts with a USHORT holding the decompressed size; the
								    // encoded text follows it. BitMask starts at 0x01 so that the first
								    // shift in NextChar empties it and forces a fetch of the first byte.


									pHuffmanRoot	=	(PBYTE)fpHuffmanRoot;

									pCompTopic		=	(PBYTE)fpTopic + sizeof(USHORT);

								    BitMask         =   0x01;

								    // Huffman decoding is on only when a tree was supplied and the USHORT
								    // at byte offset 2 from its root is not 0xFFFF.
								    IsCompressed    =   fpHuffmanRoot

								                          ?   ((*(USHORT UNALIGNED *)((PBYTE)fpHuffmanRoot + 2)) != 0xFFFF)

								                          :   FALSE;


								    cDecomp     = *((USHORT UNALIGNED *)fpTopic);


								#ifdef BIGDEBUG

									sprintf(DbgB, "DECOMPRESSING: HuffmanRoot: %lx, Keyphrase: %lx\n", fpHuffmanRoot, fpKeyphrase );

									OutputDebugString(DbgB);

									sprintf(DbgB, "               Topic: %lx, Dest: %lx\n", fpTopic, fpDest );

									OutputDebugString(DbgB);

									if ( IsCompressed ) {

										OutputDebugString("               The Topic IS Compressed\n");

									}

								#endif


									// NOTE(review): the loop is bounded only by cDecomp; nothing checks the
									// capacity of fpDest or the end of the input, and a keyphrase or run
									// longer than the remaining count drives cDecomp negative (reported
									// only under BIGDEBUG below).
									while ( cDecomp > 0 ) {


								        c = NextChar();


								        //

										// At this point a valid character has been found and huffman decoded. We must

								        // now perform any other decoding on it that is required.

								        //

								        // Variables are:

								        //    c          = character

								        //    cDecomp    = Output count remaining

								        //    BitMask    = bit mask for interpreting input stream

								        //

								        // "Magic Cookie" decompression.

								        // The character stream after huffman encoding is "cookie" encoded, in that

								        // certain characters are flags which when encountered mean something other than

								        // themselves. All characters which are NOT such flags (or cookies, as they seem

								        // to be called), are simply copied to the output stream.

								        //

								        // We first check the character to see if it IS a cookie. If it is NOT, we just

								        // store it, and get the next input byte

								        //


								        if ((c >= C_MIN) && (c <= C_MAX)) {


								            BYTE    Cookie = c ;


								#ifdef BIGDEBUG

											OutputDebugString("Cookie\n");

								#endif

								            // c is a cookie of some sort, jump to the appropriate

								            // cookie eater. Every cookie takes at least one argument
								            // character, so it is fetched here before dispatching.


								            c = NextChar();


								            switch (Cookie) {

								                case C_KEYPHRASE0:

								                case C_KEYPHRASE1:

								                case C_KEYPHRASE2:

								                case C_KEYPHRASE3:

								                case C_KEYPHRASE_SPACE0:

								                case C_KEYPHRASE_SPACE1:

								                case C_KEYPHRASE_SPACE2:

								                case C_KEYPHRASE_SPACE3:

								                    {

														ULONG	Index;	/* Keyword index, then byte offset into pointer table */

								                        PBYTE   pKey;   /* Keyword (length-prefixed) */

								                        BYTE    Size;   /* Keyword size  */


								                        // Reduce the cookie to a bank number; the _SPACE variants are
								                        // shifted down by 4 so they select the same banks.
								                        // Presumably C_KEYPHRASE0..3 are C_MIN..C_MIN+3 and
								                        // C_KEYPHRASE_SPACE0..3 are C_MIN+4..C_MIN+7 (defined outside
								                        // this file), giving banks 0..3 -- confirm.
								                        if ((Cookie >= C_KEYPHRASE_SPACE0) && (Cookie <= C_KEYPHRASE_SPACE3)) {

															Index = (ULONG)((int)Cookie - C_MIN - 4);

								                        } else {

															Index = (ULONG)((int)Cookie - C_MIN);

								                        }

														// Entry number is bank * 256 + argument byte; scale it by the
														// pointer size to get the byte offset into the pointer table.
														Index = (ULONG)(((Index * 0x100) + c) * sizeof(PVOID));


														// fpKeyphrase is read as an array of pointers to keywords
														// (the layout kwPtrBuild produces).
														pKey = *(PBYTE *)(((PBYTE)fpKeyphrase) + Index);


														// First byte of the keyword is its length; the text follows.


								                        Size = *pKey++;


								                        {

								                            BYTE i = Size;


															while (i--) {

																*fpDest++ = *pKey++;

								                            }

								                            cDecomp -=Size;

								                        }

								                        // The _SPACE variants append one blank after the keyword.
								                        if ((Cookie >= C_KEYPHRASE_SPACE0) && (Cookie <= C_KEYPHRASE_SPACE3)) {

															*fpDest++ = ' ';

								                            cDecomp--;

								                        }

								                        break;

								                    }


								                // Run of spaces: the argument byte is the number of blanks.
								                case C_RUNSPACE:

								                    {

								                        BYTE  Count = c;


								                        while (Count--) {

															*fpDest++ = ' ';

								                        }

								                        cDecomp -= c;

								                        break;

								                    }


								                // Run of an arbitrary byte: the first argument is the byte to
								                // repeat, the second (fetched here) is the repeat count.
								                case C_RUN:

								                    {

								                        BYTE    b = c;

								                        BYTE    Cnt;


								                        Cnt = c = NextChar();


								                        while (Cnt--) {

															*fpDest++ = b;

								                        }

								                        cDecomp -= c;

								                        break;

								                    }


								                // Quoted character: the argument byte is copied literally, which
								                // lets a byte in the cookie range appear in the output.
								                case C_QUOTE:

													*fpDest++ =  c;

								                    cDecomp--;

								                    break;


								                // NOTE(review): no default case. A value in C_MIN..C_MAX that
								                // is not listed above consumes its argument byte and emits
								                // nothing.
								            }


								        } else {


								            // c is not a cookie


											*fpDest++ = c;

								            cDecomp--;

								        }

								    }


									*fpDest++ = '\00';	// Null terminate string


								#ifdef BIGDEBUG

									// NOTE(review): DbgB is 128 bytes; formatting the whole topic with %s
									// can overrun it when the decompressed topic is long.
									sprintf( DbgB, "Decompressed topic: [%s]\n", DbgP );

									OutputDebugString( DbgB );


									// A negative count means more bytes were written than the topic header
									// announced.
									if ( cDecomp < 0 ) {

										sprintf( DbgB, "DECOMPRESSION ERROR: cDecomp = %d!\n", cDecomp );

										OutputDebugString(DbgB);

									}

								#endif


								    // No error path exists: FALSE is returned unconditionally.
								    return FALSE;

								}


								/**************************************************************************

								 *

								 * NextChar - Return next character from input stream

								 *

								 * Purpose:

								 *  Returns next character from input stream, performing huffman decompression

								 *  if enabled.

								 *

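								 * Entry:

								 *      No parameters. Uses the file-level globals set up by decomp:

								 *      pHuffmanRoot    = pointer to root of huffman tree

								 *      pCompTopic      = pointer to next byte of the (compressed) topic

								 *      BitMask         = bit mask of current bit in the last byte read

								 *      IsCompressed    = TRUE if huffman decoding is to be performed

								 *

								 * Exit:

								 *      Returns character

								 *      pCompTopic and BitMask updated.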

								 *

								 **************************************************************************

								 *

								 * Format of Huffman decode tree:

								 *  The Huffman decode tree is a binary tree used to decode a bitstream into a

								 *  character stream. The tree consists of nodes (internal nodes and leaves).

								 *  Each node is represented by a word. If the high bit in the word is set then

								 *  the node is a leaf. If the node is an internal node, then the value of the

								 *  node is the index of the right branch in the binary tree. The left branch is

								 *  the node following the current node (in memory). If the node is a leaf, then

								 *  the low byte of the node is a character.

								 *

								 *    e.g.

								 *       0: 0004                      0

								 *       1: 0003                     / \

								 *       2: 8020                    /   \

								 *       3: 8065                   1     \------4

								 *       4: 0006                  / \          / \

								 *       5: 806C                 /   \        /   \

								 *       6: 8040                2     3      5     6

								 *                             ' '   'e'     'l'  '@'

								 *

								 * Using the Huffman decode tree:

								 *  The huffman decode tree is used to decode a bitstream into a character

								 *  string. The bitstream is used to traverse the decode tree. Whenever a zero

								 *  is detected in the bit stream we take the right branch, when one is detected

								 *  we take the left branch. When a leaf is reached in the tree, the value of

								 *  the leaf (a character) is output, and the current node is set back to the

								 *  root of the tree.

								 *

								 ********************************************************************/


								BYTE

								NextChar (

								    void

								    ) {


								    BYTE    b;              // current source byte


								#ifdef BIGDEBUG

									char DbgB[128];

									OutputDebugString("NextChar:\n");

								#endif


								    if (IsCompressed) {


								        USHORT              HuffmanNode;            // curent node in the huffman tree

								        USHORT UNALIGNED *pHuffmanNext;           // next node in the huffman tree


								        //

								        // Huffman decoding.

								        // This first part of the decode loop performs the actual huffman decode. This

								        // code is very speed critical. We walk the tree, as defined by the bit pattern

								        // coming in, and exit this portion of the code when we reach a leaf which

								        // contains the character that the bit pattern represented.

								        //


								        pHuffmanNext = (USHORT UNALIGNED *)pHuffmanRoot;

								        HuffmanNode  = *pHuffmanNext;


										b = *(pCompTopic - 1);		 // get last byte read


										while (!(HuffmanNode & 0x8000)) {  // while not leaf


											BitMask >>= 1;


											if (!(BitMask)) {

								                //

								                //  Get new byte from input

								                //

												b = *pCompTopic++;

								                BitMask = 0x80;

								#ifdef BIGDEBUG

												sprintf(DbgB, "\tb=%02x Mask=%02x Node=%04x", b, BitMask, HuffmanNode );

												OutputDebugString(DbgB);

								#endif

											} else {

								#ifdef BIGDEBUG

												sprintf(DbgB, "\tb=%02x Mask=%02x Node=%04x", b, BitMask, HuffmanNode );

												OutputDebugString(DbgB);

								#endif

											}


											if (b & BitMask) {

								                //

								                //  one: take left branch

								                //

								                pHuffmanNext++;

								            } else {

								                //

								                //  zero: take right branch

												//

												pHuffmanNext = (PUSHORT)((PBYTE)pHuffmanRoot + HuffmanNode);

								#ifdef BIGDEBUG

												sprintf(DbgB, " <%04x+%02x=%04x (%04x)>", pHuffmanRoot, HuffmanNode,

															pHuffmanNext, *pHuffmanNext );

												OutputDebugString( DbgB );

								#endif

											}


											HuffmanNode = *pHuffmanNext;


								#ifdef BIGDEBUG

											sprintf(DbgB, " Next=%04x\n", HuffmanNode );

											OutputDebugString(DbgB);

								#endif


										}


										b = (BYTE)HuffmanNode;	// character is low byte of leaf node


								    } else {

										b = *pCompTopic++;	// not compressed, simply return byte

								    }


								#ifdef BIGDEBUG

									sprintf(DbgB, "\t---->%2x [%c]\n", b,b);

									OutputDebugString(DbgB);

								#endif


								    return  b;

								}


								/**************************************************************************

								 *

								 * HelpCmpSz - help system string comparison routine.

								 * f near pascal HelpCmpSz (fpsz1, fpsz2)

								 * uchar far *fpsz1*

								 * uchar far *fpsz2*

								 *

								 * Purpose:

								 *  Perform string comparisons for help system look-up.

								 *  Default case of HelpCmp below.

								 *

								 * Entry:

								 *  fpsz1        = Far pointer to string 1. (Usually the constant string

								 *                 being "looked-up").

								 *  fpsz2        = Far pointer to string 2. This is usually the string table

								 *                 being searched.

								 *

								 * Exit:

								 *  TRUE on match

								 *

								 ********************************************************************/

								BOOL pascal
								HelpCmpSz (
								    PCHAR fpsz1,
								    PCHAR fpsz2
								    ){
								    // Default flavour of HelpCmp: largest possible byte count,
								    // case sensitive, no special termination processing.
								    const USHORT cbMax = (USHORT)0xFFFF;
								    BOOL         fMatch;

								    fMatch = HelpCmp(fpsz1, fpsz2, cbMax, TRUE, FALSE);
								    return fMatch;
								}


								/**************************************************************************

								 *

								 * HelpCmp - help system string comparison routine.

								 * f near pascal HelpCmp (fpsz1, fpsz2, cbCmp, fCase, fTerm)

								 * uchar far *fpsz1

								 * uchar far *fpsz2

								 * ushort    cbCmp

								 * f         fCase

								 * f         fTerm

								 *

								 * Purpose:

								 *  Perform string comparisons for help system look-up.

								 *

								 * Entry:

								 *  fpsz1        = Far pointer to string 1. (Usually the constant string being

								 *                 "looked-up"). NOTE THAT IF THIS STRING IS NULL, WE RETURN

								 *                 TRUE!

								 *  fpsz2        = Far pointer to string 2. This is usually the string table

								 *                 being searched.

								 *  cbCmp        = Max number of bytes to compare.

								 *  fCase        = TRUE if search is to be case sensitive.

								 *  fTerm        = TRUE if we allow special termination processing.

								 *

								 * Exit:

								 *  TRUE on match

								 *

								 ********************************************************************/


								BOOL pascal
								HelpCmp (
								    PCHAR   fpsz1,
								    PCHAR   fpsz2,
								    USHORT  cbCmp,
								    BOOL  fCase,
								    BOOL  fTerm
								    ){

								    // Compares up to cbCmp bytes of fpsz1 against fpsz2.
								    //
								    // Returns TRUE when:
								    //   - both strings end (null) at the same position, or
								    //   - cbCmp bytes were compared without finding a difference, or
								    //   - fTerm is set and, at the first difference, string 1 has ended
								    //     while string 2 holds '\n', '\t' or ' ' (minascii processing).
								    // Returns FALSE on any other difference.
								    //
								    // fCase TRUE compares bytes exactly; FALSE folds both sides with
								    // toupper first.
								    //
								    // The bytes are handled as unsigned (PBYTE) so that toupper never sees
								    // a negative value.

								    PBYTE p1 = (PBYTE)fpsz1;
								    PBYTE p2 = (PBYTE)fpsz2;

								    // p1/p2 always point at the pair being examined, so the mismatch test
								    // below looks at the right characters for both case modes. cbCmp is
								    // tested before it is decremented, so it cannot wrap around.
								    for ( ; cbCmp != 0; cbCmp--, p1++, p2++) {

								        BOOL fDiffer;

								        if ((!*p1) && (!*p2)) {
								            //
								            //  Both strings ended together: got a match
								            //
								            return TRUE;
								        }

								        if (fCase) {
								            fDiffer = (*p1 != *p2);
								        } else {
								            fDiffer = (toupper(*p1) != toupper(*p2));
								        }

								        if (fDiffer) {
								            //
								            //  Mismatch. With special termination processing, the end of
								            //  string 1 against whitespace in string 2 still counts as a
								            //  match; anything else is a miss.
								            //
								            if (fTerm && (!*p1) &&
								                ((*p2 == '\n') || (*p2 == '\t') || (*p2 == ' '))) {
								                return TRUE;
								            }
								            return FALSE;
								        }
								    }

								    //
								    //  Character count exhausted without a difference: complete match.
								    //
								    return TRUE;
								}


								/*************************************************************************

								 *

								 * hfstrlen - far string length

								 *

								 * Purpose:

								 *  return length of null terminated string.

								 *

								 * Entry:

								 *  fpszSrc     = pointer to source

								 *

								 * Exit:

								 *  returns length

								 *

								 *************************************************************************/

								USHORT
								hfstrlen (
								    PCHAR fpszSrc
								    ){
								    // Length of the null terminated string, narrowed to a USHORT
								    // (lengths above 0xFFFF are truncated by the cast).
								    size_t cch = strlen(fpszSrc);

								    return (USHORT)cch;
								}


								/*************************************************************************

								 *

								 * hfstrcpy - far string copy

								 *

								 * Purpose:

								 *  copy strings

								 *

								 * Entry:

								 *  fpszDst     = pointer to destination

								 *  fpszSrc     = pointer to source

								 *

								 * Exit:

								 *  returns fpszDst, the value strcpy returns (the start of the

								 *  destination, not its terminating null)

								 *

								 *************************************************************************/

								PCHAR
								hfstrcpy (
								    PCHAR fpszDst,
								    PCHAR fpszSrc
								    ) {
								    // Copy the source string, terminator included, and hand back
								    // whatever strcpy returns.
								    PCHAR pResult = (PCHAR)strcpy(fpszDst, fpszSrc);

								    return pResult;
								}


								/*************************************************************************

								 *

								 * hfstrchr - search for character in far string

								 *

								 * Purpose:

								 *  a near, pascal routine (for size/speed) to search for a character in

								 *  a far string.

								 *

								 * Entry:

								 *  fpsz        = far pointer to string

								 *  c           = character to locate

								 *

								 * Exit:

								 *  returns far pointer into string

								 *

								 * Exceptions:

								 *  returns NULL on character not in string

								 *

								 *************************************************************************/

								PCHAR
								hfstrchr (
								    PCHAR   fpsz,
								    char    c
								    ){
								    // Locate the first occurrence of c in fpsz; strchr yields NULL when
								    // the character is not present.
								    PCHAR pFound = (PCHAR)strchr(fpsz, c);

								    return pFound;
								}


								/*************************************************************************

								 *

								 * hfmemzer - zero out memory area.

								 *

								 * Purpose:

								 *  a near, pascal routine (for size/speed) to fill an area with zero

								 *

								 * Entry:

								 *  fpb         = far pointer to buffer

								 *  cb          = count of zeros to store

								 *

								 * Exit:

								 *

								 *************************************************************************/

								void
								hfmemzer (
								    PVOID   fpb,
								    ULONG   cb
								    ) {
								    // Store cb zero bytes starting at fpb.
								    const int zero = 0;

								    memset(fpb, zero, cb);
								}


								/*************************************************************************

								 *

								 * NctoFo - extract file offset from NC

								 *

								 * Purpose:

								 *  Extracts the file offset for a minascii file, and returns it as a long.

								 *

								 * Entry:

								 *  nc          = context number

								 *

								 * Exit:

								 *  returns file offset

								 *

								 *************************************************************************/

								ULONG
								NctoFo (
								    ULONG nc
								    ) {
								    // The low 16 bits of the context number hold the file position
								    // divided by 4; scale them back up to a byte offset.
								    ULONG quarterPos = nc & 0x0000FFFF;

								    return quarterPos * 4;
								}


								/*************************************************************************

								 *

								 * combineNc - combine a minascii file offset and fdb handle into nc.

								 *

								 * Purpose:

								 *  Combines a minascii file offset and fdb memory handle into an NC. If the

								 *  file offset is 0xffffffff, we return zero.

								 *

								 * Entry:

								 *  offset      = long file offset

								 *  mh          = fdb mem handle

								 *

								 * Exit:

								 *  returns NC (DX = mem handle, AX = filepos/4), or 0L if offset==FFFFFFFF

								 *

								 *************************************************************************/

								nc  pascal
								combineNc (
								    ULONG  offset,
								    mh  mh
								    ){
								    // Builds an NC from a minascii file offset and the fdb memory handle:
								    // the handle goes into .mh and offset/4 into .cn.
								    // An offset of 0xFFFFFFFF yields the all-zero NC.

								    nc     ncRet = {0,0};

								    // Must be a comparison: the former "offset = 0xFFFFFFFF" assigned the
								    // value, was always true, and made every call return the zero NC.
								    if (offset == 0xFFFFFFFF) {
								        return ncRet;
								    }

								    ncRet.mh = mh;
								    ncRet.cn = offset/4;
								    return ncRet;
								}


								/*************************************************************************

								 *

								 * toupr - convert char to upper case

								 *

								 * Purpose:

								 *

								 * Entry:

								 *  chr          = character

								 *

								 * Exit:

								 *  returns upper case character

								 *

								 *************************************************************************/

								char
								toupr (
								    char chr
								    ){
								    // Returns the upper case form of chr (per toupper); other characters
								    // come back unchanged.
								    //
								    // toupper requires a value representable as unsigned char (or EOF).
								    // Where plain char is signed, bytes >= 0x80 would arrive negative, so
								    // convert through unsigned char first.
								    return (char)toupper((unsigned char)chr);
								}


								/*************************************************************************

								 *kwPtrBuild - Build table of pointers to keywords.

								 *void pascal near kwPtrBuild(uchar far *fpTable, ushort tsize)

								 *

								 *Purpose:

								 * Builds a table of pointers to the keyword strings in the passed string array.

								 * The table is built in the first 1024 * sizeof(PVOID) bytes of the passed

								 * buffer (4k with 4-byte pointers). The strings are assumed to start

								 * immediately thereafter.

								 *

								 *Entry:

								 * fpTable       - pointer to string table

								 * tsize         - size, in bytes, of strings

								 *

								 *Exit:

								 * none

								 *

								 *******************************************************************************/

								void
								kwPtrBuild (
								    PVOID  fpTable,
								    USHORT tsize
								    ) {
								    // Fills the pointer table at the start of fpTable with the address of
								    // each keyword string. The strings begin right after the table's 1024
								    // pointer slots, and each one is a length byte followed by that many
								    // characters. tsize is the total size, in bytes, of the string area.

								    enum { KW_TABLE_ENTRIES = 1024 };       // slots in the pointer table

								    PBYTE  fpStr    = (PBYTE)fpTable + KW_TABLE_ENTRIES * sizeof (PVOID);
								    PBYTE *fpTbl    = fpTable;
								    PBYTE *fpTblEnd = fpTbl + KW_TABLE_ENTRIES;

								    // Stop at the last slot: writing further would overwrite the strings.
								    while ((tsize > 0) && (fpTbl < fpTblEnd)) {

								        // Length byte plus text. Held in a USHORT so that a 255 character
								        // string gives 256 rather than wrapping to 0 (which never advanced).
								        USHORT sSize = (USHORT)(*fpStr + 1);

								        *fpTbl++ = fpStr;

								        // Last string, or one that claims more bytes than remain: stop
								        // here instead of letting the unsigned count wrap around.
								        if (sSize >= tsize) {
								            break;
								        }

								        tsize   -= sSize;
								        fpStr   += sSize;
								    }
								}