|
|
/*++
// Copyright (c) 1995-2001 Microsoft Corporation, All Rights Reserved
Module Name:
OPATHLEX.CPP
Abstract:
Object Path Lexer Map (for use with GENLEX.CPP).
History:
24-Jun-95 Created. 14-Apr-98 Radical update for singly quoted strings, remove unused tokens, add hex constants, etc.
--*/
#include "precomp.h"
#include <genlex.h>
#include <opathlex.h>
#define ST_IDENT 22
#define ST_NUMERIC 28
#define ST_DECIMAL 30
#define ST_HEX 32
#define ST_SQ_STRING 36
#define ST_DQ_STRING 40
#define ST_DQ_STRING_ESC 43
// DFA State Table for Object Path tokens.
// =======================================
LexEl OPath_LexTable[] = {
// State First Last New state, Return tok, Instructions
// =======================================================================
// -------------------------------------------------------------
// Identifiers
/* 0 */ L'A', L'Z', ST_IDENT, 0, GLEX_ACCEPT, /* 1 */ L'a', L'z', ST_IDENT, 0, GLEX_ACCEPT, /* 2 */ 0x80, 0xfffd, ST_IDENT, 0, GLEX_ACCEPT, /* 3 */ L'_', GLEX_EMPTY, ST_IDENT, 0, GLEX_ACCEPT,
// -------------------------------------------------------------
// Single symbols
/* 4 */ L'.', GLEX_EMPTY, 0, OPATH_TOK_DOT, GLEX_ACCEPT, /* 5 */ '@', GLEX_EMPTY, 0, OPATH_TOK_SINGLETON_SYM, GLEX_ACCEPT, /* 6 */ L'=', GLEX_EMPTY, 0, OPATH_TOK_EQ, GLEX_ACCEPT, /* 7 */ L':', GLEX_EMPTY, 0, OPATH_TOK_COLON, GLEX_ACCEPT,
// -------------------------------------------------------------
// Backslashes & forward slashes are interchangeable and reported
// as OPATH_TOK_BACKSLASH to the parser.
/* 8 */ L'\\', GLEX_EMPTY, 0, OPATH_TOK_BACKSLASH, GLEX_ACCEPT, /* 9 */ L'/', GLEX_EMPTY, 0, OPATH_TOK_BACKSLASH, GLEX_ACCEPT,
// -------------------------------------------------------------
// Simple numeric transition. The '-' must be followed
// by decimal digit sequence. The '0' may be the beginning of a hex
// or a decimal sequence.
/* 10 */ L'1', L'9', ST_DECIMAL, 0, GLEX_ACCEPT, /* 11 */ L'-', GLEX_EMPTY, ST_DECIMAL, 0, GLEX_ACCEPT, /* 12 */ L'0', GLEX_EMPTY, ST_NUMERIC, 0, GLEX_ACCEPT,
// -------------------------------------------------------------
// Simple string transition
//
// If a single quote begins the string, it must end the string.
// Escapes are not supported: 'ab', 'a"b' <not: 'a\'b'>
//
// If a double quote begins the string, it must end the string,
// except that escape+quote is an embedded double quote:
//
// "ab", "a'b", "a\"b"
//
/* 13 */ L'"', GLEX_EMPTY, ST_DQ_STRING, 0, GLEX_CONSUME, /* 14 */ L'\'', GLEX_EMPTY, ST_SQ_STRING, 0, GLEX_CONSUME,
// -------------------------------------------------------------
// Whitespace, newlines, etc. Whitespace is an error.
/* 15 */ L' ', GLEX_EMPTY, 0, OPATH_TOK_ERROR, GLEX_ACCEPT|GLEX_RETURN, /* 16 */ L'\t', GLEX_EMPTY, 0, OPATH_TOK_ERROR, GLEX_ACCEPT|GLEX_RETURN, /* 17 */ L'\n', GLEX_EMPTY, 0, OPATH_TOK_ERROR, GLEX_ACCEPT|GLEX_RETURN, /* 18 */ L'\r', GLEX_EMPTY, 0, OPATH_TOK_ERROR, GLEX_ACCEPT|GLEX_RETURN, /* 19 */ 0, GLEX_EMPTY, 0, OPATH_TOK_EOF, GLEX_CONSUME|GLEX_RETURN, // Note forced return
/* 20 */ L',', GLEX_EMPTY, 0, OPATH_TOK_COMMA, GLEX_ACCEPT,
// All remaining unknown characters
/* 21 */ GLEX_ANY, GLEX_EMPTY, 0, OPATH_TOK_ERROR, GLEX_ACCEPT|GLEX_RETURN,
// -------------------------------------------------------------
// ST_IDENT
// Accepts C/C++ identifiers, plus any char >= U+0080.
/* 22 */ L'a', L'z', ST_IDENT, 0, GLEX_ACCEPT, /* 23 */ L'A', L'Z', ST_IDENT, 0, GLEX_ACCEPT, /* 24 */ L'_', GLEX_EMPTY, ST_IDENT, 0, GLEX_ACCEPT, /* 25 */ L'0', L'9', ST_IDENT, 0, GLEX_ACCEPT, /* 26 */ 0x80, 0xfffd, ST_IDENT, 0, GLEX_ACCEPT, /* 27 */ GLEX_ANY, GLEX_EMPTY, 0, OPATH_TOK_IDENT, GLEX_PUSHBACK|GLEX_RETURN,
// -------------------------------------------------------------
// ST_NUMERIC
//
// A zero has been recognized.
// If the next char is 'x' or 'X', we have a valid hex sequence.
// Otherwise, if '1' to '9' we have a decimal sequence.
//
/* 28 */ L'x', GLEX_EMPTY, ST_HEX, 0, GLEX_ACCEPT, /* 29 */ L'X', GLEX_EMPTY, ST_HEX, 0, GLEX_ACCEPT,
// -------------------------------------------------------------
// ST_DECIMAL
//
/* 30 */ L'0', L'9', ST_DECIMAL, 0, GLEX_ACCEPT, /* 31 */ GLEX_ANY, GLEX_EMPTY, 0, OPATH_TOK_INT, GLEX_PUSHBACK|GLEX_RETURN,
// -------------------------------------------------------------
// ST_HEX
//
// Recognizes a valid hex sequence.
/* 32 */ L'a', L'f', ST_HEX, 0, GLEX_ACCEPT, /* 33 */ L'A', L'F', ST_HEX, 0, GLEX_ACCEPT, /* 34 */ L'0', L'9', ST_HEX, 0, GLEX_ACCEPT, /* 35 */ GLEX_ANY, GLEX_EMPTY, 0, OPATH_TOK_HEXINT, GLEX_PUSHBACK|GLEX_RETURN, // -------------------------------------------------------------
// ST_SQ_STRING : Single quoted strings
//
// If a single quote begins the string, it must end the string.
// Escapes are not supported: 'ab', 'a"b' <not: 'a\'b'>
/* 36 */ L'\n', GLEX_EMPTY, 0, OPATH_TOK_ERROR, GLEX_ACCEPT|GLEX_LINEFEED, /* 37 */ L'\r', GLEX_EMPTY, 0, OPATH_TOK_ERROR, GLEX_ACCEPT|GLEX_LINEFEED, /* 38 */ L'\'', GLEX_EMPTY, 0, OPATH_TOK_QSTRING, GLEX_CONSUME, /* 39 */ GLEX_ANY, GLEX_EMPTY, ST_SQ_STRING, 0, GLEX_ACCEPT,
// -------------------------------------------------------------
// ST_DQ_STRING
//
// If a double quote begins the string, it must end the string,
// except that escape+quote is an embedded double quote:
//
// "ab", "a'b", "a\"b"
//
/* 40 */ L'\\', GLEX_EMPTY, ST_DQ_STRING_ESC, 0, GLEX_CONSUME, // Escape
/* 41 */ L'"', GLEX_EMPTY, 0, OPATH_TOK_QSTRING, GLEX_CONSUME, /* 42 */ L'"', GLEX_EMPTY, ST_DQ_STRING, 0, GLEX_ACCEPT|GLEX_NOT, // Accept anything but a quote
//-------------------------------------------------------------
// ST_DQ_STRING_ESC
//
// An escape occurred while in a string.
// Either an embedded slash or embedded quote must have occurred.
// Otherwise, an unsupported escape has occurred and we fail.
/* 43 */ L'\\', GLEX_EMPTY, ST_DQ_STRING, 0, GLEX_ACCEPT, /* 44 */ L'"', GLEX_EMPTY, ST_DQ_STRING, 0, GLEX_ACCEPT, /* 45 */ GLEX_ANY, GLEX_EMPTY, 0, OPATH_TOK_ERROR, GLEX_ACCEPT|GLEX_RETURN,
};
|