/*++ Copyright (C) 1995-1999 Microsoft Corporation Module Name: OPATHLEX.CPP Abstract: Object Path Lexer Map (for use with GENLEX.CPP). History: 24-Jun-95 Created. 14-Apr-98 Radical update for singly quoted strings, remove unused tokens, add hex constants, etc. --*/ #include #include #include #include #define ST_IDENT 22 #define ST_NUMERIC 28 #define ST_DECIMAL 30 #define ST_HEX 32 #define ST_SQ_STRING 36 #define ST_DQ_STRING 40 #define ST_DQ_STRING_ESC 43 // DFA State Table for Object Path tokens. // ======================================= LexEl OPath_LexTable[] = { // State First Last New state, Return tok, Instructions // ======================================================================= // ------------------------------------------------------------- // Identifiers /* 0 */ L'A', L'Z', ST_IDENT, 0, GLEX_ACCEPT, /* 1 */ L'a', L'z', ST_IDENT, 0, GLEX_ACCEPT, /* 2 */ 0x80, 0xfffd, ST_IDENT, 0, GLEX_ACCEPT, /* 3 */ L'_', GLEX_EMPTY, ST_IDENT, 0, GLEX_ACCEPT, // ------------------------------------------------------------- // Single symbols /* 4 */ L'.', GLEX_EMPTY, 0, OPATH_TOK_DOT, GLEX_ACCEPT, /* 5 */ '@', GLEX_EMPTY, 0, OPATH_TOK_SINGLETON_SYM, GLEX_ACCEPT, /* 6 */ L'=', GLEX_EMPTY, 0, OPATH_TOK_EQ, GLEX_ACCEPT, /* 7 */ L':', GLEX_EMPTY, 0, OPATH_TOK_COLON, GLEX_ACCEPT, // ------------------------------------------------------------- // Backslashes & forward slashes are interchangeable and reported // as OPATH_TOK_BACKSLASH to the parser. /* 8 */ L'\\', GLEX_EMPTY, 0, OPATH_TOK_BACKSLASH, GLEX_ACCEPT, /* 9 */ L'/', GLEX_EMPTY, 0, OPATH_TOK_BACKSLASH, GLEX_ACCEPT, // ------------------------------------------------------------- // Simple numeric transition. The '-' must be followed // by decimal digit sequence. The '0' may be the beginning of a hex // or a decimal sequence. /* 10 */ L'1', L'9', ST_DECIMAL, 0, GLEX_ACCEPT, /* 11 */ L'-', GLEX_EMPTY, ST_DECIMAL, 0, GLEX_ACCEPT, /* 12 */ L'0', GLEX_EMPTY, ST_NUMERIC, 0, GLEX_ACCEPT, // ------------------------------------------------------------- // Simple string transition // // If a single quote begins the string, it must end the string. // Escapes are not supported: 'ab', 'a"b' // // If a double quote begins the string, it must end the string, // except that escape+quote is an embedded double quote: // // "ab", "a'b", "a\"b" // /* 13 */ L'"', GLEX_EMPTY, ST_DQ_STRING, 0, GLEX_CONSUME, /* 14 */ L'\'', GLEX_EMPTY, ST_SQ_STRING, 0, GLEX_CONSUME, // ------------------------------------------------------------- // Whitespace, newlines, etc. Whitespace is an error. /* 15 */ L' ', GLEX_EMPTY, 0, OPATH_TOK_ERROR, GLEX_ACCEPT|GLEX_RETURN, /* 16 */ L'\t', GLEX_EMPTY, 0, OPATH_TOK_ERROR, GLEX_ACCEPT|GLEX_RETURN, /* 17 */ L'\n', GLEX_EMPTY, 0, OPATH_TOK_ERROR, GLEX_ACCEPT|GLEX_RETURN, /* 18 */ L'\r', GLEX_EMPTY, 0, OPATH_TOK_ERROR, GLEX_ACCEPT|GLEX_RETURN, /* 19 */ 0, GLEX_EMPTY, 0, OPATH_TOK_EOF, GLEX_CONSUME|GLEX_RETURN, // Note forced return /* 20 */ L',', GLEX_EMPTY, 0, OPATH_TOK_COMMA, GLEX_ACCEPT, // All remaining unknown characters /* 21 */ GLEX_ANY, GLEX_EMPTY, 0, OPATH_TOK_ERROR, GLEX_ACCEPT|GLEX_RETURN, // ------------------------------------------------------------- // ST_IDENT // Accepts C/C++ identifiers, plus any char >= U+0080. /* 22 */ L'a', L'z', ST_IDENT, 0, GLEX_ACCEPT, /* 23 */ L'A', L'Z', ST_IDENT, 0, GLEX_ACCEPT, /* 24 */ L'_', GLEX_EMPTY, ST_IDENT, 0, GLEX_ACCEPT, /* 25 */ L'0', L'9', ST_IDENT, 0, GLEX_ACCEPT, /* 26 */ 0x80, 0xfffd, ST_IDENT, 0, GLEX_ACCEPT, /* 27 */ GLEX_ANY, GLEX_EMPTY, 0, OPATH_TOK_IDENT, GLEX_PUSHBACK|GLEX_RETURN, // ------------------------------------------------------------- // ST_NUMERIC // // A zero has been recognized. // If the next char is 'x' or 'X', we have a valid hex sequence. // Otherwise, if '1' to '9' we have a decimal sequence. // /* 28 */ L'x', GLEX_EMPTY, ST_HEX, 0, GLEX_ACCEPT, /* 29 */ L'X', GLEX_EMPTY, ST_HEX, 0, GLEX_ACCEPT, // ------------------------------------------------------------- // ST_DECIMAL // /* 30 */ L'0', L'9', ST_DECIMAL, 0, GLEX_ACCEPT, /* 31 */ GLEX_ANY, GLEX_EMPTY, 0, OPATH_TOK_INT, GLEX_PUSHBACK|GLEX_RETURN, // ------------------------------------------------------------- // ST_HEX // // Recognizes a valid hex sequence. /* 32 */ L'a', L'f', ST_HEX, 0, GLEX_ACCEPT, /* 33 */ L'A', L'F', ST_HEX, 0, GLEX_ACCEPT, /* 34 */ L'0', L'9', ST_HEX, 0, GLEX_ACCEPT, /* 35 */ GLEX_ANY, GLEX_EMPTY, 0, OPATH_TOK_HEXINT, GLEX_PUSHBACK|GLEX_RETURN, // ------------------------------------------------------------- // ST_SQ_STRING : Single quoted strings // // If a single quote begins the string, it must end the string. // Escapes are not supported: 'ab', 'a"b' /* 36 */ L'\n', GLEX_EMPTY, 0, OPATH_TOK_ERROR, GLEX_ACCEPT|GLEX_LINEFEED, /* 37 */ L'\r', GLEX_EMPTY, 0, OPATH_TOK_ERROR, GLEX_ACCEPT|GLEX_LINEFEED, /* 38 */ L'\'', GLEX_EMPTY, 0, OPATH_TOK_QSTRING, GLEX_CONSUME, /* 39 */ GLEX_ANY, GLEX_EMPTY, ST_SQ_STRING, 0, GLEX_ACCEPT, // ------------------------------------------------------------- // ST_DQ_STRING // // If a double quote begins the string, it must end the string, // except that escape+quote is an embedded double quote: // // "ab", "a'b", "a\"b" // /* 40 */ L'\\', GLEX_EMPTY, ST_DQ_STRING_ESC, 0, GLEX_CONSUME, // Escape /* 41 */ L'"', GLEX_EMPTY, 0, OPATH_TOK_QSTRING, GLEX_CONSUME, /* 42 */ L'"', GLEX_EMPTY, ST_DQ_STRING, 0, GLEX_ACCEPT|GLEX_NOT, // Accept anything but a quote //------------------------------------------------------------- // ST_DQ_STRING_ESC // // An escape occurred while in a string. // Either an embedded slash or embedded quote must have occurred. // Otherwise, an unsupported escape has occurred and we fail. /* 43 */ L'\\', GLEX_EMPTY, ST_DQ_STRING, 0, GLEX_ACCEPT, /* 44 */ L'"', GLEX_EMPTY, ST_DQ_STRING, 0, GLEX_ACCEPT, /* 45 */ GLEX_ANY, GLEX_EMPTY, 0, OPATH_TOK_ERROR, GLEX_ACCEPT|GLEX_RETURN, };