Contribute native CTF Parser (bug370499)
[deliverable/tracecompass.git] / org.eclipse.linuxtools.ctf.parser / Grammar / CTFLexer.g
CommitLineData
866e5b51
FC
1lexer grammar CTFLexer;
2
3options {
4 language = Java;
5}
6
7@lexer::header {
8 package org.eclipse.linuxtools.ctf.parser;
9}
10
11/*
12 * Lexer grammers
13 */
14
15/*
16 * Keywords
17 */
18ALIGNTOK : 'align' ;
19CONSTTOK : 'const' ;
20CHARTOK : 'char' ;
21DOUBLETOK : 'double' ;
22ENUMTOK : 'enum' ;
23EVENTTOK : 'event' ;
24FLOATINGPOINTTOK : 'floating_point' ;
25FLOATTOK : 'float' ;
26INTEGERTOK : 'integer' ;
27INTTOK : 'int' ;
28LONGTOK : 'long' ;
29SHORTTOK : 'short' ;
30SIGNEDTOK : 'signed' ;
31STREAMTOK : 'stream' ;
32STRINGTOK : 'string' ;
33STRUCTTOK : 'struct' ;
34TRACETOK : 'trace' ;
35TYPEALIASTOK : 'typealias' ;
36TYPEDEFTOK : 'typedef' ;
37UNSIGNEDTOK : 'unsigned' ;
38VARIANTTOK : 'variant' ;
39VOIDTOK : 'void' ;
40BOOLTOK : '_Bool' ;
41COMPLEXTOK : '_Complex' ;
42IMAGINARYTOK : '_Imaginary' ;
43ENVTOK : 'env' ;
44CLOCKTOK : 'clock' ;
45
46/*
47 * Spec still to come.
48 */
49NANNUMBERTOK : 'NaN' ;
50INFINITYTOK : '+inf' ;
51NINFINITYTOK : '-inf' ;
52
53/*
54 * Symbols
55 */
56SEPARATOR : ',' ;
57COLON : ':' ;
58ELIPSES : '...' ;
59ASSIGNMENT : '=' ;
60TYPE_ASSIGNMENT : ':=' ;
61LT : '<' ;
62GT : '>' ;
63OPENBRAC : '[' ;
64CLOSEBRAC : ']' ;
65LPAREN : '(' ;
66RPAREN : ')' ;
67LCURL : '{' ;
68RCURL : '}' ;
69TERM : ';' ;
70POINTER : '*' ;
71SIGN : '+' | '-' ;
72ARROW : '->' ;
73DOT : '.' ;
74fragment BACKSLASH : '\\' ;
75
76/*
77 * Boolean literals
78 * - We better leave them as identifiers and numbers...
79 */
80/*TRUE : 'true' | 'TRUE' ;
81FALSE : 'false' | 'FALSE' ;
82ZERO : '0' ;
83ONE : '1' ;*/
84
85
86/*
87 * Integer literals
88 */
89OCTAL_LITERAL : '0' ('0'..'7')+ INTEGER_TYPES_SUFFIX? ;
90
91DECIMAL_LITERAL : DIGIT+ INTEGER_TYPES_SUFFIX? ;
92
93HEX_LITERAL : HEX_PREFIX HEX_DIGIT+ INTEGER_TYPES_SUFFIX? ;
94fragment HEX_DIGIT : DIGIT | ('a'..'f') | ('A'..'F') ;
95fragment HEX_PREFIX : '0' ('x' | 'X') ;
96
97/* Helpers for integer literals */
98fragment DIGIT : '0'..'9' ;
99fragment NONZERO_DIGIT : '1'..'9' ;
100
101
102/**
103 * Integer suffix for long, long long and unsigned.
104 *
105 * Matches all possible combination of L, LL and U.
106 */
107fragment INTEGER_TYPES_SUFFIX :
108 ('l' ('l')? | 'L' ('L')?) // l, ll
109 | ('u' | 'U') // u
110 | ('u' | 'U') ('l' ('l')? | 'L' ('L')?) // ul, ull
111 | ('l' ('l')? | 'L' ('L')?) ('u'| 'U') // lu, llu
112 ;
113
114/**
115 * Escape sequences
116 */
117fragment ESCAPE_SEQUENCE :
118 BACKSLASH ('\'' | '"' | '?' | BACKSLASH | 'a' | 'b' | 'f' | 'n' | 'r' | 't' | 'v' )
119 | OCTAL_ESCAPE
120 | UNICODE_ESCAPE
121 | HEXADECIMAL_ESCAPE
122 ;
123
124/**
125 * Octal escape sequence
126 */
127fragment OCTAL_ESCAPE :
128 BACKSLASH ('0'..'3') ('0'..'7') ('0'..'7')
129 | BACKSLASH ('0'..'7') ('0'..'7')
130 | BACKSLASH ('0'..'7')
131 ;
132
133/**
134 * Hexadecimal escape sequence
135 */
136fragment HEXADECIMAL_ESCAPE : BACKSLASH 'x' HEX_DIGIT+ ;
137
138/**
139 * Unicode escape sequence
140 */
141fragment UNICODE_ESCAPE :
142 BACKSLASH 'u' HEX_DIGIT HEX_DIGIT HEX_DIGIT HEX_DIGIT
143 | BACKSLASH 'U' HEX_DIGIT HEX_DIGIT HEX_DIGIT HEX_DIGIT HEX_DIGIT HEX_DIGIT HEX_DIGIT HEX_DIGIT
144 ;
145
146
147/* Used in both character and string literal */
148fragment STRINGPREFIX : 'L';
149
150/*
151 * Character literal
152 */
153CHARACTER_LITERAL : STRINGPREFIX? SINGLEQUOTE CHAR_CONTENT+ SINGLEQUOTE ;
154fragment CHAR_CONTENT : (ESCAPE_SEQUENCE | ~(BACKSLASH | SINGLEQUOTE)) ;
155fragment SINGLEQUOTE : '\'';
156
157/*
158 * String literal
159 */
160STRING_LITERAL : STRINGPREFIX? DOUBLEQUOTE STRING_CONTENT* DOUBLEQUOTE ;
161fragment STRING_CONTENT : (ESCAPE_SEQUENCE | ~(BACKSLASH | DOUBLEQUOTE)) ;
162fragment DOUBLEQUOTE : '"' ;
163
164/**
165 * Whitespaces
166 */
167WS : (' ' | '\r' | '\t' | '\u000C' | '\n') { $channel=HIDDEN; } ;
168
169/**
170 * Multiline comment
171 */
172// About the greedy option: see page 100-101 of The Definitive ANTLR reference
173// COMMENT : '/*' ( options {greedy=false;} : . )* '*/' {$channel=HIDDEN;} ;
174COMMENT : COMMENT_OPEN .* COMMENT_CLOSE { $channel = HIDDEN; } ;
175fragment COMMENT_OPEN : '/*';
176fragment COMMENT_CLOSE : '*/';
177
178/**
179 * Single line comment
180 */
181LINE_COMMENT : '//' ~('\n'|'\r')* '\r'? '\n' {$channel=HIDDEN;} ;
182
183/**
184 * Identifiers
185 */
186IDENTIFIER : NONDIGIT (NONDIGIT | DIGIT)* ;
187fragment NONDIGIT : ('_') | ('A'..'Z') | ('a'..'z') ;
This page took 0.029641 seconds and 5 git commands to generate.