added any2unistr predefined function (artf724008)
[deliverable/titan.core.git] / compiler2 / ttcn3 / compiler.l
CommitLineData
970ed795 1/******************************************************************************
d44e3c4f 2 * Copyright (c) 2000-2016 Ericsson Telecom AB
970ed795
EL
3 * All rights reserved. This program and the accompanying materials
4 * are made available under the terms of the Eclipse Public License v1.0
5 * which accompanies this distribution, and is available at
6 * http://www.eclipse.org/legal/epl-v10.html
d44e3c4f 7 *
8 * Contributors:
9 * Baji, Laszlo
10 * Balasko, Jeno
11 * Baranyi, Botond
12 * Cserveni, Akos
13 * Delic, Adam
14 * Feher, Csaba
15 * Forstner, Matyas
16 * Kovacs, Ferenc
17 * Kremer, Peter
18 * Raduly, Csaba
19 * Szabados, Kristof
19700695 20 * Szabo, Bence Janos
d44e3c4f 21 * Szabo, Janos Zoltan – initial implementation
22 * Zalanyi, Balazs Andor
23 *
970ed795
EL
24 ******************************************************************************/
25%option noyywrap
26%option never-interactive
27%option nounput
28%{
29
30/* Tokenizer for TTCN-3 Core Language */
31
32#include "../../common/dbgnew.hh"
33#include "compiler.h"
34#include "../string.hh"
35#include "../CompilerError.hh"
36#include "../Real.hh"
37#include "../Value.hh"
38#include "AST_ttcn3.hh"
39#include "Ttcnstuff.hh" // at least for PortTypeBody::PortOperationMode_t
40#include "Statement.hh" // for Statement::statementtype_t
41#include "Attributes.hh"
42
43#include <string.h>
44#include <ctype.h>
45#include <openssl/md5.h>
46
47namespace Common {
48 class IndexedValue;
49 class Location;
50}
51
52namespace Ttcn {
53 class ParamRedirect;
54 class Statement;
55 class AltGuard;
56 class IfClause;
57 class IfClauses;
58 class NamedTemplate;
59 class NamedTemplates;
60 class IndexedTemplate;
61 class IndexedTemplates;
62 class Templates;
63 class CompTypeRefList;
64}
65
66using namespace Common;
67using namespace Ttcn;
68
69#include "compiler.tab.hh"
70
71#define yylval ttcn3_lval
72#define yylloc ttcn3_lloc
73
74/* global variable indicating the location of the returned token to bison */
75extern YYLTYPE yylloc;
76
77extern bool is_erroneous_parsed;
78
79/* always points to the first character of the regexp to be recognized */
80static int current_line, current_column;
81
82/* when reporting an error in linemarker or preprocessor
83 * directive the real file name and line number is needed */
84static const char* real_infile;
85/* real_lineno = current_line + real_lineno_offset */
86static int real_lineno_offset;
87
88static bool dot_flag = false;
89/* type of the backup token (that was found after a dot) */
90static int backup_token;
91/* semantic value of the backup token */
92static YYSTYPE backup_lval;
93/* location of the backup token */
94static YYLTYPE backup_lloc;
95
96static MD5_CTX md5_ctx;
97
98static void fill_location()
99{
100 yylloc.first_line = current_line;
101 yylloc.first_column = current_column;
102 current_column += yyleng;
103 yylloc.last_line = current_line;
104 yylloc.last_column = current_column;
105}
106
107static void update_md5()
108{
109 MD5_Update(&md5_ctx, yytext, yyleng);
110 MD5_Update(&md5_ctx, " ", 1);
111}
112
/* Returns the '.' token whose position was remembered in dot_line/dot_column.
 * The first character of yytext is overwritten with NUL before returning, so
 * anything that needs the current match must read it before using this macro.
 * dot_flag is not modified here. */
#define RETURN_SAVED_DOT \
  do { \
    *yytext = '\0'; \
    yylloc.first_line = yylloc.last_line = dot_line; \
    yylloc.first_column = dot_column; \
    yylloc.last_column = dot_column + 1; \
    return '.'; \
  } while (0)
122
/* Return macro for simple tokens that carry no semantic value.
 * When a dot is pending (dot_flag), the token and its location are parked in
 * backup_token/backup_lloc and the pending dot is returned instead.
 * ret_val is stored before RETURN_SAVED_DOT modifies yytext, which matters
 * for uses such as RETURN(*yytext). */
#define RETURN(ret_val) \
  do { \
    update_md5(); \
    fill_location(); \
    if (!dot_flag) return ret_val; \
    backup_token = ret_val; \
    backup_lloc = yylloc; \
    RETURN_SAVED_DOT; \
  } while (0)
134
/* Variant of RETURN(ret_val) that leaves yylloc and current_column alone;
 * meant for rules that have already set the location themselves, usually
 * after reporting an error. */
#define RETURN_NOLOCUPD(ret_val) \
  do { \
    update_md5(); \
    if (!dot_flag) return ret_val; \
    backup_token = ret_val; \
    backup_lloc = yylloc; \
    RETURN_SAVED_DOT; \
  } while (0)
146
/* Return macro for tokens that carry a semantic value. The caller fills in
 * yylval first; when a dot is pending the value is parked in backup_lval
 * together with the token and its location, and the dot is returned. */
#define RETURN_LVAL(ret_val) \
  do { \
    update_md5(); \
    fill_location(); \
    if (!dot_flag) return ret_val; \
    backup_token = ret_val; \
    backup_lval = yylval; \
    backup_lloc = yylloc; \
    RETURN_SAVED_DOT; \
  } while (0)
159
/* Return macro for keywords that are glued together with a preceding dot.
 * With a pending dot the combined token Dot<ret_val> is returned and its
 * location spans from the dot to the end of the keyword; without one the
 * plain keyword token is returned. */
#define RETURN_DOT(ret_val) \
  do { \
    update_md5(); \
    if (!dot_flag) { \
      fill_location(); \
      return ret_val; \
    } \
    dot_flag = false; \
    current_column += yyleng; \
    yylloc.first_line = dot_line; \
    yylloc.first_column = dot_column; \
    yylloc.last_line = current_line; \
    yylloc.last_column = current_column; \
    return Dot##ret_val; \
  } while (0)
177
178extern string *parse_charstring_value(const char *str, const Location& loc);
179
180%}
181
182NUMBER 0|([1-9][0-9]*)
183
184FLOAT ({NUMBER}\.[0-9]+)|({NUMBER}(\.[0-9]+)?[Ee][+-]?{NUMBER})
185
186IDENTIFIER [A-Za-z][A-Za-z0-9_]*
187
188LINECOMMENT "//"[^\r\n]*
189
190WHITESPACE [ \t\v\f]
191
192NEWLINE \r|\n|\r\n
193
194LINEMARKER {NUMBER}{WHITESPACE}+\"([^\\\"\r\n]|\\[^\r\n])*\"
195
19700695 196UID [uU][+]?[0-9A-Fa-f]{1,8}
197
970ed795
EL
198TITAN "$#&&&(#TITANERRONEOUS$#&&^#% "
199
200%x SC_blockcomment SC_cstring
201%x SC_binstring SC_binstring_bad
19700695 202%s SC_charkeyword
970ed795
EL
203
204%%
205 /* local variables of yylex() */
206 int start_line = 0, start_column = 0; /**< used by block comments and
207 string literals */
208 int dot_line = 0, dot_column = 0; /**< location of the previous '.' token */
209 /* variables used when processing binary strings */
210 expstring_t binstr = NULL; /**< the string itself */
211 bool valid_bit = false, /**< binstr is valid bitstring */
212 valid_oct = false, /**< binstr is valid octetstring */
213 half_oct = false, /**< binstr is not a valid octetstr but a valid hexstr */
214 contains_match = false, /**< binstr contains matching symbol */
215 contains_ws = false; /**< binstr contains whitespace characters */
216
217 if (dot_flag) {
218 if (backup_token == '.') {
219 /* Two dots were found in the previous call: the first one was returned,
220 * the second one is now in the backup. Let's assume that we have just
221 * found the second one. */
222 dot_line = backup_lloc.first_line;
223 dot_column = backup_lloc.first_column;
224 } else {
225 /* Return the token and its semantic value that was backed up after the
226 * last token (which was a dot). */
227 dot_flag = false;
228 yylval = backup_lval;
229 yylloc = backup_lloc;
230 return backup_token;
231 }
232 }
233
234
{TITAN} {
  // hack: to avoid the erroneous parsing reporting a syntax error where it
  // also lists TTCN3ModuleKeyword as a possible nonterminal to use
  if (is_erroneous_parsed) {
    RETURN(TitanErroneousHackKeyword);
  } else {
    /* The marker is only legal while parsing erroneous attributes. Report it
     * and skip it. fill_location() is used (as in the other error-only
     * rules) because it also advances current_column; without that every
     * following token on the line would get a column yyleng too small. */
    fill_location();
    Location loc(infile, yylloc);
    loc.error("Unexpected `%s'.", yytext);
  }
}
246
247 /* Eat up comments and whitespaces */
248
"/*" {
  /* remember where the comment opens; the <<EOF>> rule uses this position
   * when it reports an unterminated block comment */
  start_line = current_line;
  start_column = current_column;
  current_column += yyleng;
  BEGIN(SC_blockcomment);
}

<SC_blockcomment> /* -------- SC_blockcomment scope -------------- */
{

  "*/" {
    current_column += yyleng;
    BEGIN(INITIAL);
  }

  {NEWLINE} {
    ++current_line;
    current_column = 0;
  }

  . ++current_column;

} /* SC_blockcomment */
272
273{LINECOMMENT}?{NEWLINE} {
274 current_line++;
275 current_column = 0;
276}
277
278{LINECOMMENT} {
970ed795
EL
279 current_column += yyleng;
280}
281
282{WHITESPACE}+ current_column += yyleng;
283
284 /* C preprocessor line markers */
285
^{WHITESPACE}*"#"({WHITESPACE}*"line")?{WHITESPACE}+{LINEMARKER}[^\r\n]*{NEWLINE} {
  /* Preprocessor line marker: '#', an optional "line", a line number and a
   * quoted file name. On success infile/current_line are switched to the
   * values given in the marker; errors inside the marker are reported at the
   * position in the file that is really being read (real_infile and
   * real_lineno). */
  bool error_flag = false;
  int real_lineno = current_line + real_lineno_offset;
  /* skipping the leading whitespaces */
  int marker_begin = 0;
  while (yytext[marker_begin] != '#') marker_begin++;
  /* skipping the trailing whitespaces and newline */
  int marker_end = yyleng - 1;
  while (yytext[marker_end] == '\r' || yytext[marker_end] == '\n' ||
    yytext[marker_end] == ' ' || yytext[marker_end] == '\t') marker_end--;
  marker_end++;
  Location loc(real_infile, real_lineno, current_column + marker_begin,
    real_lineno, current_column + marker_end);
  Error_Context cntxt(&loc, "In preprocessor line marker");
  /* parsing out the line number */
  int lineno_begin = marker_begin + 1;
  while (!isdigit((unsigned char)yytext[lineno_begin])) lineno_begin++;
  int lineno_end = lineno_begin + 1;
  /* <ctype.h> functions need a value representable as unsigned char */
  while (isdigit((unsigned char)yytext[lineno_end])) lineno_end++;
  errno = 0;
  long parsed_lineno = strtol(yytext + lineno_begin, NULL, 10);
  int new_lineno = (int)parsed_lineno;
  /* strtol() flags only values that do not fit into long; a number that fits
   * into long but not into int would otherwise be truncated silently */
  if (errno == 0 && (long)new_lineno != parsed_lineno) errno = ERANGE;
  if (errno != 0) {
    Location lineno_loc(real_infile, real_lineno, current_column + lineno_begin,
      real_lineno, current_column + lineno_end);
    string lineno_str(lineno_end - lineno_begin, yytext + lineno_begin);
    lineno_loc.error("Line number `%s' is too large for being represented in "
      "memory: %s", lineno_str.c_str(), strerror(errno));
    error_flag = true;
  }
  /* parsing out the file name */
  int filename_begin = lineno_end + 1;
  while (yytext[filename_begin] != '"') filename_begin++;
  filename_begin++;
  int filename_end = filename_begin;
  while (yytext[filename_end] != '"') {
    /* a backslash escapes the next character, which may be a quote */
    if (yytext[filename_end] == '\\') filename_end += 2;
    else filename_end++;
  }
  Location filename_loc(real_infile, real_lineno, current_column +
    filename_begin - 1, real_lineno, current_column + filename_end + 1);
  string filename_str(filename_end - filename_begin, yytext + filename_begin);
  string *parsed_filename = parse_charstring_value(filename_str.c_str(),
    filename_loc);
  if (!parsed_filename) error_flag = true;
  /* updating the line/column counters */
  if (error_flag) {
    /* the line marker is erroneous, use the real line numbers */
    infile = real_infile;
    current_line = real_lineno + 1;
    real_lineno_offset = 0;
  } else {
    /* set the given line number */
    infile = Location::add_source_file_name(*parsed_filename);
    current_line = new_lineno;
    real_lineno_offset = real_lineno + 1 - new_lineno;
  }
  current_column = 0;
  delete parsed_filename;
}
345
^{WHITESPACE}*"#"[^\r\n]* {
  /* Any other line whose first non-blank character is '#': report it at the
   * position in the file that is really being read and skip the line. */
  const int real_lineno = current_line + real_lineno_offset;
  /* index of the '#' that follows the leading whitespace */
  int first = 0;
  while (yytext[first] != '#') ++first;
  /* index just past the last character that is not a blank or a tab */
  int past_last = yyleng;
  while (yytext[past_last - 1] == ' ' || yytext[past_last - 1] == '\t')
    --past_last;
  Location loc(real_infile, real_lineno, current_column + first,
    real_lineno, current_column + past_last);
  loc.error("Invalid/unsupported preprocessor directive or line marker: `%s'",
    string(past_last - first, yytext + first).c_str());
  current_column += yyleng;
}
360
361 /* Keywords */
362
363action RETURN(ActionKeyword);
364activate RETURN(ActivateKeyword);
365address RETURN(AddressKeyword);
366alive RETURN_DOT(AliveKeyword);
367all RETURN(AllKeyword);
368alt RETURN(AltKeyword);
369altstep RETURN(AltstepKeyword);
370and RETURN(AndKeyword);
371and4b RETURN(And4bKeyword);
372any RETURN(AnyKeyword);
373anytype RETURN(AnyTypeKeyword);
374apply RETURN_DOT(ApplyKeyword);
375bitstring RETURN(BitStringKeyword);
376boolean RETURN(BooleanKeyword);
377break RETURN(BreakKeyword);
378call RETURN_DOT(CallOpKeyword);
379case RETURN(CaseKeyword);
380catch RETURN_DOT(CatchOpKeyword);
19700695 381char { BEGIN(SC_charkeyword); RETURN(CharKeyword); }
970ed795
EL
382charstring RETURN(CharStringKeyword);
383check RETURN_DOT(CheckOpKeyword);
384clear RETURN_DOT(ClearOpKeyword);
385complement RETURN(ComplementKeyword);
386component RETURN(ComponentKeyword);
387connect RETURN(ConnectKeyword);
388const RETURN(ConstKeyword);
389continue RETURN(ContinueKeyword);
390control RETURN(ControlKeyword);
391create RETURN_DOT(CreateKeyword);
392deactivate RETURN(DeactivateKeyword);
393default RETURN(DefaultKeyword);
394derefers RETURN(DerefersKeyword);
395disconnect RETURN(DisconnectKeyword);
396display RETURN(DisplayKeyword);
397do RETURN(DoKeyword);
398done RETURN_DOT(DoneKeyword);
399else RETURN(ElseKeyword);
400encode RETURN(EncodeKeyword);
401enumerated RETURN(EnumKeyword);
402error RETURN(ErrorKeyword);
403except RETURN(ExceptKeyword);
404exception RETURN(ExceptionKeyword);
405execute RETURN(ExecuteKeyword);
406extends RETURN(ExtendsKeyword);
407extension RETURN(ExtensionKeyword);
408external RETURN(ExtKeyword);
409fail RETURN(FailKeyword);
410false RETURN(FalseKeyword);
411float RETURN(FloatKeyword);
412for RETURN(ForKeyword);
413friend RETURN(FriendKeyword);
414from RETURN(FromKeyword);
415function RETURN(FunctionKeyword);
416getcall RETURN_DOT(GetCallOpKeyword);
417getreply RETURN_DOT(GetReplyOpKeyword);
418getverdict RETURN(GetVerdictKeyword);
419goto RETURN(GotoKeyword);
420group RETURN(GroupKeyword);
421halt RETURN_DOT(HaltKeyword);
422hexstring RETURN(HexStringKeyword);
423if RETURN(IfKeyword);
424ifpresent RETURN(IfPresentKeyword);
425import RETURN(ImportKeyword);
426in RETURN(InParKeyword);
427inconc RETURN(InconcKeyword);
428infinity RETURN(InfinityKeyword);
429inout RETURN(InOutParKeyword);
430integer RETURN(IntegerKeyword);
431interleave RETURN(InterleavedKeyword);
432kill RETURN_DOT(KillKeyword);
433killed RETURN_DOT(KilledKeyword);
434label RETURN(LabelKeyword);
435language RETURN(LanguageKeyword);
436length RETURN(LengthKeyword);
437log RETURN(LogKeyword);
438map RETURN(MapKeyword);
439match RETURN(MatchKeyword);
440message RETURN(MessageKeyword);
441mixed RETURN(MixedKeyword);
442mod RETURN(ModKeyword);
443modifies RETURN(ModifiesKeyword);
444module RETURN(TTCN3ModuleKeyword);
445modulepar RETURN(ModuleParKeyword);
446mtc RETURN(MTCKeyword);
447noblock RETURN(NoBlockKeyword);
448none RETURN(NoneKeyword);
449not RETURN(NotKeyword);
450not_a_number RETURN(NaNKeyword);
451not4b RETURN(Not4bKeyword);
452nowait RETURN(NowaitKeyword);
453null RETURN(NullKeyword);
454objid RETURN(ObjectIdentifierKeyword);
455octetstring RETURN(OctetStringKeyword);
456of RETURN(OfKeyword);
457omit RETURN(OmitKeyword);
458on RETURN(OnKeyword);
459optional RETURN(OptionalKeyword);
460or RETURN(OrKeyword);
461or4b RETURN(Or4bKeyword);
462out RETURN(OutParKeyword);
463override RETURN(OverrideKeyword);
464param RETURN(ParamKeyword);
465pass RETURN(PassKeyword);
466pattern RETURN(PatternKeyword);
467permutation RETURN(PermutationKeyword);
468port RETURN(PortKeyword);
469present RETURN(PresentKeyword);
470private RETURN(PrivateKeyword);
471procedure RETURN(ProcedureKeyword);
472public RETURN(PublicKeyword);
473raise RETURN_DOT(RaiseKeyword);
474read RETURN_DOT(ReadKeyword);
475receive RETURN_DOT(ReceiveOpKeyword);
476record RETURN(RecordKeyword);
477recursive RETURN(RecursiveKeyword);
478refers RETURN(RefersKeyword);
479rem RETURN(RemKeyword);
480repeat RETURN(RepeatKeyword);
481reply RETURN_DOT(ReplyKeyword);
482return RETURN(ReturnKeyword);
483running RETURN_DOT(RunningKeyword);
484runs RETURN(RunsKeyword);
485select RETURN(SelectKeyword);
486self RETURN(SelfKeyword);
487send RETURN_DOT(SendOpKeyword);
488sender RETURN(SenderKeyword);
489set RETURN(SetKeyword);
490setverdict RETURN(SetVerdictKeyword);
491signature RETURN(SignatureKeyword);
492start RETURN_DOT(StartKeyword);
493stop RETURN_DOT(StopKeyword);
494subset RETURN(SubsetKeyword);
495superset RETURN(SupersetKeyword);
496system RETURN(SystemKeyword);
497template RETURN(TemplateKeyword);
498testcase RETURN(TestcaseKeyword);
499timeout RETURN_DOT(TimeoutKeyword);
500timer RETURN(TimerKeyword);
501to RETURN(ToKeyword);
502trigger RETURN_DOT(TriggerOpKeyword);
503true RETURN(TrueKeyword);
504type RETURN(TypeDefKeyword);
505union RETURN(UnionKeyword);
506universal RETURN(UniversalKeyword);
507unmap RETURN(UnmapKeyword);
508value RETURN(ValueKeyword);
509valueof RETURN(ValueofKeyword);
510var RETURN(VarKeyword);
511variant RETURN(VariantKeyword);
512verdicttype RETURN(VerdictTypeKeyword);
513while RETURN(WhileKeyword);
514with RETURN(WithKeyword);
515xor RETURN(XorKeyword);
516xor4b RETURN(Xor4bKeyword);
517
feade998 518 /* modifier keywords */
519
520"@nocase" RETURN(NocaseKeyword);
521"@lazy" RETURN(LazyKeyword);
522
970ed795
EL
523 /* special TITAN specific keywords */
524
525"@try" RETURN(TitanSpecificTryKeyword);
526"@catch" RETURN(TitanSpecificCatchKeyword);
a38c6d4c 527"@profiler" RETURN(TitanSpecificProfilerKeyword);
970ed795 528
feade998 529
970ed795
EL
530 /* Predefined function identifiers */
531
532bit2hex RETURN(bit2hexKeyword);
533bit2int RETURN(bit2intKeyword);
534bit2oct RETURN(bit2octKeyword);
535bit2str RETURN(bit2strKeyword);
536char2int RETURN(char2intKeyword);
537char2oct RETURN(char2octKeyword);
538decomp RETURN(decompKeyword);
539float2int RETURN(float2intKeyword);
540float2str RETURN(float2strKeyword);
541hex2bit RETURN(hex2bitKeyword);
542hex2int RETURN(hex2intKeyword);
543hex2oct RETURN(hex2octKeyword);
544hex2str RETURN(hex2strKeyword);
545int2bit RETURN(int2bitKeyword);
546int2char RETURN(int2charKeyword);
3abe9331 547int2enum RETURN(int2enumKeyword);
970ed795
EL
548int2float RETURN(int2floatKeyword);
549int2hex RETURN(int2hexKeyword);
550int2oct RETURN(int2octKeyword);
551int2str RETURN(int2strKeyword);
552int2unichar RETURN(int2unicharKeyword);
553isvalue RETURN(isvalueKeyword);
554isbound RETURN(isboundKeyword);
555ischosen RETURN(ischosenKeyword);
556ispresent RETURN(ispresentKeyword);
557lengthof RETURN(lengthofKeyword);
558oct2bit RETURN(oct2bitKeyword);
559oct2char RETURN(oct2charKeyword);
560oct2hex RETURN(oct2hexKeyword);
561oct2int RETURN(oct2intKeyword);
562oct2str RETURN(oct2strKeyword);
563regexp RETURN(regexpKeyword);
564replace RETURN(replaceKeyword);
565rnd RETURN(rndKeyword);
566sizeof RETURN(sizeofKeyword);
567str2bit RETURN(str2bitKeyword);
568str2float RETURN(str2floatKeyword);
569str2hex RETURN(str2hexKeyword);
570str2int RETURN(str2intKeyword);
571str2oct RETURN(str2octKeyword);
572substr RETURN(substrKeyword);
573unichar2int RETURN(unichar2intKeyword);
574unichar2char RETURN(unichar2charKeyword);
575log2str RETURN(log2strKeyword);
576enum2int RETURN(enum2intKeyword);
577encvalue RETURN(encvalueKeyword);
578decvalue RETURN(decvalueKeyword);
579testcasename RETURN(testcasenameKeyword);
580ttcn2string RETURN(ttcn2stringKeyword);
581string2ttcn RETURN(string2ttcnKeyword);
582unichar2oct RETURN(unichar2octKeyword);
583oct2unichar RETURN(oct2unicharKeyword);
584remove_bom RETURN(remove_bomKeyWord);
585get_stringencoding RETURN(get_stringencodingKeyWord);
586encode_base64 RETURN(encode_base64KeyWord);
587decode_base64 RETURN(decode_base64KeyWord);
1d0599f0 588encvalue_unichar RETURN(encvalue_unicharKeyWord);
589decvalue_unichar RETURN(decvalue_unicharKeyWord);
a50716c1 590any2unistr RETURN(any2unistrKeyWord);
970ed795
EL
591
592 /* Values */
593
594{NUMBER} {
595 Location loc(infile, current_line, current_column, current_line,
596 current_column + yyleng);
597 yylval.int_val = new int_val_t(yytext, loc);
598 RETURN_LVAL(Number);
599}
600
601{FLOAT} {
602 Location loc(infile, current_line, current_column, current_line,
603 current_column + yyleng);
604 yylval.float_val = string2Real(yytext, loc);
605 RETURN_LVAL(FloatValue);
606}
607
608NULL RETURN(NullValue);
609
610"'" {
611 binstr=memptystr();
612 valid_bit=true;
613 valid_oct=true;
614 half_oct=false;
615 contains_match=false;
616 contains_ws=false;
617 start_line = current_line;
618 start_column = current_column;
619 current_column++;
620 MD5_Update(&md5_ctx, yytext, yyleng);
621 BEGIN(SC_binstring);
622}
623
624\" {
625 yylval.str = memptystr();
626 start_line = current_line;
627 start_column = current_column;
628 current_column++;
629 MD5_Update(&md5_ctx, yytext, yyleng);
630 BEGIN(SC_cstring);
19700695 631}
632
633<SC_charkeyword>
634{
635 {UID} {
636 yylval.str = mcopystrn(yytext, yyleng);
637 RETURN_LVAL(Cstring);
638 }
639
640 [,] { RETURN(*yytext); }
641
642 [)] { BEGIN(INITIAL); RETURN(*yytext); }
970ed795
EL
643}
644
645<SC_binstring> /* -------- SC_binstring scope -------------- */
646{
647
648 {WHITESPACE}+ {
649 contains_ws = true;
650 current_column += yyleng;
651 }
652
653 {WHITESPACE}*{NEWLINE} {
654 contains_ws = true;
655 current_line++;
656 current_column = 0;
657 }
658
659 [01] {
660 binstr = mputc(binstr, yytext[0]);
661 half_oct = !half_oct;
662 current_column++;
663 }
664
665 [2-9A-F] {
666 binstr = mputc(binstr, yytext[0]);
667 valid_bit = false;
668 half_oct = !half_oct;
669 current_column++;
670 }
671
672 [a-f] {
673 binstr = mputc(binstr, yytext[0] - 'a' + 'A');
674 valid_bit = false;
675 half_oct = !half_oct;
676 current_column++;
677 }
678
679 "?"|"*" {
680 binstr = mputc(binstr, yytext[0]);
681 contains_match = true;
682 if (half_oct) valid_oct = false;
683 current_column++;
684 }
685
686 "'"[bBhHoO] {
687 yylloc.first_line = start_line;
688 yylloc.first_column = start_column;
689 yylloc.last_line = current_line;
690 yylloc.last_column = current_column + 2;
691 Location loc(infile, yylloc);
692 int ret_val = TOK_errval;
693 switch (yytext[1]) {
694 case 'b': {
695 Location loc2(infile, current_line, current_column + 1, current_line,
696 current_column + 2);
697 loc2.warning("The last character of a bitstring literal should be "
698 "`B' instead of `b'");
699 /* no break */ }
700 case 'B':
701 if (valid_bit) {
702 if (contains_ws) loc.warning("Bitstring %s contains whitespace and/or "
703 "newline character(s)", contains_match ? "match" : "value");
704 ret_val = contains_match ? BitStringMatch : Bstring;
705 yylval.string_val = new string(binstr);
706 } else loc.error("Bitstring value contains invalid character");
707 break;
708 case 'h': {
709 Location loc2(infile, current_line, current_column + 1, current_line,
710 current_column + 2);
711 loc2.warning("The last character of a hexstring literal should be "
712 "`H' instead of `h'");
713 /* no break */ }
714 case 'H':
715 if (contains_ws) loc.warning("Hexstring %s contains whitespace and/or "
716 "newline character(s)", contains_match ? "match" : "value");
717 ret_val = contains_match ? HexStringMatch : Hstring;
718 yylval.string_val = new string(binstr);
719 break;
720 case 'o': {
721 Location loc2(infile, current_line, current_column + 1, current_line,
722 current_column + 2);
723 loc2.warning("The last character of an octetstring literal should be "
724 "`O' instead of `o'");
725 /* no break */ }
726 case 'O':
727 if (valid_oct && !half_oct) {
728 if (contains_ws) loc.warning("Octetstring %s contains whitespace "
729 "and/or newline character(s)", contains_match ? "match" : "value");
730 ret_val = contains_match ? OctetStringMatch : Ostring;
731 yylval.string_val = new string(binstr);
732 } else if (contains_match) {
733 loc.error("Octetstring match contains half octet(s)");
734 } else {
735 loc.error("Octetstring value contains odd number of hexadecimal "
736 "digits");
737 }
738 }
739 MD5_Update(&md5_ctx, binstr, strlen(binstr));
740 Free(binstr);
741 update_md5();
742 BEGIN(INITIAL);
743 current_column += 2;
744 if (dot_flag) {
745 backup_token = ret_val;
746 backup_lval = yylval;
747 backup_lloc = yylloc;
748 RETURN_SAVED_DOT;
749 } else return ret_val;
750 }
751
752 "'" {
753 yylloc.first_line = start_line;
754 yylloc.first_column = start_column;
755 current_column++;
756 yylloc.last_line = current_line;
757 yylloc.last_column = current_column;
758 Location loc(infile, yylloc);
759 loc.error("Invalid binary string literal. Expecting `B', `H' or `O' after "
760 "the closing `''");
761 MD5_Update(&md5_ctx, binstr, strlen(binstr));
762 Free(binstr);
763 BEGIN(INITIAL);
764 RETURN_NOLOCUPD(TOK_errval);
765 }
766
767 . {
768 Location loc(infile, current_line, current_column, current_line,
769 current_column + 1);
770 int c = (unsigned char)yytext[0];
771 loc.error("Invalid character `%c' (0x%02X) in binary string",
772 isprint(c) ? c : '?', c);
773 MD5_Update(&md5_ctx, binstr, strlen(binstr));
774 Free(binstr);
775 MD5_Update(&md5_ctx, yytext, 1);
776 current_column++;
777 BEGIN(SC_binstring_bad);
778 }
779
780} /* SC_binstring scope */
781
782<SC_binstring_bad> /* -------- SC_binstring_bad scope -------------- */
783{
784
785 {WHITESPACE}+ current_column += yyleng;
786
787 {WHITESPACE}*{NEWLINE} {
788 current_line++;
789 current_column = 0;
790 }
791
792 "'"[bBhHoO]? {
793 current_column += yyleng;
794 yylloc.first_line = start_line;
795 yylloc.first_column = start_column;
796 yylloc.last_line = current_line;
797 yylloc.last_column = current_column;
798 BEGIN(INITIAL);
799 RETURN_NOLOCUPD(TOK_errval);
800 }
801
802 . {
803 MD5_Update(&md5_ctx, yytext, yyleng);
804 current_column++;
805 }
806
807} /* SC_binstring_bad scope */
808
<SC_cstring> /* -------- SC_cstring scope -------------- */
{

  \\?{NEWLINE} { /* line break inside the literal, optionally escaped */
    yylval.str = mputstr(yylval.str, yytext);
    ++current_line;
    current_column = 0;
  }

  \"\"|\\. { /* doubled quote or backslash escape: always two characters */
    /* Both characters are stored ("external representation");
     * parse_charstring_value() in charstring_la.l is responsible
     * for transforming the string to "internal representation" */
    yylval.str = mputstr(yylval.str, yytext);
    current_column += yyleng;
  }

  \" { /* closing quote: the literal is complete */
    ++current_column;
    yylloc.first_line = start_line;
    yylloc.first_column = start_column;
    yylloc.last_line = current_line;
    yylloc.last_column = current_column;
    /* the checksum covers the collected text and then the closing quote */
    MD5_Update(&md5_ctx, yylval.str, strlen(yylval.str));
    update_md5();
    BEGIN(INITIAL);
    if (!dot_flag) return Cstring;
    /* a dot is pending: park the string and return the dot first */
    backup_token = Cstring;
    backup_lval = yylval;
    backup_lloc = yylloc;
    RETURN_SAVED_DOT;
  }

  . { /* any other character is taken over as it is */
    yylval.str = mputc(yylval.str, *yytext);
    ++current_column;
  }

} /* SC_cstring scope */
849
850 /* Macros */
851
852"%moduleId" {
853 yylval.macrotype = Value::MACRO_MODULEID;
854 RETURN_LVAL(MacroValue);
855}
856"%fileName" {
857 yylval.macrotype = Value::MACRO_FILENAME;
858 RETURN_LVAL(MacroValue);
859}
860"%lineNumber" {
861 yylval.macrotype = Value::MACRO_LINENUMBER;
862 RETURN_LVAL(MacroValue);
863}
864"%definitionId" {
865 yylval.macrotype = Value::MACRO_DEFINITIONID;
866 RETURN_LVAL(MacroValue);
867}
868"%testcaseId" {
869 yylval.macrotype = Value::MACRO_TESTCASEID;
870 RETURN_LVAL(MacroValue);
871}
872"%"{IDENTIFIER} {
873 fill_location();
874 Location loc(infile, yylloc);
875 loc.error("Invalid macro notation: `%s'", yytext);
876 RETURN_NOLOCUPD(TOK_errval);
877}
878
879"__MODULE__" {
880 yylval.macrotype = Value::MACRO_MODULEID;
881 RETURN_LVAL(MacroValue);
882}
883"__FILE__" {
884 yylval.macrotype = Value::MACRO_FILEPATH;
885 RETURN_LVAL(MacroValue);
886}
887"__BFILE__" {
888 yylval.macrotype = Value::MACRO_BFILENAME;
889 RETURN_LVAL(MacroValue);
890}
891"__LINE__" {
892 yylval.macrotype = Value::MACRO_LINENUMBER_C;
893 RETURN_LVAL(MacroValue);
894}
895"__SCOPE__" {
896 yylval.macrotype = Value::MACRO_SCOPE;
897 RETURN_LVAL(MacroValue);
898}
899"__TESTCASE__" {
900 yylval.macrotype = Value::MACRO_TESTCASEID;
901 RETURN_LVAL(MacroValue);
902}
903"__"{IDENTIFIER}"__" {
904 fill_location();
905 Location loc(infile, yylloc);
906 loc.error("Invalid macro notation: `%s'", yytext);
907 RETURN_NOLOCUPD(TOK_errval);
908}
909
910 /* Multi-character operators */
911
912":=" RETURN(AssignmentChar);
913"\.\." RETURN(DotDot);
914"->" RETURN(PortRedirectSymbol);
915"==" RETURN(EQ);
916"!=" RETURN(NE);
917">=" RETURN(GE);
918"<=" RETURN(LE);
919"<<" RETURN(SL);
920">>" RETURN(SR);
921"<@" RETURN(RL);
922"@>" RETURN(_RR);
923
924"++" |
925"--" {
926 fill_location();
927 Location loc(infile, yylloc);
928 loc.error("Operator `%s' is reserved for future use", yytext);
929}
930
931 /* Invalid operators */
932
933"::=" {
934 fill_location();
935 Location loc(infile, yylloc);
936 loc.error("`::=' is not a valid assignment operator in TTCN-3. Did you mean "
937 "`:='?");
938 RETURN_NOLOCUPD(AssignmentChar);
939}
940
941"=" {
942 fill_location();
943 Location loc(infile, yylloc);
944 loc.error("A single `=' character cannot be used in TTCN-3. Did you mean "
945 "the assignment sign `:=' or the equality operator `=='?");
946 /* the former is more probable than the latter */
947 RETURN_NOLOCUPD(AssignmentChar);
948}
949
950"<>" {
951 fill_location();
952 Location loc(infile, yylloc);
953 loc.error("`<>' is not a valid comparison operator in TTCN-3. Did you mean "
954 "`!='?");
955 RETURN_NOLOCUPD(NE);
956}
957
958 /* Identifiers */
959
960{IDENTIFIER} {
961 yylval.id = new Identifier(Identifier::ID_TTCN, string(yyleng, yytext));
962 RETURN_LVAL(IDentifier);
963}
964
965 /* Single character tokens (brackets, operators, etc.) */
966
\. {
  update_md5();
  if (!dot_flag) {
    /* first dot: only remember its position and keep scanning, the next
     * token decides what gets returned */
    dot_flag = true;
    dot_line = current_line;
    dot_column = current_column;
    current_column++;
  } else {
    /* second dot in a row: park this one in the backup ... */
    backup_token = '.';
    backup_lloc.first_line = backup_lloc.last_line = current_line;
    backup_lloc.first_column = current_column;
    backup_lloc.last_column = ++current_column;
    /* ... and return the dot that was found previously */
    RETURN_SAVED_DOT;
  }
}
986
987[()\[\]{}+\-\*/&:;,<>\?!] RETURN(*yytext);
988
989 /* Invalid characters */
990
. {
  /* Catch-all: report the character and go on scanning; no token is
   * returned. Non-printable characters are shown as '?'. */
  fill_location();
  const int ch = (unsigned char)*yytext;
  Location loc(infile, yylloc);
  loc.error("Character `%c' (0x%02X) is not used in TTCN-3",
    isprint(ch) ? ch : '?', ch);
}
998
999 /* EOF rule */
1000
<*><<EOF>> {
  const int open_scope = YY_START;
  if (open_scope != INITIAL) {
    /* the input ended inside a start condition: complain about the
     * construct that was left open and release what it had collected */
    Location loc(infile, start_line, start_column, current_line,
      current_column);
    if (open_scope == SC_blockcomment) {
      loc.error("Unterminated block comment");
    } else if (open_scope == SC_binstring ||
               open_scope == SC_binstring_bad) {
      /* binstr is released here only in the SC_binstring state */
      if (open_scope == SC_binstring) Free(binstr);
      loc.error("Unterminated binary string literal");
    } else if (open_scope == SC_cstring) {
      Free(yylval.str);
      loc.error("Unterminated character string literal");
    }
    BEGIN(INITIAL);
  }
  if (dot_flag) {
    /* a dot is still pending: deliver it before signalling the end */
    dot_flag = false;
    RETURN_SAVED_DOT;
  }
  yylloc.first_line = yylloc.last_line = current_line;
  yylloc.first_column = current_column;
  yylloc.last_column = current_column + 1;
  return EOF;
}
1032
1033%%
1034
1035void init_ttcn3_lex()
1036{
1037 dot_flag = false;
1038 current_line = 1;
1039 current_column = 0;
1040 real_infile = infile;
1041 real_lineno_offset = 0;
1042 MD5_Init(&md5_ctx);
1043}
1044
1045void init_erroneous_lex(const char* p_infile, int p_line, int p_column)
1046{
1047 infile = p_infile;
1048 current_line = p_line;
1049 current_column = p_column;
1050 real_infile = infile;
1051 real_lineno_offset = 0;
1052 dot_flag = false;
1053}
1054
1055void free_dot_flag_stuff()
1056{
1057 if (dot_flag) {
1058 dot_flag = false;
1059 /* clean up the semantic value of the token that was backed up */
1060 switch (backup_token) {
1061 case IDentifier:
1062 delete backup_lval.id;
1063 break;
1064 case Bstring:
1065 case Hstring:
1066 case Ostring:
1067 case BitStringMatch:
1068 case HexStringMatch:
1069 case OctetStringMatch:
1070 delete backup_lval.string_val;
1071 break;
1072 case Cstring:
1073 Free(backup_lval.str);
1074 default:
1075 break;
1076 }
1077 }
1078}
1079
1080void free_ttcn3_lex()
1081{
1082 free_dot_flag_stuff();
1083 fclose(ttcn3_in);
1084 ttcn3_lex_destroy();
1085}
1086
1087/* called from ttcn3_parse_file to finalize MD5 and add it to the module */
1088void set_md5_checksum(Ttcn::Module *m)
1089{
1090 unsigned char md5_sum[MD5_DIGEST_LENGTH];
1091 MD5_Final(md5_sum, &md5_ctx);
1092 m->set_checksum(sizeof(md5_sum), md5_sum);
1093}
This page took 0.06457 seconds and 5 git commands to generate.