blob: baaef5cadf645794f3f40d91344af0790133f224 [file] [log] [blame]
/**
 * Copyright (c) 2006- Facebook
 * Distributed under the Thrift Software License
 *
 * See accompanying file LICENSE or visit the Thrift site at:
 * http://developers.facebook.com/thrift/
 */
8
/**
 * Thrift scanner.
 *
 * Tokenizes a Thrift definition file.
 * @author Mark Slee <mcslee@facebook.com>
 */
Mark Sleef5377b32006-10-10 01:42:59 +000015
Mark Slee31985722006-05-24 21:45:31 +000016%{
17
#include <errno.h>
#include <limits.h>
#include <stdlib.h>

#include "main.h"
#include "globals.h"
#include "parse/t_program.h"

/**
 * Must be included AFTER parse/t_program.h, but I can't remember why anymore
 * because I wrote this a while ago.
 */
#include "thrifty.h"
Mark Slee31985722006-05-24 21:45:31 +000027
/**
 * Reports that a scanned word is a reserved language keyword and stops.
 *
 * The message is emitted through yyerror() and the process then terminates
 * with exit status 1, so this function does not return to the scanner.
 *
 * @param keyword The offending word as matched by the scanner.
 */
void thrift_reserved_keyword(char* keyword) {
  yyerror("Cannot use reserved language keyword: \"%s\"\n", keyword);
  exit(1);
}
32
Mark Slee31985722006-05-24 21:45:31 +000033%}
34
/**
 * Run the scanner generator in lex-compatibility mode. Among other things
 * this provides the yylineno global, which is useful for debugging output.
 */
%option lex-compat
Mark Slee31985722006-05-24 21:45:31 +000039
/**
 * Helper definitions, comments, constants, and whatnot
 *
 * Each name below is a pattern fragment referenced from the rules section.
 */

intconstant   ([+-]?[0-9]+)
hexconstant   ("0x"[0-9A-Fa-f]+)
/**
 * A double needs at least one mantissa digit: either digits with an optional
 * fraction, or a bare fraction. Without that requirement the pattern also
 * matched a lone sign or a bare exponent such as e5, and because the
 * dubconstant rule comes before the identifier rule those inputs were
 * tokenized as double constants instead of identifiers.
 */
dubconstant   ([+-]?([0-9]+(\.[0-9]+)?|\.[0-9]+)([eE][+-]?[0-9]+)?)
identifier    ([a-zA-Z_][\.a-zA-Z_0-9]*)
whitespace    ([ \t\r\n]*)
sillycomm     ("/*""*"*"*/")
multicomm     ("/*"[^*]"/"*([^*/]|[^*]"/"|"*"[^/])*"*"*"*/")
doctext       ("/**"([^*/]|[^*]"/"|"*"[^/])*"*"*"*/")
comment       ("//"[^\n]*)
unixcomment   ("#"[^\n]*)
symbol        ([:;\,\{\}\(\)\=<>\[\]])
dliteral      ("\""[^"]*"\"")
sliteral      ("'"[^']*"'")
57
Mark Slee31985722006-05-24 21:45:31 +000058
59%%
60
{whitespace}   |
{sillycomm}    |
{multicomm}    |
{comment}      |
{unixcomment}  { /* Whitespace and ordinary comments yield no token: do nothing. */ }
Mark Slee31985722006-05-24 21:45:31 +000066
{symbol}       { /* A punctuation character is its own token value. */ return *yytext; }
68
"namespace"        { /* Header directive keywords; each maps to its own token. */
                     return tok_namespace; }
"cpp_namespace"    { return tok_cpp_namespace;  }
"cpp_include"      { return tok_cpp_include;    }
"cpp_type"         { return tok_cpp_type;       }
"java_package"     { return tok_java_package;   }
"cocoa_prefix"     { return tok_cocoa_prefix;   }
"php_namespace"    { return tok_php_namespace;  }
"py_module"        { return tok_py_module;      }
"perl_package"     { return tok_perl_package;   }
"ruby_namespace"   { return tok_ruby_namespace; }
"xsd_all"          { return tok_xsd_all;        }
"xsd_optional"     { return tok_xsd_optional;   }
"xsd_nillable"     { return tok_xsd_nillable;   }
"xsd_namespace"    { return tok_xsd_namespace;  }
"xsd_attrs"        { return tok_xsd_attrs;      }
"include"          { return tok_include;        }
Mark Sleef0712dc2006-10-25 19:03:57 +000085
"void"         { /* Type and definition keywords; each maps to its own token. */
                 return tok_void; }
"bool"         { return tok_bool;     }
"byte"         { return tok_byte;     }
"i16"          { return tok_i16;      }
"i32"          { return tok_i32;      }
"i64"          { return tok_i64;      }
"double"       { return tok_double;   }
"string"       { return tok_string;   }
"binary"       { return tok_binary;   }
"slist"        { return tok_slist;    }
"senum"        { return tok_senum;    }
"map"          { return tok_map;      }
"list"         { return tok_list;     }
"set"          { return tok_set;      }
"async"        { return tok_async;    }
"typedef"      { return tok_typedef;  }
"struct"       { return tok_struct;   }
"exception"    { /* Note the token name drops the leading "e". */
                 return tok_xception; }
"extends"      { return tok_extends;  }
"throws"       { return tok_throws;   }
"service"      { return tok_service;  }
"enum"         { return tok_enum;     }
"const"        { return tok_const;    }
"required"     { return tok_required; }
"optional"     { return tok_optional; }
Mark Slee52f643d2006-08-09 00:03:43 +0000111
"abstract"       |
"and"            |
"as"             |
"assert"         |
"break"          |
"case"           |
"class"          |
"continue"       |
"declare"        |
"def"            |
"default"        |
"del"            |
"delete"         |
"do"             |
"elif"           |
"else"           |
"elseif"         |
"except"         |
"exec"           |
"false"          |
"final"          |
"finally"        |
"float"          |
"for"            |
"foreach"        |
"function"       |
"global"         |
"goto"           |
"if"             |
"implements"     |
"import"         |
"in"             |
"inline"         |
"instanceof"     |
"interface"      |
"is"             |
"lambda"         |
"native"         |
"new"            |
"not"            |
"or"             |
"pass"           |
"public"         |
"print"          |
"private"        |
"protected"      |
"raise"          |
"return"         |
"sizeof"         |
"static"         |
"switch"         |
"synchronized"   |
"this"           |
"throw"          |
"transient"      |
"true"           |
"try"            |
"unsigned"       |
"var"            |
"virtual"        |
"volatile"       |
"while"          |
"with"           |
"union"          |
"yield"          {
  /* Every word in the chain above shares this action: it is rejected as a
     reserved language keyword. The call reports the error and exits. */
  thrift_reserved_keyword(yytext);
}
177
{intconstant} {
  /* Decimal integer constant, optionally signed.
     atoi() has undefined behavior when the value does not fit in an int, so
     parse with strtol() and reject out-of-range literals explicitly. The
     accepted range is kept at that of int, which is what atoi() returned. */
  errno = 0;
  long parsed = strtol(yytext, NULL, 10);
  if (errno == ERANGE || parsed < INT_MIN || parsed > INT_MAX) {
    yyerror("Integer constant out of range: \"%s\"\n", yytext);
    exit(1);
  }
  yylval.iconst = (int)parsed;
  return tok_int_constant;
}
Mark Sleef5377b32006-10-10 01:42:59 +0000182
{hexconstant} {
  /* Hexadecimal integer constant. The first two characters are the "0x"
     prefix, so conversion starts after them.
     The previous sscanf("%x") call ignored conversion failure and overflow.
     strtoul() reports overflow through errno, and anything wider than an
     unsigned int is rejected, matching what %x could store.
     NOTE(review): assumes yylval.iconst is int-sized, as the original %x
     conversion implied - confirm against the %union declaration. */
  errno = 0;
  unsigned long parsed = strtoul(yytext + 2, NULL, 16);
  if (errno == ERANGE || parsed > UINT_MAX) {
    yyerror("Hex constant out of range: \"%s\"\n", yytext);
    exit(1);
  }
  /* Keep the same bit pattern that %x stored (e.g. 0xFFFFFFFF becomes -1). */
  yylval.iconst = (int)(unsigned int)parsed;
  return tok_int_constant;
}
187
{dubconstant} {
  /* Floating-point constant: convert the matched text and hand it to the
     parser through the dconst member of yylval. */
  double parsed = strtod(yytext, NULL);
  yylval.dconst = parsed;
  return tok_dub_constant;
}
192
{identifier} {
  /* The scanner reuses yytext for the next match, so the parser is given
     its own heap copy of the identifier text. */
  char* name_copy = strdup(yytext);
  yylval.id = name_copy;
  return tok_identifier;
}
197
{dliteral} |
{sliteral} {
  /* Double- and single-quoted literals share one action: copy everything
     after the opening quote, then overwrite the closing quote (the last
     character of the copy) with the terminator. */
  char* unquoted = strdup(yytext + 1);
  unquoted[strlen(unquoted) - 1] = '\0';
  yylval.id = unquoted;
  return tok_literal;
}
Mark Slee31985722006-05-24 21:45:31 +0000209
{doctext} {
  /* A doc comment produces no token and never appears in the parse tree;
     the parser instead picks the text up from the g_doctext global.
     It is only recorded while g_parse_mode is PROGRAM. */
  if (g_parse_mode == PROGRAM) {
    clear_doctext();

    /* Copy the comment without its three-character opener ... */
    g_doctext = strdup(yytext + 3);

    /* ... and cut off the two-character closer at the end. */
    size_t copied_len = strlen(g_doctext);
    g_doctext[copied_len - 2] = '\0';

    g_doctext = clean_up_doctext(g_doctext);
    g_doctext_lineno = yylineno;
  }
}
221
222
Mark Slee31985722006-05-24 21:45:31 +0000223%%