blob: 60a7f2c7846f5894fca94bc643fd4e7f7853ab8e [file] [log] [blame]
Mark Slee31985722006-05-24 21:45:31 +00001/**
Mark Sleee9ce01c2007-05-16 02:29:53 +00002 * Copyright (c) 2006- Facebook
3 * Distributed under the Thrift Software License
4 *
5 * See accompanying file LICENSE or visit the Thrift site at:
6 * http://developers.facebook.com/thrift/
7 */
8
9/**
Mark Slee31985722006-05-24 21:45:31 +000010 * Thrift scanner.
Mark Slee27ed6ec2007-08-16 01:26:31 +000011 *
Mark Slee31985722006-05-24 21:45:31 +000012 * Tokenizes a thrift definition file.
Mark Slee31985722006-05-24 21:45:31 +000013 */
Mark Sleef5377b32006-10-10 01:42:59 +000014
Mark Slee31985722006-05-24 21:45:31 +000015%{
16
David Reissf1454162008-06-30 20:45:47 +000017#include <errno.h>
18
Mark Slee31985722006-05-24 21:45:31 +000019#include "main.h"
David Reisscbd4bac2007-08-14 17:12:33 +000020#include "globals.h"
Mark Slee31985722006-05-24 21:45:31 +000021#include "parse/t_program.h"
22
/**
 * thrifty.h must be included AFTER parse/t_program.h. The reason was never
 * written down; presumably thrifty.h refers to types that t_program.h
 * declares (TODO: confirm before reordering these includes).
 */
Mark Sleeeb0d0242007-01-25 07:58:55 +000027#include "thrifty.h"
Mark Slee31985722006-05-24 21:45:31 +000028
/**
 * Reports, through yyerror(), that the scanned text is a reserved language
 * keyword, then terminates the process with exit status 1.
 *
 * @param keyword The offending text, quoted in the error message.
 */
void thrift_reserved_keyword(char* keyword) {
  yyerror("Cannot use reserved language keyword: \"%s\"\n", keyword);
  exit(1);
}
33
/**
 * Reports, through yyerror(), that an integer literal is too large, then
 * terminates the process with exit status 1.
 *
 * @param text The literal exactly as it appeared in the input, quoted in the
 *             error message.
 */
void integer_overflow(char* text) {
  yyerror("This integer is too big: \"%s\"\n", text);
  exit(1);
}
38
Mark Slee31985722006-05-24 21:45:31 +000039%}
40
Mark Sleef5377b32006-10-10 01:42:59 +000041/**
42 * Provides the yylineno global, useful for debugging output
43 */
Mark Slee27ed6ec2007-08-16 01:26:31 +000044%option lex-compat
Mark Slee31985722006-05-24 21:45:31 +000045
Mark Slee27ed6ec2007-08-16 01:26:31 +000046/**
Mark Sleef5377b32006-10-10 01:42:59 +000047 * Helper definitions, comments, constants, and whatnot
48 */
49
/* Decimal integer with an optional leading sign. */
intconstant    ([+-]?[0-9]+)
/* Hexadecimal integer: 0x followed by at least one hex digit; no sign. */
hexconstant    ("0x"[0-9A-Fa-f]+)
/* Floating point: optional sign, digits, fraction and exponent (each part optional). */
dubconstant    ([+-]?[0-9]*(\.[0-9]+)?([eE][+-]?[0-9]+)?)
/* Letter or underscore, then letters, digits, underscores or dots. */
identifier     ([a-zA-Z_][\.a-zA-Z_0-9]*)
/* Any run (possibly empty) of spaces, tabs, carriage returns and newlines. */
whitespace     ([ \t\r\n]*)
/* Block comment whose body is nothing but asterisks (or is empty). */
sillycomm      ("/*""*"*"*/")
/* Block comment whose first body character is not an asterisk. */
multicomm      ("/*"[^*]"/"*([^*/]|[^*]"/"|"*"[^/])*"*"*"*/")
/* Block comment opened by a slash and two asterisks. */
doctext        ("/**"([^*/]|[^*]"/"|"*"[^/])*"*"*"*/")
/* Double-slash comment running to the end of the line. */
comment        ("//"[^\n]*)
/* Hash comment running to the end of the line. */
unixcomment    ("#"[^\n]*)
/* One punctuation character: colon, semicolon, comma, braces, parens, equals, angle or square brackets. */
symbol         ([:;\,\{\}\(\)\=<>\[\]])
/* Double-quoted text containing no double quote. */
dliteral       ("\""[^"]*"\"")
/* Single-quoted text containing no single quote. */
sliteral       ("'"[^']*"'")
/* Letter or hyphen, then letters, digits, underscores, dots or hyphens. */
st_identifier  ([a-zA-Z-][\.a-zA-Z_0-9-]*)
ccheeverf53b5cf2007-02-05 20:33:11 +000064
Mark Slee31985722006-05-24 21:45:31 +000065
66%%
67
{whitespace}   |
{sillycomm}    |
{multicomm}    |
{comment}      |
{unixcomment}  { /* whitespace and these comment forms produce no token */ }
Mark Slee31985722006-05-24 21:45:31 +000073
{symbol} {
  /* The matched punctuation character itself is returned as the token code. */
  return yytext[0];
}
Mark Slee9cb7c612006-09-01 22:17:45 +000075
"namespace"           { return tok_namespace;          }
"cpp_namespace"       { return tok_cpp_namespace;      }
"cpp_include"         { return tok_cpp_include;        }
"cpp_type"            { return tok_cpp_type;           }
"java_package"        { return tok_java_package;       }
"cocoa_prefix"        { return tok_cocoa_prefix;       }
"csharp_namespace"    { return tok_csharp_namespace;   }
"php_namespace"       { return tok_php_namespace;      }
"py_module"           { return tok_py_module;          }
"perl_package"        { return tok_perl_package;       }
"ruby_namespace"      { return tok_ruby_namespace;     }
"smalltalk_category"  { return tok_smalltalk_category; }
"smalltalk_prefix"    { return tok_smalltalk_prefix;   }

  /* xsd_* keywords */
"xsd_all"             { return tok_xsd_all;            }
"xsd_optional"        { return tok_xsd_optional;       }
"xsd_nillable"        { return tok_xsd_nillable;       }
"xsd_namespace"       { return tok_xsd_namespace;      }
"xsd_attrs"           { return tok_xsd_attrs;          }

"include"             { return tok_include;            }

  /* type names */
"void"                { return tok_void;               }
"bool"                { return tok_bool;               }
"byte"                { return tok_byte;               }
"i16"                 { return tok_i16;                }
"i32"                 { return tok_i32;                }
"i64"                 { return tok_i64;                }
"double"              { return tok_double;             }
"string"              { return tok_string;             }
"binary"              { return tok_binary;             }
"slist"               { return tok_slist;              }
"senum"               { return tok_senum;              }
"map"                 { return tok_map;                }
"list"                { return tok_list;               }
"set"                 { return tok_set;                }

  /* Note: the source spelling "async" yields the token named tok_oneway. */
"async"               { return tok_oneway;             }
"typedef"             { return tok_typedef;            }
"struct"              { return tok_struct;             }
"exception"           { return tok_xception;           }
"extends"             { return tok_extends;            }
"throws"              { return tok_throws;             }
"service"             { return tok_service;            }
"enum"                { return tok_enum;               }
"const"               { return tok_const;              }
"required"            { return tok_required;           }
"optional"            { return tok_optional;           }
Mark Sleef0712dc2006-10-25 19:03:57 +0000120
Mark Slee52f643d2006-08-09 00:03:43 +0000121
"abstract"      |
"and"           |
"args"          |
"as"            |
"assert"        |
"break"         |
"case"          |
"class"         |
"continue"      |
"declare"       |
"def"           |
"default"       |
"del"           |
"delete"        |
"do"            |
"elif"          |
"else"          |
"elseif"        |
"except"        |
"exec"          |
"false"         |
"finally"       |
"float"         |
"for"           |
"foreach"       |
"function"      |
"global"        |
"goto"          |
"if"            |
"implements"    |
"import"        |
"in"            |
"inline"        |
"instanceof"    |
"interface"     |
"is"            |
"lambda"        |
"native"        |
"new"           |
"not"           |
"or"            |
"pass"          |
"public"        |
"print"         |
"private"       |
"protected"     |
"raise"         |
"return"        |
"sizeof"        |
"static"        |
"switch"        |
"synchronized"  |
"this"          |
"throw"         |
"transient"     |
"true"          |
"try"           |
"unsigned"      |
"var"           |
"virtual"       |
"volatile"      |
"while"         |
"with"          |
"union"         |
"yield"         {
  /*
   * Every word above shares this one action (the `|` action means "same as
   * the next rule"): the word is rejected as a reserved keyword, which
   * reports the error and exits.
   */
  thrift_reserved_keyword(yytext);
}
Mark Sleef12865a2007-01-12 00:23:26 +0000187
{intconstant} {
  /*
   * strtoll() reports an out-of-range value only through errno, so errno is
   * cleared first and inspected afterwards.
   */
  errno = 0;
  long long parsed = strtoll(yytext, NULL, 10);
  yylval.iconst = parsed;
  if (errno == ERANGE) {
    integer_overflow(yytext);
  }
  return tok_int_constant;
}
Mark Sleef5377b32006-10-10 01:42:59 +0000196
{hexconstant} {
  /* Step over the two-character "0x" prefix and parse the rest as base 16. */
  const char* hex_digits = yytext + 2;

  /* Clear errno first: it is the only overflow signal strtoll() gives. */
  errno = 0;
  yylval.iconst = strtoll(hex_digits, NULL, 16);
  if (errno == ERANGE) {
    /* Report the literal as written, prefix included. */
    integer_overflow(yytext);
  }
  return tok_int_constant;
}
205
{dubconstant} {
  /*
   * Floating-point literal. This rule is listed after the integer rules, so
   * text that both match at the same length is scanned as an integer.
   *
   * strtod() is used instead of atof(): the two agree for representable
   * values, but atof() has undefined behavior when the value is out of
   * range, whereas strtod() is defined to return +/-HUGE_VAL on overflow.
   * As with atof(), no end pointer is requested.
   */
  yylval.dconst = strtod(yytext, NULL);
  return tok_dub_constant;
}
210
{identifier} {
  /* Pass the parser a strdup() copy of the matched text as the token value. */
  yylval.id = strdup(yytext);
  return tok_identifier;
}
215
{st_identifier} {
  /*
   * Hyphen-tolerant identifier form. The token value is a strdup() copy of
   * the matched text.
   */
  yylval.id = strdup(yytext);
  return tok_st_identifier;
}
220
{dliteral} {
  /*
   * Double-quoted literal. Copy from just past the opening quote, then
   * overwrite the copy's last character (the closing quote) with the
   * terminator so only the quoted contents remain.
   */
  char* contents = strdup(yytext + 1);
  contents[strlen(contents) - 1] = '\0';
  yylval.id = contents;
  return tok_literal;
}
226
{sliteral} {
  /*
   * Single-quoted literal. Copy from just past the opening quote, then
   * overwrite the copy's last character (the closing quote) with the
   * terminator so only the quoted contents remain.
   */
  char* contents = strdup(yytext + 1);
  contents[strlen(contents) - 1] = '\0';
  yylval.id = contents;
  return tok_literal;
}
Mark Slee31985722006-05-24 21:45:31 +0000232
{doctext} {
  /*
   * A doc comment yields no token and never appears in the parse tree; it is
   * stored in the g_doctext global for the parser to pick up. Outside
   * PROGRAM parse mode the comment is simply discarded.
   */
  if (g_parse_mode == PROGRAM) {
    /* Reset any previously stored doc text before replacing it. */
    clear_doctext();

    /* Copy the text after the three-character opener ... */
    g_doctext = strdup(yytext + 3);
    /* ... and cut off the two-character closer at the end of the copy. */
    g_doctext[strlen(g_doctext) - 2] = '\0';

    g_doctext = clean_up_doctext(g_doctext);

    /* Record the scanner's current line number alongside the text. */
    g_doctext_lineno = yylineno;
  }
}
244
245
Mark Slee31985722006-05-24 21:45:31 +0000246%%