| Mark Slee | 3198572 | 2006-05-24 21:45:31 +0000 | [diff] [blame] | 1 | /** | 
| Mark Slee | e9ce01c | 2007-05-16 02:29:53 +0000 | [diff] [blame] | 2 | * Copyright (c) 2006- Facebook | 
|  | 3 | * Distributed under the Thrift Software License | 
|  | 4 | * | 
|  | 5 | * See accompanying file LICENSE or visit the Thrift site at: | 
|  | 6 | * http://developers.facebook.com/thrift/ | 
|  | 7 | */ | 
|  | 8 |  | 
|  | 9 | /** | 
| Mark Slee | 3198572 | 2006-05-24 21:45:31 +0000 | [diff] [blame] | 10 | * Thrift scanner. | 
|  | 11 | * | 
|  | 12 | * Tokenizes a thrift definition file. | 
|  | 13 | * @author Mark Slee <mcslee@facebook.com> | 
|  | 14 | */ | 
| Mark Slee | f5377b3 | 2006-10-10 01:42:59 +0000 | [diff] [blame] | 15 |  | 
| Mark Slee | 3198572 | 2006-05-24 21:45:31 +0000 | [diff] [blame] | 16 | %{ | 
|  | 17 |  | 
|  | 18 | #include "main.h" | 
|  | 19 | #include "parse/t_program.h" | 
|  | 20 |  | 
| Mark Slee | f5377b3 | 2006-10-10 01:42:59 +0000 | [diff] [blame] | 21 | /** | 
|  | 22 | * Must be included AFTER parse/t_program.h, but I can't remember why anymore | 
|  | 23 | * because I wrote this a while ago. | 
|  | 24 | */ | 
| Mark Slee | eb0d024 | 2007-01-25 07:58:55 +0000 | [diff] [blame] | 25 | #include "thrifty.h" | 
| Mark Slee | 3198572 | 2006-05-24 21:45:31 +0000 | [diff] [blame] | 26 |  | 
| Mark Slee | f12865a | 2007-01-12 00:23:26 +0000 | [diff] [blame] | 27 | void thrift_reserved_keyword(char* keyword) { | 
|  | 28 | yyerror("Cannot use reserved language keyword: \"%s\"\n", keyword); | 
|  | 29 | exit(1); | 
|  | 30 | } | 
|  | 31 |  | 
| Mark Slee | 3198572 | 2006-05-24 21:45:31 +0000 | [diff] [blame] | 32 | %} | 
|  | 33 |  | 
| Mark Slee | f5377b3 | 2006-10-10 01:42:59 +0000 | [diff] [blame] | 34 | /** | 
|  | 35 | * Provides the yylineno global, useful for debugging output | 
|  | 36 | */ | 
| Mark Slee | 3198572 | 2006-05-24 21:45:31 +0000 | [diff] [blame] | 37 | %option lex-compat | 
|  | 38 |  | 
| Mark Slee | f5377b3 | 2006-10-10 01:42:59 +0000 | [diff] [blame] | 39 | /** | 
|  | 40 | * Helper definitions, comments, constants, and whatnot | 
|  | 41 | */ | 
|  | 42 |  | 
| Mark Slee | 3015287 | 2006-11-28 01:24:07 +0000 | [diff] [blame] | 43 | intconstant  ([+-]?[0-9]+) | 
| Mark Slee | 600cdb3 | 2006-11-29 22:06:42 +0000 | [diff] [blame] | 44 | hexconstant  ("0x"[0-9A-Fa-f]+) | 
| Mark Slee | 3015287 | 2006-11-28 01:24:07 +0000 | [diff] [blame] | 45 | dubconstant  ([+-]?[0-9]*(\.[0-9]+)?([eE][+-]?[0-9]+)?) | 
| Mark Slee | 9cb7c61 | 2006-09-01 22:17:45 +0000 | [diff] [blame] | 46 | identifier   ([a-zA-Z_][\.a-zA-Z_0-9]*) | 
| Mark Slee | 3198572 | 2006-05-24 21:45:31 +0000 | [diff] [blame] | 47 | whitespace   ([ \t\r\n]*) | 
|  | 48 | multicomm    ("/*""/"*([^*/]|[^*]"/"|"*"[^/])*"*"*"*/") | 
|  | 49 | comment      ("//"[^\n]*) | 
| Mark Slee | c98d050 | 2006-09-06 02:42:25 +0000 | [diff] [blame] | 50 | unixcomment  ("#"[^\n]*) | 
| ccheever | f53b5cf | 2007-02-05 20:33:11 +0000 | [diff] [blame] | 51 | doctext      ("["(("["[^\]\[]*"]")|[^\]\[])*"]") /* allows one level of nesting */ | 
| Mark Slee | ae2bc3c | 2006-11-08 23:44:59 +0000 | [diff] [blame] | 52 | symbol       ([:;\,\{\}\(\)\=<>\[\]]) | 
| ccheever | f53b5cf | 2007-02-05 20:33:11 +0000 | [diff] [blame] | 53 | dliteral     ("\""[^"]*"\"") | 
|  | 54 | sliteral     ("'"[^']*"'") | 
|  | 55 |  | 
| Mark Slee | 3198572 | 2006-05-24 21:45:31 +0000 | [diff] [blame] | 56 |  | 
|  | 57 | %% | 
|  | 58 |  | 
|  | 59 | {whitespace}  { /* do nothing */ } | 
|  | 60 | {multicomm}   { /* do nothing */ } | 
|  | 61 | {comment}     { /* do nothing */ } | 
| Mark Slee | c98d050 | 2006-09-06 02:42:25 +0000 | [diff] [blame] | 62 | {unixcomment} { /* do nothing */ } | 
| Mark Slee | 3198572 | 2006-05-24 21:45:31 +0000 | [diff] [blame] | 63 |  | 
| Mark Slee | 9cb7c61 | 2006-09-01 22:17:45 +0000 | [diff] [blame] | 64 | {symbol}      { return yytext[0]; } | 
|  | 65 |  | 
| Mark Slee | f0712dc | 2006-10-25 19:03:57 +0000 | [diff] [blame] | 66 | "namespace"     { return tok_namespace;     } | 
|  | 67 | "cpp_namespace" { return tok_cpp_namespace; } | 
|  | 68 | "cpp_include"   { return tok_cpp_include;   } | 
|  | 69 | "cpp_type"      { return tok_cpp_type;      } | 
|  | 70 | "java_package"  { return tok_java_package;  } | 
| Mark Slee | e888b37 | 2007-01-12 01:06:24 +0000 | [diff] [blame] | 71 | "php_namespace" { return tok_php_namespace; } | 
| Mark Slee | 782abbb | 2007-01-19 00:17:02 +0000 | [diff] [blame] | 72 | "xsd_all"       { return tok_xsd_all;       } | 
| Mark Slee | 36bfa2e | 2007-01-19 20:09:51 +0000 | [diff] [blame] | 73 | "xsd_optional"  { return tok_xsd_optional;  } | 
| Mark Slee | 7df0e2a | 2007-02-06 21:03:18 +0000 | [diff] [blame] | 74 | "xsd_nillable"  { return tok_xsd_nillable;  } | 
| Mark Slee | 0d9199e | 2007-01-31 02:08:30 +0000 | [diff] [blame] | 75 | "xsd_namespace" { return tok_xsd_namespace; } | 
| Mark Slee | 21135c3 | 2007-02-05 21:52:08 +0000 | [diff] [blame] | 76 | "xsd_attrs"     { return tok_xsd_attrs;     } | 
| Mark Slee | f0712dc | 2006-10-25 19:03:57 +0000 | [diff] [blame] | 77 | "include"       { return tok_include;       } | 
|  | 78 |  | 
|  | 79 | "void"          { return tok_void;          } | 
|  | 80 | "bool"          { return tok_bool;          } | 
|  | 81 | "byte"          { return tok_byte;          } | 
|  | 82 | "i16"           { return tok_i16;           } | 
|  | 83 | "i32"           { return tok_i32;           } | 
|  | 84 | "i64"           { return tok_i64;           } | 
|  | 85 | "double"        { return tok_double;        } | 
|  | 86 | "string"        { return tok_string;        } | 
| Mark Slee | 8d725a2 | 2007-04-13 01:57:12 +0000 | [diff] [blame] | 87 | "binary"        { return tok_binary;        } | 
| Mark Slee | b6200d8 | 2007-01-19 19:14:36 +0000 | [diff] [blame] | 88 | "slist"         { return tok_slist;         } | 
| Mark Slee | 6a47fed | 2007-02-07 02:40:59 +0000 | [diff] [blame] | 89 | "senum"         { return tok_senum;         } | 
| Mark Slee | f0712dc | 2006-10-25 19:03:57 +0000 | [diff] [blame] | 90 | "map"           { return tok_map;           } | 
|  | 91 | "list"          { return tok_list;          } | 
|  | 92 | "set"           { return tok_set;           } | 
|  | 93 | "async"         { return tok_async;         } | 
|  | 94 | "typedef"       { return tok_typedef;       } | 
|  | 95 | "struct"        { return tok_struct;        } | 
|  | 96 | "exception"     { return tok_xception;      } | 
|  | 97 | "extends"       { return tok_extends;       } | 
|  | 98 | "throws"        { return tok_throws;        } | 
|  | 99 | "service"       { return tok_service;       } | 
|  | 100 | "enum"          { return tok_enum;          } | 
| Mark Slee | 3015287 | 2006-11-28 01:24:07 +0000 | [diff] [blame] | 101 | "const"         { return tok_const;         } | 
| Mark Slee | 52f643d | 2006-08-09 00:03:43 +0000 | [diff] [blame] | 102 |  | 
| Mark Slee | f12865a | 2007-01-12 00:23:26 +0000 | [diff] [blame] | 103 | "abstract" { thrift_reserved_keyword(yytext); } | 
|  | 104 | "and" { thrift_reserved_keyword(yytext); } | 
|  | 105 | "as" { thrift_reserved_keyword(yytext); } | 
|  | 106 | "assert" { thrift_reserved_keyword(yytext); } | 
|  | 107 | "break" { thrift_reserved_keyword(yytext); } | 
|  | 108 | "case" { thrift_reserved_keyword(yytext); } | 
|  | 109 | "class" { thrift_reserved_keyword(yytext); } | 
|  | 110 | "continue" { thrift_reserved_keyword(yytext); } | 
|  | 111 | "declare" { thrift_reserved_keyword(yytext); } | 
|  | 112 | "def" { thrift_reserved_keyword(yytext); } | 
|  | 113 | "default" { thrift_reserved_keyword(yytext); } | 
|  | 114 | "del" { thrift_reserved_keyword(yytext); } | 
|  | 115 | "delete" { thrift_reserved_keyword(yytext); } | 
|  | 116 | "do" { thrift_reserved_keyword(yytext); } | 
|  | 117 | "elif" { thrift_reserved_keyword(yytext); } | 
|  | 118 | "else" { thrift_reserved_keyword(yytext); } | 
|  | 119 | "elseif" { thrift_reserved_keyword(yytext); } | 
|  | 120 | "except" { thrift_reserved_keyword(yytext); } | 
|  | 121 | "exec" { thrift_reserved_keyword(yytext); } | 
|  | 122 | "false" { thrift_reserved_keyword(yytext); } | 
|  | 123 | "final" { thrift_reserved_keyword(yytext); } | 
|  | 124 | "finally" { thrift_reserved_keyword(yytext); } | 
|  | 125 | "float" { thrift_reserved_keyword(yytext); } | 
|  | 126 | "for" { thrift_reserved_keyword(yytext); } | 
|  | 127 | "foreach" { thrift_reserved_keyword(yytext); } | 
|  | 128 | "function" { thrift_reserved_keyword(yytext); } | 
|  | 129 | "global" { thrift_reserved_keyword(yytext); } | 
|  | 130 | "goto" { thrift_reserved_keyword(yytext); } | 
|  | 131 | "if" { thrift_reserved_keyword(yytext); } | 
|  | 132 | "implements" { thrift_reserved_keyword(yytext); } | 
|  | 133 | "import" { thrift_reserved_keyword(yytext); } | 
|  | 134 | "in" { thrift_reserved_keyword(yytext); } | 
|  | 135 | "inline" { thrift_reserved_keyword(yytext); } | 
|  | 136 | "instanceof" { thrift_reserved_keyword(yytext); } | 
|  | 137 | "interface" { thrift_reserved_keyword(yytext); } | 
|  | 138 | "is" { thrift_reserved_keyword(yytext); } | 
|  | 139 | "lambda" { thrift_reserved_keyword(yytext); } | 
|  | 140 | "native" { thrift_reserved_keyword(yytext); } | 
|  | 141 | "new" { thrift_reserved_keyword(yytext); } | 
|  | 142 | "not" { thrift_reserved_keyword(yytext); } | 
|  | 143 | "or" { thrift_reserved_keyword(yytext); } | 
|  | 144 | "pass" { thrift_reserved_keyword(yytext); } | 
|  | 145 | "public" { thrift_reserved_keyword(yytext); } | 
|  | 146 | "print" { thrift_reserved_keyword(yytext); } | 
|  | 147 | "private" { thrift_reserved_keyword(yytext); } | 
|  | 148 | "protected" { thrift_reserved_keyword(yytext); } | 
|  | 149 | "raise" { thrift_reserved_keyword(yytext); } | 
|  | 150 | "return" { thrift_reserved_keyword(yytext); } | 
|  | 151 | "sizeof" { thrift_reserved_keyword(yytext); } | 
|  | 152 | "static" { thrift_reserved_keyword(yytext); } | 
|  | 153 | "switch" { thrift_reserved_keyword(yytext); } | 
|  | 154 | "synchronized" { thrift_reserved_keyword(yytext); } | 
|  | 155 | "this" { thrift_reserved_keyword(yytext); } | 
|  | 156 | "throw" { thrift_reserved_keyword(yytext); } | 
|  | 157 | "transient" { thrift_reserved_keyword(yytext); } | 
|  | 158 | "true" { thrift_reserved_keyword(yytext); } | 
|  | 159 | "try" { thrift_reserved_keyword(yytext); } | 
|  | 160 | "unsigned" { thrift_reserved_keyword(yytext); } | 
|  | 161 | "var" { thrift_reserved_keyword(yytext); } | 
|  | 162 | "virtual" { thrift_reserved_keyword(yytext); } | 
|  | 163 | "volatile" { thrift_reserved_keyword(yytext); } | 
|  | 164 | "while" { thrift_reserved_keyword(yytext); } | 
|  | 165 | "with" { thrift_reserved_keyword(yytext); } | 
|  | 166 | "union" { thrift_reserved_keyword(yytext); } | 
|  | 167 | "yield" { thrift_reserved_keyword(yytext); } | 
|  | 168 |  | 
| Mark Slee | 4f8da1d | 2006-10-12 02:47:27 +0000 | [diff] [blame] | 169 | {intconstant} { | 
|  | 170 | yylval.iconst = atoi(yytext); | 
|  | 171 | return tok_int_constant; | 
|  | 172 | } | 
| Mark Slee | f5377b3 | 2006-10-10 01:42:59 +0000 | [diff] [blame] | 173 |  | 
| Mark Slee | 600cdb3 | 2006-11-29 22:06:42 +0000 | [diff] [blame] | 174 | {hexconstant} { | 
|  | 175 | sscanf(yytext+2, "%x", &yylval.iconst); | 
| Mark Slee | 600cdb3 | 2006-11-29 22:06:42 +0000 | [diff] [blame] | 176 | return tok_int_constant; | 
|  | 177 | } | 
|  | 178 |  | 
| Mark Slee | 3015287 | 2006-11-28 01:24:07 +0000 | [diff] [blame] | 179 | {dubconstant} { | 
|  | 180 | yylval.dconst = atof(yytext); | 
|  | 181 | return tok_dub_constant; | 
|  | 182 | } | 
|  | 183 |  | 
| Mark Slee | 4f8da1d | 2006-10-12 02:47:27 +0000 | [diff] [blame] | 184 | {identifier} { | 
|  | 185 | yylval.id = strdup(yytext); | 
|  | 186 | return tok_identifier; | 
|  | 187 | } | 
|  | 188 |  | 
| Mark Slee | 3015287 | 2006-11-28 01:24:07 +0000 | [diff] [blame] | 189 | {dliteral} { | 
|  | 190 | yylval.id = strdup(yytext+1); | 
|  | 191 | yylval.id[strlen(yylval.id)-1] = '\0'; | 
|  | 192 | return tok_literal; | 
|  | 193 | } | 
|  | 194 |  | 
|  | 195 | {sliteral} { | 
| Mark Slee | f0712dc | 2006-10-25 19:03:57 +0000 | [diff] [blame] | 196 | yylval.id = strdup(yytext+1); | 
|  | 197 | yylval.id[strlen(yylval.id)-1] = '\0'; | 
|  | 198 | return tok_literal; | 
|  | 199 | } | 
| Mark Slee | 3198572 | 2006-05-24 21:45:31 +0000 | [diff] [blame] | 200 |  | 
| ccheever | f53b5cf | 2007-02-05 20:33:11 +0000 | [diff] [blame] | 201 | {doctext} { | 
|  | 202 | yylval.id = strdup(yytext + 1); | 
|  | 203 | yylval.id[strlen(yylval.id) - 1] = '\0'; | 
|  | 204 | return tok_doctext; | 
|  | 205 | } | 
|  | 206 |  | 
|  | 207 |  | 
| Mark Slee | 3198572 | 2006-05-24 21:45:31 +0000 | [diff] [blame] | 208 | %% |