blob: ed38b074774b94fa7f239902ebd5c97e0e571425 [file] [log] [blame]
Mark Sleee9ce01c2007-05-16 02:29:53 +00001// Copyright (c) 2006- Facebook
2// Distributed under the Thrift Software License
3//
4// See accompanying file LICENSE or visit the Thrift site at:
5// http://developers.facebook.com/thrift/
6
Mark Slee31985722006-05-24 21:45:31 +00007/**
8 * thrift - a lightweight cross-language rpc/serialization tool
9 *
10 * This file contains the main compiler engine for Thrift, which invokes the
11 * scanner/parser to build the thrift object tree. The interface generation
Mark Sleef5377b32006-10-10 01:42:59 +000012 * code for each language lives in a file by the language name under the
13 * generate/ folder, and all parse structures live in parse/
Mark Slee31985722006-05-24 21:45:31 +000014 *
15 * @author Mark Slee <mcslee@facebook.com>
16 */
17
18#include <stdlib.h>
19#include <stdio.h>
20#include <stdarg.h>
21#include <string>
Mark Sleef0712dc2006-10-25 19:03:57 +000022#include <sys/types.h>
23#include <sys/stat.h>
Mark Slee31985722006-05-24 21:45:31 +000024
Mark Sleef0712dc2006-10-25 19:03:57 +000025// Careful: must include globals first for extern definitions
Mark Slee31985722006-05-24 21:45:31 +000026#include "globals.h"
27
28#include "main.h"
29#include "parse/t_program.h"
Mark Sleef0712dc2006-10-25 19:03:57 +000030#include "parse/t_scope.h"
Mark Slee31985722006-05-24 21:45:31 +000031#include "generate/t_cpp_generator.h"
Mark Sleeb15a68b2006-06-07 06:46:24 +000032#include "generate/t_java_generator.h"
Mark Slee6e536442006-06-30 18:28:50 +000033#include "generate/t_php_generator.h"
Mark Sleefc89d392006-09-04 00:04:39 +000034#include "generate/t_py_generator.h"
Mark Slee6d7d5952007-01-27 01:44:22 +000035#include "generate/t_rb_generator.h"
Mark Slee0e0ff7e2007-01-18 22:59:59 +000036#include "generate/t_xsd_generator.h"
Mark Slee2c44d202007-05-16 02:18:07 +000037#include "generate/t_perl_generator.h"
iproctor9a41a0c2007-07-16 21:59:24 +000038#include "generate/t_ocaml_generator.h"
Christopher Piro2f5afce2007-06-29 07:17:33 +000039#include "generate/t_erl_generator.h"
iproctorff8eb922007-07-25 19:06:13 +000040#include "generate/t_hs_generator.h"
Mark Slee31985722006-05-24 21:45:31 +000041
42using namespace std;
43
Mark Sleef5377b32006-10-10 01:42:59 +000044/**
45 * Global program tree
46 */
Mark Slee31985722006-05-24 21:45:31 +000047t_program* g_program;
48
Mark Sleef5377b32006-10-10 01:42:59 +000049/**
Mark Sleef0712dc2006-10-25 19:03:57 +000050 * Global types
51 */
52
53t_type* g_type_void;
54t_type* g_type_string;
Mark Slee8d725a22007-04-13 01:57:12 +000055t_type* g_type_binary;
Mark Sleeb6200d82007-01-19 19:14:36 +000056t_type* g_type_slist;
Mark Sleef0712dc2006-10-25 19:03:57 +000057t_type* g_type_bool;
58t_type* g_type_byte;
59t_type* g_type_i16;
60t_type* g_type_i32;
61t_type* g_type_i64;
62t_type* g_type_double;
63
64/**
65 * Global scope
66 */
67t_scope* g_scope;
68
69/**
70 * Parent scope to also parse types
71 */
72t_scope* g_parent_scope;
73
74/**
75 * Prefix for putting types in parent scope
76 */
77string g_parent_prefix;
78
79/**
80 * Parsing pass
81 */
82PARSE_MODE g_parse_mode;
83
84/**
85 * Current directory of file being parsed
86 */
87string g_curdir;
88
89/**
90 * Current file being parsed
91 */
92string g_curpath;
93
94/**
Martin Kraemer32c66e12006-11-09 00:06:36 +000095 * Search path for inclusions
96 */
Mark Slee2329a832006-11-09 00:23:30 +000097vector<string> g_incl_searchpath;
Martin Kraemer32c66e12006-11-09 00:06:36 +000098
99/**
Mark Sleef5377b32006-10-10 01:42:59 +0000100 * Global debug state
101 */
Mark Slee31985722006-05-24 21:45:31 +0000102int g_debug = 0;
103
Mark Sleef5377b32006-10-10 01:42:59 +0000104/**
Mark Sleef0712dc2006-10-25 19:03:57 +0000105 * Warning level
106 */
107int g_warn = 1;
108
109/**
110 * Verbose output
111 */
112int g_verbose = 0;
113
114/**
Mark Sleef5377b32006-10-10 01:42:59 +0000115 * Global time string
116 */
Mark Slee31985722006-05-24 21:45:31 +0000117char* g_time_str;
118
Mark Slee31985722006-05-24 21:45:31 +0000119/**
Mark Sleef0712dc2006-10-25 19:03:57 +0000120 * Flags to control code generation
121 */
122bool gen_cpp = false;
123bool gen_java = false;
Mark Slee6d7d5952007-01-27 01:44:22 +0000124bool gen_rb = false;
Mark Sleef0712dc2006-10-25 19:03:57 +0000125bool gen_py = false;
Mark Slee0e0ff7e2007-01-18 22:59:59 +0000126bool gen_xsd = false;
Mark Sleef0712dc2006-10-25 19:03:57 +0000127bool gen_php = false;
128bool gen_phpi = false;
Mark Slee756b1d12007-07-06 00:30:21 +0000129bool gen_rest = false;
Mark Slee2c44d202007-05-16 02:18:07 +0000130bool gen_perl = false;
iproctor9a41a0c2007-07-16 21:59:24 +0000131bool gen_ocaml = false;
Christopher Piro2f5afce2007-06-29 07:17:33 +0000132bool gen_erl = false;
iproctorff8eb922007-07-25 19:06:13 +0000133bool gen_hs = false;
Mark Sleef0712dc2006-10-25 19:03:57 +0000134bool gen_recurse = false;
135
136/**
Mark Slee31985722006-05-24 21:45:31 +0000137 * Report an error to the user. This is called yyerror for historical
138 * reasons (lex and yacc expect the error reporting routine to be called
139 * this). Call this function to report any errors to the user.
140 * yyerror takes printf style arguments.
141 *
142 * @param fmt C format string followed by additional arguments
143 */
144void yyerror(char* fmt, ...) {
145 va_list args;
146 fprintf(stderr,
Mark Sleef0712dc2006-10-25 19:03:57 +0000147 "[ERROR:%s:%d] (last token was '%s')\n",
148 g_curpath.c_str(),
Mark Slee31985722006-05-24 21:45:31 +0000149 yylineno,
150 yytext);
Mark Slee31985722006-05-24 21:45:31 +0000151
152 va_start(args, fmt);
153 vfprintf(stderr, fmt, args);
154 va_end(args);
155
156 fprintf(stderr, "\n");
157}
158
159/**
160 * Prints a debug message from the parser.
161 *
162 * @param fmt C format string followed by additional arguments
163 */
164void pdebug(char* fmt, ...) {
165 if (g_debug == 0) {
166 return;
167 }
168 va_list args;
Mark Slee30152872006-11-28 01:24:07 +0000169 printf("[PARSE:%d] ", yylineno);
Mark Sleef0712dc2006-10-25 19:03:57 +0000170 va_start(args, fmt);
171 vprintf(fmt, args);
172 va_end(args);
173 printf("\n");
174}
175
176/**
177 * Prints a verbose output mode message
178 *
179 * @param fmt C format string followed by additional arguments
180 */
181void pverbose(char* fmt, ...) {
182 if (g_verbose == 0) {
183 return;
184 }
185 va_list args;
186 va_start(args, fmt);
187 vprintf(fmt, args);
188 va_end(args);
189}
190
191/**
192 * Prints a warning message
193 *
194 * @param fmt C format string followed by additional arguments
195 */
196void pwarning(int level, char* fmt, ...) {
197 if (g_warn < level) {
198 return;
199 }
200 va_list args;
201 printf("[WARNING:%s:%d] ", g_curpath.c_str(), yylineno);
Mark Slee31985722006-05-24 21:45:31 +0000202 va_start(args, fmt);
203 vprintf(fmt, args);
204 va_end(args);
205 printf("\n");
206}
207
208/**
209 * Prints a failure message and exits
210 *
211 * @param fmt C format string followed by additional arguments
212 */
Mark Slee30152872006-11-28 01:24:07 +0000213void failure(const char* fmt, ...) {
Mark Slee2c44d202007-05-16 02:18:07 +0000214 va_list args;
Mark Sleef0712dc2006-10-25 19:03:57 +0000215 fprintf(stderr, "[FAILURE:%s:%d] ", g_curpath.c_str(), yylineno);
Mark Slee31985722006-05-24 21:45:31 +0000216 va_start(args, fmt);
217 vfprintf(stderr, fmt, args);
218 va_end(args);
219 printf("\n");
220 exit(1);
221}
222
/**
 * Derives a thrift program name from a file name: everything up to and
 * including the last '/' is dropped, then everything from the last '.'
 * onwards is dropped.
 *
 * @param filename path or bare file name
 * @return the base name without directory or final extension
 */
std::string program_name(std::string filename) {
  // Strip the directory part, if any.
  const std::string::size_type last_sep = filename.find_last_of('/');
  if (last_sep != std::string::npos) {
    filename.erase(0, last_sep + 1);
  }

  // Strip the final extension, if any.
  const std::string::size_type ext = filename.find_last_of('.');
  if (ext != std::string::npos) {
    filename.erase(ext);
  }

  return filename;
}
237
/**
 * Returns the directory portion of a path: the text before the last '/'.
 * A name without any '/' yields "." (the current directory).
 *
 * @param filename path or bare file name
 * @return directory part of the path, or "." when there is none
 */
std::string directory_name(std::string filename) {
  const std::string::size_type last_sep = filename.find_last_of('/');
  return (last_sep == std::string::npos)
    ? std::string(".")
    : std::string(filename, 0, last_sep);
}
249
250/**
251 * Finds the appropriate file path for the given filename
252 */
253string include_file(string filename) {
254 // Absolute path? Just try that
Martin Kraemer32c66e12006-11-09 00:06:36 +0000255 if (filename[0] == '/') {
256 // Realpath!
257 char rp[PATH_MAX];
258 if (realpath(filename.c_str(), rp) == NULL) {
259 pwarning(0, "Cannot open include file %s\n", filename.c_str());
260 return std::string();
261 }
Mark Slee2c44d202007-05-16 02:18:07 +0000262
263 // Stat this file
Martin Kraemer32c66e12006-11-09 00:06:36 +0000264 struct stat finfo;
265 if (stat(rp, &finfo) == 0) {
266 return rp;
267 }
268 } else { // relative path, start searching
269 // new search path with current dir global
270 vector<string> sp = g_incl_searchpath;
271 sp.insert(sp.begin(), g_curdir);
Mark Slee2c44d202007-05-16 02:18:07 +0000272
Martin Kraemer32c66e12006-11-09 00:06:36 +0000273 // iterate through paths
274 vector<string>::iterator it;
275 for (it = sp.begin(); it != sp.end(); it++) {
276 string sfilename = *(it) + "/" + filename;
Mark Slee2c44d202007-05-16 02:18:07 +0000277
Martin Kraemer32c66e12006-11-09 00:06:36 +0000278 // Realpath!
279 char rp[PATH_MAX];
280 if (realpath(sfilename.c_str(), rp) == NULL) {
281 continue;
282 }
Mark Slee2c44d202007-05-16 02:18:07 +0000283
Martin Kraemer32c66e12006-11-09 00:06:36 +0000284 // Stat this files
285 struct stat finfo;
286 if (stat(rp, &finfo) == 0) {
287 return rp;
288 }
289 }
Mark Sleef0712dc2006-10-25 19:03:57 +0000290 }
Mark Slee2c44d202007-05-16 02:18:07 +0000291
Mark Sleef0712dc2006-10-25 19:03:57 +0000292 // Uh oh
293 pwarning(0, "Could not find include file %s\n", filename.c_str());
294 return std::string();
295}
296
/**
 * Cleans up text commonly found in doxygen-like comments, in place.
 *
 * Steps, in order:
 *  - carriage returns are removed;
 *  - a final line containing only spaces/tabs is dropped;
 *  - leading whitespace is removed from the first line;
 *  - if every non-blank line after the first starts with the same amount
 *    of whitespace followed by a star, that prefix (and the star) is
 *    removed from those lines;
 *  - the smallest common leading whitespace of the lines after the first
 *    is removed;
 *  - trailing whitespace is removed from every line, and lines consisting
 *    only of whitespace become empty;
 *  - an empty first line is dropped.
 * The remaining lines are joined with a newline after each one and copied
 * back into the caller's buffer.
 *
 * Warning: if you mix tabs and spaces in a non-uniform way,
 * you will get what you deserve.
 *
 * @param doctext NUL-terminated, writable comment text; overwritten with
 *                the cleaned text. The cleaned text must not be longer
 *                than the input (checked with assert before the copy).
 * @return doctext, or NULL when the input contains no lines at all
 */
char* clean_up_doctext(char* doctext) {
  // Convert to C++ string, and remove Windows's carriage returns.
  std::string docstring = doctext;
  docstring.erase(
      std::remove(docstring.begin(), docstring.end(), '\r'),
      docstring.end());

  // Separate into lines.
  std::vector<std::string> lines;
  std::string::size_type pos = std::string::npos;
  std::string::size_type last;
  while (true) {
    last = (pos == std::string::npos) ? 0 : pos + 1;
    pos = docstring.find('\n', last);
    if (pos == std::string::npos) {
      // First bit of cleaning. If the last line is only whitespace, drop it.
      std::string::size_type nonwhite = docstring.find_first_not_of(" \t", last);
      if (nonwhite != std::string::npos) {
        lines.push_back(docstring.substr(last));
      }
      break;
    }
    lines.push_back(docstring.substr(last, pos - last));
  }

  // Nothing but (at most) whitespace: there is no docstring.
  if (lines.empty()) {
    return NULL;
  }

  // Clear leading whitespace from the first line. When the line is all
  // whitespace pos is npos and the whole line is erased.
  pos = lines.front().find_first_not_of(" \t");
  lines.front().erase(0, pos);

  // If every nonblank line after the first has the same number of spaces/tabs,
  // then a star, remove them.
  bool have_prefix = true;
  bool found_prefix = false;
  std::string::size_type prefix_len = 0;
  std::vector<std::string>::iterator l_iter;
  for (l_iter = lines.begin() + 1; l_iter != lines.end(); ++l_iter) {
    if (l_iter->empty()) {
      continue;
    }

    pos = l_iter->find_first_not_of(" \t");
    if (!found_prefix) {
      if (pos != std::string::npos) {
        if (l_iter->at(pos) == '*') {
          // The first starred line fixes the expected prefix width.
          found_prefix = true;
          prefix_len = pos;
        } else {
          have_prefix = false;
          break;
        }
      } else {
        // Whitespace-only line. Truncate it.
        l_iter->clear();
      }
    } else if (l_iter->size() > pos
               && l_iter->at(pos) == '*'
               && pos == prefix_len) {
      // Business as usual.
    } else if (pos == std::string::npos) {
      // Whitespace-only line. Let's truncate it for them.
      l_iter->clear();
    } else {
      // The pattern has been broken.
      have_prefix = false;
      break;
    }
  }

  // If our prefix survived, delete it from every line.
  if (have_prefix) {
    // Get the star too.
    prefix_len++;
    for (l_iter = lines.begin() + 1; l_iter != lines.end(); ++l_iter) {
      l_iter->erase(0, prefix_len);
    }
  }

  // Now find the minimum amount of leading whitespace over the lines that
  // have visible content.
  prefix_len = std::string::npos;
  for (l_iter = lines.begin() + 1; l_iter != lines.end(); ++l_iter) {
    if (l_iter->empty()) {
      continue;
    }
    pos = l_iter->find_first_not_of(" \t");
    if (pos != std::string::npos
        && (prefix_len == std::string::npos || pos < prefix_len)) {
      prefix_len = pos;
    }
  }

  // If a common indentation was found, delete it from every line.
  if (prefix_len != std::string::npos) {
    for (l_iter = lines.begin() + 1; l_iter != lines.end(); ++l_iter) {
      l_iter->erase(0, prefix_len);
    }
  }

  // Remove trailing whitespace from every line. A line made up entirely of
  // whitespace (for example what is left of " *  " once the star prefix is
  // gone) has no non-blank character at all and is emptied completely.
  for (l_iter = lines.begin(); l_iter != lines.end(); ++l_iter) {
    pos = l_iter->find_last_not_of(" \t");
    if (pos == std::string::npos) {
      l_iter->clear();
    } else {
      l_iter->erase(pos + 1);
    }
  }

  // If the first line is empty, remove it.
  // Don't do this earlier because a lot of steps skip the first line.
  if (lines.front().empty()) {
    lines.erase(lines.begin());
  }

  // Now rejoin the lines and copy them back into doctext.
  docstring.clear();
  for (l_iter = lines.begin(); l_iter != lines.end(); ++l_iter) {
    docstring += *l_iter;
    docstring += '\n';
  }

  // The result is written over the input, so it must fit.
  assert(docstring.length() <= strlen(doctext));
  strcpy(doctext, docstring.c_str());
  return doctext;
}
430
431/** Set to true to debug docstring parsing */
432static bool dump_docs = false;
433
434/**
435 * Dumps docstrings to stdout
David Reissc2532a92007-07-30 23:46:11 +0000436 * Only works for typedefs and whole program
David Reiss1ac05802007-07-30 22:00:27 +0000437 */
438void dump_docstrings(t_program* program) {
David Reissc2532a92007-07-30 23:46:11 +0000439 string progdoc = g_program->get_doc();
440 if (!progdoc.empty()) {
441 printf("Whole program doc:\n%s\n", progdoc.c_str());
442 }
David Reiss1ac05802007-07-30 22:00:27 +0000443 const vector<t_typedef*>& typedefs = program->get_typedefs();
444 vector<t_typedef*>::const_iterator t_iter;
445 for (t_iter = typedefs.begin(); t_iter != typedefs.end(); ++t_iter) {
446 t_typedef* td = *t_iter;
447 if (td->has_doc()) {
448 printf("%s:\n%s\n", td->get_name().c_str(), td->get_doc().c_str());
449 }
450 }
451}
452
/**
 * Displays the usage message on stderr and then exits with status 1.
 */
void usage() {
  // One entry per output line, printed in order.
  static const char* const help_lines[] = {
    "Usage: thrift [options] file\n",
    "Options:\n",
    " -cpp Generate C++ output files\n",
    " -java Generate Java output files\n",
    " -php Generate PHP output files\n",
    " -phpi Generate PHP inlined files\n",
    " -py Generate Python output files\n",
    " -rb Generate Ruby output files\n",
    " -xsd Generate XSD output files\n",
    " -perl Generate Perl output files\n",
    " -ocaml Generate OCaml output files\n",
    " -erl Generate Erlang output files\n",
    " -hs Generate Haskell output files\n",
    " -I dir Add a directory to the list of directories \n",
    " searched for include directives\n",
    " -nowarn Suppress all compiler warnings (BAD!)\n",
    " -strict Strict compiler warnings on\n",
    " -v[erbose] Verbose mode\n",
    " -r[ecurse] Also generate included files\n",
    " -debug Parse debug trace to stdout\n"
  };
  const size_t line_count = sizeof(help_lines) / sizeof(help_lines[0]);

  for (size_t idx = 0; idx < line_count; ++idx) {
    fputs(help_lines[idx], stderr);
  }
  exit(1);
}
479
480/**
Mark Slee30152872006-11-28 01:24:07 +0000481 * You know, when I started working on Thrift I really thought it wasn't going
482 * to become a programming language because it was just a generator and it
483 * wouldn't need runtime type information and all that jazz. But then we
484 * decided to add constants, and all of a sudden that means runtime type
485 * validation and inference, except the "runtime" is the code generator
486 * runtime. Shit. I've been had.
487 */
488void validate_const_rec(std::string name, t_type* type, t_const_value* value) {
489 if (type->is_void()) {
490 throw "type error: cannot declare a void const: " + name;
491 }
492
493 if (type->is_base_type()) {
494 t_base_type::t_base tbase = ((t_base_type*)type)->get_base();
495 switch (tbase) {
496 case t_base_type::TYPE_STRING:
497 if (value->get_type() != t_const_value::CV_STRING) {
498 throw "type error: const \"" + name + "\" was declared as string";
499 }
500 break;
501 case t_base_type::TYPE_BOOL:
502 if (value->get_type() != t_const_value::CV_INTEGER) {
503 throw "type error: const \"" + name + "\" was declared as bool";
504 }
505 break;
506 case t_base_type::TYPE_BYTE:
507 if (value->get_type() != t_const_value::CV_INTEGER) {
508 throw "type error: const \"" + name + "\" was declared as byte";
509 }
510 break;
511 case t_base_type::TYPE_I16:
512 if (value->get_type() != t_const_value::CV_INTEGER) {
513 throw "type error: const \"" + name + "\" was declared as i16";
514 }
515 break;
516 case t_base_type::TYPE_I32:
517 if (value->get_type() != t_const_value::CV_INTEGER) {
518 throw "type error: const \"" + name + "\" was declared as i32";
519 }
520 break;
521 case t_base_type::TYPE_I64:
522 if (value->get_type() != t_const_value::CV_INTEGER) {
523 throw "type error: const \"" + name + "\" was declared as i64";
524 }
525 break;
526 case t_base_type::TYPE_DOUBLE:
527 if (value->get_type() != t_const_value::CV_INTEGER &&
528 value->get_type() != t_const_value::CV_DOUBLE) {
529 throw "type error: const \"" + name + "\" was declared as double";
530 }
531 break;
532 default:
533 throw "compiler error: no const of base type " + tbase + name;
534 }
535 } else if (type->is_enum()) {
536 if (value->get_type() != t_const_value::CV_INTEGER) {
537 throw "type error: const \"" + name + "\" was declared as enum";
538 }
539 } else if (type->is_struct() || type->is_xception()) {
540 if (value->get_type() != t_const_value::CV_MAP) {
541 throw "type error: const \"" + name + "\" was declared as struct/xception";
542 }
543 const vector<t_field*>& fields = ((t_struct*)type)->get_members();
544 vector<t_field*>::const_iterator f_iter;
545
546 const map<t_const_value*, t_const_value*>& val = value->get_map();
547 map<t_const_value*, t_const_value*>::const_iterator v_iter;
548 for (v_iter = val.begin(); v_iter != val.end(); ++v_iter) {
549 if (v_iter->first->get_type() != t_const_value::CV_STRING) {
550 throw "type error: " + name + " struct key must be string";
551 }
552 t_type* field_type = NULL;
553 for (f_iter = fields.begin(); f_iter != fields.end(); ++f_iter) {
554 if ((*f_iter)->get_name() == v_iter->first->get_string()) {
555 field_type = (*f_iter)->get_type();
556 }
557 }
558 if (field_type == NULL) {
559 throw "type error: " + type->get_name() + " has no field " + v_iter->first->get_string();
560 }
561
562 validate_const_rec(name + "." + v_iter->first->get_string(), field_type, v_iter->second);
563 }
564 } else if (type->is_map()) {
565 t_type* k_type = ((t_map*)type)->get_key_type();
566 t_type* v_type = ((t_map*)type)->get_val_type();
567 const map<t_const_value*, t_const_value*>& val = value->get_map();
568 map<t_const_value*, t_const_value*>::const_iterator v_iter;
569 for (v_iter = val.begin(); v_iter != val.end(); ++v_iter) {
570 validate_const_rec(name + "<key>", k_type, v_iter->first);
571 validate_const_rec(name + "<val>", v_type, v_iter->second);
Mark Slee2c44d202007-05-16 02:18:07 +0000572 }
Mark Slee30152872006-11-28 01:24:07 +0000573 } else if (type->is_list() || type->is_set()) {
574 t_type* e_type;
575 if (type->is_list()) {
576 e_type = ((t_list*)type)->get_elem_type();
577 } else {
578 e_type = ((t_set*)type)->get_elem_type();
579 }
580 const vector<t_const_value*>& val = value->get_list();
581 vector<t_const_value*>::const_iterator v_iter;
582 for (v_iter = val.begin(); v_iter != val.end(); ++v_iter) {
583 validate_const_rec(name + "<elem>", e_type, *v_iter);
584 }
585 }
586}
587
588/**
589 * Check the type of the parsed const information against its declared type
590 */
591void validate_const_type(t_const* c) {
592 validate_const_rec(c->get_name(), c->get_type(), c->get_value());
593}
594
595/**
Mark Slee7ff32452007-02-01 05:26:18 +0000596 * Check the type of a default value assigned to a field.
597 */
598void validate_field_value(t_field* field, t_const_value* cv) {
599 validate_const_rec(field->get_name(), field->get_type(), cv);
600}
601
602/**
Mark Sleef0712dc2006-10-25 19:03:57 +0000603 * Parses a program
604 */
Mark Slee2c44d202007-05-16 02:18:07 +0000605void parse(t_program* program, t_program* parent_program) {
Mark Sleef0712dc2006-10-25 19:03:57 +0000606 // Get scope file path
607 string path = program->get_path();
Mark Slee2c44d202007-05-16 02:18:07 +0000608
Mark Sleef0712dc2006-10-25 19:03:57 +0000609 // Set current dir global, which is used in the include_file function
610 g_curdir = directory_name(path);
611 g_curpath = path;
612
613 // Open the file
614 yyin = fopen(path.c_str(), "r");
615 if (yyin == 0) {
616 failure("Could not open input file: \"%s\"", path.c_str());
617 }
618
619 // Create new scope and scan for includes
620 pverbose("Scanning %s for includes\n", path.c_str());
Mark Slee2c44d202007-05-16 02:18:07 +0000621 g_parse_mode = INCLUDES;
Mark Sleef0712dc2006-10-25 19:03:57 +0000622 g_program = program;
623 g_scope = program->scope();
Mark Slee30152872006-11-28 01:24:07 +0000624 try {
Mark Slee36bfa2e2007-01-19 20:09:51 +0000625 yylineno = 1;
Mark Slee30152872006-11-28 01:24:07 +0000626 if (yyparse() != 0) {
627 failure("Parser error during include pass.");
628 }
629 } catch (string x) {
630 failure(x.c_str());
Mark Sleef0712dc2006-10-25 19:03:57 +0000631 }
632 fclose(yyin);
633
634 // Recursively parse all the include programs
635 vector<t_program*>& includes = program->get_includes();
636 vector<t_program*>::iterator iter;
637 for (iter = includes.begin(); iter != includes.end(); ++iter) {
638 parse(*iter, program);
639 }
640
641 // Parse the program the file
642 g_parse_mode = PROGRAM;
643 g_program = program;
644 g_scope = program->scope();
645 g_parent_scope = (parent_program != NULL) ? parent_program->scope() : NULL;
646 g_parent_prefix = program->get_name() + ".";
647 g_curpath = path;
648 yyin = fopen(path.c_str(), "r");
649 if (yyin == 0) {
650 failure("Could not open input file: \"%s\"", path.c_str());
651 }
652 pverbose("Parsing %s for types\n", path.c_str());
Mark Slee36bfa2e2007-01-19 20:09:51 +0000653 yylineno = 1;
David Reiss877237a2007-07-27 00:40:19 +0000654 try {
655 if (yyparse() != 0) {
656 failure("Parser error during types pass.");
657 }
658 } catch (string x) {
659 failure(x.c_str());
Mark Sleef0712dc2006-10-25 19:03:57 +0000660 }
661 fclose(yyin);
662}
663
664/**
665 * Generate code
666 */
667void generate(t_program* program) {
668 // Oooohh, recursive code generation, hot!!
669 if (gen_recurse) {
670 const vector<t_program*>& includes = program->get_includes();
671 for (size_t i = 0; i < includes.size(); ++i) {
672 generate(includes[i]);
673 }
674 }
675
676 // Generate code!
677 try {
678 pverbose("Program: %s\n", program->get_path().c_str());
679
680 if (gen_cpp) {
681 pverbose("Generating C++\n");
682 t_cpp_generator* cpp = new t_cpp_generator(program);
683 cpp->generate_program();
684 delete cpp;
685 }
686
687 if (gen_java) {
688 pverbose("Generating Java\n");
689 t_java_generator* java = new t_java_generator(program);
690 java->generate_program();
691 delete java;
692 }
693
694 if (gen_php) {
695 pverbose("Generating PHP\n");
Mark Slee756b1d12007-07-06 00:30:21 +0000696 t_php_generator* php = new t_php_generator(program, false, gen_rest);
Mark Sleef0712dc2006-10-25 19:03:57 +0000697 php->generate_program();
698 delete php;
699 }
700
701 if (gen_phpi) {
702 pverbose("Generating PHP-inline\n");
Mark Slee756b1d12007-07-06 00:30:21 +0000703 t_php_generator* phpi = new t_php_generator(program, true, gen_rest);
Mark Sleef0712dc2006-10-25 19:03:57 +0000704 phpi->generate_program();
705 delete phpi;
706 }
707
708 if (gen_py) {
709 pverbose("Generating Python\n");
710 t_py_generator* py = new t_py_generator(program);
711 py->generate_program();
712 delete py;
713 }
Mark Slee0e0ff7e2007-01-18 22:59:59 +0000714
Mark Slee6d7d5952007-01-27 01:44:22 +0000715 if (gen_rb) {
716 pverbose("Generating Ruby\n");
717 t_rb_generator* rb = new t_rb_generator(program);
718 rb->generate_program();
719 delete rb;
720 }
721
Mark Slee0e0ff7e2007-01-18 22:59:59 +0000722 if (gen_xsd) {
723 pverbose("Generating XSD\n");
724 t_xsd_generator* xsd = new t_xsd_generator(program);
725 xsd->generate_program();
726 delete xsd;
727 }
728
Mark Slee2c44d202007-05-16 02:18:07 +0000729 if (gen_perl) {
730 pverbose("Generating PERL\n");
731 t_perl_generator* perl = new t_perl_generator(program);
732 perl->generate_program();
733 delete perl;
734 }
735
iproctor9a41a0c2007-07-16 21:59:24 +0000736 if (gen_ocaml) {
737 pverbose("Generating OCaml\n");
738 t_ocaml_generator* ocaml = new t_ocaml_generator(program);
739 ocaml->generate_program();
740 delete ocaml;
741 }
742
Christopher Piro2f5afce2007-06-29 07:17:33 +0000743 if (gen_erl) {
744 pverbose("Generating Erlang\n");
745 t_erl_generator* erl = new t_erl_generator(program);
746 erl->generate_program();
747 delete erl;
748 }
iproctorff8eb922007-07-25 19:06:13 +0000749 if (gen_hs) {
750 pverbose("Generating Haskell\n");
751 t_hs_generator* hs = new t_hs_generator(program);
752 hs->generate_program();
753 delete hs;
754 }
David Reiss1ac05802007-07-30 22:00:27 +0000755 if (dump_docs) {
756 dump_docstrings(program);
757 }
iproctor9a41a0c2007-07-16 21:59:24 +0000758
Mark Sleef0712dc2006-10-25 19:03:57 +0000759 } catch (string s) {
760 printf("Error: %s\n", s.c_str());
761 } catch (const char* exc) {
762 printf("Error: %s\n", exc);
763 }
764
765}
766
767/**
Mark Sleef5377b32006-10-10 01:42:59 +0000768 * Parse it up.. then spit it back out, in pretty much every language. Alright
769 * not that many languages, but the cool ones that we care about.
Mark Slee31985722006-05-24 21:45:31 +0000770 */
771int main(int argc, char** argv) {
772 int i;
Mark Sleef5377b32006-10-10 01:42:59 +0000773
Mark Sleeb15a68b2006-06-07 06:46:24 +0000774 // Setup time string
775 time_t now = time(NULL);
776 g_time_str = ctime(&now);
Mark Slee31985722006-05-24 21:45:31 +0000777
Mark Sleef0712dc2006-10-25 19:03:57 +0000778 // Check for necessary arguments, you gotta have at least a filename and
779 // an output language flag
Mark Sleeb15a68b2006-06-07 06:46:24 +0000780 if (argc < 2) {
781 usage();
782 }
Mark Slee31985722006-05-24 21:45:31 +0000783
Mark Sleef5377b32006-10-10 01:42:59 +0000784 // Hacky parameter handling... I didn't feel like using a library sorry!
Mark Slee31985722006-05-24 21:45:31 +0000785 for (i = 1; i < argc-1; i++) {
Mark Sleefdbee812006-09-27 18:50:48 +0000786 char* arg;
Mark Slee2329a832006-11-09 00:23:30 +0000787
Mark Sleefdbee812006-09-27 18:50:48 +0000788 arg = strtok(argv[i], " ");
789 while (arg != NULL) {
Mark Slee2329a832006-11-09 00:23:30 +0000790 // Treat double dashes as single dashes
Mark Slee52cb2232006-11-10 22:32:07 +0000791 if (arg[0] == '-' && arg[1] == '-') {
Mark Slee2329a832006-11-09 00:23:30 +0000792 ++arg;
793 }
794
795 if (strcmp(arg, "-debug") == 0) {
Mark Sleefdbee812006-09-27 18:50:48 +0000796 g_debug = 1;
Mark Slee2329a832006-11-09 00:23:30 +0000797 } else if (strcmp(arg, "-nowarn") == 0) {
Mark Sleef0712dc2006-10-25 19:03:57 +0000798 g_warn = 0;
Mark Slee2329a832006-11-09 00:23:30 +0000799 } else if (strcmp(arg, "-strict") == 0) {
Mark Sleef0712dc2006-10-25 19:03:57 +0000800 g_warn = 2;
Mark Slee2329a832006-11-09 00:23:30 +0000801 } else if (strcmp(arg, "-v") == 0 || strcmp(arg, "-verbose") == 0 ) {
Mark Sleef0712dc2006-10-25 19:03:57 +0000802 g_verbose = 1;
Mark Slee2329a832006-11-09 00:23:30 +0000803 } else if (strcmp(arg, "-r") == 0 || strcmp(arg, "-recurse") == 0 ) {
Mark Sleef0712dc2006-10-25 19:03:57 +0000804 gen_recurse = true;
Mark Slee2329a832006-11-09 00:23:30 +0000805 } else if (strcmp(arg, "-cpp") == 0) {
Mark Sleefdbee812006-09-27 18:50:48 +0000806 gen_cpp = true;
Mark Slee2329a832006-11-09 00:23:30 +0000807 } else if (strcmp(arg, "-java") == 0) {
Mark Sleefdbee812006-09-27 18:50:48 +0000808 gen_java = true;
Mark Slee2329a832006-11-09 00:23:30 +0000809 } else if (strcmp(arg, "-php") == 0) {
Mark Sleefdbee812006-09-27 18:50:48 +0000810 gen_php = true;
Mark Slee2329a832006-11-09 00:23:30 +0000811 } else if (strcmp(arg, "-phpi") == 0) {
Mark Sleef5377b32006-10-10 01:42:59 +0000812 gen_phpi = true;
Mark Slee756b1d12007-07-06 00:30:21 +0000813 } else if (strcmp(arg, "-rest") == 0) {
814 gen_rest = true;
Mark Slee2329a832006-11-09 00:23:30 +0000815 } else if (strcmp(arg, "-py") == 0) {
Mark Sleefdbee812006-09-27 18:50:48 +0000816 gen_py = true;
Mark Slee6d7d5952007-01-27 01:44:22 +0000817 } else if (strcmp(arg, "-rb") == 0) {
818 gen_rb = true;
Mark Slee0e0ff7e2007-01-18 22:59:59 +0000819 } else if (strcmp(arg, "-xsd") == 0) {
820 gen_xsd = true;
Mark Slee2c44d202007-05-16 02:18:07 +0000821 } else if (strcmp(arg, "-perl") == 0) {
822 gen_perl = true;
iproctor9a41a0c2007-07-16 21:59:24 +0000823 } else if (strcmp(arg, "-ocaml") == 0) {
824 gen_ocaml = true;
Christopher Piro2f5afce2007-06-29 07:17:33 +0000825 } else if (strcmp(arg, "-erl") == 0) {
826 gen_erl = true;
iproctorff8eb922007-07-25 19:06:13 +0000827 } else if (strcmp(arg, "-hs") == 0) {
828 gen_hs = true;
Martin Kraemer32c66e12006-11-09 00:06:36 +0000829 } else if (strcmp(arg, "-I") == 0) {
830 // An argument of "-I\ asdf" is invalid and has unknown results
831 arg = argv[++i];
832
833 if (arg == NULL) {
834 fprintf(stderr, "!!! Missing Include directory");
835 usage();
836 }
837 g_incl_searchpath.push_back(arg);
Mark Sleefdbee812006-09-27 18:50:48 +0000838 } else {
839 fprintf(stderr, "!!! Unrecognized option: %s\n", arg);
840 usage();
841 }
842
843 // Tokenize more
844 arg = strtok(NULL, " ");
Mark Slee31985722006-05-24 21:45:31 +0000845 }
846 }
Mark Slee2c44d202007-05-16 02:18:07 +0000847
Mark Sleef0712dc2006-10-25 19:03:57 +0000848 // You gotta generate something!
iproctorff8eb922007-07-25 19:06:13 +0000849 if (!gen_cpp && !gen_java && !gen_php && !gen_phpi && !gen_py && !gen_rb && !gen_xsd && !gen_perl && !gen_ocaml && !gen_erl && !gen_hs) {
Mark Sleeb15a68b2006-06-07 06:46:24 +0000850 fprintf(stderr, "!!! No output language(s) specified\n\n");
851 usage();
852 }
Mark Sleef0712dc2006-10-25 19:03:57 +0000853
854 // Real-pathify it
855 char rp[PATH_MAX];
856 if (realpath(argv[i], rp) == NULL) {
857 failure("Could not open input file: %s", argv[i]);
Mark Slee31985722006-05-24 21:45:31 +0000858 }
Mark Sleef0712dc2006-10-25 19:03:57 +0000859 string input_file(rp);
860
Mark Sleef5377b32006-10-10 01:42:59 +0000861 // Instance of the global parse tree
Mark Sleef0712dc2006-10-25 19:03:57 +0000862 t_program* program = new t_program(input_file);
863
864 // Initialize global types
865 g_type_void = new t_base_type("void", t_base_type::TYPE_VOID);
866 g_type_string = new t_base_type("string", t_base_type::TYPE_STRING);
Mark Slee8d725a22007-04-13 01:57:12 +0000867 g_type_binary = new t_base_type("string", t_base_type::TYPE_STRING);
868 ((t_base_type*)g_type_binary)->set_binary(true);
Mark Sleeb6200d82007-01-19 19:14:36 +0000869 g_type_slist = new t_base_type("string", t_base_type::TYPE_STRING);
870 ((t_base_type*)g_type_slist)->set_string_list(true);
Mark Sleef0712dc2006-10-25 19:03:57 +0000871 g_type_bool = new t_base_type("bool", t_base_type::TYPE_BOOL);
872 g_type_byte = new t_base_type("byte", t_base_type::TYPE_BYTE);
873 g_type_i16 = new t_base_type("i16", t_base_type::TYPE_I16);
874 g_type_i32 = new t_base_type("i32", t_base_type::TYPE_I32);
875 g_type_i64 = new t_base_type("i64", t_base_type::TYPE_I64);
876 g_type_double = new t_base_type("double", t_base_type::TYPE_DOUBLE);
Mark Sleee8540632006-05-30 09:24:40 +0000877
Mark Sleef5377b32006-10-10 01:42:59 +0000878 // Parse it!
Mark Sleef0712dc2006-10-25 19:03:57 +0000879 parse(program, NULL);
Mark Slee31985722006-05-24 21:45:31 +0000880
Mark Sleef0712dc2006-10-25 19:03:57 +0000881 // Generate it!
882 generate(program);
Mark Sleeb15a68b2006-06-07 06:46:24 +0000883
Mark Sleef0712dc2006-10-25 19:03:57 +0000884 // Clean up. Who am I kidding... this program probably orphans heap memory
885 // all over the place, but who cares because it is about to exit and it is
886 // all referenced and used by this wacky parse tree up until now anyways.
Mark Sleeb15a68b2006-06-07 06:46:24 +0000887
Mark Sleef0712dc2006-10-25 19:03:57 +0000888 delete program;
889 delete g_type_void;
890 delete g_type_string;
891 delete g_type_bool;
892 delete g_type_byte;
893 delete g_type_i16;
894 delete g_type_i32;
895 delete g_type_i64;
896 delete g_type_double;
Mark Slee31985722006-05-24 21:45:31 +0000897
898 // Finished
Mark Slee31985722006-05-24 21:45:31 +0000899 return 0;
900}