1 /**********************************************************************
6 created at: Fri May 28 18:02:42 JST 1993
8 Copyright (C) 1993-2007 Yukihiro Matsumoto
10 **********************************************************************/
15 #define PARSER_DEBUG 0
18 #define YYERROR_VERBOSE 1
19 #define YYSTACK_USE_ALLOCA 0
21 #include "ruby/ruby.h"
23 #include "ruby/encoding.h"
/* Number of elements in `array`, computed with sizeof and cast to int.
 * Only meaningful for a real array object: sizeof on a pointer would give
 * the pointer size instead. */
34 #define numberof(array) (int)(sizeof(array) / sizeof((array)[0]))
/*
 * Allocation hooks.  The YY* macros forward to the rb_parser_* allocators
 * and pass along a variable named `parser`, which therefore has to be in
 * scope wherever one of them is expanded.  The plain malloc/realloc/calloc
 * names are then redefined to those hooks, so any later textual use of
 * them in this file goes through the same allocators.
 */
36 #define YYMALLOC(size) rb_parser_malloc(parser, (size))
37 #define YYREALLOC(ptr, size) rb_parser_realloc(parser, (ptr), (size))
38 #define YYCALLOC(nelem, size) rb_parser_calloc(parser, (nelem), (size))
39 #define YYFREE(ptr) rb_parser_free(parser, (ptr))
40 #define malloc YYMALLOC
41 #define realloc YYREALLOC
42 #define calloc YYCALLOC
/*
 * Symbol registration helpers.  REGISTER_SYMID is a convenience form of
 * register_symid() for NUL-terminated names: it measures the name with
 * strlen() (so `name` is evaluated twice) and takes the encoding from a
 * variable called `enc` that must exist at the expansion site.
 */
46 static ID register_symid(ID, const char *, long, rb_encoding *);
47 static ID register_symid_str(ID, VALUE);
48 #define REGISTER_SYMID(id, name) register_symid((id), (name), strlen(name), enc)
/*
 * ID classification predicates.
 *
 * is_notop_id(id) is true when id is greater than tLAST_OP_ID.  Each of the
 * is_<kind>_id() predicates additionally requires that the bits selected by
 * ID_SCOPE_MASK equal the matching ID_<KIND> tag.  id_type() returns those
 * masked bits as an int, or -1 when is_notop_id() fails.
 *
 * is_asgn_or_id(id) accepts exactly three scopes: ID_GLOBAL, ID_INSTANCE
 * and ID_CLASS.
 *
 * All of these evaluate `id` more than once, so the argument should be free
 * of side effects.
 */
52 #define is_notop_id(id) ((id)>tLAST_OP_ID)
53 #define is_local_id(id) (is_notop_id(id)&&((id)&ID_SCOPE_MASK)==ID_LOCAL)
54 #define is_global_id(id) (is_notop_id(id)&&((id)&ID_SCOPE_MASK)==ID_GLOBAL)
55 #define is_instance_id(id) (is_notop_id(id)&&((id)&ID_SCOPE_MASK)==ID_INSTANCE)
56 #define is_attrset_id(id) (is_notop_id(id)&&((id)&ID_SCOPE_MASK)==ID_ATTRSET)
57 #define is_const_id(id) (is_notop_id(id)&&((id)&ID_SCOPE_MASK)==ID_CONST)
58 #define is_class_id(id) (is_notop_id(id)&&((id)&ID_SCOPE_MASK)==ID_CLASS)
59 #define is_junk_id(id) (is_notop_id(id)&&((id)&ID_SCOPE_MASK)==ID_JUNK)
60 #define id_type(id) (is_notop_id(id) ? (int)((id)&ID_SCOPE_MASK) : -1)
62 #define is_asgn_or_id(id) ((is_notop_id(id)) && \
63 (((id)&ID_SCOPE_MASK) == ID_GLOBAL || \
64 ((id)&ID_SCOPE_MASK) == ID_INSTANCE || \
65 ((id)&ID_SCOPE_MASK) == ID_CLASS))
68 EXPR_BEG_bit, /* ignore newline, +/- is a sign. */
69 EXPR_END_bit, /* newline significant, +/- is an operator. */
70 EXPR_ENDARG_bit, /* ditto, and unbound braces. */
71 EXPR_ENDFN_bit, /* ditto, and unbound braces. */
72 EXPR_ARG_bit, /* newline significant, +/- is an operator. */
73 EXPR_CMDARG_bit, /* newline significant, +/- is an operator. */
74 EXPR_MID_bit, /* newline significant, +/- is an operator. */
75 EXPR_FNAME_bit, /* ignore newline, no reserved words. */
76 EXPR_DOT_bit, /* right after `.' or `::', no reserved words. */
77 EXPR_CLASS_bit, /* immediately after `class', no here document. */
78 EXPR_VALUE_bit, /* like EXPR_BEG, but a label is disallowed. */
81 /* examine combinations */
83 #define DEF_EXPR(n) EXPR_##n = (1 << EXPR_##n##_bit)
95 EXPR_BEG_ANY = (EXPR_BEG | EXPR_VALUE | EXPR_MID | EXPR_CLASS),
96 EXPR_ARG_ANY = (EXPR_ARG | EXPR_CMDARG),
97 EXPR_END_ANY = (EXPR_END | EXPR_ENDARG | EXPR_ENDFN)
/* Lexer-state tests.  IS_lex_state_for(x, ls) is a bitwise AND, so it is
 * non-zero when `x` has at least one of the bits in `ls` set; `ls` may be a
 * single state or an OR of several.  IS_lex_state(ls) applies the same test
 * to `lex_state`. */
99 #define IS_lex_state_for(x, ls) ((x) & (ls))
100 #define IS_lex_state(ls) IS_lex_state_for(lex_state, (ls))
103 static const char *lex_state_name(enum lex_state_e state);
106 typedef VALUE stack_type;
/*
 * A stack of single bits packed into one integer lvalue; the top of the
 * stack is bit 0.
 *
 *   BITSTACK_PUSH(stack, n)  shift left by one and store the low bit of n
 *                            as the new top.
 *   BITSTACK_POP(stack)      shift right by one, discarding the top.
 *   BITSTACK_LEXPOP(stack)   shift right by one, then OR the discarded top
 *                            bit into the new top, so a set bit survives
 *                            the pop.
 *   BITSTACK_SET_P(stack)    value of the top bit (0 or 1).
 *
 * `stack` is evaluated more than once and must be an assignable expression.
 * Pushing shifts the highest bit out of the integer, so the usable depth is
 * bounded by the width of the stack's type.
 */
108 # define BITSTACK_PUSH(stack, n) ((stack) = ((stack)<<1)|((n)&1))
109 # define BITSTACK_POP(stack) ((stack) = (stack) >> 1)
110 # define BITSTACK_LEXPOP(stack) ((stack) = ((stack) >> 1) | ((stack) & 1))
111 # define BITSTACK_SET_P(stack) ((stack)&1)
/* The same four operations applied to cond_stack. */
113 #define COND_PUSH(n) BITSTACK_PUSH(cond_stack, (n))
114 #define COND_POP() BITSTACK_POP(cond_stack)
115 #define COND_LEXPOP() BITSTACK_LEXPOP(cond_stack)
116 #define COND_P() BITSTACK_SET_P(cond_stack)
/* The same four operations applied to cmdarg_stack. */
118 #define CMDARG_PUSH(n) BITSTACK_PUSH(cmdarg_stack, (n))
119 #define CMDARG_POP() BITSTACK_POP(cmdarg_stack)
120 #define CMDARG_LEXPOP() BITSTACK_LEXPOP(cmdarg_stack)
121 #define CMDARG_P() BITSTACK_SET_P(cmdarg_stack)
134 struct local_vars *prev;
/*
 * Sentinel table values and the test that tells them apart from a real
 * table pointer.  POINTER_P() clears the two lowest bits of the value and
 * checks whether anything is left, so both DVARS_TOPSCOPE (NULL) and
 * DVARS_INHERIT ((void*)1) yield zero.  DVARS_SPECIAL_P() is simply the
 * negation of POINTER_P().
 */
138 #define DVARS_INHERIT ((void*)1)
139 #define DVARS_TOPSCOPE NULL
140 #define DVARS_SPECIAL_P(tbl) (!POINTER_P(tbl))
141 #define POINTER_P(val) ((VALUE)(val) & ~(VALUE)3)
144 vtable_size(const struct vtable *tbl)
146 if (POINTER_P(tbl)) {
156 static struct vtable *
157 vtable_alloc(struct vtable *prev)
159 struct vtable *tbl = ALLOC(struct vtable);
162 tbl->tbl = ALLOC_N(ID, tbl->capa);
164 if (VTBL_DEBUG) printf("vtable_alloc: %p\n", (void *)tbl);
169 vtable_free(struct vtable *tbl)
171 if (VTBL_DEBUG)printf("vtable_free: %p\n", (void *)tbl);
172 if (POINTER_P(tbl)) {
181 vtable_add(struct vtable *tbl, ID id)
183 if (!POINTER_P(tbl)) {
184 rb_bug("vtable_add: vtable is not allocated (%p)", (void *)tbl);
186 if (VTBL_DEBUG) printf("vtable_add: %p, %s\n", (void *)tbl, rb_id2name(id));
188 if (tbl->pos == tbl->capa) {
189 tbl->capa = tbl->capa * 2;
190 REALLOC_N(tbl->tbl, ID, tbl->capa);
192 tbl->tbl[tbl->pos++] = id;
196 vtable_included(const struct vtable * tbl, ID id)
200 if (POINTER_P(tbl)) {
201 for (i = 0; i < tbl->pos; i++) {
202 if (tbl->tbl[i] == id) {
212 typedef struct token_info {
217 struct token_info *next;
222 Structure of Lexer Buffer:
224 lex_pbeg tokp lex_p lex_pend
226 |-----------+--------------+------------|
230 struct parser_params {
234 YYSTYPE *parser_yylval;
237 NODE *parser_lex_strterm;
238 enum lex_state_e parser_lex_state;
239 stack_type parser_cond_stack;
240 stack_type parser_cmdarg_stack;
241 int parser_class_nest;
242 int parser_paren_nest;
244 int parser_in_single;
246 int parser_brace_nest;
247 int parser_compile_for_eval;
248 VALUE parser_cur_mid;
249 int parser_in_defined;
250 char *parser_tokenbuf;
254 VALUE parser_lex_input;
255 VALUE parser_lex_lastline;
256 VALUE parser_lex_nextline;
257 const char *parser_lex_pbeg;
258 const char *parser_lex_p;
259 const char *parser_lex_pend;
260 int parser_heredoc_end;
261 int parser_command_start;
262 NODE *parser_deferred_nodes;
263 long parser_lex_gets_ptr;
264 VALUE (*parser_lex_gets)(struct parser_params*,VALUE);
265 struct local_vars *parser_lvtbl;
266 int parser_ruby__end__seen;
269 char *parser_ruby_sourcefile; /* current source file */
270 int parser_ruby_sourceline; /* current line no. */
271 VALUE parser_ruby_sourcefile_string;
278 NODE *parser_eval_tree_begin;
279 NODE *parser_eval_tree;
284 int parser_token_info_enabled;
285 token_info *parser_token_info;
295 VALUE parsing_thread;
/*
 * String/symbol construction shortcuts that always use current_enc.
 *
 *   STR_NEW(p,n)    rb_enc_str_new() from pointer p and length n.
 *   STR_NEW0()      rb_enc_str_new() called with a null pointer and length 0.
 *   STR_NEW2(p)     like STR_NEW, length taken with strlen(p); p is
 *                   evaluated twice.
 *   STR_NEW3(...)   forwards to parser_str_new() with current_enc appended.
 *   ENC_SINGLE(cr)  true when cr equals ENC_CODERANGE_7BIT.
 *   TOK_INTERN(mb)  interns the current token (tok()/toklen()); the `mb`
 *                   argument is accepted but not used in the expansion.
 */
300 #define STR_NEW(p,n) rb_enc_str_new((p),(n),current_enc)
301 #define STR_NEW0() rb_enc_str_new(0,0,current_enc)
302 #define STR_NEW2(p) rb_enc_str_new((p),strlen(p),current_enc)
303 #define STR_NEW3(p,n,e,func) parser_str_new((p),(n),(e),(func),current_enc)
304 #define ENC_SINGLE(cr) ((cr)==ENC_CODERANGE_7BIT)
305 #define TOK_INTERN(mb) rb_intern3(tok(), toklen(), current_enc)
/* yyerror(msg) forwards to parser_yyerror(), supplying the `parser` that is
 * in scope at the call site. */
307 static int parser_yyerror(struct parser_params*, const char*);
308 #define yyerror(msg) parser_yyerror(parser, (msg))
/*
 * Short names for per-parser state.  Every macro below expands to a member
 * access on a variable named `parser`, so these names can only be used
 * where such a variable is visible.  Most map `name` to
 * `parser->parser_name`; the exceptions are current_enc (parser->enc),
 * ruby_eval_tree / ruby_eval_tree_begin (parser_eval_tree /
 * parser_eval_tree_begin), ruby_debug_lines (debug_lines) and
 * ruby_coverage (coverage).
 */
310 #define lex_strterm (parser->parser_lex_strterm)
311 #define lex_state (parser->parser_lex_state)
312 #define cond_stack (parser->parser_cond_stack)
313 #define cmdarg_stack (parser->parser_cmdarg_stack)
314 #define class_nest (parser->parser_class_nest)
315 #define paren_nest (parser->parser_paren_nest)
316 #define lpar_beg (parser->parser_lpar_beg)
317 #define brace_nest (parser->parser_brace_nest)
318 #define in_single (parser->parser_in_single)
319 #define in_def (parser->parser_in_def)
320 #define compile_for_eval (parser->parser_compile_for_eval)
321 #define cur_mid (parser->parser_cur_mid)
322 #define in_defined (parser->parser_in_defined)
323 #define tokenbuf (parser->parser_tokenbuf)
324 #define tokidx (parser->parser_tokidx)
325 #define toksiz (parser->parser_toksiz)
326 #define tokline (parser->parser_tokline)
327 #define lex_input (parser->parser_lex_input)
328 #define lex_lastline (parser->parser_lex_lastline)
329 #define lex_nextline (parser->parser_lex_nextline)
330 #define lex_pbeg (parser->parser_lex_pbeg)
331 #define lex_p (parser->parser_lex_p)
332 #define lex_pend (parser->parser_lex_pend)
333 #define heredoc_end (parser->parser_heredoc_end)
334 #define command_start (parser->parser_command_start)
335 #define deferred_nodes (parser->parser_deferred_nodes)
336 #define lex_gets_ptr (parser->parser_lex_gets_ptr)
337 #define lex_gets (parser->parser_lex_gets)
338 #define lvtbl (parser->parser_lvtbl)
339 #define ruby__end__seen (parser->parser_ruby__end__seen)
340 #define ruby_sourceline (parser->parser_ruby_sourceline)
341 #define ruby_sourcefile (parser->parser_ruby_sourcefile)
342 #define ruby_sourcefile_string (parser->parser_ruby_sourcefile_string)
343 #define current_enc (parser->enc)
344 #define yydebug (parser->parser_yydebug)
347 #define ruby_eval_tree (parser->parser_eval_tree)
348 #define ruby_eval_tree_begin (parser->parser_eval_tree_begin)
349 #define ruby_debug_lines (parser->debug_lines)
350 #define ruby_coverage (parser->coverage)
354 static int yylex(void*, void*);
356 static int yylex(void*);
360 #define yyparse ruby_yyparse
/*
 * Node construction and expression-check helpers.  Functions that need the
 * parser state take it as their first parameter; the lower-case macro next
 * to each one passes the `parser` variable of the enclosing scope.
 *
 * rb_node_newnode is redefined here as a macro that calls the file-local
 * node_newnode() with `parser` prepended.
 */
362 static NODE* node_newnode(struct parser_params *, enum node_type, VALUE, VALUE, VALUE);
363 #define rb_node_newnode(type, a1, a2, a3) node_newnode(parser, (type), (a1), (a2), (a3))
365 static NODE *cond_gen(struct parser_params*,NODE*);
366 #define cond(node) cond_gen(parser, (node))
367 static NODE *logop_gen(struct parser_params*,enum node_type,NODE*,NODE*);
368 #define logop(type,node1,node2) logop_gen(parser, (type), (node1), (node2))
370 static NODE *newline_node(NODE*);
371 static void fixpos(NODE*,NODE*);
373 static int value_expr_gen(struct parser_params*,NODE*);
374 static void void_expr_gen(struct parser_params*,NODE*);
375 static NODE *remove_begin(NODE*);
/* value_expr() and void_expr() first store remove_begin(node) back into
 * `node` and then run the check on the result.  The argument must therefore
 * be an assignable expression, and it is modified as a side effect.
 * void_expr0() runs the check without that reassignment. */
376 #define value_expr(node) value_expr_gen(parser, (node) = remove_begin(node))
377 #define void_expr0(node) void_expr_gen(parser, (node))
378 #define void_expr(node) void_expr0((node) = remove_begin(node))
/*
 * Tree-building helpers.  The naming convention in this span: a function
 * called foo_gen() takes `struct parser_params *` as its first parameter,
 * and the macro foo() calls it with the `parser` variable of the enclosing
 * scope followed by the macro's own arguments.
 *
 * Things that do not follow the pattern exactly:
 *   - literal_concat0, splat_array, negate_lit, arg_blk_pass and
 *     fixup_nodes are declared without a wrapper macro in this span.
 *   - new_op_assign_gen is declared here without a wrapper macro in this
 *     span.
 *   - new_attr_op_assign() accepts a `type` argument but does not pass it
 *     on to new_attr_op_assign_gen().
 */
379 static void void_stmts_gen(struct parser_params*,NODE*);
380 #define void_stmts(node) void_stmts_gen(parser, (node))
381 static void reduce_nodes_gen(struct parser_params*,NODE**);
382 #define reduce_nodes(n) reduce_nodes_gen(parser,(n))
383 static void block_dup_check_gen(struct parser_params*,NODE*,NODE*);
384 #define block_dup_check(n1,n2) block_dup_check_gen(parser,(n1),(n2))
386 static NODE *block_append_gen(struct parser_params*,NODE*,NODE*);
387 #define block_append(h,t) block_append_gen(parser,(h),(t))
388 static NODE *list_append_gen(struct parser_params*,NODE*,NODE*);
389 #define list_append(l,i) list_append_gen(parser,(l),(i))
390 static NODE *list_concat_gen(struct parser_params*,NODE*,NODE*);
391 #define list_concat(h,t) list_concat_gen(parser,(h),(t))
392 static NODE *arg_append_gen(struct parser_params*,NODE*,NODE*);
393 #define arg_append(h,t) arg_append_gen(parser,(h),(t))
394 static NODE *arg_concat_gen(struct parser_params*,NODE*,NODE*);
395 #define arg_concat(h,t) arg_concat_gen(parser,(h),(t))
396 static NODE *literal_concat_gen(struct parser_params*,NODE*,NODE*);
397 #define literal_concat(h,t) literal_concat_gen(parser,(h),(t))
398 static int literal_concat0(struct parser_params *, VALUE, VALUE);
399 static NODE *new_evstr_gen(struct parser_params*,NODE*);
400 #define new_evstr(n) new_evstr_gen(parser,(n))
401 static NODE *evstr2dstr_gen(struct parser_params*,NODE*);
402 #define evstr2dstr(n) evstr2dstr_gen(parser,(n))
403 static NODE *splat_array(NODE*);
405 static NODE *call_bin_op_gen(struct parser_params*,NODE*,ID,NODE*);
406 #define call_bin_op(recv,id,arg1) call_bin_op_gen(parser, (recv),(id),(arg1))
407 static NODE *call_uni_op_gen(struct parser_params*,NODE*,ID);
408 #define call_uni_op(recv,id) call_uni_op_gen(parser, (recv),(id))
410 static NODE *new_args_gen(struct parser_params*,NODE*,NODE*,ID,NODE*,NODE*);
411 #define new_args(f,o,r,p,t) new_args_gen(parser, (f),(o),(r),(p),(t))
412 static NODE *new_args_tail_gen(struct parser_params*,NODE*,ID,ID);
413 #define new_args_tail(k,kr,b) new_args_tail_gen(parser, (k),(kr),(b))
415 static NODE *negate_lit(NODE*);
416 static NODE *ret_args_gen(struct parser_params*,NODE*);
417 #define ret_args(node) ret_args_gen(parser, (node))
418 static NODE *arg_blk_pass(NODE*,NODE*);
419 static NODE *new_yield_gen(struct parser_params*,NODE*);
420 #define new_yield(node) new_yield_gen(parser, (node))
421 static NODE *dsym_node_gen(struct parser_params*,NODE*);
422 #define dsym_node(node) dsym_node_gen(parser, (node))
424 static NODE *gettable_gen(struct parser_params*,ID);
425 #define gettable(id) gettable_gen(parser,(id))
426 static NODE *assignable_gen(struct parser_params*,ID,NODE*);
427 #define assignable(id,node) assignable_gen(parser, (id), (node))
429 static NODE *aryset_gen(struct parser_params*,NODE*,NODE*);
430 #define aryset(node1,node2) aryset_gen(parser, (node1), (node2))
431 static NODE *attrset_gen(struct parser_params*,NODE*,ID);
432 #define attrset(node,id) attrset_gen(parser, (node), (id))
434 static void rb_backref_error_gen(struct parser_params*,NODE*);
435 #define rb_backref_error(n) rb_backref_error_gen(parser,(n))
436 static NODE *node_assign_gen(struct parser_params*,NODE*,NODE*);
437 #define node_assign(node1, node2) node_assign_gen(parser, (node1), (node2))
439 static NODE *new_op_assign_gen(struct parser_params *parser, NODE *lhs, ID op, NODE *rhs);
440 static NODE *new_attr_op_assign_gen(struct parser_params *parser, NODE *lhs, ID attr, ID op, NODE *rhs);
441 #define new_attr_op_assign(lhs, type, attr, op, rhs) new_attr_op_assign_gen(parser, (lhs), (attr), (op), (rhs))
442 static NODE *new_const_op_assign_gen(struct parser_params *parser, NODE *lhs, ID op, NODE *rhs);
443 #define new_const_op_assign(lhs, op, rhs) new_const_op_assign_gen(parser, (lhs), (op), (rhs))
445 static NODE *match_op_gen(struct parser_params*,NODE*,NODE*);
446 #define match_op(node1,node2) match_op_gen(parser, (node1), (node2))
448 static ID *local_tbl_gen(struct parser_params*);
449 #define local_tbl() local_tbl_gen(parser)
451 static void fixup_nodes(NODE **);
453 static VALUE reg_compile_gen(struct parser_params*, VALUE, int);
454 #define reg_compile(str,options) reg_compile_gen(parser, (str), (options))
455 static void reg_fragment_setenc_gen(struct parser_params*, VALUE, int);
456 #define reg_fragment_setenc(str,options) reg_fragment_setenc_gen(parser, (str), (options))
457 static int reg_fragment_check_gen(struct parser_params*, VALUE, int);
458 #define reg_fragment_check(str,options) reg_fragment_check_gen(parser, (str), (options))
459 static NODE *reg_named_capture_assign_gen(struct parser_params* parser, VALUE regexp, NODE *match);
460 #define reg_named_capture_assign(regexp,match) reg_named_capture_assign_gen(parser,(regexp),(match))
462 #define get_id(id) (id)
463 #define get_value(val) (val)
465 #define value_expr(node) ((void)(node))
466 #define remove_begin(node) (node)
467 #define rb_dvar_defined(id) 0
468 #define rb_local_defined(id) 0
469 static ID ripper_get_id(VALUE);
470 #define get_id(id) ripper_get_id(id)
471 static VALUE ripper_get_value(VALUE);
472 #define get_value(val) ripper_get_value(val)
473 static VALUE assignable_gen(struct parser_params*,VALUE);
474 #define assignable(lhs,node) assignable_gen(parser, (lhs))
475 static int id_is_var_gen(struct parser_params *parser, ID id);
476 #define id_is_var(id) id_is_var_gen(parser, (id))
478 #define node_assign(node1, node2) dispatch2(assign, (node1), (node2))
480 static VALUE new_op_assign_gen(struct parser_params *parser, VALUE lhs, VALUE op, VALUE rhs);
481 static VALUE new_attr_op_assign_gen(struct parser_params *parser, VALUE lhs, VALUE type, VALUE attr, VALUE op, VALUE rhs);
482 #define new_attr_op_assign(lhs, type, attr, op, rhs) new_attr_op_assign_gen(parser, (lhs), (type), (attr), (op), (rhs))
486 #define new_op_assign(lhs, op, rhs) new_op_assign_gen(parser, (lhs), (op), (rhs))
/*
 * Argument / local-variable / block-variable table helpers.  As elsewhere
 * in this file, each foo() macro calls foo_gen() with the `parser` variable
 * of the enclosing scope as the first argument.
 *
 * Notes on the less obvious entries:
 *   - dyna_var(id) is just another spelling of local_var(id).
 *   - dvar_defined(id) and dvar_defined_get(id) both call
 *     dvar_defined_gen(); they differ only in the last argument (0 vs 1).
 *   - dyna_push() returns a `const struct vtable *`, and dyna_pop() takes a
 *     value of that same type.
 */
488 static ID formal_argument_gen(struct parser_params*, ID);
489 #define formal_argument(id) formal_argument_gen(parser, (id))
490 static ID shadowing_lvar_gen(struct parser_params*,ID);
491 #define shadowing_lvar(name) shadowing_lvar_gen(parser, (name))
492 static void new_bv_gen(struct parser_params*,ID);
493 #define new_bv(id) new_bv_gen(parser, (id))
495 static void local_push_gen(struct parser_params*,int);
496 #define local_push(top) local_push_gen(parser,(top))
497 static void local_pop_gen(struct parser_params*);
498 #define local_pop() local_pop_gen(parser)
499 static int local_var_gen(struct parser_params*, ID);
500 #define local_var(id) local_var_gen(parser, (id))
501 static int arg_var_gen(struct parser_params*, ID);
502 #define arg_var(id) arg_var_gen(parser, (id))
503 static int local_id_gen(struct parser_params*, ID);
504 #define local_id(id) local_id_gen(parser, (id))
505 static ID internal_id_gen(struct parser_params*);
506 #define internal_id() internal_id_gen(parser)
508 static const struct vtable *dyna_push_gen(struct parser_params *);
509 #define dyna_push() dyna_push_gen(parser)
510 static void dyna_pop_gen(struct parser_params*, const struct vtable *);
511 #define dyna_pop(node) dyna_pop_gen(parser, (node))
512 static int dyna_in_block_gen(struct parser_params*);
513 #define dyna_in_block() dyna_in_block_gen(parser)
514 #define dyna_var(id) local_var(id)
515 static int dvar_defined_gen(struct parser_params*,ID,int);
516 #define dvar_defined(id) dvar_defined_gen(parser, (id), 0)
517 #define dvar_defined_get(id) dvar_defined_gen(parser, (id), 1)
518 static int dvar_curr_gen(struct parser_params*,ID);
519 #define dvar_curr(id) dvar_curr_gen(parser, (id))
521 static int lvar_defined_gen(struct parser_params*, ID);
522 #define lvar_defined(id) lvar_defined_gen(parser, (id))
/*
 * Layout of the regexp option word as used by these macros:
 *   bits 0..7    selected by RE_OPTION_MASK (0xff)
 *   bits 8..15   an 8-bit encoding value: RE_OPTION_ENCODING(e) places the
 *                low byte of e there, RE_OPTION_ENCODING_IDX(o) reads it
 *                back
 *   bit 16       RE_OPTION_ONCE
 * RE_OPTION_ENCODING_NONE(o) tests the RE_OPTION_ARG_ENCODING_NONE bit
 * (value 32), which lies inside the low byte.
 */
524 #define RE_OPTION_ONCE (1<<16)
525 #define RE_OPTION_ENCODING_SHIFT 8
526 #define RE_OPTION_ENCODING(e) (((e)&0xff)<<RE_OPTION_ENCODING_SHIFT)
527 #define RE_OPTION_ENCODING_IDX(o) (((o)>>RE_OPTION_ENCODING_SHIFT)&0xff)
528 #define RE_OPTION_ENCODING_NONE(o) ((o)&RE_OPTION_ARG_ENCODING_NONE)
529 #define RE_OPTION_MASK 0xff
530 #define RE_OPTION_ARG_ENCODING_NONE 32
/* NODE_STRTERM and NODE_HEREDOC are not node types of their own: they are
 * additional names for NODE_ZARRAY and NODE_ARRAY.  The trailing remarks
 * record what the garbage collector has to look at for each. */
532 #define NODE_STRTERM NODE_ZARRAY /* nothing to gc */
533 #define NODE_HEREDOC NODE_ARRAY /* 1, 3 to gc */
/*
 * SIGN_EXTEND(x, n): take the low n bits of x, read them as an n-bit
 * two's-complement number, and return that value widened.
 *
 * The low-bit mask is built from the unsigned constant ~0U because
 * left-shifting the negative value ~0 is undefined behavior in C; the
 * (int) cast gives the mask the same type it had before, so the type of
 * the whole expression is unchanged.  The parentheses around (n)-1 only
 * spell out the grouping the shorter form already had ('-' binds tighter
 * than '<<').
 *
 * x is evaluated once and n three times.  n must be at least 1 and smaller
 * than the bit width of int.
 */
#define SIGN_EXTEND(x,n) (((1<<((n)-1))^((x)&(int)~(~0U<<(n))))-(1<<((n)-1)))
/*
 * Field names for the nodes aliased above.  nd_func is u1.id and nd_nest is
 * u3.cnt; u2.id carries two values:
 *   nd_term(node)   the low CHAR_BIT*2 bits read as a signed quantity, via
 *                   a cast to signed short when SIZEOF_SHORT == 2 and via
 *                   SIGN_EXTEND otherwise
 *   nd_paren(node)  the bits above those, truncated to char
 * NOTE(review): the two nd_term definitions are alternatives; the #else and
 * #endif that separate them are not visible in this excerpt.
 */
535 #define nd_func u1.id
536 #if SIZEOF_SHORT == 2
537 #define nd_term(node) ((signed short)(node)->u2.id)
539 #define nd_term(node) SIGN_EXTEND((node)->u2.id, CHAR_BIT*2)
541 #define nd_paren(node) (char)((node)->u2.id >> CHAR_BIT*2)
542 #define nd_nest u3.cnt
544 /****** Ripper *******/
547 #define RIPPER_VERSION "0.1.0"
549 #include "eventids1.c"
550 #include "eventids2.c"
/*
 * Ripper event dispatch.  ripper_dispatchN() takes the parser, an event ID
 * and N VALUE arguments; variants exist for N = 0..5 and 7 (there is no
 * 6-argument form here).
 *
 * The dispatchN(n, ...) macros take a bare event name `n`, build the
 * identifier ripper_id_<n> with TOKEN_PASTE, and call the matching function
 * with the `parser` variable of the enclosing scope.
 */
552 static VALUE ripper_dispatch0(struct parser_params*,ID);
553 static VALUE ripper_dispatch1(struct parser_params*,ID,VALUE);
554 static VALUE ripper_dispatch2(struct parser_params*,ID,VALUE,VALUE);
555 static VALUE ripper_dispatch3(struct parser_params*,ID,VALUE,VALUE,VALUE);
556 static VALUE ripper_dispatch4(struct parser_params*,ID,VALUE,VALUE,VALUE,VALUE);
557 static VALUE ripper_dispatch5(struct parser_params*,ID,VALUE,VALUE,VALUE,VALUE,VALUE);
558 static VALUE ripper_dispatch7(struct parser_params*,ID,VALUE,VALUE,VALUE,VALUE,VALUE,VALUE,VALUE);
560 #define dispatch0(n) ripper_dispatch0(parser, TOKEN_PASTE(ripper_id_, n))
561 #define dispatch1(n,a) ripper_dispatch1(parser, TOKEN_PASTE(ripper_id_, n), (a))
562 #define dispatch2(n,a,b) ripper_dispatch2(parser, TOKEN_PASTE(ripper_id_, n), (a), (b))
563 #define dispatch3(n,a,b,c) ripper_dispatch3(parser, TOKEN_PASTE(ripper_id_, n), (a), (b), (c))
564 #define dispatch4(n,a,b,c,d) ripper_dispatch4(parser, TOKEN_PASTE(ripper_id_, n), (a), (b), (c), (d))
565 #define dispatch5(n,a,b,c,d,e) ripper_dispatch5(parser, TOKEN_PASTE(ripper_id_, n), (a), (b), (c), (d), (e))
566 #define dispatch7(n,a,b,c,d,e,f,g) ripper_dispatch7(parser, TOKEN_PASTE(ripper_id_, n), (a), (b), (c), (d), (e), (f), (g))
568 #define yyparse ripper_yyparse
/* ripper_intern(s) interns the C string s and wraps the ID as a Symbol. */
570 #define ripper_intern(s) ID2SYM(rb_intern(s))
571 static VALUE ripper_id2sym(ID);
/* Macro of the same name as the function above.  For an id below 256 that
 * rb_ispunct() accepts it yields ID2SYM(id) directly; otherwise it calls
 * the function (the inner ripper_id2sym is not expanded again, because a
 * macro is never re-expanded inside its own expansion).  `id` is evaluated
 * up to three times.
 * NOTE(review): the listing skips a line between the prototype and this
 * macro; confirm whether the macro is conditionally compiled. */
573 #define ripper_id2sym(id) ((id) < 256 && rb_ispunct(id) ? \
574 ID2SYM(id) : ripper_id2sym(id))
/*
 * Named shortcuts for common Ripper events.  Each one expands to a
 * dispatchN() call for the event named in its body, so each also needs a
 * `parser` variable in scope.
 *
 * Qundef handling:
 *   - arg_add_optblock(l,b) and method_optarg(m,a) return their first
 *     argument unchanged when the second one is Qundef, and dispatch
 *     otherwise.
 *   - escape_Qundef(x) turns Qundef into Qnil and passes every other value
 *     through.
 * These three evaluate the tested argument twice.
 *
 * arg_add_assocs(l,b) wraps b with bare_assoc() and appends the result with
 * arg_add().
 */
577 #define arg_new() dispatch0(args_new)
578 #define arg_add(l,a) dispatch2(args_add, (l), (a))
579 #define arg_add_star(l,a) dispatch2(args_add_star, (l), (a))
580 #define arg_add_block(l,b) dispatch2(args_add_block, (l), (b))
581 #define arg_add_optblock(l,b) ((b)==Qundef? (l) : dispatch2(args_add_block, (l), (b)))
582 #define bare_assoc(v) dispatch1(bare_assoc_hash, (v))
583 #define arg_add_assocs(l,b) arg_add((l), bare_assoc(b))
585 #define args2mrhs(a) dispatch1(mrhs_new_from_args, (a))
586 #define mrhs_new() dispatch0(mrhs_new)
587 #define mrhs_add(l,a) dispatch2(mrhs_add, (l), (a))
588 #define mrhs_add_star(l,a) dispatch2(mrhs_add_star, (l), (a))
590 #define mlhs_new() dispatch0(mlhs_new)
591 #define mlhs_add(l,a) dispatch2(mlhs_add, (l), (a))
592 #define mlhs_add_star(l,a) dispatch2(mlhs_add_star, (l), (a))
594 #define params_new(pars, opts, rest, pars2, kws, kwrest, blk) \
595 dispatch7(params, (pars), (opts), (rest), (pars2), (kws), (kwrest), (blk))
597 #define blockvar_new(p,v) dispatch2(block_var, (p), (v))
598 #define blockvar_add_star(l,a) dispatch2(block_var_add_star, (l), (a))
599 #define blockvar_add_block(l,a) dispatch2(block_var_add_block, (l), (a))
601 #define method_optarg(m,a) ((a)==Qundef ? (m) : dispatch2(method_add_arg,(m),(a)))
602 #define method_arg(m,a) dispatch2(method_add_arg,(m),(a))
603 #define method_add_block(m,b) dispatch2(method_add_block, (m), (b))
605 #define escape_Qundef(x) ((x)==Qundef ? Qnil : (x))
608 new_args_gen(struct parser_params *parser, VALUE f, VALUE o, VALUE r, VALUE p, VALUE tail)
610 NODE *t = (NODE *)tail;
611 VALUE k = t->u1.value, kr = t->u2.value, b = t->u3.value;
612 return params_new(f, o, r, p, k, kr, escape_Qundef(b));
614 #define new_args(f,o,r,p,t) new_args_gen(parser, (f),(o),(r),(p),(t))
617 new_args_tail_gen(struct parser_params *parser, VALUE k, VALUE kr, VALUE b)
619 return (VALUE)rb_node_newnode(NODE_MEMO, k, kr, b);
621 #define new_args_tail(k,kr,b) new_args_tail_gen(parser, (k),(kr),(b))
629 # define ifndef_ripper(x) (x)
632 # define ifndef_ripper(x)
/*
 * Warning helpers, first variant: report through rb_compile_warn() /
 * rb_compile_warning() at the parser's current position
 * (ruby_sourcefile, ruby_sourceline).  rb_warn4S is the exception; it
 * reports at the file and line given by the caller.  rb_warnI and rb_warnS
 * have identical expansions in this variant.
 * NOTE(review): a second set of definitions for the same names follows;
 * the preprocessor conditional that selects between them is not visible in
 * this excerpt.
 */
636 # define rb_warn0(fmt) rb_compile_warn(ruby_sourcefile, ruby_sourceline, (fmt))
637 # define rb_warnI(fmt,a) rb_compile_warn(ruby_sourcefile, ruby_sourceline, (fmt), (a))
638 # define rb_warnS(fmt,a) rb_compile_warn(ruby_sourcefile, ruby_sourceline, (fmt), (a))
639 # define rb_warn4S(file,line,fmt,a) rb_compile_warn((file), (line), (fmt), (a))
640 # define rb_warning0(fmt) rb_compile_warning(ruby_sourcefile, ruby_sourceline, (fmt))
641 # define rb_warningS(fmt,a) rb_compile_warning(ruby_sourcefile, ruby_sourceline, (fmt), (a))
/*
 * Warning helpers, second variant: the same macro names routed to the
 * ripper_warn* and ripper_warning* functions declared below, each of which
 * receives `parser` instead of a file/line pair.  In this variant
 * rb_warn4S discards its `file` and `line` arguments and behaves like
 * rb_warnS.
 * NOTE(review): this set and the preceding one define the same names; the
 * conditional that separates them is not visible in this excerpt.
 */
643 # define rb_warn0(fmt) ripper_warn0(parser, (fmt))
644 # define rb_warnI(fmt,a) ripper_warnI(parser, (fmt), (a))
645 # define rb_warnS(fmt,a) ripper_warnS(parser, (fmt), (a))
646 # define rb_warn4S(file,line,fmt,a) ripper_warnS(parser, (fmt), (a))
647 # define rb_warning0(fmt) ripper_warning0(parser, (fmt))
648 # define rb_warningS(fmt,a) ripper_warningS(parser, (fmt), (a))
649 static void ripper_warn0(struct parser_params*, const char*);
650 static void ripper_warnI(struct parser_params*, const char*, int);
651 static void ripper_warnS(struct parser_params*, const char*, const char*);
652 static void ripper_warning0(struct parser_params*, const char*);
653 static void ripper_warningS(struct parser_params*, const char*, const char*);
/*
 * Error reporting.  Two alternative sets of definitions appear here for
 * rb_compile_error, compile_error and PARSER_ARG.
 * NOTE(review): the conditional that chooses between the sets is not
 * visible in this excerpt.
 *
 * PARSER_ARG expands to the leading argument(s) of the error function
 * INCLUDING the trailing comma, so a call is written
 * compile_error(PARSER_ARG "format", ...).
 *
 * First set: both names are ripper_compile_error and PARSER_ARG is
 * `parser,`.
 */
657 static void ripper_compile_error(struct parser_params*, const char *fmt, ...);
658 # define rb_compile_error ripper_compile_error
659 # define compile_error ripper_compile_error
660 # define PARSER_ARG parser,
/* Second set: both names resolve to rb_compile_error_with_enc, and
 * PARSER_ARG supplies file, line and encoding.  compile_error also expands
 * to a comma expression that increments parser->nerr before the call, so
 * it is only usable where a comma expression is valid. */
662 # define rb_compile_error rb_compile_error_with_enc
663 # define compile_error parser->nerr++,rb_compile_error_with_enc
664 # define PARSER_ARG ruby_sourcefile, ruby_sourceline, current_enc,
667 /* Older versions of Yacc set YYMAXDEPTH to a very low value by default (150,
668 for instance). This is too low for Ruby to parse some files, such as
669 date/format.rb; therefore, bump the value up to at least Bison's default. */
672 #define YYMAXDEPTH 10000
/*
 * Token bookkeeping hooks.  In the first form the macros share their names
 * with the two functions declared just above them: the one-argument macro
 * calls the two-argument function with `parser` added, but only when
 * RTEST(ruby_verbose) is true, and otherwise evaluates to (void)0.
 */
677 static void token_info_push(struct parser_params*, const char *token);
678 static void token_info_pop(struct parser_params*, const char *token);
679 #define token_info_push(token) (RTEST(ruby_verbose) ? token_info_push(parser, (token)) : (void)0)
680 #define token_info_pop(token) (RTEST(ruby_verbose) ? token_info_pop(parser, (token)) : (void)0)
/* Second form: both hooks expand to nothing.
 * NOTE(review): the conditional that selects between the two forms is not
 * visible in this excerpt. */
682 #define token_info_push(token) /* nothing */
683 #define token_info_pop(token) /* nothing */
688 %lex-param {struct parser_params *parser}
689 %parse-param {struct parser_params *parser}
696 const struct vtable *vars;
754 %token <val> tIDENTIFIER tFID tGVAR tIVAR tCONSTANT tCVAR tLABEL
755 %token <val> tINTEGER tFLOAT tSTRING_CONTENT tCHAR
756 %token <val> tNTH_REF tBACK_REF
757 %token <val> tREGEXP_END
759 %type <val> singleton strings string string1 xstring regexp
760 %type <val> string_contents xstring_contents regexp_contents string_content
761 %type <val> words symbols symbol_list qwords qsymbols word_list qword_list qsym_list word
762 %type <val> literal numeric dsym cpath
763 %type <val> top_compstmt top_stmts top_stmt
764 %type <val> bodystmt compstmt stmts stmt_or_begin stmt expr arg primary command command_call method_call
765 %type <val> expr_value arg_value primary_value fcall
766 %type <val> if_tail opt_else case_body cases opt_rescue exc_list exc_var opt_ensure
767 %type <val> args call_args opt_call_args
768 %type <val> paren_args opt_paren_args args_tail opt_args_tail block_args_tail opt_block_args_tail
769 %type <val> command_args aref_args opt_block_arg block_arg var_ref var_lhs
770 %type <val> command_asgn mrhs superclass block_call block_command
771 %type <val> f_block_optarg f_block_opt
772 %type <val> f_arglist f_args f_arg f_arg_item f_optarg f_marg f_marg_list f_margs
773 %type <val> assoc_list assocs assoc undef_list backref string_dvar for_var
774 %type <val> block_param opt_block_param block_param_def f_opt
775 %type <val> f_kwarg f_kw f_block_kwarg f_block_kw
776 %type <val> bv_decls opt_bv_decl bvar
777 %type <val> lambda f_larglist lambda_body
778 %type <val> brace_block cmd_brace_block do_block lhs none fitem
779 %type <val> mlhs mlhs_head mlhs_basic mlhs_item mlhs_node mlhs_post mlhs_inner
780 %type <val> fsym keyword_variable user_variable sym symbol operation operation2 operation3
781 %type <val> cname fname op f_rest_arg f_block_arg opt_f_block_arg f_norm_arg f_bad_arg
785 %type <val> program reswords then do dot_or_colon
787 %token END_OF_INPUT 0 "end-of-input"
788 %token tUPLUS 130 "unary+"
789 %token tUMINUS 131 "unary-"
791 %token tCMP 134 "<=>"
793 %token tEQQ 140 "==="
799 %token tMATCH 142 "=~"
800 %token tNMATCH 143 "!~"
801 %token tDOT2 128 ".."
802 %token tDOT3 129 "..."
803 %token tAREF 144 "[]"
804 %token tASET 145 "[]="
805 %token tLSHFT 135 "<<"
806 %token tRSHFT 136 ">>"
808 %token tCOLON3 ":: at EXPR_BEG"
809 %token <val> tOP_ASGN /* +=, -= etc. */
812 %token tLPAREN_ARG "( arg"
816 %token tLBRACE_ARG "{ arg"
818 %token tDSTAR "**arg"
821 %token tSYMBEG tSTRING_BEG tXSTRING_BEG tREGEXP_BEG tWORDS_BEG tQWORDS_BEG tSYMBOLS_BEG tQSYMBOLS_BEG
822 %token tSTRING_DBEG tSTRING_DEND tSTRING_DVAR tSTRING_END tLAMBEG
829 %nonassoc tLBRACE_ARG
831 %nonassoc modifier_if modifier_unless modifier_while modifier_until
832 %left keyword_or keyword_and
834 %nonassoc keyword_defined
836 %left modifier_rescue
838 %nonassoc tDOT2 tDOT3
841 %nonassoc tCMP tEQ tEQQ tNEQ tMATCH tNMATCH
842 %left '>' tGEQ '<' tLEQ
848 %right tUMINUS_NUM tUMINUS
850 %right '!' '~' tUPLUS
856 lex_state = EXPR_BEG;
858 local_push(compile_for_eval || rb_parse_in_main());
866 if ($2 && !compile_for_eval) {
867 /* last expression should not be void */
868 if (nd_type($2) != NODE_BLOCK) void_expr($2);
871 while (node->nd_next) {
872 node = node->nd_next;
874 void_expr(node->nd_head);
877 ruby_eval_tree = NEW_SCOPE(0, block_append(ruby_eval_tree, $2));
880 parser->result = dispatch1(program, $$);
886 top_compstmt : top_stmts opt_terms
890 fixup_nodes(&deferred_nodes);
902 $$ = dispatch2(stmts_add, dispatch0(stmts_new),
903 dispatch0(void_stmt));
909 $$ = newline_node($1);
911 $$ = dispatch2(stmts_add, dispatch0(stmts_new), $1);
914 | top_stmts terms top_stmt
917 $$ = block_append($1, newline_node($3));
919 $$ = dispatch2(stmts_add, $1, $3);
924 $$ = remove_begin($2);
939 ruby_eval_tree_begin = block_append(ruby_eval_tree_begin,
941 /* NEW_PREEXE($4)); */
945 $$ = dispatch1(BEGIN, $4);
958 $$ = NEW_RESCUE($1, $2, $3);
961 rb_warn0("else without rescue is useless");
962 $$ = block_append($$, $3);
966 $$ = NEW_ENSURE($$, $4);
969 $$ = block_append($4, NEW_NIL());
974 $$ = dispatch4(bodystmt,
983 compstmt : stmts opt_terms
987 fixup_nodes(&deferred_nodes);
999 $$ = dispatch2(stmts_add, dispatch0(stmts_new),
1000 dispatch0(void_stmt));
1006 $$ = newline_node($1);
1008 $$ = dispatch2(stmts_add, dispatch0(stmts_new), $1);
1011 | stmts terms stmt_or_begin
1014 $$ = block_append($1, newline_node($3));
1016 $$ = dispatch2(stmts_add, $1, $3);
1021 $$ = remove_begin($2);
1025 stmt_or_begin : stmt
1031 yyerror("BEGIN is permitted only at toplevel");
1033 /* local_push(0); */
1037 '{' top_compstmt '}'
1040 ruby_eval_tree_begin = block_append(ruby_eval_tree_begin,
1042 /* NEW_PREEXE($4)); */
1046 $$ = dispatch1(BEGIN, $4);
1050 stmt : keyword_alias fitem {lex_state = EXPR_FNAME;} fitem
1053 $$ = NEW_ALIAS($2, $4);
1055 $$ = dispatch2(alias, $2, $4);
1058 | keyword_alias tGVAR tGVAR
1061 $$ = NEW_VALIAS($2, $3);
1063 $$ = dispatch2(var_alias, $2, $3);
1066 | keyword_alias tGVAR tBACK_REF
1071 buf[1] = (char)$3->nd_nth;
1072 $$ = NEW_VALIAS($2, rb_intern2(buf, 2));
1074 $$ = dispatch2(var_alias, $2, $3);
1077 | keyword_alias tGVAR tNTH_REF
1080 yyerror("can't make alias for the number variables");
1083 $$ = dispatch2(var_alias, $2, $3);
1084 $$ = dispatch1(alias_error, $$);
1087 | keyword_undef undef_list
1092 $$ = dispatch1(undef, $2);
1095 | stmt modifier_if expr_value
1098 $$ = NEW_IF(cond($3), remove_begin($1), 0);
1101 $$ = dispatch2(if_mod, $3, $1);
1104 | stmt modifier_unless expr_value
1107 $$ = NEW_UNLESS(cond($3), remove_begin($1), 0);
1110 $$ = dispatch2(unless_mod, $3, $1);
1113 | stmt modifier_while expr_value
1116 if ($1 && nd_type($1) == NODE_BEGIN) {
1117 $$ = NEW_WHILE(cond($3), $1->nd_body, 0);
1120 $$ = NEW_WHILE(cond($3), $1, 1);
1123 $$ = dispatch2(while_mod, $3, $1);
1126 | stmt modifier_until expr_value
1129 if ($1 && nd_type($1) == NODE_BEGIN) {
1130 $$ = NEW_UNTIL(cond($3), $1->nd_body, 0);
1133 $$ = NEW_UNTIL(cond($3), $1, 1);
1136 $$ = dispatch2(until_mod, $3, $1);
1139 | stmt modifier_rescue stmt
1142 NODE *resq = NEW_RESBODY(0, remove_begin($3), 0);
1143 $$ = NEW_RESCUE(remove_begin($1), resq, 0);
1145 $$ = dispatch2(rescue_mod, $1, $3);
1148 | keyword_END '{' compstmt '}'
1150 if (in_def || in_single) {
1151 rb_warn0("END in method; use at_exit");
1154 $$ = NEW_POSTEXE(NEW_NODE(
1155 NODE_SCOPE, 0 /* tbl */, $3 /* body */, 0 /* args */));
1157 $$ = dispatch1(END, $3);
1161 | mlhs '=' command_call
1168 $$ = dispatch2(massign, $1, $3);
1171 | var_lhs tOP_ASGN command_call
1174 $$ = new_op_assign($1, $2, $3);
1176 | primary_value '[' opt_call_args rbracket tOP_ASGN command_call
1182 if (!$3) $3 = NEW_ZARRAY();
1183 args = arg_concat($3, $6);
1187 else if ($5 == tANDOP) {
1190 $$ = NEW_OP_ASGN1($1, $5, args);
1193 $$ = dispatch2(aref_field, $1, escape_Qundef($3));
1194 $$ = dispatch3(opassign, $$, $5, $6);
1197 | primary_value '.' tIDENTIFIER tOP_ASGN command_call
1200 $$ = new_attr_op_assign($1, ripper_id2sym('.'), $3, $4, $5);
1202 | primary_value '.' tCONSTANT tOP_ASGN command_call
1205 $$ = new_attr_op_assign($1, ripper_id2sym('.'), $3, $4, $5);
1207 | primary_value tCOLON2 tCONSTANT tOP_ASGN command_call
1210 $$ = NEW_COLON2($1, $3);
1211 $$ = new_const_op_assign($$, $4, $5);
1213 $$ = dispatch2(const_path_field, $1, $3);
1214 $$ = dispatch3(opassign, $$, $4, $5);
1217 | primary_value tCOLON2 tIDENTIFIER tOP_ASGN command_call
1220 $$ = new_attr_op_assign($1, ripper_intern("::"), $3, $4, $5);
1222 | backref tOP_ASGN command_call
1225 rb_backref_error($1);
1228 $$ = dispatch2(assign, dispatch1(var_field, $1), $3);
1229 $$ = dispatch1(assign_error, $$);
1236 $$ = node_assign($1, $3);
1238 $$ = dispatch2(assign, $1, $3);
1241 | mlhs '=' arg_value
1247 $$ = dispatch2(massign, $1, $3);
1256 $$ = dispatch2(massign, $1, $3);
1262 command_asgn : lhs '=' command_call
1266 $$ = node_assign($1, $3);
1268 $$ = dispatch2(assign, $1, $3);
1271 | lhs '=' command_asgn
1275 $$ = node_assign($1, $3);
1277 $$ = dispatch2(assign, $1, $3);
1284 | expr keyword_and expr
1287 $$ = logop(NODE_AND, $1, $3);
1289 $$ = dispatch3(binary, $1, ripper_intern("and"), $3);
1292 | expr keyword_or expr
1295 $$ = logop(NODE_OR, $1, $3);
1297 $$ = dispatch3(binary, $1, ripper_intern("or"), $3);
1300 | keyword_not opt_nl expr
1303 $$ = call_uni_op(cond($3), '!');
1305 $$ = dispatch2(unary, ripper_intern("not"), $3);
1311 $$ = call_uni_op(cond($2), '!');
1313 $$ = dispatch2(unary, ripper_id2sym('!'), $2);
1324 if (!$$) $$ = NEW_NIL();
1331 command_call : command
1335 block_command : block_call
1336 | block_call dot_or_colon operation2 command_args
1339 $$ = NEW_CALL($1, $3, $4);
1341 $$ = dispatch3(call, $1, $2, $3);
1342 $$ = method_arg($$, $4);
1347 cmd_brace_block : tLBRACE_ARG
1349 $<vars>1 = dyna_push();
1351 $<num>$ = ruby_sourceline;
1360 $$ = NEW_ITER($3,$4);
1361 nd_set_line($$, $<num>2);
1363 $$ = dispatch2(brace_block, escape_Qundef($3), $4);
1372 $$ = NEW_FCALL($1, 0);
1373 nd_set_line($$, tokline);
1379 command : fcall command_args %prec tLOWEST
1385 $$ = dispatch2(command, $1, $2);
1388 | fcall command_args cmd_brace_block
1391 block_dup_check($2,$3);
1397 $$ = dispatch2(command, $1, $2);
1398 $$ = method_add_block($$, $3);
1401 | primary_value '.' operation2 command_args %prec tLOWEST
1404 $$ = NEW_CALL($1, $3, $4);
1407 $$ = dispatch4(command_call, $1, ripper_id2sym('.'), $3, $4);
1410 | primary_value '.' operation2 command_args cmd_brace_block
1413 block_dup_check($4,$5);
1414 $5->nd_iter = NEW_CALL($1, $3, $4);
1418 $$ = dispatch4(command_call, $1, ripper_id2sym('.'), $3, $4);
1419 $$ = method_add_block($$, $5);
1422 | primary_value tCOLON2 operation2 command_args %prec tLOWEST
1425 $$ = NEW_CALL($1, $3, $4);
1428 $$ = dispatch4(command_call, $1, ripper_intern("::"), $3, $4);
1431 | primary_value tCOLON2 operation2 command_args cmd_brace_block
1434 block_dup_check($4,$5);
1435 $5->nd_iter = NEW_CALL($1, $3, $4);
1439 $$ = dispatch4(command_call, $1, ripper_intern("::"), $3, $4);
1440 $$ = method_add_block($$, $5);
1443 | keyword_super command_args
1449 $$ = dispatch1(super, $2);
1452 | keyword_yield command_args
1458 $$ = dispatch1(yield, $2);
1461 | keyword_return call_args
1464 $$ = NEW_RETURN(ret_args($2));
1466 $$ = dispatch1(return, $2);
1469 | keyword_break call_args
1472 $$ = NEW_BREAK(ret_args($2));
1474 $$ = dispatch1(break, $2);
1477 | keyword_next call_args
1480 $$ = NEW_NEXT(ret_args($2));
1482 $$ = dispatch1(next, $2);
1488 | tLPAREN mlhs_inner rparen
1493 $$ = dispatch1(mlhs_paren, $2);
1498 mlhs_inner : mlhs_basic
1499 | tLPAREN mlhs_inner rparen
1502 $$ = NEW_MASGN(NEW_LIST($2), 0);
1504 $$ = dispatch1(mlhs_paren, $2);
1509 mlhs_basic : mlhs_head
1512 $$ = NEW_MASGN($1, 0);
1517 | mlhs_head mlhs_item
1520 $$ = NEW_MASGN(list_append($1,$2), 0);
1522 $$ = mlhs_add($1, $2);
1525 | mlhs_head tSTAR mlhs_node
1528 $$ = NEW_MASGN($1, $3);
1530 $$ = mlhs_add_star($1, $3);
1533 | mlhs_head tSTAR mlhs_node ',' mlhs_post
1536 $$ = NEW_MASGN($1, NEW_POSTARG($3,$5));
1538 $1 = mlhs_add_star($1, $3);
1539 $$ = mlhs_add($1, $5);
1545 $$ = NEW_MASGN($1, -1);
1547 $$ = mlhs_add_star($1, Qnil);
1550 | mlhs_head tSTAR ',' mlhs_post
1553 $$ = NEW_MASGN($1, NEW_POSTARG(-1, $4));
1555 $1 = mlhs_add_star($1, Qnil);
1556 $$ = mlhs_add($1, $4);
1562 $$ = NEW_MASGN(0, $2);
1564 $$ = mlhs_add_star(mlhs_new(), $2);
1567 | tSTAR mlhs_node ',' mlhs_post
1570 $$ = NEW_MASGN(0, NEW_POSTARG($2,$4));
1572 $2 = mlhs_add_star(mlhs_new(), $2);
1573 $$ = mlhs_add($2, $4);
1579 $$ = NEW_MASGN(0, -1);
1581 $$ = mlhs_add_star(mlhs_new(), Qnil);
1584 | tSTAR ',' mlhs_post
1587 $$ = NEW_MASGN(0, NEW_POSTARG(-1, $3));
1589 $$ = mlhs_add_star(mlhs_new(), Qnil);
1590 $$ = mlhs_add($$, $3);
1595 mlhs_item : mlhs_node
1596 | tLPAREN mlhs_inner rparen
1601 $$ = dispatch1(mlhs_paren, $2);
1606 mlhs_head : mlhs_item ','
1611 $$ = mlhs_add(mlhs_new(), $1);
1614 | mlhs_head mlhs_item ','
1617 $$ = list_append($1, $2);
1619 $$ = mlhs_add($1, $2);
1624 mlhs_post : mlhs_item
1629 $$ = mlhs_add(mlhs_new(), $1);
1632 | mlhs_post ',' mlhs_item
1635 $$ = list_append($1, $3);
1637 $$ = mlhs_add($1, $3);
1642 mlhs_node : user_variable
1644 $$ = assignable($1, 0);
1648 $$ = assignable($1, 0);
1650 | primary_value '[' opt_call_args rbracket
1653 $$ = aryset($1, $3);
1655 $$ = dispatch2(aref_field, $1, escape_Qundef($3));
1658 | primary_value '.' tIDENTIFIER
1661 $$ = attrset($1, $3);
1663 $$ = dispatch3(field, $1, ripper_id2sym('.'), $3);
1666 | primary_value tCOLON2 tIDENTIFIER
1669 $$ = attrset($1, $3);
1671 $$ = dispatch2(const_path_field, $1, $3);
1674 | primary_value '.' tCONSTANT
1677 $$ = attrset($1, $3);
1679 $$ = dispatch3(field, $1, ripper_id2sym('.'), $3);
1682 | primary_value tCOLON2 tCONSTANT
1685 if (in_def || in_single)
1686 yyerror("dynamic constant assignment");
1687 $$ = NEW_CDECL(0, 0, NEW_COLON2($1, $3));
1689 if (in_def || in_single)
1690 yyerror("dynamic constant assignment");
1691 $$ = dispatch2(const_path_field, $1, $3);
1697 if (in_def || in_single)
1698 yyerror("dynamic constant assignment");
1699 $$ = NEW_CDECL(0, 0, NEW_COLON3($2));
1701 $$ = dispatch1(top_const_field, $2);
1707 rb_backref_error($1);
1710 $$ = dispatch1(var_field, $1);
1711 $$ = dispatch1(assign_error, $$);
1718 $$ = assignable($1, 0);
1720 if (!$$) $$ = NEW_BEGIN(0);
1722 $$ = dispatch1(var_field, $$);
1727 $$ = assignable($1, 0);
1729 if (!$$) $$ = NEW_BEGIN(0);
1731 $$ = dispatch1(var_field, $$);
1734 | primary_value '[' opt_call_args rbracket
1737 $$ = aryset($1, $3);
1739 $$ = dispatch2(aref_field, $1, escape_Qundef($3));
1742 | primary_value '.' tIDENTIFIER
1745 $$ = attrset($1, $3);
1747 $$ = dispatch3(field, $1, ripper_id2sym('.'), $3);
1750 | primary_value tCOLON2 tIDENTIFIER
1753 $$ = attrset($1, $3);
1755 $$ = dispatch3(field, $1, ripper_intern("::"), $3);
1758 | primary_value '.' tCONSTANT
1761 $$ = attrset($1, $3);
1763 $$ = dispatch3(field, $1, ripper_id2sym('.'), $3);
1766 | primary_value tCOLON2 tCONSTANT
1769 if (in_def || in_single)
1770 yyerror("dynamic constant assignment");
1771 $$ = NEW_CDECL(0, 0, NEW_COLON2($1, $3));
1773 $$ = dispatch2(const_path_field, $1, $3);
1774 if (in_def || in_single) {
1775 $$ = dispatch1(assign_error, $$);
1782 if (in_def || in_single)
1783 yyerror("dynamic constant assignment");
1784 $$ = NEW_CDECL(0, 0, NEW_COLON3($2));
1786 $$ = dispatch1(top_const_field, $2);
1787 if (in_def || in_single) {
1788 $$ = dispatch1(assign_error, $$);
1795 rb_backref_error($1);
1798 $$ = dispatch1(assign_error, $1);
1806 yyerror("class/module name must be CONSTANT");
1808 $$ = dispatch1(class_name_error, $1);
1814 cpath : tCOLON3 cname
1817 $$ = NEW_COLON3($2);
1819 $$ = dispatch1(top_const_ref, $2);
1825 $$ = NEW_COLON2(0, $$);
1827 $$ = dispatch1(const_ref, $1);
1830 | primary_value tCOLON2 cname
1833 $$ = NEW_COLON2($1, $3);
1835 $$ = dispatch2(const_path_ref, $1, $3);
1845 lex_state = EXPR_ENDFN;
1850 lex_state = EXPR_ENDFN;
1866 $$ = NEW_LIT(ID2SYM($1));
1868 $$ = dispatch1(symbol_literal, $1);
1879 $$ = rb_ary_new3(1, $1);
1882 | undef_list ',' {lex_state = EXPR_FNAME;} fitem
1885 $$ = block_append($1, NEW_UNDEF($4));
1887 rb_ary_push($1, $4);
1892 op : '|' { ifndef_ripper($$ = '|'); }
1893 | '^' { ifndef_ripper($$ = '^'); }
1894 | '&' { ifndef_ripper($$ = '&'); }
1895 | tCMP { ifndef_ripper($$ = tCMP); }
1896 | tEQ { ifndef_ripper($$ = tEQ); }
1897 | tEQQ { ifndef_ripper($$ = tEQQ); }
1898 | tMATCH { ifndef_ripper($$ = tMATCH); }
1899 | tNMATCH { ifndef_ripper($$ = tNMATCH); }
1900 | '>' { ifndef_ripper($$ = '>'); }
1901 | tGEQ { ifndef_ripper($$ = tGEQ); }
1902 | '<' { ifndef_ripper($$ = '<'); }
1903 | tLEQ { ifndef_ripper($$ = tLEQ); }
1904 | tNEQ { ifndef_ripper($$ = tNEQ); }
1905 | tLSHFT { ifndef_ripper($$ = tLSHFT); }
1906 | tRSHFT { ifndef_ripper($$ = tRSHFT); }
1907 | '+' { ifndef_ripper($$ = '+'); }
1908 | '-' { ifndef_ripper($$ = '-'); }
1909 | '*' { ifndef_ripper($$ = '*'); }
1910 | tSTAR { ifndef_ripper($$ = '*'); }
1911 | '/' { ifndef_ripper($$ = '/'); }
1912 | '%' { ifndef_ripper($$ = '%'); }
1913 | tPOW { ifndef_ripper($$ = tPOW); }
1914 | tDSTAR { ifndef_ripper($$ = tDSTAR); }
1915 | '!' { ifndef_ripper($$ = '!'); }
1916 | '~' { ifndef_ripper($$ = '~'); }
1917 | tUPLUS { ifndef_ripper($$ = tUPLUS); }
1918 | tUMINUS { ifndef_ripper($$ = tUMINUS); }
1919 | tAREF { ifndef_ripper($$ = tAREF); }
1920 | tASET { ifndef_ripper($$ = tASET); }
1921 | '`' { ifndef_ripper($$ = '`'); }
1924 reswords : keyword__LINE__ | keyword__FILE__ | keyword__ENCODING__
1925 | keyword_BEGIN | keyword_END
1926 | keyword_alias | keyword_and | keyword_begin
1927 | keyword_break | keyword_case | keyword_class | keyword_def
1928 | keyword_defined | keyword_do | keyword_else | keyword_elsif
1929 | keyword_end | keyword_ensure | keyword_false
1930 | keyword_for | keyword_in | keyword_module | keyword_next
1931 | keyword_nil | keyword_not | keyword_or | keyword_redo
1932 | keyword_rescue | keyword_retry | keyword_return | keyword_self
1933 | keyword_super | keyword_then | keyword_true | keyword_undef
1934 | keyword_when | keyword_yield | keyword_if | keyword_unless
1935 | keyword_while | keyword_until
1942 $$ = node_assign($1, $3);
1944 $$ = dispatch2(assign, $1, $3);
1947 | lhs '=' arg modifier_rescue arg
1951 $3 = NEW_RESCUE($3, NEW_RESBODY(0,$5,0), 0);
1952 $$ = node_assign($1, $3);
1954 $$ = dispatch2(assign, $1, dispatch2(rescue_mod, $3, $5));
1957 | var_lhs tOP_ASGN arg
1960 $$ = new_op_assign($1, $2, $3);
1962 | var_lhs tOP_ASGN arg modifier_rescue arg
1966 $3 = NEW_RESCUE($3, NEW_RESBODY(0,$5,0), 0);
1968 $3 = dispatch2(rescue_mod, $3, $5);
1970 $$ = new_op_assign($1, $2, $3);
1972 | primary_value '[' opt_call_args rbracket tOP_ASGN arg
1978 if (!$3) $3 = NEW_ZARRAY();
1979 if (nd_type($3) == NODE_BLOCK_PASS) {
1980 args = NEW_ARGSCAT($3, $6);
1983 args = arg_concat($3, $6);
1988 else if ($5 == tANDOP) {
1991 $$ = NEW_OP_ASGN1($1, $5, args);
1994 $1 = dispatch2(aref_field, $1, escape_Qundef($3));
1995 $$ = dispatch3(opassign, $1, $5, $6);
1998 | primary_value '.' tIDENTIFIER tOP_ASGN arg
2001 $$ = new_attr_op_assign($1, ripper_id2sym('.'), $3, $4, $5);
2003 | primary_value '.' tCONSTANT tOP_ASGN arg
2006 $$ = new_attr_op_assign($1, ripper_id2sym('.'), $3, $4, $5);
2008 | primary_value tCOLON2 tIDENTIFIER tOP_ASGN arg
2011 $$ = new_attr_op_assign($1, ripper_intern("::"), $3, $4, $5);
2013 | primary_value tCOLON2 tCONSTANT tOP_ASGN arg
2016 $$ = NEW_COLON2($1, $3);
2017 $$ = new_const_op_assign($$, $4, $5);
2019 $$ = dispatch2(const_path_field, $1, $3);
2020 $$ = dispatch3(opassign, $$, $4, $5);
2023 | tCOLON3 tCONSTANT tOP_ASGN arg
2026 $$ = NEW_COLON3($2);
2027 $$ = new_const_op_assign($$, $3, $4);
2029 $$ = dispatch1(top_const_field, $2);
2030 $$ = dispatch3(opassign, $$, $3, $4);
2033 | backref tOP_ASGN arg
2036 rb_backref_error($1);
2039 $$ = dispatch1(var_field, $1);
2040 $$ = dispatch3(opassign, $$, $2, $3);
2041 $$ = dispatch1(assign_error, $$);
2049 $$ = NEW_DOT2($1, $3);
2050 if (nd_type($1) == NODE_LIT && FIXNUM_P($1->nd_lit) &&
2051 nd_type($3) == NODE_LIT && FIXNUM_P($3->nd_lit)) {
2052 deferred_nodes = list_append(deferred_nodes, $$);
2055 $$ = dispatch2(dot2, $1, $3);
2063 $$ = NEW_DOT3($1, $3);
2064 if (nd_type($1) == NODE_LIT && FIXNUM_P($1->nd_lit) &&
2065 nd_type($3) == NODE_LIT && FIXNUM_P($3->nd_lit)) {
2066 deferred_nodes = list_append(deferred_nodes, $$);
2069 $$ = dispatch2(dot3, $1, $3);
2075 $$ = call_bin_op($1, '+', $3);
2077 $$ = dispatch3(binary, $1, ID2SYM('+'), $3);
2083 $$ = call_bin_op($1, '-', $3);
2085 $$ = dispatch3(binary, $1, ID2SYM('-'), $3);
2091 $$ = call_bin_op($1, '*', $3);
2093 $$ = dispatch3(binary, $1, ID2SYM('*'), $3);
2099 $$ = call_bin_op($1, '/', $3);
2101 $$ = dispatch3(binary, $1, ID2SYM('/'), $3);
2107 $$ = call_bin_op($1, '%', $3);
2109 $$ = dispatch3(binary, $1, ID2SYM('%'), $3);
2115 $$ = call_bin_op($1, tPOW, $3);
2117 $$ = dispatch3(binary, $1, ripper_intern("**"), $3);
2120 | tUMINUS_NUM tINTEGER tPOW arg
2123 $$ = NEW_CALL(call_bin_op($2, tPOW, $4), tUMINUS, 0);
2125 $$ = dispatch3(binary, $2, ripper_intern("**"), $4);
2126 $$ = dispatch2(unary, ripper_intern("-@"), $$);
2129 | tUMINUS_NUM tFLOAT tPOW arg
2132 $$ = NEW_CALL(call_bin_op($2, tPOW, $4), tUMINUS, 0);
2134 $$ = dispatch3(binary, $2, ripper_intern("**"), $4);
2135 $$ = dispatch2(unary, ripper_intern("-@"), $$);
2141 $$ = call_uni_op($2, tUPLUS);
2143 $$ = dispatch2(unary, ripper_intern("+@"), $2);
2149 $$ = call_uni_op($2, tUMINUS);
2151 $$ = dispatch2(unary, ripper_intern("-@"), $2);
2157 $$ = call_bin_op($1, '|', $3);
2159 $$ = dispatch3(binary, $1, ID2SYM('|'), $3);
2165 $$ = call_bin_op($1, '^', $3);
2167 $$ = dispatch3(binary, $1, ID2SYM('^'), $3);
2173 $$ = call_bin_op($1, '&', $3);
2175 $$ = dispatch3(binary, $1, ID2SYM('&'), $3);
2181 $$ = call_bin_op($1, tCMP, $3);
2183 $$ = dispatch3(binary, $1, ripper_intern("<=>"), $3);
2189 $$ = call_bin_op($1, '>', $3);
2191 $$ = dispatch3(binary, $1, ID2SYM('>'), $3);
2197 $$ = call_bin_op($1, tGEQ, $3);
2199 $$ = dispatch3(binary, $1, ripper_intern(">="), $3);
2205 $$ = call_bin_op($1, '<', $3);
2207 $$ = dispatch3(binary, $1, ID2SYM('<'), $3);
2213 $$ = call_bin_op($1, tLEQ, $3);
2215 $$ = dispatch3(binary, $1, ripper_intern("<="), $3);
2221 $$ = call_bin_op($1, tEQ, $3);
2223 $$ = dispatch3(binary, $1, ripper_intern("=="), $3);
2229 $$ = call_bin_op($1, tEQQ, $3);
2231 $$ = dispatch3(binary, $1, ripper_intern("==="), $3);
2237 $$ = call_bin_op($1, tNEQ, $3);
2239 $$ = dispatch3(binary, $1, ripper_intern("!="), $3);
2245 $$ = match_op($1, $3);
2246 if (nd_type($1) == NODE_LIT && RB_TYPE_P($1->nd_lit, T_REGEXP)) {
2247 $$ = reg_named_capture_assign($1->nd_lit, $$);
2250 $$ = dispatch3(binary, $1, ripper_intern("=~"), $3);
2256 $$ = call_bin_op($1, tNMATCH, $3);
2258 $$ = dispatch3(binary, $1, ripper_intern("!~"), $3);
2264 $$ = call_uni_op(cond($2), '!');
2266 $$ = dispatch2(unary, ID2SYM('!'), $2);
2272 $$ = call_uni_op($2, '~');
2274 $$ = dispatch2(unary, ID2SYM('~'), $2);
2280 $$ = call_bin_op($1, tLSHFT, $3);
2282 $$ = dispatch3(binary, $1, ripper_intern("<<"), $3);
2288 $$ = call_bin_op($1, tRSHFT, $3);
2290 $$ = dispatch3(binary, $1, ripper_intern(">>"), $3);
2296 $$ = logop(NODE_AND, $1, $3);
2298 $$ = dispatch3(binary, $1, ripper_intern("&&"), $3);
2304 $$ = logop(NODE_OR, $1, $3);
2306 $$ = dispatch3(binary, $1, ripper_intern("||"), $3);
2309 | keyword_defined opt_nl {in_defined = 1;} arg
2313 $$ = NEW_DEFINED($4);
2316 $$ = dispatch1(defined, $4);
2319 | arg '?' arg opt_nl ':' arg
2323 $$ = NEW_IF(cond($1), $3, $6);
2326 $$ = dispatch3(ifop, $1, $3, $6);
2340 if (!$$) $$ = NEW_NIL();
2352 | args ',' assocs trailer
2355 $$ = arg_append($1, NEW_HASH($3));
2357 $$ = arg_add_assocs($1, $3);
2363 $$ = NEW_LIST(NEW_HASH($1));
2365 $$ = arg_add_assocs(arg_new(), $1);
2370 paren_args : '(' opt_call_args rparen
2375 $$ = dispatch1(arg_paren, escape_Qundef($2));
2380 opt_paren_args : none
2384 opt_call_args : none
2390 | args ',' assocs ','
2393 $$ = arg_append($1, NEW_HASH($3));
2395 $$ = arg_add_assocs($1, $3);
2401 $$ = NEW_LIST(NEW_HASH($1));
2403 $$ = arg_add_assocs(arg_new(), $1);
2414 $$ = arg_add(arg_new(), $1);
2417 | args opt_block_arg
2420 $$ = arg_blk_pass($1, $2);
2422 $$ = arg_add_optblock($1, $2);
2425 | assocs opt_block_arg
2428 $$ = NEW_LIST(NEW_HASH($1));
2429 $$ = arg_blk_pass($$, $2);
2431 $$ = arg_add_assocs(arg_new(), $1);
2432 $$ = arg_add_optblock($$, $2);
2435 | args ',' assocs opt_block_arg
2438 $$ = arg_append($1, NEW_HASH($3));
2439 $$ = arg_blk_pass($$, $4);
2441 $$ = arg_add_optblock(arg_add_assocs($1, $3), $4);
2448 $$ = arg_add_block(arg_new(), $1);
2454 $<val>$ = cmdarg_stack;
2460 cmdarg_stack = $<val>1;
2465 block_arg : tAMPER arg_value
2468 $$ = NEW_BLOCK_PASS($2);
2475 opt_block_arg : ',' block_arg
2490 $$ = arg_add(arg_new(), $1);
2498 $$ = arg_add_star(arg_new(), $2);
2501 | args ',' arg_value
2505 if ((n1 = splat_array($1)) != 0) {
2506 $$ = list_append(n1, $3);
2509 $$ = arg_append($1, $3);
2512 $$ = arg_add($1, $3);
2515 | args ',' tSTAR arg_value
2519 if ((nd_type($4) == NODE_ARRAY) && (n1 = splat_array($1)) != 0) {
2520 $$ = list_concat(n1, $4);
2523 $$ = arg_concat($1, $4);
2526 $$ = arg_add_star($1, $4);
2531 mrhs : args ',' arg_value
2535 if ((n1 = splat_array($1)) != 0) {
2536 $$ = list_append(n1, $3);
2539 $$ = arg_append($1, $3);
2542 $$ = mrhs_add(args2mrhs($1), $3);
2545 | args ',' tSTAR arg_value
2549 if (nd_type($4) == NODE_ARRAY &&
2550 (n1 = splat_array($1)) != 0) {
2551 $$ = list_concat(n1, $4);
2554 $$ = arg_concat($1, $4);
2557 $$ = mrhs_add_star(args2mrhs($1), $4);
2565 $$ = mrhs_add_star(mrhs_new(), $2);
2583 $$ = NEW_FCALL($1, 0);
2585 $$ = method_arg(dispatch1(fcall, $1), arg_new());
2590 $<val>1 = cmdarg_stack;
2593 $<num>$ = ruby_sourceline;
2600 cmdarg_stack = $<val>1;
2606 if (nd_type($3) == NODE_RESCUE ||
2607 nd_type($3) == NODE_ENSURE)
2608 nd_set_line($3, $<num>2);
2611 nd_set_line($$, $<num>2);
2613 $$ = dispatch1(begin, $3);
2616 | tLPAREN_ARG {lex_state = EXPR_ENDARG;} rparen
2621 $$ = dispatch1(paren, 0);
2626 $<val>1 = cmdarg_stack;
2629 expr {lex_state = EXPR_ENDARG;} rparen
2631 cmdarg_stack = $<val>1;
2635 $$ = dispatch1(paren, $3);
2638 | tLPAREN compstmt ')'
2643 $$ = dispatch1(paren, $2);
2646 | primary_value tCOLON2 tCONSTANT
2649 $$ = NEW_COLON2($1, $3);
2651 $$ = dispatch2(const_path_ref, $1, $3);
2657 $$ = NEW_COLON3($2);
2659 $$ = dispatch1(top_const_ref, $2);
2662 | tLBRACK aref_args ']'
2666 $$ = NEW_ZARRAY(); /* zero length array*/
2672 $$ = dispatch1(array, escape_Qundef($2));
2675 | tLBRACE assoc_list '}'
2680 $$ = dispatch1(hash, escape_Qundef($2));
2688 $$ = dispatch0(return0);
2691 | keyword_yield '(' call_args rparen
2696 $$ = dispatch1(yield, dispatch1(paren, $3));
2699 | keyword_yield '(' rparen
2704 $$ = dispatch1(yield, dispatch1(paren, arg_new()));
2712 $$ = dispatch0(yield0);
2715 | keyword_defined opt_nl '(' {in_defined = 1;} expr rparen
2719 $$ = NEW_DEFINED($5);
2722 $$ = dispatch1(defined, $5);
2725 | keyword_not '(' expr rparen
2728 $$ = call_uni_op(cond($3), '!');
2730 $$ = dispatch2(unary, ripper_intern("not"), $3);
2733 | keyword_not '(' rparen
2736 $$ = call_uni_op(cond(NEW_NIL()), '!');
2738 $$ = dispatch2(unary, ripper_intern("not"), Qnil);
2747 $$ = method_arg(dispatch1(fcall, $1), arg_new());
2748 $$ = method_add_block($$, $2);
2752 | method_call brace_block
2755 block_dup_check($1->nd_args, $2);
2759 $$ = method_add_block($1, $2);
2766 | k_if expr_value then
2772 $$ = NEW_IF(cond($2), $4, $5);
2775 $$ = dispatch3(if, $2, $4, escape_Qundef($5));
2778 | k_unless expr_value then
2784 $$ = NEW_UNLESS(cond($2), $4, $5);
2787 $$ = dispatch3(unless, $2, $4, escape_Qundef($5));
2790 | k_while {COND_PUSH(1);} expr_value do {COND_POP();}
2795 $$ = NEW_WHILE(cond($3), $6, 1);
2798 $$ = dispatch2(while, $3, $6);
2801 | k_until {COND_PUSH(1);} expr_value do {COND_POP();}
2806 $$ = NEW_UNTIL(cond($3), $6, 1);
2809 $$ = dispatch2(until, $3, $6);
2812 | k_case expr_value opt_terms
2817 $$ = NEW_CASE($2, $4);
2820 $$ = dispatch2(case, $2, $4);
2823 | k_case opt_terms case_body k_end
2826 $$ = NEW_CASE(0, $3);
2828 $$ = dispatch2(case, Qnil, $3);
2831 | k_for for_var keyword_in
2842 * e.each{|*x| a, b, c = x
2846 * e.each{|x| a, = x}
2848 ID id = internal_id();
2849 ID *tbl = ALLOC_N(ID, 2);
2850 NODE *m = NEW_ARGS_AUX(0, 0);
2853 if (nd_type($2) == NODE_MASGN) {
2854 /* if args.length == 1 && args[0].kind_of?(Array)
2858 NODE *one = NEW_LIST(NEW_LIT(INT2FIX(1)));
2859 NODE *zero = NEW_LIST(NEW_LIT(INT2FIX(0)));
2860 m->nd_next = block_append(
2863 NEW_CALL(NEW_CALL(NEW_DVAR(id), idLength, 0),
2865 NEW_CALL(NEW_CALL(NEW_DVAR(id), idAREF, zero),
2866 rb_intern("kind_of?"), NEW_LIST(NEW_LIT(rb_cArray))),
2869 NEW_CALL(NEW_DVAR(id), idAREF, zero)),
2871 node_assign($2, NEW_DVAR(id)));
2873 args = new_args(m, 0, id, 0, new_args_tail(0, 0, 0));
2876 if (nd_type($2) == NODE_LASGN ||
2877 nd_type($2) == NODE_DASGN ||
2878 nd_type($2) == NODE_DASGN_CURR) {
2879 $2->nd_value = NEW_DVAR(id);
2882 args = new_args(m, 0, 0, 0, new_args_tail(0, 0, 0));
2885 m->nd_next = node_assign(NEW_MASGN(NEW_LIST($2), 0), NEW_DVAR(id));
2886 args = new_args(m, 0, id, 0, new_args_tail(0, 0, 0));
2889 scope = NEW_NODE(NODE_SCOPE, tbl, $8, args);
2890 tbl[0] = 1; tbl[1] = id;
2891 $$ = NEW_FOR(0, $5, scope);
2894 $$ = dispatch3(for, $2, $5, $8);
2897 | k_class cpath superclass
2899 if (in_def || in_single)
2900 yyerror("class definition in method body");
2903 $<num>$ = ruby_sourceline;
2911 $$ = NEW_CLASS($2, $5, $3);
2912 nd_set_line($$, $<num>4);
2914 $$ = dispatch3(class, $2, $3, $5);
2918 | k_class tLSHFT expr
2925 $<num>$ = in_single;
2933 $$ = NEW_SCLASS($3, $7);
2936 $$ = dispatch2(sclass, $3, $7);
2940 in_single = $<num>6;
2944 if (in_def || in_single)
2945 yyerror("module definition in method body");
2948 $<num>$ = ruby_sourceline;
2956 $$ = NEW_MODULE($2, $4);
2957 nd_set_line($$, $<num>3);
2959 $$ = dispatch2(module, $2, $4);
2975 NODE *body = remove_begin($5);
2976 reduce_nodes(&body);
2977 $$ = NEW_DEFN($2, $4, body, NOEX_PRIVATE);
2978 nd_set_line($$, $<num>1);
2980 $$ = dispatch3(def, $2, $4, $5);
2986 | k_def singleton dot_or_colon {lex_state = EXPR_FNAME;} fname
2989 lex_state = EXPR_ENDFN; /* force for args */
2997 NODE *body = remove_begin($8);
2998 reduce_nodes(&body);
2999 $$ = NEW_DEFS($2, $5, $7, body);
3000 nd_set_line($$, $<num>1);
3002 $$ = dispatch5(defs, $2, $3, $5, $7, $8);
3012 $$ = dispatch1(break, arg_new());
3020 $$ = dispatch1(next, arg_new());
3028 $$ = dispatch0(redo);
3036 $$ = dispatch0(retry);
3041 primary_value : primary
3046 if (!$$) $$ = NEW_NIL();
3053 k_begin : keyword_begin
3055 token_info_push("begin");
3061 token_info_push("if");
3065 k_unless : keyword_unless
3067 token_info_push("unless");
3071 k_while : keyword_while
3073 token_info_push("while");
3077 k_until : keyword_until
3079 token_info_push("until");
3083 k_case : keyword_case
3085 token_info_push("case");
3091 token_info_push("for");
3095 k_class : keyword_class
3097 token_info_push("class");
3101 k_module : keyword_module
3103 token_info_push("module");
3109 token_info_push("def");
3111 $<num>$ = ruby_sourceline;
3119 token_info_pop("end");
3145 | keyword_elsif expr_value then
3150 $$ = NEW_IF(cond($2), $4, $5);
3153 $$ = dispatch3(elsif, $2, $4, escape_Qundef($5));
3159 | keyword_else compstmt
3164 $$ = dispatch1(else, $2);
3175 $$ = assignable($1, 0);
3178 $$ = dispatch1(mlhs_paren, $$);
3181 | tLPAREN f_margs rparen
3186 $$ = dispatch1(mlhs_paren, $2);
3191 f_marg_list : f_marg
3196 $$ = mlhs_add(mlhs_new(), $1);
3199 | f_marg_list ',' f_marg
3202 $$ = list_append($1, $3);
3204 $$ = mlhs_add($1, $3);
3209 f_margs : f_marg_list
3212 $$ = NEW_MASGN($1, 0);
3217 | f_marg_list ',' tSTAR f_norm_arg
3219 $$ = assignable($4, 0);
3221 $$ = NEW_MASGN($1, $$);
3223 $$ = mlhs_add_star($1, $$);
3226 | f_marg_list ',' tSTAR f_norm_arg ',' f_marg_list
3228 $$ = assignable($4, 0);
3230 $$ = NEW_MASGN($1, NEW_POSTARG($$, $6));
3232 $$ = mlhs_add_star($1, $$);
3235 | f_marg_list ',' tSTAR
3238 $$ = NEW_MASGN($1, -1);
3240 $$ = mlhs_add_star($1, Qnil);
3243 | f_marg_list ',' tSTAR ',' f_marg_list
3246 $$ = NEW_MASGN($1, NEW_POSTARG(-1, $5));
3248 $$ = mlhs_add_star($1, $5);
3253 $$ = assignable($2, 0);
3255 $$ = NEW_MASGN(0, $$);
3257 $$ = mlhs_add_star(mlhs_new(), $$);
3260 | tSTAR f_norm_arg ',' f_marg_list
3262 $$ = assignable($2, 0);
3264 $$ = NEW_MASGN(0, NEW_POSTARG($$, $4));
3269 $$ = mlhs_add_star($$, $4);
3275 $$ = NEW_MASGN(0, -1);
3277 $$ = mlhs_add_star(mlhs_new(), Qnil);
3280 | tSTAR ',' f_marg_list
3283 $$ = NEW_MASGN(0, NEW_POSTARG(-1, $3));
3285 $$ = mlhs_add_star(mlhs_new(), Qnil);
3291 block_args_tail : f_block_kwarg ',' f_kwrest opt_f_block_arg
3293 $$ = new_args_tail($1, $3, $4);
3295 | f_block_kwarg opt_f_block_arg
3297 $$ = new_args_tail($1, Qnone, $2);
3299 | f_kwrest opt_f_block_arg
3301 $$ = new_args_tail(Qnone, $1, $2);
3305 $$ = new_args_tail(Qnone, Qnone, $1);
3309 opt_block_args_tail : ',' block_args_tail
3315 $$ = new_args_tail(Qnone, Qnone, Qnone);
3319 block_param : f_arg ',' f_block_optarg ',' f_rest_arg opt_block_args_tail
3321 $$ = new_args($1, $3, $5, Qnone, $6);
3323 | f_arg ',' f_block_optarg ',' f_rest_arg ',' f_arg opt_block_args_tail
3325 $$ = new_args($1, $3, $5, $7, $8);
3327 | f_arg ',' f_block_optarg opt_block_args_tail
3329 $$ = new_args($1, $3, Qnone, Qnone, $4);
3331 | f_arg ',' f_block_optarg ',' f_arg opt_block_args_tail
3333 $$ = new_args($1, $3, Qnone, $5, $6);
3335 | f_arg ',' f_rest_arg opt_block_args_tail
3337 $$ = new_args($1, Qnone, $3, Qnone, $4);
3341 $$ = new_args($1, Qnone, 1, Qnone, new_args_tail(Qnone, Qnone, Qnone));
3344 dispatch1(excessed_comma, $$);
3347 | f_arg ',' f_rest_arg ',' f_arg opt_block_args_tail
3349 $$ = new_args($1, Qnone, $3, $5, $6);
3351 | f_arg opt_block_args_tail
3353 $$ = new_args($1, Qnone, Qnone, Qnone, $2);
3355 | f_block_optarg ',' f_rest_arg opt_block_args_tail
3357 $$ = new_args(Qnone, $1, $3, Qnone, $4);
3359 | f_block_optarg ',' f_rest_arg ',' f_arg opt_block_args_tail
3361 $$ = new_args(Qnone, $1, $3, $5, $6);
3363 | f_block_optarg opt_block_args_tail
3365 $$ = new_args(Qnone, $1, Qnone, Qnone, $2);
3367 | f_block_optarg ',' f_arg opt_block_args_tail
3369 $$ = new_args(Qnone, $1, Qnone, $3, $4);
3371 | f_rest_arg opt_block_args_tail
3373 $$ = new_args(Qnone, Qnone, $1, Qnone, $2);
3375 | f_rest_arg ',' f_arg opt_block_args_tail
3377 $$ = new_args(Qnone, Qnone, $1, $3, $4);
3381 $$ = new_args(Qnone, Qnone, Qnone, Qnone, $1);
3385 opt_block_param : none
3388 command_start = TRUE;
3392 block_param_def : '|' opt_bv_decl '|'
3397 $$ = blockvar_new(params_new(Qnil,Qnil,Qnil,Qnil,Qnil,Qnil,Qnil),
3406 $$ = blockvar_new(params_new(Qnil,Qnil,Qnil,Qnil,Qnil,Qnil,Qnil),
3410 | '|' block_param opt_bv_decl '|'
3415 $$ = blockvar_new(escape_Qundef($2), escape_Qundef($3));
3421 opt_bv_decl : opt_nl
3425 | opt_nl ';' bv_decls opt_nl
3439 $$ = rb_ary_new3(1, $1);
3446 rb_ary_push($1, $3);
3466 $<vars>$ = dyna_push();
3470 lpar_beg = ++paren_nest;
3474 $<num>$ = ruby_sourceline;
3480 $$ = NEW_LAMBDA($3, $5);
3481 nd_set_line($$, $<num>4);
3483 $$ = dispatch2(lambda, $3, $5);
3489 f_larglist : '(' f_args opt_bv_decl ')'
3494 $$ = dispatch1(paren, $2);
3507 lambda_body : tLAMBEG compstmt '}'
3511 | keyword_do_LAMBDA compstmt keyword_end
3517 do_block : keyword_do_block
3519 $<vars>1 = dyna_push();
3521 $<num>$ = ruby_sourceline;
3529 $$ = NEW_ITER($3,$4);
3530 nd_set_line($$, $<num>2);
3532 $$ = dispatch2(do_block, escape_Qundef($3), $4);
3538 block_call : command do_block
3541 if (nd_type($1) == NODE_YIELD) {
3542 compile_error(PARSER_ARG "block given to yield");
3545 block_dup_check($1->nd_args, $2);
3551 $$ = method_add_block($1, $2);
3554 | block_call dot_or_colon operation2 opt_paren_args
3557 $$ = NEW_CALL($1, $3, $4);
3559 $$ = dispatch3(call, $1, $2, $3);
3560 $$ = method_optarg($$, $4);
3563 | block_call dot_or_colon operation2 opt_paren_args brace_block
3566 block_dup_check($4, $5);
3567 $5->nd_iter = NEW_CALL($1, $3, $4);
3571 $$ = dispatch4(command_call, $1, $2, $3, $4);
3572 $$ = method_add_block($$, $5);
3575 | block_call dot_or_colon operation2 command_args do_block
3578 block_dup_check($4, $5);
3579 $5->nd_iter = NEW_CALL($1, $3, $4);
3583 $$ = dispatch4(command_call, $1, $2, $3, $4);
3584 $$ = method_add_block($$, $5);
3589 method_call : fcall paren_args
3595 $$ = method_arg(dispatch1(fcall, $1), $2);
3598 | primary_value '.' operation2
3601 $<num>$ = ruby_sourceline;
3607 $$ = NEW_CALL($1, $3, $5);
3608 nd_set_line($$, $<num>4);
3610 $$ = dispatch3(call, $1, ripper_id2sym('.'), $3);
3611 $$ = method_optarg($$, $5);
3614 | primary_value tCOLON2 operation2 /* method call whose receiver and name are joined by tCOLON2 ("::") */
3617 $<num>$ = ruby_sourceline; /* remember the line where the call starts */
3623 $$ = NEW_CALL($1, $3, $5);
3624 nd_set_line($$, $<num>4); /* stamp the node with the line saved by the mid-rule action */
3626 $$ = dispatch3(call, $1, ripper_intern("::"), $3); /* pass the "::" separator this rule matches, as the other tCOLON2 alternatives do, not '.' */
3627 $$ = method_optarg($$, $5);
3630 | primary_value tCOLON2 operation3
3633 $$ = NEW_CALL($1, $3, 0);
3635 $$ = dispatch3(call, $1, ripper_intern("::"), $3);
3641 $<num>$ = ruby_sourceline;
3647 $$ = NEW_CALL($1, rb_intern("call"), $4);
3648 nd_set_line($$, $<num>3);
3650 $$ = dispatch3(call, $1, ripper_id2sym('.'),
3651 ripper_intern("call"));
3652 $$ = method_optarg($$, $4);
3655 | primary_value tCOLON2
3658 $<num>$ = ruby_sourceline;
3664 $$ = NEW_CALL($1, rb_intern("call"), $4);
3665 nd_set_line($$, $<num>3);
3667 $$ = dispatch3(call, $1, ripper_intern("::"),
3668 ripper_intern("call"));
3669 $$ = method_optarg($$, $4);
3672 | keyword_super paren_args
3677 $$ = dispatch1(super, $2);
3685 $$ = dispatch0(zsuper);
3688 | primary_value '[' opt_call_args rbracket
3691 if ($1 && nd_type($1) == NODE_SELF)
3692 $$ = NEW_FCALL(tAREF, $3);
3694 $$ = NEW_CALL($1, tAREF, $3);
3697 $$ = dispatch2(aref, $1, escape_Qundef($3));
3704 $<vars>1 = dyna_push();
3706 $<num>$ = ruby_sourceline;
3714 $$ = NEW_ITER($3,$4);
3715 nd_set_line($$, $<num>2);
3717 $$ = dispatch2(brace_block, escape_Qundef($3), $4);
3723 $<vars>1 = dyna_push();
3725 $<num>$ = ruby_sourceline;
3730 compstmt keyword_end
3733 $$ = NEW_ITER($3,$4);
3734 nd_set_line($$, $<num>2);
3736 $$ = dispatch2(do_block, escape_Qundef($3), $4);
3742 case_body : keyword_when args then
3747 $$ = NEW_WHEN($2, $4, $5);
3749 $$ = dispatch3(when, $2, $4, escape_Qundef($5));
3758 opt_rescue : keyword_rescue exc_list exc_var then
3764 $3 = node_assign($3, NEW_ERRINFO());
3765 $5 = block_append($3, $5);
3767 $$ = NEW_RESBODY($2, $5, $6);
3768 fixpos($$, $2?$2:$5);
3770 $$ = dispatch4(rescue,
3780 exc_list : arg_value
3785 $$ = rb_ary_new3(1, $1);
3791 if (!($$ = splat_array($1))) $$ = $1;
3799 exc_var : tASSOC lhs
3806 opt_ensure : keyword_ensure compstmt
3811 $$ = dispatch1(ensure, $2);
3821 $$ = NEW_LIT(ID2SYM($1));
3823 $$ = dispatch1(symbol_literal, $1);
3834 node = NEW_STR(STR_NEW0());
3837 node = evstr2dstr(node);
3851 $$ = literal_concat($1, $2);
3853 $$ = dispatch2(string_concat, $1, $2);
3858 string1 : tSTRING_BEG string_contents tSTRING_END
3863 $$ = dispatch1(string_literal, $2);
3868 xstring : tXSTRING_BEG xstring_contents tSTRING_END
3873 node = NEW_XSTR(STR_NEW0());
3876 switch (nd_type(node)) {
3878 nd_set_type(node, NODE_XSTR);
3881 nd_set_type(node, NODE_DXSTR);
3884 node = NEW_NODE(NODE_DXSTR, Qnil, 1, NEW_LIST(node));
3890 $$ = dispatch1(xstring_literal, $2);
3895 regexp : tREGEXP_BEG regexp_contents tREGEXP_END
3902 node = NEW_LIT(reg_compile(STR_NEW0(), options));
3904 else switch (nd_type(node)) {
3907 VALUE src = node->nd_lit;
3908 nd_set_type(node, NODE_LIT);
3909 node->nd_lit = reg_compile(src, options);
3913 node = NEW_NODE(NODE_DSTR, STR_NEW0(), 1, NEW_LIST(node));
3915 if (options & RE_OPTION_ONCE) {
3916 nd_set_type(node, NODE_DREGX_ONCE);
3919 nd_set_type(node, NODE_DREGX);
3921 node->nd_cflag = options & RE_OPTION_MASK;
3922 if (!NIL_P(node->nd_lit)) reg_fragment_check(node->nd_lit, options);
3923 for (list = (prev = node)->nd_next; list; list = list->nd_next) {
3924 if (nd_type(list->nd_head) == NODE_STR) {
3925 VALUE tail = list->nd_head->nd_lit;
3926 if (reg_fragment_check(tail, options) && prev && !NIL_P(prev->nd_lit)) {
3927 VALUE lit = prev == node ? prev->nd_lit : prev->nd_head->nd_lit;
3928 if (!literal_concat0(parser, lit, tail)) {
3932 rb_str_resize(tail, 0);
3933 prev->nd_next = list->nd_next;
3934 rb_gc_force_recycle((VALUE)list->nd_head);
3935 rb_gc_force_recycle((VALUE)list);
3946 if (!node->nd_next) {
3947 VALUE src = node->nd_lit;
3948 nd_set_type(node, NODE_LIT);
3949 node->nd_lit = reg_compile(src, options);
3955 $$ = dispatch2(regexp_literal, $2, $3);
3960 words : tWORDS_BEG ' ' tSTRING_END
3965 $$ = dispatch0(words_new);
3966 $$ = dispatch1(array, $$);
3969 | tWORDS_BEG word_list tSTRING_END
3974 $$ = dispatch1(array, $2);
/* word_list: left-recursive list of words, each followed by a ' ' token. */
3979 word_list : /* none */
3984 $$ = dispatch0(words_new);
3987 | word_list word ' '
/* Node-building form: the word is passed through evstr2dstr() and appended
 * to the list. */
3990 $$ = list_append($1, evstr2dstr($2));
/* Event-dispatch form of the same step. */
3992 $$ = dispatch2(words_add, $1, $2);
/* word: one or more adjacent string_content pieces forming a single word. */
3997 word : string_content
/* Event-dispatch form: start a new word and add the first piece to it. */
4001 $$ = dispatch0(word_new);
4002 $$ = dispatch2(word_add, $$, $1);
4005 | word string_content
/* Node-building form: concatenate the new piece onto the word so far. */
4008 $$ = literal_concat($1, $2);
/* Event-dispatch form of the same step. */
4010 $$ = dispatch2(word_add, $1, $2);
/* symbols: a symbol-list literal opened by tSYMBOLS_BEG. */
/* First alternative: nothing but a separator between the delimiters. */
4015 symbols : tSYMBOLS_BEG ' ' tSTRING_END
/* Event-dispatch form: create an empty symbol list and wrap it as an array. */
4020 $$ = dispatch0(symbols_new);
4021 $$ = dispatch1(array, $$);
/* Second alternative: a populated symbol_list. */
4024 | tSYMBOLS_BEG symbol_list tSTRING_END
4029 $$ = dispatch1(array, $2);
/* symbol_list: left-recursive list of words, each converted to a symbol. */
4034 symbol_list : /* none */
4039 $$ = dispatch0(symbols_new);
4042 | symbol_list word ' '
/* Node-building form: normalise the word with evstr2dstr(), then retag it.
 * A DSTR becomes a DSYM; the other branch (its `else` is not visible)
 * interns the string and turns the node into a literal. */
4045 $2 = evstr2dstr($2);
4046 if (nd_type($2) == NODE_DSTR) {
4047 nd_set_type($2, NODE_DSYM);
4050 nd_set_type($2, NODE_LIT);
4051 $2->nd_lit = rb_str_intern($2->nd_lit);
4053 $$ = list_append($1, $2);
/* Event-dispatch form of the same step. */
4055 $$ = dispatch2(symbols_add, $1, $2);
/* qwords: a word-list literal opened by tQWORDS_BEG; either empty apart
 * from a separator, or a qword_list. */
4060 qwords : tQWORDS_BEG ' ' tSTRING_END
/* Event-dispatch form: empty list wrapped as an array. */
4065 $$ = dispatch0(qwords_new);
4066 $$ = dispatch1(array, $$);
4069 | tQWORDS_BEG qword_list tSTRING_END
4074 $$ = dispatch1(array, $2);
/* qsymbols: same shape as qwords, opened by tQSYMBOLS_BEG and built from a
 * qsym_list. */
4079 qsymbols : tQSYMBOLS_BEG ' ' tSTRING_END
4084 $$ = dispatch0(qsymbols_new);
4085 $$ = dispatch1(array, $$);
4088 | tQSYMBOLS_BEG qsym_list tSTRING_END
4093 $$ = dispatch1(array, $2);
/* qword_list: left-recursive list of tSTRING_CONTENT tokens, each followed
 * by a ' ' token. */
4098 qword_list : /* none */
4103 $$ = dispatch0(qwords_new);
4106 | qword_list tSTRING_CONTENT ' '
/* Node-building form: append the content node unchanged. */
4109 $$ = list_append($1, $2);
/* Event-dispatch form of the same step. */
4111 $$ = dispatch2(qwords_add, $1, $2);
/* qsym_list: like qword_list, but each element becomes a symbol literal. */
4116 qsym_list : /* none */
4121 $$ = dispatch0(qsymbols_new);
4124 | qsym_list tSTRING_CONTENT ' '
/* Node-building form: replace the node's value with the interned symbol for
 * `lit` (its declaration is not visible; presumably the node's original
 * string), retag the node as a literal, and append it. */
4129 $2->nd_lit = ID2SYM(rb_intern_str(lit));
4130 nd_set_type($2, NODE_LIT);
4131 $$ = list_append($1, $2);
/* Event-dispatch form of the same step. */
4133 $$ = dispatch2(qsymbols_add, $1, $2);
/* string_contents: zero or more string_content pieces, concatenated from
 * left to right. */
4138 string_contents : /* none */
4143 $$ = dispatch0(string_content);
4146 | string_contents string_content
/* Node-building form. */
4149 $$ = literal_concat($1, $2);
/* Event-dispatch form. */
4151 $$ = dispatch2(string_add, $1, $2);
/* xstring_contents: same structure as string_contents, with xstring_new /
 * xstring_add as the dispatched events. */
4156 xstring_contents: /* none */
4161 $$ = dispatch0(xstring_new);
4164 | xstring_contents string_content
4167 $$ = literal_concat($1, $2);
4169 $$ = dispatch2(xstring_add, $1, $2);
/* regexp_contents: zero or more string_content pieces.  Unlike
 * string_contents, the node-building form appends with list_append() rather
 * than literal_concat(). */
4174 regexp_contents: /* none */
4179 $$ = dispatch0(regexp_new);
4182 | regexp_contents string_content
4185 NODE *head = $1, *tail = $2;
/* Make sure `head` can take list elements before appending; the case labels
 * are not visible in this excerpt.  One branch retags head as a DSTR, the
 * other wraps it inside a fresh DSTR. */
4193 switch (nd_type(head)) {
4195 nd_set_type(head, NODE_DSTR);
4200 head = list_append(NEW_DSTR(Qnil), head);
4203 $$ = list_append(head, tail);
/* Event-dispatch form of the same step. */
4206 $$ = dispatch2(regexp_add, $1, $2);
/* string_content: one piece of a string body -- plain content, or an
 * interpolation.  The leading tokens of the interpolation alternatives are
 * not visible in this excerpt. */
4211 string_content : tSTRING_CONTENT
/* Mid-rule action: stash the current lex_strterm as this action's value and
 * switch the lexer to EXPR_BEG. */
4214 $<node>$ = lex_strterm;
4216 lex_state = EXPR_BEG;
/* After the interpolated part, restore lex_strterm from value slot 2. */
4221 lex_strterm = $<node>2;
4224 lex_strterm = $<node>2;
4225 $$ = dispatch1(string_dvar, $3);
/* Embedded-code alternative: successive actions save cond_stack,
 * cmdarg_stack, lex_strterm and brace_nest in value slots 1 to 4.  Resets
 * of these variables between the saves are not visible here. */
4230 $<val>1 = cond_stack;
4231 $<val>$ = cmdarg_stack;
4236 $<node>$ = lex_strterm;
4238 lex_state = EXPR_BEG;
4241 $<num>$ = brace_nest;
4244 compstmt tSTRING_DEND
/* Final action: restore the four saved values. */
4246 cond_stack = $<val>1;
4247 cmdarg_stack = $<val>2;
4248 lex_strterm = $<node>3;
4249 brace_nest = $<num>4;
/* Clear the NEWLINE flag on the embedded statement node, if there is one. */
4251 if ($5) $5->flags &= ~NODE_FL_NEWLINE;
/* Event-dispatch form of the action. */
4254 $$ = dispatch1(string_embexpr, $5);
4264 $$ = dispatch1(var_ref, $1);
4272 $$ = dispatch1(var_ref, $1);
4280 $$ = dispatch1(var_ref, $1);
/* symbol: tSYMBEG followed by a `sym`; the lexer is left in EXPR_END. */
4286 symbol : tSYMBEG sym
4288 lex_state = EXPR_END;
/* Event-dispatch form of the action. */
4292 $$ = dispatch1(symbol, $2);
/* dsym: tSYMBEG followed by string-style contents up to tSTRING_END; the
 * lexer is left in EXPR_END. */
4303 dsym : tSYMBEG xstring_contents tSTRING_END
4305 lex_state = EXPR_END;
/* Event-dispatch form of the action. */
4309 $$ = dispatch1(dyna_symbol, $2);
4316 | tUMINUS_NUM tINTEGER %prec tLOWEST
4319 $$ = negate_lit($2);
4321 $$ = dispatch2(unary, ripper_intern("-@"), $2);
4324 | tUMINUS_NUM tFLOAT %prec tLOWEST
4327 $$ = negate_lit($2);
4329 $$ = dispatch2(unary, ripper_intern("-@"), $2);
4334 user_variable : tIDENTIFIER
/* keyword_variable: the keyword pseudo-variables.  Each action assigns the
 * keyword's own token value to $$ through ifndef_ripper(), whose definition
 * is not visible in this excerpt. */
4341 keyword_variable: keyword_nil {ifndef_ripper($$ = keyword_nil);}
4342 | keyword_self {ifndef_ripper($$ = keyword_self);}
4343 | keyword_true {ifndef_ripper($$ = keyword_true);}
4344 | keyword_false {ifndef_ripper($$ = keyword_false);}
4345 | keyword__FILE__ {ifndef_ripper($$ = keyword__FILE__);}
4346 | keyword__LINE__ {ifndef_ripper($$ = keyword__LINE__);}
4347 | keyword__ENCODING__ {ifndef_ripper($$ = keyword__ENCODING__);}
/* var_ref: a variable used as a value. */
4350 var_ref : user_variable
/* Node-building form: when gettable() yields nothing, substitute an empty
 * BEGIN node so $$ is never null. */
4353 if (!($$ = gettable($1))) $$ = NEW_BEGIN(0);
/* Event-dispatch form: identifiers that id_is_var() accepts are reported as
 * var_ref, the others as vcall. */
4355 if (id_is_var(get_id($1))) {
4356 $$ = dispatch1(var_ref, $1);
4359 $$ = dispatch1(vcall, $1);
/* Second alternative (its header is not visible; presumably
 * keyword_variable): same fallback, always reported as var_ref. */
4366 if (!($$ = gettable($1))) $$ = NEW_BEGIN(0);
4368 $$ = dispatch1(var_ref, $1);
/* var_lhs: a variable used as an assignment target. */
4373 var_lhs : user_variable
/* Node-building form: build the assignment node with no value attached. */
4375 $$ = assignable($1, 0);
/* Event-dispatch form of the action. */
4378 $$ = dispatch1(var_field, $$);
/* Second alternative (header not visible): identical handling. */
4383 $$ = assignable($1, 0);
4386 $$ = dispatch1(var_field, $$);
4405 lex_state = EXPR_BEG;
4406 command_start = TRUE;
/* f_arglist: a formal argument list.  The visible alternative is the
 * parenthesised form; a second alternative's header is not visible.  Both
 * leave the lexer in EXPR_BEG with command_start set. */
4424 f_arglist : '(' f_args rparen
/* Event-dispatch form of the action. */
4429 $$ = dispatch1(paren, $2);
4431 lex_state = EXPR_BEG;
4432 command_start = TRUE;
4437 lex_state = EXPR_BEG;
4438 command_start = TRUE;
/* args_tail: the trailing part of a parameter list.  Each alternative calls
 * new_args_tail(kwargs, kwrest, block), passing Qnone for absent parts. */
4442 args_tail : f_kwarg ',' f_kwrest opt_f_block_arg
4444 $$ = new_args_tail($1, $3, $4);
4446 | f_kwarg opt_f_block_arg
4448 $$ = new_args_tail($1, Qnone, $2);
4450 | f_kwrest opt_f_block_arg
4452 $$ = new_args_tail(Qnone, $1, $2);
/* Alternative whose header is not visible: only the block slot is filled. */
4456 $$ = new_args_tail(Qnone, Qnone, $1);
/* opt_args_tail: ',' args_tail, or (header not visible) an all-Qnone tail. */
4460 opt_args_tail : ',' args_tail
4466 $$ = new_args_tail(Qnone, Qnone, Qnone);
/* f_args: every accepted arrangement of leading f_arg, f_optarg, f_rest_arg
 * and trailing f_arg groups, each followed by an args tail.  Each
 * alternative calls new_args(leading, optional, rest, trailing, tail) with
 * Qnone in place of an absent group. */
4470 f_args : f_arg ',' f_optarg ',' f_rest_arg opt_args_tail
4472 $$ = new_args($1, $3, $5, Qnone, $6);
4474 | f_arg ',' f_optarg ',' f_rest_arg ',' f_arg opt_args_tail
4476 $$ = new_args($1, $3, $5, $7, $8);
4478 | f_arg ',' f_optarg opt_args_tail
4480 $$ = new_args($1, $3, Qnone, Qnone, $4);
4482 | f_arg ',' f_optarg ',' f_arg opt_args_tail
4484 $$ = new_args($1, $3, Qnone, $5, $6);
4486 | f_arg ',' f_rest_arg opt_args_tail
4488 $$ = new_args($1, Qnone, $3, Qnone, $4);
4490 | f_arg ',' f_rest_arg ',' f_arg opt_args_tail
4492 $$ = new_args($1, Qnone, $3, $5, $6);
4494 | f_arg opt_args_tail
4496 $$ = new_args($1, Qnone, Qnone, Qnone, $2);
4498 | f_optarg ',' f_rest_arg opt_args_tail
4500 $$ = new_args(Qnone, $1, $3, Qnone, $4);
4502 | f_optarg ',' f_rest_arg ',' f_arg opt_args_tail
4504 $$ = new_args(Qnone, $1, $3, $5, $6);
4506 | f_optarg opt_args_tail
4508 $$ = new_args(Qnone, $1, Qnone, Qnone, $2);
4510 | f_optarg ',' f_arg opt_args_tail
4512 $$ = new_args(Qnone, $1, Qnone, $3, $4);
4514 | f_rest_arg opt_args_tail
4516 $$ = new_args(Qnone, Qnone, $1, Qnone, $2);
4518 | f_rest_arg ',' f_arg opt_args_tail
4520 $$ = new_args(Qnone, Qnone, $1, $3, $4);
/* Alternative whose header is not visible: only the tail is present. */
4524 $$ = new_args(Qnone, Qnone, Qnone, Qnone, $1);
/* Alternative whose header is not visible: build an all-Qnone tail first,
 * then wrap it in an otherwise empty argument set. */
4528 $$ = new_args_tail(Qnone, Qnone, Qnone);
4529 $$ = new_args(Qnone, Qnone, Qnone, Qnone, $$);
/* f_bad_arg: tokens that are not valid formal argument names.  Each
 * alternative reports its own error; the event-dispatch form reports
 * param_error instead.  Only the tCONSTANT header is visible -- the other
 * three alternatives are identified by their messages. */
4533 f_bad_arg : tCONSTANT
4536 yyerror("formal argument cannot be a constant");
4539 $$ = dispatch1(param_error, $1);
4545 yyerror("formal argument cannot be an instance variable");
4548 $$ = dispatch1(param_error, $1);
4554 yyerror("formal argument cannot be a global variable");
4557 $$ = dispatch1(param_error, $1);
4563 yyerror("formal argument cannot be a class variable");
4566 $$ = dispatch1(param_error, $1);
/* f_norm_arg: a bad argument, or (alternative header not visible) a name
 * that is passed through formal_argument(). */
4571 f_norm_arg : f_bad_arg
4574 formal_argument(get_id($1));
/* f_arg_item: one mandatory parameter -- a plain name or a parenthesised
 * destructuring pattern. */
4579 f_arg_item : f_norm_arg
/* Register the name as an argument variable; the node-building form wraps
 * it in an ARGS_AUX node with a count of 1. */
4581 arg_var(get_id($1));
4583 $$ = NEW_ARGS_AUX($1, 1);
4588 | tLPAREN f_margs rparen
/* Destructuring: a fresh internal id stands in for the argument, and the
 * pattern's value is set to read that id back, as a DVAR inside a block or
 * an LVAR otherwise. */
4590 ID tid = internal_id();
4593 if (dyna_in_block()) {
4594 $2->nd_value = NEW_DVAR(tid);
4597 $2->nd_value = NEW_LVAR(tid);
4599 $$ = NEW_ARGS_AUX(tid, 1);
/* Event-dispatch form of the action. */
4602 $$ = dispatch1(mlhs_paren, $2);
4611 $$ = rb_ary_new3(1, $1);
4614 | f_arg ',' f_arg_item
4619 $$->nd_next = block_append($$->nd_next, $3->nd_next);
4620 rb_gc_force_recycle((VALUE)$3);
4622 $$ = rb_ary_push($1, $3);
/* f_kw: a keyword parameter with a default value, label then arg_value. */
4627 f_kw : tLABEL arg_value
/* Validate and register the name, then build the default-value assignment. */
4629 arg_var(formal_argument(get_id($1)));
4630 $$ = assignable($1, $2);
/* Node-building form wraps the assignment in a KW_ARG node; the
 * event-dispatch form pairs the name with its default. */
4632 $$ = NEW_KW_ARG(0, $$);
4634 $$ = rb_assoc_new($$, $2);
/* f_block_kw: same as f_kw, except the default is a primary_value. */
4639 f_block_kw : tLABEL primary_value
4641 arg_var(formal_argument(get_id($1)));
4642 $$ = assignable($1, $2);
4644 $$ = NEW_KW_ARG(0, $$);
4646 $$ = rb_assoc_new($$, $2);
/* f_block_kwarg: comma-separated list of f_block_kw items. */
4651 f_block_kwarg : f_block_kw
/* Event-dispatch form: start a one-element array. */
4656 $$ = rb_ary_new3(1, $1);
4659 | f_block_kwarg ',' f_block_kw
/* Node-building form: walk along nd_next while it is set (the loop body and
 * the append itself are not visible here). */
4664 while (kws->nd_next) {
/* Event-dispatch form: push the new item onto the array. */
4670 $$ = rb_ary_push($1, $3);
4681 $$ = rb_ary_new3(1, $1);
4689 while (kws->nd_next) {
4695 $$ = rb_ary_push($1, $3);
/* f_kwrest: kwrest_mark followed by an identifier; the identifier is passed
 * through shadowing_lvar(). */
4704 f_kwrest : kwrest_mark tIDENTIFIER
4706 shadowing_lvar(get_id($2));
/* f_opt: an optional parameter, identifier '=' arg_value. */
4715 f_opt : tIDENTIFIER '=' arg_value
/* Validate and register the name, then build the default-value assignment. */
4717 arg_var(formal_argument(get_id($1)));
4718 $$ = assignable($1, $3);
/* Node-building form wraps the assignment in an OPT_ARG node; the
 * event-dispatch form pairs the name with its default. */
4720 $$ = NEW_OPT_ARG(0, $$);
4722 $$ = rb_assoc_new($$, $3);
/* f_block_opt: same as f_opt, except the default is a primary_value. */
4727 f_block_opt : tIDENTIFIER '=' primary_value
4729 arg_var(formal_argument(get_id($1)));
4730 $$ = assignable($1, $3);
4732 $$ = NEW_OPT_ARG(0, $$);
4734 $$ = rb_assoc_new($$, $3);
/* f_block_optarg: comma-separated list of f_block_opt items. */
4739 f_block_optarg : f_block_opt
/* Event-dispatch form: start a one-element array. */
4744 $$ = rb_ary_new3(1, $1);
4747 | f_block_optarg ',' f_block_opt
/* Node-building form: advance `opts` to the last node of the chain (the
 * append that follows is not visible here). */
4752 while (opts->nd_next) {
4753 opts = opts->nd_next;
/* Event-dispatch form: push the new item onto the array. */
4758 $$ = rb_ary_push($1, $3);
4768 $$ = rb_ary_new3(1, $1);
4771 | f_optarg ',' f_opt
4776 while (opts->nd_next) {
4777 opts = opts->nd_next;
4782 $$ = rb_ary_push($1, $3);
/* f_rest_arg: the rest parameter, restarg_mark followed by an identifier. */
4791 f_rest_arg : restarg_mark tIDENTIFIER
/* The name must be a local-variable identifier. */
4794 if (!is_local_id($2))
4795 yyerror("rest argument must be local variable");
/* Register it, going through shadowing_lvar() first. */
4797 arg_var(shadowing_lvar(get_id($2)));
/* Event-dispatch form of the action. */
4801 $$ = dispatch1(rest_param, $2);
/* Alternative whose header is not visible: reported with a nil name. */
4810 $$ = dispatch1(rest_param, Qnil);
/* f_block_arg: the block parameter, blkarg_mark followed by an identifier. */
4819 f_block_arg : blkarg_mark tIDENTIFIER
/* The name must be a local-variable identifier; outside a block it must
 * also not already be a known local. */
4822 if (!is_local_id($2))
4823 yyerror("block argument must be local variable");
4824 else if (!dyna_in_block() && local_id($2))
4825 yyerror("duplicated block argument name");
/* Register it, going through shadowing_lvar() first. */
4827 arg_var(shadowing_lvar(get_id($2)));
/* Event-dispatch form of the action. */
4831 $$ = dispatch1(blockarg, $2);
4836 opt_f_block_arg : ',' f_block_arg
4855 if (!$$) $$ = NEW_NIL();
4860 | '(' {lex_state = EXPR_BEG;} expr rparen
4864 yyerror("can't define singleton method for ().");
4867 switch (nd_type($3)) {
4876 yyerror("can't define singleton method for literals");
4884 $$ = dispatch1(paren, $3);
4895 $$ = dispatch1(assoclist_from_args, $1);
4904 $$ = rb_ary_new3(1, $1);
4910 $$ = list_concat($1, $3);
4912 $$ = rb_ary_push($1, $3);
/* assoc: one entry of an association list. */
4917 assoc : arg_value tASSOC arg_value
/* Node-building form: a two-element list holding key then value. */
4920 $$ = list_append(NEW_LIST($1), $3);
4922 $$ = dispatch2(assoc_new, $1, $3);
/* Alternative whose header is not visible: $1 is an ID, turned into a
 * symbol literal to serve as the key. */
4928 $$ = list_append(NEW_LIST(NEW_LIT(ID2SYM($1))), $2);
4930 $$ = dispatch2(assoc_new, $1, $2);
/* Alternative whose header is not visible: the key slot is left as 0 and
 * the event reported is assoc_splat. */
4936 $$ = list_append(NEW_LIST(0), $2);
4938 $$ = dispatch1(assoc_splat, $2);
4945 operation : tIDENTIFIER
4950 operation2 : tIDENTIFIER
4956 operation3 : tIDENTIFIER
4973 opt_terms : /* none */
4984 rbracket : opt_nl ']'
4987 trailer : /* none */
4992 term : ';' {yyerrok;}
4997 | terms ';' {yyerrok;}
5013 # define yylval (*((YYSTYPE*)(parser->parser_yylval)))
5015 static int parser_regx_options(struct parser_params*);
5016 static int parser_tokadd_string(struct parser_params*,int,int,int,long*,rb_encoding**);
5017 static void parser_tokaddmbc(struct parser_params *parser, int c, rb_encoding *enc);
5018 static int parser_parse_string(struct parser_params*,NODE*);
5019 static int parser_here_document(struct parser_params*,NODE*);
/* Shorthands for the parser_* lexer helpers: each one forwards its arguments
 * and supplies the variable named `parser` from the calling scope as the
 * first argument. */
5022 # define nextc() parser_nextc(parser)
5023 # define pushback(c) parser_pushback(parser, (c))
5024 # define newtok() parser_newtok(parser)
5025 # define tokspace(n) parser_tokspace(parser, (n))
5026 # define tokadd(c) parser_tokadd(parser, (c))
5027 # define tok_hex(numlen) parser_tok_hex(parser, (numlen))
5028 # define read_escape(flags,e) parser_read_escape(parser, (flags), (e))
5029 # define tokadd_escape(e) parser_tokadd_escape(parser, (e))
5030 # define regx_options() parser_regx_options(parser)
5031 # define tokadd_string(f,t,p,n,e) parser_tokadd_string(parser,(f),(t),(p),(n),(e))
5032 # define parse_string(n) parser_parse_string(parser,(n))
5033 # define tokaddmbc(c, enc) parser_tokaddmbc(parser, (c), (enc))
5034 # define here_document(n) parser_here_document(parser,(n))
5035 # define heredoc_identifier() parser_heredoc_identifier(parser)
5036 # define heredoc_restore(n) parser_heredoc_restore(parser,(n))
5037 # define whole_match_p(e,l,i) parser_whole_match_p(parser,(e),(l),(i))
/* Setters for the token's semantic value (yylval) in the variant that stores
 * values directly: strings and literals are wrapped in NEW_STR / NEW_LIT
 * nodes, while numbers, ids and nodes go into the matching union member. */
5040 # define set_yylval_str(x) (yylval.node = NEW_STR(x))
5041 # define set_yylval_num(x) (yylval.num = (x))
5042 # define set_yylval_id(x) (yylval.id = (x))
5043 # define set_yylval_name(x) (yylval.id = (x))
5044 # define set_yylval_literal(x) (yylval.node = NEW_LIT(x))
5045 # define set_yylval_node(x) (yylval.node = (x))
5046 # define yylval_id() (yylval.id)
/* Wraps identifier x in an LASGN node that carries both the ID and its
 * Symbol, and returns the node cast to VALUE. */
5049 ripper_yylval_id(ID x)
5051 return (VALUE)NEW_LASGN(x, ID2SYM(x));
/* Alternative definitions of the yylval setters: every setter only evaluates
 * and discards its argument, except set_yylval_name(), which stores the node
 * produced by ripper_yylval_id() in yylval.val. */
5053 # define set_yylval_str(x) (void)(x)
5054 # define set_yylval_num(x) (void)(x)
5055 # define set_yylval_id(x) (void)(x)
5056 # define set_yylval_name(x) (void)(yylval.val = ripper_yylval_id(x))
5057 # define set_yylval_literal(x) (void)(x)
5058 # define set_yylval_node(x) (void)(x)
5059 # define yylval_id() yylval.id
/* ripper_flush(p): two alternative definitions (the selecting #if lines are
 * not visible).  One is a no-op; the other moves p->tokp up to the current
 * read position, marking everything before it as already reported. */
5063 #define ripper_flush(p) (void)(p)
5065 #define ripper_flush(p) ((p)->tokp = (p)->parser_lex_p)
/* yylval_rval: lvalue for the token's result slot -- the nd_rval field when
 * yylval.val holds a node, otherwise yylval.val itself. */
5067 #define yylval_rval (*(RB_TYPE_P(yylval.val, T_NODE) ? &yylval.node->nd_rval : &yylval.val))
/* Tells whether source text between tokp and lex_p has not been reported
 * yet.  Raises RuntimeError if lex_p has fallen behind tokp. */
5070 ripper_has_scan_event(struct parser_params *parser)
5073 if (lex_p < parser->tokp) rb_raise(rb_eRuntimeError, "lex_p < tokp");
5074 return lex_p > parser->tokp;
/* Dispatches the scanner event for token type t with the text between tokp
 * and lex_p as its argument, then flushes so that text is not reported
 * again.  The return statement is not visible; presumably rval. */
5078 ripper_scan_event_val(struct parser_params *parser, int t)
5080 VALUE str = STR_NEW(parser->tokp, lex_p - parser->tokp);
5081 VALUE rval = ripper_dispatch1(parser, ripper_token2eventid(t), str);
5082 ripper_flush(parser);
/* Dispatches the scanner event for token t, if any text is pending, and
 * stores the handler's result in the token's result slot. */
5087 ripper_dispatch_scan_event(struct parser_params *parser, int t)
5089 if (!ripper_has_scan_event(parser)) return;
5090 yylval_rval = ripper_scan_event_val(parser, t);
/* Same as ripper_dispatch_scan_event(), but the handler's result is
 * discarded instead of being stored. */
5094 ripper_dispatch_ignored_scan_event(struct parser_params *parser, int t)
5096 if (!ripper_has_scan_event(parser)) return;
5097 (void)ripper_scan_event_val(parser, t);
/* Dispatches the text accumulated in parser->delayed as an event for token
 * t.  During the dispatch the current line and token position are replaced
 * by the ones recorded when accumulation started, and restored afterwards. */
5101 ripper_dispatch_delayed_token(struct parser_params *parser, int t)
5103 int saved_line = ruby_sourceline;
5104 const char *saved_tokp = parser->tokp;
/* Report the position where the delayed text began. */
5106 ruby_sourceline = parser->delayed_line;
5107 parser->tokp = lex_pbeg + parser->delayed_col;
5108 yylval_rval = ripper_dispatch1(parser, ripper_token2eventid(t), parser->delayed);
/* The buffer has been consumed. */
5109 parser->delayed = Qnil;
5110 ruby_sourceline = saved_line;
5111 parser->tokp = saved_tokp;
5115 #include "ruby/regex.h"
5116 #include "ruby/util.h"
5118 /* We remove any previous definition of `SIGN_EXTEND_CHAR',
5119 since ours (we hope) works properly with all combinations of
5120 machines, compilers, `char' and `unsigned char' argument types.
5121 (Per Bothner suggested the basic approach.) */
5122 #undef SIGN_EXTEND_CHAR
5124 # define SIGN_EXTEND_CHAR(c) ((signed char)(c))
5125 #else /* not __STDC__ */
5126 /* As in Harbison and Steele. */
5127 # define SIGN_EXTEND_CHAR(c) ((((unsigned char)(c)) ^ 128) - 128)
/* Encoding helpers for the character most recently read, i.e. the one at
 * lex_p-1, using the parser's current encoding. */
5130 #define parser_encoding_name() (current_enc->name)
5131 #define parser_mbclen() mbclen((lex_p-1),lex_pend,current_enc)
5132 #define parser_precise_mbclen() rb_enc_precise_mbclen((lex_p-1),lex_pend,current_enc)
/* An identifier character is alphanumeric, '_', or any non-ASCII byte.  The
 * `e` argument is not used. */
5133 #define is_identchar(p,e,enc) (rb_enc_isalnum(*(p),(enc)) || (*(p)) == '_' || !ISASCII(*(p)))
/* Never true once end of input has been flagged. */
5134 #define parser_is_identchar() (!parser->eofp && is_identchar((lex_p-1),lex_pend,current_enc))
5136 #define parser_isascii() ISASCII(*(lex_p-1))
/* Computes the display column of `token` on the current line.  The return
 * statement and the per-character increment are not visible here. */
5140 token_info_get_column(struct parser_params *parser, const char *token)
/* pend is lex_p minus the token's length, i.e. the token's start if lex_p
 * sits just past it. */
5143 const char *p, *pend = lex_p - strlen(token);
5144 for (p = lex_pbeg; p < pend; p++) {
/* Round the column up to the next multiple of 8 (the guarding condition is
 * not visible; presumably a tab character). */
5146 column = (((column - 1) / 8) + 1) * 8;
/* Scans the current line from its start up to lex_p minus the token's
 * length, looking for a character that is neither a space nor a tab.  The
 * return statements are not visible here. */
5154 token_info_has_nonspaces(struct parser_params *parser, const char *token)
5156 const char *p, *pend = lex_p - strlen(token);
5157 for (p = lex_pbeg; p < pend; p++) {
5158 if (*p != ' ' && *p != '\t') {
5165 #undef token_info_push
/* Records position information for `token` on the parser's token_info
 * stack, for later comparison in token_info_pop().  Does nothing unless
 * token info is enabled. */
5167 token_info_push(struct parser_params *parser, const char *token)
5171 if (!parser->parser_token_info_enabled) return;
5172 ptinfo = ALLOC(token_info);
/* Only the pointer is stored; the token text is not copied. */
5173 ptinfo->token = token;
5174 ptinfo->linenum = ruby_sourceline;
5175 ptinfo->column = token_info_get_column(parser, token);
5176 ptinfo->nonspc = token_info_has_nonspaces(parser, token);
/* Link the new record in as the head of the list. */
5177 ptinfo->next = parser->parser_token_info;
5179 parser->parser_token_info = ptinfo;
5182 #undef token_info_pop
/* Pops the most recent token_info record and compares it with the closing
 * `token`, warning about mismatched indentation.  The jumps taken by the
 * OK / SKIP branches and the release of the record are not visible here. */
5184 token_info_pop(struct parser_params *parser, const char *token)
5187 token_info *ptinfo = parser->parser_token_info;
5189 if (!ptinfo) return;
5190 parser->parser_token_info = ptinfo->next;
/* Same column as the opener: nothing to report. */
5191 if (token_info_get_column(parser, token) == ptinfo->column) { /* OK */
5194 linenum = ruby_sourceline;
/* Opener and closer are on the same line. */
5195 if (linenum == ptinfo->linenum) { /* SKIP */
/* Either token has other non-blank text before it on its line. */
5198 if (token_info_has_nonspaces(parser, token) || ptinfo->nonspc) { /* SKIP */
5201 if (parser->parser_token_info_enabled) {
5202 rb_compile_warn(ruby_sourcefile, linenum,
5203 "mismatched indentations at '%s' with '%s' at %d",
5204 token, ptinfo->token, ptinfo->linenum);
/* Reports a parse error.  The visible code emits the message, then the
 * offending source line, possibly trimmed, followed by a second line built
 * from the same buffer.  The event-dispatch variant at the end reports
 * parse_error instead.  Several intermediate lines are not visible here. */
5213 parser_yyerror(struct parser_params *parser, const char *msg)
/* Number of bytes kept on each side of lex_p when the line is trimmed. */
5216 const int max_line_margin = 30;
5222 compile_error(PARSER_ARG "%s", msg);
/* Move p back towards the start of the line, stopping at a newline. */
5224 while (lex_pbeg <= p) {
5225 if (*p == '\n') break;
/* Move pe forward towards the end of the line, stopping at a newline. */
5231 while (pe < lex_pend) {
5232 if (*pe == '\n') break;
5239 const char *pre = "", *post = "";
/* Long line: pull each end in to within max_line_margin of lex_p, snapping
 * to a character boundary in the line's encoding. */
5241 if (len > max_line_margin * 2 + 10) {
5242 if (lex_p - p > max_line_margin) {
5243 p = rb_enc_prev_char(p, lex_p - max_line_margin, pe, rb_enc_get(lex_lastline));
5246 if (pe - lex_p > max_line_margin) {
5247 pe = rb_enc_prev_char(lex_p, lex_p + max_line_margin, pe, rb_enc_get(lex_lastline));
/* Copy the excerpt into a stack buffer and print it between pre and post. */
5252 buf = ALLOCA_N(char, len+2);
5253 MEMCPY(buf, p, char, len);
5255 rb_compile_error_with_enc(NULL, 0, (void *)current_enc, "%s%s%s", pre, buf, post);
/* i is the offset of lex_p within the excerpt. */
5257 i = (int)(lex_p - p);
5258 p2 = buf; pe = buf + len;
/* Overwrite the buffer with spaces, keeping tabs (the loop and the marker
 * character are not visible), then append it as a further line. */
5261 if (*p2 != '\t') *p2 = ' ';
5266 rb_compile_error_append("%s%s", pre, buf);
5269 dispatch1(parse_error, STR_NEW2(msg));
5270 #endif /* !RIPPER */
5274 static void parser_prepare(struct parser_params *parser);
/* If the constant SCRIPT_LINES__ is defined on Object and holds a Hash,
 * creates a fresh Array and stores it in that hash under `fname`.  The
 * return statements are not visible here; presumably the array or 0. */
5278 debug_lines(VALUE fname)
5281 CONST_ID(script_lines, "SCRIPT_LINES__");
5282 if (rb_const_defined_at(rb_cObject, script_lines)) {
5283 VALUE hash = rb_const_get_at(rb_cObject, script_lines);
5284 if (RB_TYPE_P(hash, T_HASH)) {
5285 VALUE lines = rb_ary_new();
5286 rb_hash_aset(hash, fname, lines);
/* If the coverages object is truthy and has its class field cleared,
 * registers under `fname` a new array of n nil entries, also with its class
 * cleared.  The return statements are not visible here. */
5294 coverage(VALUE fname, int n)
5296 VALUE coverages = rb_get_coverages();
5297 if (RTEST(coverages) && RBASIC(coverages)->klass == 0) {
5298 VALUE lines = rb_ary_new2(n);
5300 RBASIC(lines)->klass = 0;
/* Fill the storage directly, then set the length by hand. */
5301 for (i = 0; i < n; i++) RARRAY_PTR(lines)[i] = Qnil;
5302 RARRAY(lines)->as.heap.len = n;
5303 rb_hash_aset(coverages, fname, lines);
/* True when the source file name being parsed is exactly "-e". */
5310 e_option_supplied(struct parser_params *parser)
5312 return strcmp(ruby_sourcefile, "-e") == 0;
/* Body of a compile run, called through rb_suppress_tracing() with the
 * parser pointer passed as a VALUE: sets up optional line and coverage
 * recording, runs yyparse(), resets lexer state and post-processes the
 * tree.  Several lines, including the return, are not visible here. */
5316 yycompile0(VALUE arg)
5320 struct parser_params *parser = (struct parser_params *)arg;
/* Source-line recording is set up only outside eval and at safe level 0. */
5322 if (!compile_for_eval && rb_safe_level() == 0) {
5323 ruby_debug_lines = debug_lines(ruby_sourcefile_string);
/* When parsing starts past line 0, empty strings are pushed for the earlier
 * lines (the loop around the push is not visible). */
5324 if (ruby_debug_lines && ruby_sourceline > 0) {
5325 VALUE str = STR_NEW0();
5326 n = ruby_sourceline;
5328 rb_ary_push(ruby_debug_lines, str);
/* Coverage is not collected for "-e" scripts. */
5332 if (!e_option_supplied(parser)) {
5333 ruby_coverage = coverage(ruby_sourcefile_string, ruby_sourceline);
5337 parser_prepare(parser);
/* Indentation checking runs only in verbose mode and outside eval. */
5340 parser->parser_token_info_enabled = !compile_for_eval && RTEST(ruby_verbose);
5343 if (RUBY_DTRACE_PARSE_BEGIN_ENABLED()) {
5344 RUBY_DTRACE_PARSE_BEGIN(parser->parser_ruby_sourcefile,
5345 parser->parser_ruby_sourceline);
5348 n = yyparse((void*)parser);
5350 if (RUBY_DTRACE_PARSE_END_ENABLED()) {
5351 RUBY_DTRACE_PARSE_END(parser->parser_ruby_sourcefile,
5352 parser->parser_ruby_sourceline);
/* Reset the per-run state. */
5355 ruby_debug_lines = 0;
5357 compile_for_eval = 0;
5360 lex_p = lex_pbeg = lex_pend = 0;
5361 lex_lastline = lex_nextline = 0;
5365 tree = ruby_eval_tree;
/* If a separate "begin" tree was collected, wrap the body in a PRELUDE
 * node that carries it. */
5369 else if (ruby_eval_tree_begin) {
5370 tree->nd_body = NEW_PRELUDE(ruby_eval_tree_begin, tree->nd_body);
/* Records the source file name and starting line on the parser, then runs
 * yycompile0() with tracing suppressed and returns its result as a NODE. */
5376 yycompile(struct parser_params *parser, VALUE fname, int line)
/* A frozen copy of the name is kept as a String; the C pointer is taken
 * from the `fname` argument itself. */
5378 ruby_sourcefile_string = rb_str_new_frozen(fname);
5379 ruby_sourcefile = RSTRING_PTR(fname);
/* Stored as line - 1. */
5380 ruby_sourceline = line - 1;
5381 return (NODE *)rb_suppress_tracing(yycompile0, (VALUE)parser);
5383 #endif /* !RIPPER */
/* Fetches the encoding of string s and raises ArgumentError unless it is
 * ASCII-compatible.  The return statement is not visible; presumably enc,
 * since lex_get_str() uses the result as the encoding. */
5385 static rb_encoding *
5386 must_be_ascii_compatible(VALUE s)
5388 rb_encoding *enc = rb_enc_get(s);
5389 if (!rb_enc_asciicompat(enc)) {
5390 rb_raise(rb_eArgError, "invalid source encoding");
/* Line reader for string input: returns the next line of s, including its
 * newline if any, as a new string in s's encoding.  Returns nil once the
 * whole string has been consumed.  lex_gets_ptr holds the byte offset of the
 * next unread line. */
5396 lex_get_str(struct parser_params *parser, VALUE s)
5398 char *beg, *end, *pend;
5399 rb_encoding *enc = must_be_ascii_compatible(s);
5401 beg = RSTRING_PTR(s);
/* Offset equals length: nothing left to read. */
5403 if (RSTRING_LEN(s) == lex_gets_ptr) return Qnil;
5404 beg += lex_gets_ptr;
5406 pend = RSTRING_PTR(s) + RSTRING_LEN(s);
/* Advance `end` to just past the next newline, or to the end of the string
 * (the initialisation of `end` is not visible). */
5408 while (end < pend) {
5409 if (*end++ == '\n') break;
5411 lex_gets_ptr = end - RSTRING_PTR(s);
5412 return rb_enc_str_new(beg, end - beg, enc);
/* Fetches the next source line through the parser's line-reader callback.
 * nil is passed through unchanged; any other line must be ASCII-compatible.
 * The final return is not visible here. */
5416 lex_getline(struct parser_params *parser)
5418 VALUE line = (*parser->parser_lex_gets)(parser, parser->parser_lex_input);
5419 if (NIL_P(line)) return line;
5420 must_be_ascii_compatible(line);
/* When line recording is active, tag the line with the current encoding and
 * keep it. */
5422 if (ruby_debug_lines) {
5423 rb_enc_associate(line, current_enc);
5424 rb_ary_push(ruby_debug_lines, line);
/* When coverage is active, add one nil slot per line read. */
5426 if (ruby_coverage) {
5427 rb_ary_push(ruby_coverage, Qnil);
5434 static rb_data_type_t parser_data_type;
5436 static const rb_data_type_t parser_data_type;
/* Compiles source string s under file name `fname`, starting at `line`,
 * with the parser wrapped by vparser.  The lines that install s as the
 * lexer input and the return are not visible here. */
5439 parser_compile_string(volatile VALUE vparser, VALUE fname, VALUE s, int line)
5441 struct parser_params *parser;
5444 TypedData_Get_Struct(vparser, struct parser_params, &parser_data_type, parser);
/* Read lines from a String. */
5445 lex_gets = lex_get_str;
5448 lex_pbeg = lex_p = lex_pend = 0;
5449 compile_for_eval = rb_parse_in_eval();
5451 node = yycompile(parser, fname, line);
5452 RB_GC_GUARD(vparser); /* prohibit tail call optimization */
/* Compiles string s with a freshly created parser; f is the file name as a
 * C string.  Raises if s is not in an ASCII-compatible encoding. */
5458 rb_compile_string(const char *f, VALUE s, int line)
5460 must_be_ascii_compatible(s);
5461 return parser_compile_string(rb_parser_new(), rb_filesystem_str_new_cstr(f), s, line);
/* C-string file name front end for rb_parser_compile_string_path(). */
5465 rb_parser_compile_string(volatile VALUE vparser, const char *f, VALUE s, int line)
5467 return rb_parser_compile_string_path(vparser, rb_filesystem_str_new_cstr(f), s, line);
/* Compiles string s with the given parser object and file name f.  Raises
 * if s is not in an ASCII-compatible encoding. */
5471 rb_parser_compile_string_path(volatile VALUE vparser, VALUE f, VALUE s, int line)
5473 must_be_ascii_compatible(s);
5474 return parser_compile_string(vparser, f, s, line);
/* Compiles the len bytes at s with a freshly created parser; the bytes are
 * first copied into a new String. */
5478 rb_compile_cstr(const char *f, const char *s, int len, int line)
5480 VALUE str = rb_str_new(s, len);
5481 return parser_compile_string(rb_parser_new(), rb_filesystem_str_new_cstr(f), str, line);
/* Same as rb_compile_cstr(), but uses the caller's parser object. */
5485 rb_parser_compile_cstr(volatile VALUE vparser, const char *f, const char *s, int len, int line)
5487 VALUE str = rb_str_new(s, len);
5488 return parser_compile_string(vparser, rb_filesystem_str_new_cstr(f), str, line);
/* Line reader for IO input: returns the next line from io.  The parser
 * argument is not used. */
5492 lex_io_gets(struct parser_params *parser, VALUE io)
5494 return rb_io_gets(io);
/* Compiles the contents of `file` with a freshly created parser; f is the
 * file name and `start` the starting line. */
5498 rb_compile_file(const char *f, VALUE file, int start)
5500 VALUE volatile vparser = rb_parser_new();
5502 return rb_parser_compile_file(vparser, f, file, start);
/* C-string file name front end for rb_parser_compile_file_path(). */
5506 rb_parser_compile_file(volatile VALUE vparser, const char *f, VALUE file, int start)
5508 return rb_parser_compile_file_path(vparser, rb_filesystem_str_new_cstr(f), file, start);
/* Compiles source read from the IO object `file` under file name `fname`,
 * starting at line `start`.  The line that installs `file` as the lexer
 * input and the return are not visible here. */
5512 rb_parser_compile_file_path(volatile VALUE vparser, VALUE fname, VALUE file, int start)
5514 struct parser_params *parser;
5517 TypedData_Get_Struct(vparser, struct parser_params, &parser_data_type, parser);
/* Read lines from an IO. */
5518 lex_gets = lex_io_gets;
5520 lex_pbeg = lex_p = lex_pend = 0;
5521 compile_for_eval = rb_parse_in_eval();
5523 node = yycompile(parser, fname, start);
5524 RB_GC_GUARD(vparser); /* prohibit tail call optimization */
5528 #endif /* !RIPPER */
/* Bit flags describing how the body of a string-like literal is scanned;
 * parser_tokadd_string() tests them through its `func` argument. */
5530 #define STR_FUNC_ESCAPE 0x01
5531 #define STR_FUNC_EXPAND 0x02
5532 #define STR_FUNC_REGEXP 0x04
5533 #define STR_FUNC_QWORDS 0x08
5534 #define STR_FUNC_SYMBOL 0x10
5535 #define STR_FUNC_INDENT 0x20
/* Flag combinations, one per literal kind (the enclosing enum header and at
 * least one earlier member are not visible here). */
5539 str_dquote = (STR_FUNC_EXPAND),
5540 str_xquote = (STR_FUNC_EXPAND),
5541 str_regexp = (STR_FUNC_REGEXP|STR_FUNC_ESCAPE|STR_FUNC_EXPAND),
5542 str_sword = (STR_FUNC_QWORDS),
5543 str_dword = (STR_FUNC_QWORDS|STR_FUNC_EXPAND),
5544 str_ssym = (STR_FUNC_SYMBOL),
5545 str_dsym = (STR_FUNC_SYMBOL|STR_FUNC_EXPAND)
/* Creates a String from n bytes at p in encoding enc, then may adjust its
 * encoding.  The adjustment is skipped for regexp content and for encodings
 * that are not ASCII-compatible.  The return is not visible here. */
5549 parser_str_new(const char *p, long n, rb_encoding *enc, int func, rb_encoding *enc0)
5553 str = rb_enc_str_new(p, n, enc);
5554 if (!(func & STR_FUNC_REGEXP) && rb_enc_asciicompat(enc)) {
/* 7-bit-only content: the body of this branch is not visible. */
5555 if (rb_enc_str_coderange(str) == ENC_CODERANGE_7BIT) {
/* Non-7-bit content where enc0 is US-ASCII and enc is not UTF-8: retag the
 * string as ASCII-8BIT. */
5557 else if (enc0 == rb_usascii_encoding() && enc != rb_utf8_encoding()) {
5558 rb_enc_associate(str, rb_ascii8bit_encoding());
/* Moves the read position to the end of the current line buffer. */
5565 #define lex_goto_eol(parser) ((parser)->parser_lex_p = (parser)->parser_lex_pend)
/* True when the read position is at or past the end of the line buffer. */
5566 #define lex_eol_p() (lex_p >= lex_pend)
/* peek(c) / peek_n(c,n): true when the byte n positions ahead of the read
 * position lies inside the buffer and equals c.  Nothing is consumed. */
5567 #define peek(c) peek_n((c), 0)
5568 #define peek_n(c,n) (lex_p+(n) < lex_pend && (c) == (unsigned char)lex_p[n])
/* Returns the next input character as an unsigned byte value, loading a new
 * line into the buffer when the current one is used up.  The return
 * statements, including the end-of-input one, are not visible here. */
5571 parser_nextc(struct parser_params *parser)
/* Current line exhausted: fetch the next one. */
5575 if (lex_p == lex_pend) {
5576 VALUE v = lex_nextline;
/* No input source, or the reader returned nil: flag end of input. */
5582 if (!lex_input || NIL_P(v = lex_getline(parser))) {
5583 parser->eofp = Qtrue;
5584 lex_goto_eol(parser);
/* Text between tokp and the end of the old line has not been reported yet:
 * save it in parser->delayed before the buffer is replaced. */
5590 if (parser->tokp < lex_pend) {
5591 if (NIL_P(parser->delayed)) {
/* First fragment: create the buffer and remember where it started. */
5592 parser->delayed = rb_str_buf_new(1024);
5593 rb_enc_associate(parser->delayed, current_enc);
5594 rb_str_buf_cat(parser->delayed,
5595 parser->tokp, lex_pend - parser->tokp);
5596 parser->delayed_line = ruby_sourceline;
5597 parser->delayed_col = (int)(parser->tokp - lex_pbeg);
/* Later fragments are appended to the existing buffer. */
5600 rb_str_buf_cat(parser->delayed,
5601 parser->tokp, lex_pend - parser->tokp);
/* A positive heredoc_end replaces the current line number (the reset of
 * heredoc_end is not visible). */
5605 if (heredoc_end > 0) {
5606 ruby_sourceline = heredoc_end;
/* Install the new line as the lexer buffer. */
5610 parser->line_count++;
5611 lex_pbeg = lex_p = RSTRING_PTR(v);
5612 lex_pend = lex_p + RSTRING_LEN(v);
5613 ripper_flush(parser);
5617 c = (unsigned char)*lex_p++;
/* A CR directly followed by LF gets special handling (body not visible). */
5618 if (c == '\r' && peek('\n')) {
/* Un-reads character c.  Pushing back -1 is a no-op.  The decrement of
 * lex_p is not visible here. */
5627 parser_pushback(struct parser_params *parser, int c)
5629 if (c == -1) return;
/* Detects a read position sitting on the LF of a CR LF pair (the body of
 * this branch is not visible). */
5631 if (lex_p > lex_pbeg && lex_p[0] == '\n' && lex_p[-1] == '\r') {
/* True when exactly one character of the current line has been consumed,
 * i.e. the character just read was the first on its line. */
5636 #define was_bol() (lex_p == lex_pbeg + 1)
/* Token buffer accessors: tokfix() NUL-terminates the buffer, tok() is its
 * start, toklen() its length, and toklast() its last byte (0 if empty). */
5638 #define tokfix() (tokenbuf[tokidx]='\0')
5639 #define tok() tokenbuf
5640 #define toklen() tokidx
5641 #define toklast() (tokidx>0?tokenbuf[tokidx-1]:0)
/* Starts a new token and records the line it begins on.  The resets of
 * tokidx and toksiz, the guards, and the return are not visible here. */
5644 parser_newtok(struct parser_params *parser)
5647 tokline = ruby_sourceline;
/* Initial allocation of 60 bytes (presumably when no buffer exists yet). */
5650 tokenbuf = ALLOC_N(char, 60);
/* A buffer that has grown past 4096 bytes is shrunk back to 60. */
5652 if (toksiz > 4096) {
5654 REALLOC_N(tokenbuf, char, 60);
/* Reserves n bytes at the end of the token buffer and returns a pointer to
 * their start.  The line that advances tokidx is not visible; presumably
 * tokidx += n, given the tokidx-n in the return. */
5660 parser_tokspace(struct parser_params *parser, int n)
/* Double the capacity until it is no smaller than tokidx. */
5664 if (tokidx >= toksiz) {
5665 do {toksiz *= 2;} while (toksiz < tokidx);
5666 REALLOC_N(tokenbuf, char, toksiz);
5668 return &tokenbuf[tokidx-n];
/* Appends one byte to the token buffer and reallocates it once the buffer
 * is full.  The line that enlarges toksiz is not visible here. */
5672 parser_tokadd(struct parser_params *parser, int c)
5674 tokenbuf[tokidx++] = (char)c;
5675 if (tokidx >= toksiz) {
5677 REALLOC_N(tokenbuf, char, toksiz);
/* Scans up to two hex digits at the read position, storing the number of
 * digits found in *numlen.  The condition guarding the error and the rest
 * of the function are not visible here. */
5682 parser_tok_hex(struct parser_params *parser, size_t *numlen)
5686 c = scan_hex(lex_p, 2, numlen);
5688 yyerror("invalid hex escape");
5695 #define tokcopy(n) memcpy(tokspace(n), lex_p - (n), (n))
/* Handles a \u escape.  For regexp content the escape text is copied into
 * the token verbatim.  Otherwise code points of 0x80 and above switch *encp
 * to UTF-8 and, for string literals, are added to the token in encoded
 * form.  Several lines, including the returns, are not visible here. */
5697 /* return value is for ?\u3042 */
5699 parser_tokadd_utf8(struct parser_params *parser, rb_encoding **encp,
5700 int string_literal, int symbol_literal, int regexp_literal)
5703 * If string_literal is true, then we allow multiple codepoints
5704 * in \u{}, and add the codepoints to the current token.
5705 * Otherwise we're parsing a character literal and return a single
5706 * codepoint without adding it
/* Regexp: keep the escape introducer in the token. */
5712 if (regexp_literal) { tokadd('\\'); tokadd('u'); }
5714 if (peek('{')) { /* handle \u{...} form */
5716 if (regexp_literal) { tokadd(*lex_p); }
/* Up to six hex digits per code point. */
5718 codepoint = scan_hex(lex_p, 6, &numlen);
5720 yyerror("invalid Unicode escape");
5723 if (codepoint > 0x10ffff) {
5724 yyerror("invalid Unicode codepoint (too large)");
/* Regexp: copy the digits as written. */
5728 if (regexp_literal) {
5729 tokcopy((int)numlen);
5731 else if (codepoint >= 0x80) {
5732 *encp = rb_utf8_encoding();
5733 if (string_literal) tokaddmbc(codepoint, *encp);
5735 else if (string_literal) {
/* In a string literal, a space or tab means another code point follows. */
5738 } while (string_literal && (peek(' ') || peek('\t')));
5741 yyerror("unterminated Unicode escape");
5745 if (regexp_literal) { tokadd('}'); }
5748 else { /* handle \uxxxx form */
/* At most four hex digits are scanned here (the check on numlen is not
 * visible). */
5749 codepoint = scan_hex(lex_p, 4, &numlen);
5751 yyerror("invalid Unicode escape");
5755 if (regexp_literal) {
5758 else if (codepoint >= 0x80) {
5759 *encp = rb_utf8_encoding();
5760 if (string_literal) tokaddmbc(codepoint, *encp);
5762 else if (string_literal) {
/* Flags recording which prefix escapes have already been applied, so that
 * the same kind is rejected when nested. */
5770 #define ESCAPE_CONTROL 1
5771 #define ESCAPE_META 2
/* Reads the character after a backslash and computes the value the escape
 * denotes.  Most return statements and some case labels are not visible in
 * this excerpt. */
5774 parser_read_escape(struct parser_params *parser, int flags,
5780 switch (c = nextc()) {
5781 case '\\': /* Backslash */
5784 case 'n': /* newline */
5787 case 't': /* horizontal tab */
5790 case 'r': /* carriage-return */
5793 case 'f': /* form-feed */
5796 case 'v': /* vertical tab */
5799 case 'a': /* alarm(bell) */
5802 case 'e': /* escape */
5805 case '0': case '1': case '2': case '3': /* octal constant */
5806 case '4': case '5': case '6': case '7':
/* Up to three octal digits. */
5808 c = scan_oct(lex_p, 3, &numlen);
5812 case 'x': /* hex constant */
5813 c = tok_hex(&numlen);
5814 if (numlen == 0) return 0;
5817 case 'b': /* backspace */
5820 case 's': /* space */
/* Meta prefix (case label not visible): rejected if already applied, must
 * be followed by '-', and sets bit 0x80 on the following character or
 * nested escape. */
5824 if (flags & ESCAPE_META) goto eof;
5825 if ((c = nextc()) != '-') {
5829 if ((c = nextc()) == '\\') {
/* A \u escape is not allowed as the target. */
5830 if (peek('u')) goto eof;
5831 return read_escape(flags|ESCAPE_META, encp) | 0x80;
5833 else if (c == -1 || !ISASCII(c)) goto eof;
5835 return ((c & 0xff) | 0x80);
/* Control prefix (case labels not visible): one form requires a following
 * '-'; rejected if already applied.  The final value computation is not
 * visible. */
5839 if ((c = nextc()) != '-') {
5844 if (flags & ESCAPE_CONTROL) goto eof;
5845 if ((c = nextc())== '\\') {
5846 if (peek('u')) goto eof;
5847 c = read_escape(flags|ESCAPE_CONTROL, encp);
5851 else if (c == -1 || !ISASCII(c)) goto eof;
5856 yyerror("Invalid escape character syntax");
/* Appends code point c to the token buffer, encoded in enc: reserves the
 * encoded length and writes the bytes in place. */
5865 parser_tokaddmbc(struct parser_params *parser, int c, rb_encoding *enc)
5867 int len = rb_enc_codelen(c, enc);
5868 rb_enc_mbcput(c, tokspace(len), enc);
/* Copies an escape sequence into the token as written instead of converting
 * it to the character it denotes.  Several case labels and returns are not
 * visible in this excerpt. */
5872 parser_tokadd_escape(struct parser_params *parser, rb_encoding **encp)
5879 switch (c = nextc()) {
5881 return 0; /* just ignore */
5883 case '0': case '1': case '2': case '3': /* octal constant */
5884 case '4': case '5': case '6': case '7':
/* Step back onto the first digit, measure the octal run, then copy it
 * together with the preceding backslash. */
5886 ruby_scan_oct(--lex_p, 3, &numlen);
5887 if (numlen == 0) goto eof;
5889 tokcopy((int)numlen + 1);
5893 case 'x': /* hex constant */
5896 if (numlen == 0) return -1;
/* Copy the backslash, the 'x' and the digits. */
5897 tokcopy((int)numlen + 2);
/* Meta prefix (case label not visible): only once, and must be followed by
 * '-'. */
5902 if (flags & ESCAPE_META) goto eof;
5903 if ((c = nextc()) != '-') {
5908 flags |= ESCAPE_META;
/* Control prefixes (case labels not visible): only once. */
5912 if (flags & ESCAPE_CONTROL) goto eof;
5913 if ((c = nextc()) != '-') {
5921 if (flags & ESCAPE_CONTROL) goto eof;
5923 flags |= ESCAPE_CONTROL;
/* After a prefix, the target may itself be a backslash escape. */
5925 if ((c = nextc()) == '\\') {
5928 else if (c == -1) goto eof;
5934 yyerror("Invalid escape character syntax");
/* Reads the option letters that follow a regexp literal and returns the
 * option bits combined with the selected encoding letter.  Several branches
 * are not visible in this excerpt. */
5945 parser_regx_options(struct parser_params *parser)
/* Consume alphabetic characters one at a time. */
5953 while (c = nextc(), ISALPHA(c)) {
/* Sets the ONCE option (the letter test is not visible). */
5955 options |= RE_OPTION_ONCE;
/* Other recognised letters yield an option and an encoding index; the
 * letter is remembered as kcode unless that index is ASCII-8BIT. */
5957 else if (rb_char_to_option_kcode(c, &opt, &kc)) {
5959 if (kc != rb_ascii8bit_encindex()) kcode = c;
/* The token buffer is reported as the unknown option(s) (the code that
 * collects them and the guard are not visible). */
5974 compile_error(PARSER_ARG "unknown regexp option%s - %s",
5975 toklen() > 1 ? "s" : "", tok());
5977 return options | RE_OPTION_ENCODING(kcode);
/* Hands the string object straight back to the GC for reuse.  An
 * intermediate line is not visible here. */
5981 dispose_string(VALUE str)
5984 rb_gc_force_recycle(str);
/* Adds the multibyte character whose first byte is c (already read) to the
 * token.  Reports a compile error if the bytes at lex_p-1 do not form a
 * valid character in the current encoding.  The lines that add c and
 * advance lex_p, and the returns, are not visible here. */
5988 parser_tokadd_mbchar(struct parser_params *parser, int c)
5990 int len = parser_precise_mbclen();
5991 if (!MBCLEN_CHARFOUND_P(len)) {
5992 compile_error(PARSER_ARG "invalid multibyte char (%s)", parser_encoding_name());
/* Copy the trailing bytes of the character, if any. */
5997 if (len > 0) tokcopy(len);
/* Shorthand that supplies the implicit `parser` argument. */
6001 #define tokadd_mbchar(c) parser_tokadd_mbchar(parser, (c))
/* Classifies c against a set of regexp metacharacters.  The switch header
 * and the return values are not visible here; presumably the listed
 * characters yield true and all others false. */
6004 simple_re_meta(int c)
6007 case '$': case '*': case '+': case '.':
6008 case '?': case '^': case '|':
6009 case ')': case ']': case '}': case '>':
/* Scans the body of a string-like literal into the token buffer until the
 * terminator, an interpolation start, or end of input.  `func` is a set of
 * STR_FUNC_* flags, `term` and `paren` are the closing and opening
 * delimiters, *nest is the delimiter nesting depth, and *encp the encoding
 * determined so far.  Many lines are not visible in this excerpt.
 *
 * mixed_error() formats mixed_msg with two encoding names into a stack
 * buffer, once; the buffer size is the template length minus the two "%s"
 * plus both names.  mixed_escape() reports the same problem with the read
 * position temporarily moved. */
6017 parser_tokadd_string(struct parser_params *parser,
6018 int func, int term, int paren, long *nest,
6022 int has_nonascii = 0;
6023 rb_encoding *enc = *encp;
6025 static const char mixed_msg[] = "%s mixed within %s source";
6027 #define mixed_error(enc1, enc2) if (!errbuf) { \
6028 size_t len = sizeof(mixed_msg) - 4; \
6029 len += strlen(rb_enc_name(enc1)); \
6030 len += strlen(rb_enc_name(enc2)); \
6031 errbuf = ALLOCA_N(char, len); \
6032 snprintf(errbuf, len, mixed_msg, \
6033 rb_enc_name(enc1), \
6034 rb_enc_name(enc2)); \
6037 #define mixed_escape(beg, enc1, enc2) do { \
6038 const char *pos = lex_p; \
6040 mixed_error((enc1), (enc2)); \
6044 while ((c = nextc()) != -1) {
/* Opening delimiter seen (body not visible; presumably it deepens the
 * nesting). */
6045 if (paren && c == paren) {
/* Closing delimiter: when there is no nesting counter or it is zero, this
 * is the real terminator. */
6048 else if (c == term) {
6049 if (!nest || !*nest) {
/* '#' followed by '$', '@' or '{' in an expanding literal starts an
 * interpolation. */
6055 else if ((func & STR_FUNC_EXPAND) && c == '#' && lex_p < lex_pend) {
6057 if (c2 == '$' || c2 == '@' || c2 == '{') {
6062 else if (c == '\\') {
/* Remember where the escape started, for error reporting. */
6063 const char *beg = lex_p - 1;
/* Special handling for one escaped character (case label not visible;
 * presumably newline): word lists stop here, expanding literals skip it. */
6067 if (func & STR_FUNC_QWORDS) break;
6068 if (func & STR_FUNC_EXPAND) continue;
6073 if (func & STR_FUNC_ESCAPE) tokadd(c);
6077 if ((func & STR_FUNC_EXPAND) == 0) {
/* \u escape: may switch enc to UTF-8, which conflicts with non-ASCII
 * source bytes already seen in another encoding. */
6081 parser_tokadd_utf8(parser, &enc, 1,
6082 func & STR_FUNC_SYMBOL,
6083 func & STR_FUNC_REGEXP);
6084 if (has_nonascii && enc != *encp) {
6085 mixed_escape(beg, enc, *encp);
6090 if (c == -1) return -1;
/* Non-expanding literals keep the backslash itself. */
6092 if ((func & STR_FUNC_EXPAND) == 0) tokadd('\\');
/* Regexp bodies keep escapes as written, via tokadd_escape(). */
6095 if (func & STR_FUNC_REGEXP) {
6096 if (c == term && !simple_re_meta(c)) {
6101 if ((c = tokadd_escape(&enc)) < 0)
6103 if (has_nonascii && enc != *encp) {
6104 mixed_escape(beg, enc, *encp);
/* Expanding literals convert the escape to its character value. */
6108 else if (func & STR_FUNC_EXPAND) {
6110 if (func & STR_FUNC_ESCAPE) tokadd('\\');
6111 c = read_escape(0, &enc);
6113 else if ((func & STR_FUNC_QWORDS) && ISSPACE(c)) {
6114 /* ignore backslashed spaces in %w */
/* A backslash before anything other than a delimiter (body not visible). */
6116 else if (c != term && !(paren && c == paren)) {
/* Non-ASCII source byte: add the whole multibyte character. */
6123 else if (!parser_isascii()) {
6127 mixed_error(enc, *encp);
6130 if (tokadd_mbchar(c) == -1) return -1;
/* Unescaped whitespace in a word list (body not visible). */
6133 else if ((func & STR_FUNC_QWORDS) && ISSPACE(c)) {
6140 mixed_error(enc, *encp);
/* Build a NODE_STRTERM node through rb_node_newnode().
 *   - first value:  `func`, passed through unchanged
 *   - second value: `term` OR-ed with `paren` shifted left by CHAR_BIT * 2
 *                   bits, i.e. both characters packed into one value
 *   - third value:  0
 * NOTE(review): the nd_term()/nd_paren() accessors used by the string
 * scanner presumably unpack the second value -- their definitions are not
 * visible here, confirm before changing the shift width. */
6150 #define NEW_STRTERM(func, term, paren) \
6151 rb_node_newnode(NODE_STRTERM, (func), (term) | ((paren) << (CHAR_BIT * 2)), 0)
6155 ripper_flush_string_content(struct parser_params *parser, rb_encoding *enc)
6157 if (!NIL_P(parser->delayed)) {
6158 ptrdiff_t len = lex_p - parser->tokp;
6160 rb_enc_str_buf_cat(parser->delayed, parser->tokp, len, enc);
6162 ripper_dispatch_delayed_token(parser, tSTRING_CONTENT);
6163 parser->tokp = lex_p;
/* Two alternative definitions of flush_string_content(enc) follow; the
 * preprocessor conditional that selects one of them is not visible in this
 * excerpt (NOTE(review): presumably a ripper / non-ripper build split --
 * confirm).
 *
 * Variant 1: forward to ripper_flush_string_content(), supplying the
 * `parser` variable from the calling scope. */
6167 #define flush_string_content(enc) ripper_flush_string_content(parser, (enc))
/* Variant 2: no flushing; `enc` is only evaluated and its value discarded. */
6169 #define flush_string_content(enc) ((void)(enc))
6172 RUBY_FUNC_EXPORTED const unsigned int ruby_global_name_punct_bits[(0x7e - 0x20 + 31) / 32];
6173 /* this can be shared with ripper, since it's independent from struct
/* Contribution of character `c` to word `idx` of a bitmap made of 32-bit
 * words: when (c / 32 - 1) equals `idx` the result is the single bit
 * 1U << (c % 32), otherwise it is 0.  Note that `idx` is not parenthesised
 * in the expansion, so pass a simple expression. */
6176 #define BIT(c, idx) (((c) / 32 - 1 == idx) ? (1U << ((c) % 32)) : 0)
6177 #define SPECIAL_PUNCT(idx) ( \
6178 BIT('~', idx) | BIT('*', idx) | BIT('$', idx) | BIT('?', idx) | \
6179 BIT('!', idx) | BIT('@', idx) | BIT('/', idx) | BIT('\\', idx) | \
6180 BIT(';', idx) | BIT(',', idx) | BIT('.', idx) | BIT('=', idx) | \
6181 BIT(':', idx) | BIT('<', idx) | BIT('>', idx) | BIT('\"', idx) | \
6182 BIT('&', idx) | BIT('`', idx) | BIT('\'', idx) | BIT('+', idx) | \
6184 const unsigned int ruby_global_name_punct_bits[] = {
6190 #undef SPECIAL_PUNCT
6194 is_global_name_punct(const char c)
6196 if (c <= 0x20 || 0x7e < c) return 0;
6197 return (ruby_global_name_punct_bits[(c - 0x20) / 32] >> (c % 32)) & 1;
6201 parser_peek_variable_name(struct parser_params *parser)
6204 const char *p = lex_p;
6206 if (p + 1 >= lex_pend) return 0;
6210 if ((c = *p) == '-') {
6211 if (++p >= lex_pend) return 0;
6214 else if (is_global_name_punct(c) || ISDIGIT(c)) {
6215 return tSTRING_DVAR;
6219 if ((c = *p) == '@') {
6220 if (++p >= lex_pend) return 0;
6226 command_start = TRUE;
6227 return tSTRING_DBEG;
6231 if (!ISASCII(c) || c == '_' || ISALPHA(c))
6232 return tSTRING_DVAR;
6237 parser_parse_string(struct parser_params *parser, NODE *quote)
6239 int func = (int)quote->nd_func;
6240 int term = nd_term(quote);
6241 int paren = nd_paren(quote);
6243 rb_encoding *enc = current_enc;
6245 if (func == -1) return tSTRING_END;
6247 if ((func & STR_FUNC_QWORDS) && ISSPACE(c)) {
6248 do {c = nextc();} while (ISSPACE(c));
6251 if (c == term && !quote->nd_nest) {
6252 if (func & STR_FUNC_QWORDS) {
6253 quote->nd_func = -1;
6256 if (!(func & STR_FUNC_REGEXP)) return tSTRING_END;
6257 set_yylval_num(regx_options());
6265 if ((func & STR_FUNC_EXPAND) && c == '#') {
6266 int t = parser_peek_variable_name(parser);
6272 if (tokadd_string(func, term, paren, &quote->nd_nest,
6274 ruby_sourceline = nd_line(quote);
6275 if (func & STR_FUNC_REGEXP) {
6277 compile_error(PARSER_ARG "unterminated regexp meets end of file");
6282 compile_error(PARSER_ARG "unterminated string meets end of file");
6288 set_yylval_str(STR_NEW3(tok(), toklen(), enc, func));
6289 flush_string_content(enc);
6291 return tSTRING_CONTENT;
6295 parser_heredoc_identifier(struct parser_params *parser)
6297 int c = nextc(), term, func = 0;
6302 func = STR_FUNC_INDENT;
6306 func |= str_squote; goto quoted;
6308 func |= str_dquote; goto quoted;
6315 while ((c = nextc()) != -1 && c != term) {
6316 if (tokadd_mbchar(c) == -1) return 0;
6319 compile_error(PARSER_ARG "unterminated here document identifier");
6325 if (!parser_is_identchar()) {
6327 if (func & STR_FUNC_INDENT) {
6334 tokadd(func |= str_dquote);
6336 if (tokadd_mbchar(c) == -1) return 0;
6337 } while ((c = nextc()) != -1 && parser_is_identchar());
6344 ripper_dispatch_scan_event(parser, tHEREDOC_BEG);
6346 len = lex_p - lex_pbeg;
6347 lex_goto_eol(parser);
6348 lex_strterm = rb_node_newnode(NODE_HEREDOC,
6349 STR_NEW(tok(), toklen()), /* nd_lit */
6351 lex_lastline); /* nd_orig */
6352 nd_set_line(lex_strterm, ruby_sourceline);
6353 ripper_flush(parser);
6354 return term == '`' ? tXSTRING_BEG : tSTRING_BEG;
6358 parser_heredoc_restore(struct parser_params *parser, NODE *here)
6362 line = here->nd_orig;
6363 lex_lastline = line;
6364 lex_pbeg = RSTRING_PTR(line);
6365 lex_pend = lex_pbeg + RSTRING_LEN(line);
6366 lex_p = lex_pbeg + here->nd_nth;
6367 heredoc_end = ruby_sourceline;
6368 ruby_sourceline = nd_line(here);
6369 dispose_string(here->nd_lit);
6370 rb_gc_force_recycle((VALUE)here);
6371 ripper_flush(parser);
6375 parser_whole_match_p(struct parser_params *parser,
6376 const char *eos, long len, int indent)
6378 const char *p = lex_pbeg;
6382 while (*p && ISSPACE(*p)) p++;
6384 n = lex_pend - (p + len);
6385 if (n < 0 || (n > 0 && p[len] != '\n' && p[len] != '\r')) return FALSE;
6386 return strncmp(eos, p, len) == 0;
6391 ripper_dispatch_heredoc_end(struct parser_params *parser)
6393 if (!NIL_P(parser->delayed))
6394 ripper_dispatch_delayed_token(parser, tSTRING_CONTENT);
6395 lex_goto_eol(parser);
6396 ripper_dispatch_ignored_scan_event(parser, tHEREDOC_END);
/* Two alternative definitions of dispatch_heredoc_end() follow; the
 * preprocessor conditional that selects one of them is not visible in this
 * excerpt (NOTE(review): presumably a ripper / non-ripper build split --
 * confirm).
 *
 * Variant 1: call ripper_dispatch_heredoc_end() with the `parser` variable
 * from the calling scope. */
6399 #define dispatch_heredoc_end() ripper_dispatch_heredoc_end(parser)
/* Variant 2: expands to a no-op expression. */
6401 #define dispatch_heredoc_end() ((void)0)
6405 parser_here_document(struct parser_params *parser, NODE *here)
6407 int c, func, indent = 0;
6408 const char *eos, *p, *pend;
6411 rb_encoding *enc = current_enc;
6413 eos = RSTRING_PTR(here->nd_lit);
6414 len = RSTRING_LEN(here->nd_lit) - 1;
6415 indent = (func = *eos++) & STR_FUNC_INDENT;
6417 if ((c = nextc()) == -1) {
6419 compile_error(PARSER_ARG "can't find string \"%s\" anywhere before EOF", eos);
6421 if (NIL_P(parser->delayed)) {
6422 ripper_dispatch_scan_event(parser, tSTRING_CONTENT);
6426 ((len = lex_p - parser->tokp) > 0 &&
6427 (str = STR_NEW3(parser->tokp, len, enc, func), 1))) {
6428 rb_str_append(parser->delayed, str);
6430 ripper_dispatch_delayed_token(parser, tSTRING_CONTENT);
6432 lex_goto_eol(parser);
6435 heredoc_restore(lex_strterm);
6439 if (was_bol() && whole_match_p(eos, len, indent)) {
6440 dispatch_heredoc_end();
6441 heredoc_restore(lex_strterm);
6445 if (!(func & STR_FUNC_EXPAND)) {
6447 p = RSTRING_PTR(lex_lastline);
6452 if (--pend == p || pend[-1] != '\r') {
6461 rb_str_cat(str, p, pend - p);
6463 str = STR_NEW(p, pend - p);
6464 if (pend < lex_pend) rb_str_cat(str, "\n", 1);
6465 lex_goto_eol(parser);
6466 if (nextc() == -1) {
6468 dispose_string(str);
6473 } while (!whole_match_p(eos, len, indent));
6476 /* int mb = ENC_CODERANGE_7BIT, *mbp = &mb;*/
6479 int t = parser_peek_variable_name(parser);
6486 if ((c = tokadd_string(func, '\n', 0, NULL, &enc)) == -1) {
6487 if (parser->eofp) goto error;
6491 set_yylval_str(STR_NEW3(tok(), toklen(), enc, func));
6492 flush_string_content(enc);
6493 return tSTRING_CONTENT;
6496 /* if (mbp && mb == ENC_CODERANGE_UNKNOWN) mbp = 0;*/
6497 if ((c = nextc()) == -1) goto error;
6498 } while (!whole_match_p(eos, len, indent));
6499 str = STR_NEW3(tok(), toklen(), enc, func);
6501 dispatch_heredoc_end();
6502 heredoc_restore(lex_strterm);
6503 lex_strterm = NEW_STRTERM(-1, 0, 0);
6504 set_yylval_str(str);
6505 return tSTRING_CONTENT;
6511 arg_ambiguous_gen(struct parser_params *parser)
6514 rb_warning0("ambiguous first argument; put parentheses or even spaces");
6516 dispatch0(arg_ambiguous);
/* Call arg_ambiguous_gen() with the `parser` variable from the calling
 * scope and evaluate to 1.  The constant result lets the macro be used as
 * an operand of `&&` in the lexer (e.g. `IS_SPCARG(c) && arg_ambiguous()`)
 * so that reporting the ambiguity never makes the condition false. */
6519 #define arg_ambiguous() (arg_ambiguous_gen(parser), 1)
6522 formal_argument_gen(struct parser_params *parser, ID lhs)
6525 if (!is_local_id(lhs))
6526 yyerror("formal argument must be local variable");
6528 shadowing_lvar(lhs);
6533 lvar_defined_gen(struct parser_params *parser, ID id)
6535 return (dyna_in_block() && dvar_defined_get(id)) || local_id(id);
6538 /* emacsen -*- hack */
6540 parser_encode_length(struct parser_params *parser, const char *name, long len)
6544 if (len > 5 && name[nlen = len - 5] == '-') {
6545 if (rb_memcicmp(name + nlen + 1, "unix", 4) == 0)
6548 if (len > 4 && name[nlen = len - 4] == '-') {
6549 if (rb_memcicmp(name + nlen + 1, "dos", 3) == 0)
6551 if (rb_memcicmp(name + nlen + 1, "mac", 3) == 0 &&
6552 !(len == 8 && rb_memcicmp(name, "utf8-mac", len) == 0))
6553 /* exclude UTF8-MAC because the encoding named "UTF8" doesn't exist in Ruby */
6560 parser_set_encode(struct parser_params *parser, const char *name)
6562 int idx = rb_enc_find_index(name);
6567 excargs[1] = rb_sprintf("unknown encoding name: %s", name);
6569 excargs[0] = rb_eArgError;
6570 excargs[2] = rb_make_backtrace();
6571 rb_ary_unshift(excargs[2], rb_sprintf("%s:%d", ruby_sourcefile, ruby_sourceline));
6572 rb_exc_raise(rb_make_exception(3, excargs));
6574 enc = rb_enc_from_index(idx);
6575 if (!rb_enc_asciicompat(enc)) {
6576 excargs[1] = rb_sprintf("%s is not ASCII compatible", rb_enc_name(enc));
6581 if (ruby_debug_lines) {
6582 long i, n = RARRAY_LEN(ruby_debug_lines);
6583 const VALUE *p = RARRAY_PTR(ruby_debug_lines);
6584 for (i = 0; i < n; ++i) {
6585 rb_enc_associate_index(*p, idx);
6592 comment_at_top(struct parser_params *parser)
6594 const char *p = lex_pbeg, *pend = lex_p - 1;
6595 if (parser->line_count != (parser->has_shebang ? 2 : 1)) return 0;
6597 if (!ISSPACE(*p)) return 0;
/* Callback type stored in the `length` member of struct magic_comment.
 * It receives the parser, a pointer to text and a length, and returns a
 * long; parser_magic_comment() invokes it on the start of the value and
 * uses the result as the new value length. */
6604 typedef long (*rb_magic_comment_length_t)(struct parser_params *parser, const char *name, long len);
/* Callback type stored in the `func` member of struct magic_comment.
 * It receives the parser, the comment's name and its value as C strings
 * and returns nothing. */
6605 typedef void (*rb_magic_comment_setter_t)(struct parser_params *parser, const char *name, const char *val);
6608 magic_comment_encoding(struct parser_params *parser, const char *name, const char *val)
6610 if (!comment_at_top(parser)) {
6613 parser_set_encode(parser, val);
6617 parser_set_token_info(struct parser_params *parser, const char *name, const char *val)
6619 int *p = &parser->parser_token_info_enabled;
6623 if (strcasecmp(val, "true") == 0) {
6629 if (strcasecmp(val, "false") == 0) {
6635 rb_compile_warning(ruby_sourcefile, ruby_sourceline, "invalid value for %s: %s", name, val);
6638 struct magic_comment {
6640 rb_magic_comment_setter_t func;
6641 rb_magic_comment_length_t length;
6644 static const struct magic_comment magic_comments[] = {
6645 {"coding", magic_comment_encoding, parser_encode_length},
6646 {"encoding", magic_comment_encoding, parser_encode_length},
6647 {"warn_indent", parser_set_token_info},
6652 magic_comment_marker(const char *str, long len)
6659 if (str[i-1] == '*' && str[i-2] == '-') {
6665 if (i + 1 >= len) return 0;
6666 if (str[i+1] != '-') {
6669 else if (str[i-1] != '-') {
6685 parser_magic_comment(struct parser_params *parser, const char *str, long len)
6687 VALUE name = 0, val = 0;
6688 const char *beg, *end, *vbeg, *vend;
6689 #define str_copy(_s, _p, _n) ((_s) \
6690 ? (void)(rb_str_resize((_s), (_n)), \
6691 MEMCPY(RSTRING_PTR(_s), (_p), char, (_n)), (_s)) \
6692 : (void)((_s) = STR_NEW((_p), (_n))))
6694 if (len <= 7) return FALSE;
6695 if (!(beg = magic_comment_marker(str, len))) return FALSE;
6696 if (!(end = magic_comment_marker(beg, str + len - beg))) return FALSE;
6698 len = end - beg - 3;
6700 /* %r"([^\\s\'\":;]+)\\s*:\\s*(\"(?:\\\\.|[^\"])*\"|[^\"\\s;]+)[\\s;]*" */
6703 const struct magic_comment *p = magic_comments;
6709 for (; len > 0 && *str; str++, --len) {
6711 case '\'': case '"': case ':': case ';':
6714 if (!ISSPACE(*str)) break;
6716 for (beg = str; len > 0; str++, --len) {
6718 case '\'': case '"': case ':': case ';':
6721 if (ISSPACE(*str)) break;
6726 for (end = str; len > 0 && ISSPACE(*str); str++, --len);
6728 if (*str != ':') continue;
6730 do str++; while (--len > 0 && ISSPACE(*str));
6733 for (vbeg = ++str; --len > 0 && *str != '"'; str++) {
6746 for (vbeg = str; len > 0 && *str != '"' && *str != ';' && !ISSPACE(*str); --len, str++);
6749 while (len > 0 && (*str == ';' || ISSPACE(*str))) --len, str++;
6752 str_copy(name, beg, n);
6753 s = RSTRING_PTR(name);
6754 for (i = 0; i < n; ++i) {
6755 if (s[i] == '-') s[i] = '_';
6759 if (STRNCASECMP(p->name, s, n) == 0) {
6762 n = (*p->length)(parser, vbeg, n);
6764 str_copy(val, vbeg, n);
6765 (*p->func)(parser, s, RSTRING_PTR(val));
6768 } while (++p < magic_comments + numberof(magic_comments));
6770 str_copy(val, vbeg, vend - vbeg);
6771 dispatch2(magic_comment, name, val);
6779 set_file_encoding(struct parser_params *parser, const char *str, const char *send)
6782 const char *beg = str;
6786 if (send - str <= 6) return;
6788 case 'C': case 'c': str += 6; continue;
6789 case 'O': case 'o': str += 5; continue;
6790 case 'D': case 'd': str += 4; continue;
6791 case 'I': case 'i': str += 3; continue;
6792 case 'N': case 'n': str += 2; continue;
6793 case 'G': case 'g': str += 1; continue;
6800 if (ISSPACE(*str)) break;
6803 if (STRNCASECMP(str-6, "coding", 6) == 0) break;
6807 if (++str >= send) return;
6808 } while (ISSPACE(*str));
6810 if (*str != '=' && *str != ':') return;
6815 while ((*str == '-' || *str == '_' || ISALNUM(*str)) && ++str < send);
6816 s = rb_str_new(beg, parser_encode_length(parser, beg, str - beg));
6817 parser_set_encode(parser, RSTRING_PTR(s));
6818 rb_str_resize(s, 0);
6822 parser_prepare(struct parser_params *parser)
6827 if (peek('!')) parser->has_shebang = 1;
6829 case 0xef: /* UTF-8 BOM marker */
6830 if (lex_pend - lex_p >= 2 &&
6831 (unsigned char)lex_p[0] == 0xbb &&
6832 (unsigned char)lex_p[1] == 0xbf) {
6833 parser->enc = rb_utf8_encoding();
6843 parser->enc = rb_enc_get(lex_lastline);
/* Lexer-state predicates.  All of them are built on IS_lex_state(), which
 * is defined elsewhere and tests the current lexer state against the given
 * EXPR_* mask; several also read the local variables `space_seen` and
 * `cmd_state` of the calling function, so they are only usable inside the
 * lexer. */
/* Current state matches EXPR_ARG_ANY. */
6846 #define IS_ARG() IS_lex_state(EXPR_ARG_ANY)
/* Current state matches EXPR_END_ANY. */
6847 #define IS_END() IS_lex_state(EXPR_END_ANY)
/* Current state matches EXPR_BEG_ANY. */
6848 #define IS_BEG() IS_lex_state(EXPR_BEG_ANY)
/* In an argument state, whitespace was seen before the current token
 * (`space_seen`), and the character `c` is not whitespace. */
6849 #define IS_SPCARG(c) (IS_ARG() && space_seen && !ISSPACE(c))
/* Either the state matches EXPR_BEG | EXPR_ENDFN while `cmd_state` is
 * false, or IS_ARG() holds. */
6850 #define IS_LABEL_POSSIBLE() ((IS_lex_state(EXPR_BEG | EXPR_ENDFN) && !cmd_state) || IS_ARG())
/* A ':' is found by peek_n() at offset `n` and no ':' at offset n + 1,
 * i.e. a single colon rather than "::". */
6851 #define IS_LABEL_SUFFIX(n) (peek_n(':',(n)) && !peek_n(':', (n)+1))
/* Current state matches EXPR_FNAME | EXPR_DOT. */
6852 #define IS_AFTER_OPERATOR() IS_lex_state(EXPR_FNAME | EXPR_DOT)
/* Two alternative definitions of ambiguous_operator(op, syn) follow; the
 * preprocessor conditional that selects one of them is not visible in this
 * excerpt (NOTE(review): presumably a ripper / non-ripper build split --
 * confirm).
 *
 * Variant 1: emit two warnings through rb_warning0().  `op` and `syn` are
 * pasted into the messages by string-literal concatenation, so both
 * arguments must be string literals. */
6855 #define ambiguous_operator(op, syn) ( \
6856 rb_warning0("`"op"' after local variable is interpreted as binary operator"), \
6857 rb_warning0("even though it seems like "syn""))
/* Variant 2: dispatch an operator_ambiguous event with two arguments,
 * ripper_intern(op) and a string created from `syn` by rb_str_new_cstr(). */
6859 #define ambiguous_operator(op, syn) dispatch2(operator_ambiguous, ripper_intern(op), rb_str_new_cstr(syn))
/* Report an ambiguous operator via ambiguous_operator(op, syn), but only
 * when all of the following hold (evaluated left to right with `&&`):
 *   - `last_state` does not match any of EXPR_CLASS, EXPR_DOT, EXPR_FNAME,
 *     EXPR_ENDFN or EXPR_ENDARG according to IS_lex_state_for();
 *   - `space_seen` is set;
 *   - the character `c` is not whitespace.
 * `last_state`, `space_seen` and `c` are taken from the calling scope.
 * The whole expression is cast to void, so the macro yields no value. */
6861 #define warn_balanced(op, syn) ((void) \
6862 (!IS_lex_state_for(last_state, EXPR_CLASS|EXPR_DOT|EXPR_FNAME|EXPR_ENDFN|EXPR_ENDARG) && \
6863 space_seen && !ISSPACE(c) && \
6864 (ambiguous_operator(op, syn), 0)))
6867 parser_yylex(struct parser_params *parser)
6872 enum lex_state_e last_state;
6876 int fallthru = FALSE;
6881 if (nd_type(lex_strterm) == NODE_HEREDOC) {
6882 token = here_document(lex_strterm);
6883 if (token == tSTRING_END) {
6885 lex_state = EXPR_END;
6889 token = parse_string(lex_strterm);
6890 if (token == tSTRING_END || token == tREGEXP_END) {
6891 rb_gc_force_recycle((VALUE)lex_strterm);
6893 lex_state = EXPR_END;
6898 cmd_state = command_start;
6899 command_start = FALSE;
6901 last_state = lex_state;
6902 switch (c = nextc()) {
6903 case '\0': /* NUL */
6904 case '\004': /* ^D */
6905 case '\032': /* ^Z */
6906 case -1: /* end of script. */
6910 case ' ': case '\t': case '\f': case '\r':
6911 case '\13': /* '\v' */
6914 while ((c = nextc())) {
6916 case ' ': case '\t': case '\f': case '\r':
6917 case '\13': /* '\v' */
6925 ripper_dispatch_scan_event(parser, tSP);
6929 case '#': /* it's a comment */
6930 /* no magic_comment in shebang line */
6931 if (!parser_magic_comment(parser, lex_p, lex_pend - lex_p)) {
6932 if (comment_at_top(parser)) {
6933 set_file_encoding(parser, lex_p, lex_pend);
6938 ripper_dispatch_scan_event(parser, tCOMMENT);
6943 if (IS_lex_state(EXPR_BEG | EXPR_VALUE | EXPR_CLASS | EXPR_FNAME | EXPR_DOT)) {
6946 ripper_dispatch_scan_event(parser, tIGNORED_NL);
6952 while ((c = nextc())) {
6954 case ' ': case '\t': case '\f': case '\r':
6955 case '\13': /* '\v' */
6959 if ((c = nextc()) != '.') {
6967 lex_nextline = lex_lastline;
6968 case -1: /* EOF no decrement*/
6969 lex_goto_eol(parser);
6972 parser->tokp = lex_p;
6975 goto normal_newline;
6979 command_start = TRUE;
6980 lex_state = EXPR_BEG;
6984 if ((c = nextc()) == '*') {
6985 if ((c = nextc()) == '=') {
6986 set_yylval_id(tPOW);
6987 lex_state = EXPR_BEG;
6992 rb_warning0("`**' interpreted as argument prefix");
6995 else if (IS_BEG()) {
6999 warn_balanced("**", "argument prefix");
7006 lex_state = EXPR_BEG;
7011 rb_warning0("`*' interpreted as argument prefix");
7014 else if (IS_BEG()) {
7018 warn_balanced("*", "argument prefix");
7022 lex_state = IS_AFTER_OPERATOR() ? EXPR_ARG : EXPR_BEG;
7027 if (IS_AFTER_OPERATOR()) {
7028 lex_state = EXPR_ARG;
7034 lex_state = EXPR_BEG;
7047 /* skip embedded rd document */
7048 if (strncmp(lex_p, "begin", 5) == 0 && ISSPACE(lex_p[5])) {
7052 lex_goto_eol(parser);
7053 ripper_dispatch_scan_event(parser, tEMBDOC_BEG);
7056 lex_goto_eol(parser);
7059 ripper_dispatch_scan_event(parser, tEMBDOC);
7065 compile_error(PARSER_ARG "embedded document meets end of file");
7068 if (c != '=') continue;
7069 if (strncmp(lex_p, "end", 3) == 0 &&
7070 (lex_p + 3 == lex_pend || ISSPACE(lex_p[3]))) {
7074 lex_goto_eol(parser);
7076 ripper_dispatch_scan_event(parser, tEMBDOC_END);
7082 lex_state = IS_AFTER_OPERATOR() ? EXPR_ARG : EXPR_BEG;
7083 if ((c = nextc()) == '=') {
7084 if ((c = nextc()) == '=') {
7093 else if (c == '>') {
7100 last_state = lex_state;
7103 !IS_lex_state(EXPR_DOT | EXPR_CLASS) &&
7105 (!IS_ARG() || space_seen)) {
7106 int token = heredoc_identifier();
7107 if (token) return token;
7109 if (IS_AFTER_OPERATOR()) {
7110 lex_state = EXPR_ARG;
7113 if (IS_lex_state(EXPR_CLASS))
7114 command_start = TRUE;
7115 lex_state = EXPR_BEG;
7118 if ((c = nextc()) == '>') {
7125 if ((c = nextc()) == '=') {
7126 set_yylval_id(tLSHFT);
7127 lex_state = EXPR_BEG;
7131 warn_balanced("<<", "here document");
7138 lex_state = IS_AFTER_OPERATOR() ? EXPR_ARG : EXPR_BEG;
7139 if ((c = nextc()) == '=') {
7143 if ((c = nextc()) == '=') {
7144 set_yylval_id(tRSHFT);
7145 lex_state = EXPR_BEG;
7155 lex_strterm = NEW_STRTERM(str_dquote, '"', 0);
7159 if (IS_lex_state(EXPR_FNAME)) {
7160 lex_state = EXPR_ENDFN;
7163 if (IS_lex_state(EXPR_DOT)) {
7165 lex_state = EXPR_CMDARG;
7167 lex_state = EXPR_ARG;
7170 lex_strterm = NEW_STRTERM(str_xquote, '`', 0);
7171 return tXSTRING_BEG;
7174 lex_strterm = NEW_STRTERM(str_squote, '\'', 0);
7179 lex_state = EXPR_VALUE;
7184 compile_error(PARSER_ARG "incomplete character syntax");
7187 if (rb_enc_isspace(c, current_enc)) {
7211 rb_warnI("invalid character syntax; use ?\\%c", c2);
7216 lex_state = EXPR_VALUE;
7221 if (!parser_isascii()) {
7222 if (tokadd_mbchar(c) == -1) return 0;
7224 else if ((rb_enc_isalnum(c, current_enc) || c == '_') &&
7225 lex_p < lex_pend && is_identchar(lex_p, lex_pend, current_enc)) {
7228 else if (c == '\\') {
7231 c = parser_tokadd_utf8(parser, &enc, 0, 0, 0);
7239 else if (!lex_eol_p() && !(c = *lex_p, ISASCII(c))) {
7241 if (tokadd_mbchar(c) == -1) return 0;
7244 c = read_escape(0, &enc);
7252 set_yylval_str(STR_NEW3(tok(), toklen(), enc, 0));
7253 lex_state = EXPR_END;
7257 if ((c = nextc()) == '&') {
7258 lex_state = EXPR_BEG;
7259 if ((c = nextc()) == '=') {
7260 set_yylval_id(tANDOP);
7261 lex_state = EXPR_BEG;
7267 else if (c == '=') {
7269 lex_state = EXPR_BEG;
7274 rb_warning0("`&' interpreted as argument prefix");
7277 else if (IS_BEG()) {
7281 warn_balanced("&", "argument prefix");
7284 lex_state = IS_AFTER_OPERATOR() ? EXPR_ARG : EXPR_BEG;
7288 if ((c = nextc()) == '|') {
7289 lex_state = EXPR_BEG;
7290 if ((c = nextc()) == '=') {
7291 set_yylval_id(tOROP);
7292 lex_state = EXPR_BEG;
7300 lex_state = EXPR_BEG;
7303 lex_state = IS_AFTER_OPERATOR() ? EXPR_ARG : EXPR_BEG;
7309 if (IS_AFTER_OPERATOR()) {
7310 lex_state = EXPR_ARG;
7319 lex_state = EXPR_BEG;
7322 if (IS_BEG() || (IS_SPCARG(c) && arg_ambiguous())) {
7323 lex_state = EXPR_BEG;
7325 if (c != -1 && ISDIGIT(c)) {
7331 lex_state = EXPR_BEG;
7333 warn_balanced("+", "unary operator");
7338 if (IS_AFTER_OPERATOR()) {
7339 lex_state = EXPR_ARG;
7348 lex_state = EXPR_BEG;
7352 lex_state = EXPR_ENDFN;
7355 if (IS_BEG() || (IS_SPCARG(c) && arg_ambiguous())) {
7356 lex_state = EXPR_BEG;
7358 if (c != -1 && ISDIGIT(c)) {
7363 lex_state = EXPR_BEG;
7365 warn_balanced("-", "unary operator");
7369 lex_state = EXPR_BEG;
7370 if ((c = nextc()) == '.') {
7371 if ((c = nextc()) == '.') {
7378 if (c != -1 && ISDIGIT(c)) {
7379 yyerror("no .<digit> floating literal anymore; put 0 before dot");
7381 lex_state = EXPR_DOT;
7385 case '0': case '1': case '2': case '3': case '4':
7386 case '5': case '6': case '7': case '8': case '9':
7388 int is_float, seen_point, seen_e, nondigit;
7390 is_float = seen_point = seen_e = nondigit = 0;
7391 lex_state = EXPR_END;
7393 if (c == '-' || c == '+') {
7398 #define no_digits() do {yyerror("numeric literal without digits"); return 0;} while (0)
7399 int start = toklen();
7401 if (c == 'x' || c == 'X') {
7404 if (c != -1 && ISXDIGIT(c)) {
7407 if (nondigit) break;
7411 if (!ISXDIGIT(c)) break;
7414 } while ((c = nextc()) != -1);
7418 if (toklen() == start) {
7421 else if (nondigit) goto trailing_uc;
7422 set_yylval_literal(rb_cstr_to_inum(tok(), 16, FALSE));
7425 if (c == 'b' || c == 'B') {
7428 if (c == '0' || c == '1') {
7431 if (nondigit) break;
7435 if (c != '0' && c != '1') break;
7438 } while ((c = nextc()) != -1);
7442 if (toklen() == start) {
7445 else if (nondigit) goto trailing_uc;
7446 set_yylval_literal(rb_cstr_to_inum(tok(), 2, FALSE));
7449 if (c == 'd' || c == 'D') {
7452 if (c != -1 && ISDIGIT(c)) {
7455 if (nondigit) break;
7459 if (!ISDIGIT(c)) break;
7462 } while ((c = nextc()) != -1);
7466 if (toklen() == start) {
7469 else if (nondigit) goto trailing_uc;
7470 set_yylval_literal(rb_cstr_to_inum(tok(), 10, FALSE));
7477 if (c == 'o' || c == 'O') {
7478 /* prefixed octal */
7480 if (c == -1 || c == '_' || !ISDIGIT(c)) {
7484 if (c >= '0' && c <= '7') {
7489 if (nondigit) break;
7493 if (c < '0' || c > '9') break;
7494 if (c > '7') goto invalid_octal;
7497 } while ((c = nextc()) != -1);
7498 if (toklen() > start) {
7501 if (nondigit) goto trailing_uc;
7502 set_yylval_literal(rb_cstr_to_inum(tok(), 8, FALSE));
7510 if (c > '7' && c <= '9') {
7512 yyerror("Invalid octal digit");
7514 else if (c == '.' || c == 'e' || c == 'E') {
7519 set_yylval_literal(INT2FIX(0));
7526 case '0': case '1': case '2': case '3': case '4':
7527 case '5': case '6': case '7': case '8': case '9':
7533 if (nondigit) goto trailing_uc;
7534 if (seen_point || seen_e) {
7539 if (c0 == -1 || !ISDIGIT(c0)) {
7567 if (c != '-' && c != '+') continue;
7572 case '_': /* `_' in number just ignored */
7573 if (nondigit) goto decode_num;
7588 snprintf(tmp, sizeof(tmp), "trailing `%c' in number", nondigit);
7593 double d = strtod(tok(), 0);
7594 if (errno == ERANGE) {
7595 rb_warningS("Float %s out of range", tok());
7598 set_yylval_literal(DBL2NUM(d));
7601 set_yylval_literal(rb_cstr_to_inum(tok(), 10, FALSE));
7612 lex_state = EXPR_ENDFN;
7614 lex_state = EXPR_ENDARG;
7616 if (!brace_nest--) c = tSTRING_DEND;
7623 if (IS_BEG() || IS_lex_state(EXPR_CLASS) || IS_SPCARG(-1)) {
7624 lex_state = EXPR_BEG;
7627 lex_state = EXPR_DOT;
7630 if (IS_END() || ISSPACE(c)) {
7632 warn_balanced(":", "symbol literal");
7633 lex_state = EXPR_BEG;
7638 lex_strterm = NEW_STRTERM(str_ssym, c, 0);
7641 lex_strterm = NEW_STRTERM(str_dsym, c, 0);
7647 lex_state = EXPR_FNAME;
7651 if (IS_lex_state(EXPR_BEG_ANY)) {
7652 lex_strterm = NEW_STRTERM(str_regexp, '/', 0);
7655 if ((c = nextc()) == '=') {
7657 lex_state = EXPR_BEG;
7662 (void)arg_ambiguous();
7663 lex_strterm = NEW_STRTERM(str_regexp, '/', 0);
7666 lex_state = IS_AFTER_OPERATOR() ? EXPR_ARG : EXPR_BEG;
7667 warn_balanced("/", "regexp literal");
7671 if ((c = nextc()) == '=') {
7673 lex_state = EXPR_BEG;
7676 lex_state = IS_AFTER_OPERATOR() ? EXPR_ARG : EXPR_BEG;
7681 lex_state = EXPR_BEG;
7682 command_start = TRUE;
7686 lex_state = EXPR_BEG;
7690 if (IS_AFTER_OPERATOR()) {
7691 if ((c = nextc()) != '@') {
7694 lex_state = EXPR_ARG;
7697 lex_state = EXPR_BEG;
7705 else if (IS_SPCARG(-1)) {
7711 lex_state = EXPR_BEG;
7716 if (IS_AFTER_OPERATOR()) {
7717 lex_state = EXPR_ARG;
7718 if ((c = nextc()) == ']') {
7719 if ((c = nextc()) == '=') {
7728 else if (IS_BEG()) {
7731 else if (IS_ARG() && space_seen) {
7734 lex_state = EXPR_BEG;
7741 if (lpar_beg && lpar_beg == paren_nest) {
7742 lex_state = EXPR_BEG;
7749 if (IS_ARG() || IS_lex_state(EXPR_END | EXPR_ENDFN))
7750 c = '{'; /* block (primary) */
7751 else if (IS_lex_state(EXPR_ENDARG))
7752 c = tLBRACE_ARG; /* block (expr) */
7754 c = tLBRACE; /* hash */
7757 lex_state = EXPR_BEG;
7758 if (c != tLBRACE) command_start = TRUE;
7766 ripper_dispatch_scan_event(parser, tSP);
7768 goto retry; /* skip \\n */
7774 if (IS_lex_state(EXPR_BEG_ANY)) {
7780 if (c == -1 || !ISALNUM(c)) {
7786 if (rb_enc_isalnum(term, current_enc) || !parser_isascii()) {
7787 yyerror("unknown type of %string");
7791 if (c == -1 || term == -1) {
7792 compile_error(PARSER_ARG "unterminated quoted string meets end of file");
7796 if (term == '(') term = ')';
7797 else if (term == '[') term = ']';
7798 else if (term == '{') term = '}';
7799 else if (term == '<') term = '>';
7804 lex_strterm = NEW_STRTERM(str_dquote, term, paren);
7808 lex_strterm = NEW_STRTERM(str_squote, term, paren);
7812 lex_strterm = NEW_STRTERM(str_dword, term, paren);
7813 do {c = nextc();} while (ISSPACE(c));
7818 lex_strterm = NEW_STRTERM(str_sword, term, paren);
7819 do {c = nextc();} while (ISSPACE(c));
7824 lex_strterm = NEW_STRTERM(str_dword, term, paren);
7825 do {c = nextc();} while (ISSPACE(c));
7827 return tSYMBOLS_BEG;
7830 lex_strterm = NEW_STRTERM(str_sword, term, paren);
7831 do {c = nextc();} while (ISSPACE(c));
7833 return tQSYMBOLS_BEG;
7836 lex_strterm = NEW_STRTERM(str_xquote, term, paren);
7837 return tXSTRING_BEG;
7840 lex_strterm = NEW_STRTERM(str_regexp, term, paren);
7844 lex_strterm = NEW_STRTERM(str_ssym, term, paren);
7845 lex_state = EXPR_FNAME;
7849 yyerror("unknown type of %string");
7853 if ((c = nextc()) == '=') {
7855 lex_state = EXPR_BEG;
7861 lex_state = IS_AFTER_OPERATOR() ? EXPR_ARG : EXPR_BEG;
7863 warn_balanced("%%", "string literal");
7867 lex_state = EXPR_END;
7871 case '_': /* $_: last read line string */
7873 if (parser_is_identchar()) {
7881 case '~': /* $~: match-data */
7882 case '*': /* $*: argv */
7883 case '$': /* $$: pid */
7884 case '?': /* $?: last status */
7885 case '!': /* $!: error string */
7886 case '@': /* $@: error position */
7887 case '/': /* $/: input record separator */
7888 case '\\': /* $\: output record separator */
7889 case ';': /* $;: field separator */
7890 case ',': /* $,: output field separator */
7891 case '.': /* $.: last read line number */
7892 case '=': /* $=: ignorecase */
7893 case ':': /* $:: load path */
7894 case '<': /* $<: reading filename */
7895 case '>': /* $>: default output handle */
7896 case '\"': /* $": already loaded files */
7900 set_yylval_name(rb_intern(tok()));
7907 if (parser_is_identchar()) {
7908 if (tokadd_mbchar(c) == -1) return 0;
7915 set_yylval_name(rb_intern(tok()));
7918 case '&': /* $&: last match */
7919 case '`': /* $`: string before last match */
7920 case '\'': /* $': string after last match */
7921 case '+': /* $+: string matches last paren. */
7922 if (IS_lex_state_for(last_state, EXPR_FNAME)) {
7927 set_yylval_node(NEW_BACK_REF(c));
7930 case '1': case '2': case '3':
7931 case '4': case '5': case '6':
7932 case '7': case '8': case '9':
7937 } while (c != -1 && ISDIGIT(c));
7939 if (IS_lex_state_for(last_state, EXPR_FNAME)) goto gvar;
7941 set_yylval_node(NEW_NTH_REF(atoi(tok()+1)));
7945 if (!parser_is_identchar()) {
7947 compile_error(PARSER_ARG "`$%c' is not allowed as a global variable name", c);
7963 if (c != -1 && (ISDIGIT(c) || !parser_is_identchar())) {
7966 compile_error(PARSER_ARG "`@%c' is not allowed as an instance variable name", c);
7969 compile_error(PARSER_ARG "`@@%c' is not allowed as a class variable name", c);
7976 if (was_bol() && whole_match_p("__END__", 7, 0)) {
7977 ruby__end__seen = 1;
7978 parser->eofp = Qtrue;
7982 lex_goto_eol(parser);
7983 ripper_dispatch_scan_event(parser, k__END__);
7991 if (!parser_is_identchar()) {
7992 compile_error(PARSER_ARG "Invalid char `\\x%02X' in expression", c);
8000 mb = ENC_CODERANGE_7BIT;
8002 if (!ISASCII(c)) mb = ENC_CODERANGE_UNKNOWN;
8003 if (tokadd_mbchar(c) == -1) return 0;
8005 } while (parser_is_identchar());
8011 if ((c == '!' || c == '?') && !peek('=')) {
8023 last_state = lex_state;
8026 lex_state = EXPR_END;
8030 lex_state = EXPR_END;
8031 if (tok()[1] == '@')
8038 if (toklast() == '!' || toklast() == '?') {
8042 if (IS_lex_state(EXPR_FNAME)) {
8043 if ((c = nextc()) == '=' && !peek('~') && !peek('>') &&
8044 (!peek('=') || (peek_n('>', 1)))) {
8045 result = tIDENTIFIER;
8053 if (result == 0 && ISUPPER(tok()[0])) {
8057 result = tIDENTIFIER;
8061 if (IS_LABEL_POSSIBLE()) {
8062 if (IS_LABEL_SUFFIX(0)) {
8063 lex_state = EXPR_BEG;
8065 set_yylval_name(TOK_INTERN(!ENC_SINGLE(mb)));
8069 if (mb == ENC_CODERANGE_7BIT && !IS_lex_state(EXPR_DOT)) {
8070 const struct kwtable *kw;
8072 /* See if it is a reserved word. */
8073 kw = rb_reserved_word(tok(), toklen());
8075 enum lex_state_e state = lex_state;
8076 lex_state = kw->state;
8077 if (state == EXPR_FNAME) {
8078 set_yylval_name(rb_intern(kw->name));
8081 if (lex_state == EXPR_BEG) {
8082 command_start = TRUE;
8084 if (kw->id[0] == keyword_do) {
8085 if (lpar_beg && lpar_beg == paren_nest) {
8088 return keyword_do_LAMBDA;
8090 if (COND_P()) return keyword_do_cond;
8091 if (CMDARG_P() && state != EXPR_CMDARG)
8092 return keyword_do_block;
8093 if (state & (EXPR_BEG | EXPR_ENDARG))
8094 return keyword_do_block;
8097 if (state & (EXPR_BEG | EXPR_VALUE))
8100 if (kw->id[0] != kw->id[1])
8101 lex_state = EXPR_BEG;
8107 if (IS_lex_state(EXPR_BEG_ANY | EXPR_ARG_ANY | EXPR_DOT)) {
8109 lex_state = EXPR_CMDARG;
8112 lex_state = EXPR_ARG;
8115 else if (lex_state == EXPR_FNAME) {
8116 lex_state = EXPR_ENDFN;
8119 lex_state = EXPR_END;
8123 ID ident = TOK_INTERN(!ENC_SINGLE(mb));
8125 set_yylval_name(ident);
8126 if (!IS_lex_state_for(last_state, EXPR_DOT|EXPR_FNAME) &&
8127 is_local_id(ident) && lvar_defined(ident)) {
8128 lex_state = EXPR_END;
8137 yylex(void *lval, void *p)
8142 struct parser_params *parser = (struct parser_params*)p;
8146 parser->parser_yylval = lval;
8147 parser->parser_yylval->val = Qundef;
8149 t = parser_yylex(parser);
8151 if (!NIL_P(parser->delayed)) {
8152 ripper_dispatch_delayed_token(parser, t);
8156 ripper_dispatch_scan_event(parser, t);
8164 node_newnode(struct parser_params *parser, enum node_type type, VALUE a0, VALUE a1, VALUE a2)
8166 NODE *n = (rb_node_newnode)(type, a0, a1, a2);
8167 nd_set_line(n, ruby_sourceline);
8171 static enum node_type
8172 nodetype(NODE *node) /* for debug */
8174 return (enum node_type)nd_type(node);
8178 nodeline(NODE *node)
8180 return nd_line(node);
8184 newline_node(NODE *node)
8187 node = remove_begin(node);
8188 node->flags |= NODE_FL_NEWLINE;
8194 fixpos(NODE *node, NODE *orig)
8198 if (orig == (NODE*)1) return;
8199 nd_set_line(node, nd_line(orig));
8203 parser_warning(struct parser_params *parser, NODE *node, const char *mesg)
8205 rb_compile_warning(ruby_sourcefile, nd_line(node), "%s", mesg);
/* Function-like macro deliberately named like the function it wraps: it
 * inserts the `parser` variable from the calling scope as the first
 * argument.  A macro is not re-expanded inside its own replacement, so the
 * inner parser_warning refers to the function. */
8207 #define parser_warning(node, mesg) parser_warning(parser, (node), (mesg))
8210 parser_warn(struct parser_params *parser, NODE *node, const char *mesg)
8212 rb_compile_warn(ruby_sourcefile, nd_line(node), "%s", mesg);
/* Function-like macro deliberately named like the function it wraps: it
 * inserts the `parser` variable from the calling scope as the first
 * argument.  A macro is not re-expanded inside its own replacement, so the
 * inner parser_warn refers to the function. */
8214 #define parser_warn(node, mesg) parser_warn(parser, (node), (mesg))
/*
 * Appends tail to the statement sequence head.
 * A null tail returns head and a null head returns tail, so either side
 * may be empty.
 */
8217 block_append_gen(struct parser_params *parser, NODE *head, NODE *tail)
8219 NODE *end, *h = head, *nd;
8221 if (tail == 0) return head;
8223 if (h == 0) return tail;
8224 switch (nd_type(h)) {
/* head is reported as an unused literal */
8231 parser_warning(h, "unused literal ignored");
/* wrap head in a new block node; h and end both refer to it */
8234 h = end = NEW_BLOCK(head);
8245 switch (nd_type(nd)) {
/* the unreachable-statement warning is emitted only in verbose mode */
8251 if (RTEST(ruby_verbose)) {
8252 parser_warning(tail, "statement not reached");
/* a tail that is not a block yet is wrapped; its nd_end points at itself */
8260 if (nd_type(tail) != NODE_BLOCK) {
8261 tail = NEW_BLOCK(tail);
8262 tail->nd_end = tail;
/* link tail after the current last element and adopt tail's end pointer */
8264 end->nd_next = tail;
8265 h->nd_end = tail->nd_end;
8269 /* append item to the list */
/*
 * A null list yields a fresh one-element list.  Otherwise a new list cell
 * holding item is linked after the current last cell, and the end pointer
 * kept in list->nd_next->nd_end is updated to that new cell.
 */
8271 list_append_gen(struct parser_params *parser, NODE *list, NODE *item)
8275 if (list == 0) return NEW_LIST(item);
8276 if (list->nd_next) {
8277 last = list->nd_next->nd_end;
8284 last->nd_next = NEW_LIST(item);
8285 list->nd_next->nd_end = last->nd_next;
8289 /* concat two lists */
/*
 * Links tail after the last cell of head, adds tail's length (nd_alen) to
 * head's, and refreshes the end pointer stored in head->nd_next->nd_end:
 * it becomes tail's own end when tail has more than one cell, otherwise
 * tail itself.
 */
8291 list_concat_gen(struct parser_params *parser, NODE *head, NODE *tail)
8295 if (head->nd_next) {
8296 last = head->nd_next->nd_end;
8302 head->nd_alen += tail->nd_alen;
8303 last->nd_next = tail;
8304 if (tail->nd_next) {
8305 head->nd_next->nd_end = tail->nd_next->nd_end;
8308 head->nd_next->nd_end = tail;
/*
 * Appends the string tail to the string head in place.
 * Returns 1 immediately when tail is nil (nothing to append).
 * When the two strings' encodings are incompatible a compile error naming
 * both encodings is raised and both strings are truncated to length 0.
 */
8315 literal_concat0(struct parser_params *parser, VALUE head, VALUE tail)
8317 if (NIL_P(tail)) return 1;
8318 if (!rb_enc_compatible(head, tail)) {
8319 compile_error(PARSER_ARG "string literal encodings differ (%s / %s)",
8320 rb_enc_name(rb_enc_get(head)),
8321 rb_enc_name(rb_enc_get(tail)));
8322 rb_str_resize(head, 0);
8323 rb_str_resize(tail, 0);
8326 rb_str_buf_append(head, tail);
8330 /* concat two string literals */
/*
 * Combines two string-literal nodes.  A null head or tail returns the
 * other operand unchanged.  The work done depends on the node type of tail
 * (outer switch) and on htype, the node type of head.  Nodes that become
 * redundant after merging are released with rb_gc_force_recycle().
 */
8332 literal_concat_gen(struct parser_params *parser, NODE *head, NODE *tail)
8334 enum node_type htype;
8338 if (!head) return tail;
8339 if (!tail) return head;
8341 htype = nd_type(head);
/* an interpolation head is first wrapped into a new DSTR with a nil literal */
8342 if (htype == NODE_EVSTR) {
8343 NODE *node = NEW_DSTR(Qnil);
8344 head = list_append(node, head);
8347 switch (nd_type(tail)) {
/* head is a DSTR whose last element is a plain string: merge into that string */
8349 if (htype == NODE_DSTR && (headlast = head->nd_next->nd_end->nd_head) &&
8350 nd_type(headlast) == NODE_STR) {
8352 lit = headlast->nd_lit;
8357 if (htype == NODE_STR) {
8358 if (!literal_concat0(parser, lit, tail->nd_lit)) {
/* concatenation failed: both nodes are recycled */
8360 rb_gc_force_recycle((VALUE)head);
8361 rb_gc_force_recycle((VALUE)tail);
8364 rb_gc_force_recycle((VALUE)tail);
8367 list_append(head, tail);
8372 if (htype == NODE_STR) {
8373 if (!literal_concat0(parser, head->nd_lit, tail->nd_lit))
/* tail takes over the merged literal and head is recycled */
8375 tail->nd_lit = head->nd_lit;
8376 rb_gc_force_recycle((VALUE)head);
8379 else if (NIL_P(tail->nd_lit)) {
/* tail has no leading literal: splice its elements after head's last one */
8381 head->nd_alen += tail->nd_alen - 1;
8382 head->nd_next->nd_end->nd_next = tail->nd_next;
8383 head->nd_next->nd_end = tail->nd_next->nd_end;
8384 rb_gc_force_recycle((VALUE)tail);
8386 else if (htype == NODE_DSTR && (headlast = head->nd_next->nd_end->nd_head) &&
8387 nd_type(headlast) == NODE_STR) {
/* fold tail's leading literal into head's trailing string */
8388 lit = headlast->nd_lit;
8389 if (!literal_concat0(parser, lit, tail->nd_lit))
8391 tail->nd_lit = Qnil;
/* retype tail as a list whose first element is its literal, then concatenate */
8395 nd_set_type(tail, NODE_ARRAY);
8396 tail->nd_head = NEW_STR(tail->nd_lit);
8397 list_concat(head, tail);
/* a plain-string head is promoted to a DSTR before tail is appended */
8402 if (htype == NODE_STR) {
8403 nd_set_type(head, NODE_DSTR);
8406 list_append(head, tail);
/*
 * Wraps an interpolation node (NODE_EVSTR) in a new DSTR with a nil
 * literal; the wrapping is applied only to NODE_EVSTR nodes.
 */
8413 evstr2dstr_gen(struct parser_params *parser, NODE *node)
8415 if (nd_type(node) == NODE_EVSTR) {
8416 node = list_append(NEW_DSTR(Qnil), node);
/*
 * Builds an interpolation node (NEW_EVSTR) for an embedded expression.
 * NODE_STR, NODE_DSTR and NODE_EVSTR inputs are handled as a special case
 * in the switch — presumably returned without wrapping; confirm.
 */
8422 new_evstr_gen(struct parser_params *parser, NODE *node)
8427 switch (nd_type(node)) {
8428 case NODE_STR: case NODE_DSTR: case NODE_EVSTR:
8432 return NEW_EVSTR(head);
/* Builds a method call `recv.id(arg1)` for a binary operator. */
8436 call_bin_op_gen(struct parser_params *parser, NODE *recv, ID id, NODE *arg1)
8440 return NEW_CALL(recv, id, NEW_LIST(arg1));
/* Builds a method call `recv.id` with no arguments for a unary operator. */
8444 call_uni_op_gen(struct parser_params *parser, NODE *recv, ID id)
8447 return NEW_CALL(recv, id, 0);
/*
 * Builds the node for a match between node1 and node2.
 * If node1 is a regexp (dynamic regexp node or a literal whose value is a
 * T_REGEXP) a MATCH2 node is produced; if instead node2 is the regexp a
 * MATCH3 node is produced with the operands swapped.  Otherwise the match
 * is an ordinary call of tMATCH on node1 with node2 as argument.
 */
8451 match_op_gen(struct parser_params *parser, NODE *node1, NODE *node2)
8456 switch (nd_type(node1)) {
8458 case NODE_DREGX_ONCE:
8459 return NEW_MATCH2(node1, node2);
8462 if (RB_TYPE_P(node1->nd_lit, T_REGEXP)) {
8463 return NEW_MATCH2(node1, node2);
8469 switch (nd_type(node2)) {
8471 case NODE_DREGX_ONCE:
8472 return NEW_MATCH3(node2, node1);
8475 if (RB_TYPE_P(node2->nd_lit, T_REGEXP)) {
8476 return NEW_MATCH3(node2, node1);
8481 return NEW_CALL(node1, tMATCH, NEW_LIST(node2));
/*
 * Builds the node that reads the value named by id.
 * __FILE__ yields a string node holding a copy of the source file name,
 * __LINE__ a literal of tokline, and __ENCODING__ a literal of the current
 * encoding object.  Other ids are dispatched on id_type(id) and produce
 * DVAR/LVAR/VCALL, GVAR, IVAR, CONST or CVAR nodes.  An id that matches no
 * case is reported as a compile error.
 */
8485 gettable_gen(struct parser_params *parser, ID id)
8496 case keyword__FILE__:
8497 return NEW_STR(rb_str_dup(ruby_sourcefile_string));
8498 case keyword__LINE__:
8499 return NEW_LIT(INT2FIX(tokline));
8500 case keyword__ENCODING__:
8501 return NEW_LIT(rb_enc_from_encoding(current_enc));
8503 switch (id_type(id)) {
/* block-local variable first, then method-local, else treat as a call */
8505 if (dyna_in_block() && dvar_defined(id)) return NEW_DVAR(id);
8506 if (local_id(id)) return NEW_LVAR(id);
8507 /* method call without arguments */
8508 return NEW_VCALL(id);
8510 return NEW_GVAR(id);
8512 return NEW_IVAR(id);
8514 return NEW_CONST(id);
8516 return NEW_CVAR(id);
8518 compile_error(PARSER_ARG "identifier %s is not valid to get", rb_id2name(id));
/*
 * Tells whether id names a variable.  Only non-operator ids are examined.
 * Global, instance, constant and class-variable scopes share one case
 * (presumably always "yes" — confirm); a local name counts only when it is
 * defined as a block-local variable or as a method-local variable.
 * An id that matches no case is reported as a compile error.
 */
8523 id_is_var_gen(struct parser_params *parser, ID id)
8525 if (is_notop_id(id)) {
8526 switch (id & ID_SCOPE_MASK) {
8527 case ID_GLOBAL: case ID_INSTANCE: case ID_CONST: case ID_CLASS:
8530 if (dyna_in_block() && dvar_defined(id)) return 1;
8531 if (local_id(id)) return 1;
8532 /* method call without arguments */
8536 compile_error(PARSER_ARG "identifier %s is not valid to get", rb_id2name(id));
8539 #endif /* !RIPPER */
/*
 * Maps a lexer state to its printable name using a static table of
 * fixed-width (12-byte) strings.  The lookup is performed only when state
 * has at least one bit set below EXPR_MAX_STATE.
 */
8543 lex_state_name(enum lex_state_e state)
8545 static const char names[][12] = {
8546 "EXPR_BEG", "EXPR_END", "EXPR_ENDARG", "EXPR_ENDFN", "EXPR_ARG",
8547 "EXPR_CMDARG", "EXPR_MID", "EXPR_FNAME", "EXPR_DOT", "EXPR_CLASS",
8551 if ((unsigned)state & ~(~0u << EXPR_MAX_STATE))
/*
 * NOTE(review): ffs() returns a 1-based bit position (1 for the lowest
 * bit), while names[] is 0-based with "EXPR_BEG" first.  If state bit 0
 * means EXPR_BEG, this indexes one entry too far — confirm whether
 * names[ffs(state) - 1] was intended.
 */
8552 return names[ffs(state)];
/*
 * Validates an assignment target and builds the matching assignment node.
 * Two signatures appear: one taking a VALUE lhs and one taking an ID and a
 * value node — presumably alternatives selected by a preprocessor
 * conditional; confirm.  assignable_result() and parser_yyerror() are
 * defined locally for the duration of the function and undefined at its
 * end.
 */
8559 assignable_gen(struct parser_params *parser, VALUE lhs)
8562 assignable_gen(struct parser_params *parser, ID id, NODE *val)
8566 ID id = get_id(lhs);
/* in this variant every result is the lhs value and errors dispatch assign_error */
8567 # define assignable_result(x) get_value(lhs)
8568 # define parser_yyerror(parser, x) dispatch1(assign_error, lhs)
/* in this variant the built node itself is the result */
8570 # define assignable_result(x) (x)
8572 if (!id) return assignable_result(0);
/* keywords and pseudo-variables cannot be assigned to */
8575 yyerror("Can't change the value of self");
8578 yyerror("Can't assign to nil");
8581 yyerror("Can't assign to true");
8584 yyerror("Can't assign to false");
8586 case keyword__FILE__:
8587 yyerror("Can't assign to __FILE__");
8589 case keyword__LINE__:
8590 yyerror("Can't assign to __LINE__");
8592 case keyword__ENCODING__:
8593 yyerror("Can't assign to __ENCODING__");
8596 switch (id_type(id)) {
/*
 * Inside a block: a variable of the current block scope, then one of an
 * enclosing block scope, then a method-local; otherwise a new
 * current-scope dynamic variable.
 */
8598 if (dyna_in_block()) {
8599 if (dvar_curr(id)) {
8600 return assignable_result(NEW_DASGN_CURR(id, val));
8602 else if (dvar_defined(id)) {
8603 return assignable_result(NEW_DASGN(id, val));
8605 else if (local_id(id)) {
8606 return assignable_result(NEW_LASGN(id, val));
8610 return assignable_result(NEW_DASGN_CURR(id, val));
8614 if (!local_id(id)) {
8617 return assignable_result(NEW_LASGN(id, val));
8621 return assignable_result(NEW_GASGN(id, val));
8623 return assignable_result(NEW_IASGN(id, val));
/* constant assignment is rejected while in_def or in_single is set */
8625 if (!in_def && !in_single)
8626 return assignable_result(NEW_CDECL(id, val, 0));
8627 yyerror("dynamic constant assignment");
8630 return assignable_result(NEW_CVASGN(id, val));
8632 compile_error(PARSER_ARG "identifier %s is not valid to set", rb_id2name(id));
8635 return assignable_result(0);
8636 #undef assignable_result
8637 #undef parser_yyerror
/*
 * Returns 1 for the bare underscore id (idUScore), 0 for any id that is
 * not a local-variable id, and otherwise whether the first byte of the
 * id's name is '_'.
 */
8641 is_private_local_id(ID name)
8644 if (name == idUScore) return 1;
8645 if (!is_local_id(name)) return 0;
8646 s = rb_id2str(name);
8648 return RSTRING_PTR(s)[0] == '_';
/* Flag stored in the most significant bit of an ID-sized slot. */
8651 #define LVAR_USED ((ID)1 << (sizeof(ID) * CHAR_BIT - 1))
/*
 * Checks a newly declared parameter/variable name against existing ones.
 * Names accepted by is_private_local_id() are returned untouched.
 * Inside a block, a name already present in the current scope is a
 * "duplicated argument name" error; a name visible from an outer scope
 * only produces a shadowing warning, after which it is added to the
 * current variable table.  Outside a block, an already known local name is
 * a "duplicated argument name" error.
 */
8654 shadowing_lvar_gen(struct parser_params *parser, ID name)
8656 if (is_private_local_id(name)) return name;
8657 if (dyna_in_block()) {
8658 if (dvar_curr(name)) {
8659 yyerror("duplicated argument name");
8661 else if (dvar_defined_get(name) || local_id(name)) {
8662 rb_warningS("shadowing outer local variable - %s", rb_id2name(name));
8663 vtable_add(lvtbl->vars, name);
/* record the declaring line, pre-marked with LVAR_USED */
8665 vtable_add(lvtbl->used, (ID)ruby_sourceline | LVAR_USED);
8670 if (local_id(name)) {
8671 yyerror("duplicated argument name");
/*
 * Declares a block-local variable.  A name that is not a local-variable id
 * is reported as "invalid local variable"; the name is also checked with
 * shadowing_lvar().
 */
8678 new_bv_gen(struct parser_params *parser, ID name)
8681 if (!is_local_id(name)) {
8682 compile_error(PARSER_ARG "invalid local variable - %s",
8686 shadowing_lvar(name);
/*
 * Builds an attribute-assignment node calling tASET on recv with the index
 * arguments idx.  A receiver that is a NODE_SELF node gets special
 * treatment first.
 */
8692 aryset_gen(struct parser_params *parser, NODE *recv, NODE *idx)
8694 if (recv && nd_type(recv) == NODE_SELF)
8696 return NEW_ATTRASGN(recv, tASET, idx);
/*
 * Raises a compile error when a call has both a block argument (node1 is a
 * NODE_BLOCK_PASS) and a literal block (node2 is non-null).
 */
8700 block_dup_check_gen(struct parser_params *parser, NODE *node1, NODE *node2)
8702 if (node2 && node1 && nd_type(node1) == NODE_BLOCK_PASS) {
8703 compile_error(PARSER_ARG "both block arg and actual block given");
/* Names of ID types (up to 8 characters each), indexed by scope value. */
8707 static const char id_type_names[][9] = {
/*
 * Converts id into its attribute-setter form.
 * Operator ids: tAREF and tASET both map to tASET; other operator ids
 * raise a name error.  Non-operator ids: the scope bits are extracted and
 * checked against the listed scopes; a name error naming the id type is
 * raised for scopes that cannot be converted.  The scope bits of id are
 * then cleared.
 */
8719 rb_id_attrset(ID id)
8721 if (!is_notop_id(id)) {
8723 case tAREF: case tASET:
8724 return tASET; /* only exception */
8726 rb_name_error(id, "cannot make operator ID :%s attrset", rb_id2name(id));
8729 int scope = (int)(id & ID_SCOPE_MASK);
8731 case ID_LOCAL: case ID_INSTANCE: case ID_GLOBAL:
8732 case ID_CONST: case ID_CLASS: case ID_JUNK:
8737 rb_name_error(id, "cannot make %s ID %+"PRIsVALUE" attrset",
8738 id_type_names[scope], ID2SYM(id));
8742 id &= ~ID_SCOPE_MASK;
/*
 * Builds an attribute-assignment node for `recv.id = ...`, using the
 * setter form of id from rb_id_attrset() and no arguments yet.
 * A receiver that is a NODE_SELF node gets special treatment first.
 */
8748 attrset_gen(struct parser_params *parser, NODE *recv, ID id)
8750 if (recv && nd_type(recv) == NODE_SELF)
8752 return NEW_ATTRASGN(recv, rb_id_attrset(id), 0);
/*
 * Reports an attempt to assign to a match back-reference variable.
 * Depending on the node type, node->nd_nth is printed either as a number
 * ($1, $2, ...) or as a single character.
 */
8756 rb_backref_error_gen(struct parser_params *parser, NODE *node)
8758 switch (nd_type(node)) {
8760 compile_error(PARSER_ARG "Can't set variable $%ld", node->nd_nth);
8763 compile_error(PARSER_ARG "Can't set variable $%c", (int)node->nd_nth);
/*
 * Concatenates the argument list node2 onto the argument node node1.
 * A null node2 returns node1 unchanged.  For a NODE_BLOCK_PASS the
 * concatenation is applied to its nd_head.  Two further cases merge node2
 * directly into node1->nd_body when node2 (and, in the second case, the
 * existing body) is a NODE_ARRAY.  Everything else falls back to a new
 * ARGSCAT node.
 */
8769 arg_concat_gen(struct parser_params *parser, NODE *node1, NODE *node2)
8771 if (!node2) return node1;
8772 switch (nd_type(node1)) {
8773 case NODE_BLOCK_PASS:
8775 node1->nd_head = arg_concat(node1->nd_head, node2);
8777 node1->nd_head = NEW_LIST(node2);
8780 if (nd_type(node2) != NODE_ARRAY) break;
/* body becomes a list of (old body + node2) and the node is retyped */
8781 node1->nd_body = list_concat(NEW_LIST(node1->nd_body), node2);
8782 nd_set_type(node1, NODE_ARGSCAT);
8785 if (nd_type(node2) != NODE_ARRAY ||
8786 nd_type(node1->nd_body) != NODE_ARRAY) break;
8787 node1->nd_body = list_concat(node1->nd_body, node2);
8790 return NEW_ARGSCAT(node1, node2);
/*
 * Appends the single argument node2 to the argument node node1.
 * A null node1 yields a new one-element list.  One case appends directly
 * with list_append(); for a NODE_BLOCK_PASS the append is applied to its
 * nd_head; another case rewrites node1 into a NODE_ARGSCAT whose body
 * holds the old body followed by node2.  Everything else falls back to a
 * new ARGSPUSH node.
 */
8794 arg_append_gen(struct parser_params *parser, NODE *node1, NODE *node2)
8796 if (!node1) return NEW_LIST(node2);
8797 switch (nd_type(node1)) {
8799 return list_append(node1, node2);
8800 case NODE_BLOCK_PASS:
8801 node1->nd_head = arg_append(node1->nd_head, node2);
8804 node1->nd_body = list_append(NEW_LIST(node1->nd_body), node2);
8805 nd_set_type(node1, NODE_ARGSCAT);
8808 return NEW_ARGSPUSH(node1, node2);
/*
 * Unwraps a NODE_SPLAT to its nd_head and returns the node when it is a
 * NODE_ARRAY.
 */
8812 splat_array(NODE* node)
8814 if (nd_type(node) == NODE_SPLAT) node = node->nd_head;
8815 if (nd_type(node) == NODE_ARRAY) return node;
/*
 * Attaches the right-hand side rhs to the assignment target lhs.
 * Depending on lhs's node type, rhs is either stored as nd_value or
 * appended to the target's argument list (nd_args).
 */
8820 node_assign_gen(struct parser_params *parser, NODE *lhs, NODE *rhs)
8824 switch (nd_type(lhs)) {
8830 case NODE_DASGN_CURR:
8834 lhs->nd_value = rhs;
8839 lhs->nd_args = arg_append(lhs->nd_args, rhs);
8843 /* should not happen */
/*
 * Checks that node can yield a value, walking down to the sub-node that
 * determines the result of a compound expression.  Emits "empty
 * expression" and "void value expression" diagnostics.
 */
8851 value_expr_gen(struct parser_params *parser, NODE *node)
8856 rb_warning0("empty expression");
8859 switch (nd_type(node)) {
8862 parser_warning(node, "void value expression");
8870 if (!cond) yyerror("void value expression");
8871 /* or "control never reach"? */
/* advance to the last element of the chain and examine its head */
8875 while (node->nd_next) {
8876 node = node->nd_next;
8878 node = node->nd_head;
8882 node = node->nd_body;
/* two-branch node: with one branch missing only the other is examined */
8886 if (!node->nd_body) {
8887 node = node->nd_else;
8890 else if (!node->nd_else) {
8891 node = node->nd_body;
/* both branches present: body is checked recursively, then else */
8894 if (!value_expr(node->nd_body)) return FALSE;
8895 node = node->nd_else;
8901 node = node->nd_2nd;
/*
 * Warns about an expression whose value is discarded.  Does nothing unless
 * ruby_verbose is set.  `useless` is set to a description of the construct
 * (an operator name, "a variable", "a constant", "a literal", "defined?")
 * according to the node type.
 */
8913 void_expr_gen(struct parser_params *parser, NODE *node)
8915 const char *useless = 0;
8917 if (!RTEST(ruby_verbose)) return;
8920 switch (nd_type(node)) {
8922 switch (node->nd_mid) {
8941 useless = rb_id2name(node->nd_mid);
8953 useless = "a variable";
8956 useless = "a constant";
8962 case NODE_DREGX_ONCE:
8963 useless = "a literal";
8988 useless = "defined?";
/* temporarily switch the current line to the node's line for the warning */
8993 int line = ruby_sourceline;
8995 ruby_sourceline = nd_line(node);
8996 rb_warnS("possibly useless use of %s in void context", useless);
8997 ruby_sourceline = line;
/*
 * Applies the void-context check (void_expr0) to the statements of a
 * NODE_BLOCK.  Does nothing unless ruby_verbose is set or when node is not
 * a block.  A statement with no successor is not checked.
 */
9002 void_stmts_gen(struct parser_params *parser, NODE *node)
9004 if (!RTEST(ruby_verbose)) return;
9006 if (nd_type(node) != NODE_BLOCK) return;
9009 if (!node->nd_next) return;
9010 void_expr0(node->nd_head);
9011 node = node->nd_next;
/*
 * Strips nested NODE_BEGIN wrappers: while the current node is a
 * NODE_BEGIN with a non-null body, it is replaced by that body.
 */
9016 remove_begin(NODE *node)
9018 NODE **n = &node, *n1 = node;
9019 while (n1 && nd_type(n1) == NODE_BEGIN && n1->nd_body) {
9020 *n = n1 = n1->nd_body;
/*
 * Simplifies the tail of the tree rooted at *body, updating *body in
 * place.  The NODE_FL_NEWLINE flag of a node that gets replaced is carried
 * over to its replacement.
 */
9026 reduce_nodes_gen(struct parser_params *parser, NODE **body)
/*
 * subnodes(n1, n2): chooses where to continue.  With n1 empty, continue
 * with n2 if present (otherwise yield 0); with n2 empty, continue with n1;
 * with both present, reduce n1 recursively and continue with n2.
 */
9034 #define subnodes(n1, n2) \
9035 ((!node->n1) ? (node->n2 ? (body = &node->n2, 1) : 0) : \
9036 (!node->n2) ? (body = &node->n1, 1) : \
9037 (reduce_nodes(&node->n1), body = &node->n2, 1))
9040 int newline = (int)(node->flags & NODE_FL_NEWLINE);
9041 switch (nd_type(node)) {
/* replace the node by its inner statement, keeping the newline flag */
9047 *body = node = node->nd_stts;
9048 if (newline && node) node->flags |= NODE_FL_NEWLINE;
9051 *body = node = node->nd_body;
9052 if (newline && node) node->flags |= NODE_FL_NEWLINE;
/* continue with the head of the node referenced by nd_end */
9055 body = &node->nd_end->nd_head;
9058 if (subnodes(nd_body, nd_else)) break;
9061 body = &node->nd_body;
9064 if (!subnodes(nd_body, nd_next)) goto end;
9067 if (!subnodes(nd_head, nd_resq)) goto end;
9070 if (node->nd_else) {
9071 body = &node->nd_resq;
9074 if (!subnodes(nd_head, nd_resq)) goto end;
9080 if (newline && node) node->flags |= NODE_FL_NEWLINE;
/*
 * Tells whether node consists only of static content.  A null node counts
 * as static (returns 1).  For a list-like node every element's nd_head is
 * checked recursively, and the first non-static element makes the result
 * 0.
 */
9087 is_static_content(NODE *node)
9089 if (!node) return 1;
9090 switch (nd_type(node)) {
9092 if (!(node = node->nd_head)) break;
9095 if (!is_static_content(node->nd_head)) return 0;
9096 } while ((node = node->nd_next) != 0);
/*
 * Diagnoses assignments used as conditions.  One node type is rejected
 * with "multiple assignment in conditional".  For the single-assignment
 * node types, a missing value returns 1, and an assigned value that is
 * static content produces the "found = in conditional" warning.
 */
9111 assign_in_cond(struct parser_params *parser, NODE *node)
9113 switch (nd_type(node)) {
9115 yyerror("multiple assignment in conditional");
9120 case NODE_DASGN_CURR:
9129 if (!node->nd_value) return 1;
9130 if (is_static_content(node->nd_value)) {
9131 /* reports always */
9132 parser_warn(node->nd_value, "found = in conditional, should be ==");
/* Emits str via parser_warn() unless e_option_supplied(parser) is true. */
9138 warn_unless_e_option(struct parser_params *parser, NODE *node, const char *str)
9140 if (!e_option_supplied(parser)) parser_warn(node, str);
/* Emits str via parser_warning() unless e_option_supplied(parser) is true. */
9144 warning_unless_e_option(struct parser_params *parser, NODE *node, const char *str)
9146 if (!e_option_supplied(parser)) parser_warning(node, str);
/*
 * Walks the list starting at *rootnode.  Each list cell is recycled after
 * its next/head fields are read, and its head node is post-processed by
 * type.  In the visible case a range node with literal endpoints is turned
 * into a NODE_LIT holding a range object, and the two endpoint nodes are
 * recycled.
 */
9150 fixup_nodes(NODE **rootnode)
9152 NODE *node, *next, *head;
9154 for (node = *rootnode; node; node = next) {
9155 enum node_type type;
/* read the links before the cell is recycled */
9158 next = node->nd_next;
9159 head = node->nd_head;
9160 rb_gc_force_recycle((VALUE)node);
9162 switch (type = nd_type(head)) {
9165 val = rb_range_new(head->nd_beg->nd_lit, head->nd_end->nd_lit,
9167 rb_gc_force_recycle((VALUE)head->nd_beg);
9168 rb_gc_force_recycle((VALUE)head->nd_end);
9169 nd_set_type(head, NODE_LIT);
/* Forward declaration: range_op() and cond0() call each other. */
9178 static NODE *cond0(struct parser_params*,NODE*);
/*
 * Processes one endpoint of a range used as a condition.  A null node
 * returns 0.  A fixnum literal is rewritten as a call of tEQ on the
 * literal with the global variable `$.` as argument (with a warning unless
 * -e was given); any other node is processed by cond0().
 */
9181 range_op(struct parser_params *parser, NODE *node)
9183 enum node_type type;
9185 if (node == 0) return 0;
9187 type = nd_type(node);
9189 if (type == NODE_LIT && FIXNUM_P(node->nd_lit)) {
9190 warn_unless_e_option(parser, node, "integer literal in conditional range");
9191 return NEW_CALL(node, tEQ, NEW_LIST(NEW_GVAR(rb_intern("$."))));
9193 return cond0(parser, node);
/*
 * Classifies node as a literal or not.  A null node returns 1, the same
 * classification as NODE_NIL; other results depend on the node type.
 */
9197 literal_node(NODE *node)
9199 if (!node) return 1; /* same as NODE_NIL */
9200 switch (nd_type(node)) {
9206 case NODE_DREGX_ONCE:
/*
 * Rewrites node for use as a condition and emits diagnostics for
 * suspicious conditions.  A null node returns 0.  assign_in_cond() is run
 * first, then the node is handled by type.
 */
9218 cond0(struct parser_params *parser, NODE *node)
9220 if (node == 0) return 0;
9221 assign_in_cond(parser, node);
9223 switch (nd_type(node)) {
9227 rb_warn0("string literal in condition");
/* a regexp used as a condition becomes a match against $_ */
9231 case NODE_DREGX_ONCE:
9232 warning_unless_e_option(parser, node, "regex literal in condition");
9233 return NEW_MATCH2(node, NEW_GVAR(rb_intern("$_")));
/* both operands of a two-operand node are themselves conditions */
9237 node->nd_1st = cond0(parser, node->nd_1st);
9238 node->nd_2nd = cond0(parser, node->nd_2nd);
/* a range in a condition becomes a flip-flop (DOT2 -> FLIP2, DOT3 -> FLIP3) */
9243 node->nd_beg = range_op(parser, node->nd_beg);
9244 node->nd_end = range_op(parser, node->nd_end);
9245 if (nd_type(node) == NODE_DOT2) nd_set_type(node,NODE_FLIP2);
9246 else if (nd_type(node) == NODE_DOT3) nd_set_type(node, NODE_FLIP3);
9247 if (!e_option_supplied(parser)) {
9248 int b = literal_node(node->nd_beg);
9249 int e = literal_node(node->nd_end);
/* warn when both ends score exactly 1, or in verbose mode when the scores sum to 2 or more */
9250 if ((b == 1 && e == 1) || (b + e >= 2 && RTEST(ruby_verbose))) {
9251 parser_warn(node, "range literal in condition");
9257 parser_warning(node, "literal in condition");
/* a literal regexp is retyped as NODE_MATCH */
9261 if (RB_TYPE_P(node->nd_lit, T_REGEXP)) {
9262 warn_unless_e_option(parser, node, "regex literal in condition");
9263 nd_set_type(node, NODE_MATCH);
9266 parser_warning(node, "literal in condition");
/* Converts node into a condition via cond0(); a null node returns 0. */
9275 cond_gen(struct parser_params *parser, NODE *node)
9277 if (node == 0) return 0;
9278 return cond0(parser, node);
/*
 * Builds a logical-operator node of the given type for `left op right`.
 * When left is already a node of the same type, its chain of nd_2nd
 * operands of that type is followed and right is attached at the end of
 * the chain, giving a right-nested tree; otherwise a single new node is
 * returned.
 */
9282 logop_gen(struct parser_params *parser, enum node_type type, NODE *left, NODE *right)
9285 if (left && (enum node_type)nd_type(left) == type) {
9286 NODE *node = left, *second;
9287 while ((second = node->nd_2nd) != 0 && (enum node_type)nd_type(second) == type) {
9290 node->nd_2nd = NEW_NODE(type, second, right, 0);
9293 return NEW_NODE(type, left, right, 0);
/* Raises a compile error when node is a block argument (NODE_BLOCK_PASS). */
9297 no_blockarg(struct parser_params *parser, NODE *node)
9299 if (node && nd_type(node) == NODE_BLOCK_PASS) {
9300 compile_error(PARSER_ARG "block argument should not be given");
/*
 * Normalises the argument list of a return-like statement.  Block
 * arguments are rejected.  A one-element array is replaced by its single
 * element; a longer array is retyped as NODE_VALUES.
 */
9305 ret_args_gen(struct parser_params *parser, NODE *node)
9308 no_blockarg(parser, node);
9309 if (nd_type(node) == NODE_ARRAY) {
9310 if (node->nd_next == 0) {
9311 node = node->nd_head;
9314 nd_set_type(node, NODE_VALUES);
/* Builds a yield node; a non-null argument node must not be a block argument. */
9322 new_yield_gen(struct parser_params *parser, NODE *node)
9324 if (node) no_blockarg(parser, node);
9326 return NEW_YIELD(node);
/*
 * Negates the numeric literal stored in node->nd_lit in place,
 * dispatching on the literal's TYPE.
 */
9330 negate_lit(NODE *node)
9332 switch (TYPE(node->nd_lit)) {
/* fixnum: negate the C long and re-box it */
9334 node->nd_lit = LONG2FIX(-FIX2LONG(node->nd_lit));
/* generic case: call the unary-minus method on the object */
9337 node->nd_lit = rb_funcall(node->nd_lit,tUMINUS,0,0);
/* float: a flonum gets a fresh value; otherwise the stored double is flipped in place */
9341 if (FLONUM_P(node->nd_lit)) {
9342 node->nd_lit = DBL2NUM(-RFLOAT_VALUE(node->nd_lit));
9345 RFLOAT(node->nd_lit)->float_value = -RFLOAT_VALUE(node->nd_lit);
9348 RFLOAT(node->nd_lit)->float_value = -RFLOAT_VALUE(node->nd_lit);
/* Attaches the argument list node1 to the block-pass node node2 as its nd_head. */
9358 arg_blk_pass(NODE *node1, NODE *node2)
9361 node2->nd_head = node1;
/*
 * Fills in the leading part of the argument info carried by tail
 * (tail->nd_ainfo): m describes the mandatory (pre) arguments and p the
 * post arguments.  Counts come from nd_plen, initialisers from nd_next,
 * and the first post argument id from p->nd_pid; a null m or p gives
 * zeros.  ruby_sourceline is saved on entry and restored before returning.
 */
9369 new_args_gen(struct parser_params *parser, NODE *m, NODE *o, ID r, NODE *p, NODE *tail)
9371 int saved_line = ruby_sourceline;
9372 struct rb_args_info *args = tail->nd_ainfo;
9374 args->pre_args_num = m ? rb_long2int(m->nd_plen) : 0;
9375 args->pre_init = m ? m->nd_next : 0;
9377 args->post_args_num = p ? rb_long2int(p->nd_plen) : 0;
9378 args->post_init = p ? p->nd_next : 0;
9379 args->first_post_arg = p ? p->nd_pid : 0;
9385 ruby_sourceline = saved_line;
/*
 * Creates the NODE_ARGS node together with a zero-initialised
 * rb_args_info, and records the trailing argument parts: the block
 * argument id b and the keyword-rest argument.  When keyword arguments (k)
 * are present without an explicit keyword-rest name, an internal id is
 * generated for it.  ruby_sourceline is saved on entry and restored before
 * returning.
 */
9391 new_args_tail_gen(struct parser_params *parser, NODE *k, ID kr, ID b)
9393 int saved_line = ruby_sourceline;
9394 struct rb_args_info *args;
9395 NODE *kw_rest_arg = 0;
9398 args = ALLOC(struct rb_args_info);
9399 MEMZERO(args, struct rb_args_info, 1);
9400 node = NEW_NODE(NODE_ARGS, 0, 0, args);
9402 args->block_arg = b;
9404 if (k && !kr) kr = internal_id();
9407 kw_rest_arg = NEW_DVAR(kr);
9409 args->kw_rest_arg = kw_rest_arg;
9411 ruby_sourceline = saved_line;
/*
 * Converts a string node into a symbol node.  One path returns a literal
 * of the idNULL symbol.  A dynamic string is retyped as NODE_DSYM; a plain
 * string literal is interned and the node becomes a NODE_LIT holding the
 * symbol; any other node is wrapped in a new NODE_DSYM.
 */
9416 dsym_node_gen(struct parser_params *parser, NODE *node)
9421 return NEW_LIT(ID2SYM(idNULL));
9424 switch (nd_type(node)) {
9426 nd_set_type(node, NODE_DSYM);
9430 node->nd_lit = ID2SYM(rb_intern_str(lit));
9431 nd_set_type(node, NODE_LIT);
9434 node = NEW_NODE(NODE_DSYM, Qnil, 1, NEW_LIST(node));
9439 #endif /* !RIPPER */
/*
 * Builds the node for an operator assignment `lhs op= rhs` on a variable.
 * One branch (with extra handling when is_asgn_or_id(vid) holds) produces
 * an OP_ASGN_OR node and the tANDOP branch an OP_ASGN_AND node; both store
 * rhs as lhs's value and pair lhs with a read of the variable.  Any other
 * operator stores the call `var op rhs` as the value to assign.  A
 * NEW_BEGIN(0) node is used on a further path.
 */
9443 new_op_assign_gen(struct parser_params *parser, NODE *lhs, ID op, NODE *rhs)
9448 ID vid = lhs->nd_vid;
9450 lhs->nd_value = rhs;
9451 asgn = NEW_OP_ASGN_OR(gettable(vid), lhs);
9452 if (is_asgn_or_id(vid)) {
9456 else if (op == tANDOP) {
9457 lhs->nd_value = rhs;
9458 asgn = NEW_OP_ASGN_AND(gettable(vid), lhs);
9462 asgn->nd_value = NEW_CALL(gettable(vid), op, NEW_LIST(rhs));
9466 asgn = NEW_BEGIN(0);
/*
 * Builds an OP_ASGN2 node for an operator assignment on an attribute
 * (`lhs.attr op= rhs`).  tANDOP is one of the operators handled before the
 * node is built.
 */
9472 new_attr_op_assign_gen(struct parser_params *parser, NODE *lhs, ID attr, ID op, NODE *rhs)
9479 else if (op == tANDOP) {
9482 asgn = NEW_OP_ASGN2(lhs, attr, op, rhs);
/*
 * Builds an OP_CDECL node for an operator assignment on a constant.
 * tANDOP is one of the operators handled before the node is built; a
 * NEW_BEGIN(0) node is used on an alternative path.
 */
9488 new_const_op_assign_gen(struct parser_params *parser, NODE *lhs, ID op, NODE *rhs)
9495 else if (op == tANDOP) {
9499 asgn = NEW_OP_CDECL(lhs, op, rhs);
9502 asgn = NEW_BEGIN(0);
/* VALUE-based variant: forwards the three operands to the opassign event. */
9509 new_op_assign_gen(struct parser_params *parser, VALUE lhs, VALUE op, VALUE rhs)
9511 return dispatch3(opassign, lhs, op, rhs);
/*
 * VALUE-based variant: first dispatches a field event for lhs/type/attr,
 * then an opassign event with that result as the receiver.
 */
9515 new_attr_op_assign_gen(struct parser_params *parser, VALUE lhs, VALUE type, VALUE attr, VALUE op, VALUE rhs)
9517 VALUE recv = dispatch3(field, lhs, type, attr);
9518 return dispatch3(opassign, recv, op, rhs);
/*
 * Warns about variables of the scope `local` that were assigned but never
 * read.  Does nothing when the scope has no `used` table.  The vars and
 * used tables are parallel and must have the same length, which is
 * enforced with rb_bug().  Each used[i] holds the declaring line number,
 * with the LVAR_USED bit set once the variable has been read.  Empty slots
 * and names accepted by is_private_local_id() are skipped.
 */
9523 warn_unused_var(struct parser_params *parser, struct local_vars *local)
9528 if (!local->used) return;
9529 v = local->vars->tbl;
9530 u = local->used->tbl;
9531 cnt = local->used->pos;
9532 if (cnt != local->vars->pos) {
9533 rb_bug("local->used->pos != local->vars->pos");
9535 for (i = 0; i < cnt; ++i) {
9536 if (!v[i] || (u[i] & LVAR_USED)) continue;
9537 if (is_private_local_id(v[i])) continue;
9538 rb_warn4S(ruby_sourcefile, (int)u[i], "assigned but unused variable - %s", rb_id2name(v[i]));
/*
 * Opens a new local-variable scope linked to the current one (lvtbl).
 * The args table is always fresh.  The vars table is rooted at
 * DVARS_INHERIT or DVARS_TOPSCOPE depending on inherit_dvars.  The `used`
 * table, which drives unused-variable warnings, is allocated only in
 * verbose mode, and not when dvars are inherited while compiling for eval
 * or with -e.  The current cmdarg_stack is saved in the scope.
 */
9543 local_push_gen(struct parser_params *parser, int inherit_dvars)
9545 struct local_vars *local;
9547 local = ALLOC(struct local_vars);
9548 local->prev = lvtbl;
9549 local->args = vtable_alloc(0);
9550 local->vars = vtable_alloc(inherit_dvars ? DVARS_INHERIT : DVARS_TOPSCOPE);
9551 local->used = !(inherit_dvars &&
9552 (ifndef_ripper(compile_for_eval || e_option_supplied(parser))+0)) &&
9553 RTEST(ruby_verbose) ? vtable_alloc(0) : 0;
9554 local->cmdargs = cmdarg_stack;
/*
 * Closes the current local-variable scope: emits unused-variable warnings
 * for it, frees its used/args/vars tables and restores the cmdarg_stack
 * saved when the scope was opened.  The enclosing scope (lvtbl->prev) is
 * read up front.
 */
9560 local_pop_gen(struct parser_params *parser)
9562 struct local_vars *local = lvtbl->prev;
9564 warn_unused_var(parser, lvtbl);
9565 vtable_free(lvtbl->used);
9567 vtable_free(lvtbl->args);
9568 vtable_free(lvtbl->vars);
9569 cmdarg_stack = lvtbl->cmdargs;
/*
 * Builds the flat ID table for the current scope from its argument and
 * variable tables.  Returns 0 when the scope has no locals.  The buffer
 * has one extra leading slot: arguments are copied starting at buf[1].
 * Variables that also appear among the arguments are dropped, and the
 * buffer is shrunk when that leaves it shorter than first allocated.
 */
9576 local_tbl_gen(struct parser_params *parser)
9578 int cnt_args = vtable_size(lvtbl->args);
9579 int cnt_vars = vtable_size(lvtbl->vars);
9580 int cnt = cnt_args + cnt_vars;
9584 if (cnt <= 0) return 0;
9585 buf = ALLOC_N(ID, cnt + 1);
9586 MEMCPY(buf+1, lvtbl->args->tbl, ID, cnt_args);
9587 /* remove IDs duplicated to warn shadowing */
9588 for (i = 0, j = cnt_args+1; i < cnt_vars; ++i) {
9589 ID id = lvtbl->vars->tbl[i];
9590 if (!vtable_included(lvtbl->args, id)) {
9594 if (--j < cnt) REALLOC_N(buf, ID, (cnt = j) + 1);
/*
 * Registers id as an argument of the current scope and returns its
 * zero-based index in the argument table.
 */
9601 arg_var_gen(struct parser_params *parser, ID id)
9603 vtable_add(lvtbl->args, id);
9604 return vtable_size(lvtbl->args) - 1;
/*
 * Registers id as a local variable of the current scope and returns its
 * zero-based index in the variable table.  The current source line is
 * recorded in the parallel `used` table.
 */
9608 local_var_gen(struct parser_params *parser, ID id)
9610 vtable_add(lvtbl->vars, id);
9612 vtable_add(lvtbl->used, (ID)ruby_sourceline);
9614 return vtable_size(lvtbl->vars) - 1;
/*
 * Tells whether id is a local variable or argument of the enclosing method
 * scope.  The loop runs while vars->prev is a real pointer, i.e. while
 * nested block tables remain.  When the outermost table inherits its
 * variables (DVARS_INHERIT) the answer comes from rb_local_defined().
 * Finding the id in the variable table also marks it as used.
 */
9618 local_id_gen(struct parser_params *parser, ID id)
9620 struct vtable *vars, *args, *used;
9626 while (vars && POINTER_P(vars->prev)) {
9629 if (used) used = used->prev;
9632 if (vars && vars->prev == DVARS_INHERIT) {
9633 return rb_local_defined(id);
9635 else if (vtable_included(args, id)) {
/* vtable_included() yields a 1-based position, hence the i-1 below */
9639 int i = vtable_included(vars, id);
9640 if (i && used) used->tbl[i-1] |= LVAR_USED;
/*
 * Opens a nested block scope: new args, vars and used tables are
 * allocated, each chained to the table it replaces.
 */
9645 static const struct vtable *
9646 dyna_push_gen(struct parser_params *parser)
9648 lvtbl->args = vtable_alloc(lvtbl->args);
9649 lvtbl->vars = vtable_alloc(lvtbl->vars);
9651 lvtbl->used = vtable_alloc(lvtbl->used);
/*
 * Closes one nested block scope: when a `used` table exists,
 * unused-variable warnings are emitted for it first; then each of the
 * used/args/vars tables is replaced by its predecessor.
 */
9657 dyna_pop_1(struct parser_params *parser)
9661 if ((tmp = lvtbl->used) != 0) {
9662 warn_unused_var(parser, lvtbl);
9663 lvtbl->used = lvtbl->used->prev;
9667 lvtbl->args = lvtbl->args->prev;
9670 lvtbl->vars = lvtbl->vars->prev;
/*
 * Unwinds block scopes until the current args table is lvargs again.
 * lvargs is presumably the value returned by the matching dyna_push —
 * confirm against callers.
 */
9675 dyna_pop_gen(struct parser_params *parser, const struct vtable *lvargs)
9677 while (lvtbl->args != lvargs) {
9680 struct local_vars *local = lvtbl->prev;
/*
 * True when the current variable table is a real table whose predecessor
 * is not the DVARS_TOPSCOPE marker, i.e. when parsing inside a block.
 */
9689 dyna_in_block_gen(struct parser_params *parser)
9691 return POINTER_P(lvtbl->vars) && lvtbl->vars->prev != DVARS_TOPSCOPE;
/*
 * Tells whether id is a block-local (dynamic) variable or block argument
 * visible from the current block, searching the chain of tables outwards.
 * Finding the id in a variable table also marks it as used.  When the
 * chain ends at DVARS_INHERIT the answer comes from rb_dvar_defined().
 */
9695 dvar_defined_gen(struct parser_params *parser, ID id, int get)
9697 struct vtable *vars, *args, *used;
9704 while (POINTER_P(vars)) {
9705 if (vtable_included(args, id)) {
/* vtable_included() yields a 1-based position, hence the i-1 below */
9708 if ((i = vtable_included(vars, id)) != 0) {
9709 if (used) used->tbl[i-1] |= LVAR_USED;
9715 if (used) used = used->prev;
9718 if (vars == DVARS_INHERIT) {
9719 return rb_dvar_defined(id);
/*
 * True when id is an argument or a variable of the innermost (current)
 * scope only; enclosing scopes are not searched.
 */
9726 dvar_curr_gen(struct parser_params *parser, ID id)
9728 return (vtable_included(lvtbl->args, id) ||
9729 vtable_included(lvtbl->vars, id));
/*
 * Sets the encoding of a regexp source fragment str according to the
 * encoding option carried in `options`.
 *  - Explicit encoding option c: the option is mapped to an encoding
 *    index, which is applied to str.  A fragment in a different encoding
 *    that is not pure 7-bit is treated as a mismatch.
 *  - "None" option: a non-ASCII-8BIT fragment that is not 7-bit is treated
 *    as a mismatch; otherwise the fragment is marked ASCII-8BIT.
 *  - No option, with a US-ASCII source encoding: the fragment is marked
 *    US-ASCII or ASCII-8BIT depending on its code range.
 * A mismatch is reported with the compile error at the end.
 */
9734 reg_fragment_setenc_gen(struct parser_params* parser, VALUE str, int options)
9736 int c = RE_OPTION_ENCODING_IDX(options);
9740 rb_char_to_option_kcode(c, &opt, &idx);
9741 if (idx != ENCODING_GET(str) &&
9742 rb_enc_str_coderange(str) != ENC_CODERANGE_7BIT) {
9745 ENCODING_SET(str, idx);
9747 else if (RE_OPTION_ENCODING_NONE(options)) {
9748 if (!ENCODING_IS_ASCII8BIT(str) &&
9749 rb_enc_str_coderange(str) != ENC_CODERANGE_7BIT) {
9753 rb_enc_associate(str, rb_ascii8bit_encoding());
9755 else if (current_enc == rb_usascii_encoding()) {
9756 if (rb_enc_str_coderange(str) != ENC_CODERANGE_7BIT) {
9758 rb_enc_associate(str, rb_usascii_encoding());
9761 rb_enc_associate(str, rb_ascii8bit_encoding());
9767 compile_error(PARSER_ARG
9768 "regexp encoding option '%c' differs from source encoding '%s'",
9769 c, rb_enc_name(rb_enc_get(str)));
/*
 * Validates a regexp source fragment: its encoding is fixed up with
 * reg_fragment_setenc() and it is passed through
 * rb_reg_check_preprocess().  An error object returned by the latter is
 * converted to a string and reported as a compile error.
 */
9773 reg_fragment_check_gen(struct parser_params* parser, VALUE str, int options)
9776 reg_fragment_setenc(str, options);
9777 err = rb_reg_check_preprocess(str);
9779 err = rb_obj_as_string(err);
9780 compile_error(PARSER_ARG "%s", RSTRING_PTR(err));
/*
 * State passed to reg_named_capture_assign_iter() through the opaque
 * callback argument; the iterator reads parser and enc from it and
 * accumulates the success/failure blocks in it.
 */
9788 struct parser_params* parser;
9793 } reg_named_capture_assign_t;
/*
 * Callback invoked by onig_foreach_name() once per named capture group.
 * For a name that is a valid local-variable name it appends two
 * assignments: one to succ_block (the variable receives a value taken from
 * `$~`, keyed by the capture name as a symbol) and one to fail_block (the
 * variable receives nil).  Both blocks are created on first use.
 * Names are rejected when they are empty, start with an ASCII character
 * that is neither '_' nor lower case, are reserved words, or are not valid
 * symbol names.  A name that collides with an existing local variable only
 * produces a warning.
 */
9796 reg_named_capture_assign_iter(const OnigUChar *name, const OnigUChar *name_end,
9797 int back_num, int *back_refs, OnigRegex regex, void *arg0)
9799 reg_named_capture_assign_t *arg = (reg_named_capture_assign_t*)arg0;
9800 struct parser_params* parser = arg->parser;
9801 rb_encoding *enc = arg->enc;
9802 long len = name_end - name;
9803 const char *s = (const char *)name;
9808 if (arg->succ_block == 0) {
9809 arg->succ_block = NEW_BEGIN(0);
9810 arg->fail_block = NEW_BEGIN(0);
9813 if (!len || (*name != '_' && ISASCII(*name) && !rb_enc_islower(*name, enc)) ||
9814 (len < MAX_WORD_LENGTH && rb_reserved_word(s, (int)len)) ||
9815 !rb_enc_symname2_p(s, len, enc)) {
9818 var = rb_intern3(s, len, enc);
9819 if (dvar_defined(var) || local_id(var)) {
9820 rb_warningS("named capture conflicts a local variable - %s",
9823 arg->succ_block = block_append(arg->succ_block,
9824 newline_node(node_assign(assignable(var,0),
9826 gettable(rb_intern("$~")),
9828 NEW_LIST(NEW_LIT(ID2SYM(var))))
9830 arg->fail_block = block_append(arg->fail_block,
9831 newline_node(node_assign(assignable(var,0), NEW_LIT(Qnil))));
/*
 * Builds the code that assigns named captures of a literal regexp to local
 * variables after a match.  Every capture name of regexp is visited with
 * reg_named_capture_assign_iter().  The resulting tree evaluates `match`
 * and then tests `$~`, running the success block or the failure block
 * accordingly.
 */
9836 reg_named_capture_assign_gen(struct parser_params* parser, VALUE regexp, NODE *match)
9838 reg_named_capture_assign_t arg;
9840 arg.parser = parser;
9841 arg.enc = rb_enc_get(regexp);
9845 onig_foreach_name(RREGEXP(regexp)->ptr, reg_named_capture_assign_iter, (void*)&arg);
9852 newline_node(match),
9853 NEW_IF(gettable(rb_intern("$~")),
9855 newline_node(arg.succ_block),
9858 gettable(rb_intern("$~")),
9860 NEW_LIST(NEW_LIT(INT2FIX(0)))))),
9862 newline_node(arg.fail_block),
/*
 * Compiles the regexp source str with the given options at the current
 * source position.  The fragment's encoding is fixed up first.  On the
 * failure path the message of the current error (rb_errinfo) is fetched,
 * the error info is set to `err`, and the message is either appended to
 * err's own message after a newline or reported as a compile error.
 */
9868 reg_compile_gen(struct parser_params* parser, VALUE str, int options)
9873 reg_fragment_setenc(str, options);
9875 re = rb_reg_compile(str, options & RE_OPTION_MASK, ruby_sourcefile, ruby_sourceline);
9877 ID mesg = rb_intern("mesg");
9878 VALUE m = rb_attr_get(rb_errinfo(), mesg);
9879 rb_set_errinfo(err);
9881 rb_str_append(rb_str_cat(rb_attr_get(err, mesg), "\n", 1), m);
9884 compile_error(PARSER_ARG "%s", RSTRING_PTR(m));
9892 rb_gc_mark_parser(void)
/*
 * Appends a `print $_` call to the end of the program body of the parsed
 * tree `node`.  A null tree is returned unchanged.  When the body is
 * wrapped in a NODE_PRELUDE, the prelude is kept and re-attached around
 * the extended body; otherwise the extended body is attached to the scope
 * directly.
 */
9897 rb_parser_append_print(VALUE vparser, NODE *node)
9901 struct parser_params *parser;
9903 if (!node) return node;
9905 TypedData_Get_Struct(vparser, struct parser_params, &parser_data_type, parser);
9907 node = node->nd_body;
9909 if (nd_type(node) == NODE_PRELUDE) {
9911 node = node->nd_body;
9914 node = block_append(node,
9915 NEW_FCALL(rb_intern("print"),
9916 NEW_ARRAY(NEW_GVAR(rb_intern("$_")))));
9918 prelude->nd_body = node;
9919 scope->nd_body = prelude;
9922 scope->nd_body = node;
/*
 * Wraps the program body of the parsed tree `node` in an implicit input
 * loop (NEW_OPT_N).  A null tree is returned unchanged.  Before wrapping,
 * the body may be prefixed with `$F = $_.split` and with `$_.chop!`
 * (presumably when `split` and `chop` are non-zero respectively —
 * confirm).  A NODE_PRELUDE wrapper is kept and re-attached around the new
 * body.
 */
9929 rb_parser_while_loop(VALUE vparser, NODE *node, int chop, int split)
9933 struct parser_params *parser;
9935 if (!node) return node;
9937 TypedData_Get_Struct(vparser, struct parser_params, &parser_data_type, parser);
9939 node = node->nd_body;
9941 if (nd_type(node) == NODE_PRELUDE) {
9943 node = node->nd_body;
9946 node = block_append(NEW_GASGN(rb_intern("$F"),
9947 NEW_CALL(NEW_GVAR(rb_intern("$_")),
9948 rb_intern("split"), 0)),
9952 node = block_append(NEW_CALL(NEW_GVAR(rb_intern("$_")),
9953 rb_intern("chop!"), 0), node);
9956 node = NEW_OPT_N(node);
9959 prelude->nd_body = node;
9960 scope->nd_body = prelude;
9963 scope->nd_body = node;
9969 static const struct {
9994 #define op_tbl_count numberof(op_tbl)
9996 #ifndef ENABLE_SELECTOR_NAMESPACE
9997 #define ENABLE_SELECTOR_NAMESPACE 0
/*
 * Process-wide symbol tables.  The first member is initialised to
 * tLAST_TOKEN.  The ivar2 tables exist only when
 * ENABLE_SELECTOR_NAMESPACE is non-zero.  op_sym has one VALUE slot per
 * operator id below tLAST_OP_ID.
 */
10000 static struct symbols {
10004 #if ENABLE_SELECTOR_NAMESPACE
10005 st_table *ivar2_id;
10006 st_table *id_ivar2;
10008 VALUE op_sym[tLAST_OP_ID];
10009 } global_symbols = {tLAST_TOKEN};
10011 static const struct st_hash_type symhash = {
10016 #if ENABLE_SELECTOR_NAMESPACE
/* Key comparison for the ivar2 tables: two keys match when both id and klass are equal. */
10023 ivar2_cmp(struct ivar2_key *key1, struct ivar2_key *key2)
10025 if (key1->id == key2->id && key1->klass == key2->klass) {
/* Hash for the ivar2 tables: mixes the id (shifted left 8) with the klass (shifted right 2). */
10032 ivar2_hash(struct ivar2_key *key)
10034 return (key->id << 8) ^ (key->klass >> 2);
10037 static const struct st_hash_type ivar2_hash_type = {
10046 global_symbols.sym_id = st_init_table_with_size(&symhash, 1000);
10047 global_symbols.id_str = st_init_numtable_with_size(1000);
10048 #if ENABLE_SELECTOR_NAMESPACE
10049 global_symbols.ivar2_id = st_init_table_with_size(&ivar2_hash_type, 1000);
10050 global_symbols.id_ivar2 = st_init_numtable_with_size(1000);
10056 (void)lex_state_name(-1);
/*
 * GC hook: marks the values held in the id_str table and every slot of the
 * operator-symbol cache (op_sym).
 */
10063 rb_gc_mark_symbols(void)
10065 rb_mark_tbl(global_symbols.id_str);
10066 rb_gc_mark_locations(global_symbols.op_sym,
10067 global_symbols.op_sym + numberof(global_symbols.op_sym));
10069 #endif /* !RIPPER */
/*
 * Produces an ID with the ID_INTERNAL scope.  The serial part is the
 * number of arguments plus variables currently in the scope, offset by
 * ((tLAST_TOKEN - ID_INTERNAL) >> ID_SCOPE_SHIFT) + 1.
 */
10072 internal_id_gen(struct parser_params *parser)
10074 ID id = (ID)vtable_size(lvtbl->args) + (ID)vtable_size(lvtbl->vars);
10075 id += ((tLAST_TOKEN - ID_INTERNAL) >> ID_SCOPE_SHIFT) + 1;
10076 return ID_INTERNAL | (id << ID_SCOPE_SHIFT);
/*
 * Checks whether the bytes [m, e) — the part of a global variable name
 * after '$' — form a special global name: a single punctuation character,
 * '-' followed by one identifier character, or a run of digits.
 * Returns 0 when they do not (including the empty range); otherwise
 * returns mb + 1, where mb is set to 1 when a non-ASCII character was
 * seen.
 */
10081 is_special_global_name(const char *m, const char *e, rb_encoding *enc)
10085 if (m >= e) return 0;
10086 if (is_global_name_punct(*m)) {
10089 else if (*m == '-') {
10091 if (m < e && is_identchar(m, e, enc)) {
10092 if (!ISASCII(*m)) mb = 1;
10093 m += rb_enc_mbclen(m, e, enc);
10097 if (!rb_enc_isdigit(*m, enc)) return 0;
10099 if (!ISASCII(*m)) mb = 1;
10101 } while (m < e && rb_enc_isdigit(*m, enc));
/* the whole range must have been consumed */
10103 return m == e ? mb + 1 : 0;
/* Same check as rb_enc_symname_p(), with the name treated as ASCII-8BIT. */
10107 rb_symname_p(const char *name)
10109 return rb_enc_symname_p(name, rb_ascii8bit_encoding());
/* Same check as rb_enc_symname2_p() for a NUL-terminated name; the length comes from strlen(). */
10113 rb_enc_symname_p(const char *name, rb_encoding *enc)
10115 return rb_enc_symname2_p(name, strlen(name), enc);
10118 #define IDSET_ATTRSET_FOR_SYNTAX ((1U<<ID_LOCAL)|(1U<<ID_CONST))
10119 #define IDSET_ATTRSET_FOR_INTERN (~(~0U<<(1<<ID_SCOPE_SHIFT)) & ~(1U<<ID_ATTRSET))
/*
 * Classifies the len bytes at name as a symbol name and returns its ID
 * type, or -1 when the bytes are not a valid symbol name (including a null
 * pointer or a non-positive length).  The scan pointer m must reach
 * exactly the end e for the name to be accepted.
 * allowed_atttset is a bit set indexed by ID type: a trailing '=' is
 * accepted only for types whose bit is set.
 */
10122 rb_enc_symname_type(const char *name, long len, rb_encoding *enc, unsigned int allowed_atttset)
10124 const char *m = name;
10125 const char *e = m + len;
10126 int type = ID_JUNK;
10128 if (!m || len <= 0) return -1;
10135 if (is_special_global_name(++m, e, enc)) return type;
10139 type = ID_INSTANCE;
/* operator names: each case consumes the characters of one operator */
10148 case '<': ++m; break;
10149 case '=': if (*++m == '>') ++m; break;
10156 case '>': case '=': ++m; break;
10162 case '~': ++m; break;
10163 case '=': if (*++m == '=') ++m; break;
10164 default: return -1;
10169 if (*++m == '*') ++m;
10172 case '+': case '-':
10173 if (*++m == '@') ++m;
10176 case '|': case '^': case '&': case '/': case '%': case '~': case '`':
10181 if (*++m != ']') return -1;
10182 if (*++m == '=') ++m;
10186 if (len == 1) return ID_JUNK;
10188 case '=': case '~': ++m; break;
10189 default: return -1;
/* identifier: an upper-case first character makes it a constant, otherwise a local */
10194 type = rb_enc_isupper(*m, enc) ? ID_CONST : ID_LOCAL;
10196 if (m >= e || (*m != '_' && !rb_enc_isalpha(*m, enc) && ISASCII(*m)))
10198 while (m < e && is_identchar(m, e, enc)) m += rb_enc_mbclen(m, e, enc);
/* '!' / '?' suffixes are not allowed on global, class or instance variable names */
10201 case '!': case '?':
10202 if (type == ID_GLOBAL || type == ID_CLASS || type == ID_INSTANCE) return -1;
/* a '=' suffix must be the last character and allowed for this type */
10205 if (m + 1 < e || *m != '=') break;
10208 if (!(allowed_atttset & (1U << type))) return -1;
10215 return m == e ? type : -1;
/*
 * True when the len bytes at name are a valid symbol name, using the
 * syntax-level attrset rule (IDSET_ATTRSET_FOR_SYNTAX).
 */
10219 rb_enc_symname2_p(const char *name, long len, rb_encoding *enc)
10221 return rb_enc_symname_type(name, len, enc, IDSET_ATTRSET_FOR_SYNTAX) != -1;
/*
 * Classifies the contents of the Ruby string `name` with
 * rb_enc_symname_type(), using the string's own encoding.
 */
10225 rb_str_symname_type(VALUE name, unsigned int allowed_atttset)
10227 const char *ptr = StringValuePtr(name);
10228 long len = RSTRING_LEN(name);
10229 int type = rb_enc_symname_type(ptr, len, rb_enc_get(name), allowed_atttset);
/* Builds a new string from the `len` bytes at `name` in encoding `enc` and
 * registers it for `id` through register_symid_str(), returning that
 * function's result. */
10235 register_symid(ID id, const char *name, long len, rb_encoding *enc)
10237 VALUE str = rb_enc_str_new(name, len, enc);
10238 return register_symid_str(id, str);
/* Records the pairing of `id` and `str` in both global tables:
 * sym_id maps the string to the ID, id_str maps the ID back to the string.
 * NOTE(review): the returned value is not visible here; callers use it as
 * an ID -- presumably `id`. */
10242 register_symid_str(ID id, VALUE str)
10245 st_add_direct(global_symbols.sym_id, (st_data_t)str, id);
10246 st_add_direct(global_symbols.id_str, id, (st_data_t)str);
/* Inspects the encoding and code range of `str`.
 * Returns FALSE immediately when the encoding is not ASCII-compatible and
 * raises EncodingError when the code range is broken.
 * NOTE(review): the result for the 7-bit case is not visible here;
 * presumably TRUE -- confirm. */
10251 sym_check_asciionly(VALUE str)
10253 if (!rb_enc_asciicompat(rb_enc_get(str))) return FALSE;
10254 switch (rb_enc_str_coderange(str)) {
10255 case ENC_CODERANGE_BROKEN:
10256 rb_raise(rb_eEncodingError, "invalid encoding symbol");
10257 case ENC_CODERANGE_7BIT:
10264 * _str_ itself will be registered at the global symbol table. _str_
10265 * can be modified before the registration, since the encoding will be
10266 * set to US-ASCII if it is a special global name.
10268 static ID intern_str(VALUE str);
/*
 * Interns the `len` bytes at `name` with encoding `enc`.
 *
 * A temporary RString header is filled in as a local variable and pointed
 * directly at the caller's buffer, so the symbol table can be probed without
 * creating a string object. Only when the lookup does not succeed is a real
 * string created and handed to intern_str().
 */
10271 rb_intern3(const char *name, long len, rb_encoding *enc)
10275 struct RString fake_str;
10276 fake_str.basic.flags = T_STRING|RSTRING_NOEMBED;
10277 fake_str.basic.klass = rb_cString;
10278 fake_str.as.heap.len = len;
/* The const is cast away only so the buffer can be stored in the header. */
10279 fake_str.as.heap.ptr = (char *)name;
10280 fake_str.as.heap.aux.capa = len;
10281 str = (VALUE)&fake_str;
10282 rb_enc_associate(str, enc);
/* NOTE(review): the statement run on a hit is not visible here;
 * presumably the found ID is returned. */
10285 if (st_lookup(global_symbols.sym_id, str, &data))
10288 str = rb_enc_str_new(name, len, enc); /* make true string */
10289 return intern_str(str);
/*
 * Assigns an ID to `str` and registers the pair through
 * register_symid_str(), whose result is returned.
 *
 * The visible steps are: classify the name by its leading characters,
 * match operator spellings against op_tbl, treat a trailing '=' as an
 * attribute assignment built on the ID of the name without it, pick the
 * encoding stored with the symbol, and finally combine the type bits with
 * a freshly incremented serial number.
 * Raises RuntimeError when the serial number space is exhausted.
 */
10293 intern_str(VALUE str)
10295 const char *name, *m, *e;
10297 rb_encoding *enc, *symenc;
10302 RSTRING_GETMEM(str, name, len);
10305 enc = rb_enc_get(str);
10308 if (!len || (rb_cString && !rb_enc_asciicompat(enc))) {
10317 if (len < 2) goto junk;
10319 if ((mb = is_special_global_name(++m, e, enc)) != 0) {
10320 if (!--mb) symenc = rb_usascii_encoding();
10326 if (len < 3) goto junk;
10331 if (len < 2) goto junk;
/* ASCII punctuation other than '_' is looked up in the operator table. */
10338 if (c != '_' && rb_enc_isascii(c, enc) && rb_enc_ispunct(c, enc)) {
10346 for (i = 0; i < op_tbl_count; i++) {
/* First-character comparison short-circuits the strcmp(). */
10347 if (*op_tbl[i].name == *m &&
10348 strcmp(op_tbl[i].name, m) == 0) {
10349 id = op_tbl[i].token;
10356 if (name[last] == '=') {
10357 /* attribute assignment */
10358 if (last > 1 && name[last-1] == '=')
/* Intern the name without its trailing '=' and derive the attrset ID from it. */
10360 id = rb_intern3(name, last, enc);
10361 if (id > tLAST_OP_ID && !is_attrset_id(id)) {
10362 enc = rb_enc_get(rb_id2str(id));
10363 id = rb_id_attrset(id);
10368 else if (id == 0) {
10369 if (rb_enc_isupper(m[0], enc)) {
10376 if (!rb_enc_isdigit(*m, enc)) {
10377 while (m <= name + last && is_identchar(m, e, enc)) {
10382 m += rb_enc_mbclen(m, e, enc);
/* Bytes left over after the identifier scan demote the name to ID_JUNK. */
10386 if (id != ID_ATTRSET && m - name < len) id = ID_JUNK;
/* ASCII-only names are stored with the US-ASCII encoding. */
10387 if (sym_check_asciionly(str)) symenc = rb_usascii_encoding();
10389 if (symenc != enc) rb_enc_associate(str, symenc);
/* Guard against running out of serial numbers before allocating one. */
10390 if (global_symbols.last_id >= ~(ID)0 >> (ID_SCOPE_SHIFT+RUBY_SPECIAL_SHIFT)) {
10392 rb_raise(rb_eRuntimeError, "symbol table overflow (symbol %.20s...)",
10396 rb_raise(rb_eRuntimeError, "symbol table overflow (symbol %.*s)",
/* The serial number occupies the bits above the scope/type bits. */
10400 id |= ++global_symbols.last_id << ID_SCOPE_SHIFT;
10402 return register_symid_str(id, str);
/* Interns the `len` bytes at `name` via rb_intern3(), using the US-ASCII
 * encoding. */
10406 rb_intern2(const char *name, long len)
10408 return rb_intern3(name, len, rb_usascii_encoding());
/* Interns a NUL-terminated C string: its length is taken with strlen() and
 * the work is delegated to rb_intern2(). */
10413 rb_intern(const char *name)
10415 return rb_intern2(name, strlen(name));
/* Interns a string object. The global sym_id table is consulted first;
 * on the fall-through path a duplicate of `str` (not `str` itself) is passed
 * to intern_str().
 * NOTE(review): the statement run on a lookup hit is not visible here;
 * presumably the found ID is returned. */
10419 rb_intern_str(VALUE str)
10423 if (st_lookup(global_symbols.sym_id, str, &id))
10425 return intern_str(rb_str_dup(str));
/*
 * NOTE(review): the signature line of this function is not shown in this
 * excerpt; the body maps an ID back to its string and is presumably
 * rb_id2str() -- confirm.
 *
 * Visible strategy, in order:
 *   1. IDs below tLAST_TOKEN: single punctuation characters and op_tbl
 *      entries, with the created strings cached in global_symbols.op_sym.
 *   2. A lookup in the global id_str table.
 *   3. For attrset IDs: find the string of the same stem under another
 *      type, append "=", register the result and look it up again.
 */
10433 if (id < tLAST_TOKEN) {
10436 if (id < INT_MAX && rb_ispunct((int)id)) {
10437 VALUE str = global_symbols.op_sym[i = (int)id];
10440 name[0] = (char)id;
10442 str = rb_usascii_str_new(name, 1);
/* Cache the one-character string for later calls. */
10444 global_symbols.op_sym[i] = str;
10448 for (i = 0; i < op_tbl_count; i++) {
10449 if (op_tbl[i].token == id) {
10450 VALUE str = global_symbols.op_sym[i];
10452 str = rb_usascii_str_new2(op_tbl[i].name);
10454 global_symbols.op_sym[i] = str;
10461 if (st_lookup(global_symbols.id_str, id, &data)) {
10462 VALUE str = (VALUE)data;
/* A stored string whose class is still 0 gets rb_cString assigned here. */
10463 if (RBASIC(str)->klass == 0)
10464 RBASIC(str)->klass = rb_cString;
10468 if (is_attrset_id(id)) {
/* Strip the type bits so the stem can be combined with each candidate type. */
10469 ID id_stem = (id & ~ID_SCOPE_MASK);
10473 if (!!(str = rb_id2str(id_stem | ID_LOCAL))) break;
10474 if (!!(str = rb_id2str(id_stem | ID_CONST))) break;
10475 if (!!(str = rb_id2str(id_stem | ID_INSTANCE))) break;
10476 if (!!(str = rb_id2str(id_stem | ID_GLOBAL))) break;
10477 if (!!(str = rb_id2str(id_stem | ID_CLASS))) break;
10478 if (!!(str = rb_id2str(id_stem | ID_JUNK))) break;
/* Build the attrset name on a copy so the stem's own string is untouched. */
10481 str = rb_str_dup(str);
10482 rb_str_cat(str, "=", 1);
10483 register_symid_str(id, str);
10484 if (st_lookup(global_symbols.id_str, id, &data)) {
10485 VALUE str = (VALUE)data;
10486 if (RBASIC(str)->klass == 0)
10487 RBASIC(str)->klass = rb_cString;
/* NOTE(review): the signature line is not shown in this excerpt; presumably
 * this is the body of rb_id2name() -- confirm.
 * Returns the character pointer of the string found by rb_id2str(), or 0
 * when no string exists for `id`. */
10497 VALUE str = rb_id2str(id);
10499 if (!str) return 0;
10500 return RSTRING_PTR(str);
/* st_foreach() callback: appends the Symbol for the entry's ID (`value`) to
 * `ary` and asks the iteration to continue. The key `sym` is not used. */
10504 symbols_i(VALUE sym, ID value, VALUE ary)
10506 rb_ary_push(ary, ID2SYM(value));
10507 return ST_CONTINUE;
10512 * Symbol.all_symbols => array
10514 * Returns an array of all the symbols currently in Ruby's symbol
10517 * Symbol.all_symbols.size #=> 903
10518 * Symbol.all_symbols[1,20] #=> [:floor, :ARGV, :Binding, :symlink,
10519 * :chown, :EOFError, :$;, :String,
10520 * :LOCK_SH, :"setuid?", :$<,
10521 * :default_proc, :compact, :extend,
10522 * :Tms, :getwd, :$=, :ThreadGroup,
/* Creates an array sized for the current number of entries in the global
 * sym_id table and fills it by iterating that table with symbols_i().
 * NOTE(review): the return statement is not visible here; presumably `ary`. */
10527 rb_sym_all_symbols(void)
10529 VALUE ary = rb_ary_new2(global_symbols.sym_id->num_entries);
10531 st_foreach(global_symbols.sym_id, symbols_i, ary);
/* Function form of the is_const_id() macro: true when `id` lies above
 * tLAST_OP_ID and its scope bits equal ID_CONST. */
10536 rb_is_const_id(ID id)
10538 return is_const_id(id);
/* Function form of the is_class_id() macro: true when `id` lies above
 * tLAST_OP_ID and its scope bits equal ID_CLASS. */
10542 rb_is_class_id(ID id)
10544 return is_class_id(id);
/* Function form of the is_global_id() macro: true when `id` lies above
 * tLAST_OP_ID and its scope bits equal ID_GLOBAL. */
10548 rb_is_global_id(ID id)
10550 return is_global_id(id);
/* Function form of the is_instance_id() macro: true when `id` lies above
 * tLAST_OP_ID and its scope bits equal ID_INSTANCE. */
10554 rb_is_instance_id(ID id)
10556 return is_instance_id(id);
/* Function form of the is_attrset_id() macro: true when `id` lies above
 * tLAST_OP_ID and its scope bits equal ID_ATTRSET. */
10560 rb_is_attrset_id(ID id)
10562 return is_attrset_id(id);
/* Function form of the is_local_id() macro: true when `id` lies above
 * tLAST_OP_ID and its scope bits equal ID_LOCAL. */
10566 rb_is_local_id(ID id)
10568 return is_local_id(id);
/* Function form of the is_junk_id() macro: true when `id` lies above
 * tLAST_OP_ID and its scope bits equal ID_JUNK. */
10572 rb_is_junk_id(ID id)
10574 return is_junk_id(id);
10578 * Returns ID for the given name if it is interned already, or 0.
10580 * \param namep the pointer to the name object
10581 * \return the ID for *namep
10582 * \pre the object referred to by \p namep must be a Symbol,
10583 * a String, or an object convertible with the to_str method.
10584 * \post the object referred by \p namep is a Symbol or a
10585 * String if non-zero value is returned, or is a String
10586 * if 0 is returned.
/*
 * Looks up the ID for the object at *namep in the global sym_id table.
 * A Symbol yields its own ID directly. For an attrset-style name (ending
 * in '='), a second lookup is made for the name without the '=' and, on a
 * hit, the attrset form of that ID is returned.
 * Raises TypeError ("... is not a symbol") on the non-String path shown
 * below.
 */
10589 rb_check_id(volatile VALUE *namep)
10593 VALUE name = *namep;
10595 if (SYMBOL_P(name)) {
10596 return SYM2ID(name);
/* Non-String objects are first offered to rb_check_string_type(). */
10598 else if (!RB_TYPE_P(name, T_STRING)) {
10599 tmp = rb_check_string_type(name);
10601 tmp = rb_inspect(name);
10602 rb_raise(rb_eTypeError, "%s is not a symbol",
10609 sym_check_asciionly(name); /* result unused; raises EncodingError on a broken code range */
10611 if (st_lookup(global_symbols.sym_id, (st_data_t)name, &id))
10614 if (rb_is_attrset_name(name)) {
10615 struct RString fake_str;
10616 const VALUE localname = (VALUE)&fake_str;
10617 /* make local name by chopping '=' */
10618 fake_str.basic.flags = T_STRING|RSTRING_NOEMBED;
10619 fake_str.basic.klass = rb_cString;
/* Same buffer as `name`, one byte shorter: nothing is copied. */
10620 fake_str.as.heap.len = RSTRING_LEN(name) - 1;
10621 fake_str.as.heap.ptr = RSTRING_PTR(name);
10622 fake_str.as.heap.aux.capa = fake_str.as.heap.len;
10623 rb_enc_copy(localname, name);
10624 OBJ_FREEZE(localname);
10626 if (st_lookup(global_symbols.sym_id, (st_data_t)localname, &id)) {
10627 return rb_id_attrset((ID)id);
/*
 * C-string counterpart of rb_check_id(): probes the global sym_id table for
 * the `len` bytes at `ptr` in encoding `enc`, using a temporary RString
 * header that points at the caller's buffer.
 * For an attrset-style name the header's length is shortened by one and the
 * lookup is repeated; a hit returns the attrset form of the found ID.
 */
10636 rb_check_id_cstr(const char *ptr, long len, rb_encoding *enc)
10639 struct RString fake_str;
10640 const VALUE name = (VALUE)&fake_str;
10641 fake_str.basic.flags = T_STRING|RSTRING_NOEMBED;
10642 fake_str.basic.klass = rb_cString;
10643 fake_str.as.heap.len = len;
10644 fake_str.as.heap.ptr = (char *)ptr;
10645 fake_str.as.heap.aux.capa = len;
10646 rb_enc_associate(name, enc);
10648 sym_check_asciionly(name); /* result unused; raises EncodingError on a broken code range */
10650 if (st_lookup(global_symbols.sym_id, (st_data_t)name, &id))
10653 if (rb_is_attrset_name(name)) {
/* Drop the trailing '=' by shrinking the fake string in place. */
10654 fake_str.as.heap.len = len - 1;
10655 if (st_lookup(global_symbols.sym_id, (st_data_t)name, &id)) {
10656 return rb_id_attrset((ID)id);
/* True when rb_str_symname_type() classifies `name` as ID_CONST; the zero
 * mask means no trailing-'=' (attrset) form is accepted. */
10664 rb_is_const_name(VALUE name)
10666 return rb_str_symname_type(name, 0) == ID_CONST;
/* True when rb_str_symname_type() classifies `name` as ID_CLASS; the zero
 * mask means no trailing-'=' (attrset) form is accepted. */
10670 rb_is_class_name(VALUE name)
10672 return rb_str_symname_type(name, 0) == ID_CLASS;
/* True when rb_str_symname_type() classifies `name` as ID_GLOBAL; the zero
 * mask means no trailing-'=' (attrset) form is accepted. */
10676 rb_is_global_name(VALUE name)
10678 return rb_str_symname_type(name, 0) == ID_GLOBAL;
/* True when rb_str_symname_type() classifies `name` as ID_INSTANCE; the zero
 * mask means no trailing-'=' (attrset) form is accepted. */
10682 rb_is_instance_name(VALUE name)
10684 return rb_str_symname_type(name, 0) == ID_INSTANCE;
/* True when rb_str_symname_type(), called with the IDSET_ATTRSET_FOR_INTERN
 * mask, classifies `name` as ID_ATTRSET. */
10688 rb_is_attrset_name(VALUE name)
10690 return rb_str_symname_type(name, IDSET_ATTRSET_FOR_INTERN) == ID_ATTRSET;
/* True when rb_str_symname_type() classifies `name` as ID_LOCAL; the zero
 * mask means no trailing-'=' (attrset) form is accepted. */
10694 rb_is_local_name(VALUE name)
10696 return rb_str_symname_type(name, 0) == ID_LOCAL;
/* Classifies `name` with rb_str_symname_type() (zero mask) and groups the
 * ID_LOCAL, ID_ATTRSET and ID_JUNK results into one case.
 * NOTE(review): the values returned for that case and for the remaining
 * types are not visible here; presumably TRUE and FALSE -- confirm. */
10700 rb_is_method_name(VALUE name)
10702 switch (rb_str_symname_type(name, 0)) {
10703 case ID_LOCAL: case ID_ATTRSET: case ID_JUNK:
/* True when rb_str_symname_type(), called with the IDSET_ATTRSET_FOR_SYNTAX
 * mask, rejects `name` (result -1). */
10710 rb_is_junk_name(VALUE name)
10712 return rb_str_symname_type(name, IDSET_ATTRSET_FOR_SYNTAX) == -1;
10715 #endif /* !RIPPER */
/*
 * Sets the fields of `parser` to their starting values: lexer state and
 * nesting counters to 0, buffers and tables to NULL/0, VALUE slots to Qnil
 * or Qfalse, `parser_command_start` and `toplevel_p` to TRUE, and the
 * encoding to UTF-8.
 */
10718 parser_initialize(struct parser_params *parser)
10720 parser->eofp = Qfalse;
10722 parser->parser_lex_strterm = 0;
10723 parser->parser_cond_stack = 0;
10724 parser->parser_cmdarg_stack = 0;
10725 parser->parser_class_nest = 0;
10726 parser->parser_paren_nest = 0;
10727 parser->parser_lpar_beg = 0;
10728 parser->parser_brace_nest = 0;
10729 parser->parser_in_single = 0;
10730 parser->parser_in_def = 0;
10731 parser->parser_in_defined = 0;
10732 parser->parser_compile_for_eval = 0;
10733 parser->parser_cur_mid = 0;
10734 parser->parser_tokenbuf = NULL;
10735 parser->parser_tokidx = 0;
10736 parser->parser_toksiz = 0;
10737 parser->parser_heredoc_end = 0;
10738 parser->parser_command_start = TRUE;
10739 parser->parser_deferred_nodes = 0;
10740 parser->parser_lex_pbeg = 0;
10741 parser->parser_lex_p = 0;
10742 parser->parser_lex_pend = 0;
10743 parser->parser_lvtbl = 0;
10744 parser->parser_ruby__end__seen = 0;
10745 parser->parser_ruby_sourcefile = 0;
10746 parser->parser_ruby_sourcefile_string = Qnil;
/* NOTE(review): is_ripper is assigned both 0 and 1 below; presumably the two
 * groups are selected by preprocessor conditionals not shown here. */
10748 parser->is_ripper = 0;
10749 parser->parser_eval_tree_begin = 0;
10750 parser->parser_eval_tree = 0;
10752 parser->is_ripper = 1;
10753 parser->delayed = Qnil;
10755 parser->result = Qnil;
10756 parser->parsing_thread = Qnil;
10757 parser->toplevel_p = TRUE;
10760 parser->heap = NULL;
10762 parser->enc = rb_utf8_encoding();
/* Rename the GC mark and free callbacks defined below so they carry a
 * ripper_ prefix.
 * NOTE(review): presumably active only in the Ripper build -- the enclosing
 * conditional is not shown here. */
10766 #define parser_mark ripper_parser_mark
10767 #define parser_free ripper_parser_free
/* GC mark callback: `ptr` is the parser_params structure; every object or
 * node reference listed below is reported to the collector with
 * rb_gc_mark(). */
10771 parser_mark(void *ptr)
10773 struct parser_params *p = (struct parser_params*)ptr;
10775 rb_gc_mark((VALUE)p->parser_lex_strterm);
10776 rb_gc_mark((VALUE)p->parser_deferred_nodes);
10777 rb_gc_mark(p->parser_lex_input);
10778 rb_gc_mark(p->parser_lex_lastline);
10779 rb_gc_mark(p->parser_lex_nextline);
10780 rb_gc_mark(p->parser_ruby_sourcefile_string);
10782 rb_gc_mark((VALUE)p->parser_eval_tree_begin) ;
10783 rb_gc_mark((VALUE)p->parser_eval_tree) ;
10784 rb_gc_mark(p->debug_lines);
10786 rb_gc_mark(p->delayed);
10787 rb_gc_mark(p->value);
10788 rb_gc_mark(p->result);
10789 rb_gc_mark(p->parsing_thread);
/* The head of the parser-owned allocation list (see rb_parser_malloc). */
10792 rb_gc_mark((VALUE)p->heap);
/* Free callback: releases the token buffer if one exists, then walks the
 * chain of local-variable tables, freeing each table's `vars`.
 * `prev` is read before moving on so the walk does not depend on `local`
 * after its turn in the loop body. */
10797 parser_free(void *ptr)
10799 struct parser_params *p = (struct parser_params*)ptr;
10800 struct local_vars *local, *prev;
10802 if (p->parser_tokenbuf) {
10803 xfree(p->parser_tokenbuf);
10805 for (local = p->parser_lvtbl; local; local = prev) {
10806 if (local->vars) xfree(local->vars);
10807 prev = local->prev;
/* Memory-size callback: returns 0 for a NULL `ptr`; otherwise adds up the
 * structure itself, the token buffer size (parser_toksiz) and, for every
 * local-variable table in the chain, the table structure plus
 * `capa * sizeof(ID)` for its `vars`.
 * NOTE(review): the final return is not visible here; presumably `size`. */
10814 parser_memsize(const void *ptr)
10816 struct parser_params *p = (struct parser_params*)ptr;
10817 struct local_vars *local;
/* sizeof does not evaluate *p, so this is safe before the NULL check. */
10818 size_t size = sizeof(*p);
10820 if (!ptr) return 0;
10821 size += p->parser_toksiz;
10822 for (local = p->parser_lvtbl; local; local = local->prev) {
10823 size += sizeof(*local);
10824 if (local->vars) size += local->vars->capa * sizeof(ID);
10833 rb_data_type_t parser_data_type = {
/* Exported function form of reserved_word(): looks up the `len` bytes at
 * `str` and returns the matching keyword table entry as reported by
 * reserved_word(). The #undef removes any macro of the same name first so
 * that a real function is defined. */
10843 #undef rb_reserved_word
10845 const struct kwtable *
10846 rb_reserved_word(const char *str, unsigned int len)
10848 return reserved_word(str, len);
/* Allocates one parser_params structure, zero-fills it and runs
 * parser_initialize() on it.
 * NOTE(review): the function name line and the return statement are not
 * shown here; rb_parser_new() calls parser_new(), so this is presumably
 * that function returning `p`. */
10851 static struct parser_params *
10854 struct parser_params *p;
10856 p = ALLOC_N(struct parser_params, 1);
10857 MEMZERO(p, struct parser_params, 1);
10858 parser_initialize(p);
/* Creates a fresh parser with parser_new() and wraps it in a typed-data
 * object described by parser_data_type; the class argument passed is 0. */
10863 rb_parser_new(void)
10865 struct parser_params *p = parser_new();
10867 return TypedData_Wrap_Struct(0, &parser_data_type, p);
10872 * ripper#end_seen? -> Boolean
10874 * Returns true if the parsed source ended with +\_\_END\_\_+.
/* Unwraps the parser from `vparser` (type-checked against parser_data_type)
 * and converts `ruby__end__seen` to Qtrue/Qfalse.
 * NOTE(review): `ruby__end__seen` is not a local here; presumably a macro
 * that reads a field of the local `parser` -- confirm. */
10877 rb_parser_end_seen_p(VALUE vparser)
10879 struct parser_params *parser;
10881 TypedData_Get_Struct(vparser, struct parser_params, &parser_data_type, parser);
10882 return ruby__end__seen ? Qtrue : Qfalse;
10887 * ripper#encoding -> encoding
10889 * Return encoding of the source.
/* Unwraps the parser from `vparser` and returns the Encoding object for
 * `current_enc`.
 * NOTE(review): `current_enc` is not a local here; presumably a macro that
 * reads the encoding of the local `parser` -- confirm. */
10892 rb_parser_encoding(VALUE vparser)
10894 struct parser_params *parser;
10896 TypedData_Get_Struct(vparser, struct parser_params, &parser_data_type, parser);
10897 return rb_enc_from_encoding(current_enc);
10902 * ripper.yydebug -> true or false
/* Unwraps the parser from `self` and reports `yydebug` as Qtrue/Qfalse.
 * NOTE(review): `yydebug` is presumably a macro bound to the local `parser`
 * -- confirm. */
10907 rb_parser_get_yydebug(VALUE self)
10909 struct parser_params *parser;
10911 TypedData_Get_Struct(self, struct parser_params, &parser_data_type, parser);
10912 return yydebug ? Qtrue : Qfalse;
10917 * ripper.yydebug = flag
/* Unwraps the parser from `self` and stores the truthiness of `flag`
 * (RTEST) into `yydebug`.
 * NOTE(review): the returned value is not visible here. */
10922 rb_parser_set_yydebug(VALUE self, VALUE flag)
10924 struct parser_params *parser;
10926 TypedData_Get_Struct(self, struct parser_params, &parser_data_type, parser);
10927 yydebug = RTEST(flag);
/* Helpers for the list of parser-owned allocations headed by parser->heap. */
/* Size of n*size bytes expressed in YYSTYPE-sized units (integer division).
 * NOTE(review): the multiplication is not checked for overflow. */
10932 #define HEAPCNT(n, size) ((n) * (size) / sizeof(YYSTYPE))
/* Creates a NODE_ALLOCA node that carries the current list head as one of
 * its values; requires a `parser` variable in scope. */
10933 #define NEWHEAP() rb_node_newnode(NODE_ALLOCA, 0, (VALUE)parser->heap, 0)
/* Makes node `n` the new list head, stores pointer `p` in u1.node and count
 * `c` in u3.cnt; the whole expression evaluates to `p`. */
10934 #define ADD2HEAP(n, c, p) ((parser->heap = (n))->u1.node = (p), \
10935 (n)->u3.cnt = (c), (p))
/* Allocates `size` bytes with xmalloc() and records the block in the
 * parser's allocation list, returning the new pointer.
 * The list node is created before the memory is requested. */
10938 rb_parser_malloc(struct parser_params *parser, size_t size)
10940 size_t cnt = HEAPCNT(1, size);
10941 NODE *n = NEWHEAP();
10942 void *ptr = xmalloc(size);
10944 return ADD2HEAP(n, cnt, ptr);
/* Allocates `nelem` elements of `size` bytes with xcalloc() and records the
 * block in the parser's allocation list, returning the new pointer. */
10948 rb_parser_calloc(struct parser_params *parser, size_t nelem, size_t size)
10950 size_t cnt = HEAPCNT(nelem, size);
10951 NODE *n = NEWHEAP();
10952 void *ptr = xcalloc(nelem, size);
10954 return ADD2HEAP(n, cnt, ptr);
/* Resizes `ptr` to `size` bytes.
 * When `ptr` is non-NULL and the allocation list is non-empty, the list is
 * searched (following u2.node) for the node holding `ptr`; that node is
 * updated in place with the reallocated pointer and, if its count was
 * non-zero, the new count.
 * Otherwise the pointer is reallocated and added to the list as a new head.
 * NOTE(review): the statements between the search loop and the final
 * xrealloc (the early return and the creation of the new node) are not
 * visible here. */
10958 rb_parser_realloc(struct parser_params *parser, void *ptr, size_t size)
10961 size_t cnt = HEAPCNT(1, size);
10963 if (ptr && (n = parser->heap) != NULL) {
10965 if (n->u1.node == ptr) {
10966 n->u1.node = ptr = xrealloc(ptr, size);
10967 if (n->u3.cnt) n->u3.cnt = cnt;
10970 } while ((n = n->u2.node) != NULL);
10973 ptr = xrealloc(ptr, size);
10974 return ADD2HEAP(n, cnt, ptr);
/* Removes the list node that holds `ptr` from the parser's allocation list
 * and hands the node back with rb_gc_force_recycle().
 * `prev` always points at the link that refers to the current node, so
 * unlinking is a single assignment, also for the list head.
 * NOTE(review): the release of `ptr` itself is not visible here. */
10978 rb_parser_free(struct parser_params *parser, void *ptr)
10980 NODE **prev = &parser->heap, *n;
10982 while ((n = *prev) != NULL) {
10983 if (n->u1.node == ptr) {
10984 *prev = n->u2.node;
10985 rb_gc_force_recycle((VALUE)n);
10988 prev = &n->u2.node;
10996 #ifdef RIPPER_DEBUG
10997 extern int rb_is_pointer_to_heap(VALUE);
/* Debug helper: returns `x` unchanged for Qfalse, Qtrue, Qnil, Fixnums and
 * Symbols, and raises ArgumentError for Qundef, for values that
 * rb_is_pointer_to_heap() rejects, for nodes other than NODE_LASGN and for
 * unexpected object types. A NODE_LASGN node yields its nd_rval.
 * NOTE(review): `x` is a VALUE but is printed with "%p" in the messages
 * below; a cast to (void *) would match the conversion. */
11001 ripper_validate_object(VALUE self, VALUE x)
11003 if (x == Qfalse) return x;
11004 if (x == Qtrue) return x;
11005 if (x == Qnil) return x;
11007 rb_raise(rb_eArgError, "Qundef given");
11008 if (FIXNUM_P(x)) return x;
11009 if (SYMBOL_P(x)) return x;
11010 if (!rb_is_pointer_to_heap(x))
11011 rb_raise(rb_eArgError, "invalid pointer: %p", x);
11020 if (nd_type(x) != NODE_LASGN) {
11021 rb_raise(rb_eArgError, "NODE given: %p", x);
11023 return ((NODE *)x)->nd_rval;
11025 rb_raise(rb_eArgError, "wrong type of ruby object: %p (%s)",
11026 x, rb_obj_classname(x));
/* Replaces the lvalue `x` with get_value(x); `x` is evaluated twice. */
11032 #define validate(x) ((x) = get_value(x))
/* Calls method `mid` on parser->value with no arguments and returns the
 * result of rb_funcall(). */
11035 ripper_dispatch0(struct parser_params *parser, ID mid)
11037 return rb_funcall(parser->value, mid, 0);
/* Calls method `mid` on parser->value with one argument and returns the
 * result of rb_funcall(). */
11041 ripper_dispatch1(struct parser_params *parser, ID mid, VALUE a)
11044 return rb_funcall(parser->value, mid, 1, a);
/* Calls method `mid` on parser->value with two arguments and returns the
 * result of rb_funcall(). */
11048 ripper_dispatch2(struct parser_params *parser, ID mid, VALUE a, VALUE b)
11052 return rb_funcall(parser->value, mid, 2, a, b);
/* Calls method `mid` on parser->value with three arguments and returns the
 * result of rb_funcall(). */
11056 ripper_dispatch3(struct parser_params *parser, ID mid, VALUE a, VALUE b, VALUE c)
11061 return rb_funcall(parser->value, mid, 3, a, b, c);
/* Calls method `mid` on parser->value with four arguments and returns the
 * result of rb_funcall(). */
11065 ripper_dispatch4(struct parser_params *parser, ID mid, VALUE a, VALUE b, VALUE c, VALUE d)
11071 return rb_funcall(parser->value, mid, 4, a, b, c, d);
/* Calls method `mid` on parser->value with five arguments and returns the
 * result of rb_funcall(). */
11075 ripper_dispatch5(struct parser_params *parser, ID mid, VALUE a, VALUE b, VALUE c, VALUE d, VALUE e)
11082 return rb_funcall(parser->value, mid, 5, a, b, c, d, e);
/* Calls method `mid` on parser->value with seven arguments and returns the
 * result of rb_funcall(). */
11086 ripper_dispatch7(struct parser_params *parser, ID mid, VALUE a, VALUE b, VALUE c, VALUE d, VALUE e, VALUE f, VALUE g)
11095 return rb_funcall(parser->value, mid, 7, a, b, c, d, e, f, g);
/* Table pairing keyword token IDs with their source spelling. Several
 * tokens share one spelling: the three `do` tokens, and the modifier_*
 * tokens that repeat the spelling of their keyword_* counterparts.
 * keyword_id_to_str() scans this table until it meets an entry whose id
 * is 0. */
11098 static const struct kw_assoc {
11101 } keyword_to_name[] = {
11102 {keyword_class, "class"},
11103 {keyword_module, "module"},
11104 {keyword_def, "def"},
11105 {keyword_undef, "undef"},
11106 {keyword_begin, "begin"},
11107 {keyword_rescue, "rescue"},
11108 {keyword_ensure, "ensure"},
11109 {keyword_end, "end"},
11110 {keyword_if, "if"},
11111 {keyword_unless, "unless"},
11112 {keyword_then, "then"},
11113 {keyword_elsif, "elsif"},
11114 {keyword_else, "else"},
11115 {keyword_case, "case"},
11116 {keyword_when, "when"},
11117 {keyword_while, "while"},
11118 {keyword_until, "until"},
11119 {keyword_for, "for"},
11120 {keyword_break, "break"},
11121 {keyword_next, "next"},
11122 {keyword_redo, "redo"},
11123 {keyword_retry, "retry"},
11124 {keyword_in, "in"},
11125 {keyword_do, "do"},
11126 {keyword_do_cond, "do"},
11127 {keyword_do_block, "do"},
11128 {keyword_return, "return"},
11129 {keyword_yield, "yield"},
11130 {keyword_super, "super"},
11131 {keyword_self, "self"},
11132 {keyword_nil, "nil"},
11133 {keyword_true, "true"},
11134 {keyword_false, "false"},
11135 {keyword_and, "and"},
11136 {keyword_or, "or"},
11137 {keyword_not, "not"},
11138 {modifier_if, "if"},
11139 {modifier_unless, "unless"},
11140 {modifier_while, "while"},
11141 {modifier_until, "until"},
11142 {modifier_rescue, "rescue"},
11143 {keyword_alias, "alias"},
11144 {keyword_defined, "defined?"},
11145 {keyword_BEGIN, "BEGIN"},
11146 {keyword_END, "END"},
11147 {keyword__LINE__, "__LINE__"},
11148 {keyword__FILE__, "__FILE__"},
11149 {keyword__ENCODING__, "__ENCODING__"},
/* Walks keyword_to_name from its first entry until an entry with a zero id.
 * NOTE(review): the loop body and the returns are not visible here;
 * ripper_id2sym() treats the result as a spelling or a false value, so
 * presumably the matching entry's name or NULL is returned. */
11154 keyword_id_to_str(ID id)
11156 const struct kw_assoc *a;
11158 for (a = keyword_to_name; a->id; a++) {
/* Converts a token/ID into a Symbol for Ripper events. The visible paths
 * are: a one-byte name interned with rb_intern2(), a keyword spelling found
 * by keyword_id_to_str(), and a name obtained from rb_id2name().
 * The #undef removes any macro of the same name before the definition.
 * NOTE(review): the rb_bug() message uses "%ld" while the argument is cast
 * to unsigned long; "%lu" would match the argument type. */
11165 #undef ripper_id2sym
11167 ripper_id2sym(ID id)
11175 return ID2SYM(rb_intern2(buf, 1));
11177 if ((name = keyword_id_to_str(id))) {
11178 return ID2SYM(rb_intern(name));
11188 name = rb_id2name(id);
11190 rb_bug("cannot convert ID to string: %ld", (unsigned long)id);
11194 return ID2SYM(rb_intern(name));
/* Returns 0 unless `v` is a T_NODE whose node type is NODE_LASGN.
 * NOTE(review): the value returned for a NODE_LASGN node is not visible
 * here. */
11198 ripper_get_id(VALUE v)
11201 if (!RB_TYPE_P(v, T_NODE)) return 0;
11203 if (nd_type(nd) != NODE_LASGN) return 0;
/* Normalizes a semantic value: Qundef becomes Qnil, anything that is not a
 * T_NODE is returned as is, a NODE_LASGN node yields its nd_rval and any
 * other node yields Qnil. */
11208 ripper_get_value(VALUE v)
11211 if (v == Qundef) return Qnil;
11212 if (!RB_TYPE_P(v, T_NODE)) return v;
11214 if (nd_type(nd) != NODE_LASGN) return Qnil;
11215 return nd->nd_rval;
/* Formats the printf-style message `fmt` and its variadic arguments into a
 * string with rb_vsprintf() and passes it to the `compile_error` method of
 * parser->value. */
11219 ripper_compile_error(struct parser_params *parser, const char *fmt, ...)
11224 va_start(args, fmt);
11225 str = rb_vsprintf(fmt, args);
11227 rb_funcall(parser->value, rb_intern("compile_error"), 1, str);
/* Calls the `warn` method of parser->value with the format string only;
 * no formatting is done here. */
11231 ripper_warn0(struct parser_params *parser, const char *fmt)
11233 rb_funcall(parser->value, rb_intern("warn"), 1, STR_NEW2(fmt));
/* Calls the `warn` method of parser->value with the format string and the
 * integer `a` converted with INT2NUM(); formatting is left to the callee. */
11237 ripper_warnI(struct parser_params *parser, const char *fmt, int a)
11239 rb_funcall(parser->value, rb_intern("warn"), 2,
11240 STR_NEW2(fmt), INT2NUM(a));
/* Calls the `warn` method of parser->value with the format string and the
 * C string `str` converted with STR_NEW2(); formatting is left to the
 * callee. */
11244 ripper_warnS(struct parser_params *parser, const char *fmt, const char *str)
11246 rb_funcall(parser->value, rb_intern("warn"), 2,
11247 STR_NEW2(fmt), STR_NEW2(str));
/* Calls the `warning` method of parser->value with the format string
 * only. */
11251 ripper_warning0(struct parser_params *parser, const char *fmt)
11253 rb_funcall(parser->value, rb_intern("warning"), 1, STR_NEW2(fmt));
/* Calls the `warning` method of parser->value with the format string and
 * the C string `str` converted with STR_NEW2(). */
11257 ripper_warningS(struct parser_params *parser, const char *fmt, const char *str)
11259 rb_funcall(parser->value, rb_intern("warning"), 2,
11260 STR_NEW2(fmt), STR_NEW2(str));
/* Line reader installed for file-like sources (see ripper_initialize):
 * returns the result of rb_io_gets() on `src`. `parser` is not used. */
11264 ripper_lex_get_generic(struct parser_params *parser, VALUE src)
11266 return rb_io_gets(src);
/* Allocator for Ripper objects: creates one zero-filled parser_params
 * structure and wraps it in a typed-data object of class `klass`.
 * parser_initialize() is not called here; ripper_initialize() does that.
 * NOTE(review): the remaining statements, including the return of `self`,
 * are not visible here. */
11270 ripper_s_allocate(VALUE klass)
11272 struct parser_params *p;
11275 p = ALLOC_N(struct parser_params, 1);
11276 MEMZERO(p, struct parser_params, 1);
11277 self = TypedData_Wrap_Struct(klass, &parser_data_type, p);
/* A parser counts as initialized once its lexer input has been set
 * (ripper_initialize stores the source there; the allocator zero-fills). */
11282 #define ripper_initialized_p(r) ((r)->parser_lex_input != 0)
11286 * Ripper.new(src, filename="(ripper)", lineno=1) -> ripper
11288 * Create a new Ripper object.
11289 * _src_ must be a String, an IO, or an Object which has #gets method.
11291 * This method does not start parsing.
11292 * See also Ripper#parse and Ripper.parse.
/*
 * Implements Ripper#initialize(src, filename, lineno).
 *
 * rb_scan_args "12" takes one required and two optional arguments.
 * A T_FILE source is read through ripper_lex_get_generic; lex_get_str is
 * selected on a path whose condition is not visible here.
 * A nil filename defaults to "(ripper)"; otherwise it is checked with
 * StringValue(). The starting line is stored as `lineno - 1`, or 0 when
 * lineno is nil.
 */
11295 ripper_initialize(int argc, VALUE *argv, VALUE self)
11297 struct parser_params *parser;
11298 VALUE src, fname, lineno;
11300 TypedData_Get_Struct(self, struct parser_params, &parser_data_type, parser);
11301 rb_scan_args(argc, argv, "12", &src, &fname, &lineno);
11302 if (RB_TYPE_P(src, T_FILE)) {
11303 parser->parser_lex_gets = ripper_lex_get_generic;
11307 parser->parser_lex_gets = lex_get_str;
11309 parser->parser_lex_input = src;
11310 parser->eofp = Qfalse;
11311 if (NIL_P(fname)) {
11312 fname = STR_NEW2("(ripper)");
11315 StringValue(fname);
/* parser_initialize() leaves parser_lex_input and parser_lex_gets alone,
 * so the assignments above survive this call. */
11317 parser_initialize(parser);
/* Keep the String object as well as its character pointer. */
11319 parser->parser_ruby_sourcefile_string = fname;
11320 parser->parser_ruby_sourcefile = RSTRING_PTR(fname);
11321 parser->parser_ruby_sourceline = NIL_P(lineno) ? 0 : NUM2INT(lineno) - 1;
/* Argument bundle carrying a parser pointer.
 * NOTE(review): any further members are not visible here, and no use of
 * this structure appears in the surrounding functions. */
11326 struct ripper_args {
11327 struct parser_params *parser;
/* Body run under rb_ensure() by ripper_parse(): unwraps the parser, prepares
 * it with parser_prepare(), runs ripper_yyparse() and returns the stored
 * result. */
11333 ripper_parse0(VALUE parser_v)
11335 struct parser_params *parser;
11337 TypedData_Get_Struct(parser_v, struct parser_params, &parser_data_type, parser);
11338 parser_prepare(parser);
11339 ripper_yyparse((void*)parser);
11340 return parser->result;
/* Ensure handler paired with ripper_parse0(): clears parsing_thread so the
 * parser no longer appears to be in use, however the parse ended. */
11344 ripper_ensure(VALUE parser_v)
11346 struct parser_params *parser;
11348 TypedData_Get_Struct(parser_v, struct parser_params, &parser_data_type, parser);
11349 parser->parsing_thread = Qnil;
11357 * Starts parsing and returns the value of the root action.
/*
 * Implements Ripper#parse.
 * Raises ArgumentError when the object has not been initialized, and when a
 * parse is already in progress: "not reentrant" if it runs on the current
 * thread, "not multithread-safe" otherwise.
 * The current thread is recorded in parsing_thread for the duration of the
 * parse; ripper_ensure() clears it again. Returns parser->result.
 */
11360 ripper_parse(VALUE self)
11362 struct parser_params *parser;
11364 TypedData_Get_Struct(self, struct parser_params, &parser_data_type, parser);
11365 if (!ripper_initialized_p(parser)) {
11366 rb_raise(rb_eArgError, "method called for uninitialized object");
11368 if (!NIL_P(parser->parsing_thread)) {
11369 if (parser->parsing_thread == rb_thread_current())
11370 rb_raise(rb_eArgError, "Ripper#parse is not reentrant");
11372 rb_raise(rb_eArgError, "Ripper#parse is not multithread-safe");
11374 parser->parsing_thread = rb_thread_current();
11375 rb_ensure(ripper_parse0, self, ripper_ensure, self);
11377 return parser->result;
11382 * ripper#column -> Integer
11384 * Return column number of current parsing line.
11385 * This number starts from 0.
/* Implements Ripper#column: raises ArgumentError for an uninitialized
 * object, returns nil when no parse is in progress, and otherwise returns
 * the distance from the start of the line buffer (parser_lex_pbeg) to the
 * current token pointer (tokp). */
11388 ripper_column(VALUE self)
11390 struct parser_params *parser;
11393 TypedData_Get_Struct(self, struct parser_params, &parser_data_type, parser);
11394 if (!ripper_initialized_p(parser)) {
11395 rb_raise(rb_eArgError, "method called for uninitialized object");
11397 if (NIL_P(parser->parsing_thread)) return Qnil;
11398 col = parser->tokp - parser->parser_lex_pbeg;
11399 return LONG2NUM(col);
11404 * ripper#filename -> String
11406 * Return current parsing filename.
/* Implements Ripper#filename: raises ArgumentError for an uninitialized
 * object, otherwise returns the String stored by ripper_initialize(). */
11409 ripper_filename(VALUE self)
11411 struct parser_params *parser;
11413 TypedData_Get_Struct(self, struct parser_params, &parser_data_type, parser);
11414 if (!ripper_initialized_p(parser)) {
11415 rb_raise(rb_eArgError, "method called for uninitialized object");
11417 return parser->parser_ruby_sourcefile_string;
11422 * ripper#lineno -> Integer
11424 * Return line number of current parsing line.
11425 * This number starts from 1.
/* Implements Ripper#lineno: raises ArgumentError for an uninitialized
 * object, returns nil when no parse is in progress, and otherwise returns
 * the parser's current source line as an Integer. */
11428 ripper_lineno(VALUE self)
11430 struct parser_params *parser;
11432 TypedData_Get_Struct(self, struct parser_params, &parser_data_type, parser);
11433 if (!ripper_initialized_p(parser)) {
11434 rb_raise(rb_eArgError, "method called for uninitialized object");
11436 if (NIL_P(parser->parsing_thread)) return Qnil;
11437 return INT2NUM(parser->parser_ruby_sourceline);
11440 #ifdef RIPPER_DEBUG
/* Debug helper: raises ArgumentError with the text of `msg` when `obj` is
 * Qundef. The message is passed through "%s" rather than used as the format
 * string itself.
 * NOTE(review): the value returned otherwise is not visible here. */
11443 ripper_assert_Qundef(VALUE self, VALUE obj, VALUE msg)
11446 if (obj == Qundef) {
11447 rb_raise(rb_eArgError, "%s", RSTRING_PTR(msg));
/* Debug helper: returns the raw VALUE word of `obj` as an Integer. */
11454 ripper_value(VALUE self, VALUE obj)
11456 return ULONG2NUM(obj);
/* NOTE(review): the signature line is not shown in this excerpt; presumably
 * the body of the extension's Init function -- confirm.
 * Sets the parent of parser_data_type to the data type of an object made by
 * rb_parser_new(), initializes the two event ID groups, and interns "||"
 * and "&&" so that both exist in the symbol table. */
11464 parser_data_type.parent = RTYPEDDATA_TYPE(rb_parser_new());
11466 ripper_init_eventids1();
11467 ripper_init_eventids2();
11468 /* ensure existing in symbol table */
11469 (void)rb_intern("||");
11470 (void)rb_intern("&&");
/* Defines the Ripper class under Object: its Version constant, allocator
 * and instance methods, plus (in RIPPER_DEBUG builds) three helper methods
 * on Kernel, and finally fills the two event ID tables. */
11476 InitVM_ripper(void)
11480 Ripper = rb_define_class("Ripper", rb_cObject);
11481 rb_define_const(Ripper, "Version", rb_usascii_str_new2(RIPPER_VERSION));
11482 rb_define_alloc_func(Ripper, ripper_s_allocate);
/* The trailing number is the argument count; -1 selects the
 * (argc, argv, self) calling form used by ripper_initialize. */
11483 rb_define_method(Ripper, "initialize", ripper_initialize, -1);
11484 rb_define_method(Ripper, "parse", ripper_parse, 0);
11485 rb_define_method(Ripper, "column", ripper_column, 0);
11486 rb_define_method(Ripper, "filename", ripper_filename, 0);
11487 rb_define_method(Ripper, "lineno", ripper_lineno, 0);
11488 rb_define_method(Ripper, "end_seen?", rb_parser_end_seen_p, 0);
11489 rb_define_method(Ripper, "encoding", rb_parser_encoding, 0);
11490 rb_define_method(Ripper, "yydebug", rb_parser_get_yydebug, 0);
11491 rb_define_method(Ripper, "yydebug=", rb_parser_set_yydebug, 1);
11492 #ifdef RIPPER_DEBUG
11493 rb_define_method(rb_mKernel, "assert_Qundef", ripper_assert_Qundef, 2);
11494 rb_define_method(rb_mKernel, "rawVALUE", ripper_value, 1);
11495 rb_define_method(rb_mKernel, "validate_object", ripper_validate_object, 1);
11498 ripper_init_eventids1_table(Ripper);
11499 ripper_init_eventids2_table(Ripper);
11502 /* Hack to let RDoc document SCRIPT_LINES__ */
11505 * When a Hash is assigned to +SCRIPT_LINES__+ the contents of files loaded
11506 * after the assignment will be added as an Array of lines with the file
11509 rb_define_global_const("SCRIPT_LINES__", Qnil);
11513 #endif /* RIPPER */