diff options
Diffstat (limited to 'trunk/parse.y')
-rw-r--r-- | trunk/parse.y | 10013 |
1 files changed, 0 insertions, 10013 deletions
diff --git a/trunk/parse.y b/trunk/parse.y deleted file mode 100644 index 10e0c2c128..0000000000 --- a/trunk/parse.y +++ /dev/null @@ -1,10013 +0,0 @@ -/********************************************************************** - - parse.y - - - $Author$ - created at: Fri May 28 18:02:42 JST 1993 - - Copyright (C) 1993-2007 Yukihiro Matsumoto - -**********************************************************************/ - -%{ - -#define YYDEBUG 1 -#define YYERROR_VERBOSE 1 -#define YYSTACK_USE_ALLOCA 0 - -#include "ruby/ruby.h" -#include "ruby/intern.h" -#include "ruby/node.h" -#include "ruby/st.h" -#include "ruby/encoding.h" -#include "id.h" -#include "regenc.h" -#include <stdio.h> -#include <errno.h> -#include <ctype.h> - -#define YYMALLOC(size) rb_parser_malloc(parser, size) -#define YYREALLOC(ptr, size) rb_parser_realloc(parser, ptr, size) -#define YYCALLOC(nelem, size) rb_parser_calloc(parser, nelem, size) -#define YYFREE(ptr) rb_parser_free(parser, ptr) -#define malloc YYMALLOC -#define realloc YYREALLOC -#define calloc YYCALLOC -#define free YYFREE - -#ifndef RIPPER -static ID register_symid(ID, const char *, long, rb_encoding *); -#define REGISTER_SYMID(id, name) register_symid(id, name, strlen(name), enc) -#include "id.c" -#endif - -#define is_notop_id(id) ((id)>tLAST_TOKEN) -#define is_local_id(id) (is_notop_id(id)&&((id)&ID_SCOPE_MASK)==ID_LOCAL) -#define is_global_id(id) (is_notop_id(id)&&((id)&ID_SCOPE_MASK)==ID_GLOBAL) -#define is_instance_id(id) (is_notop_id(id)&&((id)&ID_SCOPE_MASK)==ID_INSTANCE) -#define is_attrset_id(id) (is_notop_id(id)&&((id)&ID_SCOPE_MASK)==ID_ATTRSET) -#define is_const_id(id) (is_notop_id(id)&&((id)&ID_SCOPE_MASK)==ID_CONST) -#define is_class_id(id) (is_notop_id(id)&&((id)&ID_SCOPE_MASK)==ID_CLASS) -#define is_junk_id(id) (is_notop_id(id)&&((id)&ID_SCOPE_MASK)==ID_JUNK) - -#define is_asgn_or_id(id) ((is_notop_id(id)) && \ - (((id)&ID_SCOPE_MASK) == ID_GLOBAL || \ - ((id)&ID_SCOPE_MASK) == ID_INSTANCE || \ - ((id)&ID_SCOPE_MASK) == 
ID_CLASS)) - -enum lex_state_e { - EXPR_BEG, /* ignore newline, +/- is a sign. */ - EXPR_END, /* newline significant, +/- is a operator. */ - EXPR_ENDARG, /* ditto, and unbound braces. */ - EXPR_ARG, /* newline significant, +/- is a operator. */ - EXPR_CMDARG, /* newline significant, +/- is a operator. */ - EXPR_MID, /* newline significant, +/- is a operator. */ - EXPR_FNAME, /* ignore newline, no reserved words. */ - EXPR_DOT, /* right after `.' or `::', no reserved words. */ - EXPR_CLASS, /* immediate after `class', no here document. */ - EXPR_VALUE /* alike EXPR_BEG but label is disallowed. */ -}; - -# ifdef HAVE_LONG_LONG -typedef unsigned LONG_LONG stack_type; -# else -typedef unsigned long stack_type; -# endif - -# define BITSTACK_PUSH(stack, n) (stack = (stack<<1)|((n)&1)) -# define BITSTACK_POP(stack) (stack = stack >> 1) -# define BITSTACK_LEXPOP(stack) (stack = (stack >> 1) | (stack & 1)) -# define BITSTACK_SET_P(stack) (stack&1) - -#define COND_PUSH(n) BITSTACK_PUSH(cond_stack, n) -#define COND_POP() BITSTACK_POP(cond_stack) -#define COND_LEXPOP() BITSTACK_LEXPOP(cond_stack) -#define COND_P() BITSTACK_SET_P(cond_stack) - -#define CMDARG_PUSH(n) BITSTACK_PUSH(cmdarg_stack, n) -#define CMDARG_POP() BITSTACK_POP(cmdarg_stack) -#define CMDARG_LEXPOP() BITSTACK_LEXPOP(cmdarg_stack) -#define CMDARG_P() BITSTACK_SET_P(cmdarg_stack) - -struct vtable { - ID *tbl; - int pos; - int capa; - struct vtable *prev; -}; - -struct local_vars { - struct vtable *args; - struct vtable *vars; - struct local_vars *prev; -}; - -#define DVARS_INHERIT ((void*)1) -#define DVARS_TOPSCOPE NULL -#define DVARS_SPECIAL_P(tbl) (!POINTER_P(tbl)) -#define POINTER_P(val) ((VALUE)(val) & ~(VALUE)3) - -#ifndef RIPPER -static int -vtable_size(const struct vtable *tbl) -{ - if (POINTER_P(tbl)) { - return tbl->pos; - } - else { - return 0; - } -} - -#define VTBL_DEBUG 0 - -static struct vtable * -vtable_alloc(struct vtable *prev) -{ - struct vtable *tbl = ALLOC(struct vtable); - tbl->pos = 0; - 
tbl->capa = 8; - tbl->tbl = ALLOC_N(ID, tbl->capa); - tbl->prev = prev; - if (VTBL_DEBUG) printf("vtable_alloc: %p\n", tbl); - return tbl; -} - -static void -vtable_free(struct vtable *tbl) -{ - if (VTBL_DEBUG)printf("vtable_free: %p\n", tbl); - if (POINTER_P(tbl)) { - if (tbl->tbl) { - xfree(tbl->tbl); - } - xfree(tbl); - } -} - -static void -vtable_add(struct vtable *tbl, ID id) -{ - if (!POINTER_P(tbl)) { - rb_bug("vtable_add: vtable is not allocated (%p)", tbl); - } - if (VTBL_DEBUG) printf("vtable_add: %p, %s\n", tbl, rb_id2name(id)); - - if (tbl->pos == tbl->capa) { - tbl->capa = tbl->capa * 2; - REALLOC_N(tbl->tbl, ID, tbl->capa); - } - tbl->tbl[tbl->pos++] = id; -} - -static int -vtable_included(const struct vtable * tbl, ID id) -{ - int i; - - if (POINTER_P(tbl)) { - for (i = 0; i < tbl->pos; i++) { - if (tbl->tbl[i] == id) { - return 1; - } - } - } - return 0; -} -#endif - -/* - Structure of Lexer Buffer: - - lex_pbeg tokp lex_p lex_pend - | | | | - |-----------+--------------+------------| - |<------------>| - token -*/ -struct parser_params { - int is_ripper; - NODE *heap; - - YYSTYPE *parser_yylval; - VALUE eofp; - - NODE *parser_lex_strterm; - enum lex_state_e parser_lex_state; - stack_type parser_cond_stack; - stack_type parser_cmdarg_stack; - int parser_class_nest; - int parser_paren_nest; - int parser_lpar_beg; - int parser_in_single; - int parser_in_def; - int parser_compile_for_eval; - VALUE parser_cur_mid; - int parser_in_defined; - char *parser_tokenbuf; - int parser_tokidx; - int parser_toksiz; - VALUE parser_lex_input; - VALUE parser_lex_lastline; - VALUE parser_lex_nextline; - const char *parser_lex_pbeg; - const char *parser_lex_p; - const char *parser_lex_pend; - int parser_heredoc_end; - int parser_command_start; - NODE *parser_deferred_nodes; - int parser_lex_gets_ptr; - VALUE (*parser_lex_gets)(struct parser_params*,VALUE); - struct local_vars *parser_lvtbl; - int parser_ruby__end__seen; - int line_count; - int has_shebang; - char 
*parser_ruby_sourcefile; /* current source file */ - int parser_ruby_sourceline; /* current line no. */ - rb_encoding *enc; - rb_encoding *utf8; - - int parser_yydebug; - -#ifndef RIPPER - /* Ruby core only */ - NODE *parser_eval_tree_begin; - NODE *parser_eval_tree; - VALUE debug_lines; - VALUE coverage; - int nerr; -#else - /* Ripper only */ - VALUE parser_ruby_sourcefile_string; - const char *tokp; - VALUE delayed; - int delayed_line; - int delayed_col; - - VALUE value; - VALUE result; - VALUE parsing_thread; - int toplevel_p; -#endif -}; - -#define UTF8_ENC() (parser->utf8 ? parser->utf8 : \ - (parser->utf8 = rb_utf8_encoding())) -#define STR_NEW(p,n) rb_enc_str_new((p),(n),parser->enc) -#define STR_NEW0() rb_usascii_str_new(0,0) -#define STR_NEW2(p) rb_enc_str_new((p),strlen(p),parser->enc) -#define STR_NEW3(p,n,e,func) parser_str_new((p),(n),(e),(func),parser->enc) -#define STR_ENC(m) ((m)?parser->enc:rb_usascii_encoding()) -#define ENC_SINGLE(cr) ((cr)==ENC_CODERANGE_7BIT) -#define TOK_INTERN(mb) rb_intern3(tok(), toklen(), STR_ENC(mb)) - -#ifdef YYMALLOC -void *rb_parser_malloc(struct parser_params *, size_t); -void *rb_parser_realloc(struct parser_params *, void *, size_t); -void *rb_parser_calloc(struct parser_params *, size_t, size_t); -void rb_parser_free(struct parser_params *, void *); -#endif - -static int parser_yyerror(struct parser_params*, const char*); -#define yyerror(msg) parser_yyerror(parser, msg) - -#define YYLEX_PARAM parser - -#define lex_strterm (parser->parser_lex_strterm) -#define lex_state (parser->parser_lex_state) -#define cond_stack (parser->parser_cond_stack) -#define cmdarg_stack (parser->parser_cmdarg_stack) -#define class_nest (parser->parser_class_nest) -#define paren_nest (parser->parser_paren_nest) -#define lpar_beg (parser->parser_lpar_beg) -#define in_single (parser->parser_in_single) -#define in_def (parser->parser_in_def) -#define compile_for_eval (parser->parser_compile_for_eval) -#define cur_mid 
(parser->parser_cur_mid) -#define in_defined (parser->parser_in_defined) -#define tokenbuf (parser->parser_tokenbuf) -#define tokidx (parser->parser_tokidx) -#define toksiz (parser->parser_toksiz) -#define lex_input (parser->parser_lex_input) -#define lex_lastline (parser->parser_lex_lastline) -#define lex_nextline (parser->parser_lex_nextline) -#define lex_pbeg (parser->parser_lex_pbeg) -#define lex_p (parser->parser_lex_p) -#define lex_pend (parser->parser_lex_pend) -#define heredoc_end (parser->parser_heredoc_end) -#define command_start (parser->parser_command_start) -#define deferred_nodes (parser->parser_deferred_nodes) -#define lex_gets_ptr (parser->parser_lex_gets_ptr) -#define lex_gets (parser->parser_lex_gets) -#define lvtbl (parser->parser_lvtbl) -#define ruby__end__seen (parser->parser_ruby__end__seen) -#define ruby_sourceline (parser->parser_ruby_sourceline) -#define ruby_sourcefile (parser->parser_ruby_sourcefile) -#define yydebug (parser->parser_yydebug) -#ifdef RIPPER -#else -#define ruby_eval_tree (parser->parser_eval_tree) -#define ruby_eval_tree_begin (parser->parser_eval_tree_begin) -#define ruby_debug_lines (parser->debug_lines) -#define ruby_coverage (parser->coverage) -#endif - -static int yylex(void*, void*); - -#ifndef RIPPER -#define yyparse ruby_yyparse - -static NODE* node_newnode(struct parser_params *, enum node_type, VALUE, VALUE, VALUE); -#define rb_node_newnode(type, a1, a2, a3) node_newnode(parser, type, a1, a2, a3) - -static NODE *cond_gen(struct parser_params*,NODE*); -#define cond(node) cond_gen(parser, node) -static NODE *logop_gen(struct parser_params*,enum node_type,NODE*,NODE*); -#define logop(type,node1,node2) logop_gen(parser, type, node1, node2) - -static NODE *newline_node(NODE*); -static void fixpos(NODE*,NODE*); - -static int value_expr_gen(struct parser_params*,NODE*); -static void void_expr_gen(struct parser_params*,NODE*); -static NODE *remove_begin(NODE*); -#define value_expr(node) value_expr_gen(parser, (node) = 
remove_begin(node)) -#define void_expr0(node) void_expr_gen(parser, (node)) -#define void_expr(node) void_expr0((node) = remove_begin(node)) -static void void_stmts_gen(struct parser_params*,NODE*); -#define void_stmts(node) void_stmts_gen(parser, node) -static void reduce_nodes_gen(struct parser_params*,NODE**); -#define reduce_nodes(n) reduce_nodes_gen(parser,n) -static void block_dup_check_gen(struct parser_params*,NODE*,NODE*); -#define block_dup_check(n1,n2) block_dup_check_gen(parser,n1,n2) - -static NODE *block_append_gen(struct parser_params*,NODE*,NODE*); -#define block_append(h,t) block_append_gen(parser,h,t) -static NODE *list_append_gen(struct parser_params*,NODE*,NODE*); -#define list_append(l,i) list_append_gen(parser,l,i) -static NODE *list_concat_gen(struct parser_params*,NODE*,NODE*); -#define list_concat(h,t) list_concat_gen(parser,h,t) -static NODE *arg_append_gen(struct parser_params*,NODE*,NODE*); -#define arg_append(h,t) arg_append_gen(parser,h,t) -static NODE *arg_concat_gen(struct parser_params*,NODE*,NODE*); -#define arg_concat(h,t) arg_concat_gen(parser,h,t) -static NODE *literal_concat_gen(struct parser_params*,NODE*,NODE*); -#define literal_concat(h,t) literal_concat_gen(parser,h,t) -static NODE *new_evstr_gen(struct parser_params*,NODE*); -#define new_evstr(n) new_evstr_gen(parser,n) -static NODE *evstr2dstr_gen(struct parser_params*,NODE*); -#define evstr2dstr(n) evstr2dstr_gen(parser,n) -static NODE *splat_array(NODE*); - -static NODE *call_bin_op_gen(struct parser_params*,NODE*,ID,NODE*); -#define call_bin_op(recv,id,arg1) call_bin_op_gen(parser, recv,id,arg1) -static NODE *call_uni_op_gen(struct parser_params*,NODE*,ID); -#define call_uni_op(recv,id) call_uni_op_gen(parser, recv,id) - -static NODE *new_args_gen(struct parser_params*,NODE*,NODE*,ID,NODE*,ID); -#define new_args(f,o,r,p,b) new_args_gen(parser, f,o,r,p,b) -static void shadowing_lvar_gen(struct parser_params*,ID); -#define shadowing_lvar(name) shadowing_lvar_gen(parser, 
name) - -static NODE *negate_lit(NODE*); -static NODE *ret_args_gen(struct parser_params*,NODE*); -#define ret_args(node) ret_args_gen(parser, node) -static NODE *arg_blk_pass(NODE*,NODE*); -static NODE *new_yield_gen(struct parser_params*,NODE*); -#define new_yield(node) new_yield_gen(parser, node) - -static NODE *gettable_gen(struct parser_params*,ID); -#define gettable(id) gettable_gen(parser,id) -static NODE *assignable_gen(struct parser_params*,ID,NODE*); -#define assignable(id,node) assignable_gen(parser, id, node) -static void new_bv_gen(struct parser_params*,ID); -#define new_bv(id) new_bv_gen(parser, id) -static NODE *aryset_gen(struct parser_params*,NODE*,NODE*); -#define aryset(node1,node2) aryset_gen(parser, node1, node2) -static NODE *attrset_gen(struct parser_params*,NODE*,ID); -#define attrset(node,id) attrset_gen(parser, node, id) - -static void rb_backref_error_gen(struct parser_params*,NODE*); -#define rb_backref_error(n) rb_backref_error_gen(parser,n) -static NODE *node_assign_gen(struct parser_params*,NODE*,NODE*); -#define node_assign(node1, node2) node_assign_gen(parser, node1, node2) - -static NODE *match_op_gen(struct parser_params*,NODE*,NODE*); -#define match_op(node1,node2) match_op_gen(parser, node1, node2) - -static void local_push_gen(struct parser_params*,int); -#define local_push(top) local_push_gen(parser,top) -static void local_pop_gen(struct parser_params*); -#define local_pop() local_pop_gen(parser) -static int local_var_gen(struct parser_params*, ID); -#define local_var(id) local_var_gen(parser, id); -static int arg_var_gen(struct parser_params*, ID); -#define arg_var(id) arg_var_gen(parser, id) -static int local_id_gen(struct parser_params*, ID); -#define local_id(id) local_id_gen(parser, id) -static ID *local_tbl_gen(struct parser_params*); -#define local_tbl() local_tbl_gen(parser) -static ID internal_id_gen(struct parser_params*); -#define internal_id() internal_id_gen(parser) - -static void dyna_push_gen(struct 
parser_params*); -#define dyna_push() dyna_push_gen(parser) -static void dyna_pop_gen(struct parser_params*); -#define dyna_pop() dyna_pop_gen(parser) -static int dyna_in_block_gen(struct parser_params*); -#define dyna_in_block() dyna_in_block_gen(parser) -#define dyna_var(id) local_var(id) -static int dvar_defined_gen(struct parser_params*,ID); -#define dvar_defined(id) dvar_defined_gen(parser, id) -static int dvar_curr_gen(struct parser_params*,ID); -#define dvar_curr(id) dvar_curr_gen(parser, id) - -static void fixup_nodes(NODE **); - -extern int rb_dvar_defined(ID); -extern int rb_local_defined(ID); -extern int rb_parse_in_eval(void); - -static VALUE reg_compile_gen(struct parser_params*, VALUE, int); -#define reg_compile(str,options) reg_compile_gen(parser, str, options) -static void reg_fragment_setenc_gen(struct parser_params*, VALUE, int); -#define reg_fragment_setenc(str,options) reg_fragment_setenc_gen(parser, str, options) -static void reg_fragment_check_gen(struct parser_params*, VALUE, int); -#define reg_fragment_check(str,options) reg_fragment_check_gen(parser, str, options) -static NODE *reg_named_capture_assign_gen(struct parser_params* parser, VALUE regexp, NODE *match); -#define reg_named_capture_assign(regexp,match) reg_named_capture_assign_gen(parser,regexp,match) -int rb_enc_symname2_p(const char *, int, rb_encoding *); -#else -#define remove_begin(node) (node) -#endif /* !RIPPER */ -static int lvar_defined_gen(struct parser_params*, ID); -#define lvar_defined(id) lvar_defined_gen(parser, id) - -#define RE_OPTION_ONCE (1<<16) -#define RE_OPTION_ENCODING_SHIFT 8 -#define RE_OPTION_ENCODING(e) (((e)&0xff)<<RE_OPTION_ENCODING_SHIFT) -#define RE_OPTION_ENCODING_IDX(o) (((o)>>RE_OPTION_ENCODING_SHIFT)&0xff) -#define RE_OPTION_ENCODING_NONE(o) ((o)&RE_OPTION_ARG_ENCODING_NONE) -#define RE_OPTION_MASK 0xff -#define RE_OPTION_ARG_ENCODING_NONE 32 - -#define NODE_STRTERM NODE_ZARRAY /* nothing to gc */ -#define NODE_HEREDOC NODE_ARRAY /* 1, 3 to gc */ 
-#define SIGN_EXTEND(x,n) (((1<<(n)-1)^((x)&~(~0<<(n))))-(1<<(n)-1)) -#define nd_func u1.id -#if SIZEOF_SHORT == 2 -#define nd_term(node) ((signed short)(node)->u2.id) -#else -#define nd_term(node) SIGN_EXTEND((node)->u2.id, CHAR_BIT*2) -#endif -#define nd_paren(node) (char)((node)->u2.id >> CHAR_BIT*2) -#define nd_nest u3.cnt - -/****** Ripper *******/ - -#ifdef RIPPER -#define RIPPER_VERSION "0.1.0" - -#include "eventids1.c" -#include "eventids2.c" -static ID ripper_id_gets; - -static VALUE ripper_dispatch0(struct parser_params*,ID); -static VALUE ripper_dispatch1(struct parser_params*,ID,VALUE); -static VALUE ripper_dispatch2(struct parser_params*,ID,VALUE,VALUE); -static VALUE ripper_dispatch3(struct parser_params*,ID,VALUE,VALUE,VALUE); -static VALUE ripper_dispatch4(struct parser_params*,ID,VALUE,VALUE,VALUE,VALUE); -static VALUE ripper_dispatch5(struct parser_params*,ID,VALUE,VALUE,VALUE,VALUE,VALUE); - -#define dispatch0(n) ripper_dispatch0(parser, TOKEN_PASTE(ripper_id_, n)) -#define dispatch1(n,a) ripper_dispatch1(parser, TOKEN_PASTE(ripper_id_, n), a) -#define dispatch2(n,a,b) ripper_dispatch2(parser, TOKEN_PASTE(ripper_id_, n), a, b) -#define dispatch3(n,a,b,c) ripper_dispatch3(parser, TOKEN_PASTE(ripper_id_, n), a, b, c) -#define dispatch4(n,a,b,c,d) ripper_dispatch4(parser, TOKEN_PASTE(ripper_id_, n), a, b, c, d) -#define dispatch5(n,a,b,c,d,e) ripper_dispatch5(parser, TOKEN_PASTE(ripper_id_, n), a, b, c, d, e) - -#define yyparse ripper_yyparse - -static VALUE ripper_intern(const char*); -static VALUE ripper_id2sym(ID); -#ifdef __GNUC__ -#define ripper_id2sym(id) ((id) < 256 && rb_ispunct(id) ? \ - ID2SYM(id) : ripper_id2sym(id)) -#endif - -#define arg_new() dispatch0(args_new) -#define arg_add(l,a) dispatch2(args_add, l, a) -#define arg_prepend(l,a) dispatch2(args_prepend, l, a) -#define arg_add_star(l,a) dispatch2(args_add_star, l, a) -#define arg_add_block(l,b) dispatch2(args_add_block, l, b) -#define arg_add_optblock(l,b) ((b)==Qundef? 
l : dispatch2(args_add_block, l, b)) -#define bare_assoc(v) dispatch1(bare_assoc_hash, v) -#define arg_add_assocs(l,b) arg_add(l, bare_assoc(b)) - -#define args2mrhs(a) dispatch1(mrhs_new_from_args, a) -#define mrhs_new() dispatch0(mrhs_new) -#define mrhs_add(l,a) dispatch2(mrhs_add, l, a) -#define mrhs_add_star(l,a) dispatch2(mrhs_add_star, l, a) - -#define mlhs_new() dispatch0(mlhs_new) -#define mlhs_add(l,a) dispatch2(mlhs_add, l, a) -#define mlhs_add_star(l,a) dispatch2(mlhs_add_star, l, a) - -#define params_new(pars, opts, rest, pars2, blk) \ - dispatch5(params, pars, opts, rest, pars2, blk) - -#define blockvar_new(p,v) dispatch2(block_var, p, v) -#define blockvar_add_star(l,a) dispatch2(block_var_add_star, l, a) -#define blockvar_add_block(l,a) dispatch2(block_var_add_block, l, a) - -#define method_optarg(m,a) ((a)==Qundef ? m : dispatch2(method_add_arg,m,a)) -#define method_arg(m,a) dispatch2(method_add_arg,m,a) -#define method_add_block(m,b) dispatch2(method_add_block, m, b) - -#define escape_Qundef(x) ((x)==Qundef ? 
Qnil : (x)) - -#define FIXME 0 - -#endif /* RIPPER */ - -#ifndef RIPPER -# define ifndef_ripper(x) x -#else -# define ifndef_ripper(x) -#endif - -#ifndef RIPPER -# define rb_warn0(fmt) rb_compile_warn(ruby_sourcefile, ruby_sourceline, fmt) -# define rb_warnI(fmt,a) rb_compile_warn(ruby_sourcefile, ruby_sourceline, fmt, a) -# define rb_warnS(fmt,a) rb_compile_warn(ruby_sourcefile, ruby_sourceline, fmt, a) -# define rb_warning0(fmt) rb_compile_warning(ruby_sourcefile, ruby_sourceline, fmt) -# define rb_warningS(fmt,a) rb_compile_warning(ruby_sourcefile, ruby_sourceline, fmt, a) -#else -# define rb_warn0(fmt) ripper_warn0(parser, fmt) -# define rb_warnI(fmt,a) ripper_warnI(parser, fmt, a) -# define rb_warnS(fmt,a) ripper_warnS(parser, fmt, a) -# define rb_warning0(fmt) ripper_warning0(parser, fmt) -# define rb_warningS(fmt,a) ripper_warningS(parser, fmt, a) -static void ripper_warn0(struct parser_params*, const char*); -static void ripper_warnI(struct parser_params*, const char*, int); -#if 0 -static void ripper_warnS(struct parser_params*, const char*, const char*); -#endif -static void ripper_warning0(struct parser_params*, const char*); -static void ripper_warningS(struct parser_params*, const char*, const char*); -#endif - -#ifdef RIPPER -static void ripper_compile_error(struct parser_params*, const char *fmt, ...); -# define rb_compile_error ripper_compile_error -# define compile_error ripper_compile_error -# define PARSER_ARG parser, -#else -# define compile_error parser->nerr++,rb_compile_error -# define PARSER_ARG ruby_sourcefile, ruby_sourceline, -#endif - -/* Older versions of Yacc set YYMAXDEPTH to a very low value by default (150, - for instance). This is too low for Ruby to parse some files, such as - date/format.rb, therefore bump the value up to at least Bison's default. 
*/ -#ifdef OLD_YACC -#ifndef YYMAXDEPTH -#define YYMAXDEPTH 10000 -#endif -#endif - -%} - -%pure_parser -%parse-param {struct parser_params *parser} - -%union { - VALUE val; - NODE *node; - ID id; - int num; -} - -/*%%%*/ -%token -/*% -%token <val> -%*/ - keyword_class - keyword_module - keyword_def - keyword_undef - keyword_begin - keyword_rescue - keyword_ensure - keyword_end - keyword_if - keyword_unless - keyword_then - keyword_elsif - keyword_else - keyword_case - keyword_when - keyword_while - keyword_until - keyword_for - keyword_break - keyword_next - keyword_redo - keyword_retry - keyword_in - keyword_do - keyword_do_cond - keyword_do_block - keyword_do_LAMBDA - keyword_return - keyword_yield - keyword_super - keyword_self - keyword_nil - keyword_true - keyword_false - keyword_and - keyword_or - keyword_not - modifier_if - modifier_unless - modifier_while - modifier_until - modifier_rescue - keyword_alias - keyword_defined - keyword_BEGIN - keyword_END - keyword__LINE__ - keyword__FILE__ - keyword__ENCODING__ - -%token <id> tIDENTIFIER tFID tGVAR tIVAR tCONSTANT tCVAR tLABEL -%token <node> tINTEGER tFLOAT tSTRING_CONTENT tCHAR -%token <node> tNTH_REF tBACK_REF -%token <num> tREGEXP_END - -%type <node> singleton strings string string1 xstring regexp -%type <node> string_contents xstring_contents string_content -%type <node> words qwords word_list qword_list word -%type <node> literal numeric dsym cpath -%type <node> bodystmt compstmt stmts stmt expr arg primary command command_call method_call -%type <node> expr_value arg_value primary_value -%type <node> if_tail opt_else case_body cases opt_rescue exc_list exc_var opt_ensure -%type <node> args call_args opt_call_args -%type <node> paren_args opt_paren_args -%type <node> command_args aref_args opt_block_arg block_arg var_ref var_lhs -%type <node> mrhs superclass block_call block_command -%type <node> f_arglist f_args f_arg f_arg_item f_optarg f_marg f_marg_list f_margs -%type <node> assoc_list assocs assoc 
undef_list backref string_dvar for_var -%type <node> block_param opt_block_param block_param_def f_opt -%type <node> bv_decls opt_bv_decl bvar -%type <node> lambda f_larglist lambda_body -%type <node> brace_block cmd_brace_block do_block lhs none fitem -%type <node> mlhs mlhs_head mlhs_basic mlhs_item mlhs_node mlhs_post mlhs_inner -%type <id> fsym variable sym symbol operation operation2 operation3 -%type <id> cname fname op f_rest_arg f_block_arg opt_f_block_arg f_norm_arg f_bad_arg -/*%%%*/ -/*% -%type <val> program reswords then do dot_or_colon -%*/ -%token tUPLUS /* unary+ */ -%token tUMINUS /* unary- */ -%token tPOW /* ** */ -%token tCMP /* <=> */ -%token tEQ /* == */ -%token tEQQ /* === */ -%token tNEQ /* != */ -%token tGEQ /* >= */ -%token tLEQ /* <= */ -%token tANDOP tOROP /* && and || */ -%token tMATCH tNMATCH /* =~ and !~ */ -%token tDOT2 tDOT3 /* .. and ... */ -%token tAREF tASET /* [] and []= */ -%token tLSHFT tRSHFT /* << and >> */ -%token tCOLON2 /* :: */ -%token tCOLON3 /* :: at EXPR_BEG */ -%token <id> tOP_ASGN /* +=, -= etc. */ -%token tASSOC /* => */ -%token tLPAREN /* ( */ -%token tLPAREN_ARG /* ( */ -%token tRPAREN /* ) */ -%token tLBRACK /* [ */ -%token tLBRACE /* { */ -%token tLBRACE_ARG /* { */ -%token tSTAR /* * */ -%token tAMPER /* & */ -%token tLAMBDA /* -> */ -%token tSYMBEG tSTRING_BEG tXSTRING_BEG tREGEXP_BEG tWORDS_BEG tQWORDS_BEG -%token tSTRING_DBEG tSTRING_DVAR tSTRING_END tLAMBEG - -/* - * precedence table - */ - -%nonassoc tLOWEST -%nonassoc tLBRACE_ARG - -%nonassoc modifier_if modifier_unless modifier_while modifier_until -%left keyword_or keyword_and -%right keyword_not -%nonassoc keyword_defined -%right '=' tOP_ASGN -%left modifier_rescue -%right '?' ':' -%nonassoc tDOT2 tDOT3 -%left tOROP -%left tANDOP -%nonassoc tCMP tEQ tEQQ tNEQ tMATCH tNMATCH -%left '>' tGEQ '<' tLEQ -%left '|' '^' -%left '&' -%left tLSHFT tRSHFT -%left '+' '-' -%left '*' '/' '%' -%right tUMINUS_NUM tUMINUS -%right tPOW -%right '!' 
'~' tUPLUS - -%nonassoc idNULL -%nonassoc idRespond_to -%nonassoc idIFUNC -%nonassoc idCFUNC -%nonassoc idThrowState -%nonassoc id_core_set_method_alias -%nonassoc id_core_set_variable_alias -%nonassoc id_core_undef_method -%nonassoc id_core_define_method -%nonassoc id_core_define_singleton_method -%nonassoc id_core_set_postexe - -%token tLAST_TOKEN - -%% -program : { - lex_state = EXPR_BEG; - /*%%%*/ - local_push(compile_for_eval); - /*% - %*/ - } - compstmt - { - /*%%%*/ - if ($2 && !compile_for_eval) { - /* last expression should not be void */ - if (nd_type($2) != NODE_BLOCK) void_expr($2); - else { - NODE *node = $2; - while (node->nd_next) { - node = node->nd_next; - } - void_expr(node->nd_head); - } - } - ruby_eval_tree = NEW_SCOPE(0, block_append(ruby_eval_tree, $2)); - local_pop(); - /*% - $$ = $2; - parser->result = dispatch1(program, $$); - %*/ - } - ; - -bodystmt : compstmt - opt_rescue - opt_else - opt_ensure - { - /*%%%*/ - $$ = $1; - if ($2) { - $$ = NEW_RESCUE($1, $2, $3); - } - else if ($3) { - rb_warn0("else without rescue is useless"); - $$ = block_append($$, $3); - } - if ($4) { - if ($$) { - $$ = NEW_ENSURE($$, $4); - } - else { - $$ = block_append($4, NEW_NIL()); - } - } - fixpos($$, $1); - /*% - $$ = dispatch4(body_stmt, - escape_Qundef($1), - escape_Qundef($2), - escape_Qundef($3), - escape_Qundef($4)); - %*/ - } - ; - -compstmt : stmts opt_terms - { - /*%%%*/ - void_stmts($1); - fixup_nodes(&deferred_nodes); - /*% - %*/ - $$ = $1; - } - ; - -stmts : none - { - /*%%%*/ - $$ = NEW_BEGIN(0); - /*% - $$ = dispatch2(stmts_add, dispatch0(stmts_new), - dispatch0(void_stmt)); - %*/ - } - | stmt - { - /*%%%*/ - $$ = newline_node($1); - /*% - $$ = dispatch2(stmts_add, dispatch0(stmts_new), $1); - %*/ - } - | stmts terms stmt - { - /*%%%*/ - $$ = block_append($1, newline_node($3)); - /*% - $$ = dispatch2(stmts_add, $1, $3); - %*/ - } - | error stmt - { - $$ = remove_begin($2); - } - ; - -stmt : keyword_alias fitem {lex_state = EXPR_FNAME;} fitem - { - 
/*%%%*/ - $$ = NEW_ALIAS($2, $4); - /*% - $$ = dispatch2(alias, $2, $4); - %*/ - } - | keyword_alias tGVAR tGVAR - { - /*%%%*/ - $$ = NEW_VALIAS($2, $3); - /*% - $$ = dispatch2(var_alias, $2, $3); - %*/ - } - | keyword_alias tGVAR tBACK_REF - { - /*%%%*/ - char buf[3]; - - sprintf(buf, "$%c", (char)$3->nd_nth); - $$ = NEW_VALIAS($2, rb_intern(buf)); - /*% - $$ = dispatch2(var_alias, $2, $3); - %*/ - } - | keyword_alias tGVAR tNTH_REF - { - /*%%%*/ - yyerror("can't make alias for the number variables"); - $$ = NEW_BEGIN(0); - /*% - $$ = dispatch2(var_alias, $2, $3); - $$ = dispatch1(alias_error, $$); - %*/ - } - | keyword_undef undef_list - { - /*%%%*/ - $$ = $2; - /*% - $$ = dispatch1(undef, $2); - %*/ - } - | stmt modifier_if expr_value - { - /*%%%*/ - $$ = NEW_IF(cond($3), remove_begin($1), 0); - fixpos($$, $3); - /*% - $$ = dispatch2(if_mod, $3, $1); - %*/ - } - | stmt modifier_unless expr_value - { - /*%%%*/ - $$ = NEW_UNLESS(cond($3), remove_begin($1), 0); - fixpos($$, $3); - /*% - $$ = dispatch2(unless_mod, $3, $1); - %*/ - } - | stmt modifier_while expr_value - { - /*%%%*/ - if ($1 && nd_type($1) == NODE_BEGIN) { - $$ = NEW_WHILE(cond($3), $1->nd_body, 0); - } - else { - $$ = NEW_WHILE(cond($3), $1, 1); - } - /*% - $$ = dispatch2(while_mod, $3, $1); - %*/ - } - | stmt modifier_until expr_value - { - /*%%%*/ - if ($1 && nd_type($1) == NODE_BEGIN) { - $$ = NEW_UNTIL(cond($3), $1->nd_body, 0); - } - else { - $$ = NEW_UNTIL(cond($3), $1, 1); - } - /*% - $$ = dispatch2(until_mod, $3, $1); - %*/ - } - | stmt modifier_rescue stmt - { - /*%%%*/ - NODE *resq = NEW_RESBODY(0, remove_begin($3), 0); - $$ = NEW_RESCUE(remove_begin($1), resq, 0); - /*% - $$ = dispatch2(rescue_mod, $3, $1); - %*/ - } - | keyword_BEGIN - { - if (in_def || in_single) { - yyerror("BEGIN in method"); - } - /*%%%*/ - /* local_push(0); */ - /*% - %*/ - } - '{' compstmt '}' - { - /*%%%*/ - ruby_eval_tree_begin = block_append(ruby_eval_tree_begin, - $4); - /* NEW_PREEXE($4)); */ - /* local_pop(); 
*/ - $$ = 0; - /*% - $$ = dispatch1(BEGIN, $4); - %*/ - } - | keyword_END '{' compstmt '}' - { - if (in_def || in_single) { - rb_warn0("END in method; use at_exit"); - } - /*%%%*/ - $$ = NEW_POSTEXE(NEW_NODE( - NODE_SCOPE, 0 /* tbl */, $3 /* body */, 0 /* args */)); - /*% - $$ = dispatch1(END, $3); - %*/ - } - | lhs '=' command_call - { - /*%%%*/ - value_expr($3); - $$ = node_assign($1, $3); - /*% - $$ = dispatch2(assign, $1, $3); - %*/ - } - | mlhs '=' command_call - { - /*%%%*/ - value_expr($3); - $1->nd_value = $3; - $$ = $1; - /*% - $$ = dispatch2(massign, $1, $3); - %*/ - } - | var_lhs tOP_ASGN command_call - { - /*%%%*/ - value_expr($3); - if ($1) { - ID vid = $1->nd_vid; - if ($2 == tOROP) { - $1->nd_value = $3; - $$ = NEW_OP_ASGN_OR(gettable(vid), $1); - if (is_asgn_or_id(vid)) { - $$->nd_aid = vid; - } - } - else if ($2 == tANDOP) { - $1->nd_value = $3; - $$ = NEW_OP_ASGN_AND(gettable(vid), $1); - } - else { - $$ = $1; - $$->nd_value = NEW_CALL(gettable(vid), $2, NEW_LIST($3)); - } - } - else { - $$ = NEW_BEGIN(0); - } - /*% - $$ = dispatch3(opassign, $1, $2, $3); - %*/ - } - | primary_value '[' opt_call_args rbracket tOP_ASGN command_call - { - /*%%%*/ - NODE *args; - - value_expr($6); - if (!$3) $3 = NEW_ZARRAY(); - args = arg_concat($6, $3); - if ($5 == tOROP) { - $5 = 0; - } - else if ($5 == tANDOP) { - $5 = 1; - } - $$ = NEW_OP_ASGN1($1, $5, args); - fixpos($$, $1); - /*% - $$ = dispatch2(aref_field, $1, escape_Qundef($3)); - $$ = dispatch3(opassign, $$, $5, $6); - %*/ - } - | primary_value '.' tIDENTIFIER tOP_ASGN command_call - { - /*%%%*/ - value_expr($5); - if ($4 == tOROP) { - $4 = 0; - } - else if ($4 == tANDOP) { - $4 = 1; - } - $$ = NEW_OP_ASGN2($1, $3, $4, $5); - fixpos($$, $1); - /*% - $$ = dispatch3(field, $1, ripper_id2sym('.'), $3); - $$ = dispatch3(opassign, $$, $4, $5); - %*/ - } - | primary_value '.' 
tCONSTANT tOP_ASGN command_call - { - /*%%%*/ - value_expr($5); - if ($4 == tOROP) { - $4 = 0; - } - else if ($4 == tANDOP) { - $4 = 1; - } - $$ = NEW_OP_ASGN2($1, $3, $4, $5); - fixpos($$, $1); - /*% - $$ = dispatch3(field, $1, ripper_id2sym('.'), $3); - $$ = dispatch3(opassign, $$, $4, $5); - %*/ - } - | primary_value tCOLON2 tIDENTIFIER tOP_ASGN command_call - { - /*%%%*/ - value_expr($5); - if ($4 == tOROP) { - $4 = 0; - } - else if ($4 == tANDOP) { - $4 = 1; - } - $$ = NEW_OP_ASGN2($1, $3, $4, $5); - fixpos($$, $1); - /*% - $$ = dispatch3(field, $1, ripper_intern("::"), $3); - $$ = dispatch3(opassign, $$, $4, $5); - %*/ - } - | backref tOP_ASGN command_call - { - /*%%%*/ - rb_backref_error($1); - $$ = NEW_BEGIN(0); - /*% - $$ = dispatch2(assign, dispatch1(var_field, $1), $3); - $$ = dispatch1(assign_error, $$); - %*/ - } - | lhs '=' mrhs - { - /*%%%*/ - value_expr($3); - $$ = node_assign($1, $3); - /*% - $$ = dispatch2(assign, $1, $3); - %*/ - } - | mlhs '=' arg_value - { - /*%%%*/ - $1->nd_value = $3; - $$ = $1; - /*% - dispatch2(massign, $1, $3); - %*/ - } - | mlhs '=' mrhs - { - /*%%%*/ - $1->nd_value = $3; - $$ = $1; - /*% - $$ = dispatch2(massign, $1, $3); - %*/ - } - | expr - ; - -expr : command_call - | expr keyword_and expr - { - /*%%%*/ - $$ = logop(NODE_AND, $1, $3); - /*% - $$ = dispatch3(binary, $1, ripper_intern("and"), $3); - %*/ - } - | expr keyword_or expr - { - /*%%%*/ - $$ = logop(NODE_OR, $1, $3); - /*% - $$ = dispatch3(binary, $1, ripper_intern("or"), $3); - %*/ - } - | keyword_not expr - { - /*%%%*/ - $$ = call_uni_op(cond($2), '!'); - /*% - $$ = dispatch2(unary, ripper_intern("not"), $2); - %*/ - } - | '!' 
command_call - { - /*%%%*/ - $$ = call_uni_op(cond($2), '!'); - /*% - $$ = dispatch2(unary, ripper_id2sym('!'), $2); - %*/ - } - | arg - ; - -expr_value : expr - { - /*%%%*/ - value_expr($1); - $$ = $1; - if (!$$) $$ = NEW_NIL(); - /*% - $$ = $1; - %*/ - } - ; - -command_call : command - | block_command - | keyword_return call_args - { - /*%%%*/ - $$ = NEW_RETURN(ret_args($2)); - /*% - $$ = dispatch1(return, $2); - %*/ - } - | keyword_break call_args - { - /*%%%*/ - $$ = NEW_BREAK(ret_args($2)); - /*% - $$ = dispatch1(break, $2); - %*/ - } - | keyword_next call_args - { - /*%%%*/ - $$ = NEW_NEXT(ret_args($2)); - /*% - $$ = dispatch1(next, $2); - %*/ - } - ; - -block_command : block_call - | block_call '.' operation2 command_args - { - /*%%%*/ - $$ = NEW_CALL($1, $3, $4); - /*% - $$ = dispatch3(call, $1, ripper_id2sym('.'), $3); - $$ = method_arg($$, $4); - %*/ - } - | block_call tCOLON2 operation2 command_args - { - /*%%%*/ - $$ = NEW_CALL($1, $3, $4); - /*% - $$ = dispatch3(call, $1, ripper_intern("::"), $3); - $$ = method_arg($$, $4); - %*/ - } - ; - -cmd_brace_block : tLBRACE_ARG - { - /*%%%*/ - dyna_push(); - $<num>$ = ruby_sourceline; - /*% - %*/ - } - opt_block_param - compstmt - '}' - { - /*%%%*/ - $$ = NEW_ITER($3,$4); - nd_set_line($$, $<num>2); - dyna_pop(); - /*% - $$ = dispatch2(brace_block, escape_Qundef($3), $4); - %*/ - } - ; - -command : operation command_args %prec tLOWEST - { - /*%%%*/ - $$ = NEW_FCALL($1, $2); - fixpos($$, $2); - /*% - $$ = dispatch2(command, $1, $2); - %*/ - } - | operation command_args cmd_brace_block - { - /*%%%*/ - block_dup_check($2,$3); - $3->nd_iter = NEW_FCALL($1, $2); - $$ = $3; - fixpos($$, $2); - /*% - $$ = dispatch2(command, $1, $2); - $$ = method_add_block($$, $3); - %*/ - } - | primary_value '.' operation2 command_args %prec tLOWEST - { - /*%%%*/ - $$ = NEW_CALL($1, $3, $4); - fixpos($$, $1); - /*% - $$ = dispatch4(command_call, $1, ripper_id2sym('.'), $3, $4); - %*/ - } - | primary_value '.' 
operation2 command_args cmd_brace_block - { - /*%%%*/ - block_dup_check($4,$5); - $5->nd_iter = NEW_CALL($1, $3, $4); - $$ = $5; - fixpos($$, $1); - /*% - $$ = dispatch4(command_call, $1, ripper_id2sym('.'), $3, $4); - $$ = method_add_block($$, $5); - %*/ - } - | primary_value tCOLON2 operation2 command_args %prec tLOWEST - { - /*%%%*/ - $$ = NEW_CALL($1, $3, $4); - fixpos($$, $1); - /*% - $$ = dispatch4(command_call, $1, ripper_intern("::"), $3, $4); - %*/ - } - | primary_value tCOLON2 operation2 command_args cmd_brace_block - { - /*%%%*/ - block_dup_check($4,$5); - $5->nd_iter = NEW_CALL($1, $3, $4); - $$ = $5; - fixpos($$, $1); - /*% - $$ = dispatch4(command_call, $1, ripper_intern("::"), $3, $4); - $$ = method_add_block($$, $5); - %*/ - } - | keyword_super command_args - { - /*%%%*/ - $$ = NEW_SUPER($2); - fixpos($$, $2); - /*% - $$ = dispatch1(super, $2); - %*/ - } - | keyword_yield command_args - { - /*%%%*/ - $$ = new_yield($2); - fixpos($$, $2); - /*% - $$ = dispatch1(yield, $2); - %*/ - } - ; - -mlhs : mlhs_basic - | tLPAREN mlhs_inner rparen - { - /*%%%*/ - $$ = $2; - /*% - $$ = dispatch1(mlhs_paren, $2); - %*/ - } - ; - -mlhs_inner : mlhs_basic - | tLPAREN mlhs_inner rparen - { - /*%%%*/ - $$ = NEW_MASGN(NEW_LIST($2), 0); - /*% - $$ = dispatch1(mlhs_paren, $2); - %*/ - } - ; - -mlhs_basic : mlhs_head - { - /*%%%*/ - $$ = NEW_MASGN($1, 0); - /*% - $$ = $1; - %*/ - } - | mlhs_head mlhs_item - { - /*%%%*/ - $$ = NEW_MASGN(list_append($1,$2), 0); - /*% - $$ = mlhs_add($1, $2); - %*/ - } - | mlhs_head tSTAR mlhs_node - { - /*%%%*/ - $$ = NEW_MASGN($1, $3); - /*% - $$ = mlhs_add_star($1, $3); - %*/ - } - | mlhs_head tSTAR mlhs_node ',' mlhs_post - { - /*%%%*/ - $$ = NEW_MASGN($1, NEW_POSTARG($3,$5)); - /*% - $$ = mlhs_add_star($1, $3); - %*/ - } - | mlhs_head tSTAR - { - /*%%%*/ - $$ = NEW_MASGN($1, -1); - /*% - $$ = mlhs_add_star($1, Qnil); - %*/ - } - | mlhs_head tSTAR ',' mlhs_post - { - /*%%%*/ - $$ = NEW_MASGN($1, NEW_POSTARG(-1, $4)); - /*% - $$ = 
mlhs_add_star($1, Qnil); - %*/ - } - | tSTAR mlhs_node - { - /*%%%*/ - $$ = NEW_MASGN(0, $2); - /*% - $$ = mlhs_add_star(mlhs_new(), $2); - %*/ - } - | tSTAR mlhs_node ',' mlhs_post - { - /*%%%*/ - $$ = NEW_MASGN(0, NEW_POSTARG($2,$4)); - /*% - $$ = mlhs_add_star(mlhs_new(), $2); - %*/ - } - | tSTAR - { - /*%%%*/ - $$ = NEW_MASGN(0, -1); - /*% - $$ = mlhs_add_star(mlhs_new(), Qnil); - %*/ - } - | tSTAR ',' mlhs_post - { - /*%%%*/ - $$ = NEW_MASGN(0, NEW_POSTARG(-1, $3)); - /*% - $$ = mlhs_add_star(mlhs_new(), Qnil); - %*/ - } - ; - -mlhs_item : mlhs_node - | tLPAREN mlhs_inner rparen - { - /*%%%*/ - $$ = $2; - /*% - $$ = dispatch1(mlhs_paren, $2); - %*/ - } - ; - -mlhs_head : mlhs_item ',' - { - /*%%%*/ - $$ = NEW_LIST($1); - /*% - $$ = mlhs_add(mlhs_new(), $1); - %*/ - } - | mlhs_head mlhs_item ',' - { - /*%%%*/ - $$ = list_append($1, $2); - /*% - $$ = mlhs_add($1, $2); - %*/ - } - ; - -mlhs_post : mlhs_item - { - /*%%%*/ - $$ = NEW_LIST($1); - /*% - $$ = mlhs_add(mlhs_new(), $1); - %*/ - } - | mlhs_post ',' mlhs_item - { - /*%%%*/ - $$ = list_append($1, $3); - /*% - $$ = mlhs_add($1, $3); - %*/ - } - ; - -mlhs_node : variable - { - /*%%%*/ - $$ = assignable($1, 0); - /*% - $$ = $1; - %*/ - } - | primary_value '[' opt_call_args rbracket - { - /*%%%*/ - $$ = aryset($1, $3); - /*% - $$ = dispatch2(aref_field, $1, escape_Qundef($3)); - %*/ - } - | primary_value '.' tIDENTIFIER - { - /*%%%*/ - $$ = attrset($1, $3); - /*% - $$ = dispatch3(field, $1, ripper_id2sym('.'), $3); - %*/ - } - | primary_value tCOLON2 tIDENTIFIER - { - /*%%%*/ - $$ = attrset($1, $3); - /*% - $$ = dispatch2(const_path_field, $1, $3); - %*/ - } - | primary_value '.' 
tCONSTANT - { - /*%%%*/ - $$ = attrset($1, $3); - /*% - $$ = dispatch3(field, $1, ripper_id2sym('.'), $3); - %*/ - } - | primary_value tCOLON2 tCONSTANT - { - /*%%%*/ - if (in_def || in_single) - yyerror("dynamic constant assignment"); - $$ = NEW_CDECL(0, 0, NEW_COLON2($1, $3)); - /*% - if (in_def || in_single) - yyerror("dynamic constant assignment"); - $$ = dispatch2(const_path_field, $1, $3); - %*/ - } - | tCOLON3 tCONSTANT - { - /*%%%*/ - if (in_def || in_single) - yyerror("dynamic constant assignment"); - $$ = NEW_CDECL(0, 0, NEW_COLON3($2)); - /*% - $$ = dispatch1(top_const_field, $2); - %*/ - } - | backref - { - /*%%%*/ - rb_backref_error($1); - $$ = NEW_BEGIN(0); - /*% - $$ = dispatch1(var_field, $1); - $$ = dispatch1(assign_error, $$); - %*/ - } - ; - -lhs : variable - { - /*%%%*/ - if (!($$ = assignable($1, 0))) $$ = NEW_BEGIN(0); - /*% - $$ = dispatch1(var_field, $1); - %*/ - } - | primary_value '[' opt_call_args rbracket - { - /*%%%*/ - $$ = aryset($1, $3); - /*% - $$ = dispatch2(aref_field, $1, escape_Qundef($3)); - %*/ - } - | primary_value '.' tIDENTIFIER - { - /*%%%*/ - $$ = attrset($1, $3); - /*% - $$ = dispatch3(field, $1, ripper_id2sym('.'), $3); - %*/ - } - | primary_value tCOLON2 tIDENTIFIER - { - /*%%%*/ - $$ = attrset($1, $3); - /*% - $$ = dispatch3(field, $1, ripper_intern("::"), $3); - %*/ - } - | primary_value '.' 
tCONSTANT - { - /*%%%*/ - $$ = attrset($1, $3); - /*% - $$ = dispatch3(field, $1, ripper_id2sym('.'), $3); - %*/ - } - | primary_value tCOLON2 tCONSTANT - { - /*%%%*/ - if (in_def || in_single) - yyerror("dynamic constant assignment"); - $$ = NEW_CDECL(0, 0, NEW_COLON2($1, $3)); - /*% - $$ = dispatch2(const_path_field, $1, $3); - if (in_def || in_single) { - $$ = dispatch1(assign_error, $$); - } - %*/ - } - | tCOLON3 tCONSTANT - { - /*%%%*/ - if (in_def || in_single) - yyerror("dynamic constant assignment"); - $$ = NEW_CDECL(0, 0, NEW_COLON3($2)); - /*% - $$ = dispatch1(top_const_field, $2); - if (in_def || in_single) { - $$ = dispatch1(assign_error, $$); - } - %*/ - } - | backref - { - /*%%%*/ - rb_backref_error($1); - $$ = NEW_BEGIN(0); - /*% - $$ = dispatch1(assign_error, $1); - %*/ - } - ; - -cname : tIDENTIFIER - { - /*%%%*/ - yyerror("class/module name must be CONSTANT"); - /*% - $$ = dispatch1(class_name_error, $1); - %*/ - } - | tCONSTANT - ; - -cpath : tCOLON3 cname - { - /*%%%*/ - $$ = NEW_COLON3($2); - /*% - $$ = dispatch1(top_const_ref, $2); - %*/ - } - | cname - { - /*%%%*/ - $$ = NEW_COLON2(0, $$); - /*% - $$ = dispatch1(const_ref, $1); - %*/ - } - | primary_value tCOLON2 cname - { - /*%%%*/ - $$ = NEW_COLON2($1, $3); - /*% - $$ = dispatch2(const_path_ref, $1, $3); - %*/ - } - ; - -fname : tIDENTIFIER - | tCONSTANT - | tFID - | op - { - /*%%%*/ - lex_state = EXPR_END; - $$ = $1; - /*% - lex_state = EXPR_END; - $$ = $1; - %*/ - } - | reswords - { - /*%%%*/ - lex_state = EXPR_END; - $$ = $<id>1; - /*% - lex_state = EXPR_END; - $$ = $1; - %*/ - } - ; - -fsym : fname - | symbol - ; - -fitem : fsym - { - /*%%%*/ - $$ = NEW_LIT(ID2SYM($1)); - /*% - $$ = dispatch1(symbol_literal, $1); - %*/ - } - | dsym - ; - -undef_list : fitem - { - /*%%%*/ - $$ = NEW_UNDEF($1); - /*% - $$ = rb_ary_new3(1, $1); - %*/ - } - | undef_list ',' {lex_state = EXPR_FNAME;} fitem - { - /*%%%*/ - $$ = block_append($1, NEW_UNDEF($4)); - /*% - rb_ary_push($1, $4); - %*/ - } - ; - -op 
: '|' { ifndef_ripper($$ = '|'); } - | '^' { ifndef_ripper($$ = '^'); } - | '&' { ifndef_ripper($$ = '&'); } - | tCMP { ifndef_ripper($$ = tCMP); } - | tEQ { ifndef_ripper($$ = tEQ); } - | tEQQ { ifndef_ripper($$ = tEQQ); } - | tMATCH { ifndef_ripper($$ = tMATCH); } - | tNMATCH { ifndef_ripper($$ = tNMATCH); } - | '>' { ifndef_ripper($$ = '>'); } - | tGEQ { ifndef_ripper($$ = tGEQ); } - | '<' { ifndef_ripper($$ = '<'); } - | tLEQ { ifndef_ripper($$ = tLEQ); } - | tNEQ { ifndef_ripper($$ = tNEQ); } - | tLSHFT { ifndef_ripper($$ = tLSHFT); } - | tRSHFT { ifndef_ripper($$ = tRSHFT); } - | '+' { ifndef_ripper($$ = '+'); } - | '-' { ifndef_ripper($$ = '-'); } - | '*' { ifndef_ripper($$ = '*'); } - | tSTAR { ifndef_ripper($$ = '*'); } - | '/' { ifndef_ripper($$ = '/'); } - | '%' { ifndef_ripper($$ = '%'); } - | tPOW { ifndef_ripper($$ = tPOW); } - | '!' { ifndef_ripper($$ = '!'); } - | '~' { ifndef_ripper($$ = '~'); } - | tUPLUS { ifndef_ripper($$ = tUPLUS); } - | tUMINUS { ifndef_ripper($$ = tUMINUS); } - | tAREF { ifndef_ripper($$ = tAREF); } - | tASET { ifndef_ripper($$ = tASET); } - | '`' { ifndef_ripper($$ = '`'); } - ; - -reswords : keyword__LINE__ | keyword__FILE__ | keyword__ENCODING__ - | keyword_BEGIN | keyword_END - | keyword_alias | keyword_and | keyword_begin - | keyword_break | keyword_case | keyword_class | keyword_def - | keyword_defined | keyword_do | keyword_else | keyword_elsif - | keyword_end | keyword_ensure | keyword_false - | keyword_for | keyword_in | keyword_module | keyword_next - | keyword_nil | keyword_not | keyword_or | keyword_redo - | keyword_rescue | keyword_retry | keyword_return | keyword_self - | keyword_super | keyword_then | keyword_true | keyword_undef - | keyword_when | keyword_yield | keyword_if | keyword_unless - | keyword_while | keyword_until - ; - -arg : lhs '=' arg - { - /*%%%*/ - value_expr($3); - $$ = node_assign($1, $3); - /*% - $$ = dispatch2(assign, $1, $3); - %*/ - } - | lhs '=' arg modifier_rescue arg - { - /*%%%*/ - 
value_expr($3); - $3 = NEW_RESCUE($3, NEW_RESBODY(0,$5,0), 0); - $$ = node_assign($1, $3); - /*% - $$ = dispatch2(assign, $1, dispatch2(rescue_mod, $3, $5)); - %*/ - } - | var_lhs tOP_ASGN arg - { - /*%%%*/ - value_expr($3); - if ($1) { - ID vid = $1->nd_vid; - if ($2 == tOROP) { - $1->nd_value = $3; - $$ = NEW_OP_ASGN_OR(gettable(vid), $1); - if (is_asgn_or_id(vid)) { - $$->nd_aid = vid; - } - } - else if ($2 == tANDOP) { - $1->nd_value = $3; - $$ = NEW_OP_ASGN_AND(gettable(vid), $1); - } - else { - $$ = $1; - $$->nd_value = NEW_CALL(gettable(vid), $2, NEW_LIST($3)); - } - } - else { - $$ = NEW_BEGIN(0); - } - /*% - $$ = dispatch3(opassign, $1, $2, $3); - %*/ - } - | var_lhs tOP_ASGN arg modifier_rescue arg - { - /*%%%*/ - value_expr($3); - $3 = NEW_RESCUE($3, NEW_RESBODY(0,$5,0), 0); - if ($1) { - ID vid = $1->nd_vid; - if ($2 == tOROP) { - $1->nd_value = $3; - $$ = NEW_OP_ASGN_OR(gettable(vid), $1); - if (is_asgn_or_id(vid)) { - $$->nd_aid = vid; - } - } - else if ($2 == tANDOP) { - $1->nd_value = $3; - $$ = NEW_OP_ASGN_AND(gettable(vid), $1); - } - else { - $$ = $1; - $$->nd_value = NEW_CALL(gettable(vid), $2, NEW_LIST($3)); - } - } - else { - $$ = NEW_BEGIN(0); - } - /*% - $3 = dispatch2(rescue_mod, $3, $5); - $$ = dispatch3(opassign, $1, $2, $3); - %*/ - } - | primary_value '[' opt_call_args rbracket tOP_ASGN arg - { - /*%%%*/ - NODE *args; - - value_expr($6); - if (!$3) $3 = NEW_ZARRAY(); - args = arg_concat($6, $3); - if ($5 == tOROP) { - $5 = 0; - } - else if ($5 == tANDOP) { - $5 = 1; - } - $$ = NEW_OP_ASGN1($1, $5, args); - fixpos($$, $1); - /*% - $1 = dispatch2(aref_field, $1, escape_Qundef($3)); - $$ = dispatch3(opassign, $1, $5, $6); - %*/ - } - | primary_value '.' 
tIDENTIFIER tOP_ASGN arg - { - /*%%%*/ - value_expr($5); - if ($4 == tOROP) { - $4 = 0; - } - else if ($4 == tANDOP) { - $4 = 1; - } - $$ = NEW_OP_ASGN2($1, $3, $4, $5); - fixpos($$, $1); - /*% - $1 = dispatch3(field, $1, ripper_id2sym('.'), $3); - $$ = dispatch3(opassign, $1, $4, $5); - %*/ - } - | primary_value '.' tCONSTANT tOP_ASGN arg - { - /*%%%*/ - value_expr($5); - if ($4 == tOROP) { - $4 = 0; - } - else if ($4 == tANDOP) { - $4 = 1; - } - $$ = NEW_OP_ASGN2($1, $3, $4, $5); - fixpos($$, $1); - /*% - $1 = dispatch3(field, $1, ripper_id2sym('.'), $3); - $$ = dispatch3(opassign, $1, $4, $5); - %*/ - } - | primary_value tCOLON2 tIDENTIFIER tOP_ASGN arg - { - /*%%%*/ - value_expr($5); - if ($4 == tOROP) { - $4 = 0; - } - else if ($4 == tANDOP) { - $4 = 1; - } - $$ = NEW_OP_ASGN2($1, $3, $4, $5); - fixpos($$, $1); - /*% - $1 = dispatch3(field, $1, ripper_intern("::"), $3); - $$ = dispatch3(opassign, $1, $4, $5); - %*/ - } - | primary_value tCOLON2 tCONSTANT tOP_ASGN arg - { - /*%%%*/ - yyerror("constant re-assignment"); - $$ = NEW_BEGIN(0); - /*% - $$ = dispatch2(const_path_field, $1, $3); - $$ = dispatch3(opassign, $$, $4, $5); - $$ = dispatch1(assign_error, $$); - %*/ - } - | tCOLON3 tCONSTANT tOP_ASGN arg - { - /*%%%*/ - yyerror("constant re-assignment"); - $$ = NEW_BEGIN(0); - /*% - $$ = dispatch1(top_const_field, $2); - $$ = dispatch3(opassign, $$, $3, $4); - $$ = dispatch1(assign_error, $$); - %*/ - } - | backref tOP_ASGN arg - { - /*%%%*/ - rb_backref_error($1); - $$ = NEW_BEGIN(0); - /*% - $$ = dispatch1(var_field, $1); - $$ = dispatch3(opassign, $$, $2, $3); - $$ = dispatch1(assign_error, $$); - %*/ - } - | arg tDOT2 arg - { - /*%%%*/ - value_expr($1); - value_expr($3); - $$ = NEW_DOT2($1, $3); - if (nd_type($1) == NODE_LIT && FIXNUM_P($1->nd_lit) && - nd_type($3) == NODE_LIT && FIXNUM_P($3->nd_lit)) { - deferred_nodes = list_append(deferred_nodes, $$); - } - /*% - $$ = dispatch2(dot2, $1, $3); - %*/ - } - | arg tDOT3 arg - { - /*%%%*/ - value_expr($1); 
- value_expr($3); - $$ = NEW_DOT3($1, $3); - if (nd_type($1) == NODE_LIT && FIXNUM_P($1->nd_lit) && - nd_type($3) == NODE_LIT && FIXNUM_P($3->nd_lit)) { - deferred_nodes = list_append(deferred_nodes, $$); - } - /*% - $$ = dispatch2(dot3, $1, $3); - %*/ - } - | arg '+' arg - { - /*%%%*/ - $$ = call_bin_op($1, '+', $3); - /*% - $$ = dispatch3(binary, $1, ID2SYM('+'), $3); - %*/ - } - | arg '-' arg - { - /*%%%*/ - $$ = call_bin_op($1, '-', $3); - /*% - $$ = dispatch3(binary, $1, ID2SYM('-'), $3); - %*/ - } - | arg '*' arg - { - /*%%%*/ - $$ = call_bin_op($1, '*', $3); - /*% - $$ = dispatch3(binary, $1, ID2SYM('*'), $3); - %*/ - } - | arg '/' arg - { - /*%%%*/ - $$ = call_bin_op($1, '/', $3); - /*% - $$ = dispatch3(binary, $1, ID2SYM('/'), $3); - %*/ - } - | arg '%' arg - { - /*%%%*/ - $$ = call_bin_op($1, '%', $3); - /*% - $$ = dispatch3(binary, $1, ID2SYM('%'), $3); - %*/ - } - | arg tPOW arg - { - /*%%%*/ - $$ = call_bin_op($1, tPOW, $3); - /*% - $$ = dispatch3(binary, $1, ripper_intern("**"), $3); - %*/ - } - | tUMINUS_NUM tINTEGER tPOW arg - { - /*%%%*/ - $$ = NEW_CALL(call_bin_op($2, tPOW, $4), tUMINUS, 0); - /*% - $$ = dispatch3(binary, $2, ripper_intern("**"), $4); - $$ = dispatch2(unary, ripper_intern("-@"), $$); - %*/ - } - | tUMINUS_NUM tFLOAT tPOW arg - { - /*%%%*/ - $$ = NEW_CALL(call_bin_op($2, tPOW, $4), tUMINUS, 0); - /*% - $$ = dispatch3(binary, $2, ripper_intern("**"), $4); - $$ = dispatch2(unary, ripper_intern("-@"), $$); - %*/ - } - | tUPLUS arg - { - /*%%%*/ - $$ = call_uni_op($2, tUPLUS); - /*% - $$ = dispatch2(unary, ripper_intern("+@"), $2); - %*/ - } - | tUMINUS arg - { - /*%%%*/ - $$ = call_uni_op($2, tUMINUS); - /*% - $$ = dispatch2(unary, ripper_intern("-@"), $2); - %*/ - } - | arg '|' arg - { - /*%%%*/ - $$ = call_bin_op($1, '|', $3); - /*% - $$ = dispatch3(binary, $1, ID2SYM('|'), $3); - %*/ - } - | arg '^' arg - { - /*%%%*/ - $$ = call_bin_op($1, '^', $3); - /*% - $$ = dispatch3(binary, $1, ID2SYM('^'), $3); - %*/ - } - | arg '&' arg - { 
- /*%%%*/ - $$ = call_bin_op($1, '&', $3); - /*% - $$ = dispatch3(binary, $1, ID2SYM('&'), $3); - %*/ - } - | arg tCMP arg - { - /*%%%*/ - $$ = call_bin_op($1, tCMP, $3); - /*% - $$ = dispatch3(binary, $1, ripper_intern("<=>"), $3); - %*/ - } - | arg '>' arg - { - /*%%%*/ - $$ = call_bin_op($1, '>', $3); - /*% - $$ = dispatch3(binary, $1, ID2SYM('>'), $3); - %*/ - } - | arg tGEQ arg - { - /*%%%*/ - $$ = call_bin_op($1, tGEQ, $3); - /*% - $$ = dispatch3(binary, $1, ripper_intern(">="), $3); - %*/ - } - | arg '<' arg - { - /*%%%*/ - $$ = call_bin_op($1, '<', $3); - /*% - $$ = dispatch3(binary, $1, ID2SYM('<'), $3); - %*/ - } - | arg tLEQ arg - { - /*%%%*/ - $$ = call_bin_op($1, tLEQ, $3); - /*% - $$ = dispatch3(binary, $1, ripper_intern("<="), $3); - %*/ - } - | arg tEQ arg - { - /*%%%*/ - $$ = call_bin_op($1, tEQ, $3); - /*% - $$ = dispatch3(binary, $1, ripper_intern("=="), $3); - %*/ - } - | arg tEQQ arg - { - /*%%%*/ - $$ = call_bin_op($1, tEQQ, $3); - /*% - $$ = dispatch3(binary, $1, ripper_intern("==="), $3); - %*/ - } - | arg tNEQ arg - { - /*%%%*/ - $$ = call_bin_op($1, tNEQ, $3); - /*% - $$ = dispatch3(binary, $1, ripper_intern("!="), $3); - %*/ - } - | arg tMATCH arg - { - /*%%%*/ - $$ = match_op($1, $3); - if (nd_type($1) == NODE_LIT && TYPE($1->nd_lit) == T_REGEXP) { - $$ = reg_named_capture_assign($1->nd_lit, $$); - } - /*% - $$ = dispatch3(binary, $1, ripper_intern("=~"), $3); - %*/ - } - | arg tNMATCH arg - { - /*%%%*/ - $$ = call_bin_op($1, tNMATCH, $3); - /*% - $$ = dispatch3(binary, $1, ripper_intern("!~"), $3); - %*/ - } - | '!' 
arg - { - /*%%%*/ - $$ = call_uni_op(cond($2), '!'); - /*% - $$ = dispatch2(unary, ID2SYM('!'), $2); - %*/ - } - | '~' arg - { - /*%%%*/ - $$ = call_uni_op($2, '~'); - /*% - $$ = dispatch2(unary, ID2SYM('~'), $2); - %*/ - } - | arg tLSHFT arg - { - /*%%%*/ - $$ = call_bin_op($1, tLSHFT, $3); - /*% - $$ = dispatch3(binary, $1, ripper_intern("<<"), $3); - %*/ - } - | arg tRSHFT arg - { - /*%%%*/ - $$ = call_bin_op($1, tRSHFT, $3); - /*% - $$ = dispatch3(binary, $1, ripper_intern(">>"), $3); - %*/ - } - | arg tANDOP arg - { - /*%%%*/ - $$ = logop(NODE_AND, $1, $3); - /*% - $$ = dispatch3(binary, $1, ripper_intern("&&"), $3); - %*/ - } - | arg tOROP arg - { - /*%%%*/ - $$ = logop(NODE_OR, $1, $3); - /*% - $$ = dispatch3(binary, $1, ripper_intern("||"), $3); - %*/ - } - | keyword_defined opt_nl {in_defined = 1;} arg - { - /*%%%*/ - in_defined = 0; - $$ = NEW_DEFINED($4); - /*% - in_defined = 0; - $$ = dispatch1(defined, $4); - %*/ - } - | arg '?' arg opt_nl ':' arg - { - /*%%%*/ - value_expr($1); - $$ = NEW_IF(cond($1), $3, $6); - fixpos($$, $1); - /*% - $$ = dispatch3(ifop, $1, $3, $6); - %*/ - } - | primary - { - $$ = $1; - } - ; - -arg_value : arg - { - /*%%%*/ - value_expr($1); - $$ = $1; - if (!$$) $$ = NEW_NIL(); - /*% - $$ = $1; - %*/ - } - ; - -aref_args : none - | args trailer - { - $$ = $1; - } - | args ',' assocs trailer - { - /*%%%*/ - $$ = arg_append($1, NEW_HASH($3)); - /*% - $$ = arg_add_assocs($1, $3); - %*/ - } - | assocs trailer - { - /*%%%*/ - $$ = NEW_LIST(NEW_HASH($1)); - /*% - $$ = arg_add_assocs(arg_new(), $1); - %*/ - } - ; - -paren_args : '(' opt_call_args rparen - { - /*%%%*/ - $$ = $2; - /*% - $$ = dispatch1(arg_paren, escape_Qundef($2)); - %*/ - } - ; - -opt_paren_args : none - | paren_args - ; - -opt_call_args : none - | call_args - ; - -call_args : command - { - /*%%%*/ - $$ = NEW_LIST($1); - /*% - $$ = arg_add(arg_new(), $1); - %*/ - } - | args opt_block_arg - { - /*%%%*/ - $$ = arg_blk_pass($1, $2); - /*% - $$ = arg_add_optblock($1, $2); 
- %*/ - } - | assocs opt_block_arg - { - /*%%%*/ - $$ = NEW_LIST(NEW_HASH($1)); - $$ = arg_blk_pass($$, $2); - /*% - $$ = arg_add_assocs(arg_new(), $1); - $$ = arg_add_optblock($$, $2); - %*/ - } - | args ',' assocs opt_block_arg - { - /*%%%*/ - $$ = arg_append($1, NEW_HASH($3)); - $$ = arg_blk_pass($$, $4); - /*% - $$ = arg_add_optblock(arg_add_assocs($1, $3), $4); - %*/ - } - | block_arg - /*%c%*/ - /*%c - { - $$ = arg_add_block(arg_new(), $1); - } - %*/ - ; - -command_args : { - $<num>$ = cmdarg_stack; - CMDARG_PUSH(1); - } - call_args - { - /* CMDARG_POP() */ - cmdarg_stack = $<num>1; - $$ = $2; - } - ; - -block_arg : tAMPER arg_value - { - /*%%%*/ - $$ = NEW_BLOCK_PASS($2); - /*% - $$ = $2; - %*/ - } - ; - -opt_block_arg : ',' block_arg - { - $$ = $2; - } - | none - { - $$ = 0; - } - ; - -args : arg_value - { - /*%%%*/ - $$ = NEW_LIST($1); - /*% - $$ = arg_add(arg_new(), $1); - %*/ - } - | tSTAR arg_value - { - /*%%%*/ - $$ = NEW_SPLAT($2); - /*% - $$ = arg_add_star(arg_new(), $2); - %*/ - } - | args ',' arg_value - { - /*%%%*/ - NODE *n1; - if ((n1 = splat_array($1)) != 0) { - $$ = list_append(n1, $3); - } - else { - $$ = arg_append($1, $3); - } - /*% - $$ = arg_add($1, $3); - %*/ - } - | args ',' tSTAR arg_value - { - /*%%%*/ - NODE *n1; - if (nd_type($4) == NODE_ARRAY && - (n1 = splat_array($1)) != 0) { - $$ = list_concat(n1, $4); - } - else { - $$ = arg_concat($1, $4); - } - /*% - $$ = arg_add_star($1, $4); - %*/ - } - ; - -mrhs : args ',' arg_value - { - /*%%%*/ - NODE *n1; - if ((n1 = splat_array($1)) != 0) { - $$ = list_append(n1, $3); - } - else { - $$ = arg_append($1, $3); - } - /*% - $$ = mrhs_add(args2mrhs($1), $3); - %*/ - } - | args ',' tSTAR arg_value - { - /*%%%*/ - NODE *n1; - if (nd_type($4) == NODE_ARRAY && - (n1 = splat_array($1)) != 0) { - $$ = list_concat(n1, $4); - } - else { - $$ = arg_concat($1, $4); - } - /*% - $$ = mrhs_add_star(args2mrhs($1), $4); - %*/ - } - | tSTAR arg_value - { - /*%%%*/ - $$ = NEW_SPLAT($2); - /*% - $$ = 
mrhs_add_star(mrhs_new(), $2); - %*/ - } - ; - -primary : literal - | strings - | xstring - | regexp - | words - | qwords - | var_ref - | backref - | tFID - { - /*%%%*/ - $$ = NEW_FCALL($1, 0); - /*% - $$ = method_arg(dispatch1(fcall, $1), arg_new()); - %*/ - } - | keyword_begin - { - /*%%%*/ - $<num>$ = ruby_sourceline; - /*% - %*/ - } - bodystmt - keyword_end - { - /*%%%*/ - if ($3 == NULL) { - $$ = NEW_NIL(); - } - else { - if (nd_type($3) == NODE_RESCUE || - nd_type($3) == NODE_ENSURE) - nd_set_line($3, $<num>2); - $$ = NEW_BEGIN($3); - } - nd_set_line($$, $<num>2); - /*% - $$ = dispatch1(begin, $3); - %*/ - } - | tLPAREN_ARG expr {lex_state = EXPR_ENDARG;} rparen - { - rb_warning0("(...) interpreted as grouped expression"); - /*%%%*/ - $$ = $2; - /*% - $$ = dispatch1(paren, $2); - %*/ - } - | tLPAREN compstmt ')' - { - /*%%%*/ - $$ = $2; - /*% - $$ = dispatch1(paren, $2); - %*/ - } - | primary_value tCOLON2 tCONSTANT - { - /*%%%*/ - $$ = NEW_COLON2($1, $3); - /*% - $$ = dispatch2(const_path_ref, $1, $3); - %*/ - } - | tCOLON3 tCONSTANT - { - /*%%%*/ - $$ = NEW_COLON3($2); - /*% - $$ = dispatch1(top_const_ref, $2); - %*/ - } - | tLBRACK aref_args ']' - { - /*%%%*/ - if ($2 == 0) { - $$ = NEW_ZARRAY(); /* zero length array*/ - } - else { - $$ = $2; - } - /*% - $$ = dispatch1(array, escape_Qundef($2)); - %*/ - } - | tLBRACE assoc_list '}' - { - /*%%%*/ - $$ = NEW_HASH($2); - /*% - $$ = dispatch1(hash, escape_Qundef($2)); - %*/ - } - | keyword_return - { - /*%%%*/ - $$ = NEW_RETURN(0); - /*% - $$ = dispatch0(return0); - %*/ - } - | keyword_yield '(' call_args rparen - { - /*%%%*/ - $$ = new_yield($3); - /*% - $$ = dispatch1(yield, dispatch1(paren, $3)); - %*/ - } - | keyword_yield '(' rparen - { - /*%%%*/ - $$ = NEW_YIELD(0, Qfalse); - /*% - $$ = dispatch1(yield, dispatch1(paren, arg_new())); - %*/ - } - | keyword_yield - { - /*%%%*/ - $$ = NEW_YIELD(0, Qfalse); - /*% - $$ = dispatch0(yield0); - %*/ - } - | keyword_defined opt_nl '(' {in_defined = 1;} expr rparen 
- { - /*%%%*/ - in_defined = 0; - $$ = NEW_DEFINED($5); - /*% - in_defined = 0; - $$ = dispatch1(defined, $5); - %*/ - } - | keyword_not '(' expr rparen - { - /*%%%*/ - $$ = call_uni_op(cond($3), '!'); - /*% - $$ = dispatch2(unary, ripper_intern("not"), $3); - %*/ - } - | keyword_not '(' rparen - { - /*%%%*/ - $$ = call_uni_op(cond(NEW_NIL()), '!'); - /*% - $$ = dispatch2(unary, ripper_intern("not"), Qnil); - %*/ - } - | operation brace_block - { - /*%%%*/ - $2->nd_iter = NEW_FCALL($1, 0); - $$ = $2; - fixpos($2->nd_iter, $2); - /*% - $$ = method_arg(dispatch1(fcall, $1), arg_new()); - $$ = method_add_block($$, $2); - %*/ - } - | method_call - | method_call brace_block - { - /*%%%*/ - block_dup_check($1->nd_args, $2); - $2->nd_iter = $1; - $$ = $2; - fixpos($$, $1); - /*% - $$ = method_add_block($1, $2); - %*/ - } - | tLAMBDA lambda - { - $$ = $2; - } - | keyword_if expr_value then - compstmt - if_tail - keyword_end - { - /*%%%*/ - $$ = NEW_IF(cond($2), $4, $5); - fixpos($$, $2); - /*% - $$ = dispatch3(if, $2, $4, escape_Qundef($5)); - %*/ - } - | keyword_unless expr_value then - compstmt - opt_else - keyword_end - { - /*%%%*/ - $$ = NEW_UNLESS(cond($2), $4, $5); - fixpos($$, $2); - /*% - $$ = dispatch3(unless, $2, $4, escape_Qundef($5)); - %*/ - } - | keyword_while {COND_PUSH(1);} expr_value do {COND_POP();} - compstmt - keyword_end - { - /*%%%*/ - $$ = NEW_WHILE(cond($3), $6, 1); - fixpos($$, $3); - /*% - $$ = dispatch2(while, $3, $6); - %*/ - } - | keyword_until {COND_PUSH(1);} expr_value do {COND_POP();} - compstmt - keyword_end - { - /*%%%*/ - $$ = NEW_UNTIL(cond($3), $6, 1); - fixpos($$, $3); - /*% - $$ = dispatch2(until, $3, $6); - %*/ - } - | keyword_case expr_value opt_terms - case_body - keyword_end - { - /*%%%*/ - $$ = NEW_CASE($2, $4); - fixpos($$, $2); - /*% - $$ = dispatch2(case, $2, $4); - %*/ - } - | keyword_case opt_terms case_body keyword_end - { - /*%%%*/ - $$ = NEW_CASE(0, $3); - /*% - $$ = dispatch2(case, Qnil, $3); - %*/ - } - | keyword_for 
for_var keyword_in - {COND_PUSH(1);} - expr_value do - {COND_POP();} - compstmt - keyword_end - { - /*%%%*/ - /* - * for a, b, c in e - * #=> - * e.each{|*x| a, b, c = x - * - * for a in e - * #=> - * e.each{|x| a, = x} - */ - ID id = internal_id(); - ID *tbl = ALLOC_N(ID, 2); - NODE *m = NEW_ARGS_AUX(0, 0); - NODE *args, *scope; - - if (nd_type($2) == NODE_MASGN) { - /* if args.length == 1 && args[0].kind_of?(Array) - * args = args[0] - * end - */ - NODE *one = NEW_LIST(NEW_LIT(INT2FIX(1))); - NODE *zero = NEW_LIST(NEW_LIT(INT2FIX(0))); - m->nd_next = block_append( - NEW_IF( - NEW_NODE(NODE_AND, - NEW_CALL(NEW_CALL(NEW_DVAR(id), rb_intern("length"), 0), - rb_intern("=="), one), - NEW_CALL(NEW_CALL(NEW_DVAR(id), rb_intern("[]"), zero), - rb_intern("kind_of?"), NEW_LIST(NEW_LIT(rb_cArray))), - 0), - NEW_DASGN_CURR(id, - NEW_CALL(NEW_DVAR(id), rb_intern("[]"), zero)), - 0), - node_assign($2, NEW_DVAR(id))); - } - else { - m->nd_next = node_assign(NEW_MASGN(NEW_LIST($2), 0), NEW_DVAR(id)); - } - - args = new_args(m, 0, id, 0, 0); - scope = NEW_NODE(NODE_SCOPE, tbl, $8, args); - tbl[0] = 1; tbl[1] = id; - $$ = NEW_FOR(0, $5, scope); - fixpos($$, $2); - /*% - $$ = dispatch3(for, $2, $5, $8); - %*/ - } - | keyword_class cpath superclass - { - if (in_def || in_single) - yyerror("class definition in method body"); - /*%%%*/ - local_push(0); - $<num>$ = ruby_sourceline; - /*% - %*/ - } - bodystmt - keyword_end - { - /*%%%*/ - $$ = NEW_CLASS($2, $5, $3); - nd_set_line($$, $<num>4); - local_pop(); - /*% - $$ = dispatch3(class, $2, $3, $5); - %*/ - } - | keyword_class tLSHFT expr - { - /* Singleton class body: stash the enclosing in_def in this mid-rule - * value before clearing it. Both builds must store it, because the - * closing action of this alternative restores in_def from this slot. */ - /*%%%*/ - $<num>$ = in_def; - in_def = 0; - /*% - $<val>$ = in_def; - in_def = 0; - %*/ - } - term - { - /*%%%*/ - $<num>$ = in_single; - in_single = 0; - local_push(0); - /*% - $$ = in_single; - in_single = 0; - %*/ - } - bodystmt - keyword_end - { - /*%%%*/ - $$ = NEW_SCLASS($3, $7); - fixpos($$, $3); - local_pop(); - in_def = $<num>4; - in_single = $<num>6; - /*% - $$ = dispatch2(sclass, $3, $7); - in_def =
$<val>4; - in_single = $<val>6; - %*/ - } - | keyword_module cpath - { - if (in_def || in_single) - yyerror("module definition in method body"); - /*%%%*/ - local_push(0); - $<num>$ = ruby_sourceline; - /*% - %*/ - } - bodystmt - keyword_end - { - /*%%%*/ - $$ = NEW_MODULE($2, $4); - nd_set_line($$, $<num>3); - local_pop(); - /*% - $$ = dispatch2(module, $2, $4); - %*/ - } - | keyword_def fname - { - $<id>$ = cur_mid; - cur_mid = $2; - in_def++; - /*%%%*/ - local_push(0); - /*% - %*/ - } - f_arglist - bodystmt - keyword_end - { - /*%%%*/ - NODE *body = remove_begin($5); - reduce_nodes(&body); - $$ = NEW_DEFN($2, $4, body, NOEX_PRIVATE); - fixpos($$, $4); - local_pop(); - in_def--; - cur_mid = $<id>3; - /*% - $$ = dispatch3(def, $2, $4, $5); - in_def--; - cur_mid = $<id>3; - %*/ - } - | keyword_def singleton dot_or_colon {lex_state = EXPR_FNAME;} fname - { - in_single++; - lex_state = EXPR_END; /* force for args */ - /*%%%*/ - local_push(0); - /*% - %*/ - } - f_arglist - bodystmt - keyword_end - { - /*%%%*/ - NODE *body = remove_begin($8); - reduce_nodes(&body); - $$ = NEW_DEFS($2, $5, $7, body); - fixpos($$, $2); - local_pop(); - in_single--; - /*% - $$ = dispatch5(defs, $2, $3, $5, $7, $8); - in_single--; - %*/ - } - | keyword_break - { - /*%%%*/ - $$ = NEW_BREAK(0); - /*% - $$ = dispatch1(break, arg_new()); - %*/ - } - | keyword_next - { - /*%%%*/ - $$ = NEW_NEXT(0); - /*% - $$ = dispatch1(next, arg_new()); - %*/ - } - | keyword_redo - { - /*%%%*/ - $$ = NEW_REDO(); - /*% - $$ = dispatch0(redo); - %*/ - } - | keyword_retry - { - /*%%%*/ - $$ = NEW_RETRY(); - /*% - $$ = dispatch0(retry); - %*/ - } - ; - -primary_value : primary - { - /*%%%*/ - value_expr($1); - $$ = $1; - if (!$$) $$ = NEW_NIL(); - /*% - $$ = $1; - %*/ - } - ; - -then : term - /*%c%*/ - /*%c - { $$ = Qnil; } - %*/ - | keyword_then - | term keyword_then - /*%c%*/ - /*%c - { $$ = $2; } - %*/ - ; - -do : term - /*%c%*/ - /*%c - { $$ = Qnil; } - %*/ - | keyword_do_cond - ; - -if_tail : opt_else - | 
keyword_elsif expr_value then - compstmt - if_tail - { - /*%%%*/ - $$ = NEW_IF(cond($2), $4, $5); - fixpos($$, $2); - /*% - $$ = dispatch3(elsif, $2, $4, escape_Qundef($5)); - %*/ - } - ; - -opt_else : none - | keyword_else compstmt - { - /*%%%*/ - $$ = $2; - /*% - $$ = dispatch1(else, $2); - %*/ - } - ; - -for_var : lhs - | mlhs - ; - -f_marg : f_norm_arg - { - /*%%%*/ - $$ = assignable($1, 0); - /*% - $$ = dispatch1(mlhs_paren, $1); - %*/ - } - | tLPAREN f_margs rparen - { - /*%%%*/ - $$ = $2; - /*% - $$ = dispatch1(mlhs_paren, $2); - %*/ - } - ; - -f_marg_list : f_marg - { - /*%%%*/ - $$ = NEW_LIST($1); - /*% - $$ = mlhs_add(mlhs_new(), $1); - %*/ - } - | f_marg_list ',' f_marg - { - /*%%%*/ - $$ = list_append($1, $3); - /*% - $$ = mlhs_add($1, $3); - %*/ - } - ; - -f_margs : f_marg_list - { - /*%%%*/ - $$ = NEW_MASGN($1, 0); - /*% - $$ = $1; - %*/ - } - | f_marg_list ',' tSTAR f_norm_arg - { - /*%%%*/ - $$ = NEW_MASGN($1, assignable($4, 0)); - /*% - $$ = mlhs_add_star($1, $4); - %*/ - } - | f_marg_list ',' tSTAR f_norm_arg ',' f_marg_list - { - /*%%%*/ - $$ = NEW_MASGN($1, NEW_POSTARG(assignable($4, 0), $6)); - /*% - $$ = mlhs_add_star($1, $4); - %*/ - } - | f_marg_list ',' tSTAR - { - /*%%%*/ - $$ = NEW_MASGN($1, -1); - /*% - $$ = mlhs_add_star($1, Qnil); - %*/ - } - | f_marg_list ',' tSTAR ',' f_marg_list - { - /* Anonymous splat followed by post arguments. For ripper the star - * slot is Qnil, as in the other anonymous-splat alternatives; the - * trailing list is not the splat variable. */ - /*%%%*/ - $$ = NEW_MASGN($1, NEW_POSTARG(-1, $5)); - /*% - $$ = mlhs_add_star($1, Qnil); - %*/ - } - | tSTAR f_norm_arg - { - /*%%%*/ - $$ = NEW_MASGN(0, assignable($2, 0)); - /*% - $$ = mlhs_add_star(mlhs_new(), $2); - %*/ - } - | tSTAR f_norm_arg ',' f_marg_list - { - /* Leading named splat followed by post arguments. For ripper the - * splat variable is added to a fresh mlhs, as in the plain leading - * splat alternative above; the identifier is not itself a list. */ - /*%%%*/ - $$ = NEW_MASGN(0, NEW_POSTARG(assignable($2, 0), $4)); - /*% - $$ = mlhs_add_star(mlhs_new(), $2); - %*/ - } - | tSTAR - { - /*%%%*/ - $$ = NEW_MASGN(0, -1); - /*% - $$ = mlhs_add_star(mlhs_new(), Qnil); - %*/ - } - | tSTAR ',' f_marg_list - { - /*%%%*/ - $$ = NEW_MASGN(0, NEW_POSTARG(-1, $3)); - /*% - $$ = mlhs_add_star(mlhs_new(), Qnil); - %*/ - } - ;
- -block_param : f_arg ',' f_rest_arg opt_f_block_arg - { - /*%%%*/ - $$ = new_args($1, 0, $3, 0, $4); - /*% - $$ = params_new($1, Qnil, $3, Qnil, escape_Qundef($4)); - %*/ - } - | f_arg ',' - { - /*%%%*/ - $$ = new_args($1, 0, 1, 0, 0); - /*% - $$ = params_new($1, Qnil, Qnil, Qnil, Qnil); - dispatch1(excessed_comma, $$); - %*/ - } - | f_arg ',' f_rest_arg ',' f_arg opt_f_block_arg - { - /*%%%*/ - $$ = new_args($1, 0, $3, $5, $6); - /*% - $$ = params_new($1, Qnil, $3, $5, escape_Qundef($6)); - %*/ - } - | f_arg opt_f_block_arg - { - /*%%%*/ - $$ = new_args($1, 0, 0, 0, $2); - /*% - $$ = params_new($1, Qnil,Qnil, Qnil, escape_Qundef($2)); - %*/ - } - | f_rest_arg opt_f_block_arg - { - /*%%%*/ - $$ = new_args(0, 0, $1, 0, $2); - /*% - $$ = params_new(Qnil, Qnil, $1, Qnil, escape_Qundef($2)); - %*/ - } - | f_rest_arg ',' f_arg opt_f_block_arg - { - /*%%%*/ - $$ = new_args(0, 0, $1, $3, $4); - /*% - $$ = params_new(Qnil, Qnil, $1, $3, escape_Qundef($4)); - %*/ - } - | f_block_arg - { - /*%%%*/ - $$ = new_args(0, 0, 0, 0, $1); - /*% - $$ = params_new(Qnil, Qnil, Qnil, Qnil, $1); - %*/ - } - ; - -opt_block_param : none - | block_param_def - { - command_start = Qtrue; - } - ; - -block_param_def : '|' opt_bv_decl '|' - { - /*%%%*/ - $$ = 0; - /*% - $$ = blockvar_new(params_new(Qnil,Qnil,Qnil,Qnil,Qnil), - escape_Qundef($2)); - %*/ - } - | tOROP - { - /*%%%*/ - $$ = 0; - /*% - $$ = blockvar_new(params_new(Qnil,Qnil,Qnil,Qnil,Qnil), - Qnil); - %*/ - } - | '|' block_param opt_bv_decl '|' - { - /*%%%*/ - $$ = $2; - /*% - $$ = blockvar_new(escape_Qundef($2), escape_Qundef($3)); - %*/ - } - ; - - -opt_bv_decl : none - | ';' bv_decls - { - /*%%%*/ - $$ = 0; - /*% - $$ = $2; - %*/ - } - ; -/* bv_decls: comma-separated block-local variable names following ';' (see opt_bv_decl). The parser build needs no action here because bvar registers each name through new_bv(); the ripper-only action starts a one-element array with rb_ary_new3(1, x) -- rb_ary_new2() takes a capacity, not an element -- and appends each further name to it. */ -bv_decls : bvar - /*%c%*/ - /*%c - { - $$ = rb_ary_new3(1, $1); - } - %*/ - | bv_decls ',' bvar - /*%c%*/ - /*%c - { - $$ = rb_ary_push($1, $3); - } - %*/ - ; - -bvar : tIDENTIFIER - { - /*%%%*/ - new_bv($1); - /*% - $$ = $1; - %*/ - } - | f_bad_arg - { - $$ = 0; - } - ; - -lambda : { - /*%%%*/ - 
dyna_push(); - $<num>$ = lpar_beg; - lpar_beg = ++paren_nest; - /*% - %*/ - } - f_larglist - lambda_body - { - /*%%%*/ - $$ = $2; - $$->nd_body = NEW_SCOPE($2->nd_head, $3); - dyna_pop(); - lpar_beg = $<num>1; - /*% - $$ = dispatch2(lambda, $2, $3); - %*/ - } - ; - -f_larglist : '(' f_args opt_bv_decl rparen - { - /*%%%*/ - $$ = NEW_LAMBDA($2); - /*% - $$ = dispatch1(paren, $2); - %*/ - } - | f_args opt_bv_decl - { - /*%%%*/ - $$ = NEW_LAMBDA($1); - /*% - $$ = $1; - %*/ - } - ; - -lambda_body : tLAMBEG compstmt '}' - { - $$ = $2; - } - | keyword_do_LAMBDA compstmt keyword_end - { - $$ = $2; - } - ; - -do_block : keyword_do_block - { - /*%%%*/ - dyna_push(); - $<num>$ = ruby_sourceline; - /*% %*/ - } - opt_block_param - compstmt - keyword_end - { - /*%%%*/ - $$ = NEW_ITER($3,$4); - nd_set_line($$, $<num>2); - dyna_pop(); - /*% - $$ = dispatch2(do_block, escape_Qundef($3), $4); - %*/ - } - ; - -block_call : command do_block - { - /*%%%*/ - block_dup_check($1->nd_args, $2); - $2->nd_iter = $1; - $$ = $2; - fixpos($$, $1); - /*% - $$ = method_add_block($1, $2); - %*/ - } - | block_call '.' operation2 opt_paren_args - { - /*%%%*/ - $$ = NEW_CALL($1, $3, $4); - /*% - $$ = dispatch3(call, $1, ripper_id2sym('.'), $3); - $$ = method_optarg($$, $4); - %*/ - } - | block_call tCOLON2 operation2 opt_paren_args - { - /*%%%*/ - $$ = NEW_CALL($1, $3, $4); - /*% - $$ = dispatch3(call, $1, ripper_intern("::"), $3); - $$ = method_optarg($$, $4); - %*/ - } - ; - -method_call : operation paren_args - { - /*%%%*/ - $$ = NEW_FCALL($1, $2); - fixpos($$, $2); - /*% - $$ = method_arg(dispatch1(fcall, $1), $2); - %*/ - } - | primary_value '.' 
operation2 opt_paren_args - { - /*%%%*/ - $$ = NEW_CALL($1, $3, $4); - fixpos($$, $1); - /*% - $$ = dispatch3(call, $1, ripper_id2sym('.'), $3); - $$ = method_optarg($$, $4); - %*/ - } - /* recv::meth(args): ripper is told the separator was "::", matching the other tCOLON2 alternatives of method_call and block_call */ - | primary_value tCOLON2 operation2 paren_args - { - /*%%%*/ - $$ = NEW_CALL($1, $3, $4); - fixpos($$, $1); - /*% - $$ = dispatch3(call, $1, ripper_intern("::"), $3); - $$ = method_optarg($$, $4); - %*/ - } - | primary_value tCOLON2 operation3 - { - /*%%%*/ - $$ = NEW_CALL($1, $3, 0); - /*% - $$ = dispatch3(call, $1, ripper_intern("::"), $3); - %*/ - } - /* recv.(args) and recv::(args) build a call to the method named "call"; the ripper event receives that name as a Symbol VALUE (ripper_intern), never a raw ID */ - | primary_value '.' paren_args - { - /*%%%*/ - $$ = NEW_CALL($1, rb_intern("call"), $3); - fixpos($$, $1); - /*% - $$ = dispatch3(call, dispatch1(paren, $1), - ripper_id2sym('.'), ripper_intern("call")); - $$ = method_optarg($$, $3); - %*/ - } - | primary_value tCOLON2 paren_args - { - /*%%%*/ - $$ = NEW_CALL($1, rb_intern("call"), $3); - fixpos($$, $1); - /*% - $$ = dispatch3(call, dispatch1(paren, $1), - ripper_intern("::"), ripper_intern("call")); - $$ = method_optarg($$, $3); - %*/ - } - | keyword_super paren_args - { - /*%%%*/ - $$ = NEW_SUPER($2); - /*% - $$ = dispatch1(super, $2); - %*/ - } - | keyword_super - { - /*%%%*/ - $$ = NEW_ZSUPER(); - /*% - $$ = dispatch0(zsuper); - %*/ - } - | primary_value '[' opt_call_args rbracket - { - /*%%%*/ - if ($1 && nd_type($1) == NODE_SELF) - $$ = NEW_FCALL(tAREF, $3); - else - $$ = NEW_CALL($1, tAREF, $3); - fixpos($$, $1); - /*% - $$ = dispatch2(aref, $1, escape_Qundef($3)); - %*/ - } - ; - -brace_block : '{' - { - /*%%%*/ - dyna_push(); - $<num>$ = ruby_sourceline; - /*% - %*/ - } - opt_block_param - compstmt '}' - { - /*%%%*/ - $$ = NEW_ITER($3,$4); - nd_set_line($$, $<num>2); - dyna_pop(); - /*% - $$ = dispatch2(brace_block, escape_Qundef($3), $4); - %*/ - } - | keyword_do - { - /*%%%*/ - dyna_push(); - $<num>$ = ruby_sourceline; - /*% - %*/ - } - opt_block_param - compstmt keyword_end - { - /*%%%*/ - $$ = NEW_ITER($3,$4); - nd_set_line($$, $<num>2); - dyna_pop(); - /*% - $$ = 
dispatch2(do_block, escape_Qundef($3), $4); - %*/ - } - ; - -case_body : keyword_when args then - compstmt - cases - { - /*%%%*/ - $$ = NEW_WHEN($2, $4, $5); - /*% - $$ = dispatch3(when, $2, $4, escape_Qundef($5)); - %*/ - } - ; - -cases : opt_else - | case_body - ; - -opt_rescue : keyword_rescue exc_list exc_var then - compstmt - opt_rescue - { - /*%%%*/ - if ($3) { - $3 = node_assign($3, NEW_ERRINFO()); - $5 = block_append($3, $5); - } - $$ = NEW_RESBODY($2, $5, $6); - fixpos($$, $2?$2:$5); - /*% - $$ = dispatch4(rescue, - escape_Qundef($2), - escape_Qundef($3), - escape_Qundef($5), - escape_Qundef($6)); - %*/ - } - | none - ; - -exc_list : arg_value - { - /*%%%*/ - $$ = NEW_LIST($1); - /*% - $$ = rb_ary_new3(1, $1); - %*/ - } - | mrhs - { - /*%%%*/ - if (!($$ = splat_array($1))) $$ = $1; - /*% - $$ = $1; - %*/ - } - | none - ; - -exc_var : tASSOC lhs - { - $$ = $2; - } - | none - ; - -opt_ensure : keyword_ensure compstmt - { - /*%%%*/ - $$ = $2; - /*% - $$ = dispatch1(ensure, $2); - %*/ - } - | none - ; - -literal : numeric - | symbol - { - /*%%%*/ - $$ = NEW_LIT(ID2SYM($1)); - /*% - $$ = dispatch1(symbol_literal, $1); - %*/ - } - | dsym - ; - -strings : string - { - /*%%%*/ - NODE *node = $1; - if (!node) { - node = NEW_STR(STR_NEW0()); - } - else { - node = evstr2dstr(node); - } - $$ = node; - /*% - $$ = $1; - %*/ - } - ; - -string : tCHAR - | string1 - | string string1 - { - /*%%%*/ - $$ = literal_concat($1, $2); - /*% - $$ = dispatch2(string_concat, $1, $2); - %*/ - } - ; - -string1 : tSTRING_BEG string_contents tSTRING_END - { - /*%%%*/ - $$ = $2; - /*% - $$ = dispatch1(string_literal, $2); - %*/ - } - ; - -xstring : tXSTRING_BEG xstring_contents tSTRING_END - { - /*%%%*/ - NODE *node = $2; - if (!node) { - node = NEW_XSTR(STR_NEW0()); - } - else { - switch (nd_type(node)) { - case NODE_STR: - nd_set_type(node, NODE_XSTR); - break; - case NODE_DSTR: - nd_set_type(node, NODE_DXSTR); - break; - default: - node = NEW_NODE(NODE_DXSTR, STR_NEW0(), 1, 
NEW_LIST(node)); - break; - } - } - $$ = node; - /*% - $$ = dispatch1(xstring_literal, $2); - %*/ - } - ; - -regexp : tREGEXP_BEG xstring_contents tREGEXP_END - { - /*%%%*/ - int options = $3; - NODE *node = $2; - NODE *list; - if (!node) { - node = NEW_LIT(reg_compile(STR_NEW0(), options)); - } - else switch (nd_type(node)) { - case NODE_STR: - { - VALUE src = node->nd_lit; - nd_set_type(node, NODE_LIT); - node->nd_lit = reg_compile(src, options); - } - break; - default: - node = NEW_NODE(NODE_DSTR, STR_NEW0(), 1, NEW_LIST(node)); - case NODE_DSTR: - if (options & RE_OPTION_ONCE) { - nd_set_type(node, NODE_DREGX_ONCE); - } - else { - nd_set_type(node, NODE_DREGX); - } - node->nd_cflag = options & RE_OPTION_MASK; - reg_fragment_check(node->nd_lit, options); - for (list = node->nd_next; list; list = list->nd_next) { - if (nd_type(list->nd_head) == NODE_STR) { - reg_fragment_check(list->nd_head->nd_lit, options); - } - } - break; - } - $$ = node; - /*% - $$ = dispatch2(regexp_literal, $2, $3); - %*/ - } - ; - -words : tWORDS_BEG ' ' tSTRING_END - { - /*%%%*/ - $$ = NEW_ZARRAY(); - /*% - $$ = dispatch0(words_new); - %*/ - } - | tWORDS_BEG word_list tSTRING_END - { - $$ = $2; - } - ; - -word_list : /* none */ - { - /*%%%*/ - $$ = 0; - /*% - $$ = dispatch0(words_new); - %*/ - } - | word_list word ' ' - { - /*%%%*/ - $$ = list_append($1, evstr2dstr($2)); - /*% - $$ = dispatch2(words_add, $1, $2); - %*/ - } - ; - -word : string_content - /*%c%*/ - /*%c - { - $$ = dispatch0(word_new); - $$ = dispatch2(word_add, $$, $1); - } - %*/ - | word string_content - { - /*%%%*/ - $$ = literal_concat($1, $2); - /*% - $$ = dispatch2(word_add, $1, $2); - %*/ - } - ; - -qwords : tQWORDS_BEG ' ' tSTRING_END - { - /*%%%*/ - $$ = NEW_ZARRAY(); - /*% - $$ = dispatch0(qwords_new); - %*/ - } - | tQWORDS_BEG qword_list tSTRING_END - { - $$ = $2; - } - ; - -qword_list : /* none */ - { - /*%%%*/ - $$ = 0; - /*% - $$ = dispatch0(qwords_new); - %*/ - } - | qword_list tSTRING_CONTENT ' ' - { - 
/*%%%*/ - $$ = list_append($1, $2); - /*% - $$ = dispatch2(qwords_add, $1, $2); - %*/ - } - ; - -string_contents : /* none */ - { - /*%%%*/ - $$ = 0; - /*% - $$ = dispatch0(string_content); - %*/ - } - | string_contents string_content - { - /*%%%*/ - $$ = literal_concat($1, $2); - /*% - $$ = dispatch2(string_add, $1, $2); - %*/ - } - ; - -xstring_contents: /* none */ - { - /*%%%*/ - $$ = 0; - /*% - $$ = dispatch0(xstring_new); - %*/ - } - | xstring_contents string_content - { - /*%%%*/ - $$ = literal_concat($1, $2); - /*% - $$ = dispatch2(xstring_add, $1, $2); - %*/ - } - ; - -string_content : tSTRING_CONTENT - | tSTRING_DVAR - { - $<node>$ = lex_strterm; - lex_strterm = 0; - lex_state = EXPR_BEG; - } - string_dvar - { - /*%%%*/ - lex_strterm = $<node>2; - $$ = NEW_EVSTR($3); - /*% - lex_strterm = $<node>2; - $$ = dispatch1(string_dvar, $3); - %*/ - } - | tSTRING_DBEG - { - $<node>$ = lex_strterm; - lex_strterm = 0; - lex_state = EXPR_BEG; - COND_PUSH(0); - CMDARG_PUSH(0); - } - compstmt '}' - { - lex_strterm = $<node>2; - COND_LEXPOP(); - CMDARG_LEXPOP(); - /*%%%*/ - if ($3) $3->flags &= ~NODE_FL_NEWLINE; - $$ = new_evstr($3); - /*% - $$ = dispatch1(string_embexpr, $3); - %*/ - } - ; - -string_dvar : tGVAR - { - /*%%%*/ - $$ = NEW_GVAR($1); - /*% - $$ = dispatch1(var_ref, $1); - %*/ - } - | tIVAR - { - /*%%%*/ - $$ = NEW_IVAR($1); - /*% - $$ = dispatch1(var_ref, $1); - %*/ - } - | tCVAR - { - /*%%%*/ - $$ = NEW_CVAR($1); - /*% - $$ = dispatch1(var_ref, $1); - %*/ - } - | backref - ; - -symbol : tSYMBEG sym - { - /*%%%*/ - lex_state = EXPR_ENDARG; - $$ = $2; - /*% - lex_state = EXPR_ENDARG; - $$ = dispatch1(symbol, $2); - %*/ - } - ; - -sym : fname - | tIVAR - | tGVAR - | tCVAR - ; - -dsym : tSYMBEG xstring_contents tSTRING_END - { - /*%%%*/ - lex_state = EXPR_ENDARG; - if (!($$ = $2)) { - $$ = NEW_LIT(ID2SYM(rb_intern(""))); - } - else { - VALUE lit; - - switch (nd_type($$)) { - case NODE_DSTR: - nd_set_type($$, NODE_DSYM); - break; - case NODE_STR: - lit = 
$$->nd_lit; - $$->nd_lit = ID2SYM(rb_intern_str(lit)); - nd_set_type($$, NODE_LIT); - break; - default: - $$ = NEW_NODE(NODE_DSYM, STR_NEW0(), 1, NEW_LIST($$)); - break; - } - } - /*% - lex_state = EXPR_ENDARG; - $$ = dispatch1(dyna_symbol, $2); - %*/ - } - ; - -numeric : tINTEGER - | tFLOAT - | tUMINUS_NUM tINTEGER %prec tLOWEST - { - /*%%%*/ - $$ = negate_lit($2); - /*% - $$ = dispatch2(unary, ripper_intern("-@"), $2); - %*/ - } - | tUMINUS_NUM tFLOAT %prec tLOWEST - { - /*%%%*/ - $$ = negate_lit($2); - /*% - $$ = dispatch2(unary, ripper_intern("-@"), $2); - %*/ - } - ; - -variable : tIDENTIFIER - | tIVAR - | tGVAR - | tCONSTANT - | tCVAR - | keyword_nil {ifndef_ripper($$ = keyword_nil);} - | keyword_self {ifndef_ripper($$ = keyword_self);} - | keyword_true {ifndef_ripper($$ = keyword_true);} - | keyword_false {ifndef_ripper($$ = keyword_false);} - | keyword__FILE__ {ifndef_ripper($$ = keyword__FILE__);} - | keyword__LINE__ {ifndef_ripper($$ = keyword__LINE__);} - | keyword__ENCODING__ {ifndef_ripper($$ = keyword__ENCODING__);} - ; - -var_ref : variable - { - /*%%%*/ - if (!($$ = gettable($1))) $$ = NEW_BEGIN(0); - /*% - $$ = dispatch1(var_ref, $1); - %*/ - } - ; - -var_lhs : variable - { - /*%%%*/ - $$ = assignable($1, 0); - /*% - $$ = dispatch1(var_field, $1); - %*/ - } - ; - -backref : tNTH_REF - | tBACK_REF - ; - -superclass : term - { - /*%%%*/ - $$ = 0; - /*% - $$ = Qnil; - %*/ - } - | '<' - { - lex_state = EXPR_BEG; - } - expr_value term - { - $$ = $3; - } - | error term - { - /*%%%*/ - yyerrok; - $$ = 0; - /*% - yyerrok; - $$ = Qnil; - %*/ - } - ; - -f_arglist : '(' f_args rparen - { - /*%%%*/ - $$ = $2; - lex_state = EXPR_BEG; - command_start = Qtrue; - /*% - $$ = dispatch1(paren, $2); - lex_state = EXPR_BEG; - command_start = Qtrue; - %*/ - } - | f_args term - { - $$ = $1; - } - ; - -f_args : f_arg ',' f_optarg ',' f_rest_arg opt_f_block_arg - { - /*%%%*/ - $$ = new_args($1, $3, $5, 0, $6); - /*% - $$ = params_new($1, $3, $5, Qnil, escape_Qundef($6)); - 
%*/ - } - | f_arg ',' f_optarg ',' f_rest_arg ',' f_arg opt_f_block_arg - { - /*%%%*/ - $$ = new_args($1, $3, $5, $7, $8); - /*% - $$ = params_new($1, $3, $5, $7, escape_Qundef($8)); - %*/ - } - | f_arg ',' f_optarg opt_f_block_arg - { - /*%%%*/ - $$ = new_args($1, $3, 0, 0, $4); - /*% - $$ = params_new($1, $3, Qnil, Qnil, escape_Qundef($4)); - %*/ - } - | f_arg ',' f_optarg ',' f_arg opt_f_block_arg - { - /*%%%*/ - $$ = new_args($1, $3, 0, $5, $6); - /*% - $$ = params_new($1, $3, Qnil, $5, escape_Qundef($6)); - %*/ - } - | f_arg ',' f_rest_arg opt_f_block_arg - { - /*%%%*/ - $$ = new_args($1, 0, $3, 0, $4); - /*% - $$ = params_new($1, Qnil, $3, Qnil, escape_Qundef($4)); - %*/ - } - | f_arg ',' f_rest_arg ',' f_arg opt_f_block_arg - { - /*%%%*/ - $$ = new_args($1, 0, $3, $5, $6); - /*% - $$ = params_new($1, Qnil, $3, $5, escape_Qundef($6)); - %*/ - } - | f_arg opt_f_block_arg - { - /*%%%*/ - $$ = new_args($1, 0, 0, 0, $2); - /*% - $$ = params_new($1, Qnil, Qnil, Qnil,escape_Qundef($2)); - %*/ - } - | f_optarg ',' f_rest_arg opt_f_block_arg - { - /*%%%*/ - $$ = new_args(0, $1, $3, 0, $4); - /*% - $$ = params_new(Qnil, $1, $3, Qnil, escape_Qundef($4)); - %*/ - } - | f_optarg ',' f_rest_arg ',' f_arg opt_f_block_arg - { - /*%%%*/ - $$ = new_args(0, $1, $3, $5, $6); - /*% - $$ = params_new(Qnil, $1, $3, $5, escape_Qundef($6)); - %*/ - } - | f_optarg opt_f_block_arg - { - /*%%%*/ - $$ = new_args(0, $1, 0, 0, $2); - /*% - $$ = params_new(Qnil, $1, Qnil, Qnil,escape_Qundef($2)); - %*/ - } - | f_optarg ',' f_arg opt_f_block_arg - { - /*%%%*/ - $$ = new_args(0, $1, 0, $3, $4); - /*% - $$ = params_new(Qnil, $1, Qnil, $3, escape_Qundef($4)); - %*/ - } - | f_rest_arg opt_f_block_arg - { - /*%%%*/ - $$ = new_args(0, 0, $1, 0, $2); - /*% - $$ = params_new(Qnil, Qnil, $1, Qnil,escape_Qundef($2)); - %*/ - } - | f_rest_arg ',' f_arg opt_f_block_arg - { - /*%%%*/ - $$ = new_args(0, 0, $1, $3, $4); - /*% - $$ = params_new(Qnil, Qnil, $1, $3, escape_Qundef($4)); - %*/ - } - | 
f_block_arg - { - /*%%%*/ - $$ = new_args(0, 0, 0, 0, $1); - /*% - $$ = params_new(Qnil, Qnil, Qnil, Qnil, $1); - %*/ - } - | /* none */ - { - /*%%%*/ - $$ = new_args(0, 0, 0, 0, 0); - /*% - $$ = params_new(Qnil, Qnil, Qnil, Qnil, Qnil); - %*/ - } - ; - -f_bad_arg : tCONSTANT - { - /*%%%*/ - yyerror("formal argument cannot be a constant"); - $$ = 0; - /*% - $$ = dispatch1(param_error, $1); - %*/ - } - | tIVAR - { - /*%%%*/ - yyerror("formal argument cannot be an instance variable"); - $$ = 0; - /*% - $$ = dispatch1(param_error, $1); - %*/ - } - | tGVAR - { - /*%%%*/ - yyerror("formal argument cannot be a global variable"); - $$ = 0; - /*% - $$ = dispatch1(param_error, $1); - %*/ - } - | tCVAR - { - /*%%%*/ - yyerror("formal argument cannot be a class variable"); - $$ = 0; - /*% - $$ = dispatch1(param_error, $1); - %*/ - } - ; - -f_norm_arg : f_bad_arg - | tIDENTIFIER - { - /*%%%*/ - if (!is_local_id($1)) - yyerror("formal argument must be local variable"); - shadowing_lvar($1); - /*% - %*/ - $$ = $1; - } - ; - -f_arg_item : f_norm_arg - { - /*%%%*/ - arg_var($1); - $$ = NEW_ARGS_AUX($1, 1); - /*% - %*/ - } - | tLPAREN f_margs rparen - { - /*%%%*/ - ID tid = internal_id(); - arg_var(tid); - if (dyna_in_block()) { - $2->nd_value = NEW_DVAR(tid); - } - else { - $2->nd_value = NEW_LVAR(tid); - } - $$ = NEW_ARGS_AUX(tid, 1); - $$->nd_next = $2; - /*% - $$ = dispatch1(mlhs_paren, $2); - %*/ - } - ; - -f_arg : f_arg_item - /*%c%*/ - /*%c - { - $$ = rb_ary_new3(1, $1); - } - c%*/ - | f_arg ',' f_arg_item - { - /*%%%*/ - $$ = $1; - $$->nd_plen++; - $$->nd_next = block_append($$->nd_next, $3->nd_next); - rb_gc_force_recycle((VALUE)$3); - /*% - $$ = rb_ary_push($1, $3); - %*/ - } - ; - -f_opt : tIDENTIFIER '=' arg_value - { - /*%%%*/ - if (!is_local_id($1)) - yyerror("formal argument must be local variable"); - shadowing_lvar($1); - arg_var($1); - $$ = NEW_OPT_ARG(0, assignable($1, $3)); - /*% - $$ = rb_assoc_new($1, $3); - %*/ - } - ; - -f_optarg : f_opt - { - /*%%%*/ - $$ = 
$1; - /*% - $$ = rb_ary_new3(1, $1); - %*/ - } - | f_optarg ',' f_opt - { - /*%%%*/ - NODE *opts = $1; - - while (opts->nd_next) { - opts = opts->nd_next; - } - opts->nd_next = $3; - $$ = $1; - /*% - $$ = rb_ary_push($1, $3); - %*/ - } - ; - -restarg_mark : '*' - | tSTAR - ; - -f_rest_arg : restarg_mark tIDENTIFIER - { - /*%%%*/ - if (!is_local_id($2)) - yyerror("rest argument must be local variable"); - shadowing_lvar($2); - arg_var($2); - $$ = $2; - /*% - $$ = dispatch1(rest_param, $2); - %*/ - } - | restarg_mark - { - /*%%%*/ - $$ = internal_id(); - arg_var($$); - /*% - $$ = dispatch1(rest_param, Qnil); - %*/ - } - ; - -blkarg_mark : '&' - | tAMPER - ; - -f_block_arg : blkarg_mark tIDENTIFIER - { - /*%%%*/ - if (!is_local_id($2)) - yyerror("block argument must be local variable"); - else if (!dyna_in_block() && local_id($2)) - yyerror("duplicated block argument name"); - shadowing_lvar($2); - arg_var($2); - $$ = $2; - /*% - $$ = dispatch1(blockarg, $2); - %*/ - } - ; - -opt_f_block_arg : ',' f_block_arg - { - $$ = $2; - } - | none - { - /*%%%*/ - $$ = 0; - /*% - $$ = Qundef; - %*/ - } - ; - -singleton : var_ref - { - /*%%%*/ - value_expr($1); - $$ = $1; - if (!$$) $$ = NEW_NIL(); - /*% - $$ = $1; - %*/ - } - | '(' {lex_state = EXPR_BEG;} expr rparen - { - /*%%%*/ - if ($3 == 0) { - yyerror("can't define singleton method for ()."); - } - else { - switch (nd_type($3)) { - case NODE_STR: - case NODE_DSTR: - case NODE_XSTR: - case NODE_DXSTR: - case NODE_DREGX: - case NODE_LIT: - case NODE_ARRAY: - case NODE_ZARRAY: - yyerror("can't define singleton method for literals"); - default: - value_expr($3); - break; - } - } - $$ = $3; - /*% - $$ = dispatch1(paren, $3); - %*/ - } - ; - -assoc_list : none - | assocs trailer - { - /*%%%*/ - $$ = $1; - /*% - $$ = dispatch1(assoclist_from_args, $1); - %*/ - } - ; - -assocs : assoc - /*%c%*/ - /*%c - { - $$ = rb_ary_new3(1, $1); - } - %*/ - | assocs ',' assoc - { - /*%%%*/ - $$ = list_concat($1, $3); - /*% - $$ = rb_ary_push($1, 
$3); - %*/ - } - ; - -assoc : arg_value tASSOC arg_value - { - /*%%%*/ - $$ = list_append(NEW_LIST($1), $3); - /*% - $$ = dispatch2(assoc_new, $1, $3); - %*/ - } - | tLABEL arg_value - { - /*%%%*/ - $$ = list_append(NEW_LIST(NEW_LIT(ID2SYM($1))), $2); - /*% - $$ = dispatch2(assoc_new, $1, $2); - %*/ - } - ; - -operation : tIDENTIFIER - | tCONSTANT - | tFID - ; - -operation2 : tIDENTIFIER - | tCONSTANT - | tFID - | op - ; - -operation3 : tIDENTIFIER - | tFID - | op - ; - -dot_or_colon : '.' - /*%c%*/ - /*%c - { $$ = $<val>1; } - %*/ - | tCOLON2 - /*%c%*/ - /*%c - { $$ = $<val>1; } - %*/ - ; - -opt_terms : /* none */ - | terms - ; - -opt_nl : /* none */ - | '\n' - ; - -rparen : opt_nl ')' - ; - -rbracket : opt_nl ']' - ; - -trailer : /* none */ - | '\n' - | ',' - ; - -term : ';' {yyerrok;} - | '\n' - ; - -terms : term - | terms ';' {yyerrok;} - ; - -none : /* none */ - { - /*%%%*/ - $$ = 0; - /*% - $$ = Qundef; - %*/ - } - ; -%% -# undef parser -# undef yylex -# undef yylval -# define yylval (*((YYSTYPE*)(parser->parser_yylval))) - -static int parser_regx_options(struct parser_params*); -static int parser_tokadd_string(struct parser_params*,int,int,int,long*,rb_encoding**); -static void parser_tokaddmbc(struct parser_params *parser, int c, rb_encoding *enc); -static int parser_parse_string(struct parser_params*,NODE*); -static int parser_here_document(struct parser_params*,NODE*); - - -# define nextc() parser_nextc(parser) -# define pushback(c) parser_pushback(parser, c) -# define newtok() parser_newtok(parser) -# define tokspace(n) parser_tokspace(parser, n) -# define tokadd(c) parser_tokadd(parser, c) -# define tok_hex(numlen) parser_tok_hex(parser, numlen) -# define read_escape(flags,e) parser_read_escape(parser, flags, e) -# define tokadd_escape(e) parser_tokadd_escape(parser, e) -# define regx_options() parser_regx_options(parser) -# define tokadd_string(f,t,p,n,e) parser_tokadd_string(parser,f,t,p,n,e) -# define parse_string(n) parser_parse_string(parser,n) -# 
define tokaddmbc(c, enc) parser_tokaddmbc(parser, c, enc) -# define here_document(n) parser_here_document(parser,n) -# define heredoc_identifier() parser_heredoc_identifier(parser) -# define heredoc_restore(n) parser_heredoc_restore(parser,n) -# define whole_match_p(e,l,i) parser_whole_match_p(parser,e,l,i) - -#ifdef RIPPER -/* FIXME */ -# define local_id(x) 1 -# define dyna_in_block() 1 -#endif /* RIPPER */ - -#ifndef RIPPER -# define set_yylval_str(x) yylval.node = NEW_STR(x) -# define set_yylval_num(x) yylval.num = x -# define set_yylval_id(x) yylval.id = x -# define set_yylval_literal(x) yylval.node = NEW_LIT(x) -# define set_yylval_node(x) yylval.node = x -# define yylval_id() yylval.id -#else -# define set_yylval_str(x) (void)(x) -# define set_yylval_num(x) (void)(x) -# define set_yylval_id(x) (void)(x) -# define set_yylval_literal(x) (void)(x) -# define set_yylval_node(x) (void)(x) -# define yylval_id() SYM2ID(yylval.val) -#endif - -#ifdef RIPPER -#define ripper_flush(p) (p->tokp = p->parser_lex_p) - -static void -ripper_dispatch_scan_event(struct parser_params *parser, int t) -{ - VALUE str; - - if (lex_p < parser->tokp) rb_raise(rb_eRuntimeError, "lex_p < tokp"); - if (lex_p == parser->tokp) return; - str = STR_NEW(parser->tokp, lex_p - parser->tokp); - yylval.val = ripper_dispatch1(parser, ripper_token2eventid(t), str); - ripper_flush(parser); -} - -static void -ripper_dispatch_delayed_token(struct parser_params *parser, int t) -{ - int saved_line = ruby_sourceline; - const char *saved_tokp = parser->tokp; - - ruby_sourceline = parser->delayed_line; - parser->tokp = lex_pbeg + parser->delayed_col; - yylval.val = ripper_dispatch1(parser, ripper_token2eventid(t), parser->delayed); - parser->delayed = Qnil; - ruby_sourceline = saved_line; - parser->tokp = saved_tokp; -} -#endif /* RIPPER */ - -#include "ruby/regex.h" -#include "ruby/util.h" - -/* We remove any previous definition of `SIGN_EXTEND_CHAR', - since ours (we hope) works properly with all 
combinations of - machines, compilers, `char' and `unsigned char' argument types. - (Per Bothner suggested the basic approach.) */ -#undef SIGN_EXTEND_CHAR -#if __STDC__ -# define SIGN_EXTEND_CHAR(c) ((signed char)(c)) -#else /* not __STDC__ */ -/* As in Harbison and Steele. */ -# define SIGN_EXTEND_CHAR(c) ((((unsigned char)(c)) ^ 128) - 128) -#endif - -#define parser_mbclen() mbclen((lex_p-1),lex_pend,parser->enc) -#define parser_precise_mbclen() rb_enc_precise_mbclen((lex_p-1),lex_pend,parser->enc) -#define is_identchar(p,e,enc) (rb_enc_isalnum(*p,enc) || (*p) == '_' || !ISASCII(*p)) -#define parser_is_identchar() (!parser->eofp && is_identchar((lex_p-1),lex_pend,parser->enc)) - -#define parser_isascii() ISASCII(*(lex_p-1)) - -static int -parser_yyerror(struct parser_params *parser, const char *msg) -{ -#ifndef RIPPER - const int max_line_margin = 30; - const char *p, *pe; - char *buf; - int len, i; - - compile_error(PARSER_ARG "%s", msg); - p = lex_p; - while (lex_pbeg <= p) { - if (*p == '\n') break; - p--; - } - p++; - - pe = lex_p; - while (pe < lex_pend) { - if (*pe == '\n') break; - pe++; - } - - len = pe - p; - if (len > 4) { - char *p2; - const char *pre = "", *post = ""; - - if (len > max_line_margin * 2 + 10) { - if (lex_p - p > max_line_margin) { - p = rb_enc_prev_char(p, lex_p - max_line_margin, rb_enc_get(lex_lastline)); - pre = "..."; - } - if (pe - lex_p > max_line_margin) { - pe = rb_enc_prev_char(lex_p, lex_p + max_line_margin, rb_enc_get(lex_lastline)); - post = "..."; - } - len = pe - p; - } - buf = ALLOCA_N(char, len+2); - MEMCPY(buf, p, char, len); - buf[len] = '\0'; - rb_compile_error_append("%s%s%s", pre, buf, post); - - i = lex_p - p; - p2 = buf; pe = buf + len; - - while (p2 < pe) { - if (*p2 != '\t') *p2 = ' '; - p2++; - } - buf[i] = '^'; - buf[i+1] = '\0'; - rb_compile_error_append("%s%s", pre, buf); - } -#else - dispatch1(parse_error, STR_NEW2(msg)); -#endif /* !RIPPER */ - return 0; -} - -static void parser_prepare(struct 
parser_params *parser); - -#ifndef RIPPER -VALUE ruby_suppress_tracing(VALUE (*func)(VALUE, int), VALUE arg, int always); - -static VALUE -debug_lines(const char *f) -{ - if (rb_const_defined_at(rb_cObject, rb_intern("SCRIPT_LINES__"))) { - VALUE hash = rb_const_get_at(rb_cObject, rb_intern("SCRIPT_LINES__")); - if (TYPE(hash) == T_HASH) { - VALUE fname = rb_str_new2(f); - VALUE lines = rb_ary_new(); - rb_hash_aset(hash, fname, lines); - return lines; - } - } - return 0; -} - -static VALUE -coverage(const char *f, int n) -{ - extern VALUE rb_get_coverages(void); - VALUE coverages = rb_get_coverages(); - if (RTEST(coverages) && RBASIC(coverages)->klass == 0) { - VALUE fname = rb_str_new2(f); - VALUE lines = rb_ary_new2(n); - int i; - RBASIC(lines)->klass = 0; - for (i = 0; i < n; i++) RARRAY_PTR(lines)[i] = Qnil; - RARRAY(lines)->len = n; - rb_hash_aset(coverages, fname, lines); - return lines; - } - return 0; -} - -static int -e_option_supplied(struct parser_params *parser) -{ - if (strcmp(ruby_sourcefile, "-e") == 0) - return Qtrue; - return Qfalse; -} - -static VALUE -yycompile0(VALUE arg, int tracing) -{ - int n; - NODE *tree; - struct parser_params *parser = (struct parser_params *)arg; - - if (!compile_for_eval && rb_safe_level() == 0) { - ruby_debug_lines = debug_lines(ruby_sourcefile); - if (ruby_debug_lines && ruby_sourceline > 0) { - VALUE str = STR_NEW0(); - n = ruby_sourceline; - do { - rb_ary_push(ruby_debug_lines, str); - } while (--n); - } - - if (!e_option_supplied(parser)) { - ruby_coverage = coverage(ruby_sourcefile, ruby_sourceline); - } - } - - parser_prepare(parser); - deferred_nodes = 0; - n = yyparse((void*)parser); - ruby_debug_lines = 0; - ruby_coverage = 0; - compile_for_eval = 0; - - lex_strterm = 0; - lex_p = lex_pbeg = lex_pend = 0; - lex_lastline = lex_nextline = 0; - if (parser->nerr) { - return 0; - } - tree = ruby_eval_tree; - if (!tree) { - tree = NEW_NIL(); - } - if (ruby_eval_tree_begin) { - NODE *scope = ruby_eval_tree; - - if 
(scope) { - scope->nd_body = NEW_PRELUDE(ruby_eval_tree_begin, scope->nd_body); - } - tree = scope; - } - else { - tree = ruby_eval_tree; - } - return (VALUE)tree; -} - -static NODE* -yycompile(struct parser_params *parser, const char *f, int line) -{ - ruby_sourcefile = ruby_strdup(f); - ruby_sourceline = line - 1; - return (NODE *)ruby_suppress_tracing(yycompile0, (VALUE)parser, Qtrue); -} -#endif /* !RIPPER */ - -static VALUE -lex_get_str(struct parser_params *parser, VALUE s) -{ - char *beg, *end, *pend; - - beg = RSTRING_PTR(s); - if (lex_gets_ptr) { - if (RSTRING_LEN(s) == lex_gets_ptr) return Qnil; - beg += lex_gets_ptr; - } - pend = RSTRING_PTR(s) + RSTRING_LEN(s); - end = beg; - while (end < pend) { - if (*end++ == '\n') break; - } - lex_gets_ptr = end - RSTRING_PTR(s); - return rb_enc_str_new(beg, end - beg, rb_enc_get(s)); -} - -static VALUE -lex_getline(struct parser_params *parser) -{ - VALUE line = (*parser->parser_lex_gets)(parser, parser->parser_lex_input); -#ifndef RIPPER - if (ruby_debug_lines && !NIL_P(line)) { - rb_ary_push(ruby_debug_lines, line); - } - if (ruby_coverage && !NIL_P(line)) { - rb_ary_push(ruby_coverage, Qnil); - } -#endif - return line; -} - -#ifndef RIPPER -NODE* -rb_compile_string(const char *f, VALUE s, int line) -{ - VALUE volatile vparser = rb_parser_new(); - - return rb_parser_compile_string(vparser, f, s, line); -} - -NODE* -rb_parser_compile_string(volatile VALUE vparser, const char *f, VALUE s, int line) -{ - struct parser_params *parser; - NODE *node; - volatile VALUE tmp; - - Data_Get_Struct(vparser, struct parser_params, parser); - lex_gets = lex_get_str; - lex_gets_ptr = 0; - lex_input = s; - lex_pbeg = lex_p = lex_pend = 0; - compile_for_eval = rb_parse_in_eval(); - - node = yycompile(parser, f, line); - tmp = vparser; /* prohibit tail call optimization */ - - return node; -} - -NODE* -rb_compile_cstr(const char *f, const char *s, int len, int line) -{ - return rb_compile_string(f, rb_str_new(s, len), line); -} - 
-NODE* -rb_parser_compile_cstr(volatile VALUE vparser, const char *f, const char *s, int len, int line) -{ /* wraps the first len bytes of s in a new Ruby string and delegates to rb_parser_compile_string */ - return rb_parser_compile_string(vparser, f, rb_str_new(s, len), line); -} -/* Line-reader callback for IO input: returns rb_io_gets(io); the parser argument is not used. */ -static VALUE -lex_io_gets(struct parser_params *parser, VALUE io) -{ - return rb_io_gets(io); -} -/* Creates a new parser object with rb_parser_new() and compiles `file` through rb_parser_compile_file(); `start` is passed on unchanged. */ -NODE* -rb_compile_file(const char *f, VALUE file, int start) -{ - VALUE volatile vparser = rb_parser_new(); - - return rb_parser_compile_file(vparser, f, file, start); -} -/* Compiles input read from `file` with the given parser object: installs lex_io_gets as the line reader and `file` as the lexer input, zeroes the lex_pbeg/lex_p/lex_pend pointers, then returns the result of yycompile(parser, f, start). */ -NODE* -rb_parser_compile_file(volatile VALUE vparser, const char *f, VALUE file, int start) -{ - struct parser_params *parser; - volatile VALUE tmp; - NODE *node; - - Data_Get_Struct(vparser, struct parser_params, parser); - lex_gets = lex_io_gets; - lex_input = file; - lex_pbeg = lex_p = lex_pend = 0; - - node = yycompile(parser, f, start); - tmp = vparser; /* prohibit tail call optimization */ - - return node; -} -#endif /* !RIPPER */ -/* Bit flags that are OR-ed together to form the enum string_type values below; parser_str_new() tests STR_FUNC_REGEXP. NOTE(review): the remaining flags are presumably consulted by the string-lexing routines -- confirm against their users. */ -#define STR_FUNC_ESCAPE 0x01 -#define STR_FUNC_EXPAND 0x02 -#define STR_FUNC_REGEXP 0x04 -#define STR_FUNC_QWORDS 0x08 -#define STR_FUNC_SYMBOL 0x10 -#define STR_FUNC_INDENT 0x20 -/* String-literal kinds, each defined as a combination of STR_FUNC_* flags; str_dquote and str_xquote share the same value. */ -enum string_type { - str_squote = (0), - str_dquote = (STR_FUNC_EXPAND), - str_xquote = (STR_FUNC_EXPAND), - str_regexp = (STR_FUNC_REGEXP|STR_FUNC_ESCAPE|STR_FUNC_EXPAND), - str_sword = (STR_FUNC_QWORDS), - str_dword = (STR_FUNC_QWORDS|STR_FUNC_EXPAND), - str_ssym = (STR_FUNC_SYMBOL), - str_dsym = (STR_FUNC_SYMBOL|STR_FUNC_EXPAND) -}; -/* Builds a Ruby string from the n bytes at p, tagged with encoding enc. Unless func has STR_FUNC_REGEXP set or enc is not ASCII-compatible, the tag is then adjusted: content whose coderange is 7-bit is re-associated with US-ASCII; otherwise, when enc0 is US-ASCII and enc is not UTF-8, it is re-associated with ASCII-8BIT. Returns the string. */ -static VALUE -parser_str_new(const char *p, long n, rb_encoding *enc, int func, rb_encoding *enc0) -{ - VALUE str; - - str = rb_enc_str_new(p, n, enc); - if (!(func & STR_FUNC_REGEXP) && rb_enc_asciicompat(enc)) { - if (rb_enc_str_coderange(str) == ENC_CODERANGE_7BIT) { - rb_enc_associate(str, rb_usascii_encoding()); - } - else if (enc0 == rb_usascii_encoding() && enc != rb_utf8_encoding()) { - rb_enc_associate(str, rb_ascii8bit_encoding()); - } - } - - return str; -} -/* Sets the parser's parser_lex_p to parser_lex_pend, i.e. moves the read position to the end pointer. */ -#define lex_goto_eol(parser) (parser->parser_lex_p = parser->parser_lex_pend) - -static inline 
int -parser_nextc(struct parser_params *parser) -{ - int c; - - if (lex_p == lex_pend) { - VALUE v = lex_nextline; - lex_nextline = 0; - if (!v) { - if (parser->eofp) - return -1; - - if (!lex_input || NIL_P(v = lex_getline(parser))) { - parser->eofp = Qtrue; - lex_goto_eol(parser); - return -1; - } - } - { -#ifdef RIPPER - if (parser->tokp < lex_pend) { - if (NIL_P(parser->delayed)) { - parser->delayed = rb_str_buf_new(1024); - rb_str_buf_cat(parser->delayed, - parser->tokp, lex_pend - parser->tokp); - parser->delayed_line = ruby_sourceline; - parser->delayed_col = parser->tokp - lex_pbeg; - } - else { - rb_str_buf_cat(parser->delayed, - parser->tokp, lex_pend - parser->tokp); - } - } -#endif - if (heredoc_end > 0) { - ruby_sourceline = heredoc_end; - heredoc_end = 0; - } - ruby_sourceline++; - parser->line_count++; - lex_pbeg = lex_p = RSTRING_PTR(v); - lex_pend = lex_p + RSTRING_LEN(v); -#ifdef RIPPER - ripper_flush(parser); -#endif - lex_lastline = v; - } - } - c = (unsigned char)*lex_p++; - if (c == '\r' && lex_p < lex_pend && *lex_p == '\n') { - lex_p++; - c = '\n'; - } - - return c; -} - -static void -parser_pushback(struct parser_params *parser, int c) -{ - if (c == -1) return; - lex_p--; - if (lex_p > lex_pbeg && lex_p[0] == '\n' && lex_p[-1] == '\r') { - lex_p--; - } -} - -#define was_bol() (lex_p == lex_pbeg + 1) -#define peek(c) (lex_p != lex_pend && (c) == *lex_p) - -#define tokfix() (tokenbuf[tokidx]='\0') -#define tok() tokenbuf -#define toklen() tokidx -#define toklast() (tokidx>0?tokenbuf[tokidx-1]:0) - -static char* -parser_newtok(struct parser_params *parser) -{ - tokidx = 0; - if (!tokenbuf) { - toksiz = 60; - tokenbuf = ALLOC_N(char, 60); - } - if (toksiz > 4096) { - toksiz = 60; - REALLOC_N(tokenbuf, char, 60); - } - return tokenbuf; -} - -static char * -parser_tokspace(struct parser_params *parser, int n) -{ - tokidx += n; - - if (tokidx >= toksiz) { - do {toksiz *= 2;} while (toksiz < tokidx); - REALLOC_N(tokenbuf, char, toksiz); - } - 
return &tokenbuf[tokidx-n]; -} - -static void -parser_tokadd(struct parser_params *parser, int c) -{ - tokenbuf[tokidx++] = (char)c; - if (tokidx >= toksiz) { - toksiz *= 2; - REALLOC_N(tokenbuf, char, toksiz); - } -} - -static int -parser_tok_hex(struct parser_params *parser, int *numlen) -{ - int c; - - c = scan_hex(lex_p, 2, numlen); - if (!*numlen) { - yyerror("invalid hex escape"); - return 0; - } - lex_p += *numlen; - return c; -} - -#define tokcopy(n) memcpy(tokspace(n), lex_p - (n), (n)) - -static int -parser_tokadd_utf8(struct parser_params *parser, rb_encoding **encp, - int string_literal, int symbol_literal, int regexp_literal) -{ - /* - * If string_literal is true, then we allow multiple codepoints - * in \u{}, and add the codepoints to the current token. - * Otherwise we're parsing a character literal and return a single - * codepoint without adding it - */ - - int codepoint; - int numlen; - - if (regexp_literal) { tokadd('\\'); tokadd('u'); } - - if (peek('{')) { /* handle \u{...} form */ - do { - if (regexp_literal) { tokadd(*lex_p); } - nextc(); - codepoint = scan_hex(lex_p, 6, &numlen); - if (numlen == 0) { - yyerror("invalid Unicode escape"); - return 0; - } - if (codepoint > 0x10ffff) { - yyerror("invalid Unicode codepoint (too large)"); - return 0; - } - lex_p += numlen; - if (regexp_literal) { - tokcopy(numlen); - } - else if (codepoint >= 0x80) { - *encp = UTF8_ENC(); - if (string_literal) tokaddmbc(codepoint, *encp); - } - else if (string_literal) { - if (codepoint == 0 && symbol_literal) { - yyerror("symbol cannot contain '\\u{0}'"); - return 0; - } - - tokadd(codepoint); - } - } while (string_literal && (peek(' ') || peek('\t'))); - - if (!peek('}')) { - yyerror("unterminated Unicode escape"); - return 0; - } - - if (regexp_literal) { tokadd('}'); } - nextc(); - } - else { /* handle \uxxxx form */ - codepoint = scan_hex(lex_p, 4, &numlen); - if (numlen < 4) { - yyerror("invalid Unicode escape"); - return 0; - } - lex_p += 4; - if 
(regexp_literal) { - tokcopy(4); - } - else if (codepoint >= 0x80) { - *encp = UTF8_ENC(); - if (string_literal) tokaddmbc(codepoint, *encp); - } - else if (string_literal) { - if (codepoint == 0 && symbol_literal) { - yyerror("symbol cannot contain '\\u0000'"); - return 0; - } - - tokadd(codepoint); - } - } - - return codepoint; -} - -#define ESCAPE_CONTROL 1 -#define ESCAPE_META 2 - -static int -parser_read_escape(struct parser_params *parser, int flags, - rb_encoding **encp) -{ - int c; - int numlen; - - switch (c = nextc()) { - case '\\': /* Backslash */ - return c; - - case 'n': /* newline */ - return '\n'; - - case 't': /* horizontal tab */ - return '\t'; - - case 'r': /* carriage-return */ - return '\r'; - - case 'f': /* form-feed */ - return '\f'; - - case 'v': /* vertical tab */ - return '\13'; - - case 'a': /* alarm(bell) */ - return '\007'; - - case 'e': /* escape */ - return 033; - - case '0': case '1': case '2': case '3': /* octal constant */ - case '4': case '5': case '6': case '7': - if (flags & (ESCAPE_CONTROL|ESCAPE_META)) goto eof; - { - int numlen; - - pushback(c); - c = scan_oct(lex_p, 3, &numlen); - lex_p += numlen; - } - return c; - - case 'x': /* hex constant */ - if (flags & (ESCAPE_CONTROL|ESCAPE_META)) goto eof; - c = tok_hex(&numlen); - if (numlen == 0) return 0; - return c; - - case 'b': /* backspace */ - return '\010'; - - case 's': /* space */ - return ' '; - - case 'M': - if (flags & ESCAPE_META) goto eof; - if ((c = nextc()) != '-') { - pushback(c); - goto eof; - } - if ((c = nextc()) == '\\') { - return read_escape(flags|ESCAPE_META, encp) | 0x80; - } - else if (c == -1 || !ISASCII(c)) goto eof; - else { - return ((c & 0xff) | 0x80); - } - - case 'C': - if ((c = nextc()) != '-') { - pushback(c); - goto eof; - } - case 'c': - if (flags & ESCAPE_CONTROL) goto eof; - if ((c = nextc())== '\\') { - c = read_escape(flags|ESCAPE_CONTROL, encp); - } - else if (c == '?') - return 0177; - else if (c == -1 || !ISASCII(c)) goto eof; - return c 
& 0x9f; - - eof: - case -1: - yyerror("Invalid escape character syntax"); - return '\0'; - - default: - return c; - } -} - -static void -parser_tokaddmbc(struct parser_params *parser, int c, rb_encoding *enc) -{ - int len = rb_enc_codelen(c, enc); - rb_enc_mbcput(c, tokspace(len), enc); -} - -static int -parser_tokadd_escape(struct parser_params *parser, rb_encoding **encp) -{ - int c; - int flags = 0; - - first: - switch (c = nextc()) { - case '\n': - return 0; /* just ignore */ - - case '0': case '1': case '2': case '3': /* octal constant */ - case '4': case '5': case '6': case '7': - if (flags & (ESCAPE_CONTROL|ESCAPE_META)) goto eof; - { - int numlen; - int oct; - - oct = scan_oct(--lex_p, 3, &numlen); - if (numlen == 0) goto eof; - lex_p += numlen; - tokcopy(numlen + 1); - } - return 0; - - case 'x': /* hex constant */ - if (flags & (ESCAPE_CONTROL|ESCAPE_META)) goto eof; - { - int numlen; - int hex; - - hex = tok_hex(&numlen); - if (numlen == 0) goto eof; - tokcopy(numlen + 2); - } - return 0; - - case 'M': - if (flags & ESCAPE_META) goto eof; - if ((c = nextc()) != '-') { - pushback(c); - goto eof; - } - tokcopy(3); - flags |= ESCAPE_META; - goto escaped; - - case 'C': - if (flags & ESCAPE_CONTROL) goto eof; - if ((c = nextc()) != '-') { - pushback(c); - goto eof; - } - tokcopy(3); - goto escaped; - - case 'c': - if (flags & ESCAPE_CONTROL) goto eof; - tokcopy(2); - flags |= ESCAPE_CONTROL; - escaped: - if ((c = nextc()) == '\\') { - goto first; - } - else if (c == -1) goto eof; - tokadd(c); - return 0; - - eof: - case -1: - yyerror("Invalid escape character syntax"); - return -1; - - default: - tokadd('\\'); - tokadd(c); - } - return 0; -} - -extern int rb_char_to_option_kcode(int c, int *option, int *kcode); - -static int -parser_regx_options(struct parser_params *parser) -{ - int kcode = 0; - int options = 0; - int c, opt, kc; - - newtok(); - while (c = nextc(), ISALPHA(c)) { - if (c == 'o') { - options |= RE_OPTION_ONCE; - } - else if 
(rb_char_to_option_kcode(c, &opt, &kc)) { - options |= opt; - if (kc >= 0) kcode = c; - } - else { - tokadd(c); - } - } - pushback(c); - if (toklen()) { - tokfix(); - compile_error(PARSER_ARG "unknown regexp option%s - %s", - toklen() > 1 ? "s" : "", tok()); - } - return options | RE_OPTION_ENCODING(kcode); -} - -static void -dispose_string(VALUE str) -{ - /* TODO: should use another API? */ - if (RBASIC(str)->flags & RSTRING_NOEMBED) - xfree(RSTRING_PTR(str)); - rb_gc_force_recycle(str); -} - -static int -parser_tokadd_mbchar(struct parser_params *parser, int c) -{ - int len = parser_precise_mbclen(); - if (!MBCLEN_CHARFOUND_P(len)) { - compile_error(PARSER_ARG "invalid multibyte char"); - return -1; - } - tokadd(c); - lex_p += --len; - if (len > 0) tokcopy(len); - return c; -} - -#define tokadd_mbchar(c) parser_tokadd_mbchar(parser, c) - -static int -parser_tokadd_string(struct parser_params *parser, - int func, int term, int paren, long *nest, - rb_encoding **encp) -{ - int c; - int has_nonascii = 0; - rb_encoding *enc = *encp; - char *errbuf = 0; - static const char mixed_msg[] = "%s mixed within %s source"; - -#define mixed_error(enc1, enc2) if (!errbuf) { \ - int len = sizeof(mixed_msg) - 4; \ - len += strlen(rb_enc_name(enc1)); \ - len += strlen(rb_enc_name(enc2)); \ - errbuf = ALLOCA_N(char, len); \ - snprintf(errbuf, len, mixed_msg, \ - rb_enc_name(enc1), \ - rb_enc_name(enc2)); \ - yyerror(errbuf); \ - } -#define mixed_escape(beg, enc1, enc2) do { \ - const char *pos = lex_p; \ - lex_p = beg; \ - mixed_error(enc1, enc2); \ - lex_p = pos; \ - } while (0) - - while ((c = nextc()) != -1) { - if (paren && c == paren) { - ++*nest; - } - else if (c == term) { - if (!nest || !*nest) { - pushback(c); - break; - } - --*nest; - } - else if ((func & STR_FUNC_EXPAND) && c == '#' && lex_p < lex_pend) { - int c2 = *lex_p; - if (c2 == '$' || c2 == '@' || c2 == '{') { - pushback(c); - break; - } - } - else if (c == '\\') { - const char *beg = lex_p - 1; - c = nextc(); - 
switch (c) { - case '\n': - if (func & STR_FUNC_QWORDS) break; - if (func & STR_FUNC_EXPAND) continue; - tokadd('\\'); - break; - - case '\\': - if (func & STR_FUNC_ESCAPE) tokadd(c); - break; - - case 'u': - if ((func & STR_FUNC_EXPAND) == 0) { - tokadd('\\'); - break; - } - parser_tokadd_utf8(parser, &enc, 1, - func & STR_FUNC_SYMBOL, - func & STR_FUNC_REGEXP); - if (has_nonascii && enc != *encp) { - mixed_escape(beg, enc, *encp); - } - continue; - - default: - if (func & STR_FUNC_REGEXP) { - pushback(c); - if ((c = tokadd_escape(&enc)) < 0) - return -1; - if (has_nonascii && enc != *encp) { - mixed_escape(beg, enc, *encp); - } - continue; - } - else if (func & STR_FUNC_EXPAND) { - pushback(c); - if (func & STR_FUNC_ESCAPE) tokadd('\\'); - c = read_escape(0, &enc); - } - else if ((func & STR_FUNC_QWORDS) && ISSPACE(c)) { - /* ignore backslashed spaces in %w */ - } - else if (c != term && !(paren && c == paren)) { - tokadd('\\'); - } - } - } - else if (!parser_isascii()) { - has_nonascii = 1; - if (enc != *encp) { - mixed_error(enc, *encp); - continue; - } - if (tokadd_mbchar(c) == -1) return -1; - continue; - } - else if ((func & STR_FUNC_QWORDS) && ISSPACE(c)) { - pushback(c); - break; - } - if (!c && (func & STR_FUNC_SYMBOL)) { - func &= ~STR_FUNC_SYMBOL; - compile_error(PARSER_ARG "symbol cannot contain '\\0'"); - continue; - } - if (c & 0x80) { - has_nonascii = 1; - if (enc != *encp) { - mixed_error(enc, *encp); - continue; - } - } - tokadd(c); - } - *encp = enc; - return c; -} - -#define NEW_STRTERM(func, term, paren) \ - rb_node_newnode(NODE_STRTERM, (func), (term) | ((paren) << (CHAR_BIT * 2)), 0) - -static int -parser_parse_string(struct parser_params *parser, NODE *quote) -{ - int func = quote->nd_func; - int term = nd_term(quote); - int paren = nd_paren(quote); - int c, space = 0; - rb_encoding *enc = parser->enc; - - if (func == -1) return tSTRING_END; - c = nextc(); - if ((func & STR_FUNC_QWORDS) && ISSPACE(c)) { - do {c = nextc();} while 
(ISSPACE(c)); - space = 1; - } - if (c == term && !quote->nd_nest) { - if (func & STR_FUNC_QWORDS) { - quote->nd_func = -1; - return ' '; - } - if (!(func & STR_FUNC_REGEXP)) return tSTRING_END; - set_yylval_num(regx_options()); - return tREGEXP_END; - } - if (space) { - pushback(c); - return ' '; - } - newtok(); - if ((func & STR_FUNC_EXPAND) && c == '#') { - switch (c = nextc()) { - case '$': - case '@': - pushback(c); - return tSTRING_DVAR; - case '{': - return tSTRING_DBEG; - } - tokadd('#'); - } - pushback(c); - if (tokadd_string(func, term, paren, "e->nd_nest, - &enc) == -1) { - ruby_sourceline = nd_line(quote); - if (func & STR_FUNC_REGEXP) { - if (parser->eofp) - compile_error(PARSER_ARG "unterminated regexp meets end of file"); - return tREGEXP_END; - } - else { - if (parser->eofp) - compile_error(PARSER_ARG "unterminated string meets end of file"); - return tSTRING_END; - } - } - - tokfix(); - set_yylval_str(STR_NEW3(tok(), toklen(), enc, func)); - return tSTRING_CONTENT; -} - -static int -parser_heredoc_identifier(struct parser_params *parser) -{ - int c = nextc(), term, func = 0, len; - - if (c == '-') { - c = nextc(); - func = STR_FUNC_INDENT; - } - switch (c) { - case '\'': - func |= str_squote; goto quoted; - case '"': - func |= str_dquote; goto quoted; - case '`': - func |= str_xquote; - quoted: - newtok(); - tokadd(func); - term = c; - while ((c = nextc()) != -1 && c != term) { - if (tokadd_mbchar(c) == -1) return 0; - } - if (c == -1) { - compile_error(PARSER_ARG "unterminated here document identifier"); - return 0; - } - break; - - default: - if (!parser_is_identchar()) { - pushback(c); - if (func & STR_FUNC_INDENT) { - pushback('-'); - } - return 0; - } - newtok(); - term = '"'; - tokadd(func |= str_dquote); - do { - if (tokadd_mbchar(c) == -1) return 0; - } while ((c = nextc()) != -1 && parser_is_identchar()); - pushback(c); - break; - } - - tokfix(); -#ifdef RIPPER - ripper_dispatch_scan_event(parser, tHEREDOC_BEG); -#endif - len = lex_p - 
lex_pbeg; - lex_goto_eol(parser); - lex_strterm = rb_node_newnode(NODE_HEREDOC, - STR_NEW(tok(), toklen()), /* nd_lit */ - len, /* nd_nth */ - lex_lastline); /* nd_orig */ - nd_set_line(lex_strterm, ruby_sourceline); -#ifdef RIPPER - ripper_flush(parser); -#endif - return term == '`' ? tXSTRING_BEG : tSTRING_BEG; -} - -static void -parser_heredoc_restore(struct parser_params *parser, NODE *here) -{ - VALUE line; - -#ifdef RIPPER - if (!NIL_P(parser->delayed)) - ripper_dispatch_delayed_token(parser, tSTRING_CONTENT); - lex_goto_eol(parser); - ripper_dispatch_scan_event(parser, tHEREDOC_END); -#endif - line = here->nd_orig; - lex_lastline = line; - lex_pbeg = RSTRING_PTR(line); - lex_pend = lex_pbeg + RSTRING_LEN(line); - lex_p = lex_pbeg + here->nd_nth; - heredoc_end = ruby_sourceline; - ruby_sourceline = nd_line(here); - dispose_string(here->nd_lit); - rb_gc_force_recycle((VALUE)here); -#ifdef RIPPER - ripper_flush(parser); -#endif -} - -static int -parser_whole_match_p(struct parser_params *parser, - const char *eos, int len, int indent) -{ - const char *p = lex_pbeg; - int n; - - if (indent) { - while (*p && ISSPACE(*p)) p++; - } - n= lex_pend - (p + len); - if (n < 0 || (n > 0 && p[len] != '\n' && p[len] != '\r')) return Qfalse; - if (strncmp(eos, p, len) == 0) return Qtrue; - return Qfalse; -} - -static int -parser_here_document(struct parser_params *parser, NODE *here) -{ - int c, func, indent = 0; - const char *eos, *p, *pend; - long len; - VALUE str = 0; - - eos = RSTRING_PTR(here->nd_lit); - len = RSTRING_LEN(here->nd_lit) - 1; - indent = (func = *eos++) & STR_FUNC_INDENT; - - if ((c = nextc()) == -1) { - error: - compile_error(PARSER_ARG "can't find string \"%s\" anywhere before EOF", eos); - restore: - heredoc_restore(lex_strterm); - lex_strterm = 0; - return 0; - } - if (was_bol() && whole_match_p(eos, len, indent)) { - heredoc_restore(lex_strterm); - return tSTRING_END; - } - - if (!(func & STR_FUNC_EXPAND)) { - do { - p = RSTRING_PTR(lex_lastline); - 
pend = lex_pend; - if (pend > p) { - switch (pend[-1]) { - case '\n': - if (--pend == p || pend[-1] != '\r') { - pend++; - break; - } - case '\r': - --pend; - } - } - if (str) - rb_str_cat(str, p, pend - p); - else - str = STR_NEW(p, pend - p); - if (pend < lex_pend) rb_str_cat(str, "\n", 1); - lex_goto_eol(parser); - if (nextc() == -1) { - if (str) dispose_string(str); - goto error; - } - } while (!whole_match_p(eos, len, indent)); - } - else { - /* int mb = ENC_CODERANGE_7BIT, *mbp = &mb;*/ - rb_encoding *enc = parser->enc; - newtok(); - if (c == '#') { - switch (c = nextc()) { - case '$': - case '@': - pushback(c); - return tSTRING_DVAR; - case '{': - return tSTRING_DBEG; - } - tokadd('#'); - } - do { - pushback(c); - if ((c = tokadd_string(func, '\n', 0, NULL, &enc)) == -1) { - if (parser->eofp) goto error; - goto restore; - } - if (c != '\n') { - set_yylval_str(STR_NEW3(tok(), toklen(), enc, func)); - return tSTRING_CONTENT; - } - tokadd(nextc()); - /* if (mbp && mb == ENC_CODERANGE_UNKNOWN) mbp = 0;*/ - if ((c = nextc()) == -1) goto error; - } while (!whole_match_p(eos, len, indent)); - str = STR_NEW3(tok(), toklen(), enc, func); - } - heredoc_restore(lex_strterm); - lex_strterm = NEW_STRTERM(-1, 0, 0); - set_yylval_str(str); - return tSTRING_CONTENT; -} - -#include "lex.c" - -#ifndef RIPPER -static void -arg_ambiguous_gen(struct parser_params *parser) -{ - rb_warning0("ambiguous first argument; put parentheses or even spaces"); -} -#else -static void -arg_ambiguous_gen(struct parser_params *parser) -{ - dispatch0(arg_ambiguous); -} -#endif -#define arg_ambiguous() arg_ambiguous_gen(parser) - -static int -lvar_defined_gen(struct parser_params *parser, ID id) -{ -#ifndef RIPPER - return (dyna_in_block() && dvar_defined(id)) || local_id(id); -#else - return 0; -#endif -} - -/* emacsen -*- hack */ -static int -parser_encode_length(struct parser_params *parser, const char *name, int len) -{ - int nlen; - - if (len > 5 && name[nlen = len - 5] == '-') { - if 
(rb_memcicmp(name + nlen + 1, "unix", 4) == 0) - return nlen; - } - if (len > 4 && name[nlen = len - 5] == '-') { - if (rb_memcicmp(name + nlen + 1, "dos", 3) == 0) - return nlen; - if (rb_memcicmp(name + nlen + 1, "mac", 3) == 0) - return nlen; - } - return len; -} - -static void -parser_set_encode(struct parser_params *parser, const char *name) -{ - int idx = rb_enc_find_index(name); - rb_encoding *enc; - - if (idx < 0) { - rb_raise(rb_eArgError, "unknown encoding name: %s", name); - } - enc = rb_enc_from_index(idx); - if (!rb_enc_asciicompat(enc)) { - rb_raise(rb_eArgError, "%s is not ASCII compatible", rb_enc_name(enc)); - } - parser->enc = enc; -} - -#ifndef RIPPER -typedef int (*rb_magic_comment_length_t)(struct parser_params *parser, const char *name, int len); -typedef void (*rb_magic_comment_setter_t)(struct parser_params *parser, const char *name, const char *val); - -static void -magic_comment_encoding(struct parser_params *parser, const char *name, const char *val) -{ - if (parser->line_count != (parser->has_shebang ? 
2 : 1)) - return; - parser_set_encode(parser, val); -} - -struct magic_comment { - const char *name; - rb_magic_comment_setter_t func; - rb_magic_comment_length_t length; -}; - -static const struct magic_comment magic_comments[] = { - {"coding", magic_comment_encoding, parser_encode_length}, - {"encoding", magic_comment_encoding, parser_encode_length}, -}; -#endif - -static const char * -magic_comment_marker(const char *str, int len) -{ - int i = 2; - - while (i < len) { - switch (str[i]) { - case '-': - if (str[i-1] == '*' && str[i-2] == '-') { - return str + i + 1; - } - i += 2; - break; - case '*': - if (i + 1 >= len) return 0; - if (str[i+1] != '-') { - i += 4; - } - else if (str[i-1] != '-') { - i += 2; - } - else { - return str + i + 2; - } - break; - default: - i += 3; - break; - } - } - return 0; -} - -static int -parser_magic_comment(struct parser_params *parser, const char *str, int len) -{ - VALUE name = 0, val = 0; - const char *beg, *end, *vbeg, *vend; -#define str_copy(_s, _p, _n) ((_s) \ - ? 
(rb_str_resize((_s), (_n)), \ - MEMCPY(RSTRING_PTR(_s), (_p), char, (_n)), (_s)) \ - : ((_s) = STR_NEW((_p), (_n)))) - - if (len <= 7) return Qfalse; - if (!(beg = magic_comment_marker(str, len))) return Qfalse; - if (!(end = magic_comment_marker(beg, str + len - beg))) return Qfalse; - str = beg; - len = end - beg - 3; - - /* %r"([^\\s\'\":;]+)\\s*:\\s*(\"(?:\\\\.|[^\"])*\"|[^\"\\s;]+)[\\s;]*" */ - while (len > 0) { -#ifndef RIPPER - const struct magic_comment *p = magic_comments; -#endif - int n = 0; - - for (; len > 0 && *str; str++, --len) { - switch (*str) { - case '\'': case '"': case ':': case ';': - continue; - } - if (!ISSPACE(*str)) break; - } - for (beg = str; len > 0; str++, --len) { - switch (*str) { - case '\'': case '"': case ':': case ';': - break; - default: - if (ISSPACE(*str)) break; - continue; - } - break; - } - for (end = str; len > 0 && ISSPACE(*str); str++, --len); - if (!len) break; - if (*str != ':') continue; - - do str++; while (--len > 0 && ISSPACE(*str)); - if (!len) break; - if (*str == '"') { - for (vbeg = ++str; --len > 0 && *str != '"'; str++) { - if (*str == '\\') { - --len; - ++str; - } - } - vend = str; - if (len) { - --len; - ++str; - } - } - else { - for (vbeg = str; len > 0 && *str != '"' && *str != ';' && !ISSPACE(*str); --len, str++); - vend = str; - } - while (len > 0 && (*str == ';' || ISSPACE(*str))) --len, str++; - - n = end - beg; - str_copy(name, beg, n); -#ifndef RIPPER - do { - if (STRNCASECMP(p->name, RSTRING_PTR(name), n) == 0) { - n = vend - vbeg; - if (p->length) { - n = (*p->length)(parser, vbeg, n); - } - str_copy(val, vbeg, n); - (*p->func)(parser, RSTRING_PTR(name), RSTRING_PTR(val)); - break; - } - } while (++p < magic_comments + sizeof(magic_comments) / sizeof(*p)); -#else - dispatch2(magic_comment, name, val); -#endif - } - - return Qtrue; -} - -static void -set_file_encoding(struct parser_params *parser, const char *str, const char *send) -{ - int sep = 0; - const char *beg = str; - VALUE s; - - for (;;) 
{ - if (send - str <= 6) return; - switch (str[6]) { - case 'C': case 'c': str += 6; continue; - case 'O': case 'o': str += 5; continue; - case 'D': case 'd': str += 4; continue; - case 'I': case 'i': str += 3; continue; - case 'N': case 'n': str += 2; continue; - case 'G': case 'g': str += 1; continue; - case '=': case ':': - sep = 1; - str += 6; - break; - default: - str += 6; - if (ISSPACE(*str)) break; - continue; - } - if (STRNCASECMP(str-6, "coding", 6) == 0) break; - } - for (;;) { - do { - if (++str >= send) return; - } while (ISSPACE(*str)); - if (sep) break; - if (*str != '=' && *str != ':') return; - sep = 1; - str++; - } - beg = str; - while ((*str == '-' || *str == '_' || ISALNUM(*str)) && ++str < send); - s = rb_str_new(beg, parser_encode_length(parser, beg, str - beg)); - parser_set_encode(parser, RSTRING_PTR(s)); - rb_str_resize(s, 0); -} - -static void -parser_prepare(struct parser_params *parser) -{ - int c = nextc(); - switch (c) { - case '#': - if (peek('!')) parser->has_shebang = 1; - break; - case 0xef: /* UTF-8 BOM marker */ - if (lex_pend - lex_p >= 2 && - (unsigned char)lex_p[0] == 0xbb && - (unsigned char)lex_p[1] == 0xbf) { - parser_set_encode(parser, "UTF-8"); - lex_p += 2; - lex_pbeg = lex_p; - return; - } - break; - case EOF: - return; - } - pushback(c); - parser->enc = rb_enc_get(lex_lastline); -} - -#define IS_ARG() (lex_state == EXPR_ARG || lex_state == EXPR_CMDARG) -#define IS_BEG() (lex_state == EXPR_BEG || lex_state == EXPR_MID || lex_state == EXPR_VALUE || lex_state == EXPR_CLASS) - -static int -parser_yylex(struct parser_params *parser) -{ - register int c; - int space_seen = 0; - int cmd_state; - enum lex_state_e last_state; - rb_encoding *enc; - int mb; -#ifdef RIPPER - int fallthru = Qfalse; -#endif - - if (lex_strterm) { - int token; - if (nd_type(lex_strterm) == NODE_HEREDOC) { - token = here_document(lex_strterm); - if (token == tSTRING_END) { - lex_strterm = 0; - lex_state = EXPR_ENDARG; - } - } - else { - token = 
parse_string(lex_strterm); - if (token == tSTRING_END || token == tREGEXP_END) { - rb_gc_force_recycle((VALUE)lex_strterm); - lex_strterm = 0; - lex_state = EXPR_ENDARG; - } - } - return token; - } - cmd_state = command_start; - command_start = Qfalse; - retry: - switch (c = nextc()) { - case '\0': /* NUL */ - case '\004': /* ^D */ - case '\032': /* ^Z */ - case -1: /* end of script. */ - return 0; - - /* white spaces */ - case ' ': case '\t': case '\f': case '\r': - case '\13': /* '\v' */ - space_seen++; -#ifdef RIPPER - while ((c = nextc())) { - switch (c) { - case ' ': case '\t': case '\f': case '\r': - case '\13': /* '\v' */ - break; - default: - goto outofloop; - } - } - outofloop: - pushback(c); - ripper_dispatch_scan_event(parser, tSP); -#endif - goto retry; - - case '#': /* it's a comment */ - /* no magic_comment in shebang line */ - if (parser->line_count == (parser->has_shebang ? 2 : 1) - && (lex_p - lex_pbeg) == 1) { - if (!parser_magic_comment(parser, lex_p, lex_pend - lex_p)) { - set_file_encoding(parser, lex_p, lex_pend); - } - } - lex_p = lex_pend; -#ifdef RIPPER - ripper_dispatch_scan_event(parser, tCOMMENT); - fallthru = Qtrue; -#endif - /* fall through */ - case '\n': - switch (lex_state) { - case EXPR_BEG: - case EXPR_FNAME: - case EXPR_DOT: - case EXPR_CLASS: - case EXPR_VALUE: -#ifdef RIPPER - if (!fallthru) { - ripper_dispatch_scan_event(parser, tIGNORED_NL); - } - fallthru = Qfalse; -#endif - goto retry; - default: - break; - } - while ((c = nextc())) { - switch (c) { - case ' ': case '\t': case '\f': case '\r': - case '\13': /* '\v' */ - space_seen++; - break; - case '.': { - if ((c = nextc()) != '.') { - pushback(c); - pushback('.'); - goto retry; - } - } - default: - --ruby_sourceline; - lex_nextline = lex_lastline; - case -1: /* EOF no decrement*/ - lex_goto_eol(parser); -#ifdef RIPPER - if (c != -1) { - parser->tokp = lex_p; - } -#endif - goto normal_newline; - } - } - normal_newline: - command_start = Qtrue; - lex_state = EXPR_BEG; - 
return '\n'; - - case '*': - if ((c = nextc()) == '*') { - if ((c = nextc()) == '=') { - set_yylval_id(tPOW); - lex_state = EXPR_BEG; - return tOP_ASGN; - } - pushback(c); - c = tPOW; - } - else { - if (c == '=') { - set_yylval_id('*'); - lex_state = EXPR_BEG; - return tOP_ASGN; - } - pushback(c); - if (IS_ARG() && space_seen && !ISSPACE(c)) { - rb_warning0("`*' interpreted as argument prefix"); - c = tSTAR; - } - else if (IS_BEG()) { - c = tSTAR; - } - else { - c = '*'; - } - } - switch (lex_state) { - case EXPR_FNAME: case EXPR_DOT: - lex_state = EXPR_ARG; break; - default: - lex_state = EXPR_BEG; break; - } - return c; - - case '!': - c = nextc(); - if (lex_state == EXPR_FNAME || lex_state == EXPR_DOT) { - lex_state = EXPR_ARG; - if (c == '@') { - return '!'; - } - } - else { - lex_state = EXPR_BEG; - } - if (c == '=') { - return tNEQ; - } - if (c == '~') { - return tNMATCH; - } - pushback(c); - return '!'; - - case '=': - if (was_bol()) { - /* skip embedded rd document */ - if (strncmp(lex_p, "begin", 5) == 0 && ISSPACE(lex_p[5])) { -#ifdef RIPPER - int first_p = Qtrue; - - lex_goto_eol(parser); - ripper_dispatch_scan_event(parser, tEMBDOC_BEG); -#endif - for (;;) { - lex_goto_eol(parser); -#ifdef RIPPER - if (!first_p) { - ripper_dispatch_scan_event(parser, tEMBDOC); - } - first_p = Qfalse; -#endif - c = nextc(); - if (c == -1) { - compile_error(PARSER_ARG "embedded document meets end of file"); - return 0; - } - if (c != '=') continue; - if (strncmp(lex_p, "end", 3) == 0 && - (lex_p + 3 == lex_pend || ISSPACE(lex_p[3]))) { - break; - } - } - lex_goto_eol(parser); -#ifdef RIPPER - ripper_dispatch_scan_event(parser, tEMBDOC_END); -#endif - goto retry; - } - } - - switch (lex_state) { - case EXPR_FNAME: case EXPR_DOT: - lex_state = EXPR_ARG; break; - default: - lex_state = EXPR_BEG; break; - } - if ((c = nextc()) == '=') { - if ((c = nextc()) == '=') { - return tEQQ; - } - pushback(c); - return tEQ; - } - if (c == '~') { - return tMATCH; - } - else if (c == '>') 
{ - return tASSOC; - } - pushback(c); - return '='; - - case '<': - c = nextc(); - if (c == '<' && - lex_state != EXPR_END && - lex_state != EXPR_DOT && - lex_state != EXPR_ENDARG && - lex_state != EXPR_CLASS && - (!IS_ARG() || space_seen)) { - int token = heredoc_identifier(); - if (token) return token; - } - switch (lex_state) { - case EXPR_FNAME: case EXPR_DOT: - lex_state = EXPR_ARG; break; - default: - lex_state = EXPR_BEG; break; - } - if (c == '=') { - if ((c = nextc()) == '>') { - return tCMP; - } - pushback(c); - return tLEQ; - } - if (c == '<') { - if ((c = nextc()) == '=') { - set_yylval_id(tLSHFT); - lex_state = EXPR_BEG; - return tOP_ASGN; - } - pushback(c); - return tLSHFT; - } - pushback(c); - return '<'; - - case '>': - switch (lex_state) { - case EXPR_FNAME: case EXPR_DOT: - lex_state = EXPR_ARG; break; - default: - lex_state = EXPR_BEG; break; - } - if ((c = nextc()) == '=') { - return tGEQ; - } - if (c == '>') { - if ((c = nextc()) == '=') { - set_yylval_id(tRSHFT); - lex_state = EXPR_BEG; - return tOP_ASGN; - } - pushback(c); - return tRSHFT; - } - pushback(c); - return '>'; - - case '"': - lex_strterm = NEW_STRTERM(str_dquote, '"', 0); - return tSTRING_BEG; - - case '`': - if (lex_state == EXPR_FNAME) { - lex_state = EXPR_END; - return c; - } - if (lex_state == EXPR_DOT) { - if (cmd_state) - lex_state = EXPR_CMDARG; - else - lex_state = EXPR_ARG; - return c; - } - lex_strterm = NEW_STRTERM(str_xquote, '`', 0); - return tXSTRING_BEG; - - case '\'': - lex_strterm = NEW_STRTERM(str_squote, '\'', 0); - return tSTRING_BEG; - - case '?': - if (lex_state == EXPR_END || - lex_state == EXPR_ENDARG) { - lex_state = EXPR_VALUE; - return '?'; - } - c = nextc(); - if (c == -1) { - compile_error(PARSER_ARG "incomplete character syntax"); - return 0; - } - if (rb_enc_isspace(c, parser->enc)) { - if (!IS_ARG()) { - int c2 = 0; - switch (c) { - case ' ': - c2 = 's'; - break; - case '\n': - c2 = 'n'; - break; - case '\t': - c2 = 't'; - break; - case '\v': - c2 = 
'v'; - break; - case '\r': - c2 = 'r'; - break; - case '\f': - c2 = 'f'; - break; - } - if (c2) { - rb_warnI("invalid character syntax; use ?\\%c", c2); - } - } - ternary: - pushback(c); - lex_state = EXPR_VALUE; - return '?'; - } - newtok(); - enc = parser->enc; - if (!parser_isascii()) { - if (tokadd_mbchar(c) == -1) return 0; - } - else if ((rb_enc_isalnum(c, parser->enc) || c == '_') && - lex_p < lex_pend && is_identchar(lex_p, lex_pend, parser->enc)) { - goto ternary; - } - else if (c == '\\') { - if (peek('u')) { - nextc(); - c = parser_tokadd_utf8(parser, &enc, 0, 0, 0); - if (0x80 <= c) { - tokaddmbc(c, enc); - } - else { - tokadd(c); - } - } - else { - c = read_escape(0, &enc); - tokadd(c); - } - } - else { - tokadd(c); - } - tokfix(); - set_yylval_str(STR_NEW3(tok(), toklen(), enc, 0)); - lex_state = EXPR_ENDARG; - return tCHAR; - - case '&': - if ((c = nextc()) == '&') { - lex_state = EXPR_BEG; - if ((c = nextc()) == '=') { - set_yylval_id(tANDOP); - lex_state = EXPR_BEG; - return tOP_ASGN; - } - pushback(c); - return tANDOP; - } - else if (c == '=') { - set_yylval_id('&'); - lex_state = EXPR_BEG; - return tOP_ASGN; - } - pushback(c); - if (IS_ARG() && space_seen && !ISSPACE(c)) { - rb_warning0("`&' interpreted as argument prefix"); - c = tAMPER; - } - else if (IS_BEG()) { - c = tAMPER; - } - else { - c = '&'; - } - switch (lex_state) { - case EXPR_FNAME: case EXPR_DOT: - lex_state = EXPR_ARG; break; - default: - lex_state = EXPR_BEG; - } - return c; - - case '|': - if ((c = nextc()) == '|') { - lex_state = EXPR_BEG; - if ((c = nextc()) == '=') { - set_yylval_id(tOROP); - lex_state = EXPR_BEG; - return tOP_ASGN; - } - pushback(c); - return tOROP; - } - if (c == '=') { - set_yylval_id('|'); - lex_state = EXPR_BEG; - return tOP_ASGN; - } - if (lex_state == EXPR_FNAME || lex_state == EXPR_DOT) { - lex_state = EXPR_ARG; - } - else { - lex_state = EXPR_BEG; - } - pushback(c); - return '|'; - - case '+': - c = nextc(); - if (lex_state == EXPR_FNAME || 
lex_state == EXPR_DOT) { - lex_state = EXPR_ARG; - if (c == '@') { - return tUPLUS; - } - pushback(c); - return '+'; - } - if (c == '=') { - set_yylval_id('+'); - lex_state = EXPR_BEG; - return tOP_ASGN; - } - if (IS_BEG() || - (IS_ARG() && space_seen && !ISSPACE(c))) { - if (IS_ARG()) arg_ambiguous(); - lex_state = EXPR_BEG; - pushback(c); - if (ISDIGIT(c)) { - c = '+'; - goto start_num; - } - return tUPLUS; - } - lex_state = EXPR_BEG; - pushback(c); - return '+'; - - case '-': - c = nextc(); - if (lex_state == EXPR_FNAME || lex_state == EXPR_DOT) { - lex_state = EXPR_ARG; - if (c == '@') { - return tUMINUS; - } - pushback(c); - return '-'; - } - if (c == '=') { - set_yylval_id('-'); - lex_state = EXPR_BEG; - return tOP_ASGN; - } - if (c == '>') { - lex_state = EXPR_ARG; - return tLAMBDA; - } - if (IS_BEG() || - (IS_ARG() && space_seen && !ISSPACE(c))) { - if (IS_ARG()) arg_ambiguous(); - lex_state = EXPR_BEG; - pushback(c); - if (ISDIGIT(c)) { - return tUMINUS_NUM; - } - return tUMINUS; - } - lex_state = EXPR_BEG; - pushback(c); - return '-'; - - case '.': - lex_state = EXPR_BEG; - if ((c = nextc()) == '.') { - if ((c = nextc()) == '.') { - return tDOT3; - } - pushback(c); - return tDOT2; - } - pushback(c); - if (ISDIGIT(c)) { - yyerror("no .<digit> floating literal anymore; put 0 before dot"); - } - lex_state = EXPR_DOT; - return '.'; - - start_num: - case '0': case '1': case '2': case '3': case '4': - case '5': case '6': case '7': case '8': case '9': - { - int is_float, seen_point, seen_e, nondigit; - - is_float = seen_point = seen_e = nondigit = 0; - lex_state = EXPR_ENDARG; - newtok(); - if (c == '-' || c == '+') { - tokadd(c); - c = nextc(); - } - if (c == '0') { - int start = toklen(); - c = nextc(); - if (c == 'x' || c == 'X') { - /* hexadecimal */ - c = nextc(); - if (ISXDIGIT(c)) { - do { - if (c == '_') { - if (nondigit) break; - nondigit = c; - continue; - } - if (!ISXDIGIT(c)) break; - nondigit = 0; - tokadd(c); - } while ((c = nextc()) != -1); - } - 
pushback(c); - tokfix(); - if (toklen() == start) { - yyerror("numeric literal without digits"); - } - else if (nondigit) goto trailing_uc; - set_yylval_literal(rb_cstr_to_inum(tok(), 16, Qfalse)); - return tINTEGER; - } - if (c == 'b' || c == 'B') { - /* binary */ - c = nextc(); - if (c == '0' || c == '1') { - do { - if (c == '_') { - if (nondigit) break; - nondigit = c; - continue; - } - if (c != '0' && c != '1') break; - nondigit = 0; - tokadd(c); - } while ((c = nextc()) != -1); - } - pushback(c); - tokfix(); - if (toklen() == start) { - yyerror("numeric literal without digits"); - } - else if (nondigit) goto trailing_uc; - set_yylval_literal(rb_cstr_to_inum(tok(), 2, Qfalse)); - return tINTEGER; - } - if (c == 'd' || c == 'D') { - /* decimal */ - c = nextc(); - if (ISDIGIT(c)) { - do { - if (c == '_') { - if (nondigit) break; - nondigit = c; - continue; - } - if (!ISDIGIT(c)) break; - nondigit = 0; - tokadd(c); - } while ((c = nextc()) != -1); - } - pushback(c); - tokfix(); - if (toklen() == start) { - yyerror("numeric literal without digits"); - } - else if (nondigit) goto trailing_uc; - set_yylval_literal(rb_cstr_to_inum(tok(), 10, Qfalse)); - return tINTEGER; - } - if (c == '_') { - /* 0_0 */ - goto octal_number; - } - if (c == 'o' || c == 'O') { - /* prefixed octal */ - c = nextc(); - if (c == '_' || !ISDIGIT(c)) { - yyerror("numeric literal without digits"); - } - } - if (c >= '0' && c <= '7') { - /* octal */ - octal_number: - do { - if (c == '_') { - if (nondigit) break; - nondigit = c; - continue; - } - if (c < '0' || c > '9') break; - if (c > '7') goto invalid_octal; - nondigit = 0; - tokadd(c); - } while ((c = nextc()) != -1); - if (toklen() > start) { - pushback(c); - tokfix(); - if (nondigit) goto trailing_uc; - set_yylval_literal(rb_cstr_to_inum(tok(), 8, Qfalse)); - return tINTEGER; - } - if (nondigit) { - pushback(c); - goto trailing_uc; - } - } - if (c > '7' && c <= '9') { - invalid_octal: - yyerror("Invalid octal digit"); - } - else if (c == 
'.' || c == 'e' || c == 'E') { - tokadd('0'); - } - else { - pushback(c); - set_yylval_literal(INT2FIX(0)); - return tINTEGER; - } - } - - for (;;) { - switch (c) { - case '0': case '1': case '2': case '3': case '4': - case '5': case '6': case '7': case '8': case '9': - nondigit = 0; - tokadd(c); - break; - - case '.': - if (nondigit) goto trailing_uc; - if (seen_point || seen_e) { - goto decode_num; - } - else { - int c0 = nextc(); - if (!ISDIGIT(c0)) { - pushback(c0); - goto decode_num; - } - c = c0; - } - tokadd('.'); - tokadd(c); - is_float++; - seen_point++; - nondigit = 0; - break; - - case 'e': - case 'E': - if (nondigit) { - pushback(c); - c = nondigit; - goto decode_num; - } - if (seen_e) { - goto decode_num; - } - tokadd(c); - seen_e++; - is_float++; - nondigit = c; - c = nextc(); - if (c != '-' && c != '+') continue; - tokadd(c); - nondigit = c; - break; - - case '_': /* `_' in number just ignored */ - if (nondigit) goto decode_num; - nondigit = c; - break; - - default: - goto decode_num; - } - c = nextc(); - } - - decode_num: - pushback(c); - tokfix(); - if (nondigit) { - char tmp[30]; - trailing_uc: - sprintf(tmp, "trailing `%c' in number", nondigit); - yyerror(tmp); - } - if (is_float) { - double d = strtod(tok(), 0); - if (errno == ERANGE) { - rb_warningS("Float %s out of range", tok()); - errno = 0; - } - set_yylval_literal(DOUBLE2NUM(d)); - return tFLOAT; - } - set_yylval_literal(rb_cstr_to_inum(tok(), 10, Qfalse)); - return tINTEGER; - } - - case ')': - case ']': - paren_nest--; - case '}': - COND_LEXPOP(); - CMDARG_LEXPOP(); - if (c == ')') - lex_state = EXPR_END; - else - lex_state = EXPR_ENDARG; - return c; - - case ':': - c = nextc(); - if (c == ':') { - if (IS_BEG() || - lex_state == EXPR_CLASS || (IS_ARG() && space_seen)) { - lex_state = EXPR_BEG; - return tCOLON3; - } - lex_state = EXPR_DOT; - return tCOLON2; - } - if (lex_state == EXPR_END || - lex_state == EXPR_ENDARG || ISSPACE(c)) { - pushback(c); - lex_state = EXPR_BEG; - return ':'; - 
} - switch (c) { - case '\'': - lex_strterm = NEW_STRTERM(str_ssym, c, 0); - break; - case '"': - lex_strterm = NEW_STRTERM(str_dsym, c, 0); - break; - default: - pushback(c); - break; - } - lex_state = EXPR_FNAME; - return tSYMBEG; - - case '/': - if (IS_BEG()) { - lex_strterm = NEW_STRTERM(str_regexp, '/', 0); - return tREGEXP_BEG; - } - if ((c = nextc()) == '=') { - set_yylval_id('/'); - lex_state = EXPR_BEG; - return tOP_ASGN; - } - pushback(c); - if (IS_ARG() && space_seen) { - if (!ISSPACE(c)) { - arg_ambiguous(); - lex_strterm = NEW_STRTERM(str_regexp, '/', 0); - return tREGEXP_BEG; - } - } - switch (lex_state) { - case EXPR_FNAME: case EXPR_DOT: - lex_state = EXPR_ARG; break; - default: - lex_state = EXPR_BEG; break; - } - return '/'; - - case '^': - if ((c = nextc()) == '=') { - set_yylval_id('^'); - lex_state = EXPR_BEG; - return tOP_ASGN; - } - switch (lex_state) { - case EXPR_FNAME: case EXPR_DOT: - lex_state = EXPR_ARG; break; - default: - lex_state = EXPR_BEG; break; - } - pushback(c); - return '^'; - - case ';': - lex_state = EXPR_BEG; - command_start = Qtrue; - return ';'; - - case ',': - lex_state = EXPR_BEG; - return ','; - - case '~': - if (lex_state == EXPR_FNAME || lex_state == EXPR_DOT) { - if ((c = nextc()) != '@') { - pushback(c); - } - lex_state = EXPR_ARG; - } - else { - lex_state = EXPR_BEG; - } - return '~'; - - case '(': - if (IS_BEG()) { - c = tLPAREN; - } - else if (space_seen) { - if (IS_ARG()) { - c = tLPAREN_ARG; - } - } - paren_nest++; - COND_PUSH(0); - CMDARG_PUSH(0); - lex_state = EXPR_BEG; - return c; - - case '[': - paren_nest++; - if (lex_state == EXPR_FNAME || lex_state == EXPR_DOT) { - lex_state = EXPR_ARG; - if ((c = nextc()) == ']') { - if ((c = nextc()) == '=') { - return tASET; - } - pushback(c); - return tAREF; - } - pushback(c); - return '['; - } - else if (IS_BEG()) { - c = tLBRACK; - } - else if (IS_ARG() && space_seen) { - c = tLBRACK; - } - lex_state = EXPR_BEG; - COND_PUSH(0); - CMDARG_PUSH(0); - return c; - - 
case '{': - if (lpar_beg && lpar_beg == paren_nest) { - lex_state = EXPR_BEG; - lpar_beg = 0; - --paren_nest; - return tLAMBEG; - } - if (IS_ARG() || lex_state == EXPR_END) - c = '{'; /* block (primary) */ - else if (lex_state == EXPR_ENDARG) - c = tLBRACE_ARG; /* block (expr) */ - else - c = tLBRACE; /* hash */ - COND_PUSH(0); - CMDARG_PUSH(0); - lex_state = EXPR_BEG; - if (c != tLBRACE) command_start = Qtrue; - return c; - - case '\\': - c = nextc(); - if (c == '\n') { - space_seen = 1; -#ifdef RIPPER - ripper_dispatch_scan_event(parser, tSP); -#endif - goto retry; /* skip \\n */ - } - pushback(c); - return '\\'; - - case '%': - if (IS_BEG()) { - int term; - int paren; - - c = nextc(); - quotation: - if (!ISALNUM(c)) { - term = c; - c = 'Q'; - } - else { - term = nextc(); - if (rb_enc_isalnum(term, parser->enc) || !parser_isascii()) { - yyerror("unknown type of %string"); - return 0; - } - } - if (c == -1 || term == -1) { - compile_error(PARSER_ARG "unterminated quoted string meets end of file"); - return 0; - } - paren = term; - if (term == '(') term = ')'; - else if (term == '[') term = ']'; - else if (term == '{') term = '}'; - else if (term == '<') term = '>'; - else paren = 0; - - switch (c) { - case 'Q': - lex_strterm = NEW_STRTERM(str_dquote, term, paren); - return tSTRING_BEG; - - case 'q': - lex_strterm = NEW_STRTERM(str_squote, term, paren); - return tSTRING_BEG; - - case 'W': - lex_strterm = NEW_STRTERM(str_dword, term, paren); - do {c = nextc();} while (ISSPACE(c)); - pushback(c); - return tWORDS_BEG; - - case 'w': - lex_strterm = NEW_STRTERM(str_sword, term, paren); - do {c = nextc();} while (ISSPACE(c)); - pushback(c); - return tQWORDS_BEG; - - case 'x': - lex_strterm = NEW_STRTERM(str_xquote, term, paren); - return tXSTRING_BEG; - - case 'r': - lex_strterm = NEW_STRTERM(str_regexp, term, paren); - return tREGEXP_BEG; - - case 's': - lex_strterm = NEW_STRTERM(str_ssym, term, paren); - lex_state = EXPR_FNAME; - return tSYMBEG; - - default: - 
yyerror("unknown type of %string"); - return 0; - } - } - if ((c = nextc()) == '=') { - set_yylval_id('%'); - lex_state = EXPR_BEG; - return tOP_ASGN; - } - if (IS_ARG() && space_seen && !ISSPACE(c)) { - goto quotation; - } - switch (lex_state) { - case EXPR_FNAME: case EXPR_DOT: - lex_state = EXPR_ARG; break; - default: - lex_state = EXPR_BEG; break; - } - pushback(c); - return '%'; - - case '$': - last_state = lex_state; - lex_state = EXPR_ENDARG; - newtok(); - c = nextc(); - switch (c) { - case '_': /* $_: last read line string */ - c = nextc(); - if (parser_is_identchar()) { - tokadd('$'); - tokadd('_'); - break; - } - pushback(c); - c = '_'; - /* fall through */ - case '~': /* $~: match-data */ - case '*': /* $*: argv */ - case '$': /* $$: pid */ - case '?': /* $?: last status */ - case '!': /* $!: error string */ - case '@': /* $@: error position */ - case '/': /* $/: input record separator */ - case '\\': /* $\: output record separator */ - case ';': /* $;: field separator */ - case ',': /* $,: output field separator */ - case '.': /* $.: last read line number */ - case '=': /* $=: ignorecase */ - case ':': /* $:: load path */ - case '<': /* $<: reading filename */ - case '>': /* $>: default output handle */ - case '\"': /* $": already loaded files */ - tokadd('$'); - tokadd(c); - tokfix(); - set_yylval_id(rb_intern(tok())); - return tGVAR; - - case '-': - tokadd('$'); - tokadd(c); - c = nextc(); - if (parser_is_identchar()) { - if (tokadd_mbchar(c) == -1) return 0; - } - else { - pushback(c); - } - gvar: - tokfix(); - set_yylval_id(rb_intern(tok())); - return tGVAR; - - case '&': /* $&: last match */ - case '`': /* $`: string before last match */ - case '\'': /* $': string after last match */ - case '+': /* $+: string matches last paren. 
*/ - if (last_state == EXPR_FNAME) { - tokadd('$'); - tokadd(c); - goto gvar; - } - set_yylval_node(NEW_BACK_REF(c)); - return tBACK_REF; - - case '1': case '2': case '3': - case '4': case '5': case '6': - case '7': case '8': case '9': - tokadd('$'); - do { - tokadd(c); - c = nextc(); - } while (ISDIGIT(c)); - pushback(c); - if (last_state == EXPR_FNAME) goto gvar; - tokfix(); - set_yylval_node(NEW_NTH_REF(atoi(tok()+1))); - return tNTH_REF; - - default: - if (!parser_is_identchar()) { - pushback(c); - return '$'; - } - case '0': - tokadd('$'); - } - break; - - case '@': - c = nextc(); - newtok(); - tokadd('@'); - if (c == '@') { - tokadd('@'); - c = nextc(); - } - if (ISDIGIT(c)) { - if (tokidx == 1) { - compile_error(PARSER_ARG "`@%c' is not allowed as an instance variable name", c); - } - else { - compile_error(PARSER_ARG "`@@%c' is not allowed as a class variable name", c); - } - return 0; - } - if (!parser_is_identchar()) { - pushback(c); - return '@'; - } - break; - - case '_': - if (was_bol() && whole_match_p("__END__", 7, 0)) { - ruby__end__seen = 1; - parser->eofp = Qtrue; -#ifndef RIPPER - return -1; -#else - lex_goto_eol(parser); - ripper_dispatch_scan_event(parser, k__END__); - return 0; -#endif - } - newtok(); - break; - - default: - if (!parser_is_identchar()) { - rb_compile_error(PARSER_ARG "Invalid char `\\x%02X' in expression", c); - goto retry; - } - - newtok(); - break; - } - - mb = ENC_CODERANGE_7BIT; - do { - if (!ISASCII(c)) mb = ENC_CODERANGE_UNKNOWN; - if (tokadd_mbchar(c) == -1) return 0; - c = nextc(); - } while (parser_is_identchar()); - switch (tok()[0]) { - case '@': case '$': - pushback(c); - break; - default: - if ((c == '!' 
|| c == '?') && !peek('=')) { - tokadd(c); - } - else { - pushback(c); - } - } - tokfix(); - - { - int result = 0; - - last_state = lex_state; - switch (tok()[0]) { - case '$': - lex_state = EXPR_ENDARG; - result = tGVAR; - break; - case '@': - lex_state = EXPR_ENDARG; - if (tok()[1] == '@') - result = tCVAR; - else - result = tIVAR; - break; - - default: - if (toklast() == '!' || toklast() == '?') { - result = tFID; - } - else { - if (lex_state == EXPR_FNAME) { - if ((c = nextc()) == '=' && !peek('~') && !peek('>') && - (!peek('=') || (lex_p + 1 < lex_pend && lex_p[1] == '>'))) { - result = tIDENTIFIER; - tokadd(c); - tokfix(); - } - else { - pushback(c); - } - } - if (result == 0 && ISUPPER(tok()[0])) { - result = tCONSTANT; - } - else { - result = tIDENTIFIER; - } - } - - if (mb == ENC_CODERANGE_7BIT && lex_state != EXPR_DOT) { - const struct kwtable *kw; - - /* See if it is a reserved word. */ - kw = rb_reserved_word(tok(), toklen()); - if (kw) { - enum lex_state_e state = lex_state; - lex_state = kw->state; - if (state == EXPR_FNAME) { - set_yylval_id(rb_intern(kw->name)); - return kw->id[0]; - } - if (kw->id[0] == keyword_do) { - command_start = Qtrue; - if (lpar_beg && lpar_beg == paren_nest) { - lpar_beg = 0; - --paren_nest; - return keyword_do_LAMBDA; - } - if (COND_P()) return keyword_do_cond; - if (CMDARG_P() && state != EXPR_CMDARG) - return keyword_do_block; - if (state == EXPR_ENDARG || state == EXPR_BEG) - return keyword_do_block; - return keyword_do; - } - if (state == EXPR_BEG || state == EXPR_VALUE) - return kw->id[0]; - else { - if (kw->id[0] != kw->id[1]) - lex_state = EXPR_BEG; - return kw->id[1]; - } - } - } - - if ((lex_state == EXPR_BEG && !cmd_state) || - lex_state == EXPR_ARG || - lex_state == EXPR_CMDARG) { - if (peek(':') && !(lex_p + 1 < lex_pend && lex_p[1] == ':')) { - lex_state = EXPR_BEG; - nextc(); - set_yylval_id(TOK_INTERN(!ENC_SINGLE(mb))); - return tLABEL; - } - } - if (IS_BEG() || - lex_state == EXPR_DOT || - IS_ARG()) { - if 
(cmd_state) {
-                    lex_state = EXPR_CMDARG;
-                }
-                else {
-                    lex_state = EXPR_ARG;
-                }
-            }
-            else {
-                lex_state = EXPR_END;
-            }
-        }
-        {
-            ID ident = TOK_INTERN(!ENC_SINGLE(mb));
-            /* Publish the interned identifier as the token value.  When the
-             * state saved in last_state is not EXPR_DOT and the identifier is
-             * a local-variable name accepted by lvar_defined(), the lexer
-             * state is forced to EXPR_END. */
-            set_yylval_id(ident);
-            if (last_state != EXPR_DOT && is_local_id(ident) && lvar_defined(ident)) {
-                lex_state = EXPR_END;
-            }
-        }
-        return result;
-    }
-}
-/*
- * yylex -- token source handed to the generated parser.
- *
- * Casts the opaque pointer `p` to struct parser_params and returns whatever
- * parser_yylex() produces.  When YYPURE is set, `lval` is first stored in
- * parser->parser_yylval and its `val` member reset to Qundef.  When RIPPER
- * is defined, a non-nil parser->delayed causes the token to be sent through
- * ripper_dispatch_delayed_token(); otherwise every non-zero token is sent
- * through ripper_dispatch_scan_event().
- */
-#if YYPURE
-static int
-yylex(void *lval, void *p)
-#else
-yylex(void *p) /* NOTE(review): this branch has no return type or storage class (implicit int) -- confirm a prior declaration covers it */
-#endif
-{
-    struct parser_params *parser = (struct parser_params*)p;
-    int t;
-
-#if YYPURE
-    parser->parser_yylval = lval;
-    parser->parser_yylval->val = Qundef;
-#endif
-    t = parser_yylex(parser);
-#ifdef RIPPER
-    if (!NIL_P(parser->delayed)) {
-        ripper_dispatch_delayed_token(parser, t);
-        return t;
-    }
-    if (t != 0)
-        ripper_dispatch_scan_event(parser, t);
-#endif
-
-    return t;
-}
-/*
- * node_newnode -- allocate a node through rb_node_newnode() and stamp it
- * with ruby_sourceline.  The function name is parenthesized in the call,
- * presumably to bypass a like-named function-like macro (TODO confirm).
- * Compiled only when RIPPER is not defined.
- */
-#ifndef RIPPER
-static NODE*
-node_newnode(struct parser_params *parser, enum node_type type, VALUE a0, VALUE a1, VALUE a2)
-{
-    NODE *n = (rb_node_newnode)(type, a0, a1, a2);
-    nd_set_line(n, ruby_sourceline);
-    return n;
-}
-/* nodetype -- return nd_type(node) as an enum node_type value. */
-enum node_type
-nodetype(NODE *node) /* for debug */
-{
-    return (enum node_type)nd_type(node);
-}
-/* nodeline -- return nd_line(node). */
-int
-nodeline(NODE *node)
-{
-    return nd_line(node);
-}
-/*
- * newline_node -- for a non-NULL node, replace it with the result of
- * remove_begin() and set NODE_FL_NEWLINE in its flags.  NULL is returned
- * unchanged.
- */
-static NODE*
-newline_node(NODE *node)
-{
-    if (node) {
-        node = remove_begin(node);
-        node->flags |= NODE_FL_NEWLINE;
-    }
-    return node;
-}
-/*
- * fixpos -- copy the line number of `orig` onto `node`.  Does nothing when
- * either pointer is NULL or when `orig` is the sentinel value (NODE*)1.
- */
-static void
-fixpos(NODE *node, NODE *orig)
-{
-    if (!node) return;
-    if (!orig) return;
-    if (orig == (NODE*)1) return;
-    nd_set_line(node, nd_line(orig));
-}
-/*
- * parser_warning -- forward `mesg` to rb_compile_warning() with
- * ruby_sourcefile and the line of `node`.  The macro defined right after
- * the function lets callers omit the `parser` argument.
- */
-static void
-parser_warning(struct parser_params *parser, NODE *node, const char *mesg)
-{
-    rb_compile_warning(ruby_sourcefile, nd_line(node), "%s", mesg);
-}
-#define parser_warning(node, mesg) parser_warning(parser, node, mesg)
-/*
- * parser_warn -- same shape as parser_warning, but forwards to
- * rb_compile_warn().  The macro defined right after the function lets
- * callers omit the `parser` argument.
- */
-static void
-parser_warn(struct parser_params *parser, NODE *node, const char *mesg)
-{
-    rb_compile_warn(ruby_sourcefile, nd_line(node), "%s", mesg);
-}
-#define parser_warn(node, mesg) parser_warn(parser, node, mesg)
-/*
- * block_append_gen -- append `tail` to the statement sequence `head`.
- *
- * Returns `head` when `tail` is NULL and `tail` when `head` is NULL.  A
- * head that is a bare LIT/STR/SELF/TRUE/FALSE/NIL node is dropped with an
- * `unused literal ignored` warning and `tail` is returned.  Any other
- * non-block head is wrapped with NEW_BLOCK first; a non-block tail is
- * wrapped as well, then linked after the current end of the head block.
- */
-static NODE*
-block_append_gen(struct
parser_params *parser, NODE *head, NODE *tail)
-{
-    NODE *end, *h = head, *nd;
-    /* nothing to append: the sequence is unchanged */
-    if (tail == 0) return head;
-    /* empty sequence: the appended statement is the whole result */
-    if (h == 0) return tail;
-    switch (nd_type(h)) {
-      case NODE_LIT:
-      case NODE_STR:
-      case NODE_SELF:
-      case NODE_TRUE:
-      case NODE_FALSE:
-      case NODE_NIL:
-        parser_warning(h, "unused literal ignored");
-        return tail;
-      default:
-        h = end = NEW_BLOCK(head); /* wrap a single statement; it is its own end */
-        end->nd_end = end;
-        fixpos(end, head);
-        head = end;
-        break;
-      case NODE_BLOCK:
-        end = h->nd_end; /* existing block: its first cell records the last cell */
-        break;
-    }
-    /* warn (verbose mode only) when the current last statement is a jump */
-    nd = end->nd_head;
-    switch (nd_type(nd)) {
-      case NODE_RETURN:
-      case NODE_BREAK:
-      case NODE_NEXT:
-      case NODE_REDO:
-      case NODE_RETRY:
-        if (RTEST(ruby_verbose)) {
-            parser_warning(nd, "statement not reached");
-        }
-        break;
-
-      default:
-        break;
-    }
-    /* link the tail block in and refresh the recorded end of the sequence */
-    if (nd_type(tail) != NODE_BLOCK) {
-        tail = NEW_BLOCK(tail);
-        tail->nd_end = tail;
-    }
-    end->nd_next = tail;
-    h->nd_end = tail->nd_end;
-    return head;
-}
-
-/*
- * list_append_gen -- append `item` to the node list `list`.
- *
- * A NULL list yields a fresh one-element list.  Otherwise the first cell's
- * nd_alen is incremented, a new cell from NEW_LIST(item) is linked after
- * the current last cell, and the second cell's nd_end is updated to point
- * at the new last cell.  Returns the (possibly new) list head.
- */
-static NODE*
-list_append_gen(struct parser_params *parser, NODE *list, NODE *item)
-{
-    NODE *last;
-
-    if (list == 0) return NEW_LIST(item);
-    if (list->nd_next) {
-        last = list->nd_next->nd_end; /* last cell is recorded on the second cell */
-    }
-    else {
-        last = list; /* single-cell list */
-    }
-
-    list->nd_alen += 1;
-    last->nd_next = NEW_LIST(item);
-    list->nd_next->nd_end = last->nd_next;
-    return list;
-}
-
-/*
- * list_concat_gen -- link list `tail` after list `head` and return `head`.
- *
- * Adds tail->nd_alen to head->nd_alen and records the last cell of the
- * combined list in head->nd_next->nd_end.  Both arguments are dereferenced
- * unconditionally, so callers must pass non-NULL lists.
- */
-static NODE*
-list_concat_gen(struct parser_params *parser, NODE *head, NODE *tail)
-{
-    NODE *last;
-
-    if (head->nd_next) {
-        last = head->nd_next->nd_end;
-    }
-    else {
-        last = head;
-    }
-
-    head->nd_alen += tail->nd_alen;
-    last->nd_next = tail;
-    if (tail->nd_next) {
-        head->nd_next->nd_end = tail->nd_next->nd_end;
-    }
-    else {
-        head->nd_next->nd_end = tail;
-    }
-
-    return head;
-}
-/*
- * literal_concat0 -- append string `tail` to string `head`.
- *
- * When rb_enc_compatible() rejects the pair, a compile error naming both
- * encodings is reported, both strings are resized to 0 and 0 is returned.
- * Otherwise `tail` is appended with rb_str_buf_append() and 1 is returned.
- */
-static int
-literal_concat0(struct parser_params *parser, VALUE head, VALUE tail)
-{
-    if (!rb_enc_compatible(head, tail)) {
-        compile_error(PARSER_ARG "string literal encodings differ (%s / %s)",
-                      rb_enc_name(rb_enc_get(head)),
-                      rb_enc_name(rb_enc_get(tail)));
-        rb_str_resize(head, 0);
-
rb_str_resize(tail, 0);
-        return 0;
-    }
-    rb_str_buf_append(head, tail);
-    return 1;
-}
-
-/*
- * literal_concat_gen -- concatenate two adjacent string-literal nodes.
- *
- * Returns the other node when one argument is NULL.  A NODE_EVSTR head is
- * first placed into a fresh DSTR list.  The rest depends on the tail type:
- *   STR   - STR head: contents merged via literal_concat0, tail recycled;
- *           otherwise the tail is appended as a list element.
- *   DSTR  - STR head: merged string becomes the tail literal, head is
- *           recycled and the tail is returned; otherwise the tail is
- *           retyped to NODE_ARRAY (its literal becomes the first element)
- *           and list-concatenated onto the head.
- *   EVSTR - STR head is retyped to NODE_DSTR with nd_alen 1, then the tail
- *           is appended.
- * When literal_concat0 fails, both nodes are recycled and 0 is returned.
- */
-static NODE *
-literal_concat_gen(struct parser_params *parser, NODE *head, NODE *tail)
-{
-    enum node_type htype;
-
-    if (!head) return tail;
-    if (!tail) return head;
-    /* htype keeps the original head type even after the EVSTR wrap below */
-    htype = nd_type(head);
-    if (htype == NODE_EVSTR) {
-        NODE *node = NEW_DSTR(STR_NEW0());
-        head = list_append(node, head);
-    }
-    switch (nd_type(tail)) {
-      case NODE_STR:
-        if (htype == NODE_STR) {
-            if (!literal_concat0(parser, head->nd_lit, tail->nd_lit)) {
-              error: /* shared failure exit, also reached from the DSTR case */
-                rb_gc_force_recycle((VALUE)head);
-                rb_gc_force_recycle((VALUE)tail);
-                return 0;
-            }
-            rb_gc_force_recycle((VALUE)tail);
-        }
-        else {
-            list_append(head, tail);
-        }
-        break;
-
-      case NODE_DSTR:
-        if (htype == NODE_STR) {
-            if (!literal_concat0(parser, head->nd_lit, tail->nd_lit))
-                goto error;
-            tail->nd_lit = head->nd_lit;
-            rb_gc_force_recycle((VALUE)head);
-            head = tail;
-        }
-        else {
-            nd_set_type(tail, NODE_ARRAY);
-            tail->nd_head = NEW_STR(tail->nd_lit);
-            list_concat(head, tail);
-        }
-        break;
-
-      case NODE_EVSTR:
-        if (htype == NODE_STR) {
-            nd_set_type(head, NODE_DSTR);
-            head->nd_alen = 1;
-        }
-        list_append(head, tail);
-        break;
-    }
-    return head;
-}
-/*
- * evstr2dstr_gen -- when `node` is a NODE_EVSTR, wrap it in a new DSTR
- * built from an empty string; any other node is returned unchanged.
- * nd_type() is applied without a NULL check.
- */
-static NODE *
-evstr2dstr_gen(struct parser_params *parser, NODE *node)
-{
-    if (nd_type(node) == NODE_EVSTR) {
-        node = list_append(NEW_DSTR(STR_NEW0()), node);
-    }
-    return node;
-}
-/*
- * new_evstr_gen -- return `node` itself when it is already a STR, DSTR or
- * EVSTR node; otherwise (including NULL) wrap it with NEW_EVSTR.
- */
-static NODE *
-new_evstr_gen(struct parser_params *parser, NODE *node)
-{
-    NODE *head = node;
-
-    if (node) {
-        switch (nd_type(node)) {
-          case NODE_STR: case NODE_DSTR: case NODE_EVSTR:
-            return node;
-        }
-    }
-    return NEW_EVSTR(head);
-}
-/*
- * call_bin_op_gen -- run value_expr() on both operands and build
- * NEW_CALL(recv, id, one-element list holding arg1).
- */
-static NODE *
-call_bin_op_gen(struct parser_params *parser, NODE *recv, ID id, NODE *arg1)
-{
-    value_expr(recv);
-    value_expr(arg1);
-    return NEW_CALL(recv, id, NEW_LIST(arg1));
-}
-/*
- * call_uni_op_gen -- run value_expr() on the receiver and build
- * NEW_CALL(recv, id, 0), i.e. a call without arguments.
- */
-static NODE *
-call_uni_op_gen(struct parser_params *parser, NODE *recv, ID id)
-{
-    value_expr(recv);
-    return NEW_CALL(recv, id, 0);
-}
-/*
- * match_op_gen -- build the node for a match between node1 and node2.
- * A left operand that is a DREGX/DREGX_ONCE node or a T_REGEXP literal
- * yields NEW_MATCH2(node1, node2); failing that, the same test on the
- * right operand yields NEW_MATCH3(node2, node1); otherwise an ordinary
- * tMATCH call on node1 is built.
- */
-static NODE*
-match_op_gen(struct parser_params *parser, NODE *node1, NODE *node2)
-{
-    value_expr(node1);
-    value_expr(node2);
-    if (node1) { /* regexp on the left-hand side: MATCH2 */
-        switch (nd_type(node1)) {
-          case NODE_DREGX:
-          case NODE_DREGX_ONCE:
-            return NEW_MATCH2(node1, node2);
-
-          case NODE_LIT:
-            if (TYPE(node1->nd_lit) == T_REGEXP) {
-                return NEW_MATCH2(node1, node2);
-            }
-        }
-    }
-    /* regexp on the right-hand side: MATCH3 with the operands swapped */
-    if (node2) {
-        switch (nd_type(node2)) {
-          case NODE_DREGX:
-          case NODE_DREGX_ONCE:
-            return NEW_MATCH3(node2, node1);
-
-          case NODE_LIT:
-            if (TYPE(node2->nd_lit) == T_REGEXP) {
-                return NEW_MATCH3(node2, node1);
-            }
-        }
-    }
-    /* neither operand is a regexp node: plain tMATCH method call */
-    return NEW_CALL(node1, tMATCH, NEW_LIST(node2));
-}
-/*
- * gettable_gen -- build the node that reads the value named by `id`.
- *
- * Keyword ids map to SELF/NIL/TRUE/FALSE nodes, to a string node holding
- * ruby_sourcefile, to a literal holding ruby_sourceline, or to a literal
- * holding the encoding object for parser->enc.  A local id becomes DVAR
- * (defined dynamic variable inside a block), LVAR (known local) or VCALL.
- * Global, instance, constant and class-variable ids map to
- * GVAR/IVAR/CONST/CVAR.  Any other id reports a compile error and 0 is
- * returned.
- */
-static NODE*
-gettable_gen(struct parser_params *parser, ID id)
-{
-    if (id == keyword_self) {
-        return NEW_SELF();
-    }
-    else if (id == keyword_nil) {
-        return NEW_NIL();
-    }
-    else if (id == keyword_true) {
-        return NEW_TRUE();
-    }
-    else if (id == keyword_false) {
-        return NEW_FALSE();
-    }
-    else if (id == keyword__FILE__) {
-        return NEW_STR(STR_NEW2(ruby_sourcefile));
-    }
-    else if (id == keyword__LINE__) {
-        return NEW_LIT(INT2FIX(ruby_sourceline));
-    }
-    else if (id == keyword__ENCODING__) {
-        return NEW_LIT(rb_enc_from_encoding(parser->enc));
-    }
-    else if (is_local_id(id)) {
-        if (dyna_in_block() && dvar_defined(id)) return NEW_DVAR(id);
-        if (local_id(id)) return NEW_LVAR(id);
-        /* method call without arguments */
-        return NEW_VCALL(id);
-    }
-    else if (is_global_id(id)) {
-        return NEW_GVAR(id);
-    }
-    else if (is_instance_id(id)) {
-        return NEW_IVAR(id);
-    }
-    else if (is_const_id(id)) {
-        return NEW_CONST(id);
-    }
-    else if (is_class_id(id)) {
-        return NEW_CVAR(id);
-    }
-    compile_error(PARSER_ARG "identifier %s is not valid to get", rb_id2name(id));
-    return 0;
-}
-/*
- * assignable_gen -- build the assignment node that stores `val` into the
- * variable named by `id`.
- *
- * Returns 0 for a zero id.  Keyword ids report an error through yyerror()
- * and fall through to the final `return 0`.  Local ids become DASGN_CURR,
- * DASGN or LASGN depending on where the name is already known, and an
- * unknown name is registered first (dyna_var inside a block, local_var
- * outside).  Global, instance, constant and class-variable ids map to
- * GASGN/IASGN/CDECL/CVASGN; a constant assignment while in_def or
- * in_single is set additionally reports `dynamic constant assignment`.
- */
-static NODE*
-assignable_gen(struct parser_params *parser, ID id, NODE *val)
-{
-    if (!id) return 0;
-    if (id == keyword_self) {
-        yyerror("Can't change the value of self");
-    }
-    else if (id == keyword_nil) {
-        yyerror("Can't assign to nil");
-    }
-    else if
(id == keyword_true) {
-        yyerror("Can't assign to true");
-    }
-    else if (id == keyword_false) {
-        yyerror("Can't assign to false");
-    }
-    else if (id == keyword__FILE__) {
-        yyerror("Can't assign to __FILE__");
-    }
-    else if (id == keyword__LINE__) {
-        yyerror("Can't assign to __LINE__");
-    }
-    else if (id == keyword__ENCODING__) {
-        yyerror("Can't assign to __ENCODING__");
-    }
-    else if (is_local_id(id)) {
-        if (dyna_in_block()) { /* inside a block: prefer block-level variables */
-            if (dvar_curr(id)) {
-                return NEW_DASGN_CURR(id, val);
-            }
-            else if (dvar_defined(id)) {
-                return NEW_DASGN(id, val);
-            }
-            else if (local_id(id)) {
-                return NEW_LASGN(id, val);
-            }
-            else{ /* unknown name: register it via dyna_var() first */
-                dyna_var(id);
-                return NEW_DASGN_CURR(id, val);
-            }
-        }
-        else {
-            if (!local_id(id)) { /* unknown name: register it via local_var() first */
-                local_var(id);
-            }
-            return NEW_LASGN(id, val);
-        }
-    }
-    else if (is_global_id(id)) {
-        return NEW_GASGN(id, val);
-    }
-    else if (is_instance_id(id)) {
-        return NEW_IASGN(id, val);
-    }
-    else if (is_const_id(id)) {
-        if (in_def || in_single) /* error is reported, the CDECL node is still built */
-            yyerror("dynamic constant assignment");
-        return NEW_CDECL(id, val, 0);
-    }
-    else if (is_class_id(id)) {
-        return NEW_CVASGN(id, val);
-    }
-    else {
-        compile_error(PARSER_ARG "identifier %s is not valid to set", rb_id2name(id));
-    }
-    return 0; /* reached after any of the error reports above */
-}
-/*
- * shadowing_lvar_gen -- check a newly declared parameter or block-local
- * name against names that already exist.
- *
- * The name `_` is exempt from every check.  Inside a block, a name that
- * dvar_curr() already knows is a `duplicated argument name` error; a name
- * known to dvar_defined() or local_id() produces a shadowing warning and
- * is added to lvtbl->vars.  Outside a block, a name known to local_id()
- * is a `duplicated argument name` error.
- */
-static void
-shadowing_lvar_gen(struct parser_params *parser, ID name)
-{
-    ID uscore;
-
-    CONST_ID(uscore, "_");
-    if (uscore == name) return;
-    if (dyna_in_block()) {
-        if (dvar_curr(name)) {
-            yyerror("duplicated argument name");
-        }
-        else if (dvar_defined(name) || local_id(name)) {
-            rb_warningS("shadowing outer local variable - %s", rb_id2name(name));
-            vtable_add(lvtbl->vars, name);
-        }
-    }
-    else {
-        if (local_id(name)) {
-            yyerror("duplicated argument name");
-        }
-    }
-}
-/*
- * new_bv_gen -- declare `name` as a new variable via dyna_var() after the
- * shadowing_lvar() check.  A zero name is ignored; a name that is not a
- * local id reports `invalid local variable` and nothing is declared.
- */
-static void
-new_bv_gen(struct parser_params *parser, ID name)
-{
-    if (!name) return;
-    if (!is_local_id(name)) {
-        compile_error(PARSER_ARG "invalid local variable - %s",
-                      rb_id2name(name));
-        return;
-    }
-    shadowing_lvar(name);
-    dyna_var(name);
-}
-/*
- * aryset_gen -- build NEW_ATTRASGN(recv, tASET, idx).  A NODE_SELF
- * receiver is replaced by the sentinel pointer (NODE *)1 first.
- */
-static NODE *
-aryset_gen(struct
parser_params *parser, NODE *recv, NODE *idx)
-{
-    if (recv && nd_type(recv) == NODE_SELF)
-        recv = (NODE *)1; /* sentinel instead of the SELF node; presumably marks an implicit-self receiver -- TODO confirm */
-    return NEW_ATTRASGN(recv, tASET, idx);
-}
-/*
- * block_dup_check_gen -- report `both block arg and actual block given`
- * when node2 is non-NULL and node1 is a NODE_BLOCK_PASS node.
- */
-static void
-block_dup_check_gen(struct parser_params *parser, NODE *node1, NODE *node2)
-{
-    if (node2 && node1 && nd_type(node1) == NODE_BLOCK_PASS) {
-        compile_error(PARSER_ARG "both block arg and actual block given");
-    }
-}
-/*
- * rb_id_attrset -- return `id` with its ID_SCOPE_MASK bits cleared and
- * replaced by ID_ATTRSET.
- */
-ID
-rb_id_attrset(ID id)
-{
-    id &= ~ID_SCOPE_MASK;
-    id |= ID_ATTRSET;
-    return id;
-}
-/*
- * attrset_gen -- build NEW_ATTRASGN(recv, rb_id_attrset(id), 0).  A
- * NODE_SELF receiver is replaced by the sentinel pointer (NODE *)1 first,
- * as in aryset_gen.
- */
-static NODE *
-attrset_gen(struct parser_params *parser, NODE *recv, ID id)
-{
-    if (recv && nd_type(recv) == NODE_SELF)
-        recv = (NODE *)1;
-    return NEW_ATTRASGN(recv, rb_id_attrset(id), 0);
-}
-/*
- * rb_backref_error_gen -- report an attempt to assign to a back reference.
- * NODE_NTH_REF prints nd_nth as a number, NODE_BACK_REF prints it as a
- * character; other node types produce no message.
- */
-static void
-rb_backref_error_gen(struct parser_params *parser, NODE *node)
-{
-    switch (nd_type(node)) {
-      case NODE_NTH_REF:
-        compile_error(PARSER_ARG "Can't set variable $%ld", node->nd_nth);
-        break;
-      case NODE_BACK_REF:
-        compile_error(PARSER_ARG "Can't set variable $%c", (int)node->nd_nth);
-        break;
-    }
-}
-/*
- * arg_concat_gen -- combine argument node `node1` with the extra
- * arguments in `node2`.
- *
- * Returns node1 unchanged when node2 is NULL.  A NODE_BLOCK_PASS node1
- * recurses into its nd_iter.  When node2 is a NODE_ARRAY, an ARGSPUSH
- * node1 is turned into ARGSCAT with node2 concatenated after its body,
- * and an ARGSCAT node1 gets node2 concatenated onto its body.  Every
- * other combination yields NEW_ARGSCAT(node1, node2).
- * NOTE(review): this function follows nd_iter for NODE_BLOCK_PASS while
- * arg_append_gen follows nd_head -- confirm both reach the wrapped
- * argument list.
- */
-static NODE *
-arg_concat_gen(struct parser_params *parser, NODE *node1, NODE *node2)
-{
-    if (!node2) return node1;
-    switch (nd_type(node1)) {
-      case NODE_BLOCK_PASS:
-        node1->nd_iter = arg_concat(node1->nd_iter, node2);
-        return node1;
-      case NODE_ARGSPUSH:
-        if (nd_type(node2) != NODE_ARRAY) break;
-        node1->nd_body = list_concat(NEW_LIST(node1->nd_body), node2);
-        nd_set_type(node1, NODE_ARGSCAT);
-        return node1;
-      case NODE_ARGSCAT:
-        if (nd_type(node2) != NODE_ARRAY) break;
-        node1->nd_body = list_concat(node1->nd_body, node2);
-        return node1;
-    }
-    return NEW_ARGSCAT(node1, node2);
-}
-/*
- * arg_append_gen -- append the single argument `node2` to argument node
- * `node1`.
- *
- * A NULL node1 yields a one-element list.  A NODE_ARRAY gets node2
- * appended, a NODE_BLOCK_PASS recurses into its nd_head, and an ARGSPUSH
- * is turned into ARGSCAT whose body is a list of the old body followed by
- * node2.  Anything else yields NEW_ARGSPUSH(node1, node2).
- */
-static NODE *
-arg_append_gen(struct parser_params *parser, NODE *node1, NODE *node2)
-{
-    if (!node1) return NEW_LIST(node2);
-    switch (nd_type(node1)) {
-      case NODE_ARRAY:
-        return list_append(node1, node2);
-      case NODE_BLOCK_PASS:
-        node1->nd_head = arg_append(node1->nd_head, node2);
-        return node1;
-      case NODE_ARGSPUSH:
-        node1->nd_body = list_append(NEW_LIST(node1->nd_body), node2);
-
nd_set_type(node1, NODE_ARGSCAT);
-        return node1;
-    }
-    return NEW_ARGSPUSH(node1, node2);
-}
-/*
- * splat_array -- look through one NODE_SPLAT wrapper and return the node
- * when it is a NODE_ARRAY, otherwise 0.  `node` is dereferenced without a
- * NULL check.
- */
-static NODE *
-splat_array(NODE* node)
-{
-    if (nd_type(node) == NODE_SPLAT) node = node->nd_head;
-    if (nd_type(node) == NODE_ARRAY) return node;
-    return 0;
-}
-/*
- * node_assign_gen -- attach the right-hand side `rhs` to the assignment
- * target `lhs` and return `lhs` (0 when lhs is NULL).
- *
- * Variable, multiple and constant assignment nodes store rhs in nd_value;
- * ATTRASGN and CALL nodes get rhs appended to their argument list.  Other
- * node types are returned untouched.
- */
-static NODE *
-node_assign_gen(struct parser_params *parser, NODE *lhs, NODE *rhs)
-{
-    if (!lhs) return 0;
-
-    switch (nd_type(lhs)) {
-      case NODE_GASGN:
-      case NODE_IASGN:
-      case NODE_IASGN2:
-      case NODE_LASGN:
-      case NODE_DASGN:
-      case NODE_DASGN_CURR:
-      case NODE_MASGN:
-      case NODE_CDECL:
-      case NODE_CVASGN:
-        lhs->nd_value = rhs;
-        break;
-
-      case NODE_ATTRASGN:
-      case NODE_CALL:
-        lhs->nd_args = arg_append(lhs->nd_args, rhs);
-        break;
-
-      default:
-        /* should not happen */
-        break;
-    }
-
-    return lhs;
-}
-/*
- * value_expr_gen -- check that `node` can produce a value.
- *
- * Returns Qtrue or Qfalse through an int.  A NULL node only triggers the
- * `empty expression` warning and yields Qtrue.  Otherwise the loop follows
- * the part of the tree that supplies the value: the last statement of a
- * block, the body of BEGIN, both branches of IF (the body through a
- * recursive value_expr call), and the second operand of AND/OR.  A method
- * definition yields a warning and Qfalse.  A jump node (return, break,
- * next, redo, retry) yields Qfalse and is reported as an error unless it
- * was reached through an AND/OR operand.
- */
-static int
-value_expr_gen(struct parser_params *parser, NODE *node)
-{
-    int cond = 0; /* set once the walk has passed through an AND/OR node */
-
-    if (!node) {
-        rb_warning0("empty expression");
-    }
-    while (node) {
-        switch (nd_type(node)) {
-          case NODE_DEFN:
-          case NODE_DEFS:
-            parser_warning(node, "void value expression");
-            return Qfalse;
-
-          case NODE_RETURN:
-          case NODE_BREAK:
-          case NODE_NEXT:
-          case NODE_REDO:
-          case NODE_RETRY:
-            if (!cond) yyerror("void value expression");
-            /* or "control never reach"? */
-            return Qfalse;
-
-          case NODE_BLOCK:
-            while (node->nd_next) { /* advance to the last statement */
-                node = node->nd_next;
-            }
-            node = node->nd_head;
-            break;
-
-          case NODE_BEGIN:
-            node = node->nd_body;
-            break;
-
-          case NODE_IF:
-            if (!node->nd_body) {
-                node = node->nd_else;
-                break;
-            }
-            else if (!node->nd_else) {
-                node = node->nd_body;
-                break;
-            }
-            if (!value_expr(node->nd_body)) return Qfalse;
-            node = node->nd_else;
-            break;
-
-          case NODE_AND:
-          case NODE_OR:
-            cond = 1;
-            node = node->nd_2nd;
-            break;
-
-          default:
-            return Qtrue;
-        }
-    }
-
-    return Qtrue;
-}
-/*
- * void_expr_gen -- warn about an expression whose value is discarded.
- *
- * Does nothing unless ruby_verbose is true and `node` is non-NULL.  Calls
- * to the listed operators, variable and constant reads, literals, scope
- * and range operators, self/nil/true/false and defined? each select a
- * description; when one was selected, `useless use of ... in void
- * context` is emitted with ruby_sourceline temporarily set to the line of
- * the node.
- */
-static void
-void_expr_gen(struct parser_params *parser, NODE *node)
-{
-    const char *useless = 0;
-
-    if (!RTEST(ruby_verbose)) return;
-
-    if (!node) return;
-    switch (nd_type(node)) {
-      case NODE_CALL:
-        switch (node->nd_mid) {
-          case '+':
-          case '-':
-          case '*':
-          case '/':
-          case '%':
-          case tPOW:
-          case tUPLUS:
-          case tUMINUS:
-          case '|':
-          case '^':
-          case '&':
-          case tCMP:
-          case '>':
-          case tGEQ:
-          case '<':
-          case tLEQ:
-          case tEQ:
-          case tNEQ:
-            useless = rb_id2name(node->nd_mid);
-            break;
-        }
-        break;
-
-      case NODE_LVAR:
-      case NODE_DVAR:
-      case NODE_GVAR:
-      case NODE_IVAR:
-      case NODE_CVAR:
-      case NODE_NTH_REF:
-      case NODE_BACK_REF:
-        useless = "a variable";
-        break;
-      case NODE_CONST:
-        useless = "a constant";
-        break;
-      case NODE_LIT:
-      case NODE_STR:
-      case NODE_DSTR:
-      case NODE_DREGX:
-      case NODE_DREGX_ONCE:
-        useless = "a literal";
-        break;
-      case NODE_COLON2:
-      case NODE_COLON3:
-        useless = "::";
-        break;
-      case NODE_DOT2:
-        useless = "..";
-        break;
-      case NODE_DOT3:
-        useless = "...";
-        break;
-      case NODE_SELF:
-        useless = "self";
-        break;
-      case NODE_NIL:
-        useless = "nil";
-        break;
-      case NODE_TRUE:
-        useless = "true";
-        break;
-      case NODE_FALSE:
-        useless = "false";
-        break;
-      case NODE_DEFINED:
-        useless = "defined?";
-        break;
-    }
-
-    if (useless) {
-        int line = ruby_sourceline;
-        /* report at the line of the node, then restore the current line */
-        ruby_sourceline = nd_line(node);
-        rb_warnS("useless use of %s in void context", useless);
-        ruby_sourceline = line;
-    }
-}
-/*
- * void_stmts_gen -- run void_expr0() on every statement of a NODE_BLOCK
- * except the last one (the loop returns as soon as nd_next is NULL).
- * Does nothing unless ruby_verbose is true and `node` is a non-NULL
- * NODE_BLOCK.
- */
-static void
-void_stmts_gen(struct parser_params *parser, NODE *node)
-{
-    if (!RTEST(ruby_verbose)) return;
-    if (!node) return;
-    if (nd_type(node) != NODE_BLOCK) return;
-
-    for (;;) {
-        if (!node->nd_next) return;
-        void_expr0(node->nd_head);
-        node = node->nd_next;
-    }
-}
-/*
- * remove_begin -- strip nested NODE_BEGIN wrappers that have a non-NULL
- * body and return the innermost node.  `n` points at the local `node`, so
- * each assignment through it updates the value that is returned.
- */
-static NODE *
-remove_begin(NODE *node)
-{
-    NODE **n = &node, *n1 = node;
-    while (n1 && nd_type(n1) == NODE_BEGIN && n1->nd_body) {
-        *n = n1 = n1->nd_body;
-    }
-    return node;
-}
-/*
- * reduce_nodes_gen -- simplify the tail of the tree rooted at *body.
- *
- * A NULL body is replaced by NEW_NIL().  Otherwise the loop follows the
- * final position of the tree: NODE_RETURN is replaced by its nd_stts,
- * NODE_BEGIN by its nd_body, a block continues with its last statement,
- * CASE with its body, and IF/WHEN/ENSURE/RESCUE continue through the
- * `subnodes` helper macro.  Reaching NODE_NIL stores 0 in the current
- * slot.  Presumably this removes redundant trailing return/nil nodes --
- * TODO confirm against the callers.
- *
- * subnodes(n1, n2): when only one of the two members is non-NULL, continue
- * with that one; when both are set, reduce n1 recursively and continue
- * with n2; when both are NULL, evaluate to 0.
- */
-static void
-reduce_nodes_gen(struct parser_params *parser, NODE **body)
-{
-    NODE *node = *body;
-
-    if (!node) {
-        *body = NEW_NIL();
-        return;
-    }
-#define subnodes(n1, n2) \
-    ((!node->n1) ? (node->n2 ? (body = &node->n2, 1) : 0) : \
-     (!node->n2) ? (body = &node->n1, 1) : \
-     (reduce_nodes(&node->n1), body = &node->n2, 1))
-
-    while (node) {
-        switch (nd_type(node)) {
-          end: /* jump target for WHEN/ENSURE/RESCUE nodes with no sub-nodes */
-          case NODE_NIL:
-            *body = 0;
-            return;
-          case NODE_RETURN:
-            *body = node = node->nd_stts;
-            continue;
-          case NODE_BEGIN:
-            *body = node = node->nd_body;
-            continue;
-          case NODE_BLOCK:
-            body = &node->nd_end->nd_head;
-            break;
-          case NODE_IF:
-            if (subnodes(nd_body, nd_else)) break;
-            return;
-          case NODE_CASE:
-            body = &node->nd_body;
-            break;
-          case NODE_WHEN:
-            if (!subnodes(nd_body, nd_next)) goto end;
-            break;
-          case NODE_ENSURE:
-            if (!subnodes(nd_head, nd_resq)) goto end;
-            break;
-          case NODE_RESCUE:
-            if (!subnodes(nd_head, nd_resq)) goto end;
-            break;
-          default:
-            return;
-        }
-        node = *body;
-    }
-
-#undef subnodes
-}
-/*
- * assign_in_cond -- detect an assignment used as a condition.
- *
- * Returns 0 when `node` is not an assignment.  NODE_MASGN reports an
- * error and returns 1.  For LASGN/DASGN/GASGN/IASGN the result is 1, and
- * a warning is emitted first when the assigned value is a LIT, STR, NIL,
- * TRUE or FALSE node.
- */
-static int
-assign_in_cond(struct parser_params *parser, NODE *node)
-{
-    switch (nd_type(node)) {
-      case NODE_MASGN:
-        yyerror("multiple assignment in conditional");
-        return 1;
-
-      case NODE_LASGN:
-      case NODE_DASGN:
-      case NODE_GASGN:
-      case NODE_IASGN:
-        break;
-
-      default:
-        return 0;
-    }
-
-    switch (nd_type(node->nd_value)) {
-      case NODE_LIT:
-      case NODE_STR:
-      case NODE_NIL:
-      case NODE_TRUE:
-      case NODE_FALSE:
-        /* reports always */
-        parser_warn(node->nd_value, "found = in conditional, should be ==");
-        return 1;
-
-      case NODE_DSTR:
-      case NODE_XSTR:
-      case NODE_DXSTR:
-      case NODE_EVSTR:
-      case NODE_DREGX:
-      default:
-        break;
-    }
-    return 1;
-}
-/*
- * warn_unless_e_option -- call parser_warn(node, str) unless
- * e_option_supplied(parser) is true.
- */
-static void
-warn_unless_e_option(struct parser_params *parser, NODE *node, const char *str)
-{
-    if (!e_option_supplied(parser)) parser_warn(node, str);
-}
-/*
- * warning_unless_e_option -- call parser_warning(node, str) unless
- * e_option_supplied(parser) is true.
- */
-static void
-warning_unless_e_option(struct parser_params *parser, NODE *node, const char *str)
-{
-    if (!e_option_supplied(parser)) parser_warning(node, str);
-}
-/*
- * fixup_nodes -- consume the node list at *rootnode.
- *
- * Each list cell is recycled and *rootnode advanced past it.  When the
- * head of a cell is a DOT2 or DOT3 node, a range object is built from the
- * nd_lit of its two ends (exclusive for DOT3), the two end nodes are
- * recycled and the head is rewritten in place into a NODE_LIT holding the
- * range.  Assumes both ends are literal nodes -- TODO confirm with the
- * code that fills this list.
- */
-static void
-fixup_nodes(NODE **rootnode)
-{
-    NODE *node, *next, *head;
-
-    for (node = *rootnode; node; node = next) {
-        enum node_type type;
-        VALUE val;
-        /* read both links before the cell is recycled */
-        next = node->nd_next;
-        head = node->nd_head;
-        rb_gc_force_recycle((VALUE)node);
-        *rootnode = next;
-        switch (type = nd_type(head)) {
-          case NODE_DOT2:
-          case NODE_DOT3:
-            val = rb_range_new(head->nd_beg->nd_lit, head->nd_end->nd_lit,
-                               type == NODE_DOT3 ? Qtrue : Qfalse);
-            rb_gc_force_recycle((VALUE)head->nd_beg);
-            rb_gc_force_recycle((VALUE)head->nd_end);
-            nd_set_type(head, NODE_LIT);
-            head->nd_lit = val;
-            break;
-          default:
-            break;
-        }
-    }
-}
-/* forward declaration: range_op below calls cond0 before its definition */
-static NODE *cond0(struct parser_params*,NODE*);
-/*
- * range_op -- prepare one end of a range that is used as a condition.
- *
- * Returns 0 for a NULL node.  A Fixnum literal produces a warning (unless
- * suppressed by warn_unless_e_option) and is rewritten into a tEQ call
- * comparing the literal with the global variable `$.`.  Every other node
- * is passed on to cond0().
- */
-static NODE*
-range_op(struct parser_params *parser, NODE *node)
-{
-    enum node_type type;
-
-    if (node == 0) return 0;
-
-    type = nd_type(node);
-    value_expr(node);
-    if (type == NODE_LIT && FIXNUM_P(node->nd_lit)) {
-        warn_unless_e_option(parser, node, "integer literal in conditional range");
-        return NEW_CALL(node, tEQ, NEW_LIST(NEW_GVAR(rb_intern("$."))));
-    }
-    return cond0(parser, node);
-}
-/*
- * literal_node -- classify a node: 2 for LIT, STR, DSTR, EVSTR, DREGX,
- * DREGX_ONCE and DSYM nodes; 1 for TRUE, FALSE, NIL and a NULL pointer;
- * 0 for everything else.
- */
-static int
-literal_node(NODE *node)
-{
-    if (!node) return 1; /* same as NODE_NIL */
-    switch (nd_type(node)) {
-      case NODE_LIT:
-      case NODE_STR:
-      case NODE_DSTR:
-      case NODE_EVSTR:
-      case NODE_DREGX:
-      case NODE_DREGX_ONCE:
-      case NODE_DSYM:
-        return 2;
-      case NODE_TRUE:
-      case NODE_FALSE:
-      case NODE_NIL:
-        return 1;
-    }
-    return 0;
-}
-
-static NODE*
-cond0(struct parser_params *parser, NODE *node)
-{
-    if (node == 0) return 0;
-
assign_in_cond(parser, node); - - switch (nd_type(node)) { - case NODE_DSTR: - case NODE_EVSTR: - case NODE_STR: - rb_warn0("string literal in condition"); - break; - - case NODE_DREGX: - case NODE_DREGX_ONCE: - warning_unless_e_option(parser, node, "regex literal in condition"); - return NEW_MATCH2(node, NEW_GVAR(rb_intern("$_"))); - - case NODE_AND: - case NODE_OR: - node->nd_1st = cond0(parser, node->nd_1st); - node->nd_2nd = cond0(parser, node->nd_2nd); - break; - - case NODE_DOT2: - case NODE_DOT3: - node->nd_beg = range_op(parser, node->nd_beg); - node->nd_end = range_op(parser, node->nd_end); - if (nd_type(node) == NODE_DOT2) nd_set_type(node,NODE_FLIP2); - else if (nd_type(node) == NODE_DOT3) nd_set_type(node, NODE_FLIP3); - if (!e_option_supplied(parser)) { - int b = literal_node(node->nd_beg); - int e = literal_node(node->nd_end); - if ((b == 1 && e == 1) || (b + e >= 2 && RTEST(ruby_verbose))) { - parser_warn(node, "range literal in condition"); - } - } - break; - - case NODE_DSYM: - parser_warning(node, "literal in condition"); - break; - - case NODE_LIT: - if (TYPE(node->nd_lit) == T_REGEXP) { - warn_unless_e_option(parser, node, "regex literal in condition"); - nd_set_type(node, NODE_MATCH); - } - else { - parser_warning(node, "literal in condition"); - } - default: - break; - } - return node; -} - -static NODE* -cond_gen(struct parser_params *parser, NODE *node) -{ - if (node == 0) return 0; - return cond0(parser, node); -} - -static NODE* -logop_gen(struct parser_params *parser, enum node_type type, NODE *left, NODE *right) -{ - value_expr(left); - if (left && nd_type(left) == type) { - NODE *node = left, *second; - while ((second = node->nd_2nd) != 0 && nd_type(second) == type) { - node = second; - } - node->nd_2nd = NEW_NODE(type, second, right, 0); - return left; - } - return NEW_NODE(type, left, right, 0); -} - -static void -no_blockarg(struct parser_params *parser, NODE *node) -{ - if (node && nd_type(node) == NODE_BLOCK_PASS) { - 
compile_error(PARSER_ARG "block argument should not be given"); - } -} - -static NODE * -ret_args_gen(struct parser_params *parser, NODE *node) -{ - if (node) { - no_blockarg(parser, node); - if (nd_type(node) == NODE_ARRAY) { - if (node->nd_next == 0) { - node = node->nd_head; - } - else { - nd_set_type(node, NODE_VALUES); - } - } - } - return node; -} - -static NODE * -new_yield_gen(struct parser_params *parser, NODE *node) -{ - long state = Qtrue; - - if (node) { - no_blockarg(parser, node); - if (node && nd_type(node) == NODE_SPLAT) { - state = Qtrue; - } - } - else { - state = Qfalse; - } - return NEW_YIELD(node, state); -} - -static NODE* -negate_lit(NODE *node) -{ - switch (TYPE(node->nd_lit)) { - case T_FIXNUM: - node->nd_lit = LONG2FIX(-FIX2LONG(node->nd_lit)); - break; - case T_BIGNUM: - node->nd_lit = rb_funcall(node->nd_lit,tUMINUS,0,0); - break; - case T_FLOAT: - RFLOAT(node->nd_lit)->float_value = -RFLOAT_VALUE(node->nd_lit); - break; - default: - break; - } - return node; -} - -static NODE * -arg_blk_pass(NODE *node1, NODE *node2) -{ - if (node2) { - node2->nd_head = node1; - return node2; - } - return node1; -} - -static NODE* -new_args_gen(struct parser_params *parser, NODE *m, NODE *o, ID r, NODE *p, ID b) -{ - int saved_line = ruby_sourceline; - NODE *node; - NODE *i1, *i2 = 0; - - node = NEW_ARGS(m ? m->nd_plen : 0, o); - i1 = m ? m->nd_next : 0; - node->nd_next = NEW_ARGS_AUX(r, b); - - if (p) { - i2 = p->nd_next; - node->nd_next->nd_next = NEW_ARGS_AUX(p->nd_pid, p->nd_plen); - } - else if (i1) { - node->nd_next->nd_next = NEW_ARGS_AUX(0, 0); - } - if (i1 || i2) { - node->nd_next->nd_next->nd_next = NEW_NODE(NODE_AND, i1, i2, 0); - } - ruby_sourceline = saved_line; - return node; -} - -static void -local_push_gen(struct parser_params *parser, int inherit_dvars) -{ - struct local_vars *local; - - local = ALLOC(struct local_vars); - local->prev = lvtbl; - local->args = vtable_alloc(0); - local->vars = vtable_alloc(inherit_dvars ? 
DVARS_INHERIT : DVARS_TOPSCOPE); - lvtbl = local; -} - -static void -local_pop_gen(struct parser_params *parser) -{ - struct local_vars *local = lvtbl->prev; - vtable_free(lvtbl->args); - vtable_free(lvtbl->vars); - xfree(lvtbl); - lvtbl = local; -} - -static ID* -vtable_tblcpy(ID *buf, const struct vtable *src) -{ - int i, cnt = vtable_size(src); - - if (cnt > 0) { - buf[0] = cnt; - for (i = 0; i < cnt; i++) { - buf[i] = src->tbl[i]; - } - return buf; - } - return 0; -} - -static ID* -local_tbl_gen(struct parser_params *parser) -{ - int cnt = vtable_size(lvtbl->args) + vtable_size(lvtbl->vars); - ID *buf; - - if (cnt <= 0) return 0; - buf = ALLOC_N(ID, cnt + 1); - vtable_tblcpy(buf+1, lvtbl->args); - vtable_tblcpy(buf+vtable_size(lvtbl->args)+1, lvtbl->vars); - buf[0] = cnt; - return buf; -} - -#include "debug.h" -static int -arg_var_gen(struct parser_params *parser, ID id) -{ - vtable_add(lvtbl->args, id); - return vtable_size(lvtbl->args) - 1; -} - -static int -local_var_gen(struct parser_params *parser, ID id) -{ - vtable_add(lvtbl->vars, id); - return vtable_size(lvtbl->vars) - 1; -} - -static int -local_id_gen(struct parser_params *parser, ID id) -{ - struct vtable *vars, *args; - - vars = lvtbl->vars; - args = lvtbl->args; - - while (vars && POINTER_P(vars->prev)) { - vars = vars->prev; - args = args->prev; - } - - if (vars && vars->prev == DVARS_INHERIT) { - return rb_local_defined(id); - } - else { - return (vtable_included(args, id) || - vtable_included(vars, id)); - } -} - -static void -dyna_push_gen(struct parser_params *parser) -{ - lvtbl->args = vtable_alloc(lvtbl->args); - lvtbl->vars = vtable_alloc(lvtbl->vars); -} - -static void -dyna_pop_gen(struct parser_params *parser) -{ - struct vtable *tmp; - - tmp = lvtbl->args; - lvtbl->args = lvtbl->args->prev; - vtable_free(tmp); - tmp = lvtbl->vars; - lvtbl->vars = lvtbl->vars->prev; - vtable_free(tmp); -} - -static int -dyna_in_block_gen(struct parser_params *parser) -{ - return POINTER_P(lvtbl->vars) 
&& lvtbl->vars->prev != DVARS_TOPSCOPE; -} - -static int -dvar_defined_gen(struct parser_params *parser, ID id) -{ - struct vtable *vars, *args; - - args = lvtbl->args; - vars = lvtbl->vars; - - while (POINTER_P(vars)) { - if (vtable_included(args, id)) { - return 1; - } - if (vtable_included(vars, id)) { - return 1; - } - args = args->prev; - vars = vars->prev; - } - - if (vars == DVARS_INHERIT) { - return rb_dvar_defined(id); - } - - return 0; -} - -static int -dvar_curr_gen(struct parser_params *parser, ID id) -{ - return (vtable_included(lvtbl->args, id) || - vtable_included(lvtbl->vars, id)); -} - -VALUE rb_reg_compile(VALUE str, int options); -VALUE rb_reg_check_preprocess(VALUE); - -static void -reg_fragment_setenc_gen(struct parser_params* parser, VALUE str, int options) -{ - int c = RE_OPTION_ENCODING_IDX(options); - - if (c) { - int opt, idx; - rb_char_to_option_kcode(c, &opt, &idx); - if (idx != ENCODING_GET(str) && - rb_enc_str_coderange(str) != ENC_CODERANGE_7BIT) { - goto error; - } - ENCODING_SET(str, idx); - } - else if (RE_OPTION_ENCODING_NONE(options)) { - if (!ENCODING_IS_ASCII8BIT(str) && - rb_enc_str_coderange(str) != ENC_CODERANGE_7BIT) { - c = 'n'; - goto error; - } - rb_enc_associate(str, rb_ascii8bit_encoding()); - } - else if (parser->enc == rb_usascii_encoding()) { - if (rb_enc_str_coderange(str) != ENC_CODERANGE_7BIT) { - /* raise in re.c */ - rb_enc_associate(str, rb_usascii_encoding()); - } - else { - rb_enc_associate(str, rb_ascii8bit_encoding()); - } - } - return; - - error: - compile_error(PARSER_ARG - "regexp encoding option '%c' differs from source encoding '%s'", - c, rb_enc_name(rb_enc_get(str))); -} - -static void -reg_fragment_check_gen(struct parser_params* parser, VALUE str, int options) -{ - VALUE err; - reg_fragment_setenc_gen(parser, str, options); - err = rb_reg_check_preprocess(str); - if (err != Qnil) { - err = rb_obj_as_string(err); - compile_error(PARSER_ARG "%s", RSTRING_PTR(err)); - RB_GC_GUARD(err); - } -} - 
-typedef struct { - struct parser_params* parser; - rb_encoding *enc; - NODE *succ_block; - NODE *fail_block; - int num; -} reg_named_capture_assign_t; - -static int -reg_named_capture_assign_iter(const OnigUChar *name, const OnigUChar *name_end, - int back_num, int *back_refs, OnigRegex regex, void *arg0) -{ - reg_named_capture_assign_t *arg = (reg_named_capture_assign_t*)arg0; - struct parser_params* parser = arg->parser; - rb_encoding *enc = arg->enc; - int len = name_end - name; - const char *s = (const char *)name; - ID var; - - arg->num++; - - if (arg->succ_block == 0) { - arg->succ_block = NEW_BEGIN(0); - arg->fail_block = NEW_BEGIN(0); - } - - if (!len || (*name != '_' && ISASCII(*name) && !rb_enc_islower(*name, enc)) || - rb_reserved_word(s, len) || !rb_enc_symname2_p(s, len, enc)) { - return ST_CONTINUE; - } - var = rb_intern3(s, len, enc); - if (dvar_defined(var) || local_id(var)) { - rb_warningS("named capture conflicts a local variable - %s", - rb_id2name(var)); - } - arg->succ_block = block_append(arg->succ_block, - newline_node(node_assign(assignable(var,0), - NEW_CALL( - gettable(rb_intern("$~")), - idAREF, - NEW_LIST(NEW_LIT(ID2SYM(var)))) - ))); - arg->fail_block = block_append(arg->fail_block, - newline_node(node_assign(assignable(var,0), NEW_LIT(Qnil)))); - return ST_CONTINUE; -} - -static NODE * -reg_named_capture_assign_gen(struct parser_params* parser, VALUE regexp, NODE *match) -{ - reg_named_capture_assign_t arg; - - arg.parser = parser; - arg.enc = rb_enc_get(regexp); - arg.succ_block = 0; - arg.fail_block = 0; - arg.num = 0; - onig_foreach_name(RREGEXP(regexp)->ptr, reg_named_capture_assign_iter, (void*)&arg); - - if (arg.num == 0) - return match; - - return - block_append( - newline_node(match), - NEW_IF(gettable(rb_intern("$~")), - block_append( - newline_node(arg.succ_block), - newline_node( - NEW_CALL( - gettable(rb_intern("$~")), - rb_intern("begin"), - NEW_LIST(NEW_LIT(INT2FIX(0)))))), - block_append( - newline_node(arg.fail_block), 
- newline_node( - NEW_LIT(Qnil))))); -} - -static VALUE -reg_compile_gen(struct parser_params* parser, VALUE str, int options) -{ - VALUE re; - VALUE err; - - reg_fragment_setenc(str, options); - err = rb_errinfo(); - re = rb_reg_compile(str, options & RE_OPTION_MASK); - if (NIL_P(re)) { - ID mesg = rb_intern("mesg"); - VALUE m = rb_attr_get(rb_errinfo(), mesg); - rb_set_errinfo(err); - if (!NIL_P(err)) { - rb_str_append(rb_str_cat(rb_attr_get(err, mesg), "\n", 1), m); - } - else { - compile_error(PARSER_ARG "%s", RSTRING_PTR(m)); - } - return Qnil; - } - return re; -} - -void -rb_gc_mark_parser(void) -{ -} - -NODE* -rb_parser_append_print(VALUE vparser, NODE *node) -{ - NODE *prelude = 0; - NODE *scope = node; - struct parser_params *parser; - - if (!node) return node; - - Data_Get_Struct(vparser, struct parser_params, parser); - - node = node->nd_body; - - if (nd_type(node) == NODE_PRELUDE) { - prelude = node; - node = node->nd_body; - } - - node = block_append(node, - NEW_FCALL(rb_intern("print"), - NEW_ARRAY(NEW_GVAR(rb_intern("$_"))))); - if (prelude) { - prelude->nd_body = node; - scope->nd_body = prelude; - } - else { - scope->nd_body = node; - } - - return scope; -} - -NODE * -rb_parser_while_loop(VALUE vparser, NODE *node, int chop, int split) -{ - NODE *prelude = 0; - NODE *scope = node; - struct parser_params *parser; - - if (!node) return node; - - Data_Get_Struct(vparser, struct parser_params, parser); - - node = node->nd_body; - - if (nd_type(node) == NODE_PRELUDE) { - prelude = node; - node = node->nd_body; - } - if (split) { - node = block_append(NEW_GASGN(rb_intern("$F"), - NEW_CALL(NEW_GVAR(rb_intern("$_")), - rb_intern("split"), 0)), - node); - } - if (chop) { - node = block_append(NEW_CALL(NEW_GVAR(rb_intern("$_")), - rb_intern("chop!"), 0), node); - } - - node = NEW_OPT_N(node); - - if (prelude) { - prelude->nd_body = node; - scope->nd_body = prelude; - } - else { - scope->nd_body = node; - } - - return scope; -} - -static const struct { - ID 
token; - const char *name; -} op_tbl[] = { - {tDOT2, ".."}, - {tDOT3, "..."}, - {'+', "+(binary)"}, - {'-', "-(binary)"}, - {tPOW, "**"}, - {tUPLUS, "+@"}, - {tUMINUS, "-@"}, - {tCMP, "<=>"}, - {tGEQ, ">="}, - {tLEQ, "<="}, - {tEQ, "=="}, - {tEQQ, "==="}, - {tNEQ, "!="}, - {tMATCH, "=~"}, - {tNMATCH, "!~"}, - {tAREF, "[]"}, - {tASET, "[]="}, - {tLSHFT, "<<"}, - {tRSHFT, ">>"}, - {tCOLON2, "::"}, -}; - -#define op_tbl_count (sizeof(op_tbl) / sizeof(op_tbl[0])) - -static struct symbols { - ID last_id; - st_table *sym_id; - st_table *id_str; - st_table *ivar2_id; - st_table *id_ivar2; - VALUE op_sym[tLAST_TOKEN]; -} global_symbols = {tLAST_ID}; - -static const struct st_hash_type symhash = { - rb_str_hash_cmp, - rb_str_hash, -}; - -struct ivar2_key { - ID id; - VALUE klass; -}; - -static int -ivar2_cmp(struct ivar2_key *key1, struct ivar2_key *key2) -{ - if (key1->id == key2->id && key1->klass == key2->klass) { - return 0; - } - return 1; -} - -static int -ivar2_hash(struct ivar2_key *key) -{ - return (key->id << 8) ^ (key->klass >> 2); -} - -static const struct st_hash_type ivar2_hash_type = { - ivar2_cmp, - ivar2_hash, -}; - -void -Init_sym(void) -{ - global_symbols.sym_id = st_init_table_with_size(&symhash, 1000); - global_symbols.id_str = st_init_numtable_with_size(1000); - global_symbols.ivar2_id = st_init_table_with_size(&ivar2_hash_type, 1000); - global_symbols.id_ivar2 = st_init_numtable_with_size(1000); - - Init_id(); -} - -void -rb_gc_mark_symbols(void) -{ - rb_mark_tbl(global_symbols.id_str); - rb_gc_mark_locations(global_symbols.op_sym, - global_symbols.op_sym + tLAST_TOKEN); -} - -static ID -internal_id_gen(struct parser_params *parser) -{ - ID id = (ID)vtable_size(lvtbl->args) + (ID)vtable_size(lvtbl->vars); - id += ((tLAST_TOKEN - ID_INTERNAL) >> ID_SCOPE_SHIFT) + 1; - return ID_INTERNAL | (id << ID_SCOPE_SHIFT); -} - -static int -is_special_global_name(const char *m, const char *e, rb_encoding *enc) -{ - int mb = 0; - - if (m >= e) return 0; - switch 
(*m) { - case '~': case '*': case '$': case '?': case '!': case '@': - case '/': case '\\': case ';': case ',': case '.': case '=': - case ':': case '<': case '>': case '\"': - case '&': case '`': case '\'': case '+': - case '0': - ++m; - break; - case '-': - ++m; - if (m < e && is_identchar(m, e, enc)) { - if (!ISASCII(*m)) mb = 1; - m += rb_enc_mbclen(m, e, enc); - } - break; - default: - if (!rb_enc_isdigit(*m, enc)) return 0; - do { - if (!ISASCII(*m)) mb = 1; - ++m; - } while (rb_enc_isdigit(*m, enc)); - } - return m == e ? mb + 1 : 0; -} - -int -rb_symname_p(const char *name) -{ - return rb_enc_symname_p(name, rb_ascii8bit_encoding()); -} - -int -rb_enc_symname_p(const char *name, rb_encoding *enc) -{ - return rb_enc_symname2_p(name, strlen(name), enc); -} - -int -rb_enc_symname2_p(const char *name, int len, rb_encoding *enc) -{ - const char *m = name; - const char *e = m + len; - int localid = Qfalse; - - if (!m) return Qfalse; - switch (*m) { - case '\0': - return Qfalse; - - case '$': - if (is_special_global_name(++m, e, enc)) return Qtrue; - goto id; - - case '@': - if (*++m == '@') ++m; - goto id; - - case '<': - switch (*++m) { - case '<': ++m; break; - case '=': if (*++m == '>') ++m; break; - default: break; - } - break; - - case '>': - switch (*++m) { - case '>': case '=': ++m; break; - } - break; - - case '=': - switch (*++m) { - case '~': ++m; break; - case '=': if (*++m == '=') ++m; break; - default: return Qfalse; - } - break; - - case '*': - if (*++m == '*') ++m; - break; - - case '+': case '-': - if (*++m == '@') ++m; - break; - - case '|': case '^': case '&': case '/': case '%': case '~': case '`': - ++m; - break; - - case '[': - if (*++m != ']') return Qfalse; - if (*++m == '=') ++m; - break; - - case '!': - switch (*++m) { - case '\0': return Qtrue; - case '=': case '~': ++m; break; - default: return Qfalse; - } - break; - - default: - localid = !rb_enc_isupper(*m, enc); - id: - if (m >= e || (*m != '_' && !rb_enc_isalpha(*m, enc) && 
ISASCII(*m))) - return Qfalse; - while (m < e && is_identchar(m, e, enc)) m += rb_enc_mbclen(m, e, enc); - if (localid) { - switch (*m) { - case '!': case '?': case '=': ++m; - } - } - break; - } - return *m ? Qfalse : Qtrue; -} - -static ID -register_symid(ID id, const char *name, long len, rb_encoding *enc) -{ - VALUE str = rb_enc_str_new(name, len, enc); - OBJ_FREEZE(str); - st_add_direct(global_symbols.sym_id, (st_data_t)str, id); - st_add_direct(global_symbols.id_str, id, (st_data_t)str); - return id; -} - -ID -rb_intern3(const char *name, long len, rb_encoding *enc) -{ - const char *m = name; - const char *e = m + len; - unsigned char c; - VALUE str; - ID id; - int last; - int mb; - struct RString fake_str; - fake_str.basic.flags = T_STRING|RSTRING_NOEMBED|FL_FREEZE; - fake_str.basic.klass = rb_cString; - fake_str.as.heap.len = len; - fake_str.as.heap.ptr = (char *)name; - fake_str.as.heap.aux.capa = len; - str = (VALUE)&fake_str; - rb_enc_associate(str, enc); - - if (st_lookup(global_symbols.sym_id, str, (st_data_t *)&id)) - return id; - - if (rb_cString && !rb_enc_asciicompat(enc)) { - id = ID_JUNK; - goto new_id; - } - last = len-1; - id = 0; - switch (*m) { - case '$': - id |= ID_GLOBAL; - if ((mb = is_special_global_name(++m, e, enc)) != 0) { - if (!--mb) enc = rb_ascii8bit_encoding(); - goto new_id; - } - break; - case '@': - if (m[1] == '@') { - m++; - id |= ID_CLASS; - } - else { - id |= ID_INSTANCE; - } - m++; - break; - default: - c = m[0]; - if (c != '_' && rb_enc_isascii(c, enc) && rb_enc_ispunct(c, enc)) { - /* operators */ - int i; - - if (len == 1) { - id = c; - goto id_register; - } - for (i = 0; i < op_tbl_count; i++) { - if (*op_tbl[i].name == *m && - strcmp(op_tbl[i].name, m) == 0) { - id = op_tbl[i].token; - goto id_register; - } - } - } - - if (m[last] == '=') { - /* attribute assignment */ - id = rb_intern3(name, last, enc); - if (id > tLAST_TOKEN && !is_attrset_id(id)) { - enc = rb_enc_get(rb_id2str(id)); - id = rb_id_attrset(id); - 
goto id_register; - } - id = ID_ATTRSET; - } - else if (rb_enc_isupper(m[0], enc)) { - id = ID_CONST; - } - else { - id = ID_LOCAL; - } - break; - } - mb = 0; - if (!rb_enc_isdigit(*m, enc)) { - while (m <= name + last && is_identchar(m, e, enc)) { - if (ISASCII(*m)) { - m++; - } - else { - mb = 1; - m += rb_enc_mbclen(m, e, enc); - } - } - } - if (m - name < len) id = ID_JUNK; - if (enc != rb_usascii_encoding()) { - /* - * this clause makes sense only when called from other than - * rb_intern_str() taking care of code-range. - */ - if (!mb) { - for (; m <= name + len; ++m) { - if (!ISASCII(*m)) goto mbstr; - } - enc = rb_usascii_encoding(); - } - mbstr:; - } - new_id: - id |= ++global_symbols.last_id << ID_SCOPE_SHIFT; - id_register: - return register_symid(id, name, len, enc); -} - -ID -rb_intern2(const char *name, long len) -{ - return rb_intern3(name, len, rb_usascii_encoding()); -} - -#undef rb_intern -ID -rb_intern(const char *name) -{ - return rb_intern2(name, strlen(name)); -} - -ID -rb_intern_str(VALUE str) -{ - rb_encoding *enc; - ID id; - - if (rb_enc_str_coderange(str) == ENC_CODERANGE_7BIT) { - enc = rb_usascii_encoding(); - } - else { - enc = rb_enc_get(str); - } - id = rb_intern3(RSTRING_PTR(str), RSTRING_LEN(str), enc); - RB_GC_GUARD(str); - return id; -} - -VALUE -rb_id2str(ID id) -{ - st_data_t data; - - if (id < tLAST_TOKEN) { - int i = 0; - - if (rb_ispunct(id)) { - VALUE str = global_symbols.op_sym[i = (int)id]; - if (!str) { - char name[2]; - name[0] = (char)id; - name[1] = 0; - str = rb_usascii_str_new(name, 1); - OBJ_FREEZE(str); - global_symbols.op_sym[i] = str; - } - return str; - } - for (i = 0; i < op_tbl_count; i++) { - if (op_tbl[i].token == id) { - VALUE str = global_symbols.op_sym[i]; - if (!str) { - str = rb_usascii_str_new2(op_tbl[i].name); - OBJ_FREEZE(str); - global_symbols.op_sym[i] = str; - } - return str; - } - } - } - - if (st_lookup(global_symbols.id_str, id, &data)) { - VALUE str = (VALUE)data; - if (RBASIC(str)->klass == 
0) - RBASIC(str)->klass = rb_cString; - return str; - } - - if (is_attrset_id(id)) { - ID id2 = (id & ~ID_SCOPE_MASK) | ID_LOCAL; - VALUE str; - - while (!(str = rb_id2str(id2))) { - if (!is_local_id(id2)) return 0; - id2 = (id & ~ID_SCOPE_MASK) | ID_CONST; - } - str = rb_str_dup(str); - rb_str_cat(str, "=", 1); - rb_intern_str(str); - if (st_lookup(global_symbols.id_str, id, &data)) { - VALUE str = (VALUE)data; - if (RBASIC(str)->klass == 0) - RBASIC(str)->klass = rb_cString; - return str; - } - } - return 0; -} - -const char * -rb_id2name(ID id) -{ - VALUE str = rb_id2str(id); - - if (!str) return 0; - return RSTRING_PTR(str); -} - -static int -symbols_i(VALUE sym, ID value, VALUE ary) -{ - rb_ary_push(ary, ID2SYM(value)); - return ST_CONTINUE; -} - -/* - * call-seq: - * Symbol.all_symbols => array - * - * Returns an array of all the symbols currently in Ruby's symbol - * table. - * - * Symbol.all_symbols.size #=> 903 - * Symbol.all_symbols[1,20] #=> [:floor, :ARGV, :Binding, :symlink, - * :chown, :EOFError, :$;, :String, - * :LOCK_SH, :"setuid?", :$<, - * :default_proc, :compact, :extend, - * :Tms, :getwd, :$=, :ThreadGroup, - * :wait2, :$>] - */ - -VALUE -rb_sym_all_symbols(void) -{ - VALUE ary = rb_ary_new2(global_symbols.sym_id->num_entries); - - st_foreach(global_symbols.sym_id, symbols_i, ary); - return ary; -} - -int -rb_is_const_id(ID id) -{ - if (is_const_id(id)) return Qtrue; - return Qfalse; -} - -int -rb_is_class_id(ID id) -{ - if (is_class_id(id)) return Qtrue; - return Qfalse; -} - -int -rb_is_instance_id(ID id) -{ - if (is_instance_id(id)) return Qtrue; - return Qfalse; -} - -int -rb_is_local_id(ID id) -{ - if (is_local_id(id)) return Qtrue; - return Qfalse; -} - -int -rb_is_junk_id(ID id) -{ - if (is_junk_id(id)) return Qtrue; - return Qfalse; -} - -#endif /* !RIPPER */ - -static void -parser_initialize(struct parser_params *parser) -{ - parser->eofp = Qfalse; - - parser->parser_lex_strterm = 0; - parser->parser_cond_stack = 0; - 
parser->parser_cmdarg_stack = 0; - parser->parser_class_nest = 0; - parser->parser_paren_nest = 0; - parser->parser_lpar_beg = 0; - parser->parser_in_single = 0; - parser->parser_in_def = 0; - parser->parser_in_defined = 0; - parser->parser_compile_for_eval = 0; - parser->parser_cur_mid = 0; - parser->parser_tokenbuf = NULL; - parser->parser_tokidx = 0; - parser->parser_toksiz = 0; - parser->parser_heredoc_end = 0; - parser->parser_command_start = Qtrue; - parser->parser_deferred_nodes = 0; - parser->parser_lex_pbeg = 0; - parser->parser_lex_p = 0; - parser->parser_lex_pend = 0; - parser->parser_lvtbl = 0; - parser->parser_ruby__end__seen = 0; - parser->parser_ruby_sourcefile = 0; -#ifndef RIPPER - parser->is_ripper = 0; - parser->parser_eval_tree_begin = 0; - parser->parser_eval_tree = 0; -#else - parser->is_ripper = 1; - parser->parser_ruby_sourcefile_string = Qnil; - parser->delayed = Qnil; - - parser->result = Qnil; - parser->parsing_thread = Qnil; - parser->toplevel_p = Qtrue; -#endif -#ifdef YYMALLOC - parser->heap = NULL; -#endif - parser->enc = rb_usascii_encoding(); -} - -#ifdef RIPPER -#define parser_mark ripper_parser_mark -#define parser_free ripper_parser_free -#endif - -static void -parser_mark(void *ptr) -{ - struct parser_params *p = (struct parser_params*)ptr; - - rb_gc_mark((VALUE)p->parser_lex_strterm); - rb_gc_mark((VALUE)p->parser_deferred_nodes); - rb_gc_mark(p->parser_lex_input); - rb_gc_mark(p->parser_lex_lastline); - rb_gc_mark(p->parser_lex_nextline); -#ifndef RIPPER - rb_gc_mark((VALUE)p->parser_eval_tree_begin) ; - rb_gc_mark((VALUE)p->parser_eval_tree) ; - rb_gc_mark(p->debug_lines); -#else - rb_gc_mark(p->parser_ruby_sourcefile_string); - rb_gc_mark(p->delayed); - rb_gc_mark(p->value); - rb_gc_mark(p->result); - rb_gc_mark(p->parsing_thread); -#endif -#ifdef YYMALLOC - rb_gc_mark((VALUE)p->heap); -#endif -} - -static void -parser_free(void *ptr) -{ - struct parser_params *p = (struct parser_params*)ptr; - struct local_vars *local, 
*prev; - - if (p->parser_tokenbuf) { - xfree(p->parser_tokenbuf); - } - for (local = p->parser_lvtbl; local; local = prev) { - if (local->vars) xfree(local->vars); - prev = local->prev; - xfree(local); - } -#ifndef RIPPER - xfree(p->parser_ruby_sourcefile); -#endif - xfree(p); -} - -VALUE rb_parser_get_yydebug(VALUE); -VALUE rb_parser_set_yydebug(VALUE, VALUE); - -#ifndef RIPPER -static struct parser_params * -parser_new(void) -{ - struct parser_params *p; - - p = ALLOC_N(struct parser_params, 1); - MEMZERO(p, struct parser_params, 1); - parser_initialize(p); - return p; -} - -VALUE -rb_parser_new(void) -{ - struct parser_params *p = parser_new(); - - return Data_Wrap_Struct(0, parser_mark, parser_free, p); -} - -/* - * call-seq: - * ripper#end_seen? -> Boolean - * - * Return if parsed source ended by +\_\_END\_\_+. - * This number starts from 1. - */ -VALUE -rb_parser_end_seen_p(VALUE vparser) -{ - struct parser_params *parser; - - Data_Get_Struct(vparser, struct parser_params, parser); - return ruby__end__seen ? Qtrue : Qfalse; -} - -/* - * call-seq: - * ripper#encoding -> encoding - * - * Return encoding of the source. - */ -VALUE -rb_parser_encoding(VALUE vparser) -{ - struct parser_params *parser; - - Data_Get_Struct(vparser, struct parser_params, parser); - return rb_enc_from_encoding(parser->enc); -} - -/* - * call-seq: - * ripper.yydebug -> true or false - * - * Get yydebug. - */ -VALUE -rb_parser_get_yydebug(VALUE self) -{ - struct parser_params *parser; - - Data_Get_Struct(self, struct parser_params, parser); - return yydebug ? Qtrue : Qfalse; -} - -/* - * call-seq: - * ripper.yydebug = flag - * - * Set yydebug. 
- */ -VALUE -rb_parser_set_yydebug(VALUE self, VALUE flag) -{ - struct parser_params *parser; - - Data_Get_Struct(self, struct parser_params, parser); - yydebug = RTEST(flag); - return flag; -} - -#ifdef YYMALLOC -#define HEAPCNT(n, size) ((n) * (size) / sizeof(YYSTYPE)) -#define NEWHEAP() rb_node_newnode(NODE_ALLOCA, 0, (VALUE)parser->heap, 0) -#define ADD2HEAP(n, c, p) ((parser->heap = (n))->u1.node = (p), \ - (n)->u3.cnt = (c), (p)) - -void * -rb_parser_malloc(struct parser_params *parser, size_t size) -{ - size_t cnt = HEAPCNT(1, size); - NODE *n = NEWHEAP(); - void *ptr = xmalloc(size); - - return ADD2HEAP(n, cnt, ptr); -} - -void * -rb_parser_calloc(struct parser_params *parser, size_t nelem, size_t size) -{ - size_t cnt = HEAPCNT(nelem, size); - NODE *n = NEWHEAP(); - void *ptr = xcalloc(nelem, size); - - return ADD2HEAP(n, cnt, ptr); -} - -void * -rb_parser_realloc(struct parser_params *parser, void *ptr, size_t size) -{ - NODE *n; - size_t cnt = HEAPCNT(1, size); - - if (ptr && (n = parser->heap) != NULL) { - do { - if (n->u1.node == ptr) { - n->u1.node = ptr = xrealloc(ptr, size); - if (n->u3.cnt) n->u3.cnt = cnt; - return ptr; - } - } while ((n = n->u2.node) != NULL); - } - n = NEWHEAP(); - ptr = xrealloc(ptr, size); - return ADD2HEAP(n, cnt, ptr); -} - -void -rb_parser_free(struct parser_params *parser, void *ptr) -{ - NODE **prev = &parser->heap, *n; - - while ((n = *prev) != NULL) { - if (n->u1.node == ptr) { - *prev = n->u2.node; - rb_gc_force_recycle((VALUE)n); - break; - } - prev = &n->u2.node; - } - xfree(ptr); -} -#endif -#endif - -#ifdef RIPPER -#ifdef RIPPER_DEBUG -extern int rb_is_pointer_to_heap(VALUE); - -/* :nodoc: */ -static VALUE -ripper_validate_object(VALUE self, VALUE x) -{ - if (x == Qfalse) return x; - if (x == Qtrue) return x; - if (x == Qnil) return x; - if (x == Qundef) - rb_raise(rb_eArgError, "Qundef given"); - if (FIXNUM_P(x)) return x; - if (SYMBOL_P(x)) return x; - if (!rb_is_pointer_to_heap(x)) - rb_raise(rb_eArgError, 
"invalid pointer: %p", x);
-    switch (TYPE(x)) {
-      case T_STRING:
-      case T_OBJECT:
-      case T_ARRAY:
-      case T_BIGNUM:
-      case T_FLOAT:
-        return x;
-      case T_NODE:
-        rb_raise(rb_eArgError, "NODE given: %p", x);
-      default:
-        rb_raise(rb_eArgError, "wrong type of ruby object: %p (%s)",
-                 x, rb_obj_classname(x));
-    }
-    return x;
-}
-#endif
-/* validate() expands to nothing here, so the validate(...) calls in the
- * dispatch helpers below have no effect. */
-#define validate(x)
-/* Call method `mid` on parser->value with no arguments and return the
- * value rb_funcall returns. */
-static VALUE
-ripper_dispatch0(struct parser_params *parser, ID mid)
-{
-    return rb_funcall(parser->value, mid, 0);
-}
-/* Call method `mid` on parser->value with the single argument `a` and
- * return the value rb_funcall returns. */
-static VALUE
-ripper_dispatch1(struct parser_params *parser, ID mid, VALUE a)
-{
-    validate(a);
-    return rb_funcall(parser->value, mid, 1, a);
-}
-/* Same as ripper_dispatch1, passing the two arguments `a`, `b` in order. */
-static VALUE
-ripper_dispatch2(struct parser_params *parser, ID mid, VALUE a, VALUE b)
-{
-    validate(a);
-    validate(b);
-    return rb_funcall(parser->value, mid, 2, a, b);
-}
-/* Same as ripper_dispatch1, passing the three arguments `a`..`c` in order. */
-static VALUE
-ripper_dispatch3(struct parser_params *parser, ID mid, VALUE a, VALUE b, VALUE c)
-{
-    validate(a);
-    validate(b);
-    validate(c);
-    return rb_funcall(parser->value, mid, 3, a, b, c);
-}
-/* Same as ripper_dispatch1, passing the four arguments `a`..`d` in order. */
-static VALUE
-ripper_dispatch4(struct parser_params *parser, ID mid, VALUE a, VALUE b, VALUE c, VALUE d)
-{
-    validate(a);
-    validate(b);
-    validate(c);
-    validate(d);
-    return rb_funcall(parser->value, mid, 4, a, b, c, d);
-}
-/* Same as ripper_dispatch1, passing the five arguments `a`..`e` in order. */
-static VALUE
-ripper_dispatch5(struct parser_params *parser, ID mid, VALUE a, VALUE b, VALUE c, VALUE d, VALUE e)
-{
-    validate(a);
-    validate(b);
-    validate(c);
-    validate(d);
-    validate(e);
-    return rb_funcall(parser->value, mid, 5, a, b, c, d, e);
-}
-/* Table pairing keyword/modifier token IDs with their source spelling.
- * Several IDs share one spelling (keyword_do, keyword_do_cond and
- * keyword_do_block are all "do"; modifier_if is "if", and so on).
- * The list ends with a {0, NULL} entry, which keyword_id_to_str uses as
- * its stop condition. */
-static const struct kw_assoc {
-    ID id;
-    const char *name;
-} keyword_to_name[] = {
-    {keyword_class, "class"},
-    {keyword_module, "module"},
-    {keyword_def, "def"},
-    {keyword_undef, "undef"},
-    {keyword_begin, "begin"},
-    {keyword_rescue, "rescue"},
-    {keyword_ensure, "ensure"},
-    {keyword_end, "end"},
-    {keyword_if, "if"},
-    {keyword_unless, "unless"},
-    {keyword_then, "then"},
-    {keyword_elsif, "elsif"},
-    {keyword_else, "else"},
-    {keyword_case, "case"},
-    {keyword_when, "when"},
-    {keyword_while, "while"},
-    {keyword_until, "until"},
-    {keyword_for, "for"},
-    {keyword_break, "break"},
-    {keyword_next, "next"},
-    {keyword_redo, "redo"},
-    {keyword_retry, "retry"},
-    {keyword_in, "in"},
-    {keyword_do, "do"},
-    {keyword_do_cond, "do"},
-    {keyword_do_block, "do"},
-    {keyword_return, "return"},
-    {keyword_yield, "yield"},
-    {keyword_super, "super"},
-    {keyword_self, "self"},
-    {keyword_nil, "nil"},
-    {keyword_true, "true"},
-    {keyword_false, "false"},
-    {keyword_and, "and"},
-    {keyword_or, "or"},
-    {keyword_not, "not"},
-    {modifier_if, "if"},
-    {modifier_unless, "unless"},
-    {modifier_while, "while"},
-    {modifier_until, "until"},
-    {modifier_rescue, "rescue"},
-    {keyword_alias, "alias"},
-    {keyword_defined, "defined?"},
-    {keyword_BEGIN, "BEGIN"},
-    {keyword_END, "END"},
-    {keyword__LINE__, "__LINE__"},
-    {keyword__FILE__, "__FILE__"},
-    {keyword__ENCODING__, "__ENCODING__"},
-    {0, NULL}
-};
-/* Linear search of keyword_to_name for `id`.
- * Returns the matching spelling, or NULL when the ID is not in the table. */
-static const char*
-keyword_id_to_str(ID id)
-{
-    const struct kw_assoc *a;
-
-    for (a = keyword_to_name; a->id; a++) {	/* stops at the {0, NULL} entry */
-        if (a->id == id)
-            return a->name;
-    }
-    return NULL;
-}
-/* Convert a token ID to a Ruby Symbol.  The cases are tried in this order:
- *   1. id <= 256: the symbol of the one-character string made from id;
- *   2. an ID listed in keyword_to_name: the symbol of its spelling;
- *   3. tOROP gives "||" and tANDOP gives "&&";
- *   4. anything else goes through rb_id2name; a NULL result is reported
- *      with rb_bug.
- * buf has 8 bytes but only buf[0] and buf[1] are written.
- * NOTE(review): the rb_bug format uses %ld while the argument is cast to
- * unsigned long; %lu would match the cast -- confirm.
- * NOTE(review): id == 256 passes the first test although buf[0] is a
- * single char -- confirm whether `< 256` was intended. */
-#undef ripper_id2sym
-static VALUE
-ripper_id2sym(ID id)
-{
-    const char *name;
-    char buf[8];
-
-    if (id <= 256) {
-        buf[0] = id;
-        buf[1] = '\0';
-        return ID2SYM(rb_intern(buf));
-    }
-    if ((name = keyword_id_to_str(id))) {
-        return ID2SYM(rb_intern(name));
-    }
-    switch (id) {
-      case tOROP:
-        name = "||";
-        break;
-      case tANDOP:
-        name = "&&";
-        break;
-      default:
-        name = rb_id2name(id);
-        if (!name) {
-            rb_bug("cannot convert ID to string: %ld", (unsigned long)id);
-        }
-        break;
-    }
-    return ID2SYM(rb_intern(name));
-}
-/* Intern the C string `s` and return it as a Symbol. */
-static VALUE
-ripper_intern(const char *s)
-{
-    return ID2SYM(rb_intern(s));
-}
-/* Build a string from `fmt` and the variadic arguments with rb_vsprintf,
- * then pass it as the only argument to the `compile_error` method of
- * parser->value. */
-static void
-ripper_compile_error(struct parser_params *parser, const char *fmt, ...)
-{
-    VALUE str;
-    va_list args;
-
-    va_start(args, fmt);
-    str = rb_vsprintf(fmt, args);
-    va_end(args);
-    rb_funcall(parser->value, rb_intern("compile_error"), 1, str);
-}
-/* Call `warn` on parser->value with `fmt` converted by STR_NEW2.
- * No formatting is done here; `fmt` is passed as given. */
-static void
-ripper_warn0(struct parser_params *parser, const char *fmt)
-{
-    rb_funcall(parser->value, rb_intern("warn"), 1, STR_NEW2(fmt));
-}
-/* Call `warn` on parser->value with two arguments: `fmt` as a string and
- * `a` converted by INT2NUM.  The two are passed separately, unformatted. */
-static void
-ripper_warnI(struct parser_params *parser, const char *fmt, int a)
-{
-    rb_funcall(parser->value, rb_intern("warn"), 2,
-               STR_NEW2(fmt), INT2NUM(a));
-}
-/* Compiled out by #if 0: string-argument variant of ripper_warnI. */
-#if 0
-static void
-ripper_warnS(struct parser_params *parser, const char *fmt, const char *str)
-{
-    rb_funcall(parser->value, rb_intern("warn"), 2,
-               STR_NEW2(fmt), STR_NEW2(str));
-}
-#endif
-/* Like ripper_warn0, but calls the `warning` method. */
-static void
-ripper_warning0(struct parser_params *parser, const char *fmt)
-{
-    rb_funcall(parser->value, rb_intern("warning"), 1, STR_NEW2(fmt));
-}
-/* Call `warning` on parser->value with `fmt` and `str`, each converted by
- * STR_NEW2 and passed as separate arguments. */
-static void
-ripper_warningS(struct parser_params *parser, const char *fmt, const char *str)
-{
-    rb_funcall(parser->value, rb_intern("warning"), 2,
-               STR_NEW2(fmt), STR_NEW2(str));
-}
-/* Line reader installed by ripper_initialize when the source object
- * responds to ripper_id_gets: calls that method on `src` with no
- * arguments and returns the result.  `parser` is not used. */
-static VALUE
-ripper_lex_get_generic(struct parser_params *parser, VALUE src)
-{
-    return rb_funcall(src, ripper_id_gets, 0);
-}
-/* Allocator for Ripper objects (registered in Init_ripper with
- * rb_define_alloc_func).  Allocates one struct parser_params, zero-fills
- * it, wraps it with parser_mark / parser_free as the mark and free
- * functions, and stores the wrapper object in p->value. */
-static VALUE
-ripper_s_allocate(VALUE klass)
-{
-    struct parser_params *p;
-    VALUE self;
-
-    p = ALLOC_N(struct parser_params, 1);
-    MEMZERO(p, struct parser_params, 1);
-    self = Data_Wrap_Struct(klass, parser_mark, parser_free, p);
-    p->value = self;
-    return self;
-}
-/* Nonzero once parser_lex_input has been set; ripper_initialize sets it. */
-#define ripper_initialized_p(r) ((r)->parser_lex_input != 0)
-
-/*
- *  call-seq:
- *    Ripper.new(src, filename="(ripper)", lineno=1) -> ripper
- *
- *  Create a new Ripper object.
- *  _src_ must be a String, an IO, or an Object which has a #gets method.
- *
- *  This method does not start parsing.
- *  See also Ripper#parse and Ripper.parse.
- */
-static VALUE
-ripper_initialize(int argc, VALUE *argv, VALUE self)
-{
-    struct parser_params *parser;
-    VALUE src, fname, lineno;
-
-    Data_Get_Struct(self, struct parser_params, parser);
-    rb_scan_args(argc, argv, "12", &src, &fname, &lineno);	/* src required; fname, lineno optional */
-    if (rb_obj_respond_to(src, ripper_id_gets, 0)) {
-        parser->parser_lex_gets = ripper_lex_get_generic;
-    }
-    else {
-        StringValue(src);	/* anything without the gets method must convert to a String */
-        parser->parser_lex_gets = lex_get_str;
-    }
-    parser->parser_lex_input = src;
-    parser->eofp = Qfalse;
-    if (NIL_P(fname)) {
-        fname = STR_NEW2("(ripper)");
-    }
-    else {
-        StringValue(fname);
-    }
-    parser_initialize(parser);
-
-    parser->parser_ruby_sourcefile_string = fname;
-    parser->parser_ruby_sourcefile = RSTRING_PTR(fname);
-    parser->parser_ruby_sourceline = NIL_P(lineno) ? 0 : NUM2INT(lineno) - 1;	/* stored as lineno - 1; 0 when lineno is nil */
-
-    return Qnil;
-}
-
-extern VALUE rb_thread_pass(void);
-/* NOTE(review): struct ripper_args is not referenced anywhere in the part
- * of the file visible here -- confirm whether it is still needed. */
-struct ripper_args {
-    struct parser_params *parser;
-    int argc;
-    VALUE *argv;
-};
-/* Body function that ripper_parse hands to rb_ensure: unwraps the parser,
- * runs parser_prepare and ripper_yyparse, and returns parser->result. */
-static VALUE
-ripper_parse0(VALUE parser_v)
-{
-    struct parser_params *parser;
-
-    Data_Get_Struct(parser_v, struct parser_params, parser);
-    parser_prepare(parser);
-    ripper_yyparse((void*)parser);
-    return parser->result;
-}
-/* Ensure function that ripper_parse hands to rb_ensure: resets
- * parsing_thread to nil so the object can be parsed again. */
-static VALUE
-ripper_ensure(VALUE parser_v)
-{
-    struct parser_params *parser;
-
-    Data_Get_Struct(parser_v, struct parser_params, parser);
-    parser->parsing_thread = Qnil;
-    return Qnil;
-}
-
-/*
- *  call-seq:
- *    ripper#parse
- *
- *  Start parsing and returns the value of the root action.
- */
-static VALUE
-ripper_parse(VALUE self)
-{
-    struct parser_params *parser;
-    /* Raises ArgumentError when the object has not been initialized, or
-     * when parsing_thread is already set: one message if it is the
-     * current thread (reentrant call), another if it is a different one. */
-    Data_Get_Struct(self, struct parser_params, parser);
-    if (!ripper_initialized_p(parser)) {
-        rb_raise(rb_eArgError, "method called for uninitialized object");
-    }
-    if (!NIL_P(parser->parsing_thread)) {
-        if (parser->parsing_thread == rb_thread_current())
-            rb_raise(rb_eArgError, "Ripper#parse is not reentrant");
-        else
-            rb_raise(rb_eArgError, "Ripper#parse is not multithread-safe");
-    }
-    parser->parsing_thread = rb_thread_current();	/* marks the parse as in progress */
-    rb_ensure(ripper_parse0, self, ripper_ensure, self);	/* ripper_ensure resets parsing_thread to nil */
-
-    return parser->result;
-}
-
-/*
- *  call-seq:
- *    ripper#column   -> Integer or nil
- *
- *  Return column number of current parsing line.
- *  This number starts from 0.
- *
- *  Returns nil when no parse is in progress (parsing_thread is nil).
- *  Raises ArgumentError when the object has not been initialized.
- */
-static VALUE
-ripper_column(VALUE self)
-{
-    struct parser_params *parser;
-    long col;
-
-    Data_Get_Struct(self, struct parser_params, parser);
-    if (!ripper_initialized_p(parser)) {
-        rb_raise(rb_eArgError, "method called for uninitialized object");
-    }
-    if (NIL_P(parser->parsing_thread)) return Qnil;
-    col = parser->tokp - parser->parser_lex_pbeg;	/* distance of tokp from parser_lex_pbeg */
-    return LONG2NUM(col);
-}
-
-/*
- *  call-seq:
- *    ripper#lineno   -> Integer
- *
- *  Return line number of current parsing line.
- *  This number starts from 1.
- */
-static VALUE
-ripper_lineno(VALUE self)
-{
-    struct parser_params *parser;
-    /* Raises ArgumentError when the object has not been initialized. */
-    Data_Get_Struct(self, struct parser_params, parser);
-    if (!ripper_initialized_p(parser)) {
-        rb_raise(rb_eArgError, "method called for uninitialized object");
-    }
-    if (NIL_P(parser->parsing_thread)) return Qnil;	/* nil when no parse is in progress */
-    return INT2NUM(parser->parser_ruby_sourceline);
-}
-/* The two helpers below exist only when RIPPER_DEBUG is defined. */
-#ifdef RIPPER_DEBUG
-/* :nodoc:
- * Raises ArgumentError carrying `msg` when `obj` is Qundef; otherwise
- * returns nil.  `msg` is converted with StringValue first. */
-static VALUE
-ripper_assert_Qundef(VALUE self, VALUE obj, VALUE msg)
-{
-    StringValue(msg);
-    if (obj == Qundef) {
-        rb_raise(rb_eArgError, "%s", RSTRING_PTR(msg));
-    }
-    return Qnil;
-}
-
-/* :nodoc:
- * Returns the VALUE word of `obj` itself, converted with ULONG2NUM. */
-static VALUE
-ripper_value(VALUE self, VALUE obj)
-{
-    return ULONG2NUM(obj);
-}
-#endif
-/* Extension entry point.  Defines class Ripper under rb_cObject with its
- * Version constant, allocator and instance methods.  When RIPPER_DEBUG is
- * defined it also adds three debugging methods to Kernel.  Finally it
- * interns "gets" into ripper_id_gets, runs the two event-id initializers
- * and interns "||" and "&&". */
-void
-Init_ripper(void)
-{
-    VALUE Ripper;
-
-    Ripper = rb_define_class("Ripper", rb_cObject);
-    rb_define_const(Ripper, "Version", rb_usascii_str_new2(RIPPER_VERSION));
-    rb_define_alloc_func(Ripper, ripper_s_allocate);
-    rb_define_method(Ripper, "initialize", ripper_initialize, -1);	/* -1: receives argc/argv */
-    rb_define_method(Ripper, "parse", ripper_parse, 0);
-    rb_define_method(Ripper, "column", ripper_column, 0);
-    rb_define_method(Ripper, "lineno", ripper_lineno, 0);
-    rb_define_method(Ripper, "end_seen?", rb_parser_end_seen_p, 0);
-    rb_define_method(Ripper, "encoding", rb_parser_encoding, 0);
-    rb_define_method(Ripper, "yydebug", rb_parser_get_yydebug, 0);
-    rb_define_method(Ripper, "yydebug=", rb_parser_set_yydebug, 1);
-#ifdef RIPPER_DEBUG
-    rb_define_method(rb_mKernel, "assert_Qundef", ripper_assert_Qundef, 2);
-    rb_define_method(rb_mKernel, "rawVALUE", ripper_value, 1);
-    rb_define_method(rb_mKernel, "validate_object", ripper_validate_object, 1);
-#endif
-
-    ripper_id_gets = rb_intern("gets");
-    ripper_init_eventids1(Ripper);
-    ripper_init_eventids2(Ripper);
-    /* make sure the names ripper_id2sym uses for tOROP and tANDOP already
-     * exist in the symbol table */
-    rb_intern("||");
-    rb_intern("&&");
-}
-#endif /* RIPPER */ |