/* This is a wrapper for parse.y */ #include "internal/re.h" #include "internal/ruby_parser.h" #include "node.h" #include "rubyparser.h" #include "internal/error.h" #ifdef UNIVERSAL_PARSER #include "internal.h" #include "internal/array.h" #include "internal/bignum.h" #include "internal/compile.h" #include "internal/complex.h" #include "internal/encoding.h" #include "internal/gc.h" #include "internal/hash.h" #include "internal/io.h" #include "internal/parse.h" #include "internal/rational.h" #include "internal/re.h" #include "internal/string.h" #include "internal/symbol.h" #include "internal/thread.h" #include "ruby/ractor.h" #include "ruby/ruby.h" #include "ruby/util.h" #include "internal.h" #include "vm_core.h" #include "symbol.h" struct ruby_parser { rb_parser_t *parser_params; }; static void parser_mark(void *ptr) { struct ruby_parser *parser = (struct ruby_parser*)ptr; rb_ruby_parser_mark(parser->parser_params); } static void parser_free(void *ptr) { struct ruby_parser *parser = (struct ruby_parser*)ptr; rb_ruby_parser_free(parser->parser_params); } static size_t parser_memsize(const void *ptr) { struct ruby_parser *parser = (struct ruby_parser*)ptr; return rb_ruby_parser_memsize(parser->parser_params); } static const rb_data_type_t ruby_parser_data_type = { "parser", { parser_mark, parser_free, parser_memsize, }, 0, 0, RUBY_TYPED_FREE_IMMEDIATELY }; static int is_ascii_string2(VALUE str) { return is_ascii_string(str); } RBIMPL_ATTR_FORMAT(RBIMPL_PRINTF_FORMAT, 6, 0) static VALUE syntax_error_append(VALUE exc, VALUE file, int line, int column, void *enc, const char *fmt, va_list args) { return rb_syntax_error_append(exc, file, line, column, (rb_encoding *)enc, fmt, args); } static int local_defined(ID id, const void *p) { return rb_local_defined(id, (const rb_iseq_t *)p); } static int dvar_defined(ID id, const void *p) { return rb_dvar_defined(id, (const rb_iseq_t *)p); } static bool hash_literal_key_p(VALUE k) { switch (OBJ_BUILTIN_TYPE(k)) { case T_NODE: return false; default: return true; } } static int literal_cmp(VALUE val, VALUE lit) { if (val == lit) return 0; if (!hash_literal_key_p(val) || !hash_literal_key_p(lit)) return -1; return rb_iseq_cdhash_cmp(val, lit); } static st_index_t literal_hash(VALUE a) { if (!hash_literal_key_p(a)) return (st_index_t)a; return rb_iseq_cdhash_hash(a); } static int is_usascii_enc(void *enc) { return rb_is_usascii_enc((rb_encoding *)enc); } static int is_local_id2(ID id) { return is_local_id(id); } static int is_attrset_id2(ID id) { return is_attrset_id(id); } static int is_notop_id2(ID id) { return is_notop_id(id); } static VALUE enc_str_new(const char *ptr, long len, void *enc) { return rb_enc_str_new(ptr, len, (rb_encoding *)enc); } static int enc_isalnum(OnigCodePoint c, void *enc) { return rb_enc_isalnum(c, (rb_encoding *)enc); } static int enc_precise_mbclen(const char *p, const char *e, void *enc) { return rb_enc_precise_mbclen(p, e, (rb_encoding *)enc); } static int mbclen_charfound_p(int len) { return MBCLEN_CHARFOUND_P(len); } static int mbclen_charfound_len(int len) { return MBCLEN_CHARFOUND_LEN(len); } static const char * enc_name(void *enc) { return rb_enc_name((rb_encoding *)enc); } static char * enc_prev_char(const char *s, const char *p, const char *e, void *enc) { return rb_enc_prev_char(s, p, e, (rb_encoding *)enc); } static void * enc_get(VALUE obj) { return (void *)rb_enc_get(obj); } static int enc_asciicompat(void *enc) { return rb_enc_asciicompat((rb_encoding *)enc); } static void * utf8_encoding(void) { return (void *)rb_utf8_encoding(); } static VALUE enc_associate(VALUE obj, void *enc) { return rb_enc_associate(obj, (rb_encoding *)enc); } static void * ascii8bit_encoding(void) { return (void *)rb_ascii8bit_encoding(); } static int enc_codelen(int c, void *enc) { return rb_enc_codelen(c, (rb_encoding *)enc); } static VALUE enc_str_buf_cat(VALUE str, const char *ptr, long len, void *enc) { return rb_enc_str_buf_cat(str, ptr, len, (rb_encoding *)enc); } static int enc_mbcput(unsigned int c, void *buf, void *enc) { return rb_enc_mbcput(c, buf, (rb_encoding *)enc); } static void * enc_from_index(int idx) { return (void *)rb_enc_from_index(idx); } static int enc_isspace(OnigCodePoint c, void *enc) { return rb_enc_isspace(c, (rb_encoding *)enc); } static ID intern3(const char *name, long len, void *enc) { return rb_intern3(name, len, (rb_encoding *)enc); } static void * enc_compatible(VALUE str1, VALUE str2) { return (void *)rb_enc_compatible(str1, str2); } static VALUE enc_from_encoding(void *enc) { return rb_enc_from_encoding((rb_encoding *)enc); } static int encoding_get(VALUE obj) { return ENCODING_GET(obj); } static void encoding_set(VALUE obj, int encindex) { ENCODING_SET(obj, encindex); } static int encoding_is_ascii8bit(VALUE obj) { return ENCODING_IS_ASCII8BIT(obj); } static void * usascii_encoding(void) { return (void *)rb_usascii_encoding(); } static int enc_symname_type(const char *name, long len, void *enc, unsigned int allowed_attrset) { return rb_enc_symname_type(name, len, (rb_encoding *)enc, allowed_attrset); } typedef struct { struct parser_params *parser; rb_encoding *enc; NODE *succ_block; const rb_code_location_t *loc; } reg_named_capture_assign_t; static int reg_named_capture_assign_iter(const OnigUChar *name, const OnigUChar *name_end, int back_num, int *back_refs, OnigRegex regex, void *arg0) { reg_named_capture_assign_t *arg = (reg_named_capture_assign_t*)arg0; struct parser_params* p = arg->parser; rb_encoding *enc = arg->enc; const rb_code_location_t *loc = arg->loc; long len = name_end - name; const char *s = (const char *)name; return rb_reg_named_capture_assign_iter_impl(p, s, len, (void *)enc, &arg->succ_block, loc); } static NODE * reg_named_capture_assign(struct parser_params* p, VALUE regexp, const rb_code_location_t *loc) { reg_named_capture_assign_t arg; arg.parser = p; arg.enc = rb_enc_get(regexp); arg.succ_block = 0; arg.loc = loc; onig_foreach_name(RREGEXP_PTR(regexp), reg_named_capture_assign_iter, &arg); if (!arg.succ_block) return 0; return RNODE_BLOCK(arg.succ_block)->nd_next; } static VALUE rbool(VALUE v) { return RBOOL(v); } static int undef_p(VALUE v) { return RB_UNDEF_P(v); } static int rtest(VALUE obj) { return (int)RB_TEST(obj); } static int nil_p(VALUE obj) { return (int)NIL_P(obj); } static VALUE syntax_error_new(void) { return rb_class_new_instance(0, 0, rb_eSyntaxError); } static VALUE obj_write(VALUE old, VALUE *slot, VALUE young) { return RB_OBJ_WRITE(old, slot, young); } static VALUE obj_written(VALUE old, VALUE slot, VALUE young) { return RB_OBJ_WRITTEN(old, slot, young); } static VALUE default_rs(void) { return rb_default_rs; } static void * memmove2(void *dest, const void *src, size_t t, size_t n) { return memmove(dest, src, rbimpl_size_mul_or_raise(t, n)); } static void * nonempty_memcpy(void *dest, const void *src, size_t t, size_t n) { return ruby_nonempty_memcpy(dest, src, rbimpl_size_mul_or_raise(t, n)); } static VALUE ruby_verbose2(void) { return ruby_verbose; } static int * rb_errno_ptr2(void) { return rb_errno_ptr(); } static int fixnum_p(VALUE obj) { return (int)RB_FIXNUM_P(obj); } static int symbol_p(VALUE obj) { return (int)RB_SYMBOL_P(obj); } static void * zalloc(size_t elemsiz) { return ruby_xcalloc(1, elemsiz); } static void gc_guard(VALUE obj) { RB_GC_GUARD(obj); } static rb_imemo_tmpbuf_t * tmpbuf_parser_heap(void *buf, rb_imemo_tmpbuf_t *old_heap, size_t cnt) { return rb_imemo_tmpbuf_parser_heap(buf, old_heap, cnt); } static VALUE arg_error(void) { return rb_eArgError; } static VALUE ruby_vm_frozen_core(void) { return rb_mRubyVMFrozenCore; } static rb_ast_t * ast_new(VALUE nb) { return IMEMO_NEW(rb_ast_t, imemo_ast, nb); } static VALUE static_id2sym(ID id) { return (((VALUE)(id)<parser_params = parser_params; return vparser; } void rb_parser_set_options(VALUE vparser, int print, int loop, int chomp, int split) { struct ruby_parser *parser; TypedData_Get_Struct(vparser, struct ruby_parser, &ruby_parser_data_type, parser); rb_ruby_parser_set_options(parser->parser_params, print, loop, chomp, split); } VALUE rb_parser_set_context(VALUE vparser, const struct rb_iseq_struct *base, int main) { struct ruby_parser *parser; TypedData_Get_Struct(vparser, struct ruby_parser, &ruby_parser_data_type, parser); rb_ruby_parser_set_context(parser->parser_params, base, main); return vparser; } void rb_parser_set_script_lines(VALUE vparser, VALUE lines) { struct ruby_parser *parser; TypedData_Get_Struct(vparser, struct ruby_parser, &ruby_parser_data_type, parser); rb_ruby_parser_set_script_lines(parser->parser_params, lines); } void rb_parser_error_tolerant(VALUE vparser) { struct ruby_parser *parser; TypedData_Get_Struct(vparser, struct ruby_parser, &ruby_parser_data_type, parser); rb_ruby_parser_error_tolerant(parser->parser_params); } rb_ast_t* rb_parser_compile_file_path(VALUE vparser, VALUE fname, VALUE file, int start) { struct ruby_parser *parser; rb_ast_t *ast; TypedData_Get_Struct(vparser, struct ruby_parser, &ruby_parser_data_type, parser); ast = rb_ruby_parser_compile_file_path(parser->parser_params, fname, file, start); RB_GC_GUARD(vparser); return ast; } void rb_parser_keep_tokens(VALUE vparser) { struct ruby_parser *parser; TypedData_Get_Struct(vparser, struct ruby_parser, &ruby_parser_data_type, parser); rb_ruby_parser_keep_tokens(parser->parser_params); } rb_ast_t* rb_parser_compile_generic(VALUE vparser, VALUE (*lex_gets)(VALUE, int), VALUE fname, VALUE input, int start) { struct ruby_parser *parser; rb_ast_t *ast; TypedData_Get_Struct(vparser, struct ruby_parser, &ruby_parser_data_type, parser); ast = rb_ruby_parser_compile_generic(parser->parser_params, lex_gets, fname, input, start); RB_GC_GUARD(vparser); return ast; } rb_ast_t* rb_parser_compile_string(VALUE vparser, const char *f, VALUE s, int line) { struct ruby_parser *parser; rb_ast_t *ast; TypedData_Get_Struct(vparser, struct ruby_parser, &ruby_parser_data_type, parser); ast = rb_ruby_parser_compile_string(parser->parser_params, f, s, line); RB_GC_GUARD(vparser); return ast; } rb_ast_t* rb_parser_compile_string_path(VALUE vparser, VALUE f, VALUE s, int line) { struct ruby_parser *parser; rb_ast_t *ast; TypedData_Get_Struct(vparser, struct ruby_parser, &ruby_parser_data_type, parser); ast = rb_ruby_parser_compile_string_path(parser->parser_params, f, s, line); RB_GC_GUARD(vparser); return ast; } VALUE rb_parser_encoding(VALUE vparser) { struct ruby_parser *parser; TypedData_Get_Struct(vparser, struct ruby_parser, &ruby_parser_data_type, parser); return rb_ruby_parser_encoding(parser->parser_params); } VALUE rb_parser_end_seen_p(VALUE vparser) { struct ruby_parser *parser; TypedData_Get_Struct(vparser, struct ruby_parser, &ruby_parser_data_type, parser); return RBOOL(rb_ruby_parser_end_seen_p(parser->parser_params)); } VALUE rb_parser_set_yydebug(VALUE vparser, VALUE flag) { struct ruby_parser *parser; TypedData_Get_Struct(vparser, struct ruby_parser, &ruby_parser_data_type, parser); rb_ruby_parser_set_yydebug(parser->parser_params, RTEST(flag)); return flag; } #endif VALUE rb_str_new_parser_string(rb_parser_string_t *str) { return rb_enc_str_new(str->ptr, str->len, str->enc); } static VALUE negative_numeric(VALUE val) { if (FIXNUM_P(val)) { return LONG2FIX(-FIX2LONG(val)); } if (SPECIAL_CONST_P(val)) { #if USE_FLONUM if (FLONUM_P(val)) { return DBL2NUM(-RFLOAT_VALUE(val)); } #endif goto unknown; } switch (BUILTIN_TYPE(val)) { case T_BIGNUM: BIGNUM_NEGATE(val); val = rb_big_norm(val); break; case T_RATIONAL: RATIONAL_SET_NUM(val, negative_numeric(RRATIONAL(val)->num)); break; case T_COMPLEX: RCOMPLEX_SET_REAL(val, negative_numeric(RCOMPLEX(val)->real)); RCOMPLEX_SET_IMAG(val, negative_numeric(RCOMPLEX(val)->imag)); break; case T_FLOAT: val = DBL2NUM(-RFLOAT_VALUE(val)); break; unknown: default: rb_bug("unknown literal type (%s) passed to negative_numeric", rb_builtin_class_name(val)); break; } return val; } static VALUE integer_value(const char *val, int base) { return rb_cstr_to_inum(val, base, FALSE); } static VALUE rational_value(const char *node_val, int base, int seen_point) { VALUE lit; char* val = strdup(node_val); if (seen_point > 0) { int len = (int)(strlen(val)); char *point = &val[seen_point]; size_t fraclen = len-seen_point-1; memmove(point, point+1, fraclen+1); lit = rb_rational_new(integer_value(val, base), rb_int_positive_pow(10, fraclen)); } else { lit = rb_rational_raw1(integer_value(val, base)); } free(val); return lit; } VALUE rb_node_integer_literal_val(const NODE *n) { const rb_node_integer_t *node = RNODE_INTEGER(n); VALUE val = integer_value(node->val, node->base); if (node->minus) { val = negative_numeric(val); } return val; } VALUE rb_node_float_literal_val(const NODE *n) { const rb_node_float_t *node = RNODE_FLOAT(n); double d = strtod(node->val, 0); if (node->minus) { d = -d; } VALUE val = DBL2NUM(d); return val; } VALUE rb_node_rational_literal_val(const NODE *n) { VALUE lit; const rb_node_rational_t *node = RNODE_RATIONAL(n); lit = rational_value(node->val, node->base, node->seen_point); if (node->minus) { lit = negative_numeric(lit); } return lit; } VALUE rb_node_imaginary_literal_val(const NODE *n) { VALUE lit; const rb_node_imaginary_t *node = RNODE_IMAGINARY(n); enum rb_numeric_type type = node->type; switch (type) { case integer_literal: lit = integer_value(node->val, node->base); break; case float_literal:{ double d = strtod(node->val, 0); lit = DBL2NUM(d); break; } case rational_literal: lit = rational_value(node->val, node->base, node->seen_point); break; default: rb_bug("unreachable"); } lit = rb_complex_raw(INT2FIX(0), lit); if (node->minus) { lit = negative_numeric(lit); } return lit; } VALUE rb_node_str_string_val(const NODE *node) { rb_parser_string_t *str = RNODE_STR(node)->string; return rb_str_new_parser_string(str); } VALUE rb_node_sym_string_val(const NODE *node) { rb_parser_string_t *str = RNODE_SYM(node)->string; return ID2SYM(rb_intern3(str->ptr, str->len, str->enc)); } VALUE rb_node_dstr_string_val(const NODE *node) { rb_parser_string_t *str = RNODE_DSTR(node)->string; return str ? rb_str_new_parser_string(str) : Qnil; } VALUE rb_node_dregx_string_val(const NODE *node) { rb_parser_string_t *str = RNODE_DREGX(node)->string; return rb_str_new_parser_string(str); } VALUE rb_node_regx_string_val(const NODE *node) { rb_node_regx_t *node_reg = RNODE_REGX(node); rb_parser_string_t *string = node_reg->string; VALUE str = rb_enc_str_new(string->ptr, string->len, string->enc); return rb_reg_compile(str, node_reg->options, NULL, 0); } VALUE rb_node_line_lineno_val(const NODE *node) { return INT2FIX(node->nd_loc.beg_pos.lineno); } VALUE rb_node_file_path_val(const NODE *node) { return rb_str_new_parser_string(RNODE_FILE(node)->path); } VALUE rb_node_encoding_val(const NODE *node) { return rb_enc_from_encoding(RNODE_ENCODING(node)->enc); } VALUE rb_node_const_decl_val(const NODE *node) { VALUE path; switch (nd_type(node)) { case NODE_CDECL: if (RNODE_CDECL(node)->nd_vid) { path = rb_id2str(RNODE_CDECL(node)->nd_vid); goto end; } else { node = RNODE_CDECL(node)->nd_else; } break; case NODE_COLON2: break; case NODE_COLON3: // ::Const path = rb_str_new_cstr("::"); rb_str_append(path, rb_id2str(RNODE_COLON3(node)->nd_mid)); goto end; default: rb_bug("unexpected node: %s", ruby_node_name(nd_type(node))); UNREACHABLE_RETURN(0); } path = rb_ary_new(); if (node) { for (; node && nd_type_p(node, NODE_COLON2); node = RNODE_COLON2(node)->nd_head) { rb_ary_push(path, rb_id2str(RNODE_COLON2(node)->nd_mid)); } if (node && nd_type_p(node, NODE_CONST)) { // Const::Name rb_ary_push(path, rb_id2str(RNODE_CONST(node)->nd_vid)); } else if (node && nd_type_p(node, NODE_COLON3)) { // ::Const::Name rb_ary_push(path, rb_id2str(RNODE_COLON3(node)->nd_mid)); rb_ary_push(path, rb_str_new(0, 0)); } else { // expression::Name rb_ary_push(path, rb_str_new_cstr("...")); } path = rb_ary_join(rb_ary_reverse(path), rb_str_new_cstr("::")); } end: path = rb_fstring(path); return path; }