diff options
Diffstat (limited to 'ruby.c')
| -rw-r--r-- | ruby.c | 2140 |
1 files changed, 1441 insertions, 699 deletions
@@ -15,13 +15,8 @@ #include <windows.h> #include <sys/cygwin.h> #endif -#ifdef _WIN32_WCE -#include <winsock.h> -#include "ruby/wince.h" -#endif -#include "ruby/ruby.h" -#include "ruby/node.h" -#include "ruby/encoding.h" +#include "internal.h" +#include "ruby/thread.h" #include "eval_intern.h" #include "dln.h" #include <stdio.h> @@ -31,6 +26,9 @@ #ifdef __hpux #include <sys/pstat.h> #endif +#if defined(LOAD_RELATIVE) && defined(HAVE_DLADDR) +#include <dlfcn.h> +#endif #ifdef HAVE_UNISTD_H #include <unistd.h> @@ -46,9 +44,8 @@ #ifndef MAXPATHLEN # define MAXPATHLEN 1024 #endif - -#if defined(__MACOS__) && defined(__MWERKS__) -#include <console.h> +#ifndef O_ACCMODE +# define O_ACCMODE (O_RDONLY | O_WRONLY | O_RDWR) #endif #include "ruby/util.h" @@ -57,36 +54,74 @@ char *getenv(); #endif -VALUE rb_parser_get_yydebug(VALUE); -VALUE rb_parser_set_yydebug(VALUE, VALUE); - -const char *ruby_get_inplace_mode(void); -void ruby_set_inplace_mode(const char *); +#ifndef DISABLE_RUBYGEMS +# define DISABLE_RUBYGEMS 0 +#endif +#if DISABLE_RUBYGEMS +#define DEFAULT_RUBYGEMS_ENABLED "disabled" +#else +#define DEFAULT_RUBYGEMS_ENABLED "enabled" +#endif -#define DISABLE_BIT(bit) (1U << disable_##bit) -enum disable_flag_bits { - disable_gems, - disable_rubyopt, +#define COMMA , +#define FEATURE_BIT(bit) (1U << feature_##bit) +#define EACH_FEATURES(X, SEP) \ + X(gems) \ + SEP \ + X(did_you_mean) \ + SEP \ + X(rubyopt) \ + SEP \ + X(frozen_string_literal) \ + /* END OF FEATURES */ +#define EACH_DEBUG_FEATURES(X, SEP) \ + X(frozen_string_literal) \ + /* END OF DEBUG FEATURES */ +#define AMBIGUOUS_FEATURE_NAMES 0 /* no ambiguous feature names now */ +#define DEFINE_FEATURE(bit) feature_##bit +#define DEFINE_DEBUG_FEATURE(bit) feature_debug_##bit +enum feature_flag_bits { + EACH_FEATURES(DEFINE_FEATURE, COMMA), + feature_debug_flag_first, + feature_debug_flag_begin = feature_debug_flag_first - 1, + EACH_DEBUG_FEATURES(DEFINE_DEBUG_FEATURE, COMMA), + feature_flag_count }; +#define DEBUG_BIT(bit) (1U << feature_debug_##bit) + #define DUMP_BIT(bit) (1U << dump_##bit) +#define DEFINE_DUMP(bit) dump_##bit +#define EACH_DUMPS(X, SEP) \ + X(version) \ + SEP \ + X(copyright) \ + SEP \ + X(usage) \ + SEP \ + X(help) \ + SEP \ + X(yydebug) \ + SEP \ + X(syntax) \ + SEP \ + X(parsetree) \ + SEP \ + X(parsetree_with_comment) \ + SEP \ + X(insns) \ + /* END OF DUMPS */ enum dump_flag_bits { - dump_insns, + dump_version_v, + EACH_DUMPS(DEFINE_DUMP, COMMA), + dump_exit_bits = (DUMP_BIT(yydebug) | DUMP_BIT(syntax) | + DUMP_BIT(parsetree) | DUMP_BIT(parsetree_with_comment) | + DUMP_BIT(insns)) }; -struct cmdline_options { - int sflag, xflag; - int do_loop, do_print; - int do_check, do_line; - int do_split, do_search; - int usage; - int version; - int copyright; - unsigned int disable; - int verbose; - int yydebug; - unsigned int setids; - unsigned int dump; +typedef struct ruby_cmdline_options ruby_cmdline_options_t; + +struct ruby_cmdline_options { const char *script; VALUE script_name; VALUE e_script; @@ -95,148 +130,159 @@ struct cmdline_options { VALUE name; int index; } enc; - } src, ext; + } src, ext, intern; VALUE req_list; + unsigned int features; + unsigned int dump; + int safe_level; + int sflag, xflag; + unsigned int warning: 1; + unsigned int verbose: 1; + unsigned int do_loop: 1; + unsigned int do_print: 1; + unsigned int do_line: 1; + unsigned int do_split: 1; + unsigned int do_search: 1; + unsigned int setids: 2; }; -static void init_ids(struct cmdline_options *); +static void init_ids(ruby_cmdline_options_t *); #define src_encoding_index GET_VM()->src_encoding_index -static struct cmdline_options * -cmdline_options_init(struct cmdline_options *opt) +enum { + COMPILATION_FEATURES = ( + 0 + | FEATURE_BIT(frozen_string_literal) + | FEATURE_BIT(debug_frozen_string_literal) + ), + DEFAULT_FEATURES = ( + (FEATURE_BIT(debug_flag_first)-1) +#if DISABLE_RUBYGEMS + & ~FEATURE_BIT(gems) +#endif + & ~FEATURE_BIT(frozen_string_literal) + ) +}; + +static ruby_cmdline_options_t * +cmdline_options_init(ruby_cmdline_options_t *opt) { MEMZERO(opt, *opt, 1); init_ids(opt); opt->src.enc.index = src_encoding_index; + opt->ext.enc.index = -1; + opt->intern.enc.index = -1; + opt->features = DEFAULT_FEATURES; return opt; } -struct cmdline_arguments { - int argc; - char **argv; - struct cmdline_options *opt; -}; - -static NODE *load_file(VALUE, const char *, int, struct cmdline_options *); -static void forbid_setid(const char *, struct cmdline_options *); -#define forbid_setid(s) forbid_setid(s, opt) +static rb_ast_t *load_file(VALUE parser, VALUE fname, VALUE f, int script, + ruby_cmdline_options_t *opt); +static VALUE open_load_file(VALUE fname_v, int *xflag); +static void forbid_setid(const char *, const ruby_cmdline_options_t *); +#define forbid_setid(s) forbid_setid((s), opt) static struct { int argc; char **argv; -#if !defined(PSTAT_SETCMD) && !defined(HAVE_SETPROCTITLE) - int len; -#endif } origarg; static void -usage(const char *name) +show_usage_line(const char *str, unsigned int namelen, unsigned int secondlen, int help) +{ + const unsigned int w = 16; + const int wrap = help && namelen + secondlen - 2 > w; + printf(" %.*s%-*.*s%-*s%s\n", namelen-1, str, + (wrap ? 0 : w - namelen + 1), + (help ? secondlen-1 : 0), str + namelen, + (wrap ? w + 3 : 0), (wrap ? "\n" : ""), + str + namelen + secondlen); +} + +static void +usage(const char *name, int help) { /* This message really ought to be max 23 lines. * Removed -h because the user already knows that option. Others? */ - static const char *const usage_msg[] = { - "-0[octal] specify record separator (\\0, if no argument)", - "-a autosplit mode with -n or -p (splits $_ into $F)", - "-c check syntax only", - "-Cdirectory cd to directory, before executing your script", - "-d set debugging flags (set $DEBUG to true)", - "-e 'command' one line of script. Several -e's allowed. Omit [programfile]", - "-Eencoding specifies the character encoding for the program codes", - "-Fpattern split() pattern for autosplit (-a)", - "-i[extension] edit ARGV files in place (make backup if extension supplied)", - "-Idirectory specify $LOAD_PATH directory (may be used more than once)", - "-l enable line ending processing", - "-n assume 'while gets(); ... end' loop around your script", - "-p assume loop like -n but print line also like sed", - "-rlibrary require the library, before executing your script", - "-s enable some switch parsing for switches after script name", - "-S look for the script using PATH environment variable", - "-T[level] turn on tainting checks", - "-v print version number, then turn on verbose mode", - "-w turn warnings on for your script", - "-W[level] set warning level; 0=silence, 1=medium, 2=verbose (default)", - "-x[directory] strip off text before #!ruby line and perhaps cd to directory", - "--copyright print the copyright", - "--version print the version", - NULL + struct message { + const char *str; + unsigned short namelen, secondlen; }; - const char *const *p = usage_msg; - - printf("Usage: %s [switches] [--] [programfile] [arguments]\n", name); - while (*p) - printf(" %s\n", *p++); -} - -VALUE rb_get_load_path(void); - -#ifndef CharNext /* defined as CharNext[AW] on Windows. */ -#define CharNext(p) ((p) + mblen(p, RUBY_MBCHAR_MAXSIZE)) -#endif - -#if defined DOSISH || defined __CYGWIN__ -static inline void -translate_char(char *p, int from, int to) -{ - while (*p) { - if ((unsigned char)*p == from) - *p = to; - p = CharNext(p); - } +#define M(shortopt, longopt, desc) { \ + shortopt " " longopt " " desc, \ + (unsigned short)sizeof(shortopt), \ + (unsigned short)sizeof(longopt), \ } -#endif + static const struct message usage_msg[] = { + M("-0[octal]", "", "specify record separator (\\0, if no argument)"), + M("-a", "", "autosplit mode with -n or -p (splits $_ into $F)"), + M("-c", "", "check syntax only"), + M("-Cdirectory", "", "cd to directory before executing your script"), + M("-d", ", --debug", "set debugging flags (set $DEBUG to true)"), + M("-e 'command'", "", "one line of script. Several -e's allowed. Omit [programfile]"), + M("-Eex[:in]", ", --encoding=ex[:in]", "specify the default external and internal character encodings"), + M("-Fpattern", "", "split() pattern for autosplit (-a)"), + M("-i[extension]", "", "edit ARGV files in place (make backup if extension supplied)"), + M("-Idirectory", "", "specify $LOAD_PATH directory (may be used more than once)"), + M("-l", "", "enable line ending processing"), + M("-n", "", "assume 'while gets(); ... end' loop around your script"), + M("-p", "", "assume loop like -n but print line also like sed"), + M("-rlibrary", "", "require the library before executing your script"), + M("-s", "", "enable some switch parsing for switches after script name"), + M("-S", "", "look for the script using PATH environment variable"), + M("-T[level=1]", "", "turn on tainting checks"), + M("-v", ", --verbose", "print version number, then turn on verbose mode"), + M("-w", "", "turn warnings on for your script"), + M("-W[level=2]", "", "set warning level; 0=silence, 1=medium, 2=verbose"), + M("-x[directory]", "", "strip off text before #!ruby line and perhaps cd to directory"), + M("-h", "", "show this message, --help for more info"), + }; + static const struct message help_msg[] = { + M("--copyright", "", "print the copyright"), + M("--dump={insns|parsetree|...}[,...]", "", + "dump debug information. see below for available dump list"), + M("--enable={gems|rubyopt|...}[,...]", ", --disable={gems|rubyopt|...}[,...]", + "enable or disable features. see below for available features"), + M("--external-encoding=encoding", ", --internal-encoding=encoding", + "specify the default external or internal character encoding"), + M("--version", "", "print the version"), + M("--help", "", "show this message, -h for short message"), + }; + static const struct message dumps[] = { + M("insns", "", "instruction sequences"), + M("yydebug", "", "yydebug of yacc parser generator"), + M("parsetree", "", "AST"), + M("parsetree_with_comment", "", "AST with comments"), + }; + static const struct message features[] = { + M("gems", "", "rubygems (default: "DEFAULT_RUBYGEMS_ENABLED")"), + M("did_you_mean", "", "did_you_mean (default: "DEFAULT_RUBYGEMS_ENABLED")"), + M("rubyopt", "", "RUBYOPT environment variable (default: enabled)"), + M("frozen-string-literal", "", "freeze all string literals (default: disabled)"), + }; + int i; + const int num = numberof(usage_msg) - (help ? 1 : 0); +#define SHOW(m) show_usage_line((m).str, (m).namelen, (m).secondlen, help) -#if defined _WIN32 || defined __CYGWIN__ || defined __DJGPP__ -static VALUE -rubylib_mangled_path(const char *s, unsigned int l) -{ - static char *newp, *oldp; - static int newl, oldl, notfound; - char *ptr; - VALUE ret; - - if (!newp && !notfound) { - newp = getenv("RUBYLIB_PREFIX"); - if (newp) { - oldp = newp = strdup(newp); - while (*newp && !ISSPACE(*newp) && *newp != ';') { - newp = CharNext(newp); /* Skip digits. */ - } - oldl = newp - oldp; - while (*newp && (ISSPACE(*newp) || *newp == ';')) { - newp = CharNext(newp); /* Skip whitespace. */ - } - newl = strlen(newp); - if (newl == 0 || oldl == 0) { - rb_fatal("malformed RUBYLIB_PREFIX"); - } - translate_char(newp, '\\', '/'); - } - else { - notfound = 1; - } - } - if (!newp || l < oldl || STRNCASECMP(oldp, s, oldl) != 0) { - return rb_str_new(s, l); - } - ret = rb_str_new(0, l + newl - oldl); - ptr = RSTRING_PTR(ret); - memcpy(ptr, newp, newl); - memcpy(ptr + newl, s + oldl, l - oldl); - ptr[l + newl - oldl] = 0; - return ret; + printf("Usage: %s [switches] [--] [programfile] [arguments]\n", name); + for (i = 0; i < num; ++i) + SHOW(usage_msg[i]); + + if (!help) return; + + for (i = 0; i < numberof(help_msg); ++i) + SHOW(help_msg[i]); + puts("Dump List:"); + for (i = 0; i < numberof(dumps); ++i) + SHOW(dumps[i]); + puts("Features:"); + for (i = 0; i < numberof(features); ++i) + SHOW(features[i]); } -static VALUE -rubylib_mangled_path2(const char *s) -{ - return rubylib_mangled_path(s, strlen(s)); -} -#else -#define rubylib_mangled_path rb_str_new -#define rubylib_mangled_path2 rb_str_new2 -#endif +#define rubylib_path_new rb_str_new static void push_include(const char *path, VALUE (*filter)(VALUE)) @@ -251,7 +297,7 @@ push_include(const char *path, VALUE (*filter)(VALUE)) p++; if (!*p) break; for (s = p; *s && *s != sep; s = CharNext(s)); - rb_ary_push(load_path, (*filter)(rubylib_mangled_path(p, s - p))); + rb_ary_push(load_path, (*filter)(rubylib_path_new(p, s - p))); p = s; } } @@ -282,7 +328,13 @@ push_include_cygwin(const char *path, VALUE (*filter)(VALUE)) p = strncpy(RSTRING_PTR(buf), p, len); } } - if (cygwin_conv_to_posix_path(p, rubylib) == 0) +#ifdef HAVE_CYGWIN_CONV_PATH +#define CONV_TO_POSIX_PATH(p, lib) \ + cygwin_conv_path(CCP_WIN_A_TO_POSIX|CCP_RELATIVE, (p), (lib), sizeof(lib)) +#else +# error no cygwin_conv_path +#endif + if (CONV_TO_POSIX_PATH(p, rubylib) == 0) p = rubylib; push_include(p, filter); if (!*s) break; @@ -306,11 +358,17 @@ identical_path(VALUE path) { return path; } +static VALUE +locale_path(VALUE path) +{ + rb_enc_associate(path, rb_locale_encoding()); + return path; +} void ruby_incpush(const char *path) { - ruby_push_include(path, identical_path); + ruby_push_include(path, locale_path); } static VALUE @@ -324,16 +382,13 @@ expand_include_path(VALUE path) return rb_file_expand_path(path, Qnil); } -void +void ruby_incpush_expand(const char *path) { ruby_push_include(path, expand_include_path); } -#if defined DOSISH || defined __CYGWIN__ -#define LOAD_RELATIVE 1 -#endif - +#undef UTF8_PATH #if defined _WIN32 || defined __CYGWIN__ static HMODULE libruby; @@ -344,140 +399,288 @@ DllMain(HINSTANCE dll, DWORD reason, LPVOID reserved) libruby = dll; return TRUE; } + +HANDLE +rb_libruby_handle(void) +{ + return libruby; +} + +static inline void +translit_char_bin(char *p, int from, int to) +{ + while (*p) { + if ((unsigned char)*p == from) + *p = to; + p++; + } +} +#endif + +#ifdef _WIN32 +# define UTF8_PATH 1 +#endif + +#ifndef UTF8_PATH +# define UTF8_PATH 0 +#endif +#if UTF8_PATH +# define IF_UTF8_PATH(t, f) t +#else +# define IF_UTF8_PATH(t, f) f +#endif + +#if UTF8_PATH +static VALUE +str_conv_enc(VALUE str, rb_encoding *from, rb_encoding *to) +{ + return rb_str_conv_enc_opts(str, from, to, + ECONV_UNDEF_REPLACE|ECONV_INVALID_REPLACE, + Qnil); +} +#else +# define str_conv_enc(str, from, to) (str) #endif +void ruby_init_loadpath_safe(int safe_level); + void ruby_init_loadpath(void) { + ruby_init_loadpath_safe(0); +} + +#if defined(LOAD_RELATIVE) && defined(HAVE_DLADDR) && !defined(__CYGWIN__) +static VALUE +dladdr_path(const void* addr) +{ + Dl_info dli; + VALUE fname, path; + + if (!dladdr(addr, &dli)) { + return rb_str_new(0, 0); + } +#ifdef __linux__ + else if (origarg.argc > 0 && origarg.argv && dli.dli_fname == origarg.argv[0]) { + fname = rb_str_new_cstr("/proc/self/exe"); + path = rb_readlink(fname, NULL); + } +#endif + else { + fname = rb_str_new_cstr(dli.dli_fname); + path = rb_realpath_internal(Qnil, fname, 1); + } + rb_str_resize(fname, 0); + return path; +} +#endif + +#define INITIAL_LOAD_PATH_MARK rb_intern_const("@gem_prelude_index") + +void +ruby_init_loadpath_safe(int safe_level) +{ VALUE load_path; + ID id_initial_load_path_mark; + const char *paths = ruby_initial_load_paths; #if defined LOAD_RELATIVE +# if defined HAVE_DLADDR || defined __CYGWIN__ || defined _WIN32 +# define VARIABLE_LIBPATH 1 +# else +# define VARIABLE_LIBPATH 0 +# endif +# if VARIABLE_LIBPATH + char *libpath; + VALUE sopath; +# else char libpath[MAXPATHLEN + 1]; +# endif + size_t baselen; char *p; - int rest; #if defined _WIN32 || defined __CYGWIN__ - GetModuleFileName(libruby, libpath, sizeof libpath); -#elif defined(DJGPP) - extern char *__dos_argv0; - strncpy(libpath, __dos_argv0, sizeof(libpath) - 1); -#elif defined(__human68k__) - extern char **_argv; - strncpy(libpath, _argv[0], sizeof(libpath) - 1); -#elif defined(__EMX__) - _execname(libpath, sizeof(libpath) - 1); + { + DWORD len = RSTRING_EMBED_LEN_MAX, ret, i; + VALUE wsopath = rb_str_new(0, len*sizeof(WCHAR)); + WCHAR *wlibpath; + while (wlibpath = (WCHAR *)RSTRING_PTR(wsopath), + ret = GetModuleFileNameW(libruby, wlibpath, len), + (ret == len)) + { + rb_str_modify_expand(wsopath, len*sizeof(WCHAR)); + rb_str_set_len(wsopath, (len += len)*sizeof(WCHAR)); + } + if (!ret || ret > len) rb_fatal("failed to get module file name"); + for (len = ret, i = 0; i < len; ++i) { + if (wlibpath[i] == L'\\') { + wlibpath[i] = L'/'; + ret = i+1; /* chop after the last separator */ + } + } + len = WideCharToMultiByte(CP_UTF8, 0, wlibpath, ret, NULL, 0, NULL, NULL); + sopath = rb_utf8_str_new(0, len); + libpath = RSTRING_PTR(sopath); + WideCharToMultiByte(CP_UTF8, 0, wlibpath, ret, libpath, len, NULL, NULL); + rb_str_resize(wsopath, 0); + } +#elif defined(HAVE_DLADDR) + sopath = dladdr_path((void *)(VALUE)expand_include_path); + libpath = RSTRING_PTR(sopath); #endif +#if !VARIABLE_LIBPATH libpath[sizeof(libpath) - 1] = '\0'; -#if defined DOSISH - translate_char(libpath, '\\', '/'); +#endif +#if defined DOSISH && !defined _WIN32 + translit_char(libpath, '\\', '/'); #elif defined __CYGWIN__ { - char rubylib[FILENAME_MAX]; - cygwin_conv_to_posix_path(libpath, rubylib); - strncpy(libpath, rubylib, sizeof(libpath)); + const int win_to_posix = CCP_WIN_A_TO_POSIX | CCP_RELATIVE; + size_t newsize = cygwin_conv_path(win_to_posix, libpath, 0, 0); + if (newsize > 0) { + VALUE rubylib = rb_str_new(0, newsize); + p = RSTRING_PTR(rubylib); + if (cygwin_conv_path(win_to_posix, libpath, p, newsize) == 0) { + rb_str_resize(sopath, 0); + sopath = rubylib; + libpath = p; + } + } } #endif p = strrchr(libpath, '/'); if (p) { - *p = 0; - if (p - libpath > 3 && !STRCASECMP(p - 4, "/bin")) { - p -= 4; - *p = 0; + static const char bindir[] = "/bin"; +#ifdef LIBDIR_BASENAME + static const char libdir[] = "/"LIBDIR_BASENAME; +#else + static const char libdir[] = "/lib"; +#endif + const ptrdiff_t bindir_len = (ptrdiff_t)sizeof(bindir) - 1; + const ptrdiff_t libdir_len = (ptrdiff_t)sizeof(libdir) - 1; + +#ifdef ENABLE_MULTIARCH + char *p2 = NULL; + + multiarch: +#endif + if (p - libpath >= bindir_len && !STRNCASECMP(p - bindir_len, bindir, bindir_len)) { + p -= bindir_len; + } + else if (p - libpath >= libdir_len && !strncmp(p - libdir_len, libdir, libdir_len)) { + p -= libdir_len; + } +#ifdef ENABLE_MULTIARCH + else if (p2) { + p = p2; } + else { + p2 = p; + p = rb_enc_path_last_separator(libpath, p, rb_ascii8bit_encoding()); + if (p) goto multiarch; + p = p2; + } +#endif +#if !VARIABLE_LIBPATH + *p = 0; +#endif } +#if !VARIABLE_LIBPATH else { - strcpy(libpath, "."); + strlcpy(libpath, ".", sizeof(libpath)); p = libpath + 1; } + baselen = p - libpath; +#define PREFIX_PATH() rb_str_new(libpath, baselen) +#else + baselen = p - libpath; + rb_str_resize(sopath, baselen); + libpath = RSTRING_PTR(sopath); +#define PREFIX_PATH() sopath +#endif - rest = sizeof(libpath) - 1 - (p - libpath); +#define BASEPATH() rb_str_buf_cat(rb_str_buf_new(baselen+len), libpath, baselen) -#define RUBY_RELATIVE(path) (strncpy(p, (path), rest), libpath) +#define RUBY_RELATIVE(path, len) rb_str_buf_cat(BASEPATH(), (path), (len)) #else -#define RUBY_RELATIVE(path) (path) + const size_t exec_prefix_len = strlen(ruby_exec_prefix); +#define RUBY_RELATIVE(path, len) rubylib_path_new((path), (len)) +#define PREFIX_PATH() RUBY_RELATIVE(ruby_exec_prefix, exec_prefix_len) #endif -#define incpush(path) rb_ary_push(load_path, rubylib_mangled_path2(path)) load_path = GET_VM()->load_path; - if (rb_safe_level() == 0) { - ruby_incpush(getenv("RUBYLIB")); + if (safe_level == 0) { + ruby_push_include(getenv("RUBYLIB"), identical_path); } -#ifdef RUBY_SEARCH_PATH - incpush(RUBY_RELATIVE(RUBY_SEARCH_PATH)); -#endif - - incpush(RUBY_RELATIVE(RUBY_SITE_LIB2)); -#ifdef RUBY_SITE_THIN_ARCHLIB - incpush(RUBY_RELATIVE(RUBY_SITE_THIN_ARCHLIB)); -#endif - incpush(RUBY_RELATIVE(RUBY_SITE_ARCHLIB)); - incpush(RUBY_RELATIVE(RUBY_SITE_LIB)); - - incpush(RUBY_RELATIVE(RUBY_VENDOR_LIB2)); -#ifdef RUBY_VENDOR_THIN_ARCHLIB - incpush(RUBY_RELATIVE(RUBY_VENDOR_THIN_ARCHLIB)); -#endif - incpush(RUBY_RELATIVE(RUBY_VENDOR_ARCHLIB)); - incpush(RUBY_RELATIVE(RUBY_VENDOR_LIB)); - - incpush(RUBY_RELATIVE(RUBY_LIB)); -#ifdef RUBY_THIN_ARCHLIB - incpush(RUBY_RELATIVE(RUBY_THIN_ARCHLIB)); -#endif - incpush(RUBY_RELATIVE(RUBY_ARCHLIB)); - - if (rb_safe_level() == 0) { - incpush("."); + id_initial_load_path_mark = INITIAL_LOAD_PATH_MARK; + while (*paths) { + size_t len = strlen(paths); + VALUE path = RUBY_RELATIVE(paths, len); + rb_ivar_set(path, id_initial_load_path_mark, path); + rb_ary_push(load_path, path); + paths += len + 1; } + + rb_const_set(rb_cObject, rb_intern_const("TMP_RUBY_PREFIX"), rb_obj_freeze(PREFIX_PATH())); } static void -add_modules(struct cmdline_options *opt, const char *mod) +add_modules(VALUE *req_list, const char *mod) { - VALUE list = opt->req_list; + VALUE list = *req_list; + VALUE feature; if (!list) { - opt->req_list = list = rb_ary_new(); - RBASIC(list)->klass = 0; + *req_list = list = rb_ary_new(); + RBASIC_CLEAR_CLASS(list); } - rb_ary_push(list, rb_obj_freeze(rb_str_new2(mod))); + feature = rb_str_new2(mod); + RBASIC_CLEAR_CLASS(feature); + rb_ary_push(list, feature); } -extern void Init_ext(void); -extern VALUE rb_vm_top_self(void); - static void -require_libraries(struct cmdline_options *opt) +require_libraries(VALUE *req_list) { - VALUE list = opt->req_list; + VALUE list = *req_list; + VALUE self = rb_vm_top_self(); ID require; + rb_encoding *extenc = rb_default_external_encoding(); - Init_ext(); /* should be called here for some reason :-( */ CONST_ID(require, "require"); while (list && RARRAY_LEN(list) > 0) { VALUE feature = rb_ary_shift(list); - rb_funcall2(rb_vm_top_self(), require, 1, &feature); + rb_enc_associate(feature, extenc); + RBASIC_SET_CLASS_RAW(feature, rb_cString); + OBJ_FREEZE(feature); + rb_funcallv(self, require, 1, &feature); } - opt->req_list = 0; + *req_list = 0; +} + +static const struct rb_block* +toplevel_context(rb_binding_t *bind) +{ + return &bind->block; } static void -process_sflag(struct cmdline_options *opt) +process_sflag(int *sflag) { - if (opt->sflag) { + if (*sflag > 0) { long n; - VALUE *args; + const VALUE *args; VALUE argv = rb_argv; n = RARRAY_LEN(argv); - args = RARRAY_PTR(argv); + args = RARRAY_CONST_PTR(argv); while (n > 0) { VALUE v = *args++; char *s = StringValuePtr(v); char *p; - int hyphen = Qfalse; + int hyphen = FALSE; if (s[0] != '-') break; @@ -494,7 +697,7 @@ process_sflag(struct cmdline_options *opt) break; } if (*p == '-') { - hyphen = Qtrue; + hyphen = TRUE; } else if (*p != '_' && !ISALNUM(*p)) { VALUE name_error[2]; @@ -523,110 +726,227 @@ process_sflag(struct cmdline_options *opt) while (n--) { rb_ary_shift(argv); } + *sflag = -1; } - opt->sflag = 0; } -NODE *rb_parser_append_print(VALUE, NODE *); -NODE *rb_parser_while_loop(VALUE, NODE *, int, int); -static int proc_options(int argc, char **argv, struct cmdline_options *opt); +static long proc_options(long argc, char **argv, ruby_cmdline_options_t *opt, int envopt); -static char * -moreswitches(const char *s, struct cmdline_options *opt) +static void +moreswitches(const char *s, ruby_cmdline_options_t *opt, int envopt) { - int argc; - char *argv[3]; - const char *p = s; - - argc = 2; - argv[0] = argv[2] = 0; - while (*s && !ISSPACE(*s)) - s++; - argv[1] = ALLOCA_N(char, s - p + 2); - argv[1][0] = '-'; - strncpy(argv[1] + 1, p, s - p); - argv[1][s - p + 1] = '\0'; - proc_options(argc, argv, opt); - while (*s && ISSPACE(*s)) - s++; - return (char *)s; + long argc, i, len; + char **argv, *p; + const char *ap = 0; + VALUE argstr, argary; + + while (ISSPACE(*s)) s++; + if (!*s) return; + argstr = rb_str_tmp_new((len = strlen(s)) + (envopt!=0)); + argary = rb_str_tmp_new(0); + + p = RSTRING_PTR(argstr); + if (envopt) *p++ = ' '; + memcpy(p, s, len + 1); + ap = 0; + rb_str_cat(argary, (char *)&ap, sizeof(ap)); + while (*p) { + ap = p; + rb_str_cat(argary, (char *)&ap, sizeof(ap)); + while (*p && !ISSPACE(*p)) ++p; + if (!*p) break; + *p++ = '\0'; + while (ISSPACE(*p)) ++p; + } + argc = RSTRING_LEN(argary) / sizeof(ap); + ap = 0; + rb_str_cat(argary, (char *)&ap, sizeof(ap)); + argv = (char **)RSTRING_PTR(argary); + + while ((i = proc_options(argc, argv, opt, envopt)) > 1 && envopt && (argc -= i) > 0) { + argv += i; + if (**argv != '-') { + *--*argv = '-'; + } + if ((*argv)[1]) { + ++argc; + --argv; + } + } + + /* get rid of GC */ + rb_str_resize(argary, 0); + rb_str_resize(argstr, 0); +} + +static int +name_match_p(const char *name, const char *str, size_t len) +{ + if (len == 0) return 0; + do { + while (TOLOWER(*str) == *name) { + if (!--len || !*++str) return 1; + ++name; + } + if (*str != '-' && *str != '_') return 0; + while (ISALNUM(*name)) name++; + if (*name != '-' && *name != '_') return 0; + ++name; + ++str; + } while (len > 0); + return !*name; } #define NAME_MATCH_P(name, str, len) \ - ((len) < sizeof(name) && strncmp((str), name, (len)) == 0) + ((len) < (int)sizeof(name) && name_match_p((name), (str), (len))) #define UNSET_WHEN(name, bit, str, len) \ - if (NAME_MATCH_P(name, str, len)) { \ + if (NAME_MATCH_P((name), (str), (len))) { \ *(unsigned int *)arg &= ~(bit); \ return; \ } #define SET_WHEN(name, bit, str, len) \ - if (NAME_MATCH_P(name, str, len)) { \ + if (NAME_MATCH_P((name), (str), (len))) { \ *(unsigned int *)arg |= (bit); \ return; \ } +#define LITERAL_NAME_ELEMENT(name) #name + static void -enable_option(const char *str, int len, void *arg) +feature_option(const char *str, int len, void *arg, const unsigned int enable) { -#define UNSET_WHEN_DISABLE(bit) UNSET_WHEN(#bit, DISABLE_BIT(bit), str, len) - UNSET_WHEN_DISABLE(gems); - UNSET_WHEN_DISABLE(rubyopt); + static const char list[] = EACH_FEATURES(LITERAL_NAME_ELEMENT, ", "); + unsigned int *argp = arg; + unsigned int mask = ~0U; +#if AMBIGUOUS_FEATURE_NAMES + unsigned int set = 0U; + int matched = 0; +#define SET_FEATURE(bit) \ + if (NAME_MATCH_P(#bit, str, len)) {set |= mask = FEATURE_BIT(bit); ++matched;} +#else +#define SET_FEATURE(bit) \ + if (NAME_MATCH_P(#bit, str, len)) {mask = FEATURE_BIT(bit); goto found;} +#endif + EACH_FEATURES(SET_FEATURE, ;); if (NAME_MATCH_P("all", str, len)) { - *(unsigned int *)arg = 0U; + found: + *argp = (*argp & ~mask) | (mask & enable); return; } - rb_warn("unknown argument for --enable: `%.*s'", len, str); +#if AMBIGUOUS_FEATURE_NAMES + if (matched == 1) goto found; + if (matched > 1) { + VALUE mesg = rb_sprintf("ambiguous feature: `%.*s' (", len, str); +#define ADD_FEATURE_NAME(bit) \ + if (FEATURE_BIT(bit) & set) { \ + rb_str_cat_cstr(mesg, #bit); \ + if (--matched) rb_str_cat_cstr(mesg, ", "); \ + } + EACH_FEATURES(ADD_FEATURE_NAME, ;); + rb_str_cat_cstr(mesg, ")"); + rb_exc_raise(rb_exc_new_str(rb_eRuntimeError, mesg)); +#undef ADD_FEATURE_NAME + } +#endif + rb_warn("unknown argument for --%s: `%.*s'", + enable ? "enable" : "disable", len, str); + rb_warn("features are [%.*s].", (int)strlen(list), list); +} + +static void +enable_option(const char *str, int len, void *arg) +{ + feature_option(str, len, arg, ~0U); } static void disable_option(const char *str, int len, void *arg) { -#define SET_WHEN_DISABLE(bit) SET_WHEN(#bit, DISABLE_BIT(bit), str, len) - SET_WHEN_DISABLE(gems); - SET_WHEN_DISABLE(rubyopt); - if (NAME_MATCH_P("all", str, len)) { - *(unsigned int *)arg = ~0U; - return; - } - rb_warn("unknown argument for --disable: `%.*s'", len, str); + feature_option(str, len, arg, 0U); +} + +RUBY_EXTERN const int ruby_patchlevel; +int ruby_env_debug_option(const char *str, int len, void *arg); + +static void +debug_option(const char *str, int len, void *arg) +{ + static const char list[] = EACH_DEBUG_FEATURES(LITERAL_NAME_ELEMENT, ", "); +#define SET_WHEN_DEBUG(bit) SET_WHEN(#bit, DEBUG_BIT(bit), str, len) + EACH_DEBUG_FEATURES(SET_WHEN_DEBUG, ;); +#ifdef RUBY_DEVEL + if (ruby_patchlevel < 0 && ruby_env_debug_option(str, len, 0)) return; +#endif + rb_warn("unknown argument for --debug: `%.*s'", len, str); + rb_warn("debug features are [%.*s].", (int)strlen(list), list); } static void dump_option(const char *str, int len, void *arg) { + static const char list[] = EACH_DUMPS(LITERAL_NAME_ELEMENT, ", "); #define SET_WHEN_DUMP(bit) SET_WHEN(#bit, DUMP_BIT(bit), str, len) - SET_WHEN_DUMP(insns); - rb_warn("don't know how to dump `%.*s', (insns)", len, str); + EACH_DUMPS(SET_WHEN_DUMP, ;); + rb_warn("don't know how to dump `%.*s',", len, str); + rb_warn("but only [%.*s].", (int)strlen(list), list); } -static int -proc_options(int argc, char **argv, struct cmdline_options *opt) +static void +set_option_encoding_once(const char *type, VALUE *name, const char *e, long elen) +{ + VALUE ename; + + if (!elen) elen = strlen(e); + ename = rb_str_new(e, elen); + + if (*name && + rb_funcall(ename, rb_intern("casecmp"), 1, *name) != INT2FIX(0)) { + rb_raise(rb_eRuntimeError, + "%s already set to %"PRIsVALUE, type, *name); + } + *name = ename; +} + +#define set_internal_encoding_once(opt, e, elen) \ + set_option_encoding_once("default_internal", &(opt)->intern.enc.name, (e), (elen)) +#define set_external_encoding_once(opt, e, elen) \ + set_option_encoding_once("default_external", &(opt)->ext.enc.name, (e), (elen)) +#define set_source_encoding_once(opt, e, elen) \ + set_option_encoding_once("source", &(opt)->src.enc.name, (e), (elen)) + +static long +proc_options(long argc, char **argv, ruby_cmdline_options_t *opt, int envopt) { - int n, argc0 = argc; + long n, argc0 = argc; const char *s; + int warning = opt->warning; - if (argc == 0) + if (argc <= 0 || !argv) return 0; for (argc--, argv++; argc > 0; argc--, argv++) { - if (argv[0][0] != '-' || !argv[0][1]) + const char *const arg = argv[0]; + if (!arg || arg[0] != '-' || !arg[1]) break; - s = argv[0] + 1; + s = arg + 1; reswitch: switch (*s) { case 'a': - opt->do_split = Qtrue; + if (envopt) goto noenvopt; + opt->do_split = TRUE; s++; goto reswitch; case 'p': - opt->do_print = Qtrue; + if (envopt) goto noenvopt; + opt->do_print = TRUE; /* through */ case 'n': - opt->do_loop = Qtrue; + if (envopt) goto noenvopt; + opt->do_loop = TRUE; s++; goto reswitch; @@ -637,7 +957,8 @@ proc_options(int argc, char **argv, struct cmdline_options *opt) goto reswitch; case 'y': - opt->yydebug = 1; + if (envopt) goto noenvopt; + opt->dump |= DUMP_BIT(yydebug); s++; goto reswitch; @@ -646,16 +967,19 @@ proc_options(int argc, char **argv, struct cmdline_options *opt) s++; goto reswitch; } - ruby_show_version(); + opt->dump |= DUMP_BIT(version_v); opt->verbose = 1; case 'w': - ruby_verbose = Qtrue; + if (!opt->warning) { + warning = 1; + ruby_verbose = Qtrue; + } s++; goto reswitch; case 'W': { - int numlen; + size_t numlen; int v = 2; /* -W as -W2 */ if (*++s) { @@ -664,56 +988,62 @@ proc_options(int argc, char **argv, struct cmdline_options *opt) v = 1; s += numlen; } - switch (v) { - case 0: - ruby_verbose = Qnil; - break; - case 1: - ruby_verbose = Qfalse; - break; - default: - ruby_verbose = Qtrue; - break; + if (!opt->warning) { + switch (v) { + case 0: + ruby_verbose = Qnil; + break; + case 1: + ruby_verbose = Qfalse; + break; + default: + ruby_verbose = Qtrue; + break; + } } + warning = 1; } goto reswitch; case 'c': - opt->do_check = Qtrue; + if (envopt) goto noenvopt; + opt->dump |= DUMP_BIT(syntax); s++; goto reswitch; case 's': + if (envopt) goto noenvopt; forbid_setid("-s"); - opt->sflag = 1; + if (!opt->sflag) opt->sflag = 1; s++; goto reswitch; case 'h': - usage(origarg.argv[0]); - rb_exit(EXIT_SUCCESS); - break; + if (envopt) goto noenvopt; + opt->dump |= DUMP_BIT(usage); + goto switch_end; case 'l': - opt->do_line = Qtrue; + if (envopt) goto noenvopt; + opt->do_line = TRUE; rb_output_rs = rb_rs; s++; goto reswitch; case 'S': + if (envopt) goto noenvopt; forbid_setid("-S"); - opt->do_search = Qtrue; + opt->do_search = TRUE; s++; goto reswitch; case 'e': + if (envopt) goto noenvopt; forbid_setid("-e"); if (!*++s) { - s = argv[1]; - argc--, argv++; - } - if (!s) { - rb_raise(rb_eRuntimeError, "no code specified for -e"); + if (!--argc) + rb_raise(rb_eRuntimeError, "no code specified for -e"); + s = *++argv; } if (!opt->e_script) { opt->e_script = rb_str_new(0, 0); @@ -727,21 +1057,24 @@ proc_options(int argc, char **argv, struct cmdline_options *opt) case 'r': forbid_setid("-r"); if (*++s) { - add_modules(opt, s); + add_modules(&opt->req_list, s); } - else if (argv[1]) { - add_modules(opt, argv[1]); + else if (argc > 1) { + add_modules(&opt->req_list, argv[1]); argc--, argv++; } break; case 'i': + if (envopt) goto noenvopt; forbid_setid("-i"); ruby_set_inplace_mode(s + 1); break; case 'x': - opt->xflag = Qtrue; + if (envopt) goto noenvopt; + forbid_setid("-x"); + opt->xflag = TRUE; s++; if (*s && chdir(s) < 0) { rb_fatal("Can't chdir to %s", s); @@ -750,12 +1083,8 @@ proc_options(int argc, char **argv, struct cmdline_options *opt) case 'C': case 'X': - s++; - if (!*s) { - s = argv[1]; - argc--, argv++; - } - if (!s || !*s) { + if (envopt) goto noenvopt; + if (!*++s && (!--argc || !(s = *++argv) || !*s)) { rb_fatal("Can't chdir"); } if (chdir(s) < 0) { @@ -764,15 +1093,23 @@ proc_options(int argc, char **argv, struct cmdline_options *opt) break; case 'F': + if (envopt) goto noenvopt; if (*++s) { rb_fs = rb_reg_new(s, strlen(s), 0); } break; case 'E': - if (!*++s) goto next_encoding; + if (!*++s && (!--argc || !(s = *++argv))) { + rb_raise(rb_eRuntimeError, "missing argument for -E"); + } goto encoding; + case 'U': + set_internal_encoding_once(opt, "UTF-8", 0); + ++s; + goto reswitch; + case 'K': if (*++s) { const char *enc_name = 0; @@ -792,7 +1129,8 @@ proc_options(int argc, char **argv, struct cmdline_options *opt) } if (enc_name) { opt->src.enc.name = rb_str_new2(enc_name); - opt->ext.enc.name = opt->src.enc.name; + if (!opt->ext.enc.name) + opt->ext.enc.name = opt->src.enc.name; } s++; } @@ -800,7 +1138,7 @@ proc_options(int argc, char **argv, struct cmdline_options *opt) case 'T': { - int numlen; + size_t numlen; int v = 1; if (*++s) { @@ -809,7 +1147,7 @@ proc_options(int argc, char **argv, struct cmdline_options *opt) v = 1; s += numlen; } - rb_set_safe_level(v); + if (v > opt->safe_level) opt->safe_level = v; } goto reswitch; @@ -817,15 +1155,16 @@ proc_options(int argc, char **argv, struct cmdline_options *opt) forbid_setid("-I"); if (*++s) ruby_incpush_expand(s); - else if (argv[1]) { + else if (argc > 1) { ruby_incpush_expand(argv[1]); argc--, argv++; } break; case '0': + if (envopt) goto noenvopt; { - int numlen; + size_t numlen; int v; char c; @@ -834,7 +1173,7 @@ proc_options(int argc, char **argv, struct cmdline_options *opt) if (v > 0377) rb_rs = Qnil; else if (v == 0 && numlen >= 2) { - rb_rs = rb_str_new2("\n\n"); + rb_rs = rb_str_new2(""); } else { c = v & 0xff; @@ -849,52 +1188,97 @@ proc_options(int argc, char **argv, struct cmdline_options *opt) goto switch_end; } s++; - if (strcmp("copyright", s) == 0) - opt->copyright = 1; - else if (strcmp("debug", s) == 0) { - ruby_debug = Qtrue; - ruby_verbose = Qtrue; - } - else if (strncmp("enable", s, n = 6) == 0 && - (!s[n] || s[n] == '-' || s[n] == '=')) { - if ((s += n + 1)[-1] ? !*s : (!--argc || !(s = *++argv))) { - rb_raise(rb_eRuntimeError, "missing argument for --enable"); - } - ruby_each_words(s, enable_option, &opt->disable); + +# define is_option_end(c, allow_hyphen) \ + (!(c) || ((allow_hyphen) && (c) == '-') || (c) == '=') +# define check_envopt(name, allow_envopt) \ + (((allow_envopt) || !envopt) ? (void)0 : \ + rb_raise(rb_eRuntimeError, "invalid switch in RUBYOPT: --" name)) +# define need_argument(name, s, needs_arg, next_arg) \ + ((*(s) ? !*++(s) : (next_arg) && (!argc || !((s) = argv[1]) || (--argc, ++argv, 0))) && (needs_arg) ? \ + rb_raise(rb_eRuntimeError, "missing argument for --" name) \ + : (void)0) +# define is_option_with_arg(name, allow_hyphen, allow_envopt) \ + is_option_with_optarg(name, allow_hyphen, allow_envopt, Qtrue, Qtrue) +# define is_option_with_optarg(name, allow_hyphen, allow_envopt, needs_arg, next_arg) \ + (strncmp((name), s, n = sizeof(name) - 1) == 0 && is_option_end(s[n], (allow_hyphen)) ? \ + (check_envopt(name, (allow_envopt)), s += n, \ + need_argument(name, s, needs_arg, next_arg), 1) : 0) + + if (strcmp("copyright", s) == 0) { + if (envopt) goto noenvopt_long; + opt->dump |= DUMP_BIT(copyright); } - else if (strncmp("disable", s, n = 7) == 0 && - (!s[n] || s[n] == '-' || s[n] == '=')) { - if ((s += n + 1)[-1] ? !*s : (!--argc || !(s = *++argv))) { - rb_raise(rb_eRuntimeError, "missing argument for --disable"); + else if (is_option_with_optarg("debug", Qtrue, Qtrue, Qfalse, Qfalse)) { + if (s && *s) { + ruby_each_words(s, debug_option, &opt->features); } - ruby_each_words(s, disable_option, &opt->disable); - } - else if (strncmp("encoding", s, n = 8) == 0 && (!s[n] || s[n] == '=')) { - s += n; - if (!*s++) { - next_encoding: - if (!--argc || !(s = *++argv)) { - rb_raise(rb_eRuntimeError, "missing argument for --encoding"); - } + else { + ruby_debug = Qtrue; + ruby_verbose = Qtrue; } + } + else if (is_option_with_arg("enable", Qtrue, Qtrue)) { + ruby_each_words(s, enable_option, &opt->features); + } + else if (is_option_with_arg("disable", Qtrue, Qtrue)) { + ruby_each_words(s, disable_option, &opt->features); + } + else if (is_option_with_arg("encoding", Qfalse, Qtrue)) { + char *p; encoding: - opt->ext.enc.name = rb_str_new2(s); + do { +# define set_encoding_part(type) \ + if (!(p = strchr(s, ':'))) { \ + set_##type##_encoding_once(opt, s, 0); \ + break; \ + } \ + else if (p > s) { \ + set_##type##_encoding_once(opt, s, p-s); \ + } + set_encoding_part(external); + if (!*(s = ++p)) break; + set_encoding_part(internal); + if (!*(s = ++p)) break; +#if defined ALLOW_DEFAULT_SOURCE_ENCODING && ALLOW_DEFAULT_SOURCE_ENCODING + set_encoding_part(source); + if (!*(s = ++p)) break; +#endif + rb_raise(rb_eRuntimeError, "extra argument for %s: %s", + (arg[1] == '-' ? "--encoding" : "-E"), s); +# undef set_encoding_part + } while (0); + } + else if (is_option_with_arg("internal-encoding", Qfalse, Qtrue)) { + set_internal_encoding_once(opt, s, 0); + } + else if (is_option_with_arg("external-encoding", Qfalse, Qtrue)) { + set_external_encoding_once(opt, s, 0); + } +#if defined ALLOW_DEFAULT_SOURCE_ENCODING && ALLOW_DEFAULT_SOURCE_ENCODING + else if (is_option_with_arg("source-encoding", Qfalse, Qtrue)) { + set_source_encoding_once(opt, s, 0); + } +#endif + else if (strcmp("version", s) == 0) { + if (envopt) goto noenvopt_long; + opt->dump |= DUMP_BIT(version); } - else if (strcmp("version", s) == 0) - opt->version = 1; else if (strcmp("verbose", s) == 0) { opt->verbose = 1; ruby_verbose = Qtrue; } - else if (strcmp("yydebug", s) == 0) - opt->yydebug = 1; - else if (strncmp("dump", s, n = 4) == 0 && (!s[n] || s[n] == '=')) { - if (!(s += n + 1)[-1] && (!--argc || !(s = *++argv)) && *s != '-') break; + else if (strcmp("yydebug", s) == 0) { + if (envopt) goto noenvopt_long; + opt->dump |= DUMP_BIT(yydebug); + } + else if (is_option_with_arg("dump", Qfalse, Qfalse)) { ruby_each_words(s, dump_option, &opt->dump); } else if (strcmp("help", s) == 0) { - usage(origarg.argv[0]); - rb_exit(EXIT_SUCCESS); + if (envopt) goto noenvopt_long; + opt->dump |= DUMP_BIT(help); + goto switch_end; } else { rb_raise(rb_eRuntimeError, @@ -921,22 +1305,35 @@ proc_options(int argc, char **argv, struct cmdline_options *opt) } goto switch_end; + noenvopt: + /* "EIdvwWrKU" only */ + rb_raise(rb_eRuntimeError, "invalid switch in RUBYOPT: -%c", *s); + break; + + noenvopt_long: + rb_raise(rb_eRuntimeError, "invalid switch in RUBYOPT: --%s", s); + break; + case 0: break; +# undef is_option_end +# undef check_envopt +# undef need_argument +# undef is_option_with_arg +# undef is_option_with_optarg } } switch_end: + if (warning) opt->warning = warning; return argc0 - argc; } -void Init_prelude(void); - static void -ruby_init_gems(int enable) +ruby_init_prelude(void) { - if (enable) rb_define_module("Gem"); Init_prelude(); + rb_const_remove(rb_cObject, rb_intern_const("TMP_RUBY_PREFIX")); } static int @@ -954,95 +1351,180 @@ opt_enc_index(VALUE enc_name) return i; } -#define rb_progname (GET_VM()->progname) +#define rb_progname (GET_VM()->progname) +#define rb_orig_progname (GET_VM()->orig_progname) VALUE rb_argv0; static VALUE -process_options(VALUE arg) +false_value(void) +{ + return Qfalse; +} + +static VALUE +true_value(void) +{ + return Qtrue; +} + +#define rb_define_readonly_boolean(name, val) \ + rb_define_virtual_variable((name), (val) ? true_value : false_value, 0) + +static VALUE +uscore_get(void) +{ + VALUE line; + + line = rb_lastline_get(); + if (!RB_TYPE_P(line, T_STRING)) { + rb_raise(rb_eTypeError, "$_ value need to be String (%s given)", + NIL_P(line) ? "nil" : rb_obj_classname(line)); + } + return line; +} + +/* + * call-seq: + * sub(pattern, replacement) -> $_ + * sub(pattern) {|...| block } -> $_ + * + * Equivalent to <code>$_.sub(<i>args</i>)</code>, except that + * <code>$_</code> will be updated if substitution occurs. + * Available only when -p/-n command line option specified. + */ + +static VALUE +rb_f_sub(int argc, VALUE *argv) +{ + VALUE str = rb_funcall_passing_block(uscore_get(), rb_intern("sub"), argc, argv); + rb_lastline_set(str); + return str; +} + +/* + * call-seq: + * gsub(pattern, replacement) -> $_ + * gsub(pattern) {|...| block } -> $_ + * + * Equivalent to <code>$_.gsub...</code>, except that <code>$_</code> + * will be updated if substitution occurs. + * Available only when -p/-n command line option specified. + * + */ + +static VALUE +rb_f_gsub(int argc, VALUE *argv) +{ + VALUE str = rb_funcall_passing_block(uscore_get(), rb_intern("gsub"), argc, argv); + rb_lastline_set(str); + return str; +} + +/* + * call-seq: + * chop -> $_ + * + * Equivalent to <code>($_.dup).chop!</code>, except <code>nil</code> + * is never returned. See <code>String#chop!</code>. + * Available only when -p/-n command line option specified. + * + */ + +static VALUE +rb_f_chop(void) +{ + VALUE str = rb_funcall_passing_block(uscore_get(), rb_intern("chop"), 0, 0); + rb_lastline_set(str); + return str; +} + + +/* + * call-seq: + * chomp -> $_ + * chomp(string) -> $_ + * + * Equivalent to <code>$_ = $_.chomp(<em>string</em>)</code>. See + * <code>String#chomp</code>. + * Available only when -p/-n command line option specified. + * + */ + +static VALUE +rb_f_chomp(int argc, VALUE *argv) +{ + VALUE str = rb_funcall_passing_block(uscore_get(), rb_intern("chomp"), argc, argv); + rb_lastline_set(str); + return str; +} + +static VALUE +process_options(int argc, char **argv, ruby_cmdline_options_t *opt) { - struct cmdline_arguments *argp = (struct cmdline_arguments *)arg; - struct cmdline_options *opt = argp->opt; - int argc = argp->argc; - char **argv = argp->argv; - NODE *tree = 0; + rb_ast_t *ast = 0; VALUE parser; - VALUE iseq; + VALUE script_name; + const rb_iseq_t *iseq; rb_encoding *enc, *lenc; +#if UTF8_PATH + rb_encoding *uenc, *ienc = 0; +#endif const char *s; char fbuf[MAXPATHLEN]; - int i = proc_options(argc, argv, opt); - int safe; + int i = (int)proc_options(argc, argv, opt, 0); + rb_binding_t *toplevel_binding; + const struct rb_block *base_block; + unsigned int dump = opt->dump & dump_exit_bits; + + if (opt->dump & (DUMP_BIT(usage)|DUMP_BIT(help))) { + const char *const progname = + (argc > 0 && argv && argv[0] ? argv[0] : + origarg.argc > 0 && origarg.argv && origarg.argv[0] ? origarg.argv[0] : + ruby_engine); + usage(progname, (opt->dump & DUMP_BIT(help))); + return Qtrue; + } argc -= i; argv += i; - if (!(opt->disable & DISABLE_BIT(rubyopt)) && - rb_safe_level() == 0 && (s = getenv("RUBYOPT"))) { + if ((opt->features & FEATURE_BIT(rubyopt)) && + opt->safe_level == 0 && (s = getenv("RUBYOPT"))) { VALUE src_enc_name = opt->src.enc.name; VALUE ext_enc_name = opt->ext.enc.name; + VALUE int_enc_name = opt->intern.enc.name; - while (ISSPACE(*s)) - s++; - if (*s == 'T' || (*s == '-' && *(s + 1) == 'T')) { - int numlen; - int v = 1; - - if (*s != 'T') - ++s; - if (*++s) { - v = scan_oct(s, 2, &numlen); - if (numlen == 0) - v = 1; - } - rb_set_safe_level(v); - } - else { - while (s && *s) { - if (*s == '-') { - s++; - if (ISSPACE(*s)) { - do { - s++; - } while (ISSPACE(*s)); - continue; - } - } - if (!*s) - break; - if (!strchr("EIdvwWrK", *s)) - rb_raise(rb_eRuntimeError, - "invalid switch in RUBYOPT: -%c", *s); - s = moreswitches(s, opt); - } - } + opt->src.enc.name = opt->ext.enc.name = opt->intern.enc.name = 0; + moreswitches(s, opt, 1); if (src_enc_name) opt->src.enc.name = src_enc_name; if (ext_enc_name) opt->ext.enc.name = ext_enc_name; + if (int_enc_name) + opt->intern.enc.name = int_enc_name; } - if (opt->version) { + if (opt->src.enc.name) + rb_warning("-K is specified; it is for 1.8 compatibility and may cause odd behavior"); + + if (opt->dump & (DUMP_BIT(version) | DUMP_BIT(version_v))) { ruby_show_version(); - return Qtrue; + if (opt->dump & DUMP_BIT(version)) return Qtrue; } - if (opt->copyright) { + if (opt->dump & DUMP_BIT(copyright)) { ruby_show_copyright(); - } - - if (rb_safe_level() >= 4) { - OBJ_TAINT(rb_argv); - OBJ_TAINT(GET_VM()->load_path); + return Qtrue; } if (!opt->e_script) { - if (argc == 0) { /* no more args */ + if (argc <= 0) { /* no more args */ if (opt->verbose) return Qtrue; opt->script = "-"; } else { opt->script = argv[0]; - if (opt->script[0] == '\0') { + if (!opt->script || opt->script[0] == '\0') { opt->script = "-"; } else if (opt->do_search) { @@ -1061,30 +1543,36 @@ process_options(VALUE arg) argc--; argv++; } + if (opt->script[0] == '-' && !opt->script[1]) { + forbid_setid("program input from stdin"); + } } - ruby_script(opt->script); -#if defined DOSISH || defined __CYGWIN__ - translate_char(RSTRING_PTR(rb_progname), '\\', '/'); -#endif - opt->script_name = rb_str_new4(rb_progname); + opt->script_name = rb_str_new_cstr(opt->script); opt->script = RSTRING_PTR(opt->script_name); - ruby_set_argv(argc, argv); - process_sflag(opt); - ruby_init_loadpath(); - safe = rb_safe_level(); - rb_set_safe_level_force(0); - ruby_init_gems(!(opt->disable & DISABLE_BIT(gems))); +#if _WIN32 + translit_char_bin(RSTRING_PTR(opt->script_name), '\\', '/'); +#elif defined DOSISH + translit_char(RSTRING_PTR(opt->script_name), '\\', '/'); +#endif + + ruby_gc_set_params(opt->safe_level); + ruby_init_loadpath_safe(opt->safe_level); + Init_enc(); lenc = rb_locale_encoding(); - for (i = 0; i < RARRAY_LEN(rb_argv); i++) { - rb_enc_associate(RARRAY_PTR(rb_argv)[i], lenc); - } + rb_enc_associate(rb_progname, lenc); + rb_obj_freeze(rb_progname); parser = rb_parser_new(); - if (opt->yydebug) rb_parser_set_yydebug(parser, Qtrue); + if (opt->dump & DUMP_BIT(yydebug)) { + rb_parser_set_yydebug(parser, Qtrue); + } if (opt->ext.enc.name != 0) { opt->ext.enc.index = opt_enc_index(opt->ext.enc.name); } + if (opt->intern.enc.name != 0) { + opt->intern.enc.index = opt_enc_index(opt->intern.enc.name); + } if (opt->src.enc.name != 0) { opt->src.enc.index = opt_enc_index(opt->src.enc.name); src_encoding_index = opt->src.enc.index; @@ -1096,176 +1584,294 @@ process_options(VALUE arg) enc = lenc; } rb_enc_set_default_external(rb_enc_from_encoding(enc)); + if (opt->intern.enc.index >= 0) { + enc = rb_enc_from_index(opt->intern.enc.index); + rb_enc_set_default_internal(rb_enc_from_encoding(enc)); + opt->intern.enc.index = -1; +#if UTF8_PATH + ienc = enc; +#endif + } + script_name = opt->script_name; + rb_enc_associate(opt->script_name, + IF_UTF8_PATH(uenc = rb_utf8_encoding(), lenc)); +#if UTF8_PATH + if (uenc != lenc) { + opt->script_name = str_conv_enc(opt->script_name, uenc, lenc); + opt->script = RSTRING_PTR(opt->script_name); + } +#endif + rb_obj_freeze(opt->script_name); + if (IF_UTF8_PATH(uenc != lenc, 1)) { + long i; + rb_vm_t *vm = GET_VM(); + VALUE load_path = vm->load_path; + const ID id_initial_load_path_mark = INITIAL_LOAD_PATH_MARK; + int modifiable = FALSE; + + rb_get_expanded_load_path(); + for (i = 0; i < RARRAY_LEN(load_path); ++i) { + VALUE path = RARRAY_AREF(load_path, i); + int mark = rb_attr_get(path, id_initial_load_path_mark) == path; +#if UTF8_PATH + VALUE newpath = rb_str_conv_enc(path, uenc, lenc); + if (newpath == path) continue; + path = newpath; +#else + path = rb_enc_associate(rb_str_dup(path), lenc); +#endif + if (mark) rb_ivar_set(path, id_initial_load_path_mark, path); + if (!modifiable) { + rb_ary_modify(load_path); + modifiable = TRUE; + } + RARRAY_ASET(load_path, i, path); + } + if (modifiable) { + rb_ary_replace(vm->load_path_snapshot, load_path); + } + } + Init_ext(); /* load statically linked extensions before rubygems */ + if (opt->features & FEATURE_BIT(gems)) { + rb_define_module("Gem"); + } + if (opt->features & FEATURE_BIT(did_you_mean)) { + rb_define_module("DidYouMean"); + } + ruby_init_prelude(); + if ((opt->features ^ DEFAULT_FEATURES) & COMPILATION_FEATURES) { + VALUE option = rb_hash_new(); +#define SET_COMPILE_OPTION(h, o, name) \ + rb_hash_aset((h), ID2SYM(rb_intern_const(#name)), \ + ((o)->features & FEATURE_BIT(name) ? Qtrue : Qfalse)); + SET_COMPILE_OPTION(option, opt, frozen_string_literal); + SET_COMPILE_OPTION(option, opt, debug_frozen_string_literal); + rb_funcallv(rb_cISeq, rb_intern_const("compile_option="), 1, &option); +#undef SET_COMPILE_OPTION + } + ruby_set_argv(argc, argv); + process_sflag(&opt->sflag); + + GetBindingPtr(rb_const_get(rb_cObject, rb_intern("TOPLEVEL_BINDING")), + toplevel_binding); + /* need to acquire env from toplevel_binding each time, since it + * may update after eval() */ + + base_block = toplevel_context(toplevel_binding); + rb_parser_set_context(parser, base_block, TRUE); - rb_set_safe_level_force(safe); if (opt->e_script) { + VALUE progname = rb_progname; rb_encoding *eenc; if (opt->src.enc.index >= 0) { eenc = rb_enc_from_index(opt->src.enc.index); } else { eenc = lenc; +#if UTF8_PATH + if (ienc) eenc = ienc; +#endif + } +#if UTF8_PATH + if (eenc != uenc) { + opt->e_script = str_conv_enc(opt->e_script, uenc, eenc); } +#endif rb_enc_associate(opt->e_script, eenc); - require_libraries(opt); - tree = rb_parser_compile_string(parser, opt->script, opt->e_script, 1); + if (!(opt->dump & ~DUMP_BIT(version_v))) { + ruby_set_script_name(opt->script_name); + require_libraries(&opt->req_list); + } + ruby_set_script_name(progname); + rb_parser_set_options(parser, opt->do_print, opt->do_loop, + opt->do_line, opt->do_split); + ast = rb_parser_compile_string(parser, opt->script, opt->e_script, 1); } else { - if (opt->script[0] == '-' && !opt->script[1]) { - forbid_setid("program input from stdin"); - } - tree = load_file(parser, opt->script, 1, opt); + VALUE f; + f = open_load_file(script_name, &opt->xflag); + ast = load_file(parser, opt->script_name, f, 1, opt); + } + ruby_set_script_name(opt->script_name); + if (dump & DUMP_BIT(yydebug)) { + dump &= ~DUMP_BIT(yydebug); + if (!dump) return Qtrue; } - if (!tree) return Qfalse; + if (opt->ext.enc.index >= 0) { + enc = rb_enc_from_index(opt->ext.enc.index); + } + else { + enc = lenc; + } + rb_enc_set_default_external(rb_enc_from_encoding(enc)); + if (opt->intern.enc.index >= 0) { + /* Set in the shebang line */ + enc = rb_enc_from_index(opt->intern.enc.index); + rb_enc_set_default_internal(rb_enc_from_encoding(enc)); + } + else if (!rb_default_internal_encoding()) + /* Freeze default_internal */ + rb_enc_set_default_internal(Qnil); + rb_stdio_set_default_encoding(); + + if (!ast->root) { + rb_ast_dispose(ast); + return Qfalse; + } - process_sflag(opt); + process_sflag(&opt->sflag); opt->xflag = 0; - if (rb_safe_level() >= 4) { - FL_UNSET(rb_argv, FL_TAINT); - FL_UNSET(GET_VM()->load_path, FL_TAINT); - } - - if (opt->do_check) { + if (dump & DUMP_BIT(syntax)) { printf("Syntax OK\n"); - return Qtrue; + dump &= ~DUMP_BIT(syntax); + if (!dump) return Qtrue; } - if (opt->do_print) { - tree = rb_parser_append_print(parser, tree); - } if (opt->do_loop) { - tree = rb_parser_while_loop(parser, tree, opt->do_line, opt->do_split); + rb_define_global_function("sub", rb_f_sub, -1); + rb_define_global_function("gsub", rb_f_gsub, -1); + rb_define_global_function("chop", rb_f_chop, 0); + rb_define_global_function("chomp", rb_f_chomp, -1); + } + + if (dump & (DUMP_BIT(parsetree)|DUMP_BIT(parsetree_with_comment))) { + rb_io_write(rb_stdout, rb_parser_dump_tree(ast->root, dump & DUMP_BIT(parsetree_with_comment))); + rb_io_flush(rb_stdout); + dump &= ~DUMP_BIT(parsetree)&~DUMP_BIT(parsetree_with_comment); + if (!dump) { + rb_ast_dispose(ast); + return Qtrue; + } } - iseq = rb_iseq_new(tree, rb_str_new2("<main>"), - opt->script_name, Qfalse, ISEQ_TYPE_TOP); + { + VALUE path = Qnil; + if (!opt->e_script && strcmp(opt->script, "-")) { + path = rb_realpath_internal(Qnil, script_name, 1); +#if UTF8_PATH + if (uenc != lenc) { + path = str_conv_enc(path, uenc, lenc); + } +#endif + if (!ENCODING_GET(path)) { /* ASCII-8BIT */ + rb_enc_copy(path, opt->script_name); + } + } + base_block = toplevel_context(toplevel_binding); + iseq = rb_iseq_new_main(ast->root, opt->script_name, path, vm_block_iseq(base_block)); + rb_ast_dispose(ast); + } - if (opt->dump & DUMP_BIT(insns)) { - rb_io_write(rb_stdout, ruby_iseq_disasm(iseq)); + if (dump & DUMP_BIT(insns)) { + rb_io_write(rb_stdout, rb_iseq_disasm((const rb_iseq_t *)iseq)); rb_io_flush(rb_stdout); - return Qtrue; + dump &= ~DUMP_BIT(insns); + if (!dump) return Qtrue; } + if (opt->dump & dump_exit_bits) return Qtrue; - return iseq; + rb_define_readonly_boolean("$-p", opt->do_print); + rb_define_readonly_boolean("$-l", opt->do_line); + rb_define_readonly_boolean("$-a", opt->do_split); + + rb_set_safe_level(opt->safe_level); + + return (VALUE)iseq; } -static NODE * -load_file(VALUE parser, const char *fname, int script, struct cmdline_options *opt) +#ifndef DOSISH +static void +warn_cr_in_shebang(const char *str, long len) { - extern VALUE rb_stdin; - VALUE f; - int line_start = 1; - NODE *tree = 0; - rb_encoding *enc; - - if (!fname) - rb_load_fail(fname); - if (strcmp(fname, "-") == 0) { - f = rb_stdin; + if (str[len-1] == '\n' && str[len-2] == '\r') { + rb_warn("shebang line ending with \\r may cause problems"); } - else { - int fd, mode = O_RDONLY; -#if defined DOSISH || defined __CYGWIN__ - { - const char *ext = strrchr(fname, '.'); - if (ext && STRCASECMP(ext, ".exe") == 0) - mode |= O_BINARY; - } +} +#else +#define warn_cr_in_shebang(str, len) (void)0 #endif - if ((fd = open(fname, mode)) < 0) { - rb_load_fail(fname); - } - f = rb_io_fdopen(fd, mode, fname); - } +struct load_file_arg { + VALUE parser; + VALUE fname; + int script; + ruby_cmdline_options_t *opt; + VALUE f; +}; + +static VALUE +load_file_internal(VALUE argp_v) +{ + struct load_file_arg *argp = (struct load_file_arg *)argp_v; + VALUE parser = argp->parser; + VALUE orig_fname = argp->fname; + int script = argp->script; + ruby_cmdline_options_t *opt = argp->opt; + VALUE f = argp->f; + int line_start = 1; + rb_ast_t *ast = 0; + rb_encoding *enc; + ID set_encoding; + CONST_ID(set_encoding, "set_encoding"); if (script) { VALUE c = 1; /* something not nil */ VALUE line; - char *p; + char *p, *str; + long len; int no_src_enc = !opt->src.enc.name; int no_ext_enc = !opt->ext.enc.name; + int no_int_enc = !opt->intern.enc.name; - enc = rb_usascii_encoding(); - rb_funcall(f, rb_intern("set_encoding"), 1, rb_enc_from_encoding(enc)); + enc = rb_ascii8bit_encoding(); + rb_funcall(f, set_encoding, 1, rb_enc_from_encoding(enc)); if (opt->xflag) { - forbid_setid("-x"); - opt->xflag = Qfalse; + line_start--; + search_shebang: while (!NIL_P(line = rb_io_gets(f))) { line_start++; - if (RSTRING_LEN(line) > 2 - && RSTRING_PTR(line)[0] == '#' - && RSTRING_PTR(line)[1] == '!') { - if ((p = strstr(RSTRING_PTR(line), "ruby")) != 0) { + RSTRING_GETMEM(line, str, len); + if (len > 2 && str[0] == '#' && str[1] == '!') { + if (line_start == 1) warn_cr_in_shebang(str, len); + if ((p = strstr(str+2, ruby_engine)) != 0) { goto start_read; } } } - rb_raise(rb_eLoadError, "no Ruby script found in input"); + rb_loaderror("no Ruby script found in input"); } c = rb_io_getbyte(f); if (c == INT2FIX('#')) { c = rb_io_getbyte(f); - if (c == INT2FIX('!')) { - line = rb_io_gets(f); - if (NIL_P(line)) - return 0; - - if ((p = strstr(RSTRING_PTR(line), "ruby")) == 0) { - /* not ruby script, kick the program */ - char **argv; - char *path; - char *pend = RSTRING_PTR(line) + RSTRING_LEN(line); - - p = RSTRING_PTR(line); /* skip `#!' */ - if (pend[-1] == '\n') - pend--; /* chomp line */ - if (pend[-1] == '\r') - pend--; - *pend = '\0'; - while (p < pend && ISSPACE(*p)) - p++; - path = p; /* interpreter path */ - while (p < pend && !ISSPACE(*p)) - p++; - *p++ = '\0'; - if (p < pend) { - argv = ALLOCA_N(char *, origarg.argc + 3); - argv[1] = p; - MEMCPY(argv + 2, origarg.argv + 1, char *, origarg.argc); - } - else { - argv = origarg.argv; - } - argv[0] = path; - execv(path, argv); - - rb_fatal("Can't exec %s", path); + if (c == INT2FIX('!') && !NIL_P(line = rb_io_gets(f))) { + RSTRING_GETMEM(line, str, len); + warn_cr_in_shebang(str, len); + if ((p = strstr(str, ruby_engine)) == 0) { + /* not ruby script, assume -x flag */ + goto search_shebang; } start_read: - p += 4; - RSTRING_PTR(line)[RSTRING_LEN(line) - 1] = '\0'; - if (RSTRING_PTR(line)[RSTRING_LEN(line) - 2] == '\r') - RSTRING_PTR(line)[RSTRING_LEN(line) - 2] = '\0'; + str += len - 1; + if (*str == '\n') *str-- = '\0'; + if (*str == '\r') *str-- = '\0'; + /* ruby_engine should not contain a space */ if ((p = strstr(p, " -")) != 0) { - p++; /* skip space before `-' */ - while (*p == '-') { - p = moreswitches(p + 1, opt); - } + opt->warning = 0; + moreswitches(p + 1, opt, 0); } /* push back shebang for pragma may exist in next line */ - rb_io_ungetc(f, rb_str_new2("!\n")); + rb_io_ungetbyte(f, rb_str_new2("!\n")); } else if (!NIL_P(c)) { - rb_io_ungetc(f, c); + rb_io_ungetbyte(f, c); } - rb_io_ungetc(f, INT2FIX('#')); + rb_io_ungetbyte(f, INT2FIX('#')); if (no_src_enc && opt->src.enc.name) { opt->src.enc.index = opt_enc_index(opt->src.enc.name); src_encoding_index = opt->src.enc.index; @@ -1273,11 +1879,20 @@ load_file(VALUE parser, const char *fname, int script, struct cmdline_options *o if (no_ext_enc && opt->ext.enc.name) { opt->ext.enc.index = opt_enc_index(opt->ext.enc.name); } + if (no_int_enc && opt->intern.enc.name) { + opt->intern.enc.index = opt_enc_index(opt->intern.enc.name); + } } else if (!NIL_P(c)) { - rb_io_ungetc(f, c); + rb_io_ungetbyte(f, c); + } + else { + argp->f = f = Qnil; + } + if (!(opt->dump & ~DUMP_BIT(version_v))) { + ruby_set_script_name(opt->script_name); + require_libraries(&opt->req_list); /* Why here? unnatural */ } - require_libraries(opt); /* Why here? unnatural */ } if (opt->src.enc.index >= 0) { enc = rb_enc_from_index(opt->src.enc.index); @@ -1286,156 +1901,281 @@ load_file(VALUE parser, const char *fname, int script, struct cmdline_options *o enc = rb_locale_encoding(); } else { - enc = rb_usascii_encoding(); + enc = rb_utf8_encoding(); + } + rb_parser_set_options(parser, opt->do_print, opt->do_loop, + opt->do_line, opt->do_split); + if (NIL_P(f)) { + f = rb_str_new(0, 0); + rb_enc_associate(f, enc); + return (VALUE)rb_parser_compile_string_path(parser, orig_fname, f, line_start); } - rb_funcall(f, rb_intern("set_encoding"), 1, rb_enc_from_encoding(enc)); - tree = (NODE *)rb_parser_compile_file(parser, fname, f, line_start); - rb_funcall(f, rb_intern("set_encoding"), 1, rb_parser_encoding(parser)); + rb_funcall(f, set_encoding, 2, rb_enc_from_encoding(enc), rb_str_new_cstr("-")); + ast = rb_parser_compile_file_path(parser, orig_fname, f, line_start); + rb_funcall(f, set_encoding, 1, rb_parser_encoding(parser)); if (script && rb_parser_end_seen_p(parser)) { + /* + * DATA is a File that contains the data section of the executed file. + * To create a data section use <tt>__END__</tt>: + * + * $ cat t.rb + * puts DATA.gets + * __END__ + * hello world! + * + * $ ruby t.rb + * hello world! + */ rb_define_global_const("DATA", f); + argp->f = Qnil; + } + return (VALUE)ast; +} + +static VALUE +open_load_file(VALUE fname_v, int *xflag) +{ + const char *fname = (fname_v = rb_str_encode_ospath(fname_v), + StringValueCStr(fname_v)); + long flen = RSTRING_LEN(fname_v); + VALUE f; + int e; + + if (flen == 1 && fname[0] == '-') { + f = rb_stdin; + } + else { + int fd; + /* open(2) may block if fname is point to FIFO and it's empty. Let's + use O_NONBLOCK. */ +#if defined O_NONBLOCK && HAVE_FCNTL && !(O_NONBLOCK & O_ACCMODE) + /* TODO: fix conflicting O_NONBLOCK in ruby/win32.h */ +# define MODE_TO_LOAD (O_RDONLY | O_NONBLOCK) +#elif defined O_NDELAY && HAVE_FCNTL && !(O_NDELAY & O_ACCMODE) +# define MODE_TO_LOAD (O_RDONLY | O_NDELAY) +#else +# define MODE_TO_LOAD (O_RDONLY) +#endif + int mode = MODE_TO_LOAD; +#if defined DOSISH || defined __CYGWIN__ +# define isdirsep(x) ((x) == '/' || (x) == '\\') + { + static const char exeext[] = ".exe"; + enum {extlen = sizeof(exeext)-1}; + if (flen > extlen && !isdirsep(fname[flen-extlen-1]) && + STRNCASECMP(fname+flen-extlen, exeext, extlen) == 0) { + mode |= O_BINARY; + *xflag = 1; + } + } +#endif + + if ((fd = rb_cloexec_open(fname, mode, 0)) < 0) { + int e = errno; + if (!rb_gc_for_fd(e)) { + rb_load_fail(fname_v, strerror(e)); + } + if ((fd = rb_cloexec_open(fname, mode, 0)) < 0) { + rb_load_fail(fname_v, strerror(errno)); + } + } + rb_update_max_fd(fd); + +#if defined HAVE_FCNTL && MODE_TO_LOAD != O_RDONLY + /* disabling O_NONBLOCK */ + if (fcntl(fd, F_SETFL, 0) < 0) { + e = errno; + (void)close(fd); + rb_load_fail(fname_v, strerror(e)); + } +#endif + + e = ruby_is_fd_loadable(fd); + if (!e) { + e = errno; + (void)close(fd); + rb_load_fail(fname_v, strerror(e)); + } + + f = rb_io_fdopen(fd, mode, fname); + if (e < 0) { + /* + We need to wait if FIFO is empty. It's FIFO's semantics. + rb_thread_wait_fd() release GVL. So, it's safe. + */ + rb_thread_wait_fd(fd); + } } - else if (f != rb_stdin) { + return f; +} + +static VALUE +restore_load_file(VALUE arg) +{ + struct load_file_arg *argp = (struct load_file_arg *)arg; + VALUE f = argp->f; + + if (!NIL_P(f) && f != rb_stdin) { rb_io_close(f); } - return tree; + return Qnil; +} + +static rb_ast_t * +load_file(VALUE parser, VALUE fname, VALUE f, int script, ruby_cmdline_options_t *opt) +{ + struct load_file_arg arg; + arg.parser = parser; + arg.fname = fname; + arg.script = script; + arg.opt = opt; + arg.f = f; + return (rb_ast_t *)rb_ensure(load_file_internal, (VALUE)&arg, + restore_load_file, (VALUE)&arg); } void * rb_load_file(const char *fname) { - struct cmdline_options opt; + VALUE fname_v = rb_str_new_cstr(fname); + return rb_load_file_str(fname_v); +} - return load_file(rb_parser_new(), fname, 0, cmdline_options_init(&opt)); +void * +rb_load_file_str(VALUE fname_v) +{ + return rb_parser_load_file(rb_parser_new(), fname_v); } -#if !defined(PSTAT_SETCMD) && !defined(HAVE_SETPROCTITLE) -#if !defined(_WIN32) && !(defined(HAVE_SETENV) && defined(HAVE_UNSETENV)) -#define USE_ENVSPACE_FOR_ARG0 -#endif +void * +rb_parser_load_file(VALUE parser, VALUE fname_v) +{ + ruby_cmdline_options_t opt; + VALUE f = open_load_file(fname_v, &cmdline_options_init(&opt)->xflag); + return load_file(parser, fname_v, f, 0, &opt); +} -#ifdef USE_ENVSPACE_FOR_ARG0 -extern char **environ; -#endif +/* + * call-seq: + * Process.argv0 -> frozen_string + * + * Returns the name of the script being executed. The value is not + * affected by assigning a new value to $0. + * + * This method first appeared in Ruby 2.1 to serve as a global + * variable free means to get the script name. + */ -static int -get_arglen(int argc, char **argv) +static VALUE +proc_argv0(VALUE process) { - char *s = argv[0]; - int i; + return rb_orig_progname; +} - if (!argc) return 0; - s += strlen(s); - /* See if all the arguments are contiguous in memory */ - for (i = 1; i < argc; i++) { - if (argv[i] == s + 1) { - s++; - s += strlen(s); /* this one is ok too */ - } - else { - break; - } - } -#if defined(USE_ENVSPACE_FOR_ARG0) - if (environ && (s == environ[0])) { - s += strlen(s); - for (i = 1; environ[i]; i++) { - if (environ[i] == s + 1) { - s++; - s += strlen(s); /* this one is ok too */ - } - } - ruby_setenv("", NULL); /* duplicate environ vars */ - } -#endif - return s - argv[0]; +static VALUE ruby_setproctitle(VALUE title); + +/* + * call-seq: + * Process.setproctitle(string) -> string + * + * Sets the process title that appears on the ps(1) command. Not + * necessarily effective on all platforms. No exception will be + * raised regardless of the result, nor will NotImplementedError be + * raised even if the platform does not support the feature. + * + * Calling this method does not affect the value of $0. + * + * Process.setproctitle('myapp: worker #%d' % worker_id) + * + * This method first appeared in Ruby 2.1 to serve as a global + * variable free means to change the process title. + */ + +static VALUE +proc_setproctitle(VALUE process, VALUE title) +{ + return ruby_setproctitle(title); +} + +static VALUE +ruby_setproctitle(VALUE title) +{ + const char *ptr = StringValueCStr(title); + setproctitle("%.*s", RSTRING_LENINT(title), ptr); + return title; } -#endif static void set_arg0(VALUE val, ID id) { - char *s; - long i; - if (origarg.argv == 0) rb_raise(rb_eRuntimeError, "$0 not initialized"); - StringValue(val); - s = RSTRING_PTR(val); - i = RSTRING_LEN(val); -#if defined(PSTAT_SETCMD) - if (i > PST_CLEN) { - union pstun un; - char buf[PST_CLEN + 1]; /* PST_CLEN is 64 (HP-UX 11.23) */ - strncpy(buf, s, PST_CLEN); - buf[PST_CLEN] = '\0'; - un.pst_command = buf; - pstat(PSTAT_SETCMD, un, PST_CLEN, 0, 0); - } - else { - union pstun un; - un.pst_command = s; - pstat(PSTAT_SETCMD, un, i, 0, 0); - } -#elif defined(HAVE_SETPROCTITLE) - setproctitle("%.*s", (int)i, s); -#else - - if (i >= origarg.len) { - i = origarg.len; - } - - memcpy(origarg.argv[0], s, i); - { - int j; - char *t = origarg.argv[0] + i; - *t = '\0'; + rb_progname = rb_str_new_frozen(ruby_setproctitle(val)); +} - if (i + 1 < origarg.len) memset(t + 1, ' ', origarg.len - i - 1); - for (j = 1; j < origarg.argc; j++) { - origarg.argv[j] = t; - } - } +static inline VALUE +external_str_new_cstr(const char *p) +{ +#if UTF8_PATH + VALUE str = rb_utf8_str_new_cstr(p); + str = str_conv_enc(str, NULL, rb_default_external_encoding()); + OBJ_TAINT_RAW(str); + return str; +#else + return rb_external_str_new_cstr(p); #endif - rb_progname = rb_tainted_str_new(s, i); } +/*! Sets the current script name to this value. + * + * This is similar to <code>$0 = name</code> in Ruby level but also affects + * <code>Method#location</code> and others. + */ void ruby_script(const char *name) { if (name) { - rb_progname = rb_tainted_str_new2(name); + rb_orig_progname = rb_progname = external_str_new_cstr(name); + rb_vm_set_progname(rb_progname); } } +/*! Sets the current script name to this value. + * + * Same as ruby_script() but accepts a VALUE. + */ +void +ruby_set_script_name(VALUE name) +{ + rb_orig_progname = rb_progname = rb_str_dup(name); + rb_vm_set_progname(rb_progname); +} + static void -init_ids(struct cmdline_options *opt) +init_ids(ruby_cmdline_options_t *opt) { rb_uid_t uid = getuid(); rb_uid_t euid = geteuid(); rb_gid_t gid = getgid(); rb_gid_t egid = getegid(); -#ifdef VMS - uid |= gid << 16; - euid |= egid << 16; -#endif if (uid != euid) opt->setids |= 1; if (egid != gid) opt->setids |= 2; if (uid && opt->setids) { - rb_set_safe_level(1); + if (opt->safe_level < 1) opt->safe_level = 1; } } #undef forbid_setid static void -forbid_setid(const char *s, struct cmdline_options *opt) +forbid_setid(const char *s, const ruby_cmdline_options_t *opt) { if (opt->setids & 1) rb_raise(rb_eSecurityError, "no %s allowed while running setuid", s); if (opt->setids & 2) rb_raise(rb_eSecurityError, "no %s allowed while running setgid", s); - if (rb_safe_level() > 0) + if (opt->safe_level > 0) rb_raise(rb_eSecurityError, "no %s allowed in tainted mode", s); } @@ -1457,34 +2197,35 @@ opt_W_getter(ID id, void *data) return INT2FIX(1); case Qtrue: return INT2FIX(2); + default: + return Qnil; } - return Qnil; /* not reached */ } +/*! Defines built-in variables */ void ruby_prog_init(void) { rb_define_hooked_variable("$VERBOSE", &ruby_verbose, 0, verbose_setter); rb_define_hooked_variable("$-v", &ruby_verbose, 0, verbose_setter); rb_define_hooked_variable("$-w", &ruby_verbose, 0, verbose_setter); - rb_define_hooked_variable("$-W", &ruby_verbose, opt_W_getter, 0); + rb_define_hooked_variable("$-W", &ruby_verbose, opt_W_getter, rb_gvar_readonly_setter); rb_define_variable("$DEBUG", &ruby_debug); rb_define_variable("$-d", &ruby_debug); rb_define_hooked_variable("$0", &rb_progname, 0, set_arg0); rb_define_hooked_variable("$PROGRAM_NAME", &rb_progname, 0, set_arg0); - rb_define_global_const("ARGV", rb_argv); - rb_global_variable(&rb_argv0); + rb_define_module_function(rb_mProcess, "argv0", proc_argv0, 0); + rb_define_module_function(rb_mProcess, "setproctitle", proc_setproctitle, 1); -#ifdef MSDOS /* - * There is no way we can refer to them from ruby, so close them to save - * space. + * ARGV contains the command line arguments used to run ruby. + * + * A library like OptionParser can be used to process command-line + * arguments. */ - (void)fclose(stdaux); - (void)fclose(stdprn); -#endif + rb_define_global_const("ARGV", rb_argv); } void @@ -1494,91 +2235,92 @@ ruby_set_argv(int argc, char **argv) VALUE av = rb_argv; #if defined(USE_DLN_A_OUT) - if (origarg.argv) + if (origarg.argc > 0 && origarg.argv) dln_argv0 = origarg.argv[0]; - else + else if (argc > 0 && argv) dln_argv0 = argv[0]; #endif rb_ary_clear(av); for (i = 0; i < argc; i++) { - VALUE arg = rb_tainted_str_new2(argv[i]); + VALUE arg = external_str_new_cstr(argv[i]); OBJ_FREEZE(arg); rb_ary_push(av, arg); } } -static VALUE -false_value(void) -{ - return Qfalse; -} - -static VALUE -true_value(void) -{ - return Qtrue; -} - -#define rb_define_readonly_boolean(name, val) \ - rb_define_virtual_variable((name), (val) ? true_value : false_value, 0) - void * ruby_process_options(int argc, char **argv) { - struct cmdline_arguments args; - struct cmdline_options opt; - NODE *tree; + ruby_cmdline_options_t opt; + VALUE iseq; + const char *script_name = (argc > 0 && argv[0]) ? argv[0] : ruby_engine; - ruby_script(argv[0]); /* for the time being */ + if (!origarg.argv || origarg.argc <= 0) { + origarg.argc = argc; + origarg.argv = argv; + } + ruby_script(script_name); /* for the time being */ rb_argv0 = rb_str_new4(rb_progname); - args.argc = argc; - args.argv = argv; - args.opt = cmdline_options_init(&opt); - opt.ext.enc.index = -1; - tree = (NODE *)rb_vm_call_cfunc(rb_vm_top_self(), - process_options, (VALUE)&args, - 0, rb_progname); + rb_gc_register_mark_object(rb_argv0); + iseq = process_options(argc, argv, cmdline_options_init(&opt)); + +#ifndef HAVE_SETPROCTITLE + ruby_init_setproctitle(argc, argv); +#endif - rb_define_readonly_boolean("$-p", opt.do_print); - rb_define_readonly_boolean("$-l", opt.do_line); - rb_define_readonly_boolean("$-a", opt.do_split); + return (void*)(struct RData*)iseq; +} - return tree; +static void +fill_standard_fds(void) +{ + int f0, f1, f2, fds[2]; + struct stat buf; + f0 = fstat(0, &buf) == -1 && errno == EBADF; + f1 = fstat(1, &buf) == -1 && errno == EBADF; + f2 = fstat(2, &buf) == -1 && errno == EBADF; + if (f0) { + if (pipe(fds) == 0) { + close(fds[1]); + if (fds[0] != 0) { + dup2(fds[0], 0); + close(fds[0]); + } + } + } + if (f1 || f2) { + if (pipe(fds) == 0) { + close(fds[0]); + if (f1 && fds[1] != 1) + dup2(fds[1], 1); + if (f2 && fds[1] != 2) + dup2(fds[1], 2); + if (fds[1] != 1 && fds[1] != 2) + close(fds[1]); + } + } } +/*! Initializes the process for libruby. + * + * This function assumes this process is ruby(1) and it has just started. + * Usually programs that embed CRuby interpreter may not call this function, + * and may do their own initialization. + * argc and argv cannot be NULL. + */ void ruby_sysinit(int *argc, char ***argv) { -#if defined(__APPLE__) && (defined(__MACH__) || defined(__DARWIN__)) - int i, n = *argc, len = 0; - char **v1 = *argv, **v2, *p; - - for (i = 0; i < n; ++i) { - len += strlen(v1[i]) + 1; - } - v2 = malloc((n + 1)* sizeof(char*) + len); - p = (char *)&v2[n + 1]; - for (i = 0; i < n; ++i) { - int l = strlen(v1[i]); - memcpy(p, v1[i], l + 1); - v2[i] = p; - p += l + 1; - } - v2[n] = 0; - *argv = v2; -#elif defined(__MACOS__) && defined(__MWERKS__) - *argc = ccommand(argv); -#elif defined(_WIN32) - void rb_w32_sysinit(int *argc, char ***argv); +#if defined(_WIN32) rb_w32_sysinit(argc, argv); #endif - origarg.argc = *argc; - origarg.argv = *argv; -#if !defined(PSTAT_SETCMD) && !defined(HAVE_SETPROCTITLE) - origarg.len = get_arglen(origarg.argc, origarg.argv); -#endif + if (*argc >= 0 && *argv) { + origarg.argc = *argc; + origarg.argv = *argv; #if defined(USE_DLN_A_OUT) - dln_argv0 = origarg.argv[0]; + dln_argv0 = origarg.argv[0]; #endif + } + fill_standard_fds(); } |
