summaryrefslogtreecommitdiff
path: root/ruby.c
diff options
context:
space:
mode:
Diffstat (limited to 'ruby.c')
-rw-r--r--ruby.c2140
1 files changed, 1441 insertions, 699 deletions
diff --git a/ruby.c b/ruby.c
index 027b15f051..4ff30cceca 100644
--- a/ruby.c
+++ b/ruby.c
@@ -15,13 +15,8 @@
#include <windows.h>
#include <sys/cygwin.h>
#endif
-#ifdef _WIN32_WCE
-#include <winsock.h>
-#include "ruby/wince.h"
-#endif
-#include "ruby/ruby.h"
-#include "ruby/node.h"
-#include "ruby/encoding.h"
+#include "internal.h"
+#include "ruby/thread.h"
#include "eval_intern.h"
#include "dln.h"
#include <stdio.h>
@@ -31,6 +26,9 @@
#ifdef __hpux
#include <sys/pstat.h>
#endif
+#if defined(LOAD_RELATIVE) && defined(HAVE_DLADDR)
+#include <dlfcn.h>
+#endif
#ifdef HAVE_UNISTD_H
#include <unistd.h>
@@ -46,9 +44,8 @@
#ifndef MAXPATHLEN
# define MAXPATHLEN 1024
#endif
-
-#if defined(__MACOS__) && defined(__MWERKS__)
-#include <console.h>
+#ifndef O_ACCMODE
+# define O_ACCMODE (O_RDONLY | O_WRONLY | O_RDWR)
#endif
#include "ruby/util.h"
@@ -57,36 +54,74 @@
char *getenv();
#endif
-VALUE rb_parser_get_yydebug(VALUE);
-VALUE rb_parser_set_yydebug(VALUE, VALUE);
-
-const char *ruby_get_inplace_mode(void);
-void ruby_set_inplace_mode(const char *);
+#ifndef DISABLE_RUBYGEMS
+# define DISABLE_RUBYGEMS 0
+#endif
+#if DISABLE_RUBYGEMS
+#define DEFAULT_RUBYGEMS_ENABLED "disabled"
+#else
+#define DEFAULT_RUBYGEMS_ENABLED "enabled"
+#endif
-#define DISABLE_BIT(bit) (1U << disable_##bit)
-enum disable_flag_bits {
- disable_gems,
- disable_rubyopt,
+#define COMMA ,
+#define FEATURE_BIT(bit) (1U << feature_##bit)
+#define EACH_FEATURES(X, SEP) \
+ X(gems) \
+ SEP \
+ X(did_you_mean) \
+ SEP \
+ X(rubyopt) \
+ SEP \
+ X(frozen_string_literal) \
+ /* END OF FEATURES */
+#define EACH_DEBUG_FEATURES(X, SEP) \
+ X(frozen_string_literal) \
+ /* END OF DEBUG FEATURES */
+#define AMBIGUOUS_FEATURE_NAMES 0 /* no ambiguous feature names now */
+#define DEFINE_FEATURE(bit) feature_##bit
+#define DEFINE_DEBUG_FEATURE(bit) feature_debug_##bit
+enum feature_flag_bits { /* bit positions consumed by FEATURE_BIT() and DEBUG_BIT() */
+ EACH_FEATURES(DEFINE_FEATURE, COMMA), /* feature_gems, feature_did_you_mean, feature_rubyopt, feature_frozen_string_literal */
+ feature_debug_flag_first, /* position at which the debug features start */
+ feature_debug_flag_begin = feature_debug_flag_first - 1, /* step back by one so the next enumerator equals feature_debug_flag_first */
+ EACH_DEBUG_FEATURES(DEFINE_DEBUG_FEATURE, COMMA), /* feature_debug_frozen_string_literal */
+ feature_flag_count /* one past the last bit position defined above */
};
+#define DEBUG_BIT(bit) (1U << feature_debug_##bit)
+
#define DUMP_BIT(bit) (1U << dump_##bit)
+#define DEFINE_DUMP(bit) dump_##bit
+#define EACH_DUMPS(X, SEP) \
+ X(version) \
+ SEP \
+ X(copyright) \
+ SEP \
+ X(usage) \
+ SEP \
+ X(help) \
+ SEP \
+ X(yydebug) \
+ SEP \
+ X(syntax) \
+ SEP \
+ X(parsetree) \
+ SEP \
+ X(parsetree_with_comment) \
+ SEP \
+ X(insns) \
+ /* END OF DUMPS */
enum dump_flag_bits {
- dump_insns,
+ dump_version_v,
+ EACH_DUMPS(DEFINE_DUMP, COMMA),
+ dump_exit_bits = (DUMP_BIT(yydebug) | DUMP_BIT(syntax) |
+ DUMP_BIT(parsetree) | DUMP_BIT(parsetree_with_comment) |
+ DUMP_BIT(insns))
};
-struct cmdline_options {
- int sflag, xflag;
- int do_loop, do_print;
- int do_check, do_line;
- int do_split, do_search;
- int usage;
- int version;
- int copyright;
- unsigned int disable;
- int verbose;
- int yydebug;
- unsigned int setids;
- unsigned int dump;
+typedef struct ruby_cmdline_options ruby_cmdline_options_t;
+
+struct ruby_cmdline_options {
const char *script;
VALUE script_name;
VALUE e_script;
@@ -95,148 +130,159 @@ struct cmdline_options {
VALUE name;
int index;
} enc;
- } src, ext;
+ } src, ext, intern;
VALUE req_list;
+ unsigned int features;
+ unsigned int dump;
+ int safe_level;
+ int sflag, xflag;
+ unsigned int warning: 1;
+ unsigned int verbose: 1;
+ unsigned int do_loop: 1;
+ unsigned int do_print: 1;
+ unsigned int do_line: 1;
+ unsigned int do_split: 1;
+ unsigned int do_search: 1;
+ unsigned int setids: 2;
};
-static void init_ids(struct cmdline_options *);
+static void init_ids(ruby_cmdline_options_t *);
#define src_encoding_index GET_VM()->src_encoding_index
-static struct cmdline_options *
-cmdline_options_init(struct cmdline_options *opt)
+enum { /* feature bit masks built with FEATURE_BIT() */
+ COMPILATION_FEATURES = ( /* the frozen_string_literal bit together with its debug variant */
+ 0
+ | FEATURE_BIT(frozen_string_literal)
+ | FEATURE_BIT(debug_frozen_string_literal)
+ ),
+ DEFAULT_FEATURES = ( /* the value cmdline_options_init() stores in opt->features */
+ (FEATURE_BIT(debug_flag_first)-1) /* every bit below feature_debug_flag_first, i.e. all non-debug features */
+#if DISABLE_RUBYGEMS
+ & ~FEATURE_BIT(gems) /* gems bit cleared when built with DISABLE_RUBYGEMS */
+#endif
+ & ~FEATURE_BIT(frozen_string_literal) /* frozen string literals are not enabled by default */
+ )
+};
+
+static ruby_cmdline_options_t * /* Reset *opt to its initial state and return opt itself. */
+cmdline_options_init(ruby_cmdline_options_t *opt)
{
MEMZERO(opt, *opt, 1); /* clear the whole structure before filling in the non-zero defaults */
init_ids(opt);
opt->src.enc.index = src_encoding_index; /* src_encoding_index is a macro for GET_VM()->src_encoding_index */
+ opt->ext.enc.index = -1; /* presumably -1 means "not chosen yet" -- confirm against the readers of enc.index */
+ opt->intern.enc.index = -1;
+ opt->features = DEFAULT_FEATURES; /* start from the default feature mask */
return opt;
}
-struct cmdline_arguments {
- int argc;
- char **argv;
- struct cmdline_options *opt;
-};
-
-static NODE *load_file(VALUE, const char *, int, struct cmdline_options *);
-static void forbid_setid(const char *, struct cmdline_options *);
-#define forbid_setid(s) forbid_setid(s, opt)
+static rb_ast_t *load_file(VALUE parser, VALUE fname, VALUE f, int script,
+ ruby_cmdline_options_t *opt);
+static VALUE open_load_file(VALUE fname_v, int *xflag);
+static void forbid_setid(const char *, const ruby_cmdline_options_t *);
+#define forbid_setid(s) forbid_setid((s), opt)
static struct {
int argc;
char **argv;
-#if !defined(PSTAT_SETCMD) && !defined(HAVE_SETPROCTITLE)
- int len;
-#endif
} origarg;
static void
-usage(const char *name)
+show_usage_line(const char *str, unsigned int namelen, unsigned int secondlen, int help)
+{ /*
+ * Print one entry of the usage/help listing to stdout.
+ *
+ * str       - "first second description" as laid out by the M() macro in
+ *             usage(): both names and the description are joined by
+ *             single spaces.
+ * namelen   - sizeof the first name, so str + namelen is where the second
+ *             name starts.
+ * secondlen - sizeof the second name (1 when it is empty), so
+ *             str + namelen + secondlen is where the description starts.
+ * help      - non-zero for the long listing; the second name is printed
+ *             only in that case.
+ */
+ const unsigned int w = 16; /* width of the name column */
+ const int wrap = help && namelen + secondlen - 2 > w; /* names do not fit the column: put the description on its own line */
+ printf(" %.*s%-*.*s%-*s%s\n", namelen-1, str, /* first name, without its terminator */
+ (wrap ? 0 : w - namelen + 1), /* pad out to the description column unless wrapping */
+ (help ? secondlen-1 : 0), str + namelen, /* second name, suppressed (precision 0) in the short listing */
+ (wrap ? w + 3 : 0), (wrap ? "\n" : ""), /* when wrapping: a newline followed by padding */
+ str + namelen + secondlen); /* description */
+}
+
+static void
+usage(const char *name, int help)
{
/* This message really ought to be max 23 lines.
* Removed -h because the user already knows that option. Others? */
- static const char *const usage_msg[] = {
- "-0[octal] specify record separator (\\0, if no argument)",
- "-a autosplit mode with -n or -p (splits $_ into $F)",
- "-c check syntax only",
- "-Cdirectory cd to directory, before executing your script",
- "-d set debugging flags (set $DEBUG to true)",
- "-e 'command' one line of script. Several -e's allowed. Omit [programfile]",
- "-Eencoding specifies the character encoding for the program codes",
- "-Fpattern split() pattern for autosplit (-a)",
- "-i[extension] edit ARGV files in place (make backup if extension supplied)",
- "-Idirectory specify $LOAD_PATH directory (may be used more than once)",
- "-l enable line ending processing",
- "-n assume 'while gets(); ... end' loop around your script",
- "-p assume loop like -n but print line also like sed",
- "-rlibrary require the library, before executing your script",
- "-s enable some switch parsing for switches after script name",
- "-S look for the script using PATH environment variable",
- "-T[level] turn on tainting checks",
- "-v print version number, then turn on verbose mode",
- "-w turn warnings on for your script",
- "-W[level] set warning level; 0=silence, 1=medium, 2=verbose (default)",
- "-x[directory] strip off text before #!ruby line and perhaps cd to directory",
- "--copyright print the copyright",
- "--version print the version",
- NULL
+ struct message {
+ const char *str;
+ unsigned short namelen, secondlen;
};
- const char *const *p = usage_msg;
-
- printf("Usage: %s [switches] [--] [programfile] [arguments]\n", name);
- while (*p)
- printf(" %s\n", *p++);
-}
-
-VALUE rb_get_load_path(void);
-
-#ifndef CharNext /* defined as CharNext[AW] on Windows. */
-#define CharNext(p) ((p) + mblen(p, RUBY_MBCHAR_MAXSIZE))
-#endif
-
-#if defined DOSISH || defined __CYGWIN__
-static inline void
-translate_char(char *p, int from, int to)
-{
- while (*p) {
- if ((unsigned char)*p == from)
- *p = to;
- p = CharNext(p);
- }
+#define M(shortopt, longopt, desc) { \
+ shortopt " " longopt " " desc, \
+ (unsigned short)sizeof(shortopt), \
+ (unsigned short)sizeof(longopt), \
}
-#endif
+ static const struct message usage_msg[] = {
+ M("-0[octal]", "", "specify record separator (\\0, if no argument)"),
+ M("-a", "", "autosplit mode with -n or -p (splits $_ into $F)"),
+ M("-c", "", "check syntax only"),
+ M("-Cdirectory", "", "cd to directory before executing your script"),
+ M("-d", ", --debug", "set debugging flags (set $DEBUG to true)"),
+ M("-e 'command'", "", "one line of script. Several -e's allowed. Omit [programfile]"),
+ M("-Eex[:in]", ", --encoding=ex[:in]", "specify the default external and internal character encodings"),
+ M("-Fpattern", "", "split() pattern for autosplit (-a)"),
+ M("-i[extension]", "", "edit ARGV files in place (make backup if extension supplied)"),
+ M("-Idirectory", "", "specify $LOAD_PATH directory (may be used more than once)"),
+ M("-l", "", "enable line ending processing"),
+ M("-n", "", "assume 'while gets(); ... end' loop around your script"),
+ M("-p", "", "assume loop like -n but print line also like sed"),
+ M("-rlibrary", "", "require the library before executing your script"),
+ M("-s", "", "enable some switch parsing for switches after script name"),
+ M("-S", "", "look for the script using PATH environment variable"),
+ M("-T[level=1]", "", "turn on tainting checks"),
+ M("-v", ", --verbose", "print version number, then turn on verbose mode"),
+ M("-w", "", "turn warnings on for your script"),
+ M("-W[level=2]", "", "set warning level; 0=silence, 1=medium, 2=verbose"),
+ M("-x[directory]", "", "strip off text before #!ruby line and perhaps cd to directory"),
+ M("-h", "", "show this message, --help for more info"),
+ };
+ static const struct message help_msg[] = {
+ M("--copyright", "", "print the copyright"),
+ M("--dump={insns|parsetree|...}[,...]", "",
+ "dump debug information. see below for available dump list"),
+ M("--enable={gems|rubyopt|...}[,...]", ", --disable={gems|rubyopt|...}[,...]",
+ "enable or disable features. see below for available features"),
+ M("--external-encoding=encoding", ", --internal-encoding=encoding",
+ "specify the default external or internal character encoding"),
+ M("--version", "", "print the version"),
+ M("--help", "", "show this message, -h for short message"),
+ };
+ static const struct message dumps[] = {
+ M("insns", "", "instruction sequences"),
+ M("yydebug", "", "yydebug of yacc parser generator"),
+ M("parsetree", "", "AST"),
+ M("parsetree_with_comment", "", "AST with comments"),
+ };
+ static const struct message features[] = {
+ M("gems", "", "rubygems (default: "DEFAULT_RUBYGEMS_ENABLED")"),
+ M("did_you_mean", "", "did_you_mean (default: "DEFAULT_RUBYGEMS_ENABLED")"),
+ M("rubyopt", "", "RUBYOPT environment variable (default: enabled)"),
+ M("frozen-string-literal", "", "freeze all string literals (default: disabled)"),
+ };
+ int i;
+ const int num = numberof(usage_msg) - (help ? 1 : 0);
+#define SHOW(m) show_usage_line((m).str, (m).namelen, (m).secondlen, help)
-#if defined _WIN32 || defined __CYGWIN__ || defined __DJGPP__
-static VALUE
-rubylib_mangled_path(const char *s, unsigned int l)
-{
- static char *newp, *oldp;
- static int newl, oldl, notfound;
- char *ptr;
- VALUE ret;
-
- if (!newp && !notfound) {
- newp = getenv("RUBYLIB_PREFIX");
- if (newp) {
- oldp = newp = strdup(newp);
- while (*newp && !ISSPACE(*newp) && *newp != ';') {
- newp = CharNext(newp); /* Skip digits. */
- }
- oldl = newp - oldp;
- while (*newp && (ISSPACE(*newp) || *newp == ';')) {
- newp = CharNext(newp); /* Skip whitespace. */
- }
- newl = strlen(newp);
- if (newl == 0 || oldl == 0) {
- rb_fatal("malformed RUBYLIB_PREFIX");
- }
- translate_char(newp, '\\', '/');
- }
- else {
- notfound = 1;
- }
- }
- if (!newp || l < oldl || STRNCASECMP(oldp, s, oldl) != 0) {
- return rb_str_new(s, l);
- }
- ret = rb_str_new(0, l + newl - oldl);
- ptr = RSTRING_PTR(ret);
- memcpy(ptr, newp, newl);
- memcpy(ptr + newl, s + oldl, l - oldl);
- ptr[l + newl - oldl] = 0;
- return ret;
+ printf("Usage: %s [switches] [--] [programfile] [arguments]\n", name);
+ for (i = 0; i < num; ++i)
+ SHOW(usage_msg[i]);
+
+ if (!help) return;
+
+ for (i = 0; i < numberof(help_msg); ++i)
+ SHOW(help_msg[i]);
+ puts("Dump List:");
+ for (i = 0; i < numberof(dumps); ++i)
+ SHOW(dumps[i]);
+ puts("Features:");
+ for (i = 0; i < numberof(features); ++i)
+ SHOW(features[i]);
}
-static VALUE
-rubylib_mangled_path2(const char *s)
-{
- return rubylib_mangled_path(s, strlen(s));
-}
-#else
-#define rubylib_mangled_path rb_str_new
-#define rubylib_mangled_path2 rb_str_new2
-#endif
+#define rubylib_path_new rb_str_new
static void
push_include(const char *path, VALUE (*filter)(VALUE))
@@ -251,7 +297,7 @@ push_include(const char *path, VALUE (*filter)(VALUE))
p++;
if (!*p) break;
for (s = p; *s && *s != sep; s = CharNext(s));
- rb_ary_push(load_path, (*filter)(rubylib_mangled_path(p, s - p)));
+ rb_ary_push(load_path, (*filter)(rubylib_path_new(p, s - p)));
p = s;
}
}
@@ -282,7 +328,13 @@ push_include_cygwin(const char *path, VALUE (*filter)(VALUE))
p = strncpy(RSTRING_PTR(buf), p, len);
}
}
- if (cygwin_conv_to_posix_path(p, rubylib) == 0)
+#ifdef HAVE_CYGWIN_CONV_PATH
+#define CONV_TO_POSIX_PATH(p, lib) \
+ cygwin_conv_path(CCP_WIN_A_TO_POSIX|CCP_RELATIVE, (p), (lib), sizeof(lib))
+#else
+# error no cygwin_conv_path
+#endif
+ if (CONV_TO_POSIX_PATH(p, rubylib) == 0)
p = rubylib;
push_include(p, filter);
if (!*s) break;
@@ -306,11 +358,17 @@ identical_path(VALUE path)
{
return path;
}
+static VALUE /* Path filter: tag path with the locale encoding and return the same object. */
+locale_path(VALUE path)
+{
+ rb_enc_associate(path, rb_locale_encoding()); /* modifies path in place */
+ return path;
+}
void
ruby_incpush(const char *path)
{
- ruby_push_include(path, identical_path);
+ ruby_push_include(path, locale_path);
}
static VALUE
@@ -324,16 +382,13 @@ expand_include_path(VALUE path)
return rb_file_expand_path(path, Qnil);
}
-void
+void
ruby_incpush_expand(const char *path)
{
ruby_push_include(path, expand_include_path);
}
-#if defined DOSISH || defined __CYGWIN__
-#define LOAD_RELATIVE 1
-#endif
-
+#undef UTF8_PATH
#if defined _WIN32 || defined __CYGWIN__
static HMODULE libruby;
@@ -344,140 +399,288 @@ DllMain(HINSTANCE dll, DWORD reason, LPVOID reserved)
libruby = dll;
return TRUE;
}
+
+HANDLE /* Return the module handle that DllMain() stored in the file-static libruby. */
+rb_libruby_handle(void)
+{
+ return libruby;
+}
+
+static inline void /* Replace every byte equal to from with to, in place, up to the terminating NUL. */
+translit_char_bin(char *p, int from, int to)
+{
+ while (*p) {
+ if ((unsigned char)*p == from) /* compare as unsigned so bytes >= 0x80 are not seen as negative */
+ *p = to;
+ p++; /* advances one byte at a time; multibyte characters are not treated specially */
+ }
+}
+#endif
+
+#ifdef _WIN32
+# define UTF8_PATH 1
+#endif
+
+#ifndef UTF8_PATH
+# define UTF8_PATH 0
+#endif
+#if UTF8_PATH
+# define IF_UTF8_PATH(t, f) t
+#else
+# define IF_UTF8_PATH(t, f) f
+#endif
+
+#if UTF8_PATH
+static VALUE /* Convert str between the encodings from and to; this variant is compiled only when UTF8_PATH is non-zero. */
+str_conv_enc(VALUE str, rb_encoding *from, rb_encoding *to)
+{
+ return rb_str_conv_enc_opts(str, from, to,
+ ECONV_UNDEF_REPLACE|ECONV_INVALID_REPLACE, /* request replacement for undefined and invalid sequences */
+ Qnil);
+}
+#else
+# define str_conv_enc(str, from, to) (str)
#endif
+void ruby_init_loadpath_safe(int safe_level);
+
void /* Initialize the load path by delegating to ruby_init_loadpath_safe() with safe level 0. */
ruby_init_loadpath(void)
{
+ ruby_init_loadpath_safe(0);
+}
+
+#if defined(LOAD_RELATIVE) && defined(HAVE_DLADDR) && !defined(__CYGWIN__)
+static VALUE /*
+ * Return, as a Ruby string, the resolved path of the object file that
+ * dladdr() reports for addr.  An empty string is returned when dladdr()
+ * fails.
+ */
+dladdr_path(const void* addr)
+{
+ Dl_info dli;
+ VALUE fname, path;
+
+ if (!dladdr(addr, &dli)) {
+ return rb_str_new(0, 0); /* lookup failed: hand back an empty string */
+ }
+#ifdef __linux__
+ else if (origarg.argc > 0 && origarg.argv && dli.dli_fname == origarg.argv[0]) { /* compares pointers, not contents -- NOTE(review): presumably relies on dladdr() reporting argv[0] itself for the main program; confirm */
+ fname = rb_str_new_cstr("/proc/self/exe");
+ path = rb_readlink(fname, NULL); /* follow the /proc/self/exe link instead of using dli_fname */
+ }
+#endif
+ else {
+ fname = rb_str_new_cstr(dli.dli_fname);
+ path = rb_realpath_internal(Qnil, fname, 1);
+ }
+ rb_str_resize(fname, 0); /* the temporary name is no longer needed; presumably shrunk to release its buffer early */
+ return path;
+}
+#endif
+
+#define INITIAL_LOAD_PATH_MARK rb_intern_const("@gem_prelude_index")
+
+void
+ruby_init_loadpath_safe(int safe_level)
+{
VALUE load_path;
+ ID id_initial_load_path_mark;
+ const char *paths = ruby_initial_load_paths;
#if defined LOAD_RELATIVE
+# if defined HAVE_DLADDR || defined __CYGWIN__ || defined _WIN32
+# define VARIABLE_LIBPATH 1
+# else
+# define VARIABLE_LIBPATH 0
+# endif
+# if VARIABLE_LIBPATH
+ char *libpath;
+ VALUE sopath;
+# else
char libpath[MAXPATHLEN + 1];
+# endif
+ size_t baselen;
char *p;
- int rest;
#if defined _WIN32 || defined __CYGWIN__
- GetModuleFileName(libruby, libpath, sizeof libpath);
-#elif defined(DJGPP)
- extern char *__dos_argv0;
- strncpy(libpath, __dos_argv0, sizeof(libpath) - 1);
-#elif defined(__human68k__)
- extern char **_argv;
- strncpy(libpath, _argv[0], sizeof(libpath) - 1);
-#elif defined(__EMX__)
- _execname(libpath, sizeof(libpath) - 1);
+ {
+ DWORD len = RSTRING_EMBED_LEN_MAX, ret, i;
+ VALUE wsopath = rb_str_new(0, len*sizeof(WCHAR));
+ WCHAR *wlibpath;
+ while (wlibpath = (WCHAR *)RSTRING_PTR(wsopath),
+ ret = GetModuleFileNameW(libruby, wlibpath, len),
+ (ret == len))
+ {
+ rb_str_modify_expand(wsopath, len*sizeof(WCHAR));
+ rb_str_set_len(wsopath, (len += len)*sizeof(WCHAR));
+ }
+ if (!ret || ret > len) rb_fatal("failed to get module file name");
+ for (len = ret, i = 0; i < len; ++i) {
+ if (wlibpath[i] == L'\\') {
+ wlibpath[i] = L'/';
+ ret = i+1; /* chop after the last separator */
+ }
+ }
+ len = WideCharToMultiByte(CP_UTF8, 0, wlibpath, ret, NULL, 0, NULL, NULL);
+ sopath = rb_utf8_str_new(0, len);
+ libpath = RSTRING_PTR(sopath);
+ WideCharToMultiByte(CP_UTF8, 0, wlibpath, ret, libpath, len, NULL, NULL);
+ rb_str_resize(wsopath, 0);
+ }
+#elif defined(HAVE_DLADDR)
+ sopath = dladdr_path((void *)(VALUE)expand_include_path);
+ libpath = RSTRING_PTR(sopath);
#endif
+#if !VARIABLE_LIBPATH
libpath[sizeof(libpath) - 1] = '\0';
-#if defined DOSISH
- translate_char(libpath, '\\', '/');
+#endif
+#if defined DOSISH && !defined _WIN32
+ translit_char(libpath, '\\', '/');
#elif defined __CYGWIN__
{
- char rubylib[FILENAME_MAX];
- cygwin_conv_to_posix_path(libpath, rubylib);
- strncpy(libpath, rubylib, sizeof(libpath));
+ const int win_to_posix = CCP_WIN_A_TO_POSIX | CCP_RELATIVE;
+ size_t newsize = cygwin_conv_path(win_to_posix, libpath, 0, 0);
+ if (newsize > 0) {
+ VALUE rubylib = rb_str_new(0, newsize);
+ p = RSTRING_PTR(rubylib);
+ if (cygwin_conv_path(win_to_posix, libpath, p, newsize) == 0) {
+ rb_str_resize(sopath, 0);
+ sopath = rubylib;
+ libpath = p;
+ }
+ }
}
#endif
p = strrchr(libpath, '/');
if (p) {
- *p = 0;
- if (p - libpath > 3 && !STRCASECMP(p - 4, "/bin")) {
- p -= 4;
- *p = 0;
+ static const char bindir[] = "/bin";
+#ifdef LIBDIR_BASENAME
+ static const char libdir[] = "/"LIBDIR_BASENAME;
+#else
+ static const char libdir[] = "/lib";
+#endif
+ const ptrdiff_t bindir_len = (ptrdiff_t)sizeof(bindir) - 1;
+ const ptrdiff_t libdir_len = (ptrdiff_t)sizeof(libdir) - 1;
+
+#ifdef ENABLE_MULTIARCH
+ char *p2 = NULL;
+
+ multiarch:
+#endif
+ if (p - libpath >= bindir_len && !STRNCASECMP(p - bindir_len, bindir, bindir_len)) {
+ p -= bindir_len;
+ }
+ else if (p - libpath >= libdir_len && !strncmp(p - libdir_len, libdir, libdir_len)) {
+ p -= libdir_len;
+ }
+#ifdef ENABLE_MULTIARCH
+ else if (p2) {
+ p = p2;
}
+ else {
+ p2 = p;
+ p = rb_enc_path_last_separator(libpath, p, rb_ascii8bit_encoding());
+ if (p) goto multiarch;
+ p = p2;
+ }
+#endif
+#if !VARIABLE_LIBPATH
+ *p = 0;
+#endif
}
+#if !VARIABLE_LIBPATH
else {
- strcpy(libpath, ".");
+ strlcpy(libpath, ".", sizeof(libpath));
p = libpath + 1;
}
+ baselen = p - libpath;
+#define PREFIX_PATH() rb_str_new(libpath, baselen)
+#else
+ baselen = p - libpath;
+ rb_str_resize(sopath, baselen);
+ libpath = RSTRING_PTR(sopath);
+#define PREFIX_PATH() sopath
+#endif
- rest = sizeof(libpath) - 1 - (p - libpath);
+#define BASEPATH() rb_str_buf_cat(rb_str_buf_new(baselen+len), libpath, baselen)
-#define RUBY_RELATIVE(path) (strncpy(p, (path), rest), libpath)
+#define RUBY_RELATIVE(path, len) rb_str_buf_cat(BASEPATH(), (path), (len))
#else
-#define RUBY_RELATIVE(path) (path)
+ const size_t exec_prefix_len = strlen(ruby_exec_prefix);
+#define RUBY_RELATIVE(path, len) rubylib_path_new((path), (len))
+#define PREFIX_PATH() RUBY_RELATIVE(ruby_exec_prefix, exec_prefix_len)
#endif
-#define incpush(path) rb_ary_push(load_path, rubylib_mangled_path2(path))
load_path = GET_VM()->load_path;
- if (rb_safe_level() == 0) {
- ruby_incpush(getenv("RUBYLIB"));
+ if (safe_level == 0) {
+ ruby_push_include(getenv("RUBYLIB"), identical_path);
}
-#ifdef RUBY_SEARCH_PATH
- incpush(RUBY_RELATIVE(RUBY_SEARCH_PATH));
-#endif
-
- incpush(RUBY_RELATIVE(RUBY_SITE_LIB2));
-#ifdef RUBY_SITE_THIN_ARCHLIB
- incpush(RUBY_RELATIVE(RUBY_SITE_THIN_ARCHLIB));
-#endif
- incpush(RUBY_RELATIVE(RUBY_SITE_ARCHLIB));
- incpush(RUBY_RELATIVE(RUBY_SITE_LIB));
-
- incpush(RUBY_RELATIVE(RUBY_VENDOR_LIB2));
-#ifdef RUBY_VENDOR_THIN_ARCHLIB
- incpush(RUBY_RELATIVE(RUBY_VENDOR_THIN_ARCHLIB));
-#endif
- incpush(RUBY_RELATIVE(RUBY_VENDOR_ARCHLIB));
- incpush(RUBY_RELATIVE(RUBY_VENDOR_LIB));
-
- incpush(RUBY_RELATIVE(RUBY_LIB));
-#ifdef RUBY_THIN_ARCHLIB
- incpush(RUBY_RELATIVE(RUBY_THIN_ARCHLIB));
-#endif
- incpush(RUBY_RELATIVE(RUBY_ARCHLIB));
-
- if (rb_safe_level() == 0) {
- incpush(".");
+ id_initial_load_path_mark = INITIAL_LOAD_PATH_MARK;
+ while (*paths) {
+ size_t len = strlen(paths);
+ VALUE path = RUBY_RELATIVE(paths, len);
+ rb_ivar_set(path, id_initial_load_path_mark, path);
+ rb_ary_push(load_path, path);
+ paths += len + 1;
}
+
+ rb_const_set(rb_cObject, rb_intern_const("TMP_RUBY_PREFIX"), rb_obj_freeze(PREFIX_PATH()));
}
static void
-add_modules(struct cmdline_options *opt, const char *mod)
+add_modules(VALUE *req_list, const char *mod)
{
- VALUE list = opt->req_list;
+ VALUE list = *req_list;
+ VALUE feature;
if (!list) {
- opt->req_list = list = rb_ary_new();
- RBASIC(list)->klass = 0;
+ *req_list = list = rb_ary_new();
+ RBASIC_CLEAR_CLASS(list);
}
- rb_ary_push(list, rb_obj_freeze(rb_str_new2(mod)));
+ feature = rb_str_new2(mod);
+ RBASIC_CLEAR_CLASS(feature);
+ rb_ary_push(list, feature);
}
-extern void Init_ext(void);
-extern VALUE rb_vm_top_self(void);
-
static void
-require_libraries(struct cmdline_options *opt)
+require_libraries(VALUE *req_list)
{
- VALUE list = opt->req_list;
+ VALUE list = *req_list;
+ VALUE self = rb_vm_top_self();
ID require;
+ rb_encoding *extenc = rb_default_external_encoding();
- Init_ext(); /* should be called here for some reason :-( */
CONST_ID(require, "require");
while (list && RARRAY_LEN(list) > 0) {
VALUE feature = rb_ary_shift(list);
- rb_funcall2(rb_vm_top_self(), require, 1, &feature);
+ rb_enc_associate(feature, extenc);
+ RBASIC_SET_CLASS_RAW(feature, rb_cString);
+ OBJ_FREEZE(feature);
+ rb_funcallv(self, require, 1, &feature);
}
- opt->req_list = 0;
+ *req_list = 0;
+}
+
+static const struct rb_block* /* Return the address of the block member embedded in the binding bind. */
+toplevel_context(rb_binding_t *bind)
+{
+ return &bind->block;
+}
static void
-process_sflag(struct cmdline_options *opt)
+process_sflag(int *sflag)
{
- if (opt->sflag) {
+ if (*sflag > 0) {
long n;
- VALUE *args;
+ const VALUE *args;
VALUE argv = rb_argv;
n = RARRAY_LEN(argv);
- args = RARRAY_PTR(argv);
+ args = RARRAY_CONST_PTR(argv);
while (n > 0) {
VALUE v = *args++;
char *s = StringValuePtr(v);
char *p;
- int hyphen = Qfalse;
+ int hyphen = FALSE;
if (s[0] != '-')
break;
@@ -494,7 +697,7 @@ process_sflag(struct cmdline_options *opt)
break;
}
if (*p == '-') {
- hyphen = Qtrue;
+ hyphen = TRUE;
}
else if (*p != '_' && !ISALNUM(*p)) {
VALUE name_error[2];
@@ -523,110 +726,227 @@ process_sflag(struct cmdline_options *opt)
while (n--) {
rb_ary_shift(argv);
}
+ *sflag = -1;
}
- opt->sflag = 0;
}
-NODE *rb_parser_append_print(VALUE, NODE *);
-NODE *rb_parser_while_loop(VALUE, NODE *, int, int);
-static int proc_options(int argc, char **argv, struct cmdline_options *opt);
+static long proc_options(long argc, char **argv, ruby_cmdline_options_t *opt, int envopt);
-static char *
-moreswitches(const char *s, struct cmdline_options *opt)
+static void
+moreswitches(const char *s, ruby_cmdline_options_t *opt, int envopt)
{
- int argc;
- char *argv[3];
- const char *p = s;
-
- argc = 2;
- argv[0] = argv[2] = 0;
- while (*s && !ISSPACE(*s))
- s++;
- argv[1] = ALLOCA_N(char, s - p + 2);
- argv[1][0] = '-';
- strncpy(argv[1] + 1, p, s - p);
- argv[1][s - p + 1] = '\0';
- proc_options(argc, argv, opt);
- while (*s && ISSPACE(*s))
- s++;
- return (char *)s;
+ long argc, i, len;
+ char **argv, *p;
+ const char *ap = 0;
+ VALUE argstr, argary;
+
+ while (ISSPACE(*s)) s++;
+ if (!*s) return;
+ argstr = rb_str_tmp_new((len = strlen(s)) + (envopt!=0));
+ argary = rb_str_tmp_new(0);
+
+ p = RSTRING_PTR(argstr);
+ if (envopt) *p++ = ' ';
+ memcpy(p, s, len + 1);
+ ap = 0;
+ rb_str_cat(argary, (char *)&ap, sizeof(ap));
+ while (*p) {
+ ap = p;
+ rb_str_cat(argary, (char *)&ap, sizeof(ap));
+ while (*p && !ISSPACE(*p)) ++p;
+ if (!*p) break;
+ *p++ = '\0';
+ while (ISSPACE(*p)) ++p;
+ }
+ argc = RSTRING_LEN(argary) / sizeof(ap);
+ ap = 0;
+ rb_str_cat(argary, (char *)&ap, sizeof(ap));
+ argv = (char **)RSTRING_PTR(argary);
+
+ while ((i = proc_options(argc, argv, opt, envopt)) > 1 && envopt && (argc -= i) > 0) {
+ argv += i;
+ if (**argv != '-') {
+ *--*argv = '-';
+ }
+ if ((*argv)[1]) {
+ ++argc;
+ --argv;
+ }
+ }
+
+ /* get rid of GC */
+ rb_str_resize(argary, 0);
+ rb_str_resize(argstr, 0);
+}
+
+/*
+ * Tests whether the token made of the first +len+ bytes of +str+ selects
+ * the option called +name+.
+ *
+ * - Input letters are folded with TOLOWER() before the comparison, so
+ *   +name+ is expected to be spelled in lower case.
+ * - The token may stop early: running out of input (either +len+ bytes
+ *   consumed or a NUL reached) while everything so far matched counts as
+ *   a match.
+ * - '-' and '_' are interchangeable as word separators, and each word of
+ *   +name+ may be abbreviated before a separator ("frozen-str" matches
+ *   "frozen_string_literal").
+ *
+ * Returns 1 on a match and 0 otherwise; an empty token never matches.
+ *
+ * +str+ is not required to be NUL-terminated at +len+: it may be one item
+ * of a comma-separated list, so every consumed byte, separators included,
+ * has to be charged against +len+.
+ */
+static int
+name_match_p(const char *name, const char *str, size_t len)
+{
+    if (len == 0) return 0;
+    do {
+        /* consume the run of characters that match literally */
+        while (TOLOWER(*str) == *name) {
+            if (!--len || !*++str) return 1;
+            ++name;
+        }
+        /* a mismatch is acceptable only at a word separator in the input */
+        if (*str != '-' && *str != '_') return 0;
+        /* skip the unmatched rest of the current word of name */
+        while (ISALNUM(*name)) name++;
+        if (*name != '-' && *name != '_') return 0;
+        ++name;
+        ++str;
+        /*
+         * The separator belongs to the token as well.  len is at least 1
+         * here (the loop above returns as soon as it reaches 0), so this
+         * cannot wrap.  Without it the scan ran past the end of the token
+         * into the following list item.
+         */
+        --len;
+    } while (len > 0);
+    /* the token ended right after a separator */
+    return !*name;
+}
#define NAME_MATCH_P(name, str, len) \
- ((len) < sizeof(name) && strncmp((str), name, (len)) == 0)
+ ((len) < (int)sizeof(name) && name_match_p((name), (str), (len)))
#define UNSET_WHEN(name, bit, str, len) \
- if (NAME_MATCH_P(name, str, len)) { \
+ if (NAME_MATCH_P((name), (str), (len))) { \
*(unsigned int *)arg &= ~(bit); \
return; \
}
#define SET_WHEN(name, bit, str, len) \
- if (NAME_MATCH_P(name, str, len)) { \
+ if (NAME_MATCH_P((name), (str), (len))) { \
*(unsigned int *)arg |= (bit); \
return; \
}
+#define LITERAL_NAME_ELEMENT(name) #name
+
static void
-enable_option(const char *str, int len, void *arg)
+feature_option(const char *str, int len, void *arg, const unsigned int enable)
{
-#define UNSET_WHEN_DISABLE(bit) UNSET_WHEN(#bit, DISABLE_BIT(bit), str, len)
- UNSET_WHEN_DISABLE(gems);
- UNSET_WHEN_DISABLE(rubyopt);
+ static const char list[] = EACH_FEATURES(LITERAL_NAME_ELEMENT, ", ");
+ unsigned int *argp = arg;
+ unsigned int mask = ~0U;
+#if AMBIGUOUS_FEATURE_NAMES
+ unsigned int set = 0U;
+ int matched = 0;
+#define SET_FEATURE(bit) \
+ if (NAME_MATCH_P(#bit, str, len)) {set |= mask = FEATURE_BIT(bit); ++matched;}
+#else
+#define SET_FEATURE(bit) \
+ if (NAME_MATCH_P(#bit, str, len)) {mask = FEATURE_BIT(bit); goto found;}
+#endif
+ EACH_FEATURES(SET_FEATURE, ;);
if (NAME_MATCH_P("all", str, len)) {
- *(unsigned int *)arg = 0U;
+ found:
+ *argp = (*argp & ~mask) | (mask & enable);
return;
}
- rb_warn("unknown argument for --enable: `%.*s'", len, str);
+#if AMBIGUOUS_FEATURE_NAMES
+ if (matched == 1) goto found;
+ if (matched > 1) {
+ VALUE mesg = rb_sprintf("ambiguous feature: `%.*s' (", len, str);
+#define ADD_FEATURE_NAME(bit) \
+ if (FEATURE_BIT(bit) & set) { \
+ rb_str_cat_cstr(mesg, #bit); \
+ if (--matched) rb_str_cat_cstr(mesg, ", "); \
+ }
+ EACH_FEATURES(ADD_FEATURE_NAME, ;);
+ rb_str_cat_cstr(mesg, ")");
+ rb_exc_raise(rb_exc_new_str(rb_eRuntimeError, mesg));
+#undef ADD_FEATURE_NAME
+ }
+#endif
+ rb_warn("unknown argument for --%s: `%.*s'",
+ enable ? "enable" : "disable", len, str);
+ rb_warn("features are [%.*s].", (int)strlen(list), list);
+}
+
+static void /* Handler for one --enable item: forwards to feature_option() asking for the bits to be set. */
+enable_option(const char *str, int len, void *arg)
+{
+ feature_option(str, len, arg, ~0U); /* enable = all ones, so the selected mask bits end up set */
+}
static void
disable_option(const char *str, int len, void *arg)
{
-#define SET_WHEN_DISABLE(bit) SET_WHEN(#bit, DISABLE_BIT(bit), str, len)
- SET_WHEN_DISABLE(gems);
- SET_WHEN_DISABLE(rubyopt);
- if (NAME_MATCH_P("all", str, len)) {
- *(unsigned int *)arg = ~0U;
- return;
- }
- rb_warn("unknown argument for --disable: `%.*s'", len, str);
+ feature_option(str, len, arg, 0U);
+}
+
+RUBY_EXTERN const int ruby_patchlevel;
+int ruby_env_debug_option(const char *str, int len, void *arg);
+
+static void /*
+ * Handler for one --debug item: str/len is the item text and arg points
+ * to the unsigned int feature mask to update.  Warns when the item is
+ * not recognized.
+ */
+debug_option(const char *str, int len, void *arg)
+{
+ static const char list[] = EACH_DEBUG_FEATURES(LITERAL_NAME_ELEMENT, ", "); /* names listed in the warning below */
+#define SET_WHEN_DEBUG(bit) SET_WHEN(#bit, DEBUG_BIT(bit), str, len)
+ EACH_DEBUG_FEATURES(SET_WHEN_DEBUG, ;); /* SET_WHEN sets the bit in *arg and returns from this function on a match */
+#ifdef RUBY_DEVEL
+ if (ruby_patchlevel < 0 && ruby_env_debug_option(str, len, 0)) return; /* tried only when ruby_patchlevel is negative */
+#endif
+ rb_warn("unknown argument for --debug: `%.*s'", len, str);
+ rb_warn("debug features are [%.*s].", (int)strlen(list), list);
+}
static void
dump_option(const char *str, int len, void *arg)
{
+ static const char list[] = EACH_DUMPS(LITERAL_NAME_ELEMENT, ", ");
#define SET_WHEN_DUMP(bit) SET_WHEN(#bit, DUMP_BIT(bit), str, len)
- SET_WHEN_DUMP(insns);
- rb_warn("don't know how to dump `%.*s', (insns)", len, str);
+ EACH_DUMPS(SET_WHEN_DUMP, ;);
+ rb_warn("don't know how to dump `%.*s',", len, str);
+ rb_warn("but only [%.*s].", (int)strlen(list), list);
}
-static int
-proc_options(int argc, char **argv, struct cmdline_options *opt)
+static void /*
+ * Record an encoding name in *name, refusing to replace a different name
+ * that was stored earlier.
+ *
+ * type - label used in the error message
+ * name - slot holding the stored name; a zero value means nothing has
+ *        been stored yet
+ * e    - encoding name text
+ * elen - length of e, or 0 to measure it with strlen()
+ *
+ * Raises RuntimeError when *name is already set and casecmp between the
+ * new and the stored name does not return 0.
+ */
+set_option_encoding_once(const char *type, VALUE *name, const char *e, long elen)
+{
+ VALUE ename;
+
+ if (!elen) elen = strlen(e);
+ ename = rb_str_new(e, elen);
+
+ if (*name &&
+ rb_funcall(ename, rb_intern("casecmp"), 1, *name) != INT2FIX(0)) { /* anything other than a casecmp result of 0 is rejected */
+ rb_raise(rb_eRuntimeError,
+ "%s already set to %"PRIsVALUE, type, *name);
+ }
+ *name = ename; /* first assignment, or a re-assignment of the same name */
+}
+
+#define set_internal_encoding_once(opt, e, elen) \
+ set_option_encoding_once("default_internal", &(opt)->intern.enc.name, (e), (elen))
+#define set_external_encoding_once(opt, e, elen) \
+ set_option_encoding_once("default_external", &(opt)->ext.enc.name, (e), (elen))
+#define set_source_encoding_once(opt, e, elen) \
+ set_option_encoding_once("source", &(opt)->src.enc.name, (e), (elen))
+
+static long
+proc_options(long argc, char **argv, ruby_cmdline_options_t *opt, int envopt)
{
- int n, argc0 = argc;
+ long n, argc0 = argc;
const char *s;
+ int warning = opt->warning;
- if (argc == 0)
+ if (argc <= 0 || !argv)
return 0;
for (argc--, argv++; argc > 0; argc--, argv++) {
- if (argv[0][0] != '-' || !argv[0][1])
+ const char *const arg = argv[0];
+ if (!arg || arg[0] != '-' || !arg[1])
break;
- s = argv[0] + 1;
+ s = arg + 1;
reswitch:
switch (*s) {
case 'a':
- opt->do_split = Qtrue;
+ if (envopt) goto noenvopt;
+ opt->do_split = TRUE;
s++;
goto reswitch;
case 'p':
- opt->do_print = Qtrue;
+ if (envopt) goto noenvopt;
+ opt->do_print = TRUE;
/* through */
case 'n':
- opt->do_loop = Qtrue;
+ if (envopt) goto noenvopt;
+ opt->do_loop = TRUE;
s++;
goto reswitch;
@@ -637,7 +957,8 @@ proc_options(int argc, char **argv, struct cmdline_options *opt)
goto reswitch;
case 'y':
- opt->yydebug = 1;
+ if (envopt) goto noenvopt;
+ opt->dump |= DUMP_BIT(yydebug);
s++;
goto reswitch;
@@ -646,16 +967,19 @@ proc_options(int argc, char **argv, struct cmdline_options *opt)
s++;
goto reswitch;
}
- ruby_show_version();
+ opt->dump |= DUMP_BIT(version_v);
opt->verbose = 1;
case 'w':
- ruby_verbose = Qtrue;
+ if (!opt->warning) {
+ warning = 1;
+ ruby_verbose = Qtrue;
+ }
s++;
goto reswitch;
case 'W':
{
- int numlen;
+ size_t numlen;
int v = 2; /* -W as -W2 */
if (*++s) {
@@ -664,56 +988,62 @@ proc_options(int argc, char **argv, struct cmdline_options *opt)
v = 1;
s += numlen;
}
- switch (v) {
- case 0:
- ruby_verbose = Qnil;
- break;
- case 1:
- ruby_verbose = Qfalse;
- break;
- default:
- ruby_verbose = Qtrue;
- break;
+ if (!opt->warning) {
+ switch (v) {
+ case 0:
+ ruby_verbose = Qnil;
+ break;
+ case 1:
+ ruby_verbose = Qfalse;
+ break;
+ default:
+ ruby_verbose = Qtrue;
+ break;
+ }
}
+ warning = 1;
}
goto reswitch;
case 'c':
- opt->do_check = Qtrue;
+ if (envopt) goto noenvopt;
+ opt->dump |= DUMP_BIT(syntax);
s++;
goto reswitch;
case 's':
+ if (envopt) goto noenvopt;
forbid_setid("-s");
- opt->sflag = 1;
+ if (!opt->sflag) opt->sflag = 1;
s++;
goto reswitch;
case 'h':
- usage(origarg.argv[0]);
- rb_exit(EXIT_SUCCESS);
- break;
+ if (envopt) goto noenvopt;
+ opt->dump |= DUMP_BIT(usage);
+ goto switch_end;
case 'l':
- opt->do_line = Qtrue;
+ if (envopt) goto noenvopt;
+ opt->do_line = TRUE;
rb_output_rs = rb_rs;
s++;
goto reswitch;
case 'S':
+ if (envopt) goto noenvopt;
forbid_setid("-S");
- opt->do_search = Qtrue;
+ opt->do_search = TRUE;
s++;
goto reswitch;
case 'e':
+ if (envopt) goto noenvopt;
forbid_setid("-e");
if (!*++s) {
- s = argv[1];
- argc--, argv++;
- }
- if (!s) {
- rb_raise(rb_eRuntimeError, "no code specified for -e");
+ if (!--argc)
+ rb_raise(rb_eRuntimeError, "no code specified for -e");
+ s = *++argv;
}
if (!opt->e_script) {
opt->e_script = rb_str_new(0, 0);
@@ -727,21 +1057,24 @@ proc_options(int argc, char **argv, struct cmdline_options *opt)
case 'r':
forbid_setid("-r");
if (*++s) {
- add_modules(opt, s);
+ add_modules(&opt->req_list, s);
}
- else if (argv[1]) {
- add_modules(opt, argv[1]);
+ else if (argc > 1) {
+ add_modules(&opt->req_list, argv[1]);
argc--, argv++;
}
break;
case 'i':
+ if (envopt) goto noenvopt;
forbid_setid("-i");
ruby_set_inplace_mode(s + 1);
break;
case 'x':
- opt->xflag = Qtrue;
+ if (envopt) goto noenvopt;
+ forbid_setid("-x");
+ opt->xflag = TRUE;
s++;
if (*s && chdir(s) < 0) {
rb_fatal("Can't chdir to %s", s);
@@ -750,12 +1083,8 @@ proc_options(int argc, char **argv, struct cmdline_options *opt)
case 'C':
case 'X':
- s++;
- if (!*s) {
- s = argv[1];
- argc--, argv++;
- }
- if (!s || !*s) {
+ if (envopt) goto noenvopt;
+ if (!*++s && (!--argc || !(s = *++argv) || !*s)) {
rb_fatal("Can't chdir");
}
if (chdir(s) < 0) {
@@ -764,15 +1093,23 @@ proc_options(int argc, char **argv, struct cmdline_options *opt)
break;
case 'F':
+ if (envopt) goto noenvopt;
if (*++s) {
rb_fs = rb_reg_new(s, strlen(s), 0);
}
break;
case 'E':
- if (!*++s) goto next_encoding;
+ if (!*++s && (!--argc || !(s = *++argv))) {
+ rb_raise(rb_eRuntimeError, "missing argument for -E");
+ }
goto encoding;
+ case 'U':
+ set_internal_encoding_once(opt, "UTF-8", 0);
+ ++s;
+ goto reswitch;
+
case 'K':
if (*++s) {
const char *enc_name = 0;
@@ -792,7 +1129,8 @@ proc_options(int argc, char **argv, struct cmdline_options *opt)
}
if (enc_name) {
opt->src.enc.name = rb_str_new2(enc_name);
- opt->ext.enc.name = opt->src.enc.name;
+ if (!opt->ext.enc.name)
+ opt->ext.enc.name = opt->src.enc.name;
}
s++;
}
@@ -800,7 +1138,7 @@ proc_options(int argc, char **argv, struct cmdline_options *opt)
case 'T':
{
- int numlen;
+ size_t numlen;
int v = 1;
if (*++s) {
@@ -809,7 +1147,7 @@ proc_options(int argc, char **argv, struct cmdline_options *opt)
v = 1;
s += numlen;
}
- rb_set_safe_level(v);
+ if (v > opt->safe_level) opt->safe_level = v;
}
goto reswitch;
@@ -817,15 +1155,16 @@ proc_options(int argc, char **argv, struct cmdline_options *opt)
forbid_setid("-I");
if (*++s)
ruby_incpush_expand(s);
- else if (argv[1]) {
+ else if (argc > 1) {
ruby_incpush_expand(argv[1]);
argc--, argv++;
}
break;
case '0':
+ if (envopt) goto noenvopt;
{
- int numlen;
+ size_t numlen;
int v;
char c;
@@ -834,7 +1173,7 @@ proc_options(int argc, char **argv, struct cmdline_options *opt)
if (v > 0377)
rb_rs = Qnil;
else if (v == 0 && numlen >= 2) {
- rb_rs = rb_str_new2("\n\n");
+ rb_rs = rb_str_new2("");
}
else {
c = v & 0xff;
@@ -849,52 +1188,97 @@ proc_options(int argc, char **argv, struct cmdline_options *opt)
goto switch_end;
}
s++;
- if (strcmp("copyright", s) == 0)
- opt->copyright = 1;
- else if (strcmp("debug", s) == 0) {
- ruby_debug = Qtrue;
- ruby_verbose = Qtrue;
- }
- else if (strncmp("enable", s, n = 6) == 0 &&
- (!s[n] || s[n] == '-' || s[n] == '=')) {
- if ((s += n + 1)[-1] ? !*s : (!--argc || !(s = *++argv))) {
- rb_raise(rb_eRuntimeError, "missing argument for --enable");
- }
- ruby_each_words(s, enable_option, &opt->disable);
+
+# define is_option_end(c, allow_hyphen) \
+ (!(c) || ((allow_hyphen) && (c) == '-') || (c) == '=')
+# define check_envopt(name, allow_envopt) \
+ (((allow_envopt) || !envopt) ? (void)0 : \
+ rb_raise(rb_eRuntimeError, "invalid switch in RUBYOPT: --" name))
+# define need_argument(name, s, needs_arg, next_arg) \
+ ((*(s) ? !*++(s) : (next_arg) && (!argc || !((s) = argv[1]) || (--argc, ++argv, 0))) && (needs_arg) ? \
+ rb_raise(rb_eRuntimeError, "missing argument for --" name) \
+ : (void)0)
+# define is_option_with_arg(name, allow_hyphen, allow_envopt) \
+ is_option_with_optarg(name, allow_hyphen, allow_envopt, Qtrue, Qtrue)
+# define is_option_with_optarg(name, allow_hyphen, allow_envopt, needs_arg, next_arg) \
+ (strncmp((name), s, n = sizeof(name) - 1) == 0 && is_option_end(s[n], (allow_hyphen)) ? \
+ (check_envopt(name, (allow_envopt)), s += n, \
+ need_argument(name, s, needs_arg, next_arg), 1) : 0)
+
+ if (strcmp("copyright", s) == 0) {
+ if (envopt) goto noenvopt_long;
+ opt->dump |= DUMP_BIT(copyright);
}
- else if (strncmp("disable", s, n = 7) == 0 &&
- (!s[n] || s[n] == '-' || s[n] == '=')) {
- if ((s += n + 1)[-1] ? !*s : (!--argc || !(s = *++argv))) {
- rb_raise(rb_eRuntimeError, "missing argument for --disable");
+ else if (is_option_with_optarg("debug", Qtrue, Qtrue, Qfalse, Qfalse)) {
+ if (s && *s) {
+ ruby_each_words(s, debug_option, &opt->features);
}
- ruby_each_words(s, disable_option, &opt->disable);
- }
- else if (strncmp("encoding", s, n = 8) == 0 && (!s[n] || s[n] == '=')) {
- s += n;
- if (!*s++) {
- next_encoding:
- if (!--argc || !(s = *++argv)) {
- rb_raise(rb_eRuntimeError, "missing argument for --encoding");
- }
+ else {
+ ruby_debug = Qtrue;
+ ruby_verbose = Qtrue;
}
+ }
+ else if (is_option_with_arg("enable", Qtrue, Qtrue)) {
+ ruby_each_words(s, enable_option, &opt->features);
+ }
+ else if (is_option_with_arg("disable", Qtrue, Qtrue)) {
+ ruby_each_words(s, disable_option, &opt->features);
+ }
+ else if (is_option_with_arg("encoding", Qfalse, Qtrue)) {
+ char *p;
encoding:
- opt->ext.enc.name = rb_str_new2(s);
+ do {
+# define set_encoding_part(type) \
+ if (!(p = strchr(s, ':'))) { \
+ set_##type##_encoding_once(opt, s, 0); \
+ break; \
+ } \
+ else if (p > s) { \
+ set_##type##_encoding_once(opt, s, p-s); \
+ }
+ set_encoding_part(external);
+ if (!*(s = ++p)) break;
+ set_encoding_part(internal);
+ if (!*(s = ++p)) break;
+#if defined ALLOW_DEFAULT_SOURCE_ENCODING && ALLOW_DEFAULT_SOURCE_ENCODING
+ set_encoding_part(source);
+ if (!*(s = ++p)) break;
+#endif
+ rb_raise(rb_eRuntimeError, "extra argument for %s: %s",
+ (arg[1] == '-' ? "--encoding" : "-E"), s);
+# undef set_encoding_part
+ } while (0);
+ }
+ else if (is_option_with_arg("internal-encoding", Qfalse, Qtrue)) {
+ set_internal_encoding_once(opt, s, 0);
+ }
+ else if (is_option_with_arg("external-encoding", Qfalse, Qtrue)) {
+ set_external_encoding_once(opt, s, 0);
+ }
+#if defined ALLOW_DEFAULT_SOURCE_ENCODING && ALLOW_DEFAULT_SOURCE_ENCODING
+ else if (is_option_with_arg("source-encoding", Qfalse, Qtrue)) {
+ set_source_encoding_once(opt, s, 0);
+ }
+#endif
+ else if (strcmp("version", s) == 0) {
+ if (envopt) goto noenvopt_long;
+ opt->dump |= DUMP_BIT(version);
}
- else if (strcmp("version", s) == 0)
- opt->version = 1;
else if (strcmp("verbose", s) == 0) {
opt->verbose = 1;
ruby_verbose = Qtrue;
}
- else if (strcmp("yydebug", s) == 0)
- opt->yydebug = 1;
- else if (strncmp("dump", s, n = 4) == 0 && (!s[n] || s[n] == '=')) {
- if (!(s += n + 1)[-1] && (!--argc || !(s = *++argv)) && *s != '-') break;
+ else if (strcmp("yydebug", s) == 0) {
+ if (envopt) goto noenvopt_long;
+ opt->dump |= DUMP_BIT(yydebug);
+ }
+ else if (is_option_with_arg("dump", Qfalse, Qfalse)) {
ruby_each_words(s, dump_option, &opt->dump);
}
else if (strcmp("help", s) == 0) {
- usage(origarg.argv[0]);
- rb_exit(EXIT_SUCCESS);
+ if (envopt) goto noenvopt_long;
+ opt->dump |= DUMP_BIT(help);
+ goto switch_end;
}
else {
rb_raise(rb_eRuntimeError,
@@ -921,22 +1305,35 @@ proc_options(int argc, char **argv, struct cmdline_options *opt)
}
goto switch_end;
+ noenvopt:
+ /* "EIdvwWrKU" only */
+ rb_raise(rb_eRuntimeError, "invalid switch in RUBYOPT: -%c", *s);
+ break;
+
+ noenvopt_long:
+ rb_raise(rb_eRuntimeError, "invalid switch in RUBYOPT: --%s", s);
+ break;
+
case 0:
break;
+# undef is_option_end
+# undef check_envopt
+# undef need_argument
+# undef is_option_with_arg
+# undef is_option_with_optarg
}
}
switch_end:
+ if (warning) opt->warning = warning;
return argc0 - argc;
}
-void Init_prelude(void);
-
static void
-ruby_init_gems(int enable)
+ruby_init_prelude(void) /* Run Init_prelude(), then remove the TMP_RUBY_PREFIX constant from Object. */
{
- if (enable) rb_define_module("Gem");
Init_prelude();
+ rb_const_remove(rb_cObject, rb_intern_const("TMP_RUBY_PREFIX")); /* NOTE(review): presumably only needed while the prelude runs -- confirm */
}
static int
@@ -954,95 +1351,180 @@ opt_enc_index(VALUE enc_name)
return i;
}
-#define rb_progname (GET_VM()->progname)
+#define rb_progname (GET_VM()->progname) /* progname member of the VM returned by GET_VM() */
+#define rb_orig_progname (GET_VM()->orig_progname) /* orig_progname member of the same VM; proc_argv0() returns it */
VALUE rb_argv0;
static VALUE
-process_options(VALUE arg)
+false_value(void) /* Getter that always returns Qfalse; selected by rb_define_readonly_boolean. */
+{
+ return Qfalse;
+}
+
+static VALUE
+true_value(void) /* Getter that always returns Qtrue; selected by rb_define_readonly_boolean. */
+{
+ return Qtrue;
+}
+
+#define rb_define_readonly_boolean(name, val) \
+ rb_define_virtual_variable((name), (val) ? true_value : false_value, 0) /* getter is picked once from val; the third (setter) argument is 0 */
+
+static VALUE
+uscore_get(void) /* Return the value from rb_lastline_get(); raise TypeError unless it is a String. */
+{
+ VALUE line;
+
+ line = rb_lastline_get();
+ if (!RB_TYPE_P(line, T_STRING)) {
+ rb_raise(rb_eTypeError, "$_ value need to be String (%s given)",
+ NIL_P(line) ? "nil" : rb_obj_classname(line)); /* nil is reported by name, anything else by its class name */
+ }
+ return line;
+}
+
+/*
+ * call-seq:
+ * sub(pattern, replacement) -> $_
+ * sub(pattern) {|...| block } -> $_
+ *
+ * Equivalent to <code>$_.sub(<i>args</i>)</code>, except that
+ * <code>$_</code> will be updated if substitution occurs.
+ * Available only when -p/-n command line option specified.
+ *
+ * Raises TypeError if <code>$_</code> is not a String. The
+ * implementation stores the result of <code>sub</code> back into
+ * <code>$_</code> unconditionally and returns it.
+ */
+
+static VALUE
+rb_f_sub(int argc, VALUE *argv)
+{
+ VALUE str = rb_funcall_passing_block(uscore_get(), rb_intern("sub"), argc, argv); /* forwards all arguments and the caller's block */
+ rb_lastline_set(str);
+ return str;
+}
+
+/*
+ * call-seq:
+ * gsub(pattern, replacement) -> $_
+ * gsub(pattern) {|...| block } -> $_
+ *
+ * Equivalent to <code>$_.gsub...</code>, except that <code>$_</code>
+ * will be updated if substitution occurs.
+ * Available only when -p/-n command line option specified.
+ *
+ * Raises TypeError if <code>$_</code> is not a String. The
+ * implementation stores the result of <code>gsub</code> back into
+ * <code>$_</code> unconditionally and returns it.
+ *
+ */
+
+static VALUE
+rb_f_gsub(int argc, VALUE *argv)
+{
+ VALUE str = rb_funcall_passing_block(uscore_get(), rb_intern("gsub"), argc, argv); /* forwards all arguments and the caller's block */
+ rb_lastline_set(str);
+ return str;
+}
+
+/*
+ * call-seq:
+ * chop -> $_
+ *
+ * Equivalent to <code>($_.dup).chop!</code>, except <code>nil</code>
+ * is never returned. See <code>String#chop!</code>.
+ * Available only when -p/-n command line option specified.
+ *
+ * Raises TypeError if <code>$_</code> is not a String. The
+ * implementation calls <code>chop</code> (not <code>chop!</code>) on
+ * <code>$_</code> and stores the result back into <code>$_</code>.
+ *
+ */
+
+static VALUE
+rb_f_chop(void)
+{
+ VALUE str = rb_funcall_passing_block(uscore_get(), rb_intern("chop"), 0, 0); /* no arguments are passed */
+ rb_lastline_set(str);
+ return str;
+}
+
+
+/*
+ * call-seq:
+ * chomp -> $_
+ * chomp(string) -> $_
+ *
+ * Equivalent to <code>$_ = $_.chomp(<em>string</em>)</code>. See
+ * <code>String#chomp</code>.
+ * Available only when -p/-n command line option specified.
+ *
+ * Raises TypeError if <code>$_</code> is not a String.
+ *
+ */
+
+static VALUE
+rb_f_chomp(int argc, VALUE *argv)
+{
+ VALUE str = rb_funcall_passing_block(uscore_get(), rb_intern("chomp"), argc, argv); /* forwards all arguments and the caller's block */
+ rb_lastline_set(str);
+ return str;
+}
+
static VALUE
+process_options(int argc, char **argv, ruby_cmdline_options_t *opt) /* Parse the options, load and compile the script. Returns the main iseq cast to VALUE, Qtrue when there is nothing left to run (usage/version/copyright/dump requests, or the verbose flag with no script), or Qfalse when the parsed AST has no root. */
{
- struct cmdline_arguments *argp = (struct cmdline_arguments *)arg;
- struct cmdline_options *opt = argp->opt;
- int argc = argp->argc;
- char **argv = argp->argv;
- NODE *tree = 0;
+ rb_ast_t *ast = 0;
VALUE parser;
- VALUE iseq;
+ VALUE script_name;
+ const rb_iseq_t *iseq;
rb_encoding *enc, *lenc;
+#if UTF8_PATH
+ rb_encoding *uenc, *ienc = 0;
+#endif
const char *s;
char fbuf[MAXPATHLEN];
- int i = proc_options(argc, argv, opt);
- int safe;
+ int i = (int)proc_options(argc, argv, opt, 0);
+ rb_binding_t *toplevel_binding;
+ const struct rb_block *base_block;
+ unsigned int dump = opt->dump & dump_exit_bits; /* dump requests still to be served; each bit is cleared below once handled */
+
+ if (opt->dump & (DUMP_BIT(usage)|DUMP_BIT(help))) { /* usage/help is handled before anything else */
+ const char *const progname =
+ (argc > 0 && argv && argv[0] ? argv[0] :
+ origarg.argc > 0 && origarg.argv && origarg.argv[0] ? origarg.argv[0] :
+ ruby_engine);
+ usage(progname, (opt->dump & DUMP_BIT(help)));
+ return Qtrue;
+ }
argc -= i;
argv += i;
- if (!(opt->disable & DISABLE_BIT(rubyopt)) &&
- rb_safe_level() == 0 && (s = getenv("RUBYOPT"))) {
+ if ((opt->features & FEATURE_BIT(rubyopt)) &&
+ opt->safe_level == 0 && (s = getenv("RUBYOPT"))) { /* RUBYOPT is read only when the rubyopt feature bit is set and safe_level is 0 */
VALUE src_enc_name = opt->src.enc.name;
VALUE ext_enc_name = opt->ext.enc.name;
+ VALUE int_enc_name = opt->intern.enc.name;
- while (ISSPACE(*s))
- s++;
- if (*s == 'T' || (*s == '-' && *(s + 1) == 'T')) {
- int numlen;
- int v = 1;
-
- if (*s != 'T')
- ++s;
- if (*++s) {
- v = scan_oct(s, 2, &numlen);
- if (numlen == 0)
- v = 1;
- }
- rb_set_safe_level(v);
- }
- else {
- while (s && *s) {
- if (*s == '-') {
- s++;
- if (ISSPACE(*s)) {
- do {
- s++;
- } while (ISSPACE(*s));
- continue;
- }
- }
- if (!*s)
- break;
- if (!strchr("EIdvwWrK", *s))
- rb_raise(rb_eRuntimeError,
- "invalid switch in RUBYOPT: -%c", *s);
- s = moreswitches(s, opt);
- }
- }
+ opt->src.enc.name = opt->ext.enc.name = opt->intern.enc.name = 0; /* cleared while RUBYOPT is parsed; names saved above are restored below, so they take priority */
+ moreswitches(s, opt, 1);
if (src_enc_name)
opt->src.enc.name = src_enc_name;
if (ext_enc_name)
opt->ext.enc.name = ext_enc_name;
+ if (int_enc_name)
+ opt->intern.enc.name = int_enc_name;
}
- if (opt->version) {
+ if (opt->src.enc.name)
+ rb_warning("-K is specified; it is for 1.8 compatibility and may cause odd behavior");
+
+ if (opt->dump & (DUMP_BIT(version) | DUMP_BIT(version_v))) {
ruby_show_version();
- return Qtrue;
+ if (opt->dump & DUMP_BIT(version)) return Qtrue; /* version_v alone prints the version and keeps going */
}
- if (opt->copyright) {
+ if (opt->dump & DUMP_BIT(copyright)) {
ruby_show_copyright();
- }
-
- if (rb_safe_level() >= 4) {
- OBJ_TAINT(rb_argv);
- OBJ_TAINT(GET_VM()->load_path);
+ return Qtrue;
}
if (!opt->e_script) {
- if (argc == 0) { /* no more args */
+ if (argc <= 0) { /* no more args */
if (opt->verbose)
return Qtrue;
opt->script = "-";
}
else {
opt->script = argv[0];
- if (opt->script[0] == '\0') {
+ if (!opt->script || opt->script[0] == '\0') {
opt->script = "-";
}
else if (opt->do_search) {
@@ -1061,30 +1543,36 @@ process_options(VALUE arg)
argc--;
argv++;
}
+ if (opt->script[0] == '-' && !opt->script[1]) { /* script name is exactly "-" */
+ forbid_setid("program input from stdin");
+ }
}
- ruby_script(opt->script);
-#if defined DOSISH || defined __CYGWIN__
- translate_char(RSTRING_PTR(rb_progname), '\\', '/');
-#endif
- opt->script_name = rb_str_new4(rb_progname);
+ opt->script_name = rb_str_new_cstr(opt->script);
opt->script = RSTRING_PTR(opt->script_name);
- ruby_set_argv(argc, argv);
- process_sflag(opt);
- ruby_init_loadpath();
- safe = rb_safe_level();
- rb_set_safe_level_force(0);
- ruby_init_gems(!(opt->disable & DISABLE_BIT(gems)));
+#if _WIN32
+ translit_char_bin(RSTRING_PTR(opt->script_name), '\\', '/');
+#elif defined DOSISH
+ translit_char(RSTRING_PTR(opt->script_name), '\\', '/');
+#endif
+
+ ruby_gc_set_params(opt->safe_level);
+ ruby_init_loadpath_safe(opt->safe_level);
+ Init_enc();
lenc = rb_locale_encoding();
- for (i = 0; i < RARRAY_LEN(rb_argv); i++) {
- rb_enc_associate(RARRAY_PTR(rb_argv)[i], lenc);
- }
+ rb_enc_associate(rb_progname, lenc);
+ rb_obj_freeze(rb_progname);
parser = rb_parser_new();
- if (opt->yydebug) rb_parser_set_yydebug(parser, Qtrue);
+ if (opt->dump & DUMP_BIT(yydebug)) {
+ rb_parser_set_yydebug(parser, Qtrue);
+ }
if (opt->ext.enc.name != 0) {
opt->ext.enc.index = opt_enc_index(opt->ext.enc.name);
}
+ if (opt->intern.enc.name != 0) {
+ opt->intern.enc.index = opt_enc_index(opt->intern.enc.name);
+ }
if (opt->src.enc.name != 0) {
opt->src.enc.index = opt_enc_index(opt->src.enc.name);
src_encoding_index = opt->src.enc.index;
@@ -1096,176 +1584,294 @@ process_options(VALUE arg)
enc = lenc;
}
rb_enc_set_default_external(rb_enc_from_encoding(enc));
+ if (opt->intern.enc.index >= 0) {
+ enc = rb_enc_from_index(opt->intern.enc.index);
+ rb_enc_set_default_internal(rb_enc_from_encoding(enc));
+ opt->intern.enc.index = -1; /* reset so only a later setting is applied after the script is loaded */
+#if UTF8_PATH
+ ienc = enc;
+#endif
+ }
+ script_name = opt->script_name; /* keep the unconverted name; opt->script_name may be replaced just below */
+ rb_enc_associate(opt->script_name,
+ IF_UTF8_PATH(uenc = rb_utf8_encoding(), lenc));
+#if UTF8_PATH
+ if (uenc != lenc) {
+ opt->script_name = str_conv_enc(opt->script_name, uenc, lenc);
+ opt->script = RSTRING_PTR(opt->script_name);
+ }
+#endif
+ rb_obj_freeze(opt->script_name);
+ if (IF_UTF8_PATH(uenc != lenc, 1)) { /* re-encode every load path entry, preserving the initial-load-path mark */
+ long i;
+ rb_vm_t *vm = GET_VM();
+ VALUE load_path = vm->load_path;
+ const ID id_initial_load_path_mark = INITIAL_LOAD_PATH_MARK;
+ int modifiable = FALSE;
+
+ rb_get_expanded_load_path();
+ for (i = 0; i < RARRAY_LEN(load_path); ++i) {
+ VALUE path = RARRAY_AREF(load_path, i);
+ int mark = rb_attr_get(path, id_initial_load_path_mark) == path;
+#if UTF8_PATH
+ VALUE newpath = rb_str_conv_enc(path, uenc, lenc);
+ if (newpath == path) continue;
+ path = newpath;
+#else
+ path = rb_enc_associate(rb_str_dup(path), lenc);
+#endif
+ if (mark) rb_ivar_set(path, id_initial_load_path_mark, path);
+ if (!modifiable) { /* rb_ary_modify() is called once, before the first replacement */
+ rb_ary_modify(load_path);
+ modifiable = TRUE;
+ }
+ RARRAY_ASET(load_path, i, path);
+ }
+ if (modifiable) {
+ rb_ary_replace(vm->load_path_snapshot, load_path);
+ }
+ }
+ Init_ext(); /* load statically linked extensions before rubygems */
+ if (opt->features & FEATURE_BIT(gems)) {
+ rb_define_module("Gem");
+ }
+ if (opt->features & FEATURE_BIT(did_you_mean)) {
+ rb_define_module("DidYouMean");
+ }
+ ruby_init_prelude();
+ if ((opt->features ^ DEFAULT_FEATURES) & COMPILATION_FEATURES) { /* some compilation feature differs from its default */
+ VALUE option = rb_hash_new();
+#define SET_COMPILE_OPTION(h, o, name) \
+ rb_hash_aset((h), ID2SYM(rb_intern_const(#name)), \
+ ((o)->features & FEATURE_BIT(name) ? Qtrue : Qfalse));
+ SET_COMPILE_OPTION(option, opt, frozen_string_literal);
+ SET_COMPILE_OPTION(option, opt, debug_frozen_string_literal);
+ rb_funcallv(rb_cISeq, rb_intern_const("compile_option="), 1, &option);
+#undef SET_COMPILE_OPTION
+ }
+ ruby_set_argv(argc, argv);
+ process_sflag(&opt->sflag);
+
+ GetBindingPtr(rb_const_get(rb_cObject, rb_intern("TOPLEVEL_BINDING")),
+ toplevel_binding);
+ /* need to acquire env from toplevel_binding each time, since it
+ * may update after eval() */
+
+ base_block = toplevel_context(toplevel_binding);
+ rb_parser_set_context(parser, base_block, TRUE);
- rb_set_safe_level_force(safe);
if (opt->e_script) {
+ VALUE progname = rb_progname;
rb_encoding *eenc;
if (opt->src.enc.index >= 0) {
eenc = rb_enc_from_index(opt->src.enc.index);
}
else {
eenc = lenc;
+#if UTF8_PATH
+ if (ienc) eenc = ienc;
+#endif
+ }
+#if UTF8_PATH
+ if (eenc != uenc) {
+ opt->e_script = str_conv_enc(opt->e_script, uenc, eenc);
}
+#endif
rb_enc_associate(opt->e_script, eenc);
- require_libraries(opt);
- tree = rb_parser_compile_string(parser, opt->script, opt->e_script, 1);
+ if (!(opt->dump & ~DUMP_BIT(version_v))) { /* -r libraries are skipped when any dump other than version_v is requested */
+ ruby_set_script_name(opt->script_name);
+ require_libraries(&opt->req_list);
+ }
+ ruby_set_script_name(progname); /* put back the value rb_progname had before the requires */
+ rb_parser_set_options(parser, opt->do_print, opt->do_loop,
+ opt->do_line, opt->do_split);
+ ast = rb_parser_compile_string(parser, opt->script, opt->e_script, 1);
}
else {
- if (opt->script[0] == '-' && !opt->script[1]) {
- forbid_setid("program input from stdin");
- }
- tree = load_file(parser, opt->script, 1, opt);
+ VALUE f;
+ f = open_load_file(script_name, &opt->xflag);
+ ast = load_file(parser, opt->script_name, f, 1, opt);
+ }
+ ruby_set_script_name(opt->script_name);
+ if (dump & DUMP_BIT(yydebug)) {
+ dump &= ~DUMP_BIT(yydebug);
+ if (!dump) return Qtrue;
}
- if (!tree) return Qfalse;
+ if (opt->ext.enc.index >= 0) { /* applied again: load_file may have updated the indexes from shebang options */
+ enc = rb_enc_from_index(opt->ext.enc.index);
+ }
+ else {
+ enc = lenc;
+ }
+ rb_enc_set_default_external(rb_enc_from_encoding(enc));
+ if (opt->intern.enc.index >= 0) {
+ /* Set in the shebang line */
+ enc = rb_enc_from_index(opt->intern.enc.index);
+ rb_enc_set_default_internal(rb_enc_from_encoding(enc));
+ }
+ else if (!rb_default_internal_encoding())
+ /* Freeze default_internal */
+ rb_enc_set_default_internal(Qnil);
+ rb_stdio_set_default_encoding();
+
+ if (!ast->root) {
+ rb_ast_dispose(ast);
+ return Qfalse;
+ }
- process_sflag(opt);
+ process_sflag(&opt->sflag);
opt->xflag = 0;
- if (rb_safe_level() >= 4) {
- FL_UNSET(rb_argv, FL_TAINT);
- FL_UNSET(GET_VM()->load_path, FL_TAINT);
- }
-
- if (opt->do_check) {
+ if (dump & DUMP_BIT(syntax)) {
printf("Syntax OK\n");
- return Qtrue;
+ dump &= ~DUMP_BIT(syntax);
+ if (!dump) return Qtrue;
}
- if (opt->do_print) {
- tree = rb_parser_append_print(parser, tree);
- }
if (opt->do_loop) {
- tree = rb_parser_while_loop(parser, tree, opt->do_line, opt->do_split);
+ rb_define_global_function("sub", rb_f_sub, -1); /* the $_ helpers are defined only when do_loop is set */
+ rb_define_global_function("gsub", rb_f_gsub, -1);
+ rb_define_global_function("chop", rb_f_chop, 0);
+ rb_define_global_function("chomp", rb_f_chomp, -1);
+ }
+
+ if (dump & (DUMP_BIT(parsetree)|DUMP_BIT(parsetree_with_comment))) {
+ rb_io_write(rb_stdout, rb_parser_dump_tree(ast->root, dump & DUMP_BIT(parsetree_with_comment)));
+ rb_io_flush(rb_stdout);
+ dump &= ~DUMP_BIT(parsetree)&~DUMP_BIT(parsetree_with_comment);
+ if (!dump) {
+ rb_ast_dispose(ast);
+ return Qtrue;
+ }
}
- iseq = rb_iseq_new(tree, rb_str_new2("<main>"),
- opt->script_name, Qfalse, ISEQ_TYPE_TOP);
+ {
+ VALUE path = Qnil; /* stays nil for -e scripts and for "-" */
+ if (!opt->e_script && strcmp(opt->script, "-")) {
+ path = rb_realpath_internal(Qnil, script_name, 1);
+#if UTF8_PATH
+ if (uenc != lenc) {
+ path = str_conv_enc(path, uenc, lenc);
+ }
+#endif
+ if (!ENCODING_GET(path)) { /* ASCII-8BIT */
+ rb_enc_copy(path, opt->script_name);
+ }
+ }
+ base_block = toplevel_context(toplevel_binding);
+ iseq = rb_iseq_new_main(ast->root, opt->script_name, path, vm_block_iseq(base_block));
+ rb_ast_dispose(ast);
+ }
- if (opt->dump & DUMP_BIT(insns)) {
- rb_io_write(rb_stdout, ruby_iseq_disasm(iseq));
+ if (dump & DUMP_BIT(insns)) {
+ rb_io_write(rb_stdout, rb_iseq_disasm((const rb_iseq_t *)iseq));
rb_io_flush(rb_stdout);
- return Qtrue;
+ dump &= ~DUMP_BIT(insns);
+ if (!dump) return Qtrue;
}
+ if (opt->dump & dump_exit_bits) return Qtrue; /* tests the original opt->dump, not the local copy that was cleared above */
- return iseq;
+ rb_define_readonly_boolean("$-p", opt->do_print);
+ rb_define_readonly_boolean("$-l", opt->do_line);
+ rb_define_readonly_boolean("$-a", opt->do_split);
+
+ rb_set_safe_level(opt->safe_level);
+
+ return (VALUE)iseq;
}
-static NODE *
-load_file(VALUE parser, const char *fname, int script, struct cmdline_options *opt)
+#ifndef DOSISH
+static void
+warn_cr_in_shebang(const char *str, long len) /* Warn when the line str (len bytes) ends in "\r\n". Shorter lines are ignored. On DOSISH builds this is a no-op macro. */
{
- extern VALUE rb_stdin;
- VALUE f;
- int line_start = 1;
- NODE *tree = 0;
- rb_encoding *enc;
-
- if (!fname)
- rb_load_fail(fname);
- if (strcmp(fname, "-") == 0) {
- f = rb_stdin;
+ if (len > 1 && str[len-1] == '\n' && str[len-2] == '\r') { /* len > 1: a caller may pass the rest of a "#!" line, which can be a lone "\n"; never read before str */
+ rb_warn("shebang line ending with \\r may cause problems");
}
- else {
- int fd, mode = O_RDONLY;
-#if defined DOSISH || defined __CYGWIN__
- {
- const char *ext = strrchr(fname, '.');
- if (ext && STRCASECMP(ext, ".exe") == 0)
- mode |= O_BINARY;
- }
+}
+#else
+#define warn_cr_in_shebang(str, len) (void)0
#endif
- if ((fd = open(fname, mode)) < 0) {
- rb_load_fail(fname);
- }
- f = rb_io_fdopen(fd, mode, fname);
- }
+struct load_file_arg { /* Arguments bundled by load_file() for load_file_internal() and restore_load_file(). */
+ VALUE parser;
+ VALUE fname; /* handed to the parser as the file path */
+ int script; /* nonzero: handle -x/shebang options, required libraries and DATA */
+ ruby_cmdline_options_t *opt;
+ VALUE f; /* input IO; set to Qnil when restore_load_file() must not close it */
+};
+
+static VALUE
+load_file_internal(VALUE argp_v) /* Body run by load_file(): argp_v is a struct load_file_arg * cast to VALUE; returns the parsed rb_ast_t * cast to VALUE. */
+{
+ struct load_file_arg *argp = (struct load_file_arg *)argp_v;
+ VALUE parser = argp->parser;
+ VALUE orig_fname = argp->fname;
+ int script = argp->script;
+ ruby_cmdline_options_t *opt = argp->opt;
+ VALUE f = argp->f;
+ int line_start = 1;
+ rb_ast_t *ast = 0;
+ rb_encoding *enc;
+ ID set_encoding;
+ CONST_ID(set_encoding, "set_encoding");
if (script) {
VALUE c = 1; /* something not nil */
VALUE line;
- char *p;
+ char *p, *str;
+ long len;
int no_src_enc = !opt->src.enc.name;
int no_ext_enc = !opt->ext.enc.name;
+ int no_int_enc = !opt->intern.enc.name; /* like the two flags above: remember whether a name was already set before the shebang is read */
- enc = rb_usascii_encoding();
- rb_funcall(f, rb_intern("set_encoding"), 1, rb_enc_from_encoding(enc));
+ enc = rb_ascii8bit_encoding(); /* the leading lines are scanned with f set to ASCII-8BIT */
+ rb_funcall(f, set_encoding, 1, rb_enc_from_encoding(enc));
if (opt->xflag) {
- forbid_setid("-x");
- opt->xflag = Qfalse;
+ line_start--;
+ search_shebang:
while (!NIL_P(line = rb_io_gets(f))) {
line_start++;
- if (RSTRING_LEN(line) > 2
- && RSTRING_PTR(line)[0] == '#'
- && RSTRING_PTR(line)[1] == '!') {
- if ((p = strstr(RSTRING_PTR(line), "ruby")) != 0) {
+ RSTRING_GETMEM(line, str, len);
+ if (len > 2 && str[0] == '#' && str[1] == '!') {
+ if (line_start == 1) warn_cr_in_shebang(str, len);
+ if ((p = strstr(str+2, ruby_engine)) != 0) {
goto start_read;
}
}
}
- rb_raise(rb_eLoadError, "no Ruby script found in input");
+ rb_loaderror("no Ruby script found in input");
}
c = rb_io_getbyte(f);
if (c == INT2FIX('#')) {
c = rb_io_getbyte(f);
- if (c == INT2FIX('!')) {
- line = rb_io_gets(f);
- if (NIL_P(line))
- return 0;
-
- if ((p = strstr(RSTRING_PTR(line), "ruby")) == 0) {
- /* not ruby script, kick the program */
- char **argv;
- char *path;
- char *pend = RSTRING_PTR(line) + RSTRING_LEN(line);
-
- p = RSTRING_PTR(line); /* skip `#!' */
- if (pend[-1] == '\n')
- pend--; /* chomp line */
- if (pend[-1] == '\r')
- pend--;
- *pend = '\0';
- while (p < pend && ISSPACE(*p))
- p++;
- path = p; /* interpreter path */
- while (p < pend && !ISSPACE(*p))
- p++;
- *p++ = '\0';
- if (p < pend) {
- argv = ALLOCA_N(char *, origarg.argc + 3);
- argv[1] = p;
- MEMCPY(argv + 2, origarg.argv + 1, char *, origarg.argc);
- }
- else {
- argv = origarg.argv;
- }
- argv[0] = path;
- execv(path, argv);
-
- rb_fatal("Can't exec %s", path);
+ if (c == INT2FIX('!') && !NIL_P(line = rb_io_gets(f))) { /* line holds the rest of the first line, after the "#!" bytes already consumed */
+ RSTRING_GETMEM(line, str, len);
+ warn_cr_in_shebang(str, len);
+ if ((p = strstr(str, ruby_engine)) == 0) {
+ /* not ruby script, assume -x flag */
+ goto search_shebang;
}
start_read:
- p += 4;
- RSTRING_PTR(line)[RSTRING_LEN(line) - 1] = '\0';
- if (RSTRING_PTR(line)[RSTRING_LEN(line) - 2] == '\r')
- RSTRING_PTR(line)[RSTRING_LEN(line) - 2] = '\0';
+ str += len - 1; /* point at the last byte and strip a trailing "\n" and then "\r" */
+ if (*str == '\n') *str-- = '\0';
+ if (*str == '\r') *str-- = '\0';
+ /* ruby_engine should not contain a space */
if ((p = strstr(p, " -")) != 0) {
- p++; /* skip space before `-' */
- while (*p == '-') {
- p = moreswitches(p + 1, opt);
- }
+ opt->warning = 0; /* cleared so -w/-W on the shebang line take effect; proc_options skips them while opt->warning is set */
+ moreswitches(p + 1, opt, 0);
}
/* push back shebang for pragma may exist in next line */
- rb_io_ungetc(f, rb_str_new2("!\n"));
+ rb_io_ungetbyte(f, rb_str_new2("!\n"));
}
else if (!NIL_P(c)) {
- rb_io_ungetc(f, c);
+ rb_io_ungetbyte(f, c);
}
- rb_io_ungetc(f, INT2FIX('#'));
+ rb_io_ungetbyte(f, INT2FIX('#'));
if (no_src_enc && opt->src.enc.name) {
opt->src.enc.index = opt_enc_index(opt->src.enc.name);
src_encoding_index = opt->src.enc.index;
@@ -1273,11 +1879,20 @@ load_file(VALUE parser, const char *fname, int script, struct cmdline_options *o
if (no_ext_enc && opt->ext.enc.name) {
opt->ext.enc.index = opt_enc_index(opt->ext.enc.name);
}
+ if (no_int_enc && opt->intern.enc.name) {
+ opt->intern.enc.index = opt_enc_index(opt->intern.enc.name);
+ }
}
else if (!NIL_P(c)) {
- rb_io_ungetc(f, c);
+ rb_io_ungetbyte(f, c);
+ }
+ else {
+ argp->f = f = Qnil; /* the first getbyte returned nil: mark f as absent so an empty string is compiled below */
+ }
+ if (!(opt->dump & ~DUMP_BIT(version_v))) { /* -r libraries are skipped when any dump other than version_v is requested */
+ ruby_set_script_name(opt->script_name);
+ require_libraries(&opt->req_list); /* Why here? unnatural */
}
- require_libraries(opt); /* Why here? unnatural */
}
if (opt->src.enc.index >= 0) {
enc = rb_enc_from_index(opt->src.enc.index);
@@ -1286,156 +1901,281 @@ load_file(VALUE parser, const char *fname, int script, struct cmdline_options *o
enc = rb_locale_encoding();
}
else {
- enc = rb_usascii_encoding();
+ enc = rb_utf8_encoding();
+ }
+ rb_parser_set_options(parser, opt->do_print, opt->do_loop,
+ opt->do_line, opt->do_split);
+ if (NIL_P(f)) { /* no input IO: compile an empty string under the chosen encoding */
+ f = rb_str_new(0, 0);
+ rb_enc_associate(f, enc);
+ return (VALUE)rb_parser_compile_string_path(parser, orig_fname, f, line_start);
}
- rb_funcall(f, rb_intern("set_encoding"), 1, rb_enc_from_encoding(enc));
- tree = (NODE *)rb_parser_compile_file(parser, fname, f, line_start);
- rb_funcall(f, rb_intern("set_encoding"), 1, rb_parser_encoding(parser));
+ rb_funcall(f, set_encoding, 2, rb_enc_from_encoding(enc), rb_str_new_cstr("-"));
+ ast = rb_parser_compile_file_path(parser, orig_fname, f, line_start);
+ rb_funcall(f, set_encoding, 1, rb_parser_encoding(parser)); /* after parsing, f is switched to the encoding reported by the parser */
if (script && rb_parser_end_seen_p(parser)) {
+ /*
+ * DATA is a File that contains the data section of the executed file.
+ * To create a data section use <tt>__END__</tt>:
+ *
+ * $ cat t.rb
+ * puts DATA.gets
+ * __END__
+ * hello world!
+ *
+ * $ ruby t.rb
+ * hello world!
+ */
rb_define_global_const("DATA", f);
+ argp->f = Qnil; /* f is now DATA: stop restore_load_file() from closing it */
+ }
+ return (VALUE)ast;
+}
+
+static VALUE
+open_load_file(VALUE fname_v, int *xflag) /* Open the file named by fname_v for loading and return it as an IO; the name "-" yields rb_stdin. On DOSISH/Cygwin builds *xflag is set to 1 when the name ends in ".exe". Failures go through rb_load_fail(). */
+{
+ const char *fname = (fname_v = rb_str_encode_ospath(fname_v),
+ StringValueCStr(fname_v));
+ long flen = RSTRING_LEN(fname_v);
+ VALUE f;
+ int e;
+
+ if (flen == 1 && fname[0] == '-') {
+ f = rb_stdin;
+ }
+ else {
+ int fd;
+ /* open(2) may block if fname points to a FIFO and it is empty, so
+ use O_NONBLOCK (or O_NDELAY) when it is available. */
+#if defined O_NONBLOCK && HAVE_FCNTL && !(O_NONBLOCK & O_ACCMODE)
+ /* TODO: fix conflicting O_NONBLOCK in ruby/win32.h */
+# define MODE_TO_LOAD (O_RDONLY | O_NONBLOCK)
+#elif defined O_NDELAY && HAVE_FCNTL && !(O_NDELAY & O_ACCMODE)
+# define MODE_TO_LOAD (O_RDONLY | O_NDELAY)
+#else
+# define MODE_TO_LOAD (O_RDONLY)
+#endif
+ int mode = MODE_TO_LOAD;
+#if defined DOSISH || defined __CYGWIN__
+# define isdirsep(x) ((x) == '/' || (x) == '\\')
+ {
+ static const char exeext[] = ".exe";
+ enum {extlen = sizeof(exeext)-1};
+ if (flen > extlen && !isdirsep(fname[flen-extlen-1]) &&
+ STRNCASECMP(fname+flen-extlen, exeext, extlen) == 0) { /* name ends in ".exe" (case-insensitive) with at least one non-separator character before it */
+ mode |= O_BINARY;
+ *xflag = 1;
+ }
+ }
+#endif
+
+ if ((fd = rb_cloexec_open(fname, mode, 0)) < 0) {
+ int e = errno;
+ if (!rb_gc_for_fd(e)) { /* fail at once unless rb_gc_for_fd() reports that a retry is worthwhile */
+ rb_load_fail(fname_v, strerror(e));
+ }
+ if ((fd = rb_cloexec_open(fname, mode, 0)) < 0) {
+ rb_load_fail(fname_v, strerror(errno));
+ }
+ }
+ rb_update_max_fd(fd);
+
+#if defined HAVE_FCNTL && MODE_TO_LOAD != O_RDONLY
+ /* disabling O_NONBLOCK */
+ if (fcntl(fd, F_SETFL, 0) < 0) {
+ e = errno;
+ (void)close(fd);
+ rb_load_fail(fname_v, strerror(e));
+ }
+#endif
+
+ e = ruby_is_fd_loadable(fd); /* 0: not loadable (errno is reported); negative: wait for data below */
+ if (!e) {
+ e = errno;
+ (void)close(fd);
+ rb_load_fail(fname_v, strerror(e));
+ }
+
+ f = rb_io_fdopen(fd, mode, fname);
+ if (e < 0) {
+ /*
+ We need to wait if the FIFO is empty; those are FIFO semantics.
+ rb_thread_wait_fd() releases the GVL, so waiting here is safe.
+ */
+ rb_thread_wait_fd(fd);
+ }
}
- else if (f != rb_stdin) {
+ return f;
+}
+
+static VALUE
+restore_load_file(VALUE arg) /* Cleanup run by load_file() via rb_ensure: closes argp->f unless it is nil or rb_stdin. Always returns Qnil. */
+{
+ struct load_file_arg *argp = (struct load_file_arg *)arg;
+ VALUE f = argp->f;
+
+ if (!NIL_P(f) && f != rb_stdin) {
rb_io_close(f);
}
- return tree;
+ return Qnil;
+}
+
+static rb_ast_t *
+load_file(VALUE parser, VALUE fname, VALUE f, int script, ruby_cmdline_options_t *opt) /* Pack the arguments into a struct load_file_arg and run load_file_internal() under rb_ensure with restore_load_file() as the cleanup. Returns the resulting AST pointer. */
+{
+ struct load_file_arg arg;
+ arg.parser = parser;
+ arg.fname = fname;
+ arg.script = script;
+ arg.opt = opt;
+ arg.f = f;
+ return (rb_ast_t *)rb_ensure(load_file_internal, (VALUE)&arg,
+ restore_load_file, (VALUE)&arg); /* both callbacks receive the same struct, so the body can change arg.f for the cleanup */
}
void *
rb_load_file(const char *fname) /* C-string front end: wraps fname in a new Ruby String and delegates to rb_load_file_str(). */
{
- struct cmdline_options opt;
+ VALUE fname_v = rb_str_new_cstr(fname);
+ return rb_load_file_str(fname_v);
+}
- return load_file(rb_parser_new(), fname, 0, cmdline_options_init(&opt));
+void *
+rb_load_file_str(VALUE fname_v) /* Loads fname_v through rb_parser_load_file() using a parser created with rb_parser_new(). */
+{
+ return rb_parser_load_file(rb_parser_new(), fname_v);
}
-#if !defined(PSTAT_SETCMD) && !defined(HAVE_SETPROCTITLE)
-#if !defined(_WIN32) && !(defined(HAVE_SETENV) && defined(HAVE_UNSETENV))
-#define USE_ENVSPACE_FOR_ARG0
-#endif
+void *
+rb_parser_load_file(VALUE parser, VALUE fname_v) /* Opens fname_v and parses it with freshly initialised options; script is 0, so the shebang/-x handling in load_file_internal() is skipped. */
+{
+ ruby_cmdline_options_t opt;
+ VALUE f = open_load_file(fname_v, &cmdline_options_init(&opt)->xflag); /* opt is initialised here, inside the argument expression */
+ return load_file(parser, fname_v, f, 0, &opt);
+}
-#ifdef USE_ENVSPACE_FOR_ARG0
-extern char **environ;
-#endif
+/*
+ * call-seq:
+ * Process.argv0 -> frozen_string
+ *
+ * Returns the name of the script being executed. The value is not
+ * affected by assigning a new value to $0.
+ *
+ * This method first appeared in Ruby 2.1 to serve as a global
+ * variable free means to get the script name.
+ *
+ * Implemented by returning rb_orig_progname; the receiver argument
+ * is not used.
+ */
-static int
-get_arglen(int argc, char **argv)
+static VALUE
+proc_argv0(VALUE process)
{
- char *s = argv[0];
- int i;
+ return rb_orig_progname;
+}
- if (!argc) return 0;
- s += strlen(s);
- /* See if all the arguments are contiguous in memory */
- for (i = 1; i < argc; i++) {
- if (argv[i] == s + 1) {
- s++;
- s += strlen(s); /* this one is ok too */
- }
- else {
- break;
- }
- }
-#if defined(USE_ENVSPACE_FOR_ARG0)
- if (environ && (s == environ[0])) {
- s += strlen(s);
- for (i = 1; environ[i]; i++) {
- if (environ[i] == s + 1) {
- s++;
- s += strlen(s); /* this one is ok too */
- }
- }
- ruby_setenv("", NULL); /* duplicate environ vars */
- }
-#endif
- return s - argv[0];
+static VALUE ruby_setproctitle(VALUE title);
+
+/*
+ * call-seq:
+ * Process.setproctitle(string) -> string
+ *
+ * Sets the process title that appears on the ps(1) command. Not
+ * necessarily effective on all platforms. No exception will be
+ * raised regardless of the result, nor will NotImplementedError be
+ * raised even if the platform does not support the feature.
+ *
+ * Calling this method does not affect the value of $0.
+ *
+ * Process.setproctitle('myapp: worker #%d' % worker_id)
+ *
+ * This method first appeared in Ruby 2.1 to serve as a global
+ * variable free means to change the process title.
+ *
+ * Implemented as a thin wrapper around ruby_setproctitle(); the
+ * receiver argument is not used.
+ */
+
+static VALUE
+proc_setproctitle(VALUE process, VALUE title)
+{
+ return ruby_setproctitle(title);
+}
+
+static VALUE
+ruby_setproctitle(VALUE title) /* Passes the bytes of title to setproctitle() and returns title itself. */
+{
+ const char *ptr = StringValueCStr(title);
+ setproctitle("%.*s", RSTRING_LENINT(title), ptr); /* fixed "%.*s" format: the title is never used as a format string */
+ return title;
}
-#endif
static void
set_arg0(VALUE val, ID id)
{
- char *s;
- long i;
-
if (origarg.argv == 0)
rb_raise(rb_eRuntimeError, "$0 not initialized");
- StringValue(val);
- s = RSTRING_PTR(val);
- i = RSTRING_LEN(val);
-#if defined(PSTAT_SETCMD)
- if (i > PST_CLEN) {
- union pstun un;
- char buf[PST_CLEN + 1]; /* PST_CLEN is 64 (HP-UX 11.23) */
- strncpy(buf, s, PST_CLEN);
- buf[PST_CLEN] = '\0';
- un.pst_command = buf;
- pstat(PSTAT_SETCMD, un, PST_CLEN, 0, 0);
- }
- else {
- union pstun un;
- un.pst_command = s;
- pstat(PSTAT_SETCMD, un, i, 0, 0);
- }
-#elif defined(HAVE_SETPROCTITLE)
- setproctitle("%.*s", (int)i, s);
-#else
-
- if (i >= origarg.len) {
- i = origarg.len;
- }
-
- memcpy(origarg.argv[0], s, i);
- {
- int j;
- char *t = origarg.argv[0] + i;
- *t = '\0';
+ rb_progname = rb_str_new_frozen(ruby_setproctitle(val));
+}
- if (i + 1 < origarg.len) memset(t + 1, ' ', origarg.len - i - 1);
- for (j = 1; j < origarg.argc; j++) {
- origarg.argv[j] = t;
- }
- }
+static inline VALUE
+external_str_new_cstr(const char *p)
+{
+#if UTF8_PATH
+ VALUE str = rb_utf8_str_new_cstr(p);
+ str = str_conv_enc(str, NULL, rb_default_external_encoding());
+ OBJ_TAINT_RAW(str);
+ return str;
+#else
+ return rb_external_str_new_cstr(p);
#endif
- rb_progname = rb_tainted_str_new(s, i);
}
+/*! Sets the current script name to this value.
+ *
+ * This is similar to <code>$0 = name</code> at the Ruby level but also affects
+ * <code>Method#location</code> and others.
+ */
void
ruby_script(const char *name)
{
if (name) {
- rb_progname = rb_tainted_str_new2(name);
+ rb_orig_progname = rb_progname = external_str_new_cstr(name);
+ rb_vm_set_progname(rb_progname);
}
}
+/*! Sets the current script name to this value.
+ *
+ * Same as ruby_script() but accepts a VALUE.
+ */
+void
+ruby_set_script_name(VALUE name)
+{
+ rb_orig_progname = rb_progname = rb_str_dup(name);
+ rb_vm_set_progname(rb_progname);
+}
+
static void
-init_ids(struct cmdline_options *opt)
+init_ids(ruby_cmdline_options_t *opt)
{
rb_uid_t uid = getuid();
rb_uid_t euid = geteuid();
rb_gid_t gid = getgid();
rb_gid_t egid = getegid();
-#ifdef VMS
- uid |= gid << 16;
- euid |= egid << 16;
-#endif
if (uid != euid) opt->setids |= 1;
if (egid != gid) opt->setids |= 2;
if (uid && opt->setids) {
- rb_set_safe_level(1);
+ if (opt->safe_level < 1) opt->safe_level = 1;
}
}
#undef forbid_setid
static void
-forbid_setid(const char *s, struct cmdline_options *opt)
+forbid_setid(const char *s, const ruby_cmdline_options_t *opt)
{
if (opt->setids & 1)
rb_raise(rb_eSecurityError, "no %s allowed while running setuid", s);
if (opt->setids & 2)
rb_raise(rb_eSecurityError, "no %s allowed while running setgid", s);
- if (rb_safe_level() > 0)
+ if (opt->safe_level > 0)
rb_raise(rb_eSecurityError, "no %s allowed in tainted mode", s);
}
@@ -1457,34 +2197,35 @@ opt_W_getter(ID id, void *data)
return INT2FIX(1);
case Qtrue:
return INT2FIX(2);
+ default:
+ return Qnil;
}
- return Qnil; /* not reached */
}
+/*! Defines built-in variables */
void
ruby_prog_init(void)
{
rb_define_hooked_variable("$VERBOSE", &ruby_verbose, 0, verbose_setter);
rb_define_hooked_variable("$-v", &ruby_verbose, 0, verbose_setter);
rb_define_hooked_variable("$-w", &ruby_verbose, 0, verbose_setter);
- rb_define_hooked_variable("$-W", &ruby_verbose, opt_W_getter, 0);
+ rb_define_hooked_variable("$-W", &ruby_verbose, opt_W_getter, rb_gvar_readonly_setter);
rb_define_variable("$DEBUG", &ruby_debug);
rb_define_variable("$-d", &ruby_debug);
rb_define_hooked_variable("$0", &rb_progname, 0, set_arg0);
rb_define_hooked_variable("$PROGRAM_NAME", &rb_progname, 0, set_arg0);
- rb_define_global_const("ARGV", rb_argv);
- rb_global_variable(&rb_argv0);
+ rb_define_module_function(rb_mProcess, "argv0", proc_argv0, 0);
+ rb_define_module_function(rb_mProcess, "setproctitle", proc_setproctitle, 1);
-#ifdef MSDOS
/*
- * There is no way we can refer to them from ruby, so close them to save
- * space.
+ * ARGV contains the command line arguments used to run ruby.
+ *
+ * A library like OptionParser can be used to process command-line
+ * arguments.
*/
- (void)fclose(stdaux);
- (void)fclose(stdprn);
-#endif
+ rb_define_global_const("ARGV", rb_argv);
}
void
@@ -1494,91 +2235,92 @@ ruby_set_argv(int argc, char **argv)
VALUE av = rb_argv;
#if defined(USE_DLN_A_OUT)
- if (origarg.argv)
+ if (origarg.argc > 0 && origarg.argv)
dln_argv0 = origarg.argv[0];
- else
+ else if (argc > 0 && argv)
dln_argv0 = argv[0];
#endif
rb_ary_clear(av);
for (i = 0; i < argc; i++) {
- VALUE arg = rb_tainted_str_new2(argv[i]);
+ VALUE arg = external_str_new_cstr(argv[i]);
OBJ_FREEZE(arg);
rb_ary_push(av, arg);
}
}
-static VALUE
-false_value(void)
-{
- return Qfalse;
-}
-
-static VALUE
-true_value(void)
-{
- return Qtrue;
-}
-
-#define rb_define_readonly_boolean(name, val) \
- rb_define_virtual_variable((name), (val) ? true_value : false_value, 0)
-
void *
ruby_process_options(int argc, char **argv)
{
- struct cmdline_arguments args;
- struct cmdline_options opt;
- NODE *tree;
+ ruby_cmdline_options_t opt;
+ VALUE iseq;
+ const char *script_name = (argc > 0 && argv[0]) ? argv[0] : ruby_engine;
- ruby_script(argv[0]); /* for the time being */
+ if (!origarg.argv || origarg.argc <= 0) {
+ origarg.argc = argc;
+ origarg.argv = argv;
+ }
+ ruby_script(script_name); /* for the time being */
rb_argv0 = rb_str_new4(rb_progname);
- args.argc = argc;
- args.argv = argv;
- args.opt = cmdline_options_init(&opt);
- opt.ext.enc.index = -1;
- tree = (NODE *)rb_vm_call_cfunc(rb_vm_top_self(),
- process_options, (VALUE)&args,
- 0, rb_progname);
+ rb_gc_register_mark_object(rb_argv0);
+ iseq = process_options(argc, argv, cmdline_options_init(&opt));
+
+#ifndef HAVE_SETPROCTITLE
+ ruby_init_setproctitle(argc, argv);
+#endif
- rb_define_readonly_boolean("$-p", opt.do_print);
- rb_define_readonly_boolean("$-l", opt.do_line);
- rb_define_readonly_boolean("$-a", opt.do_split);
+ return (void*)(struct RData*)iseq;
+}
- return tree;
+static void
+fill_standard_fds(void)
+{
+ int f0, f1, f2, fds[2];
+ struct stat buf;
+ f0 = fstat(0, &buf) == -1 && errno == EBADF;
+ f1 = fstat(1, &buf) == -1 && errno == EBADF;
+ f2 = fstat(2, &buf) == -1 && errno == EBADF;
+ if (f0) {
+ if (pipe(fds) == 0) {
+ close(fds[1]);
+ if (fds[0] != 0) {
+ dup2(fds[0], 0);
+ close(fds[0]);
+ }
+ }
+ }
+ if (f1 || f2) {
+ if (pipe(fds) == 0) {
+ close(fds[0]);
+ if (f1 && fds[1] != 1)
+ dup2(fds[1], 1);
+ if (f2 && fds[1] != 2)
+ dup2(fds[1], 2);
+ if (fds[1] != 1 && fds[1] != 2)
+ close(fds[1]);
+ }
+ }
}
+/*! Initializes the process for libruby.
+ *
+ * This function assumes this process is ruby(1) and it has just started.
+ * Programs that embed the CRuby interpreter usually do not need to call
+ * this function, and may do their own initialization instead.
+ * argc and argv cannot be NULL.
+ */
void
ruby_sysinit(int *argc, char ***argv)
{
-#if defined(__APPLE__) && (defined(__MACH__) || defined(__DARWIN__))
- int i, n = *argc, len = 0;
- char **v1 = *argv, **v2, *p;
-
- for (i = 0; i < n; ++i) {
- len += strlen(v1[i]) + 1;
- }
- v2 = malloc((n + 1)* sizeof(char*) + len);
- p = (char *)&v2[n + 1];
- for (i = 0; i < n; ++i) {
- int l = strlen(v1[i]);
- memcpy(p, v1[i], l + 1);
- v2[i] = p;
- p += l + 1;
- }
- v2[n] = 0;
- *argv = v2;
-#elif defined(__MACOS__) && defined(__MWERKS__)
- *argc = ccommand(argv);
-#elif defined(_WIN32)
- void rb_w32_sysinit(int *argc, char ***argv);
+#if defined(_WIN32)
rb_w32_sysinit(argc, argv);
#endif
- origarg.argc = *argc;
- origarg.argv = *argv;
-#if !defined(PSTAT_SETCMD) && !defined(HAVE_SETPROCTITLE)
- origarg.len = get_arglen(origarg.argc, origarg.argv);
-#endif
+ if (*argc >= 0 && *argv) {
+ origarg.argc = *argc;
+ origarg.argv = *argv;
#if defined(USE_DLN_A_OUT)
- dln_argv0 = origarg.argv[0];
+ dln_argv0 = origarg.argv[0];
#endif
+ }
+ fill_standard_fds();
}