From 842b0008c132dd587f09766a228041afb7fed24f Mon Sep 17 00:00:00 2001
From: Nobuyoshi Nakada
Date: Wed, 29 Sep 2021 19:59:31 +0900
Subject: Skip broken strings as the locale encoding

---
 ruby.c | 11 +++++++----
 1 file changed, 7 insertions(+), 4 deletions(-)

(limited to 'ruby.c')

diff --git a/ruby.c b/ruby.c
index 3358068bbb..818161710c 100644
--- a/ruby.c
+++ b/ruby.c
@@ -1680,7 +1680,11 @@ tty_enabled(void)
 static VALUE
 copy_str(VALUE str, rb_encoding *enc, bool intern)
 {
-    if (!intern) return rb_enc_associate(rb_str_dup(str), enc);
+    if (!intern) {
+        if (rb_enc_str_coderange_scan(str, enc) == ENC_CODERANGE_BROKEN)
+            return 0;
+        return rb_enc_associate(rb_str_dup(str), enc);
+    }
     return rb_enc_interned_str(RSTRING_PTR(str), RSTRING_LEN(str), enc);
 }
 
@@ -1916,7 +1920,7 @@ process_options(int argc, char **argv, ruby_cmdline_options_t *opt)
                 if (newpath == path) continue;
                 path = newpath;
 #else
-                path = copy_str(path, lenc, !mark);
+                if (!(path = copy_str(path, lenc, !mark))) continue;
 #endif
                 if (mark) rb_ivar_set(path, id_initial_load_path_mark, path);
                 if (!modifiable) {
@@ -1934,8 +1938,7 @@ process_options(int argc, char **argv, ruby_cmdline_options_t *opt)
             bool modified = false;
             for (long i = loaded_before_enc; i < RARRAY_LEN(loaded_features); ++i) {
                 VALUE path = RARRAY_AREF(loaded_features, i);
-                if (rb_enc_get(path) == IF_UTF8_PATH(uenc, lenc)) continue;
-                path = copy_str(path, IF_UTF8_PATH(uenc, lenc), true);
+                if (!(path = copy_str(path, IF_UTF8_PATH(uenc, lenc), true))) continue;
                 modified = true;
                 RARRAY_ASET(loaded_features, i, path);
             }
-- 
cgit v1.2.3