summary | refs | log | tree | commit | diff
diff options
context:
space:
mode:
author nagachika <nagachika@b2dd03c8-39d4-4d8f-98ff-823fe69b080e> 2016-08-15 19:02:10 +0000
committer nagachika <nagachika@b2dd03c8-39d4-4d8f-98ff-823fe69b080e> 2016-08-15 19:02:10 +0000
commit 9b71251e1e8f86972df2c0eda7c4209c5da7488a (patch)
tree b6c48f35a415eccd80f4dfb59b0572caf7d617aa
parent 243d224f285c8a4a5e4db344e2f4d4023cf8d2e9 (diff)
merge revision(s) 55181: [Backport #12431]
* transcode.c (str_transcode0): scrub in the given encoding when the source encoding is given, not in the encoding of the receiver. [ruby-core:75732] [Bug #12431]

git-svn-id: svn+ssh://ci.ruby-lang.org/ruby/branches/ruby_2_3@55905 b2dd03c8-39d4-4d8f-98ff-823fe69b080e
-rw-r--r-- ChangeLog 6
-rw-r--r-- internal.h 1
-rw-r--r-- string.c 8
-rw-r--r-- test/ruby/test_transcode.rb 3
-rw-r--r-- transcode.c 2
-rw-r--r-- version.h 2
6 files changed, 18 insertions, 4 deletions
diff --git a/ChangeLog b/ChangeLog
index 396f4cb723..ae6a7bd053 100644
--- a/ChangeLog
+++ b/ChangeLog
@@ -1,3 +1,9 @@
+Tue Aug 16 03:51:59 2016 Nobuyoshi Nakada <nobu@ruby-lang.org>
+
+ * transcode.c (str_transcode0): scrub in the given encoding when
+ the source encoding is given, not in the encoding of the
+ receiver. [ruby-core:75732] [Bug #12431]
+
Tue Aug 16 03:41:21 2016 Kazuki Yamaguchi <k@rhe.jp>
* ext/openssl/ossl_pkey_dh.c (ossl_dh_compute_key): Check that the DH
diff --git a/internal.h b/internal.h
index 7602559e2c..ac8834dbce 100644
--- a/internal.h
+++ b/internal.h
@@ -1129,6 +1129,7 @@ VALUE rb_str_locktmp_ensure(VALUE str, VALUE (*func)(VALUE), VALUE arg);
VALUE rb_external_str_with_enc(VALUE str, rb_encoding *eenc);
VALUE rb_str_cat_conv_enc_opts(VALUE newstr, long ofs, const char *ptr, long len,
rb_encoding *from, int ecflags, VALUE ecopts);
+VALUE rb_enc_str_scrub(rb_encoding *enc, VALUE str, VALUE repl);
#endif
#define STR_NOEMBED FL_USER1
#define STR_SHARED FL_USER2 /* = ELTS_SHARED */
diff --git a/string.c b/string.c
index 318acf38ff..d959b0b067 100644
--- a/string.c
+++ b/string.c
@@ -8675,8 +8675,13 @@ str_compat_and_valid(VALUE str, rb_encoding *enc)
VALUE
rb_str_scrub(VALUE str, VALUE repl)
{
+ return rb_enc_str_scrub(STR_ENC_GET(str), str, repl);
+}
+
+VALUE
+rb_enc_str_scrub(rb_encoding *enc, VALUE str, VALUE repl)
+{
int cr = ENC_CODERANGE(str);
- rb_encoding *enc;
int encidx;
VALUE buf = Qnil;
const char *rep;
@@ -8686,7 +8691,6 @@ rb_str_scrub(VALUE str, VALUE repl)
if (ENC_CODERANGE_CLEAN_P(cr))
return Qnil;
- enc = STR_ENC_GET(str);
if (!NIL_P(repl)) {
repl = str_compat_and_valid(repl, enc);
tainted = OBJ_TAINTED_RAW(repl);
diff --git a/test/ruby/test_transcode.rb b/test/ruby/test_transcode.rb
index 33e7467102..2f97d098fd 100644
--- a/test/ruby/test_transcode.rb
+++ b/test/ruby/test_transcode.rb
@@ -1213,6 +1213,9 @@ class TestTranscode < Test::Unit::TestCase
def test_invalid_replace_string
assert_equal("a<x>A", "a\x80A".encode("us-ascii", "euc-jp", :invalid=>:replace, :replace=>"<x>"))
assert_equal("a<x>A", "a\x80A".encode("us-ascii", "euc-jis-2004", :invalid=>:replace, :replace=>"<x>"))
+ s = "abcd\u{c1}"
+ r = s.b.encode("UTF-8", "UTF-8", invalid: :replace, replace: "\u{fffd}")
+ assert_equal(s, r)
end
def test_undef_replace
diff --git a/transcode.c b/transcode.c
index 0514adaf7e..8aa9cf3352 100644
--- a/transcode.c
+++ b/transcode.c
@@ -2700,7 +2700,7 @@ str_transcode0(int argc, VALUE *argv, VALUE *self, int ecflags, VALUE ecopts)
if (!NIL_P(ecopts)) {
rep = rb_hash_aref(ecopts, sym_replace);
}
- dest = rb_str_scrub(str, rep);
+ dest = rb_enc_str_scrub(senc, str, rep);
if (NIL_P(dest)) dest = str;
*self = dest;
return dencidx;
diff --git a/version.h b/version.h
index 626886551b..e6ce077475 100644
--- a/version.h
+++ b/version.h
@@ -1,6 +1,6 @@
#define RUBY_VERSION "2.3.2"
#define RUBY_RELEASE_DATE "2016-08-16"
-#define RUBY_PATCHLEVEL 155
+#define RUBY_PATCHLEVEL 156
#define RUBY_RELEASE_YEAR 2016
#define RUBY_RELEASE_MONTH 8