diff options
| author | tompng <tomoyapenguin@gmail.com> | 2024-01-16 02:44:53 +0900 |
|---|---|---|
| committer | Nobuyoshi Nakada <nobu@ruby-lang.org> | 2024-01-16 23:18:55 +0900 |
| commit | ade56737e2273847426214035c0ff2340b43799a (patch) | |
| tree | bad63eab75e91ff9406ecf56101f9f48144560e0 | |
| parent | 0520e9675b91ea559da1ae5eda9db378fbdbca52 (diff) | |
Fix coderange of invalid_encoding_string.<<(ord)
Appending valid encoding character can change coderange from invalid to valid.
Example: "\x95".force_encoding('sjis')<<0x5C will be a valid string "\x{955C}"
| -rw-r--r-- | string.c | 6 | ||||
| -rw-r--r-- | test/ruby/test_string.rb | 3 |
2 files changed, 8 insertions, 1 deletions
@@ -3522,8 +3522,12 @@ rb_str_concat(VALUE str1, VALUE str2) } rb_str_resize(str1, pos+len); memcpy(RSTRING_PTR(str1) + pos, buf, len); - if (cr == ENC_CODERANGE_7BIT && code > 127) + if (cr == ENC_CODERANGE_7BIT && code > 127) { cr = ENC_CODERANGE_VALID; + } + else if (cr == ENC_CODERANGE_BROKEN) { + cr = ENC_CODERANGE_UNKNOWN; + } ENC_CODERANGE_SET(str1, cr); } return str1; diff --git a/test/ruby/test_string.rb b/test/ruby/test_string.rb index 4aa119f8fd..42f2544b5a 100644 --- a/test/ruby/test_string.rb +++ b/test/ruby/test_string.rb @@ -301,6 +301,9 @@ CODE assert_raise(RangeError, bug) {S("a".force_encoding(Encoding::UTF_8)) << -1} assert_raise(RangeError, bug) {S("a".force_encoding(Encoding::UTF_8)) << 0x81308130} assert_nothing_raised {S("a".force_encoding(Encoding::GB18030)) << 0x81308130} + + s = "\x95".force_encoding(Encoding::SJIS).tap(&:valid_encoding?) + assert_predicate(s << 0x5c, :valid_encoding?) end def test_MATCH # '=~' |
