summary | refs | log | tree | commit | diff
path: root/string.c
diff options
context:
space:
mode:
author: matz <matz@b2dd03c8-39d4-4d8f-98ff-823fe69b080e> 2008-06-19 17:11:55 +0000
committer: matz <matz@b2dd03c8-39d4-4d8f-98ff-823fe69b080e> 2008-06-19 17:11:55 +0000
commit: 5336cbdfd33b90c92069f55d8c0ba6df4cf66a0e (patch)
tree: f257335933c6260698e891a78e3657818e0ac5ca /string.c
parent: e929f49e564dab959e6df43bb7e3621d74e8c3c5 (diff)
* string.c (str_gsub): should preserve last successful match
data. [ruby-dev:35182]
git-svn-id: svn+ssh://ci.ruby-lang.org/ruby/trunk@17447 b2dd03c8-39d4-4d8f-98ff-823fe69b080e
Diffstat (limited to 'string.c')
-rw-r--r-- string.c 35
1 files changed, 17 insertions, 18 deletions
diff --git a/string.c b/string.c
index f3207d7077..b962880d43 100644
--- a/string.c
+++ b/string.c
@@ -3084,8 +3084,7 @@ get_pat(VALUE pat, int quote)
static VALUE
rb_str_sub_bang(int argc, VALUE *argv, VALUE str)
{
- VALUE pat, repl, match, hash = Qnil;
- struct re_registers *regs;
+ VALUE pat, repl, hash = Qnil;
int iter = 0;
int tainted = 0;
long plen;
@@ -3109,15 +3108,13 @@ rb_str_sub_bang(int argc, VALUE *argv, VALUE str)
if (rb_reg_search(pat, str, 0, 0) >= 0) {
rb_encoding *enc;
int cr = ENC_CODERANGE(str);
-
- match = rb_backref_get();
- regs = RMATCH_REGS(match);
+ VALUE match = rb_backref_get();
+ struct re_registers *regs = RMATCH_REGS(match);
if (iter || !NIL_P(hash)) {
char *p = RSTRING_PTR(str); long len = RSTRING_LEN(str);
if (iter) {
- rb_match_busy(match);
repl = rb_obj_as_string(rb_yield(rb_reg_nth_match(0, match)));
}
else {
@@ -3126,7 +3123,6 @@ rb_str_sub_bang(int argc, VALUE *argv, VALUE str)
}
str_mod_check(str, p, len);
str_frozen_check(str);
- if (iter) rb_backref_set(match);
}
else {
repl = rb_reg_regsub(repl, str, regs, pat);
@@ -3217,7 +3213,8 @@ str_gsub(int argc, VALUE *argv, VALUE str, int bang)
VALUE pat, val, repl, match, dest, hash = Qnil;
struct re_registers *regs;
long beg, n;
- long offset, blen, slen, len;
+ long beg0, end0;
+ long offset, blen, slen, len, last;
int iter = 0;
char *sp, *cp;
int tainted = 0;
@@ -3241,13 +3238,14 @@ str_gsub(int argc, VALUE *argv, VALUE str, int bang)
}
pat = get_pat(argv[0], 1);
- offset=0; n=0;
beg = rb_reg_search(pat, str, 0, 0);
if (beg < 0) {
if (bang) return Qnil; /* no match, no substitution */
return rb_str_dup(str);
}
+ offset = 0;
+ n = 0;
blen = RSTRING_LEN(str) + 30; /* len + margin */
dest = rb_str_buf_new(blen);
sp = RSTRING_PTR(str);
@@ -3259,9 +3257,10 @@ str_gsub(int argc, VALUE *argv, VALUE str, int bang)
n++;
match = rb_backref_get();
regs = RMATCH_REGS(match);
+ beg0 = BEG(0);
+ end0 = END(0);
if (iter || !NIL_P(hash)) {
if (iter) {
- rb_match_busy(match);
val = rb_obj_as_string(rb_yield(rb_reg_nth_match(0, match)));
}
else {
@@ -3273,7 +3272,6 @@ str_gsub(int argc, VALUE *argv, VALUE str, int bang)
if (val == dest) { /* paranoid check [ruby-dev:24827] */
rb_raise(rb_eRuntimeError, "block should not cheat");
}
- if (iter) rb_backref_set(match);
}
else {
val = rb_reg_regsub(repl, str, regs, pat);
@@ -3288,16 +3286,17 @@ str_gsub(int argc, VALUE *argv, VALUE str, int bang)
rb_str_buf_append(dest, val);
- offset = END(0);
- if (BEG(0) == END(0)) {
+ last = offset;
+ offset = end0;
+ if (beg0 == end0) {
/*
* Always consume at least one character of the input string
* in order to prevent infinite loops.
*/
- if (RSTRING_LEN(str) <= END(0)) break;
- len = rb_enc_mbclen(RSTRING_PTR(str)+END(0), RSTRING_END(str), str_enc);
- rb_enc_str_buf_cat(dest, RSTRING_PTR(str)+END(0), len, str_enc);
- offset = END(0) + len;
+ if (RSTRING_LEN(str) <= end0) break;
+ len = rb_enc_mbclen(RSTRING_PTR(str)+end0, RSTRING_END(str), str_enc);
+ rb_enc_str_buf_cat(dest, RSTRING_PTR(str)+end0, len, str_enc);
+ offset = end0 + len;
}
cp = RSTRING_PTR(str) + offset;
if (offset > RSTRING_LEN(str)) break;
@@ -3306,7 +3305,7 @@ str_gsub(int argc, VALUE *argv, VALUE str, int bang)
if (RSTRING_LEN(str) > offset) {
rb_enc_str_buf_cat(dest, cp, RSTRING_LEN(str) - offset, str_enc);
}
- rb_backref_set(match);
+ rb_reg_search(pat, str, last, 0);
if (bang) {
rb_str_shared_replace(str, dest);
}