summary | refs | log | tree | commit | diff
path: root/parse.y
diff options
context:
space:
mode:
author nobu <nobu@b2dd03c8-39d4-4d8f-98ff-823fe69b080e> 2007-10-24 08:09:40 +0000
committer nobu <nobu@b2dd03c8-39d4-4d8f-98ff-823fe69b080e> 2007-10-24 08:09:40 +0000
commit 2070362f3303df4c854ad141b41c4d7895049bac (patch)
tree b958c03bf714b0995a1c31892d616a7c65859b20 /parse.y
parent 7989a0868d6a5231bfbed846eb84d99c7514939a (diff)
* parse.y (parser_tokspace): make space in token buffer.
* parse.y (parser_yylex): fix encoding of single character literal.

git-svn-id: svn+ssh://ci.ruby-lang.org/ruby/trunk@13766 b2dd03c8-39d4-4d8f-98ff-823fe69b080e
Diffstat (limited to 'parse.y')
-rw-r--r-- parse.y 30
1 files changed, 23 insertions, 7 deletions
diff --git a/parse.y b/parse.y
index 8a46f2d71d..3182ceee0e 100644
--- a/parse.y
+++ b/parse.y
@@ -4494,6 +4494,7 @@ static int parser_here_document(struct parser_params*,NODE*);
# define nextc() parser_nextc(parser)
# define pushback(c) parser_pushback(parser, c)
# define newtok() parser_newtok(parser)
+# define tokspace(n) parser_tokspace(parser, n)
# define tokadd(c) parser_tokadd(parser, c)
# define read_escape(m) parser_read_escape(parser, m)
# define tokadd_escape(t,m) parser_tokadd_escape(parser, t, m)
@@ -4913,6 +4914,18 @@ parser_newtok(struct parser_params *parser)
return tokenbuf;
}
+/* Reserve n bytes at the end of the token buffer (growing it if needed) and return their start. */
+static char *
+parser_tokspace(struct parser_params *parser, int n)
+{
+    tokidx += n;    /* tokidx now points past the reserved bytes; the caller fills them in */
+    if (tokidx >= toksiz) {
+        do {toksiz *= 2;} while (toksiz <= tokidx);    /* double until tokidx < toksiz holds again */
+        REALLOC_N(tokenbuf, char, toksiz);
+    }
+    return &tokenbuf[tokidx - n];    /* first reserved byte, taken after any reallocation */
+}
+
static void
parser_tokadd(struct parser_params *parser, int c)
{
@@ -6086,21 +6099,24 @@ parser_yylex(struct parser_params *parser)
}
newtok();
if (parser_ismbchar()) {
+ mb = ENC_CODERANGE_MULTI;
tokadd_mbchar(c);
}
else if ((rb_enc_isalnum(c, parser->enc) || c == '_') &&
lex_p < lex_pend && is_identchar(lex_p, lex_pend, parser->enc)) {
goto ternary;
}
- else if (c == '\\') {
- c = read_escape(0);
- tokadd(c);
+ else if (c == '\\' && (c = read_escape(0)) >= 0x80) {
+ rb_encoding *enc = parser->enc;
+ mb = ENC_CODERANGE_UNKNOWN;
+ rb_enc_mbcput(c, tokspace(rb_enc_codelen(c, enc)), enc);
}
else {
+ mb = ENC_CODERANGE_SINGLE;
tokadd(c);
}
tokfix();
- set_yylval_str(STR_NEW(tok(), toklen()));
+ set_yylval_str(STR_NEW3(tok(), toklen(), mb));
lex_state = EXPR_ENDARG;
return tCHAR;
@@ -6865,9 +6881,9 @@ parser_yylex(struct parser_params *parser)
break;
}
- mb = 0;
+ mb = ENC_CODERANGE_SINGLE;
do {
- if (!ISASCII(c)) mb = 1;
+ if (!ISASCII(c)) mb = ENC_CODERANGE_UNKNOWN;
tokadd_mbchar(c);
c = nextc();
} while (parser_is_identchar());
@@ -6920,7 +6936,7 @@ parser_yylex(struct parser_params *parser)
}
}
- if (!mb && lex_state != EXPR_DOT) {
+ if (mb == ENC_CODERANGE_SINGLE && lex_state != EXPR_DOT) {
const struct kwtable *kw;
/* See if it is a reserved word. */