summaryrefslogtreecommitdiff
path: root/parse.y
diff options
context:
space:
mode:
authorcharliesome <charliesome@b2dd03c8-39d4-4d8f-98ff-823fe69b080e>2013-09-02 07:11:41 +0000
committercharliesome <charliesome@b2dd03c8-39d4-4d8f-98ff-823fe69b080e>2013-09-02 07:11:41 +0000
commita056098cb719312452eca309bec914406f9e5ca3 (patch)
tree36680bbcdabc53cd0a4132996d2b8984eaaa945d /parse.y
parent78c75d91ae577df2c43ba5b41891572d75105b2d (diff)
* NEWS: Add note about frozen string literals
* compile.c (case_when_optimizable_literal): optimize NODE_LIT strings in when clauses of case statements * ext/ripper/eventids2.c: add tSTRING_SUFFIX * parse.y: add 'f' suffix on string literals for frozen strings * test/ripper/test_scanner_events.rb: add scanner tests * test/ruby/test_string.rb: add frozen string tests [Feature #8579] [ruby-core:55699] git-svn-id: svn+ssh://ci.ruby-lang.org/ruby/trunk@42773 b2dd03c8-39d4-4d8f-98ff-823fe69b080e
Diffstat (limited to 'parse.y')
-rw-r--r--parse.y107
1 files changed, 99 insertions, 8 deletions
diff --git a/parse.y b/parse.y
index 496e37b9d4..31ed7598e6 100644
--- a/parse.y
+++ b/parse.y
@@ -400,6 +400,8 @@ static NODE *new_evstr_gen(struct parser_params*,NODE*);
#define new_evstr(n) new_evstr_gen(parser,(n))
static NODE *evstr2dstr_gen(struct parser_params*,NODE*);
#define evstr2dstr(n) evstr2dstr_gen(parser,(n))
+static NODE *str_suffix_gen(struct parser_params*, NODE*, long);
+#define str_suffix(n,o) str_suffix_gen(parser,(n),(o))
static NODE *splat_array(NODE*);
static NODE *call_bin_op_gen(struct parser_params*,NODE*,ID,NODE*);
@@ -531,6 +533,9 @@ static int lvar_defined_gen(struct parser_params*, ID);
#define RE_OPTION_MASK 0xff
#define RE_OPTION_ARG_ENCODING_NONE 32
+#define STR_OPTION_FROZEN 1
+#define STR_OPTION_BINARY 0 /* disabled */
+
#define NODE_STRTERM NODE_ZARRAY /* nothing to gc */
#define NODE_HEREDOC NODE_ARRAY /* 1, 3 to gc */
#define SIGN_EXTEND(x,n) (((1<<(n)-1)^((x)&~(~0<<(n))))-(1<<(n)-1))
@@ -758,7 +763,7 @@ static void token_info_pop(struct parser_params*, const char *token);
%token <id> tIDENTIFIER tFID tGVAR tIVAR tCONSTANT tCVAR tLABEL
%token <node> tINTEGER tFLOAT tRATIONAL tIMAGINARY tSTRING_CONTENT tCHAR
%token <node> tNTH_REF tBACK_REF
-%token <num> tREGEXP_END
+%token <num> tREGEXP_END tSTRING_SUFFIX
%type <node> singleton strings string string1 xstring regexp
%type <node> string_contents xstring_contents regexp_contents string_content
@@ -784,6 +789,7 @@ static void token_info_pop(struct parser_params*, const char *token);
%type <id> fsym keyword_variable user_variable sym symbol operation operation2 operation3
%type <id> cname fname op f_rest_arg f_block_arg opt_f_block_arg f_norm_arg f_bad_arg
%type <id> f_kwrest f_label
+%type <num> opt_string_sfx
/*%%%*/
/*%
%type <val> program reswords then do dot_or_colon
@@ -3806,7 +3812,7 @@ literal : numeric
| dsym
;
-strings : string
+strings : string opt_string_sfx
{
/*%%%*/
NODE *node = $1;
@@ -3816,6 +3822,7 @@ strings : string
else {
node = evstr2dstr(node);
}
+ node = str_suffix(node, $2);
$$ = node;
/*%
$$ = $1;
@@ -3845,6 +3852,10 @@ string1 : tSTRING_BEG string_contents tSTRING_END
}
;
+opt_string_sfx : tSTRING_SUFFIX
+ | /* none */ {$$ = 0;}
+ ;
+
xstring : tXSTRING_BEG xstring_contents tSTRING_END
{
/*%%%*/
@@ -5008,6 +5019,7 @@ none : /* none */
# define yylval (*((YYSTYPE*)(parser->parser_yylval)))
static int parser_regx_options(struct parser_params*);
+static int parser_str_options(struct parser_params*);
static int parser_tokadd_string(struct parser_params*,int,int,int,long*,rb_encoding**);
static void parser_tokaddmbc(struct parser_params *parser, int c, rb_encoding *enc);
static int parser_parse_string(struct parser_params*,NODE*);
@@ -5023,6 +5035,7 @@ static int parser_here_document(struct parser_params*,NODE*);
# define read_escape(flags,e) parser_read_escape(parser, (flags), (e))
# define tokadd_escape(e) parser_tokadd_escape(parser, (e))
# define regx_options() parser_regx_options(parser)
+# define str_options() parser_str_options(parser)
# define tokadd_string(f,t,p,n,e) parser_tokadd_string(parser,(f),(t),(p),(n),(e))
# define parse_string(n) parser_parse_string(parser,(n))
# define tokaddmbc(c, enc) parser_tokaddmbc(parser, (c), (enc))
@@ -5532,10 +5545,11 @@ rb_parser_compile_file_path(volatile VALUE vparser, VALUE fname, VALUE file, int
#define STR_FUNC_QWORDS 0x08
#define STR_FUNC_SYMBOL 0x10
#define STR_FUNC_INDENT 0x20
+#define STR_FUNC_OPTION 0x40
enum string_type {
- str_squote = (0),
- str_dquote = (STR_FUNC_EXPAND),
+ str_squote = (STR_FUNC_OPTION),
+ str_dquote = (STR_FUNC_EXPAND|STR_FUNC_OPTION),
str_xquote = (STR_FUNC_EXPAND),
str_regexp = (STR_FUNC_REGEXP|STR_FUNC_ESCAPE|STR_FUNC_EXPAND),
str_sword = (STR_FUNC_QWORDS),
@@ -5982,6 +5996,40 @@ parser_regx_options(struct parser_params *parser)
return options | RE_OPTION_ENCODING(kcode);
}
+static int
+parser_str_options(struct parser_params *parser)
+{
+ int c, options = 0;
+
+ newtok();
+ while (c = nextc(), ISALPHA(c)) {
+ switch (c) {
+#if STR_OPTION_FROZEN
+ case 'f':
+ options |= STR_OPTION_FROZEN;
+ break;
+#endif
+#if STR_OPTION_BINARY
+ case 'b':
+ options |= STR_OPTION_BINARY;
+ break;
+#endif
+ default:
+ tokadd(c);
+ break;
+ }
+ }
+ pushback(c);
+
+ if (toklen()) {
+ tokfix();
+ compile_error(PARSER_ARG "unknown string option%s - %s",
+ toklen() > 1 ? "s" : "", tok());
+ }
+
+ return options;
+}
+
static void
dispose_string(VALUE str)
{
@@ -6248,6 +6296,10 @@ parser_parse_string(struct parser_params *parser, NODE *quote)
rb_encoding *enc = current_enc;
if (func == -1) return tSTRING_END;
+ if (func == 0) {
+ set_yylval_num(term);
+ return tSTRING_SUFFIX;
+ }
c = nextc();
if ((func & STR_FUNC_QWORDS) && ISSPACE(c)) {
do {c = nextc();} while (ISSPACE(c));
@@ -6256,11 +6308,18 @@ parser_parse_string(struct parser_params *parser, NODE *quote)
if (c == term && !quote->nd_nest) {
if (func & STR_FUNC_QWORDS) {
quote->nd_func = -1;
+ quote->u2.id = 0;
return ' ';
}
- if (!(func & STR_FUNC_REGEXP)) return tSTRING_END;
- set_yylval_num(regx_options());
- return tREGEXP_END;
+ if (func & STR_FUNC_REGEXP) {
+ set_yylval_num(regx_options());
+ return tREGEXP_END;
+ }
+ if ((func & STR_FUNC_OPTION) && (func = str_options()) != 0) {
+ quote->nd_func = 0;
+ quote->u2.id = func;
+ }
+ return tSTRING_END;
}
if (space) {
pushback(c);
@@ -6948,7 +7007,8 @@ parser_yylex(struct parser_params *parser)
}
else {
token = parse_string(lex_strterm);
- if (token == tSTRING_END || token == tREGEXP_END) {
+ if ((token == tSTRING_END && lex_strterm->nd_func) ||
+ token == tSTRING_SUFFIX || token == tREGEXP_END) {
rb_gc_force_recycle((VALUE)lex_strterm);
lex_strterm = 0;
lex_state = EXPR_END;
@@ -8498,6 +8558,37 @@ evstr2dstr_gen(struct parser_params *parser, NODE *node)
}
static NODE *
+str_suffix_gen(struct parser_params *parser, NODE *node, long opt)
+{
+ if (nd_type(node) == NODE_STR) {
+#if STR_OPTION_BINARY
+ if (opt & STR_OPTION_BINARY) {
+ rb_enc_associate_index(node->nd_lit, ENCINDEX_ASCII);
+ }
+#endif
+#if STR_OPTION_FROZEN
+ if (opt & STR_OPTION_FROZEN) {
+ OBJ_FREEZE(node->nd_lit);
+ nd_set_type(node, NODE_LIT);
+ }
+#endif
+ }
+ else {
+#if STR_OPTION_BINARY
+ if (opt & STR_OPTION_BINARY) {
+ node = NEW_CALL(node, rb_intern("b"), 0);
+ }
+#endif
+#if STR_OPTION_FROZEN
+ if (opt & STR_OPTION_FROZEN) {
+ node = NEW_CALL(node, rb_intern("freeze"), 0);
+ }
+#endif
+ }
+ return node;
+}
+
+static NODE *
new_evstr_gen(struct parser_params *parser, NODE *node)
{
NODE *head = node;