diff options
author | nobu <nobu@b2dd03c8-39d4-4d8f-98ff-823fe69b080e> | 2007-10-24 08:09:40 +0000 |
---|---|---|
committer | nobu <nobu@b2dd03c8-39d4-4d8f-98ff-823fe69b080e> | 2007-10-24 08:09:40 +0000 |
commit | 2070362f3303df4c854ad141b41c4d7895049bac (patch) | |
tree | b958c03bf714b0995a1c31892d616a7c65859b20 /parse.y | |
parent | 7989a0868d6a5231bfbed846eb84d99c7514939a (diff) | |
download | ruby-2070362f3303df4c854ad141b41c4d7895049bac.tar.gz |
* parse.y (parser_tokspace): make space in token buffer.
* parse.y (parser_yylex): fix encoding of single character literal.
git-svn-id: svn+ssh://ci.ruby-lang.org/ruby/trunk@13766 b2dd03c8-39d4-4d8f-98ff-823fe69b080e
Diffstat (limited to 'parse.y')
-rw-r--r-- | parse.y | 30 |
1 files changed, 23 insertions, 7 deletions
@@ -4494,6 +4494,7 @@ static int parser_here_document(struct parser_params*,NODE*);
 # define nextc() parser_nextc(parser)
 # define pushback(c) parser_pushback(parser, c)
 # define newtok() parser_newtok(parser)
+# define tokspace(n) parser_tokspace(parser, n)
 # define tokadd(c) parser_tokadd(parser, c)
 # define read_escape(m) parser_read_escape(parser, m)
 # define tokadd_escape(t,m) parser_tokadd_escape(parser, t, m)
@@ -4913,6 +4914,18 @@ parser_newtok(struct parser_params *parser)
     return tokenbuf;
 }
 
+static char *
+parser_tokspace(struct parser_params *parser, int n)
+{
+    int idx = tokidx + n;
+
+    if (idx >= toksiz) {
+        do {toksiz *= 2;} while (toksiz < idx);
+        REALLOC_N(tokenbuf, char, toksiz);
+    }
+    return &tokenbuf[tokidx];
+}
+
 static void
 parser_tokadd(struct parser_params *parser, int c)
 {
@@ -6086,21 +6099,24 @@ parser_yylex(struct parser_params *parser)
             }
             newtok();
             if (parser_ismbchar()) {
+                mb = ENC_CODERANGE_MULTI;
                 tokadd_mbchar(c);
             }
             else if ((rb_enc_isalnum(c, parser->enc) || c == '_') &&
                      lex_p < lex_pend && is_identchar(lex_p, lex_pend, parser->enc)) {
                 goto ternary;
             }
-            else if (c == '\\') {
-                c = read_escape(0);
-                tokadd(c);
+            else if (c == '\\' && (c = read_escape(0)) >= 0x80) {
+                rb_encoding *enc = parser->enc;
+                mb = ENC_CODERANGE_UNKNOWN;
+                rb_enc_mbcput(c, tokspace(rb_enc_codelen(c, enc)), enc);
             }
             else {
+                mb = ENC_CODERANGE_SINGLE;
                 tokadd(c);
             }
             tokfix();
-            set_yylval_str(STR_NEW(tok(), toklen()));
+            set_yylval_str(STR_NEW3(tok(), toklen(), mb));
             lex_state = EXPR_ENDARG;
             return tCHAR;
 
@@ -6865,9 +6881,9 @@ parser_yylex(struct parser_params *parser)
             break;
         }
 
-        mb = 0;
+        mb = ENC_CODERANGE_SINGLE;
         do {
-            if (!ISASCII(c)) mb = 1;
+            if (!ISASCII(c)) mb = ENC_CODERANGE_UNKNOWN;
             tokadd_mbchar(c);
             c = nextc();
         } while (parser_is_identchar());
@@ -6920,7 +6936,7 @@ parser_yylex(struct parser_params *parser)
                 }
             }
 
-            if (!mb && lex_state != EXPR_DOT) {
+            if (mb == ENC_CODERANGE_SINGLE && lex_state != EXPR_DOT) {
                 const struct kwtable *kw;
 
                 /* See if it is a reserved word. */