Byte/raw binary literal fixes

2014-07-14 20:45:39 -07:00 · 2014-07-14 20:45:39 -07:00 · f8fd32ef9d
commit f8fd32ef9d
parent 9fc5cf902f
3 changed files with 24 additions and 4 deletions
--- a/src/grammar/.gitignore
+++ b/src/grammar/.gitignore
@ -0,0 +1,4 @@
 verify
 *.class
 *.java
 *.tokens
--- a/src/grammar/RustLexer.g4
+++ b/src/grammar/RustLexer.g4
@ -44,6 +44,7 @@ SHR     : '>>' ;
 BINOP
    : PLUS
    | SLASH
    | MINUS
    | STAR
    | PERCENT
@ -95,6 +96,10 @@ LIT_CHAR
  : '\'' ( '\\' CHAR_ESCAPE | ~[\\'\n\t\r] ) '\''
  ;
 // A byte literal: b'…' holding exactly one item, which is either
 //   - a backslash escape: \x or \X followed by two HEXITs, or one of
 //     n r t \ ' " 0; or
 //   - any single character other than backslash, single quote, newline,
 //     tab, or carriage return.
 LIT_BYTE
  : 'b\'' ( '\\' ( [xX] HEXIT HEXIT | [nrt\\'"0] ) | ~[\\'\n\t\r] ) '\''
  ;
 fragment INT_SUFFIX
  : 'i'
  | 'i8'
@ -130,7 +135,7 @@ LIT_STR
  ;
 LIT_BINARY : 'b' LIT_STR ;
-LIT_BINARY_RAW : 'b' LIT_STR_RAW ;
+LIT_BINARY_RAW : 'rb' LIT_STR_RAW ;
 /* this is a bit messy */
@ -159,7 +164,7 @@ OUTER_DOC_COMMENT : '//!' ~[\r\n]* -> type(DOC_COMMENT) ;
 // A `//` line comment: consumes everything up to (not including) the next
 // CR or LF and is emitted with token type COMMENT.
 LINE_COMMENT      : '//' ~[\r\n]* -> type(COMMENT) ;
 DOC_BLOCK_COMMENT
-  : ('/**' | '/*!') (DOC_BLOCK_COMMENT | .)*? '*/' -> type(DOC_COMMENT)
+  : ('/**' ~[*] | '/*!') (DOC_BLOCK_COMMENT | .)*? '*/' -> type(DOC_COMMENT)
  ;
 // A `/* … */` block comment. The body is matched non-greedily and may contain
 // nested block comments (the rule refers to itself); the result is emitted
 // with token type COMMENT.
 BLOCK_COMMENT : '/*' (BLOCK_COMMENT | .)*? '*/' -> type(COMMENT) ;
--- a/src/grammar/verify.rs
+++ b/src/grammar/verify.rs
@ -71,6 +71,7 @@ fn parse_token_list(file: &str) -> HashMap<String, Token> {
            "IDENT" => id(),
            "PLUS" => BINOP(PLUS),
            "LIT_CHAR" => LIT_CHAR(Name(0)),
            "LIT_BYTE" => LIT_BYTE(Name(0)),
            "EQ" => EQ,
            "RBRACKET" => RBRACKET,
            "COMMENT" => COMMENT,
@ -124,7 +125,7 @@ fn str_to_binop(s: &str) -> BinOp {
    }
 }
-/// Assuming a raw string/binary literal, strip out the leading/trailing
+/// Assuming a string/binary literal, strip out the leading/trailing
 /// hashes and surrounding quotes/raw/binary prefix.
 fn fix(mut lit: &str) -> ast::Name {
    if lit.char_at(0) == 'r' {
@ -143,6 +144,15 @@ fn fix(mut lit: &str) -> ast::Name {
    parse::token::intern(lit.slice(leading_hashes + 1, lit.len() - leading_hashes - 1))
 }
 /// Assuming a char/byte literal, strip the 'b' prefix and the single quotes.
 ///
 /// A leading `b` is dropped when present; the text between the first and last
 /// remaining positions is then interned and returned as a name.
 fn fixchar(mut lit: &str) -> ast::Name {
    // Byte literals carry a `b` prefix; plain char literals do not.
    if lit.char_at(0) == 'b' {
        lit = lit.slice_from(1);
    }
    // Drop the first and last position of what remains (the surrounding quotes).
    parse::token::intern(lit.slice(1, lit.len() - 1))
 }
 /// Count the consecutive `#` characters at the very start of `lit`.
 ///
 /// NOTE(review): counting stops at the first character that is not `#`, so a
 /// literal that still carries a leading `r`/`b` prefix yields 0 -- confirm
 /// that callers pass text with the prefix already removed.
 fn count(lit: &str) -> uint {
    lit.chars().take_while(|c| *c == '#').count()
 }
@ -167,7 +177,8 @@ fn parse_antlr_token(s: &str, tokens: &HashMap<String, Token>) -> TokenAndSpan {
        BINOPEQ(..) => BINOPEQ(str_to_binop(content.slice_to(content.len() - 1))),
        LIT_STR(..) => LIT_STR(fix(content)),
        LIT_STR_RAW(..) => LIT_STR_RAW(fix(content), count(content)),
-        LIT_CHAR(..) => LIT_CHAR(nm),
+        LIT_CHAR(..) => LIT_CHAR(fixchar(content)),
        LIT_BYTE(..) => LIT_BYTE(fixchar(content)),
        DOC_COMMENT(..) => DOC_COMMENT(nm),
        LIT_INTEGER(..) => LIT_INTEGER(nm),
        LIT_FLOAT(..) => LIT_FLOAT(nm),