Rollup merge of #53521 - alexcrichton:optimize-lit-token, r=michaelwoerister

syntax: Optimize some literal parsing

Currently in the `wasm-bindgen` project we have a very large crate that's procedurally generated, `web-sys`. To generate this crate we parse all of a browser's WebIDL and then generate bindings for all of the APIs contained within. The resulting Rust file is 18MB large (wow!) and currently takes a very long time to compile in debug mode. On the nightly compiler a *debug* build takes 90s for the crate to finish.

I was curious what was taking so long, and upon investigating, a *massive* portion of the time was spent in the `lit_token` method of the compiler, primarily formatting strings via `format!`. Upon some more investigation it looks like `byte_str_lit` was allocating an error message once per byte, causing a very large number of allocations to happen for large literals, of which wasm-bindgen generates quite a few (some are MB large).

This commit fixes the issue by lazily allocating the error message, only doing so if the error message is actually needed (which should be never). As a result, the debug mode compilation time for our `web-sys` crate decreased from 90s to 20s, a very nice improvement! (Although we've still got some work to do.)
author: kennytm <kennytm@gmail.com> 2018-08-21 11:07:45 +0800
committer: kennytm <kennytm@gmail.com> 2018-08-21 17:51:52 +0800
commit: 445718084f481956382f65f2020418f6ebeabcde (patch)
tree: 629971d76bfcd3c7ae0de01cc11b35ef6c20cb82 /src/libsyntax/parse
parent: b5519db3236a94c1f090dcafaf38ef858ec33a26 (diff)
parent: 5bf2ad3018de1f5a94bed2685211f3694f94249c (diff)
download: rust-445718084f481956382f65f2020418f6ebeabcde.tar.gz
rust-445718084f481956382f65f2020418f6ebeabcde.zip
1 files changed, 4 insertions, 6 deletions
diff --git a/src/libsyntax/parse/mod.rs b/src/libsyntax/parse/mod.rs
index adf01197c6d..1136cda5ee3 100644
--- a/src/libsyntax/parse/mod.rs
+++ b/src/libsyntax/parse/mod.rs
@@ -533,7 +533,7 @@ fn byte_lit(lit: &str) -> (u8, usize) {
 fn byte_str_lit(lit: &str) -> Lrc<Vec<u8>> {
     let mut res = Vec::with_capacity(lit.len());
 
-    let error = |i| format!("lexer should have rejected {} at {}", lit, i);
+    let error = |i| panic!("lexer should have rejected {} at {}", lit, i);
 
     /// Eat everything up to a non-whitespace
     fn eat<I: Iterator<Item=(usize, u8)>>(it: &mut iter::Peekable<I>) {
@@ -552,12 +552,11 @@ fn byte_str_lit(lit: &str) -> Lrc<Vec<u8>> {
     loop {
         match chars.next() {
             Some((i, b'\\')) => {
-                let em = error(i);
-                match chars.peek().expect(&em).1 {
+                match chars.peek().unwrap_or_else(|| error(i)).1 {
                     b'\n' => eat(&mut chars),
                     b'\r' => {
                         chars.next();
-                        if chars.peek().expect(&em).1 != b'\n' {
+                        if chars.peek().unwrap_or_else(|| error(i)).1 != b'\n' {
                             panic!("lexer accepted bare CR");
                         }
                         eat(&mut chars);
@@ -574,8 +573,7 @@ fn byte_str_lit(lit: &str) -> Lrc<Vec<u8>> {
                 }
             },
             Some((i, b'\r')) => {
-                let em = error(i);
-                if chars.peek().expect(&em).1 != b'\n' {
+                if chars.peek().unwrap_or_else(|| error(i)).1 != b'\n' {
                     panic!("lexer accepted bare CR");
                 }
                 chars.next();
author	kennytm <kennytm@gmail.com>	2018-08-21 11:07:45 +0800
committer	kennytm <kennytm@gmail.com>	2018-08-21 17:51:52 +0800
commit	445718084f481956382f65f2020418f6ebeabcde (patch)
tree	629971d76bfcd3c7ae0de01cc11b35ef6c20cb82 /src/libsyntax/parse
parent	b5519db3236a94c1f090dcafaf38ef858ec33a26 (diff)
parent	5bf2ad3018de1f5a94bed2685211f3694f94249c (diff)
download	rust-445718084f481956382f65f2020418f6ebeabcde.tar.gz rust-445718084f481956382f65f2020418f6ebeabcde.zip