diff options
| author | Andrea Canciani <ranma42@gmail.com> | 2019-12-24 12:47:51 +0100 |
|---|---|---|
| committer | Andrea Canciani <ranma42@gmail.com> | 2020-02-11 10:22:47 +0100 |
| commit | 4e7aeaf1b52ee66ede1adb104fcd08b0463eb0f9 (patch) | |
| tree | 63714665d664085780edc48352ec4ee60a9e881a /src/libcore/char | |
| parent | dc4242d9052a42cdf329c3a2430d02a3b3d415cb (diff) | |
| download | rust-4e7aeaf1b52ee66ede1adb104fcd08b0463eb0f9.tar.gz rust-4e7aeaf1b52ee66ede1adb104fcd08b0463eb0f9.zip | |
Improve `char::is_ascii_*` code
These methods explicitly check whether a `char` falls within a specific ASCII range, so the preceding `is_ascii()` check is redundant; however, LLVM seems to be unable to remove it on its own. WARNING: this change improves performance on ASCII `char`s, but complex checks such as `is_ascii_punctuation` become slower on non-ASCII `char`s.
Diffstat (limited to 'src/libcore/char')
| -rw-r--r-- | src/libcore/char/methods.rs | 50 |
1 files changed, 40 insertions, 10 deletions
diff --git a/src/libcore/char/methods.rs b/src/libcore/char/methods.rs index 2b52c48cb90..302400744e2 100644 --- a/src/libcore/char/methods.rs +++ b/src/libcore/char/methods.rs @@ -1075,7 +1075,10 @@ impl char { #[rustc_const_unstable(feature = "const_ascii_ctype_on_intrinsics", issue = "68983")] #[inline] pub const fn is_ascii_alphabetic(&self) -> bool { - self.is_ascii() && (*self as u8).is_ascii_alphabetic() + match *self { + 'A'..='Z' | 'a'..='z' => true, + _ => false, + } } /// Checks if the value is an ASCII uppercase character: @@ -1108,7 +1111,10 @@ impl char { #[rustc_const_unstable(feature = "const_ascii_ctype_on_intrinsics", issue = "68983")] #[inline] pub const fn is_ascii_uppercase(&self) -> bool { - self.is_ascii() && (*self as u8).is_ascii_uppercase() + match *self { + 'A'..='Z' => true, + _ => false, + } } /// Checks if the value is an ASCII lowercase character: @@ -1141,7 +1147,10 @@ impl char { #[rustc_const_unstable(feature = "const_ascii_ctype_on_intrinsics", issue = "68983")] #[inline] pub const fn is_ascii_lowercase(&self) -> bool { - self.is_ascii() && (*self as u8).is_ascii_lowercase() + match *self { + 'a'..='z' => true, + _ => false, + } } /// Checks if the value is an ASCII alphanumeric character: @@ -1177,7 +1186,10 @@ impl char { #[rustc_const_unstable(feature = "const_ascii_ctype_on_intrinsics", issue = "68983")] #[inline] pub const fn is_ascii_alphanumeric(&self) -> bool { - self.is_ascii() && (*self as u8).is_ascii_alphanumeric() + match *self { + '0'..='9' | 'A'..='Z' | 'a'..='z' => true, + _ => false, + } } /// Checks if the value is an ASCII decimal digit: @@ -1210,7 +1222,10 @@ impl char { #[rustc_const_unstable(feature = "const_ascii_ctype_on_intrinsics", issue = "68983")] #[inline] pub const fn is_ascii_digit(&self) -> bool { - self.is_ascii() && (*self as u8).is_ascii_digit() + match *self { + '0'..='9' => true, + _ => false, + } } /// Checks if the value is an ASCII hexadecimal digit: @@ -1246,7 +1261,10 @@ impl char { 
#[rustc_const_unstable(feature = "const_ascii_ctype_on_intrinsics", issue = "68983")] #[inline] pub const fn is_ascii_hexdigit(&self) -> bool { - self.is_ascii() && (*self as u8).is_ascii_hexdigit() + match *self { + '0'..='9' | 'A'..='F' | 'a'..='f' => true, + _ => false, + } } /// Checks if the value is an ASCII punctuation character: @@ -1283,7 +1301,10 @@ impl char { #[rustc_const_unstable(feature = "const_ascii_ctype_on_intrinsics", issue = "68983")] #[inline] pub const fn is_ascii_punctuation(&self) -> bool { - self.is_ascii() && (*self as u8).is_ascii_punctuation() + match *self { + '!'..='/' | ':'..='@' | '['..='`' | '{'..='~' => true, + _ => false, + } } /// Checks if the value is an ASCII graphic character: @@ -1316,7 +1337,10 @@ impl char { #[rustc_const_unstable(feature = "const_ascii_ctype_on_intrinsics", issue = "68983")] #[inline] pub const fn is_ascii_graphic(&self) -> bool { - self.is_ascii() && (*self as u8).is_ascii_graphic() + match *self { + '!'..='~' => true, + _ => false, + } } /// Checks if the value is an ASCII whitespace character: @@ -1366,7 +1390,10 @@ impl char { #[rustc_const_unstable(feature = "const_ascii_ctype_on_intrinsics", issue = "68983")] #[inline] pub const fn is_ascii_whitespace(&self) -> bool { - self.is_ascii() && (*self as u8).is_ascii_whitespace() + match *self { + '\t' | '\n' | '\x0C' | '\r' | ' ' => true, + _ => false, + } } /// Checks if the value is an ASCII control character: @@ -1401,6 +1428,9 @@ impl char { #[rustc_const_unstable(feature = "const_ascii_ctype_on_intrinsics", issue = "68983")] #[inline] pub const fn is_ascii_control(&self) -> bool { - self.is_ascii() && (*self as u8).is_ascii_control() + match *self { + '\0'..='\x1F' | '\x7F' => true, + _ => false, + } } } |
