diff --git a/ntex-bytes/CHANGELOG.md b/ntex-bytes/CHANGELOG.md index f66d945d..97744292 100644 --- a/ntex-bytes/CHANGELOG.md +++ b/ntex-bytes/CHANGELOG.md @@ -1,5 +1,9 @@ # Changes +## [0.1.9] (2022-01-10) + +* Add optional simd utf8 validation + ## [0.1.8] (2021-12-18) * Remove futures patch dependency diff --git a/ntex-bytes/Cargo.toml b/ntex-bytes/Cargo.toml index 21a23eed..0c5185af 100644 --- a/ntex-bytes/Cargo.toml +++ b/ntex-bytes/Cargo.toml @@ -1,6 +1,6 @@ [package] name = "ntex-bytes" -version = "0.1.8" +version = "0.1.9" license = "MIT" authors = ["Nikolay Kim ", "Carl Lerche "] description = "Types and traits for working with bytes (bytes crate fork)" @@ -11,13 +11,20 @@ keywords = ["buffers", "zero-copy", "io"] categories = ["network-programming", "data-structures"] edition = "2018" +[features] +default = [] + +# simd utf8 check support +simd = ["simdutf8"] + [dependencies] bitflags = "1.3" bytes = "1.0.0" serde = "1.0.0" futures-core = { version = "0.3", default-features = false, features = ["alloc"] } +simdutf8 = { version = "0.1.3", optional = true } [dev-dependencies] serde_test = "1.0" serde_json = "1.0" -ntex = "0.5.0-b.0" +ntex = "0.5.0" diff --git a/ntex-bytes/src/string.rs b/ntex-bytes/src/string.rs index 71da803d..56cd8fc2 100644 --- a/ntex-bytes/src/string.rs +++ b/ntex-bytes/src/string.rs @@ -179,7 +179,7 @@ impl ops::Deref for ByteString { fn deref(&self) -> &str { let bytes = self.0.as_ref(); // SAFETY: - // UTF-8 validity is guaranteed at during construction. + // UTF-8 validity is guaranteed during construction. unsafe { str::from_utf8_unchecked(bytes) } } } @@ -213,42 +213,54 @@ impl<'a> From> for ByteString { } impl TryFrom<&[u8]> for ByteString { - type Error = str::Utf8Error; + type Error = (); #[inline] fn try_from(value: &[u8]) -> Result { - let _ = str::from_utf8(value)?; - Ok(ByteString(Bytes::copy_from_slice(value))) + if utf8::is_valid(&value) { + Ok(ByteString(Bytes::copy_from_slice(value))) + } else { + Err(()) + } } } impl TryFrom> for ByteString { - type Error = str::Utf8Error; + type Error = (); #[inline] fn try_from(value: Vec) -> Result { - let buf = String::from_utf8(value).map_err(|err| err.utf8_error())?; - Ok(ByteString(Bytes::from(buf))) + if utf8::is_valid(&value) { + Ok(ByteString(Bytes::from(value))) + } else { + Err(()) + } } } impl TryFrom for ByteString { - type Error = str::Utf8Error; + type Error = (); #[inline] fn try_from(value: Bytes) -> Result { - let _ = str::from_utf8(value.as_ref())?; - Ok(ByteString(value)) + if utf8::is_valid(&value) { + Ok(ByteString(value)) + } else { + Err(()) + } } } impl TryFrom for ByteString { - type Error = str::Utf8Error; + type Error = (); #[inline] fn try_from(value: crate::BytesMut) -> Result { - let _ = str::from_utf8(&value)?; - Ok(ByteString(value.freeze())) + if utf8::is_valid(&value) { + Ok(ByteString(value.freeze())) + } else { + Err(()) + } } } @@ -291,6 +303,20 @@ mod serde { } } +#[cfg(feature = "simd")] +mod utf8 { + pub(super) fn is_valid(input: &[u8]) -> bool { + simdutf8::basic::from_utf8(input).is_ok() + } +} + +#[cfg(not(feature = "simd"))] +mod utf8 { + pub(super) fn is_valid(input: &[u8]) -> bool { + std::str::from_utf8(input).is_ok() + } +} + #[cfg(test)] mod test { use std::borrow::ToOwned; diff --git a/ntex-codec/Cargo.toml b/ntex-codec/Cargo.toml index 13e835a1..93e62288 100644 --- a/ntex-codec/Cargo.toml +++ b/ntex-codec/Cargo.toml @@ -16,4 +16,4 @@ name = "ntex_codec" path = "src/lib.rs" [dependencies] -ntex-bytes = "0.1" +ntex-bytes = "0.1.9" diff --git a/ntex-io/Cargo.toml b/ntex-io/Cargo.toml index 4d0a3ade..896bd276 100644 --- a/ntex-io/Cargo.toml +++ b/ntex-io/Cargo.toml @@ -17,7 +17,7 @@ path = "src/lib.rs" [dependencies] ntex-codec = "0.6.0" -ntex-bytes = "0.1.8" +ntex-bytes = "0.1.9" ntex-util = "0.1.8" ntex-service = "0.3.1" diff --git a/ntex-router/Cargo.toml b/ntex-router/Cargo.toml index 17bd290f..3b7e32ba 100644 --- a/ntex-router/Cargo.toml +++ b/ntex-router/Cargo.toml @@ -18,7 +18,7 @@ default = ["http"] [dependencies] serde = "1.0" -ntex-bytes = "0.1" +ntex-bytes = "0.1.9" log = "0.4" http = { version = "0.2", optional = true } regex = { version = "1.5.4", default-features = false, features = ["std"] } diff --git a/ntex-tls/Cargo.toml b/ntex-tls/Cargo.toml index adc48078..65d12546 100644 --- a/ntex-tls/Cargo.toml +++ b/ntex-tls/Cargo.toml @@ -25,7 +25,7 @@ openssl = ["tls_openssl"] rustls = ["tls_rust"] [dependencies] -ntex-bytes = "0.1.8" +ntex-bytes = "0.1.9" ntex-io = "0.1.2" ntex-util = "0.1.8" ntex-service = "0.3.1" diff --git a/ntex-tokio/Cargo.toml b/ntex-tokio/Cargo.toml index 4c590d20..61afdfd0 100644 --- a/ntex-tokio/Cargo.toml +++ b/ntex-tokio/Cargo.toml @@ -16,9 +16,9 @@ name = "ntex_tokio" path = "src/lib.rs" [dependencies] -ntex-bytes = "0.1.8" -ntex-io = "0.1.0" -ntex-util = "0.1.6" +ntex-bytes = "0.1.9" +ntex-io = "0.1.1" +ntex-util = "0.1.8" log = "0.4" pin-project-lite = "0.2" tokio = { version = "1", default-features = false, features = ["rt", "net", "sync", "signal"] } diff --git a/ntex/Cargo.toml b/ntex/Cargo.toml index e6b28723..6426b6f1 100644 --- a/ntex/Cargo.toml +++ b/ntex/Cargo.toml @@ -50,7 +50,7 @@ ntex-router = "0.5.1" ntex-service = "0.3.1" ntex-macros = "0.1.3" ntex-util = "0.1.8" -ntex-bytes = "0.1.8" +ntex-bytes = "0.1.9" ntex-tls = "0.1.1" ntex-rt = "0.4.1" ntex-io = "0.1.2"