| 1 | use std::convert::TryFrom; |
| 2 | use std::str::FromStr; |
| 3 | use std::{cmp, fmt, hash, str}; |
| 4 | |
| 5 | use bytes::Bytes; |
| 6 | |
| 7 | use super::{ErrorKind, InvalidUri}; |
| 8 | use crate::byte_str::ByteStr; |
| 9 | |
| 10 | /// Represents the path component of a URI |
| 11 | #[derive(Clone)] |
| 12 | pub struct PathAndQuery { |
| 13 | pub(super) data: ByteStr, |
| 14 | pub(super) query: u16, |
| 15 | } |
| 16 | |
| 17 | const NONE: u16 = ::std::u16::MAX; |
| 18 | |
| 19 | impl PathAndQuery { |
| 20 | // Not public while `bytes` is unstable. |
| 21 | pub(super) fn from_shared(mut src: Bytes) -> Result<Self, InvalidUri> { |
| 22 | let mut query = NONE; |
| 23 | let mut fragment = None; |
| 24 | |
| 25 | // block for iterator borrow |
| 26 | { |
| 27 | let mut iter = src.as_ref().iter().enumerate(); |
| 28 | |
| 29 | // path ... |
| 30 | for (i, &b) in &mut iter { |
| 31 | // See https://url.spec.whatwg.org/#path-state |
| 32 | match b { |
| 33 | b'?' => { |
| 34 | debug_assert_eq!(query, NONE); |
| 35 | query = i as u16; |
| 36 | break; |
| 37 | } |
| 38 | b'#' => { |
| 39 | fragment = Some(i); |
| 40 | break; |
| 41 | } |
| 42 | |
| 43 | // This is the range of bytes that don't need to be |
| 44 | // percent-encoded in the path. If it should have been |
| 45 | // percent-encoded, then error. |
| 46 | 0x21 | |
| 47 | 0x24..=0x3B | |
| 48 | 0x3D | |
| 49 | 0x40..=0x5F | |
| 50 | 0x61..=0x7A | |
| 51 | 0x7C | |
| 52 | 0x7E => {}, |
| 53 | |
| 54 | // These are code points that are supposed to be |
| 55 | // percent-encoded in the path but there are clients |
| 56 | // out there sending them as is and httparse accepts |
| 57 | // to parse those requests, so they are allowed here |
| 58 | // for parity. |
| 59 | // |
| 60 | // For reference, those are code points that are used |
| 61 | // to send requests with JSON directly embedded in |
| 62 | // the URI path. Yes, those things happen for real. |
| 63 | b'"' | |
| 64 | b'{' | b'}' => {}, |
| 65 | |
| 66 | _ => return Err(ErrorKind::InvalidUriChar.into()), |
| 67 | } |
| 68 | } |
| 69 | |
| 70 | // query ... |
| 71 | if query != NONE { |
| 72 | for (i, &b) in iter { |
| 73 | match b { |
| 74 | // While queries *should* be percent-encoded, most |
| 75 | // bytes are actually allowed... |
| 76 | // See https://url.spec.whatwg.org/#query-state |
| 77 | // |
| 78 | // Allowed: 0x21 / 0x24 - 0x3B / 0x3D / 0x3F - 0x7E |
| 79 | 0x21 | |
| 80 | 0x24..=0x3B | |
| 81 | 0x3D | |
| 82 | 0x3F..=0x7E => {}, |
| 83 | |
| 84 | b'#' => { |
| 85 | fragment = Some(i); |
| 86 | break; |
| 87 | } |
| 88 | |
| 89 | _ => return Err(ErrorKind::InvalidUriChar.into()), |
| 90 | } |
| 91 | } |
| 92 | } |
| 93 | } |
| 94 | |
| 95 | if let Some(i) = fragment { |
| 96 | src.truncate(i); |
| 97 | } |
| 98 | |
| 99 | Ok(PathAndQuery { |
| 100 | data: unsafe { ByteStr::from_utf8_unchecked(src) }, |
| 101 | query: query, |
| 102 | }) |
| 103 | } |
| 104 | |
| 105 | /// Convert a `PathAndQuery` from a static string. |
| 106 | /// |
| 107 | /// This function will not perform any copying, however the string is |
| 108 | /// checked to ensure that it is valid. |
| 109 | /// |
| 110 | /// # Panics |
| 111 | /// |
| 112 | /// This function panics if the argument is an invalid path and query. |
| 113 | /// |
| 114 | /// # Examples |
| 115 | /// |
| 116 | /// ``` |
| 117 | /// # use http::uri::*; |
| 118 | /// let v = PathAndQuery::from_static("/hello?world" ); |
| 119 | /// |
| 120 | /// assert_eq!(v.path(), "/hello" ); |
| 121 | /// assert_eq!(v.query(), Some("world" )); |
| 122 | /// ``` |
| 123 | #[inline ] |
| 124 | pub fn from_static(src: &'static str) -> Self { |
| 125 | let src = Bytes::from_static(src.as_bytes()); |
| 126 | |
| 127 | PathAndQuery::from_shared(src).unwrap() |
| 128 | } |
| 129 | |
| 130 | /// Attempt to convert a `Bytes` buffer to a `PathAndQuery`. |
| 131 | /// |
| 132 | /// This will try to prevent a copy if the type passed is the type used |
| 133 | /// internally, and will copy the data if it is not. |
| 134 | pub fn from_maybe_shared<T>(src: T) -> Result<Self, InvalidUri> |
| 135 | where |
| 136 | T: AsRef<[u8]> + 'static, |
| 137 | { |
| 138 | if_downcast_into!(T, Bytes, src, { |
| 139 | return PathAndQuery::from_shared(src); |
| 140 | }); |
| 141 | |
| 142 | PathAndQuery::try_from(src.as_ref()) |
| 143 | } |
| 144 | |
| 145 | pub(super) fn empty() -> Self { |
| 146 | PathAndQuery { |
| 147 | data: ByteStr::new(), |
| 148 | query: NONE, |
| 149 | } |
| 150 | } |
| 151 | |
| 152 | pub(super) fn slash() -> Self { |
| 153 | PathAndQuery { |
| 154 | data: ByteStr::from_static("/" ), |
| 155 | query: NONE, |
| 156 | } |
| 157 | } |
| 158 | |
| 159 | pub(super) fn star() -> Self { |
| 160 | PathAndQuery { |
| 161 | data: ByteStr::from_static("*" ), |
| 162 | query: NONE, |
| 163 | } |
| 164 | } |
| 165 | |
| 166 | /// Returns the path component |
| 167 | /// |
| 168 | /// The path component is **case sensitive**. |
| 169 | /// |
| 170 | /// ```notrust |
| 171 | /// abc://username:password@example.com:123/path/data?key=value&key2=value2#fragid1 |
| 172 | /// |--------| |
| 173 | /// | |
| 174 | /// path |
| 175 | /// ``` |
| 176 | /// |
| 177 | /// If the URI is `*` then the path component is equal to `*`. |
| 178 | /// |
| 179 | /// # Examples |
| 180 | /// |
| 181 | /// ``` |
| 182 | /// # use http::uri::*; |
| 183 | /// |
| 184 | /// let path_and_query: PathAndQuery = "/hello/world" .parse().unwrap(); |
| 185 | /// |
| 186 | /// assert_eq!(path_and_query.path(), "/hello/world" ); |
| 187 | /// ``` |
| 188 | #[inline ] |
| 189 | pub fn path(&self) -> &str { |
| 190 | let ret = if self.query == NONE { |
| 191 | &self.data[..] |
| 192 | } else { |
| 193 | &self.data[..self.query as usize] |
| 194 | }; |
| 195 | |
| 196 | if ret.is_empty() { |
| 197 | return "/" ; |
| 198 | } |
| 199 | |
| 200 | ret |
| 201 | } |
| 202 | |
| 203 | /// Returns the query string component |
| 204 | /// |
| 205 | /// The query component contains non-hierarchical data that, along with data |
| 206 | /// in the path component, serves to identify a resource within the scope of |
| 207 | /// the URI's scheme and naming authority (if any). The query component is |
| 208 | /// indicated by the first question mark ("?") character and terminated by a |
| 209 | /// number sign ("#") character or by the end of the URI. |
| 210 | /// |
| 211 | /// ```notrust |
| 212 | /// abc://username:password@example.com:123/path/data?key=value&key2=value2#fragid1 |
| 213 | /// |-------------------| |
| 214 | /// | |
| 215 | /// query |
| 216 | /// ``` |
| 217 | /// |
| 218 | /// # Examples |
| 219 | /// |
| 220 | /// With a query string component |
| 221 | /// |
| 222 | /// ``` |
| 223 | /// # use http::uri::*; |
| 224 | /// let path_and_query: PathAndQuery = "/hello/world?key=value&foo=bar" .parse().unwrap(); |
| 225 | /// |
| 226 | /// assert_eq!(path_and_query.query(), Some("key=value&foo=bar" )); |
| 227 | /// ``` |
| 228 | /// |
| 229 | /// Without a query string component |
| 230 | /// |
| 231 | /// ``` |
| 232 | /// # use http::uri::*; |
| 233 | /// let path_and_query: PathAndQuery = "/hello/world" .parse().unwrap(); |
| 234 | /// |
| 235 | /// assert!(path_and_query.query().is_none()); |
| 236 | /// ``` |
| 237 | #[inline ] |
| 238 | pub fn query(&self) -> Option<&str> { |
| 239 | if self.query == NONE { |
| 240 | None |
| 241 | } else { |
| 242 | let i = self.query + 1; |
| 243 | Some(&self.data[i as usize..]) |
| 244 | } |
| 245 | } |
| 246 | |
| 247 | /// Returns the path and query as a string component. |
| 248 | /// |
| 249 | /// # Examples |
| 250 | /// |
| 251 | /// With a query string component |
| 252 | /// |
| 253 | /// ``` |
| 254 | /// # use http::uri::*; |
| 255 | /// let path_and_query: PathAndQuery = "/hello/world?key=value&foo=bar" .parse().unwrap(); |
| 256 | /// |
| 257 | /// assert_eq!(path_and_query.as_str(), "/hello/world?key=value&foo=bar" ); |
| 258 | /// ``` |
| 259 | /// |
| 260 | /// Without a query string component |
| 261 | /// |
| 262 | /// ``` |
| 263 | /// # use http::uri::*; |
| 264 | /// let path_and_query: PathAndQuery = "/hello/world" .parse().unwrap(); |
| 265 | /// |
| 266 | /// assert_eq!(path_and_query.as_str(), "/hello/world" ); |
| 267 | /// ``` |
| 268 | #[inline ] |
| 269 | pub fn as_str(&self) -> &str { |
| 270 | let ret = &self.data[..]; |
| 271 | if ret.is_empty() { |
| 272 | return "/" ; |
| 273 | } |
| 274 | ret |
| 275 | } |
| 276 | } |
| 277 | |
| 278 | impl<'a> TryFrom<&'a [u8]> for PathAndQuery { |
| 279 | type Error = InvalidUri; |
| 280 | #[inline ] |
| 281 | fn try_from(s: &'a [u8]) -> Result<Self, Self::Error> { |
| 282 | PathAndQuery::from_shared(Bytes::copy_from_slice(s)) |
| 283 | } |
| 284 | } |
| 285 | |
| 286 | impl<'a> TryFrom<&'a str> for PathAndQuery { |
| 287 | type Error = InvalidUri; |
| 288 | #[inline ] |
| 289 | fn try_from(s: &'a str) -> Result<Self, Self::Error> { |
| 290 | TryFrom::try_from(s.as_bytes()) |
| 291 | } |
| 292 | } |
| 293 | |
| 294 | impl<'a> TryFrom<Vec<u8>> for PathAndQuery { |
| 295 | type Error = InvalidUri; |
| 296 | #[inline ] |
| 297 | fn try_from(vec: Vec<u8>) -> Result<Self, Self::Error> { |
| 298 | PathAndQuery::from_shared(vec.into()) |
| 299 | } |
| 300 | } |
| 301 | |
| 302 | impl TryFrom<String> for PathAndQuery { |
| 303 | type Error = InvalidUri; |
| 304 | #[inline ] |
| 305 | fn try_from(s: String) -> Result<Self, Self::Error> { |
| 306 | PathAndQuery::from_shared(s.into()) |
| 307 | } |
| 308 | } |
| 309 | |
| 310 | impl TryFrom<&String> for PathAndQuery { |
| 311 | type Error = InvalidUri; |
| 312 | #[inline ] |
| 313 | fn try_from(s: &String) -> Result<Self, Self::Error> { |
| 314 | TryFrom::try_from(s.as_bytes()) |
| 315 | } |
| 316 | } |
| 317 | |
| 318 | impl FromStr for PathAndQuery { |
| 319 | type Err = InvalidUri; |
| 320 | #[inline ] |
| 321 | fn from_str(s: &str) -> Result<Self, InvalidUri> { |
| 322 | TryFrom::try_from(s) |
| 323 | } |
| 324 | } |
| 325 | |
| 326 | impl fmt::Debug for PathAndQuery { |
| 327 | fn fmt(&self, f: &mut fmt::Formatter<'_>) -> fmt::Result { |
| 328 | fmt::Display::fmt(self, f) |
| 329 | } |
| 330 | } |
| 331 | |
| 332 | impl fmt::Display for PathAndQuery { |
| 333 | fn fmt(&self, fmt: &mut fmt::Formatter<'_>) -> fmt::Result { |
| 334 | if !self.data.is_empty() { |
| 335 | match self.data.as_bytes()[0] { |
| 336 | b'/' | b'*' => write!(fmt, "{}" , &self.data[..]), |
| 337 | _ => write!(fmt, "/{}" , &self.data[..]), |
| 338 | } |
| 339 | } else { |
| 340 | write!(fmt, "/" ) |
| 341 | } |
| 342 | } |
| 343 | } |
| 344 | |
| 345 | impl hash::Hash for PathAndQuery { |
| 346 | fn hash<H: hash::Hasher>(&self, state: &mut H) { |
| 347 | self.data.hash(state); |
| 348 | } |
| 349 | } |
| 350 | |
| 351 | // ===== PartialEq / PartialOrd ===== |
| 352 | |
| 353 | impl PartialEq for PathAndQuery { |
| 354 | #[inline ] |
| 355 | fn eq(&self, other: &PathAndQuery) -> bool { |
| 356 | self.data == other.data |
| 357 | } |
| 358 | } |
| 359 | |
| 360 | impl Eq for PathAndQuery {} |
| 361 | |
| 362 | impl PartialEq<str> for PathAndQuery { |
| 363 | #[inline ] |
| 364 | fn eq(&self, other: &str) -> bool { |
| 365 | self.as_str() == other |
| 366 | } |
| 367 | } |
| 368 | |
| 369 | impl<'a> PartialEq<PathAndQuery> for &'a str { |
| 370 | #[inline ] |
| 371 | fn eq(&self, other: &PathAndQuery) -> bool { |
| 372 | self == &other.as_str() |
| 373 | } |
| 374 | } |
| 375 | |
| 376 | impl<'a> PartialEq<&'a str> for PathAndQuery { |
| 377 | #[inline ] |
| 378 | fn eq(&self, other: &&'a str) -> bool { |
| 379 | self.as_str() == *other |
| 380 | } |
| 381 | } |
| 382 | |
| 383 | impl PartialEq<PathAndQuery> for str { |
| 384 | #[inline ] |
| 385 | fn eq(&self, other: &PathAndQuery) -> bool { |
| 386 | self == other.as_str() |
| 387 | } |
| 388 | } |
| 389 | |
| 390 | impl PartialEq<String> for PathAndQuery { |
| 391 | #[inline ] |
| 392 | fn eq(&self, other: &String) -> bool { |
| 393 | self.as_str() == other.as_str() |
| 394 | } |
| 395 | } |
| 396 | |
| 397 | impl PartialEq<PathAndQuery> for String { |
| 398 | #[inline ] |
| 399 | fn eq(&self, other: &PathAndQuery) -> bool { |
| 400 | self.as_str() == other.as_str() |
| 401 | } |
| 402 | } |
| 403 | |
| 404 | impl PartialOrd for PathAndQuery { |
| 405 | #[inline ] |
| 406 | fn partial_cmp(&self, other: &PathAndQuery) -> Option<cmp::Ordering> { |
| 407 | self.as_str().partial_cmp(other.as_str()) |
| 408 | } |
| 409 | } |
| 410 | |
| 411 | impl PartialOrd<str> for PathAndQuery { |
| 412 | #[inline ] |
| 413 | fn partial_cmp(&self, other: &str) -> Option<cmp::Ordering> { |
| 414 | self.as_str().partial_cmp(other) |
| 415 | } |
| 416 | } |
| 417 | |
| 418 | impl PartialOrd<PathAndQuery> for str { |
| 419 | #[inline ] |
| 420 | fn partial_cmp(&self, other: &PathAndQuery) -> Option<cmp::Ordering> { |
| 421 | self.partial_cmp(other.as_str()) |
| 422 | } |
| 423 | } |
| 424 | |
| 425 | impl<'a> PartialOrd<&'a str> for PathAndQuery { |
| 426 | #[inline ] |
| 427 | fn partial_cmp(&self, other: &&'a str) -> Option<cmp::Ordering> { |
| 428 | self.as_str().partial_cmp(*other) |
| 429 | } |
| 430 | } |
| 431 | |
| 432 | impl<'a> PartialOrd<PathAndQuery> for &'a str { |
| 433 | #[inline ] |
| 434 | fn partial_cmp(&self, other: &PathAndQuery) -> Option<cmp::Ordering> { |
| 435 | self.partial_cmp(&other.as_str()) |
| 436 | } |
| 437 | } |
| 438 | |
| 439 | impl PartialOrd<String> for PathAndQuery { |
| 440 | #[inline ] |
| 441 | fn partial_cmp(&self, other: &String) -> Option<cmp::Ordering> { |
| 442 | self.as_str().partial_cmp(other.as_str()) |
| 443 | } |
| 444 | } |
| 445 | |
| 446 | impl PartialOrd<PathAndQuery> for String { |
| 447 | #[inline ] |
| 448 | fn partial_cmp(&self, other: &PathAndQuery) -> Option<cmp::Ordering> { |
| 449 | self.as_str().partial_cmp(other.as_str()) |
| 450 | } |
| 451 | } |
| 452 | |
| 453 | #[cfg (test)] |
| 454 | mod tests { |
| 455 | use super::*; |
| 456 | |
| 457 | #[test] |
| 458 | fn equal_to_self_of_same_path() { |
| 459 | let p1: PathAndQuery = "/hello/world&foo=bar" .parse().unwrap(); |
| 460 | let p2: PathAndQuery = "/hello/world&foo=bar" .parse().unwrap(); |
| 461 | assert_eq!(p1, p2); |
| 462 | assert_eq!(p2, p1); |
| 463 | } |
| 464 | |
| 465 | #[test] |
| 466 | fn not_equal_to_self_of_different_path() { |
| 467 | let p1: PathAndQuery = "/hello/world&foo=bar" .parse().unwrap(); |
| 468 | let p2: PathAndQuery = "/world&foo=bar" .parse().unwrap(); |
| 469 | assert_ne!(p1, p2); |
| 470 | assert_ne!(p2, p1); |
| 471 | } |
| 472 | |
| 473 | #[test] |
| 474 | fn equates_with_a_str() { |
| 475 | let path_and_query: PathAndQuery = "/hello/world&foo=bar" .parse().unwrap(); |
| 476 | assert_eq!(&path_and_query, "/hello/world&foo=bar" ); |
| 477 | assert_eq!("/hello/world&foo=bar" , &path_and_query); |
| 478 | assert_eq!(path_and_query, "/hello/world&foo=bar" ); |
| 479 | assert_eq!("/hello/world&foo=bar" , path_and_query); |
| 480 | } |
| 481 | |
| 482 | #[test] |
| 483 | fn not_equal_with_a_str_of_a_different_path() { |
| 484 | let path_and_query: PathAndQuery = "/hello/world&foo=bar" .parse().unwrap(); |
| 485 | // as a reference |
| 486 | assert_ne!(&path_and_query, "/hello&foo=bar" ); |
| 487 | assert_ne!("/hello&foo=bar" , &path_and_query); |
| 488 | // without reference |
| 489 | assert_ne!(path_and_query, "/hello&foo=bar" ); |
| 490 | assert_ne!("/hello&foo=bar" , path_and_query); |
| 491 | } |
| 492 | |
| 493 | #[test] |
| 494 | fn equates_with_a_string() { |
| 495 | let path_and_query: PathAndQuery = "/hello/world&foo=bar" .parse().unwrap(); |
| 496 | assert_eq!(path_and_query, "/hello/world&foo=bar" .to_string()); |
| 497 | assert_eq!("/hello/world&foo=bar" .to_string(), path_and_query); |
| 498 | } |
| 499 | |
| 500 | #[test] |
| 501 | fn not_equal_with_a_string_of_a_different_path() { |
| 502 | let path_and_query: PathAndQuery = "/hello/world&foo=bar" .parse().unwrap(); |
| 503 | assert_ne!(path_and_query, "/hello&foo=bar" .to_string()); |
| 504 | assert_ne!("/hello&foo=bar" .to_string(), path_and_query); |
| 505 | } |
| 506 | |
| 507 | #[test] |
| 508 | fn compares_to_self() { |
| 509 | let p1: PathAndQuery = "/a/world&foo=bar" .parse().unwrap(); |
| 510 | let p2: PathAndQuery = "/b/world&foo=bar" .parse().unwrap(); |
| 511 | assert!(p1 < p2); |
| 512 | assert!(p2 > p1); |
| 513 | } |
| 514 | |
| 515 | #[test] |
| 516 | fn compares_with_a_str() { |
| 517 | let path_and_query: PathAndQuery = "/b/world&foo=bar" .parse().unwrap(); |
| 518 | // by ref |
| 519 | assert!(&path_and_query < "/c/world&foo=bar" ); |
| 520 | assert!("/c/world&foo=bar" > &path_and_query); |
| 521 | assert!(&path_and_query > "/a/world&foo=bar" ); |
| 522 | assert!("/a/world&foo=bar" < &path_and_query); |
| 523 | |
| 524 | // by val |
| 525 | assert!(path_and_query < "/c/world&foo=bar" ); |
| 526 | assert!("/c/world&foo=bar" > path_and_query); |
| 527 | assert!(path_and_query > "/a/world&foo=bar" ); |
| 528 | assert!("/a/world&foo=bar" < path_and_query); |
| 529 | } |
| 530 | |
| 531 | #[test] |
| 532 | fn compares_with_a_string() { |
| 533 | let path_and_query: PathAndQuery = "/b/world&foo=bar" .parse().unwrap(); |
| 534 | assert!(path_and_query < "/c/world&foo=bar" .to_string()); |
| 535 | assert!("/c/world&foo=bar" .to_string() > path_and_query); |
| 536 | assert!(path_and_query > "/a/world&foo=bar" .to_string()); |
| 537 | assert!("/a/world&foo=bar" .to_string() < path_and_query); |
| 538 | } |
| 539 | |
| 540 | #[test] |
| 541 | fn ignores_valid_percent_encodings() { |
| 542 | assert_eq!("/a%20b" , pq("/a%20b?r=1" ).path()); |
| 543 | assert_eq!("qr=%31" , pq("/a/b?qr=%31" ).query().unwrap()); |
| 544 | } |
| 545 | |
| 546 | #[test] |
| 547 | fn ignores_invalid_percent_encodings() { |
| 548 | assert_eq!("/a%%b" , pq("/a%%b?r=1" ).path()); |
| 549 | assert_eq!("/aaa%" , pq("/aaa%" ).path()); |
| 550 | assert_eq!("/aaa%" , pq("/aaa%?r=1" ).path()); |
| 551 | assert_eq!("/aa%2" , pq("/aa%2" ).path()); |
| 552 | assert_eq!("/aa%2" , pq("/aa%2?r=1" ).path()); |
| 553 | assert_eq!("qr=%3" , pq("/a/b?qr=%3" ).query().unwrap()); |
| 554 | } |
| 555 | |
| 556 | #[test] |
| 557 | fn json_is_fine() { |
| 558 | assert_eq!(r#"/{"bread":"baguette"}"# , pq(r#"/{"bread":"baguette"}"# ).path()); |
| 559 | } |
| 560 | |
| 561 | fn pq(s: &str) -> PathAndQuery { |
| 562 | s.parse().expect(&format!("parsing {}" , s)) |
| 563 | } |
| 564 | } |
| 565 | |