diff options
Diffstat (limited to 'third_party/rust/url')
30 files changed, 0 insertions, 11104 deletions
diff --git a/third_party/rust/url/.cargo-checksum.json b/third_party/rust/url/.cargo-checksum.json deleted file mode 100644 index 84a2a4d9b..000000000 --- a/third_party/rust/url/.cargo-checksum.json +++ /dev/null @@ -1 +0,0 @@ -{"files":{".cargo-ok":"e3b0c44298fc1c149afbf4c8996fb92427ae41e4649b934ca495991b7852b855",".gitignore":"e20a03cb660e0039506f8828204fd93815ebfe051ef62194f8dcf3fc8b7d0e5a",".travis.yml":"2a3033f9edf86bc829de486fc1e74fe0bbe3166ed99b0139754ea29772c19b06","Cargo.toml":"30055a6d4ff3d1bf29a9fa99401e4ffffeecc4b5bade830843a9a5f1634fefd1","LICENSE-APACHE":"a60eea817514531668d7e00765731449fe14d059d3249e0bc93b36de45f759f2","LICENSE-MIT":"20c7855c364d57ea4c97889a5e8d98470a9952dade37bd9248b9a54431670e5e","Makefile":"92b64915724e3b5fec95ec96c5af738bd219b80709e18bf8639d784bc3d9a600","README.md":"eb3f4694003f408cbe3c7f3e9fbbc71241defb940cc55a816981f0f0f144c8eb","UPGRADING.md":"fbcc2d39bdf17db0745793db6626fcd5c909dddd4ce13b27566cfabece22c368","appveyor.yml":"c78486dbfbe6ebbf3d808afb9a19f7ec18c4704ce451c6305f0716999b70a1a6","docs/.nojekyll":"e3b0c44298fc1c149afbf4c8996fb92427ae41e4649b934ca495991b7852b855","docs/404.html":"f61e6271c1ea1aa113b64b356e994595fa548f0433f89948d747503ad22195cd","docs/index.html":"f61e6271c1ea1aa113b64b356e994595fa548f0433f89948d747503ad22195cd","github.png":"b432fd855efe7c430fe6a57ccf83935c1996f03a7cdc8d6e1b34154b8c43f6ec","rust-url-todo":"1192cee7b6cedf2133d97dc6074b593a1d19b0ee13fff6f28d6329855044e575","src/encoding.rs":"7fb43e1c109bf9f2a80a05525082f90e79dba8e8056547571c49fba074406d39","src/form_urlencoded.rs":"172922f2c51eb8dae0182d70e5e0c2969f1b5b7aac026720ced9f84059465999","src/host.rs":"a654dc3c9ce9024b98698e000bc97abaac7f10c49b1635be8125cf72376fd5d1","src/lib.rs":"c3542aabc733f76a3b9c7d24b5c41e60e9eb84d2712660611300d1de0e7c2072","src/origin.rs":"d52010a280d363aed6832f7de5e52c1a62815302e59dcbc9cdc2574e2ac884b9","src/parser.rs":"8ca331ada66f309e91fcc375d8467c929b453979fe0ac5abe190eb8a32074db8","src/path_segments.rs":"0414985c441d0c0292ccc6f56a144b84728ae03382476e6cae1a766f8c333ef8","src/percent_encoding.rs":"44d3321eaa1c77715e9ea1421519289ca73612a31c3d6fce04ff489dfa7db3c5","src/quirks.rs":"3249d1a1f73dd29ec06d626ea2ea4d61e7b2a782543742a5bee422b2f3864b19","src/slicing.rs":"4e539886b23945a92094625f3e531a4bff40daa44240b5d19ee8577478c4f7fe","tests/data.rs":"d36f0ee509fb00524635a7968e336bb89674a82a4fcb06be189155e4b9d43db5","tests/setters_tests.json":"ebb439306ea748be6d0f93132cb59220c5805afd56357d6017f1eb1e4f0f80b3","tests/unit.rs":"9a05f55c7b381b58ee67ef8ef145220e5df88a403225a1a324a36afc9bb6a7d7","tests/urltestdata.json":"11abe4a459566c3929e3326828f8576cb59ec8fab1d191714c34eac28d5f15f9"},"package":"8527c62d9869a08325c38272b3f85668df22a65890c61a639d233dc0ed0b23a2"}
\ No newline at end of file diff --git a/third_party/rust/url/.cargo-ok b/third_party/rust/url/.cargo-ok deleted file mode 100644 index e69de29bb..000000000 --- a/third_party/rust/url/.cargo-ok +++ /dev/null diff --git a/third_party/rust/url/.gitignore b/third_party/rust/url/.gitignore deleted file mode 100644 index 0284c25cc..000000000 --- a/third_party/rust/url/.gitignore +++ /dev/null @@ -1,3 +0,0 @@ -target -Cargo.lock -/.cargo/config diff --git a/third_party/rust/url/.travis.yml b/third_party/rust/url/.travis.yml deleted file mode 100644 index 810995dfa..000000000 --- a/third_party/rust/url/.travis.yml +++ /dev/null @@ -1,8 +0,0 @@ -language: rust -rust: - - nightly - - beta - - stable -script: make test -notifications: - webhooks: http://build.servo.org:54856/travis diff --git a/third_party/rust/url/Cargo.toml b/third_party/rust/url/Cargo.toml deleted file mode 100644 index c3f4d364b..000000000 --- a/third_party/rust/url/Cargo.toml +++ /dev/null @@ -1,38 +0,0 @@ -[package] - -name = "url" -version = "1.2.1" -authors = ["The rust-url developers"] - -description = "URL library for Rust, based on the WHATWG URL Standard" -documentation = "http://servo.github.io/rust-url/url/index.html" -repository = "https://github.com/servo/rust-url" -readme = "README.md" -keywords = ["url", "parser"] -license = "MIT/Apache-2.0" - -[[test]] -name = "unit" - -[[test]] -name = "data" -harness = false - -[lib] -test = false - -[dev-dependencies] -rustc-test = "0.1" -rustc-serialize = "0.3" - -[features] -query_encoding = ["encoding"] -heap_size = ["heapsize"] - -[dependencies] -encoding = {version = "0.2", optional = true} -heapsize = {version = ">=0.1.1, <0.4", optional = true} -idna = { version = "0.1.0", path = "./idna" } -matches = "0.1" -rustc-serialize = {version = "0.3", optional = true} -serde = {version = ">=0.6.1, <0.9", optional = true} diff --git a/third_party/rust/url/LICENSE-APACHE b/third_party/rust/url/LICENSE-APACHE deleted file mode 100644 index 16fe87b06..000000000 --- a/third_party/rust/url/LICENSE-APACHE +++ /dev/null @@ -1,201 +0,0 @@ - Apache License - Version 2.0, January 2004 - http://www.apache.org/licenses/ - -TERMS AND CONDITIONS FOR USE, REPRODUCTION, AND DISTRIBUTION - -1. Definitions. - - "License" shall mean the terms and conditions for use, reproduction, - and distribution as defined by Sections 1 through 9 of this document. - - "Licensor" shall mean the copyright owner or entity authorized by - the copyright owner that is granting the License. - - "Legal Entity" shall mean the union of the acting entity and all - other entities that control, are controlled by, or are under common - control with that entity. For the purposes of this definition, - "control" means (i) the power, direct or indirect, to cause the - direction or management of such entity, whether by contract or - otherwise, or (ii) ownership of fifty percent (50%) or more of the - outstanding shares, or (iii) beneficial ownership of such entity. - - "You" (or "Your") shall mean an individual or Legal Entity - exercising permissions granted by this License. - - "Source" form shall mean the preferred form for making modifications, - including but not limited to software source code, documentation - source, and configuration files. - - "Object" form shall mean any form resulting from mechanical - transformation or translation of a Source form, including but - not limited to compiled object code, generated documentation, - and conversions to other media types. - - "Work" shall mean the work of authorship, whether in Source or - Object form, made available under the License, as indicated by a - copyright notice that is included in or attached to the work - (an example is provided in the Appendix below). - - "Derivative Works" shall mean any work, whether in Source or Object - form, that is based on (or derived from) the Work and for which the - editorial revisions, annotations, elaborations, or other modifications - represent, as a whole, an original work of authorship. For the purposes - of this License, Derivative Works shall not include works that remain - separable from, or merely link (or bind by name) to the interfaces of, - the Work and Derivative Works thereof. - - "Contribution" shall mean any work of authorship, including - the original version of the Work and any modifications or additions - to that Work or Derivative Works thereof, that is intentionally - submitted to Licensor for inclusion in the Work by the copyright owner - or by an individual or Legal Entity authorized to submit on behalf of - the copyright owner. For the purposes of this definition, "submitted" - means any form of electronic, verbal, or written communication sent - to the Licensor or its representatives, including but not limited to - communication on electronic mailing lists, source code control systems, - and issue tracking systems that are managed by, or on behalf of, the - Licensor for the purpose of discussing and improving the Work, but - excluding communication that is conspicuously marked or otherwise - designated in writing by the copyright owner as "Not a Contribution." - - "Contributor" shall mean Licensor and any individual or Legal Entity - on behalf of whom a Contribution has been received by Licensor and - subsequently incorporated within the Work. - -2. Grant of Copyright License. Subject to the terms and conditions of - this License, each Contributor hereby grants to You a perpetual, - worldwide, non-exclusive, no-charge, royalty-free, irrevocable - copyright license to reproduce, prepare Derivative Works of, - publicly display, publicly perform, sublicense, and distribute the - Work and such Derivative Works in Source or Object form. - -3. Grant of Patent License. Subject to the terms and conditions of - this License, each Contributor hereby grants to You a perpetual, - worldwide, non-exclusive, no-charge, royalty-free, irrevocable - (except as stated in this section) patent license to make, have made, - use, offer to sell, sell, import, and otherwise transfer the Work, - where such license applies only to those patent claims licensable - by such Contributor that are necessarily infringed by their - Contribution(s) alone or by combination of their Contribution(s) - with the Work to which such Contribution(s) was submitted. If You - institute patent litigation against any entity (including a - cross-claim or counterclaim in a lawsuit) alleging that the Work - or a Contribution incorporated within the Work constitutes direct - or contributory patent infringement, then any patent licenses - granted to You under this License for that Work shall terminate - as of the date such litigation is filed. - -4. Redistribution. You may reproduce and distribute copies of the - Work or Derivative Works thereof in any medium, with or without - modifications, and in Source or Object form, provided that You - meet the following conditions: - - (a) You must give any other recipients of the Work or - Derivative Works a copy of this License; and - - (b) You must cause any modified files to carry prominent notices - stating that You changed the files; and - - (c) You must retain, in the Source form of any Derivative Works - that You distribute, all copyright, patent, trademark, and - attribution notices from the Source form of the Work, - excluding those notices that do not pertain to any part of - the Derivative Works; and - - (d) If the Work includes a "NOTICE" text file as part of its - distribution, then any Derivative Works that You distribute must - include a readable copy of the attribution notices contained - within such NOTICE file, excluding those notices that do not - pertain to any part of the Derivative Works, in at least one - of the following places: within a NOTICE text file distributed - as part of the Derivative Works; within the Source form or - documentation, if provided along with the Derivative Works; or, - within a display generated by the Derivative Works, if and - wherever such third-party notices normally appear. The contents - of the NOTICE file are for informational purposes only and - do not modify the License. You may add Your own attribution - notices within Derivative Works that You distribute, alongside - or as an addendum to the NOTICE text from the Work, provided - that such additional attribution notices cannot be construed - as modifying the License. - - You may add Your own copyright statement to Your modifications and - may provide additional or different license terms and conditions - for use, reproduction, or distribution of Your modifications, or - for any such Derivative Works as a whole, provided Your use, - reproduction, and distribution of the Work otherwise complies with - the conditions stated in this License. - -5. Submission of Contributions. Unless You explicitly state otherwise, - any Contribution intentionally submitted for inclusion in the Work - by You to the Licensor shall be under the terms and conditions of - this License, without any additional terms or conditions. - Notwithstanding the above, nothing herein shall supersede or modify - the terms of any separate license agreement you may have executed - with Licensor regarding such Contributions. - -6. Trademarks. This License does not grant permission to use the trade - names, trademarks, service marks, or product names of the Licensor, - except as required for reasonable and customary use in describing the - origin of the Work and reproducing the content of the NOTICE file. - -7. Disclaimer of Warranty. Unless required by applicable law or - agreed to in writing, Licensor provides the Work (and each - Contributor provides its Contributions) on an "AS IS" BASIS, - WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or - implied, including, without limitation, any warranties or conditions - of TITLE, NON-INFRINGEMENT, MERCHANTABILITY, or FITNESS FOR A - PARTICULAR PURPOSE. You are solely responsible for determining the - appropriateness of using or redistributing the Work and assume any - risks associated with Your exercise of permissions under this License. - -8. Limitation of Liability. In no event and under no legal theory, - whether in tort (including negligence), contract, or otherwise, - unless required by applicable law (such as deliberate and grossly - negligent acts) or agreed to in writing, shall any Contributor be - liable to You for damages, including any direct, indirect, special, - incidental, or consequential damages of any character arising as a - result of this License or out of the use or inability to use the - Work (including but not limited to damages for loss of goodwill, - work stoppage, computer failure or malfunction, or any and all - other commercial damages or losses), even if such Contributor - has been advised of the possibility of such damages. - -9. Accepting Warranty or Additional Liability. While redistributing - the Work or Derivative Works thereof, You may choose to offer, - and charge a fee for, acceptance of support, warranty, indemnity, - or other liability obligations and/or rights consistent with this - License. However, in accepting such obligations, You may act only - on Your own behalf and on Your sole responsibility, not on behalf - of any other Contributor, and only if You agree to indemnify, - defend, and hold each Contributor harmless for any liability - incurred by, or claims asserted against, such Contributor by reason - of your accepting any such warranty or additional liability. - -END OF TERMS AND CONDITIONS - -APPENDIX: How to apply the Apache License to your work. - - To apply the Apache License to your work, attach the following - boilerplate notice, with the fields enclosed by brackets "[]" - replaced with your own identifying information. (Don't include - the brackets!) The text should be enclosed in the appropriate - comment syntax for the file format. We also recommend that a - file or class name and description of purpose be included on the - same "printed page" as the copyright notice for easier - identification within third-party archives. - -Copyright [yyyy] [name of copyright owner] - -Licensed under the Apache License, Version 2.0 (the "License"); -you may not use this file except in compliance with the License. -You may obtain a copy of the License at - - http://www.apache.org/licenses/LICENSE-2.0 - -Unless required by applicable law or agreed to in writing, software -distributed under the License is distributed on an "AS IS" BASIS, -WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. -See the License for the specific language governing permissions and -limitations under the License. diff --git a/third_party/rust/url/LICENSE-MIT b/third_party/rust/url/LICENSE-MIT deleted file mode 100644 index 24de6b418..000000000 --- a/third_party/rust/url/LICENSE-MIT +++ /dev/null @@ -1,25 +0,0 @@ -Copyright (c) 2013-2016 The rust-url developers - -Permission is hereby granted, free of charge, to any -person obtaining a copy of this software and associated -documentation files (the "Software"), to deal in the -Software without restriction, including without -limitation the rights to use, copy, modify, merge, -publish, distribute, sublicense, and/or sell copies of -the Software, and to permit persons to whom the Software -is furnished to do so, subject to the following -conditions: - -The above copyright notice and this permission notice -shall be included in all copies or substantial portions -of the Software. - -THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF -ANY KIND, EXPRESS OR IMPLIED, INCLUDING BUT NOT LIMITED -TO THE WARRANTIES OF MERCHANTABILITY, FITNESS FOR A -PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT -SHALL THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY -CLAIM, DAMAGES OR OTHER LIABILITY, WHETHER IN AN ACTION -OF CONTRACT, TORT OR OTHERWISE, ARISING FROM, OUT OF OR -IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER -DEALINGS IN THE SOFTWARE. diff --git a/third_party/rust/url/Makefile b/third_party/rust/url/Makefile deleted file mode 100644 index c6f1ff0c9..000000000 --- a/third_party/rust/url/Makefile +++ /dev/null @@ -1,5 +0,0 @@ -test: - cargo test --features "query_encoding serde rustc-serialize" - [ x$$TRAVIS_RUST_VERSION != xnightly ] || cargo test --features heapsize - -.PHONY: test diff --git a/third_party/rust/url/README.md b/third_party/rust/url/README.md deleted file mode 100644 index 0721254af..000000000 --- a/third_party/rust/url/README.md +++ /dev/null @@ -1,10 +0,0 @@ -rust-url -======== - -[![Travis build Status](https://travis-ci.org/servo/rust-url.svg?branch=master)](https://travis-ci.org/servo/rust-url) [![Appveyor build status](https://ci.appveyor.com/api/projects/status/ulkqx2xcemyod6xa?svg=true)](https://ci.appveyor.com/project/Manishearth/rust-url) - -URL library for Rust, based on the [URL Standard](https://url.spec.whatwg.org/). - -[Documentation](https://docs.rs/url/) - -Please see [UPGRADING.md](https://github.com/servo/rust-url/blob/master/UPGRADING.md) if you are upgrading from 0.x to 1.x. diff --git a/third_party/rust/url/UPGRADING.md b/third_party/rust/url/UPGRADING.md deleted file mode 100644 index f156130f6..000000000 --- a/third_party/rust/url/UPGRADING.md +++ /dev/null @@ -1,263 +0,0 @@ -# Guide to upgrading from url 0.x to 1.x - -* The fields of `Url` are now private because the `Url` constructor, parser, - and setters maintain invariants that could be violated if you were to set the fields directly. - Instead of accessing, for example, `url.scheme`, use the getter method, such as `url.scheme()`. - Instead of assigning directly to a field, for example `url.scheme = "https".to_string()`, - use the setter method, such as `url.set_scheme("https").unwrap()`. - (Some setters validate the new value and return a `Result` that must be used). - -* The methods of `Url` now return `&str` instead of `String`, - thus reducing allocations and making serialization cheap. - -* The `path()` method on `url::Url` instances used to return `Option<&[String]>`; - now it returns `&str`. - If you would like functionality more similar to the old behavior of `path()`, - use `path_segments()` that returns `Option<str::Split<char>>`. - - Before upgrading: - - ```rust - let issue_list_url = Url::parse( - "https://github.com/rust-lang/rust/issues?labels=E-easy&state=open" - ).unwrap(); - assert_eq!(issue_list_url.path(), Some(&["rust-lang".to_string(), - "rust".to_string(), - "issues".to_string()][..])); - ``` - - After upgrading: - - ```rust - let issue_list_url = Url::parse( - "https://github.com/rust-lang/rust/issues?labels=E-easy&state=open" - ).unwrap(); - assert_eq!(issue_list_url.path(), "/rust-lang/rust/issues"); - assert_eq!(issue_list_url.path_segments().map(|c| c.collect::<Vec<_>>()), - Some(vec!["rust-lang", "rust", "issues"])); - ``` - -* The `path_mut()` method on `url::Url` instances that allowed modification of a URL's path - has been replaced by `path_segments_mut()`. - - Before upgrading: - - ```rust - let mut url = Url::parse("https://github.com/rust-lang/rust").unwrap(); - url.path_mut().unwrap().push("issues"); - ``` - - After upgrading: - - ```rust - let mut url = Url::parse("https://github.com/rust-lang/rust").unwrap(); - url.path_segments_mut().unwrap().push("issues"); - ``` - -* The `domain_mut()` method on `url::Url` instances that allowed modification of a URL's domain - has been replaced by `set_host()` and `set_ip_host()`. - -* The `host()` method on `url::Url` instances used to return `Option<&Host>`; - now it returns `Option<Host<&str>>`. - The `serialize_host()` method that returned `Option<String>` - has been replaced by the `host_str()` method that returns `Option<&str>`. - -* The `serialize()` method on `url::Url` instances that returned `String` - has been replaced by an `as_str()` method that returns `&str`. - - Before upgrading: - - ```rust - let this_document = Url::parse("http://servo.github.io/rust-url/url/index.html").unwrap(); - assert_eq!(this_document.serialize(), "http://servo.github.io/rust-url/url/index.html".to_string()); - ``` - - After upgrading: - - ```rust - let this_document = Url::parse("http://servo.github.io/rust-url/url/index.html").unwrap(); - assert_eq!(this_document.as_str(), "http://servo.github.io/rust-url/url/index.html"); - ``` - -* `url::UrlParser` has been replaced by `url::Url::parse()` and `url::Url::join()`. - - Before upgrading: - - ```rust - let this_document = Url::parse("http://servo.github.io/rust-url/url/index.html").unwrap(); - let css_url = UrlParser::new().base_url(&this_document).parse("../main.css").unwrap(); - assert_eq!(css_url.serialize(), "http://servo.github.io/rust-url/main.css".to_string()); - ``` - - After upgrading: - - ```rust - let this_document = Url::parse("http://servo.github.io/rust-url/url/index.html").unwrap(); - let css_url = this_document.join("../main.css").unwrap(); - assert_eq!(css_url.as_str(), "http://servo.github.io/rust-url/main.css"); - ``` - -* `url::parse_path()` and `url::UrlParser::parse_path()` have been removed without replacement. - As a workaround, you can give a base URL that you then ignore too `url::Url::parse()`. - - Before upgrading: - - ```rust - let (path, query, fragment) = url::parse_path("/foo/bar/../baz?q=42").unwrap(); - assert_eq!(path, vec!["foo".to_string(), "baz".to_string()]); - assert_eq!(query, Some("q=42".to_string())); - assert_eq!(fragment, None); - ``` - - After upgrading: - - ```rust - let base = Url::parse("http://example.com").unwrap(); - let with_path = base.join("/foo/bar/../baz?q=42").unwrap(); - assert_eq!(with_path.path(), "/foo/baz"); - assert_eq!(with_path.query(), Some("q=42")); - assert_eq!(with_path.fragment(), None); - ``` - -* The `url::form_urlencoded::serialize()` method - has been replaced with the `url::form_urlencoded::Serializer` struct. - Instead of calling `serialize()` with key/value pairs, - create a new `Serializer` with a new string, - call the `extend_pairs()` method on the `Serializer` instance with the key/value pairs as the argument, - then call `finish()`. - - Before upgrading: - - ```rust - let form = url::form_urlencoded::serialize(form.iter().map(|(k, v)| { - (&k[..], &v[..]) - })); - ``` - - After upgrading: - - ```rust - let form = url::form_urlencoded::Serializer::new(String::new()).extend_pairs( - form.iter().map(|(k, v)| { (&k[..], &v[..]) }) - ).finish(); - ``` - -* The `set_query_from_pairs()` method on `url::Url` instances that took key/value pairs - has been replaced with `query_pairs_mut()`, which allows you to modify the `url::Url`'s query pairs. - - Before upgrading: - - ```rust - let mut url = Url::parse("https://duckduckgo.com/").unwrap(); - let pairs = vec![ - ("q", "test"), - ("ia", "images"), - ]; - url.set_query_from_pairs(pairs.iter().map(|&(k, v)| { - (&k[..], &v[..]) - })); - ``` - - After upgrading: - - ```rust - let mut url = Url::parse("https://duckduckgo.com/").unwrap(); - let pairs = vec![ - ("q", "test"), - ("ia", "images"), - ]; - url.query_pairs_mut().clear().extend_pairs( - pairs.iter().map(|&(k, v)| { (&k[..], &v[..]) }) - ); - ``` - -* `url::SchemeData`, its variants `Relative` and `NonRelative`, - and the struct `url::RelativeSchemeData` have been removed. - Instead of matching on these variants - to determine if you have a URL in a relative scheme such as HTTP - versus a URL in a non-relative scheme as data, - use the `cannot_be_a_base()` method to determine which kind you have. - - Before upgrading: - - ```rust - match url.scheme_data { - url::SchemeData::Relative(..) => {} - url::SchemeData::NonRelative(..) => { - return Err(human(format!("`{}` must have relative scheme \ - data: {}", field, url))) - } - } - ``` - - After upgrading: - - ```rust - if url.cannot_be_a_base() { - return Err(human(format!("`{}` must have relative scheme \ - data: {}", field, url))) - } - ``` - -* The functions `url::whatwg_scheme_type_mapper()`, the `SchemeType` enum, - and the `scheme_type_mapper()` method on `url::UrlParser` instances have been removed. - `SchemeType` had a method for getting the `default_port()`; - to replicate this functionality, use the method `port_or_known_default()` on `url::Url` instances. - The `port_or_default()` method on `url::Url` instances has been removed; - use `port_or_known_default()` instead. - - Before upgrading: - - ```rust - let port = match whatwg_scheme_type_mapper(&url.scheme) { - SchemeType::Relative(port) => port, - _ => return Err(format!("Invalid special scheme: `{}`", - raw_url.scheme)), - }; - ``` - - After upgrading: - - ```rust - let port = match url.port_or_known_default() { - Some(port) => port, - _ => return Err(format!("Invalid special scheme: `{}`", - url.scheme())), - }; - ``` - -* The following formatting utilities have been removed without replacement; - look at their linked previous implementations - if you would like to replicate the functionality in your code: - * [`url::format::PathFormatter`](https://github.com/servo/rust-url/pull/176/commits/9e759f18726c8e1343162922b87163d4dd08fe3c#diff-0bb16ac13b75e9b568fa4aff61b0e71dL24) - * [`url::format::UserInfoFormatter`](https://github.com/servo/rust-url/pull/176/commits/9e759f18726c8e1343162922b87163d4dd08fe3c#diff-0bb16ac13b75e9b568fa4aff61b0e71dL50) - * [`url::format::UrlNoFragmentFormatter`](https://github.com/servo/rust-url/pull/176/commits/9e759f18726c8e1343162922b87163d4dd08fe3c#diff-0bb16ac13b75e9b568fa4aff61b0e71dL70) - -* `url::percent_encoding::percent_decode()` used to have a return type of `Vec<u8>`; - now it returns an iterator of decoded `u8` bytes that also implements `Into<Cow<u8>>`. - Use `.into().to_owned()` to obtain a `Vec<u8>`. - (`.collect()` also works but might not be as efficient.) - -* The `url::percent_encoding::EncodeSet` struct and constant instances - used with `url::percent_encoding::percent_encode()` - have been changed to structs that implement the trait `url::percent_encoding::EncodeSet`. - * `SIMPLE_ENCODE_SET`, `QUERY_ENCODE_SET`, `DEFAULT_ENCODE_SET`, - and `USERINFO_ENCODE_SET` have the same behavior. - * `USERNAME_ENCODE_SET` and `PASSWORD_ENCODE_SET` have been removed; - use `USERINFO_ENCODE_SET` instead. - * `HTTP_VALUE_ENCODE_SET` has been removed; - an implementation of it in the new types can be found [in hyper's source]( - https://github.com/hyperium/hyper/blob/67436c5bf615cf5a55a71e32b788afef5985570e/src/header/parsing.rs#L131-L138) - if you need to replicate this functionality in your code. - * `FORM_URLENCODED_ENCODE_SET` has been removed; - instead, use the functionality in `url::form_urlencoded`. - * `PATH_SEGMENT_ENCODE_SET` has been added for use on '/'-separated path segments. - -* `url::percent_encoding::percent_decode_to()` has been removed. - Use `url::percent_encoding::percent_decode()` which returns an iterator. - You can then use the iterator’s `collect()` method - or give it to some data structure’s `extend()` method. -* A number of `ParseError` variants have changed. - [See the documentation for the current set](http://servo.github.io/rust-url/url/enum.ParseError.html). -* `url::OpaqueOrigin::new()` and `url::Origin::UID(OpaqueOrigin)` - have been replaced by `url::Origin::new_opaque()` and `url::Origin::Opaque(OpaqueOrigin)`, respectively. diff --git a/third_party/rust/url/appveyor.yml b/third_party/rust/url/appveyor.yml deleted file mode 100644 index 5819d38b1..000000000 --- a/third_party/rust/url/appveyor.yml +++ /dev/null @@ -1,13 +0,0 @@ -install: - - ps: Start-FileDownload 'https://static.rust-lang.org/dist/rust-nightly-i686-pc-windows-gnu.exe' - - rust-nightly-i686-pc-windows-gnu.exe /VERYSILENT /NORESTART /DIR="C:\Program Files (x86)\Rust" - - SET PATH=%PATH%;C:\Program Files (x86)\Rust\bin - - rustc -V - - cargo -V - - git submodule update --init --recursive - -build: false - -test_script: - - cargo build - - cargo test --verbose diff --git a/third_party/rust/url/docs/.nojekyll b/third_party/rust/url/docs/.nojekyll deleted file mode 100644 index e69de29bb..000000000 --- a/third_party/rust/url/docs/.nojekyll +++ /dev/null diff --git a/third_party/rust/url/docs/404.html b/third_party/rust/url/docs/404.html deleted file mode 100644 index b13eac0ee..000000000 --- a/third_party/rust/url/docs/404.html +++ /dev/null @@ -1,3 +0,0 @@ -<meta http-equiv="refresh" content="0; url=https://docs.rs/url/"> -<link rel="canonical" href="https://docs.rs/url/"> -<a href="https://docs.rs/url/">Moved to docs.rs</a> diff --git a/third_party/rust/url/docs/index.html b/third_party/rust/url/docs/index.html deleted file mode 100644 index b13eac0ee..000000000 --- a/third_party/rust/url/docs/index.html +++ /dev/null @@ -1,3 +0,0 @@ -<meta http-equiv="refresh" content="0; url=https://docs.rs/url/"> -<link rel="canonical" href="https://docs.rs/url/"> -<a href="https://docs.rs/url/">Moved to docs.rs</a> diff --git a/third_party/rust/url/github.png b/third_party/rust/url/github.png Binary files differdeleted file mode 100644 index b2c327097..000000000 --- a/third_party/rust/url/github.png +++ /dev/null diff --git a/third_party/rust/url/rust-url-todo b/third_party/rust/url/rust-url-todo deleted file mode 100644 index 6aeefbf13..000000000 --- a/third_party/rust/url/rust-url-todo +++ /dev/null @@ -1,14 +0,0 @@ -* standalone path parsing? -* Test setters - * Test trim C0/space - * Test remove tab & newline - - - -#[test] -fn test_path_segments() { - let mut url = Url::parse("http://example.net").unwrap(); - url.push_path_segment("foo").unwrap(); - url.extend_path_segments(&["bar", "b/az"]).unwrap(); - assert_eq!(url.as_str(), "http://example.net/foo"); -} diff --git a/third_party/rust/url/src/encoding.rs b/third_party/rust/url/src/encoding.rs deleted file mode 100644 index 0703c788f..000000000 --- a/third_party/rust/url/src/encoding.rs +++ /dev/null @@ -1,135 +0,0 @@ -// Copyright 2013-2014 The rust-url developers. -// -// Licensed under the Apache License, Version 2.0 <LICENSE-APACHE or -// http://www.apache.org/licenses/LICENSE-2.0> or the MIT license -// <LICENSE-MIT or http://opensource.org/licenses/MIT>, at your -// option. This file may not be copied, modified, or distributed -// except according to those terms. - - -//! Abstraction that conditionally compiles either to rust-encoding, -//! or to only support UTF-8. - -#[cfg(feature = "query_encoding")] extern crate encoding; - -use std::borrow::Cow; - -#[cfg(feature = "query_encoding")] use self::encoding::types::{DecoderTrap, EncoderTrap}; -#[cfg(feature = "query_encoding")] use self::encoding::label::encoding_from_whatwg_label; -#[cfg(feature = "query_encoding")] pub use self::encoding::types::EncodingRef; - -#[cfg(feature = "query_encoding")] -#[derive(Copy, Clone)] -pub struct EncodingOverride { - /// `None` means UTF-8. - encoding: Option<EncodingRef> -} - -#[cfg(feature = "query_encoding")] -impl EncodingOverride { - pub fn from_opt_encoding(encoding: Option<EncodingRef>) -> Self { - encoding.map(Self::from_encoding).unwrap_or_else(Self::utf8) - } - - pub fn from_encoding(encoding: EncodingRef) -> Self { - EncodingOverride { - encoding: if encoding.name() == "utf-8" { None } else { Some(encoding) } - } - } - - #[inline] - pub fn utf8() -> Self { - EncodingOverride { encoding: None } - } - - pub fn lookup(label: &[u8]) -> Option<Self> { - // Don't use String::from_utf8_lossy since no encoding label contains U+FFFD - // https://encoding.spec.whatwg.org/#names-and-labels - ::std::str::from_utf8(label) - .ok() - .and_then(encoding_from_whatwg_label) - .map(Self::from_encoding) - } - - /// https://encoding.spec.whatwg.org/#get-an-output-encoding - pub fn to_output_encoding(self) -> Self { - if let Some(encoding) = self.encoding { - if matches!(encoding.name(), "utf-16le" | "utf-16be") { - return Self::utf8() - } - } - self - } - - pub fn is_utf8(&self) -> bool { - self.encoding.is_none() - } - - pub fn name(&self) -> &'static str { - match self.encoding { - Some(encoding) => encoding.name(), - None => "utf-8", - } - } - - pub fn decode<'a>(&self, input: Cow<'a, [u8]>) -> Cow<'a, str> { - match self.encoding { - // `encoding.decode` never returns `Err` when called with `DecoderTrap::Replace` - Some(encoding) => encoding.decode(&input, DecoderTrap::Replace).unwrap().into(), - None => decode_utf8_lossy(input), - } - } - - pub fn encode<'a>(&self, input: Cow<'a, str>) -> Cow<'a, [u8]> { - match self.encoding { - // `encoding.encode` never returns `Err` when called with `EncoderTrap::NcrEscape` - Some(encoding) => Cow::Owned(encoding.encode(&input, EncoderTrap::NcrEscape).unwrap()), - None => encode_utf8(input) - } - } -} - - -#[cfg(not(feature = "query_encoding"))] -#[derive(Copy, Clone)] -pub struct EncodingOverride; - -#[cfg(not(feature = "query_encoding"))] -impl EncodingOverride { - #[inline] - pub fn utf8() -> Self { - EncodingOverride - } - - pub fn decode<'a>(&self, input: Cow<'a, [u8]>) -> Cow<'a, str> { - decode_utf8_lossy(input) - } - - pub fn encode<'a>(&self, input: Cow<'a, str>) -> Cow<'a, [u8]> { - encode_utf8(input) - } -} - -pub fn decode_utf8_lossy(input: Cow<[u8]>) -> Cow<str> { - match input { - Cow::Borrowed(bytes) => String::from_utf8_lossy(bytes), - Cow::Owned(bytes) => { - let raw_utf8: *const [u8]; - match String::from_utf8_lossy(&bytes) { - Cow::Borrowed(utf8) => raw_utf8 = utf8.as_bytes(), - Cow::Owned(s) => return s.into(), - } - // from_utf8_lossy returned a borrow of `bytes` unchanged. - debug_assert!(raw_utf8 == &*bytes as *const [u8]); - // Reuse the existing `Vec` allocation. - unsafe { String::from_utf8_unchecked(bytes) }.into() - } - } -} - -pub fn encode_utf8(input: Cow<str>) -> Cow<[u8]> { - match input { - Cow::Borrowed(s) => Cow::Borrowed(s.as_bytes()), - Cow::Owned(s) => Cow::Owned(s.into_bytes()) - } -} diff --git a/third_party/rust/url/src/form_urlencoded.rs b/third_party/rust/url/src/form_urlencoded.rs deleted file mode 100644 index f4a655507..000000000 --- a/third_party/rust/url/src/form_urlencoded.rs +++ /dev/null @@ -1,364 +0,0 @@ -// Copyright 2013-2016 The rust-url developers. -// -// Licensed under the Apache License, Version 2.0 <LICENSE-APACHE or -// http://www.apache.org/licenses/LICENSE-2.0> or the MIT license -// <LICENSE-MIT or http://opensource.org/licenses/MIT>, at your -// option. This file may not be copied, modified, or distributed -// except according to those terms. - -//! Parser and serializer for the [`application/x-www-form-urlencoded` syntax]( -//! http://url.spec.whatwg.org/#application/x-www-form-urlencoded), -//! as used by HTML forms. -//! -//! Converts between a string (such as an URL’s query string) -//! and a sequence of (name, value) pairs. - -use encoding::EncodingOverride; -use percent_encoding::{percent_encode_byte, percent_decode}; -use std::borrow::{Borrow, Cow}; -use std::str; - - -/// Convert a byte string in the `application/x-www-form-urlencoded` syntax -/// into a iterator of (name, value) pairs. -/// -/// Use `parse(input.as_bytes())` to parse a `&str` string. -/// -/// The names and values are percent-decoded. For instance, `%23first=%25try%25` will be -/// converted to `[("#first", "%try%")]`. -#[inline] -pub fn parse(input: &[u8]) -> Parse { - Parse { - input: input, - encoding: EncodingOverride::utf8(), - } -} - - -/// Convert a byte string in the `application/x-www-form-urlencoded` syntax -/// into a iterator of (name, value) pairs. -/// -/// Use `parse(input.as_bytes())` to parse a `&str` string. -/// -/// This function is only available if the `query_encoding` Cargo feature is enabled. -/// -/// Arguments: -/// -/// * `encoding_override`: The character encoding each name and values is decoded as -/// after percent-decoding. Defaults to UTF-8. -/// * `use_charset`: The *use _charset_ flag*. If in doubt, set to `false`. -#[cfg(feature = "query_encoding")] -pub fn parse_with_encoding<'a>(input: &'a [u8], - encoding_override: Option<::encoding::EncodingRef>, - use_charset: bool) - -> Result<Parse<'a>, ()> { - use std::ascii::AsciiExt; - - let mut encoding = EncodingOverride::from_opt_encoding(encoding_override); - if !(encoding.is_utf8() || input.is_ascii()) { - return Err(()) - } - if use_charset { - for sequence in input.split(|&b| b == b'&') { - // No '+' in "_charset_" to replace with ' '. - if sequence.starts_with(b"_charset_=") { - let value = &sequence[b"_charset_=".len()..]; - // Skip replacing '+' with ' ' in value since no encoding label contains either: - // https://encoding.spec.whatwg.org/#names-and-labels - if let Some(e) = EncodingOverride::lookup(value) { - encoding = e; - break - } - } - } - } - Ok(Parse { - input: input, - encoding: encoding, - }) -} - -/// The return type of `parse()`. -#[derive(Copy, Clone)] -pub struct Parse<'a> { - input: &'a [u8], - encoding: EncodingOverride, -} - -impl<'a> Iterator for Parse<'a> { - type Item = (Cow<'a, str>, Cow<'a, str>); - - fn next(&mut self) -> Option<Self::Item> { - loop { - if self.input.is_empty() { - return None - } - let mut split2 = self.input.splitn(2, |&b| b == b'&'); - let sequence = split2.next().unwrap(); - self.input = split2.next().unwrap_or(&[][..]); - if sequence.is_empty() { - continue - } - let mut split2 = sequence.splitn(2, |&b| b == b'='); - let name = split2.next().unwrap(); - let value = split2.next().unwrap_or(&[][..]); - return Some(( - decode(name, self.encoding), - decode(value, self.encoding), - )) - } - } -} - -fn decode(input: &[u8], encoding: EncodingOverride) -> Cow<str> { - let replaced = replace_plus(input); - encoding.decode(match percent_decode(&replaced).if_any() { - Some(vec) => Cow::Owned(vec), - None => replaced, - }) -} - -/// Replace b'+' with b' ' -fn replace_plus<'a>(input: &'a [u8]) -> Cow<'a, [u8]> { - match input.iter().position(|&b| b == b'+') { - None => Cow::Borrowed(input), - Some(first_position) => { - let mut replaced = input.to_owned(); - replaced[first_position] = b' '; - for byte in &mut replaced[first_position + 1..] { - if *byte == b'+' { - *byte = b' '; - } - } - Cow::Owned(replaced) - } - } -} - -impl<'a> Parse<'a> { - /// Return a new iterator that yields pairs of `String` instead of pairs of `Cow<str>`. - pub fn into_owned(self) -> ParseIntoOwned<'a> { - ParseIntoOwned { inner: self } - } -} - -/// Like `Parse`, but yields pairs of `String` instead of pairs of `Cow<str>`. -pub struct ParseIntoOwned<'a> { - inner: Parse<'a> -} - -impl<'a> Iterator for ParseIntoOwned<'a> { - type Item = (String, String); - - fn next(&mut self) -> Option<Self::Item> { - self.inner.next().map(|(k, v)| (k.into_owned(), v.into_owned())) - } -} - -/// The [`application/x-www-form-urlencoded` byte serializer]( -/// https://url.spec.whatwg.org/#concept-urlencoded-byte-serializer). -/// -/// Return an iterator of `&str` slices. -pub fn byte_serialize(input: &[u8]) -> ByteSerialize { - ByteSerialize { - bytes: input, - } -} - -/// Return value of `byte_serialize()`. -pub struct ByteSerialize<'a> { - bytes: &'a [u8], -} - -fn byte_serialized_unchanged(byte: u8) -> bool { - matches!(byte, b'*' | b'-' | b'.' | b'0' ... b'9' | b'A' ... b'Z' | b'_' | b'a' ... b'z') -} - -impl<'a> Iterator for ByteSerialize<'a> { - type Item = &'a str; - - fn next(&mut self) -> Option<&'a str> { - if let Some((&first, tail)) = self.bytes.split_first() { - if !byte_serialized_unchanged(first) { - self.bytes = tail; - return Some(if first == b' ' { "+" } else { percent_encode_byte(first) }) - } - let position = tail.iter().position(|&b| !byte_serialized_unchanged(b)); - let (unchanged_slice, remaining) = match position { - // 1 for first_byte + i unchanged in tail - Some(i) => self.bytes.split_at(1 + i), - None => (self.bytes, &[][..]), - }; - self.bytes = remaining; - Some(unsafe { str::from_utf8_unchecked(unchanged_slice) }) - } else { - None - } - } - - fn size_hint(&self) -> (usize, Option<usize>) { - if self.bytes.is_empty() { - (0, Some(0)) - } else { - (1, Some(self.bytes.len())) - } - } -} - -/// The [`application/x-www-form-urlencoded` serializer]( -/// https://url.spec.whatwg.org/#concept-urlencoded-serializer). -pub struct Serializer<T: Target> { - target: Option<T>, - start_position: usize, - encoding: EncodingOverride, -} - -pub trait Target { - fn as_mut_string(&mut self) -> &mut String; - fn finish(self) -> Self::Finished; - type Finished; -} - -impl Target for String { - fn as_mut_string(&mut self) -> &mut String { self } - fn finish(self) -> Self { self } - type Finished = Self; -} - -impl<'a> Target for &'a mut String { - fn as_mut_string(&mut self) -> &mut String { &mut **self } - fn finish(self) -> Self { self } - type Finished = Self; -} - -// `as_mut_string` string here exposes the internal serialization of an `Url`, -// which should not be exposed to users. -// We achieve that by not giving users direct access to `UrlQuery`: -// * Its fields are private -// (and so can not be constructed with struct literal syntax outside of this crate), -// * It has no constructor -// * It is only visible (on the type level) to users in the return type of -// `Url::query_pairs_mut` which is `Serializer<UrlQuery>` -// * `Serializer` keeps its target in a private field -// * Unlike in other `Target` impls, `UrlQuery::finished` does not return `Self`. -impl<'a> Target for ::UrlQuery<'a> { - fn as_mut_string(&mut self) -> &mut String { &mut self.url.serialization } - fn finish(self) -> &'a mut ::Url { self.url } - type Finished = &'a mut ::Url; -} - -impl<T: Target> Serializer<T> { - /// Create a new `application/x-www-form-urlencoded` serializer for the given target. - /// - /// If the target is non-empty, - /// its content is assumed to already be in `application/x-www-form-urlencoded` syntax. - pub fn new(target: T) -> Self { - Self::for_suffix(target, 0) - } - - /// Create a new `application/x-www-form-urlencoded` serializer - /// for a suffix of the given target. - /// - /// If that suffix is non-empty, - /// its content is assumed to already be in `application/x-www-form-urlencoded` syntax. - pub fn for_suffix(mut target: T, start_position: usize) -> Self { - &target.as_mut_string()[start_position..]; // Panic if out of bounds - Serializer { - target: Some(target), - start_position: start_position, - encoding: EncodingOverride::utf8(), - } - } - - /// Remove any existing name/value pair. - /// - /// Panics if called after `.finish()`. - pub fn clear(&mut self) -> &mut Self { - string(&mut self.target).truncate(self.start_position); - self - } - - /// Set the character encoding to be used for names and values before percent-encoding. - #[cfg(feature = "query_encoding")] - pub fn encoding_override(&mut self, new: Option<::encoding::EncodingRef>) -> &mut Self { - self.encoding = EncodingOverride::from_opt_encoding(new).to_output_encoding(); - self - } - - /// Serialize and append a name/value pair. - /// - /// Panics if called after `.finish()`. - pub fn append_pair(&mut self, name: &str, value: &str) -> &mut Self { - append_pair(string(&mut self.target), self.start_position, self.encoding, name, value); - self - } - - /// Serialize and append a number of name/value pairs. - /// - /// This simply calls `append_pair` repeatedly. - /// This can be more convenient, so the user doesn’t need to introduce a block - /// to limit the scope of `Serializer`’s borrow of its string. - /// - /// Panics if called after `.finish()`. - pub fn extend_pairs<I, K, V>(&mut self, iter: I) -> &mut Self - where I: IntoIterator, I::Item: Borrow<(K, V)>, K: AsRef<str>, V: AsRef<str> { - { - let string = string(&mut self.target); - for pair in iter { - let &(ref k, ref v) = pair.borrow(); - append_pair(string, self.start_position, self.encoding, k.as_ref(), v.as_ref()); - } - } - self - } - - /// Add a name/value pair whose name is `_charset_` - /// and whose value is the character encoding’s name. - /// (See the `encoding_override()` method.) - /// - /// Panics if called after `.finish()`. - #[cfg(feature = "query_encoding")] - pub fn append_charset(&mut self) -> &mut Self { - { - let string = string(&mut self.target); - append_separator_if_needed(string, self.start_position); - string.push_str("_charset_="); - string.push_str(self.encoding.name()); - } - self - } - - /// If this serializer was constructed with a string, take and return that string. - /// - /// ```rust - /// use url::form_urlencoded; - /// let encoded: String = form_urlencoded::Serializer::new(String::new()) - /// .append_pair("foo", "bar & baz") - /// .append_pair("saison", "Été+hiver") - /// .finish(); - /// assert_eq!(encoded, "foo=bar+%26+baz&saison=%C3%89t%C3%A9%2Bhiver"); - /// ``` - /// - /// Panics if called more than once. - pub fn finish(&mut self) -> T::Finished { - self.target.take().expect("url::form_urlencoded::Serializer double finish").finish() - } -} - -fn append_separator_if_needed(string: &mut String, start_position: usize) { - if string.len() > start_position { - string.push('&') - } -} - -fn string<T: Target>(target: &mut Option<T>) -> &mut String { - target.as_mut().expect("url::form_urlencoded::Serializer finished").as_mut_string() -} - -fn append_pair(string: &mut String, start_position: usize, encoding: EncodingOverride, - name: &str, value: &str) { - append_separator_if_needed(string, start_position); - string.extend(byte_serialize(&encoding.encode(name.into()))); - string.push('='); - string.extend(byte_serialize(&encoding.encode(value.into()))); -} diff --git a/third_party/rust/url/src/host.rs b/third_party/rust/url/src/host.rs deleted file mode 100644 index 47b049a27..000000000 --- a/third_party/rust/url/src/host.rs +++ /dev/null @@ -1,418 +0,0 @@ -// Copyright 2013-2016 The rust-url developers. -// -// Licensed under the Apache License, Version 2.0 <LICENSE-APACHE or -// http://www.apache.org/licenses/LICENSE-2.0> or the MIT license -// <LICENSE-MIT or http://opensource.org/licenses/MIT>, at your -// option. This file may not be copied, modified, or distributed -// except according to those terms. - -#[cfg(feature = "heapsize")] use heapsize::HeapSizeOf; -use std::cmp; -use std::fmt::{self, Formatter}; -use std::io; -use std::net::{Ipv4Addr, Ipv6Addr, SocketAddr, SocketAddrV4, SocketAddrV6, ToSocketAddrs}; -use std::vec; -use parser::{ParseResult, ParseError}; -use percent_encoding::percent_decode; -use idna; - -#[derive(Copy, Clone, Debug, Eq, PartialEq)] -pub enum HostInternal { - None, - Domain, - Ipv4(Ipv4Addr), - Ipv6(Ipv6Addr), -} - -#[cfg(feature = "heapsize")] -known_heap_size!(0, HostInternal); - -impl<S> From<Host<S>> for HostInternal { - fn from(host: Host<S>) -> HostInternal { - match host { - Host::Domain(_) => HostInternal::Domain, - Host::Ipv4(address) => HostInternal::Ipv4(address), - Host::Ipv6(address) => HostInternal::Ipv6(address), - } - } -} - -/// The host name of an URL. -#[derive(Clone, Debug, Eq, PartialEq, Ord, PartialOrd, Hash)] -pub enum Host<S=String> { - /// A DNS domain name, as '.' dot-separated labels. - /// Non-ASCII labels are encoded in punycode per IDNA. - Domain(S), - - /// An IPv4 address. - /// `Url::host_str` returns the serialization of this address, - /// as four decimal integers separated by `.` dots. - Ipv4(Ipv4Addr), - - /// An IPv6 address. - /// `Url::host_str` returns the serialization of that address between `[` and `]` brackets, - /// in the format per [RFC 5952 *A Recommendation - /// for IPv6 Address Text Representation*](https://tools.ietf.org/html/rfc5952): - /// lowercase hexadecimal with maximal `::` compression. - Ipv6(Ipv6Addr), -} - -#[cfg(feature = "heapsize")] -impl<S: HeapSizeOf> HeapSizeOf for Host<S> { - fn heap_size_of_children(&self) -> usize { - match *self { - Host::Domain(ref s) => s.heap_size_of_children(), - _ => 0, - } - } -} - -impl<'a> Host<&'a str> { - /// Return a copy of `self` that owns an allocated `String` but does not borrow an `&Url`. - pub fn to_owned(&self) -> Host<String> { - match *self { - Host::Domain(domain) => Host::Domain(domain.to_owned()), - Host::Ipv4(address) => Host::Ipv4(address), - Host::Ipv6(address) => Host::Ipv6(address), - } - } -} - -impl Host<String> { - /// Parse a host: either an IPv6 address in [] square brackets, or a domain. - /// - /// https://url.spec.whatwg.org/#host-parsing - pub fn parse(input: &str) -> Result<Self, ParseError> { - if input.starts_with("[") { - if !input.ends_with("]") { - return Err(ParseError::InvalidIpv6Address) - } - return parse_ipv6addr(&input[1..input.len() - 1]).map(Host::Ipv6) - } - let domain = percent_decode(input.as_bytes()).decode_utf8_lossy(); - let domain = try!(idna::domain_to_ascii(&domain)); - if domain.find(|c| matches!(c, - '\0' | '\t' | '\n' | '\r' | ' ' | '#' | '%' | '/' | ':' | '?' | '@' | '[' | '\\' | ']' - )).is_some() { - return Err(ParseError::InvalidDomainCharacter) - } - if let Some(address) = try!(parse_ipv4addr(&domain)) { - Ok(Host::Ipv4(address)) - } else { - Ok(Host::Domain(domain.into())) - } - } -} - -impl<S: AsRef<str>> fmt::Display for Host<S> { - fn fmt(&self, f: &mut Formatter) -> fmt::Result { - match *self { - Host::Domain(ref domain) => domain.as_ref().fmt(f), - Host::Ipv4(ref addr) => addr.fmt(f), - Host::Ipv6(ref addr) => { - try!(f.write_str("[")); - try!(write_ipv6(addr, f)); - f.write_str("]") - } - } - } -} - -/// This mostly exists because coherence rules don’t allow us to implement -/// `ToSocketAddrs for (Host<S>, u16)`. -pub struct HostAndPort<S=String> { - pub host: Host<S>, - pub port: u16, -} - -impl<'a> HostAndPort<&'a str> { - /// Return a copy of `self` that owns an allocated `String` but does not borrow an `&Url`. - pub fn to_owned(&self) -> HostAndPort<String> { - HostAndPort { - host: self.host.to_owned(), - port: self.port - } - } -} - -impl<S: AsRef<str>> ToSocketAddrs for HostAndPort<S> { - type Iter = SocketAddrs; - - fn to_socket_addrs(&self) -> io::Result<Self::Iter> { - let port = self.port; - match self.host { - Host::Domain(ref domain) => Ok(SocketAddrs { - // FIXME: use std::net::lookup_host when it’s stable. - state: SocketAddrsState::Domain(try!((domain.as_ref(), port).to_socket_addrs())) - }), - Host::Ipv4(address) => Ok(SocketAddrs { - state: SocketAddrsState::One(SocketAddr::V4(SocketAddrV4::new(address, port))) - }), - Host::Ipv6(address) => Ok(SocketAddrs { - state: SocketAddrsState::One(SocketAddr::V6(SocketAddrV6::new(address, port, 0, 0))) - }), - } - } -} - -/// Socket addresses for an URL. -pub struct SocketAddrs { - state: SocketAddrsState -} - -enum SocketAddrsState { - Domain(vec::IntoIter<SocketAddr>), - One(SocketAddr), - Done, -} - -impl Iterator for SocketAddrs { - type Item = SocketAddr; - fn next(&mut self) -> Option<SocketAddr> { - match self.state { - SocketAddrsState::Domain(ref mut iter) => iter.next(), - SocketAddrsState::One(s) => { - self.state = SocketAddrsState::Done; - Some(s) - } - SocketAddrsState::Done => None - } - } -} - -fn write_ipv6(addr: &Ipv6Addr, f: &mut Formatter) -> fmt::Result { - let segments = addr.segments(); - let (compress_start, compress_end) = longest_zero_sequence(&segments); - let mut i = 0; - while i < 8 { - if i == compress_start { - try!(f.write_str(":")); - if i == 0 { - try!(f.write_str(":")); - } - if compress_end < 8 { - i = compress_end; - } else { - break; - } - } - try!(write!(f, "{:x}", segments[i as usize])); - if i < 7 { - try!(f.write_str(":")); - } - i += 1; - } - Ok(()) -} - -fn longest_zero_sequence(pieces: &[u16; 8]) -> (isize, isize) { - let mut longest = -1; - let mut longest_length = -1; - let mut start = -1; - macro_rules! finish_sequence( - ($end: expr) => { - if start >= 0 { - let length = $end - start; - if length > longest_length { - longest = start; - longest_length = length; - } - } - }; - ); - for i in 0..8 { - if pieces[i as usize] == 0 { - if start < 0 { - start = i; - } - } else { - finish_sequence!(i); - start = -1; - } - } - finish_sequence!(8); - (longest, longest + longest_length) -} - - -fn parse_ipv4number(mut input: &str) -> Result<u32, ()> { - let mut r = 10; - if input.starts_with("0x") || input.starts_with("0X") { - input = &input[2..]; - r = 16; - } else if input.len() >= 2 && input.starts_with("0") { - input = &input[1..]; - r = 8; - } - if input.is_empty() { - return Ok(0); - } - if input.starts_with("+") { - return Err(()) - } - match u32::from_str_radix(&input, r) { - Ok(number) => Ok(number), - Err(_) => Err(()), - } -} - -fn parse_ipv4addr(input: &str) -> ParseResult<Option<Ipv4Addr>> { - if input.is_empty() { - return Ok(None) - } - let mut parts: Vec<&str> = input.split('.').collect(); - if parts.last() == Some(&"") { - parts.pop(); - } - if parts.len() > 4 { - return Ok(None); - } - let mut numbers: Vec<u32> = Vec::new(); - for part in parts { - if part == "" { - return Ok(None); - } - if let Ok(n) = parse_ipv4number(part) { - numbers.push(n); - } else { - return Ok(None); - } - } - let mut ipv4 = numbers.pop().expect("a non-empty list of numbers"); - // Equivalent to: ipv4 >= 256 ** (4 − numbers.len()) - if ipv4 > u32::max_value() >> (8 * numbers.len() as u32) { - return Err(ParseError::InvalidIpv4Address); - } - if numbers.iter().any(|x| *x > 255) { - return Err(ParseError::InvalidIpv4Address); - } - for (counter, n) in numbers.iter().enumerate() { - ipv4 += n << (8 * (3 - counter as u32)) - } - Ok(Some(Ipv4Addr::from(ipv4))) -} - - -fn parse_ipv6addr(input: &str) -> ParseResult<Ipv6Addr> { - let input = input.as_bytes(); - let len = input.len(); - let mut is_ip_v4 = false; - let mut pieces = [0, 0, 0, 0, 0, 0, 0, 0]; - let mut piece_pointer = 0; - let mut compress_pointer = None; - let mut i = 0; - - if len < 2 { - return Err(ParseError::InvalidIpv6Address) - } - - if input[0] == b':' { - if input[1] != b':' { - return Err(ParseError::InvalidIpv6Address) - } - i = 2; - piece_pointer = 1; - compress_pointer = Some(1); - } - - while i < len { - if piece_pointer == 8 { - return Err(ParseError::InvalidIpv6Address) - } - if input[i] == b':' { - if compress_pointer.is_some() { - return Err(ParseError::InvalidIpv6Address) - } - i += 1; - piece_pointer += 1; - compress_pointer = Some(piece_pointer); - continue - } - let start = i; - let end = cmp::min(len, start + 4); - let mut value = 0u16; - while i < end { - match (input[i] as char).to_digit(16) { - Some(digit) => { - value = value * 0x10 + digit as u16; - i += 1; - }, - None => break - } - } - if i < len { - match input[i] { - b'.' => { - if i == start { - return Err(ParseError::InvalidIpv6Address) - } - i = start; - is_ip_v4 = true; - }, - b':' => { - i += 1; - if i == len { - return Err(ParseError::InvalidIpv6Address) - } - }, - _ => return Err(ParseError::InvalidIpv6Address) - } - } - if is_ip_v4 { - break - } - pieces[piece_pointer] = value; - piece_pointer += 1; - } - - if is_ip_v4 { - if piece_pointer > 6 { - return Err(ParseError::InvalidIpv6Address) - } - let mut dots_seen = 0; - while i < len { - // FIXME: https://github.com/whatwg/url/commit/1c22aa119c354e0020117e02571cec53f7c01064 - let mut value = 0u16; - while i < len { - let digit = match input[i] { - c @ b'0' ... b'9' => c - b'0', - _ => break - }; - value = value * 10 + digit as u16; - if value == 0 || value > 255 { - return Err(ParseError::InvalidIpv6Address) - } - } - if dots_seen < 3 && !(i < len && input[i] == b'.') { - return Err(ParseError::InvalidIpv6Address) - } - pieces[piece_pointer] = pieces[piece_pointer] * 0x100 + value; - if dots_seen == 0 || dots_seen == 2 { - piece_pointer += 1; - } - i += 1; - if dots_seen == 3 && i < len { - return Err(ParseError::InvalidIpv6Address) - } - dots_seen += 1; - } - } - - match compress_pointer { - Some(compress_pointer) => { - let mut swaps = piece_pointer - compress_pointer; - piece_pointer = 7; - while swaps > 0 { - pieces[piece_pointer] = pieces[compress_pointer + swaps - 1]; - pieces[compress_pointer + swaps - 1] = 0; - swaps -= 1; - piece_pointer -= 1; - } - } - _ => if piece_pointer != 8 { - return Err(ParseError::InvalidIpv6Address) - } - } - Ok(Ipv6Addr::new(pieces[0], pieces[1], pieces[2], pieces[3], - pieces[4], pieces[5], pieces[6], pieces[7])) -} diff --git a/third_party/rust/url/src/lib.rs b/third_party/rust/url/src/lib.rs deleted file mode 100644 index 9378318b4..000000000 --- a/third_party/rust/url/src/lib.rs +++ /dev/null @@ -1,1456 +0,0 @@ -// Copyright 2013-2015 The rust-url developers. -// -// Licensed under the Apache License, Version 2.0 <LICENSE-APACHE or -// http://www.apache.org/licenses/LICENSE-2.0> or the MIT license -// <LICENSE-MIT or http://opensource.org/licenses/MIT>, at your -// option. This file may not be copied, modified, or distributed -// except according to those terms. - -/*! - -rust-url is an implementation of the [URL Standard](http://url.spec.whatwg.org/) -for the [Rust](http://rust-lang.org/) programming language. - -It builds with [Cargo](http://crates.io/). -To use it in your project, add this to your `Cargo.toml` file: - -```Cargo -[dependencies.url] -git = "https://github.com/servo/rust-url" -``` - -Supporting encodings other than UTF-8 in query strings is an optional feature -that requires [rust-encoding](https://github.com/lifthrasiir/rust-encoding) -and is off by default. -You can enable it with -[Cargo’s *features* mechanism](http://doc.crates.io/manifest.html#the-[features]-section): - -```Cargo -[dependencies.url] -git = "https://github.com/servo/rust-url" -features = ["query_encoding"] -``` - -… or by passing `--cfg 'feature="query_encoding"'` to rustc. - - -# URL parsing and data structures - -First, URL parsing may fail for various reasons and therefore returns a `Result`. - -``` -use url::{Url, ParseError}; - -assert!(Url::parse("http://[:::1]") == Err(ParseError::InvalidIpv6Address)) -``` - -Let’s parse a valid URL and look at its components. - -``` -use url::{Url, Host}; - -let issue_list_url = Url::parse( - "https://github.com/rust-lang/rust/issues?labels=E-easy&state=open" -).unwrap(); - - -assert!(issue_list_url.scheme() == "https"); -assert!(issue_list_url.username() == ""); -assert!(issue_list_url.password() == None); -assert!(issue_list_url.host_str() == Some("github.com")); -assert!(issue_list_url.host() == Some(Host::Domain("github.com"))); -assert!(issue_list_url.port() == None); -assert!(issue_list_url.path() == "/rust-lang/rust/issues"); -assert!(issue_list_url.path_segments().map(|c| c.collect::<Vec<_>>()) == - Some(vec!["rust-lang", "rust", "issues"])); -assert!(issue_list_url.query() == Some("labels=E-easy&state=open")); -assert!(issue_list_url.fragment() == None); -assert!(!issue_list_url.cannot_be_a_base()); -``` - -Some URLs are said to be *cannot-be-a-base*: -they don’t have a username, password, host, or port, -and their "path" is an arbitrary string rather than slash-separated segments: - -``` -use url::Url; - -let data_url = Url::parse("data:text/plain,Hello?World#").unwrap(); - -assert!(data_url.cannot_be_a_base()); -assert!(data_url.scheme() == "data"); -assert!(data_url.path() == "text/plain,Hello"); -assert!(data_url.path_segments().is_none()); -assert!(data_url.query() == Some("World")); -assert!(data_url.fragment() == Some("")); -``` - - -# Base URL - -Many contexts allow URL *references* that can be relative to a *base URL*: - -```html -<link rel="stylesheet" href="../main.css"> -``` - -Since parsed URL are absolute, giving a base is required for parsing relative URLs: - -``` -use url::{Url, ParseError}; - -assert!(Url::parse("../main.css") == Err(ParseError::RelativeUrlWithoutBase)) -``` - -Use the `join` method on an `Url` to use it as a base URL: - -``` -use url::Url; - -let this_document = Url::parse("http://servo.github.io/rust-url/url/index.html").unwrap(); -let css_url = this_document.join("../main.css").unwrap(); -assert_eq!(css_url.as_str(), "http://servo.github.io/rust-url/main.css") -*/ - -#[cfg(feature="rustc-serialize")] extern crate rustc_serialize; -#[macro_use] extern crate matches; -#[cfg(feature="serde")] extern crate serde; -#[cfg(feature="heapsize")] #[macro_use] extern crate heapsize; - -pub extern crate idna; - -use encoding::EncodingOverride; -#[cfg(feature = "heapsize")] use heapsize::HeapSizeOf; -use host::HostInternal; -use parser::{Parser, Context, SchemeType, to_u32}; -use percent_encoding::{PATH_SEGMENT_ENCODE_SET, USERINFO_ENCODE_SET, - percent_encode, percent_decode, utf8_percent_encode}; -use std::cmp; -use std::fmt::{self, Write}; -use std::hash; -use std::io; -use std::mem; -use std::net::{ToSocketAddrs, IpAddr}; -use std::ops::{Range, RangeFrom, RangeTo}; -use std::path::{Path, PathBuf}; -use std::str; - -pub use origin::{Origin, OpaqueOrigin}; -pub use host::{Host, HostAndPort, SocketAddrs}; -pub use path_segments::PathSegmentsMut; -pub use parser::ParseError; -pub use slicing::Position; - -mod encoding; -mod host; -mod origin; -mod path_segments; -mod parser; -mod slicing; - -pub mod form_urlencoded; -pub mod percent_encoding; -pub mod quirks; - -/// A parsed URL record. -#[derive(Clone)] -pub struct Url { - /// Syntax in pseudo-BNF: - /// - /// url = scheme ":" [ hierarchical | non-hierarchical ] [ "?" query ]? [ "#" fragment ]? - /// non-hierarchical = non-hierarchical-path - /// non-hierarchical-path = /* Does not start with "/" */ - /// hierarchical = authority? hierarchical-path - /// authority = "//" userinfo? host [ ":" port ]? - /// userinfo = username [ ":" password ]? "@" - /// hierarchical-path = [ "/" path-segment ]+ - serialization: String, - - // Components - scheme_end: u32, // Before ':' - username_end: u32, // Before ':' (if a password is given) or '@' (if not) - host_start: u32, - host_end: u32, - host: HostInternal, - port: Option<u16>, - path_start: u32, // Before initial '/', if any - query_start: Option<u32>, // Before '?', unlike Position::QueryStart - fragment_start: Option<u32>, // Before '#', unlike Position::FragmentStart -} - -#[cfg(feature = "heapsize")] -impl HeapSizeOf for Url { - fn heap_size_of_children(&self) -> usize { - self.serialization.heap_size_of_children() - } -} - -/// Full configuration for the URL parser. -#[derive(Copy, Clone)] -pub struct ParseOptions<'a> { - base_url: Option<&'a Url>, - encoding_override: encoding::EncodingOverride, - log_syntax_violation: Option<&'a Fn(&'static str)>, -} - -impl<'a> ParseOptions<'a> { - /// Change the base URL - pub fn base_url(mut self, new: Option<&'a Url>) -> Self { - self.base_url = new; - self - } - - /// Override the character encoding of query strings. - /// This is a legacy concept only relevant for HTML. - #[cfg(feature = "query_encoding")] - pub fn encoding_override(mut self, new: Option<encoding::EncodingRef>) -> Self { - self.encoding_override = EncodingOverride::from_opt_encoding(new).to_output_encoding(); - self - } - - /// Call the provided function or closure on non-fatal parse errors. - pub fn log_syntax_violation(mut self, new: Option<&'a Fn(&'static str)>) -> Self { - self.log_syntax_violation = new; - self - } - - /// Parse an URL string with the configuration so far. - pub fn parse(self, input: &str) -> Result<Url, ::ParseError> { - Parser { - serialization: String::with_capacity(input.len()), - base_url: self.base_url, - query_encoding_override: self.encoding_override, - log_syntax_violation: self.log_syntax_violation, - context: Context::UrlParser, - }.parse_url(input) - } -} - -impl Url { - /// Parse an absolute URL from a string. - #[inline] - pub fn parse(input: &str) -> Result<Url, ::ParseError> { - Url::options().parse(input) - } - - /// Parse a string as an URL, with this URL as the base URL. - #[inline] - pub fn join(&self, input: &str) -> Result<Url, ::ParseError> { - Url::options().base_url(Some(self)).parse(input) - } - - /// Return a default `ParseOptions` that can fully configure the URL parser. - pub fn options<'a>() -> ParseOptions<'a> { - ParseOptions { - base_url: None, - encoding_override: EncodingOverride::utf8(), - log_syntax_violation: None, - } - } - - /// Return the serialization of this URL. - /// - /// This is fast since that serialization is already stored in the `Url` struct. - #[inline] - pub fn as_str(&self) -> &str { - &self.serialization - } - - /// Return the serialization of this URL. - /// - /// This consumes the `Url` and takes ownership of the `String` stored in it. - #[inline] - pub fn into_string(self) -> String { - self.serialization - } - - /// For internal testing, not part of the public API. - /// - /// Methods of the `Url` struct assume a number of invariants. - /// This checks each of these invariants and panic if one is not met. - /// This is for testing rust-url itself. - #[doc(hidden)] - pub fn assert_invariants(&self) { - macro_rules! assert { - ($x: expr) => { - if !$x { - panic!("!( {} ) for URL {:?}", stringify!($x), self.serialization) - } - } - } - - macro_rules! assert_eq { - ($a: expr, $b: expr) => { - { - let a = $a; - let b = $b; - if a != b { - panic!("{:?} != {:?} ({} != {}) for URL {:?}", - a, b, stringify!($a), stringify!($b), self.serialization) - } - } - } - } - - assert!(self.scheme_end >= 1); - assert!(matches!(self.byte_at(0), b'a'...b'z' | b'A'...b'Z')); - assert!(self.slice(1..self.scheme_end).chars() - .all(|c| matches!(c, 'a'...'z' | 'A'...'Z' | '0'...'9' | '+' | '-' | '.'))); - assert_eq!(self.byte_at(self.scheme_end), b':'); - - if self.slice(self.scheme_end + 1 ..).starts_with("//") { - // URL with authority - match self.byte_at(self.username_end) { - b':' => { - assert!(self.host_start >= self.username_end + 2); - assert_eq!(self.byte_at(self.host_start - 1), b'@'); - } - b'@' => assert!(self.host_start == self.username_end + 1), - _ => assert_eq!(self.username_end, self.scheme_end + 3), - } - assert!(self.host_start >= self.username_end); - assert!(self.host_end >= self.host_start); - let host_str = self.slice(self.host_start..self.host_end); - match self.host { - HostInternal::None => assert_eq!(host_str, ""), - HostInternal::Ipv4(address) => assert_eq!(host_str, address.to_string()), - HostInternal::Ipv6(address) => assert_eq!(host_str, format!("[{}]", address)), - HostInternal::Domain => { - if SchemeType::from(self.scheme()).is_special() { - assert!(!host_str.is_empty()) - } - } - } - if self.path_start == self.host_end { - assert_eq!(self.port, None); - } else { - assert_eq!(self.byte_at(self.host_end), b':'); - let port_str = self.slice(self.host_end + 1..self.path_start); - assert_eq!(self.port, Some(port_str.parse::<u16>().expect("Couldn't parse port?"))); - } - assert_eq!(self.byte_at(self.path_start), b'/'); - } else { - // Anarchist URL (no authority) - assert_eq!(self.username_end, self.scheme_end + 1); - assert_eq!(self.host_start, self.scheme_end + 1); - assert_eq!(self.host_end, self.scheme_end + 1); - assert_eq!(self.host, HostInternal::None); - assert_eq!(self.port, None); - assert_eq!(self.path_start, self.scheme_end + 1); - } - if let Some(start) = self.query_start { - assert!(start > self.path_start); - assert_eq!(self.byte_at(start), b'?'); - } - if let Some(start) = self.fragment_start { - assert!(start > self.path_start); - assert_eq!(self.byte_at(start), b'#'); - } - if let (Some(query_start), Some(fragment_start)) = (self.query_start, self.fragment_start) { - assert!(fragment_start > query_start); - } - - let other = Url::parse(self.as_str()).expect("Failed to parse myself?"); - assert_eq!(&self.serialization, &other.serialization); - assert_eq!(self.scheme_end, other.scheme_end); - assert_eq!(self.username_end, other.username_end); - assert_eq!(self.host_start, other.host_start); - assert_eq!(self.host_end, other.host_end); - assert!(self.host == other.host || - // XXX No host round-trips to empty host. - // See https://github.com/whatwg/url/issues/79 - (self.host_str(), other.host_str()) == (None, Some(""))); - assert_eq!(self.port, other.port); - assert_eq!(self.path_start, other.path_start); - assert_eq!(self.query_start, other.query_start); - assert_eq!(self.fragment_start, other.fragment_start); - } - - /// Return the origin of this URL (https://url.spec.whatwg.org/#origin) - /// - /// Note: this returns an opaque origin for `file:` URLs, which causes - /// `url.origin() != url.origin()`. - /// - /// # Examples - /// - /// URL with `ftp` scheme: - /// - /// ```rust - /// use url::{Host, Origin, Url}; - /// - /// let url = Url::parse("ftp://example.com/foo").unwrap(); - /// assert_eq!(url.origin(), - /// Origin::Tuple("ftp".into(), - /// Host::Domain("example.com".into()), - /// 21)); - /// ``` - /// - /// URL with `blob` scheme: - /// - /// ```rust - /// use url::{Host, Origin, Url}; - /// - /// let url = Url::parse("blob:https://example.com/foo").unwrap(); - /// assert_eq!(url.origin(), - /// Origin::Tuple("https".into(), - /// Host::Domain("example.com".into()), - /// 443)); - /// ``` - /// - /// URL with `file` scheme: - /// - /// ```rust - /// use url::{Host, Origin, Url}; - /// - /// let url = Url::parse("file:///tmp/foo").unwrap(); - /// assert!(!url.origin().is_tuple()); - /// - /// let other_url = Url::parse("file:///tmp/foo").unwrap(); - /// assert!(url.origin() != other_url.origin()); - /// ``` - /// - /// URL with other scheme: - /// - /// ```rust - /// use url::{Host, Origin, Url}; - /// - /// let url = Url::parse("foo:bar").unwrap(); - /// assert!(!url.origin().is_tuple()); - /// ``` - #[inline] - pub fn origin(&self) -> Origin { - origin::url_origin(self) - } - - /// Return the scheme of this URL, lower-cased, as an ASCII string without the ':' delimiter. - /// - /// # Examples - /// - /// ``` - /// use url::Url; - /// - /// let url = Url::parse("file:///tmp/foo").unwrap(); - /// assert_eq!(url.scheme(), "file"); - /// ``` - #[inline] - pub fn scheme(&self) -> &str { - self.slice(..self.scheme_end) - } - - /// Return whether the URL has an 'authority', - /// which can contain a username, password, host, and port number. - /// - /// URLs that do *not* are either path-only like `unix:/run/foo.socket` - /// or cannot-be-a-base like `data:text/plain,Stuff`. - #[inline] - pub fn has_authority(&self) -> bool { - debug_assert!(self.byte_at(self.scheme_end) == b':'); - self.slice(self.scheme_end..).starts_with("://") - } - - /// Return whether this URL is a cannot-be-a-base URL, - /// meaning that parsing a relative URL string with this URL as the base will return an error. - /// - /// This is the case if the scheme and `:` delimiter are not followed by a `/` slash, - /// as is typically the case of `data:` and `mailto:` URLs. - #[inline] - pub fn cannot_be_a_base(&self) -> bool { - self.byte_at(self.path_start) != b'/' - } - - /// Return the username for this URL (typically the empty string) - /// as a percent-encoded ASCII string. - /// - /// # Examples - /// - /// ``` - /// use url::Url; - /// - /// let url = Url::parse("ftp://rms@example.com").unwrap(); - /// assert_eq!(url.username(), "rms"); - /// - /// let url = Url::parse("ftp://:secret123@example.com").unwrap(); - /// assert_eq!(url.username(), ""); - /// - /// let url = Url::parse("https://example.com").unwrap(); - /// assert_eq!(url.username(), ""); - /// ``` - pub fn username(&self) -> &str { - if self.has_authority() { - self.slice(self.scheme_end + ("://".len() as u32)..self.username_end) - } else { - "" - } - } - - /// Return the password for this URL, if any, as a percent-encoded ASCII string. - /// - /// # Examples - /// - /// ``` - /// use url::Url; - /// - /// let url = Url::parse("ftp://rms:secret123@example.com").unwrap(); - /// assert_eq!(url.password(), Some("secret123")); - /// - /// let url = Url::parse("ftp://:secret123@example.com").unwrap(); - /// assert_eq!(url.password(), Some("secret123")); - /// - /// let url = Url::parse("ftp://rms@example.com").unwrap(); - /// assert_eq!(url.password(), None); - /// - /// let url = Url::parse("https://example.com").unwrap(); - /// assert_eq!(url.password(), None); - /// ``` - pub fn password(&self) -> Option<&str> { - // This ':' is not the one marking a port number since a host can not be empty. - // (Except for file: URLs, which do not have port numbers.) - if self.has_authority() && self.byte_at(self.username_end) == b':' { - debug_assert!(self.byte_at(self.host_start - 1) == b'@'); - Some(self.slice(self.username_end + 1..self.host_start - 1)) - } else { - None - } - } - - /// Equivalent to `url.host().is_some()`. - pub fn has_host(&self) -> bool { - !matches!(self.host, HostInternal::None) - } - - /// Return the string representation of the host (domain or IP address) for this URL, if any. - /// - /// Non-ASCII domains are punycode-encoded per IDNA. - /// IPv6 addresses are given between `[` and `]` brackets. - /// - /// Cannot-be-a-base URLs (typical of `data:` and `mailto:`) and some `file:` URLs - /// don’t have a host. - /// - /// See also the `host` method. - pub fn host_str(&self) -> Option<&str> { - if self.has_host() { - Some(self.slice(self.host_start..self.host_end)) - } else { - None - } - } - - /// Return the parsed representation of the host for this URL. - /// Non-ASCII domain labels are punycode-encoded per IDNA. - /// - /// Cannot-be-a-base URLs (typical of `data:` and `mailto:`) and some `file:` URLs - /// don’t have a host. - /// - /// See also the `host_str` method. - pub fn host(&self) -> Option<Host<&str>> { - match self.host { - HostInternal::None => None, - HostInternal::Domain => Some(Host::Domain(self.slice(self.host_start..self.host_end))), - HostInternal::Ipv4(address) => Some(Host::Ipv4(address)), - HostInternal::Ipv6(address) => Some(Host::Ipv6(address)), - } - } - - /// If this URL has a host and it is a domain name (not an IP address), return it. - pub fn domain(&self) -> Option<&str> { - match self.host { - HostInternal::Domain => Some(self.slice(self.host_start..self.host_end)), - _ => None, - } - } - - /// Return the port number for this URL, if any. - #[inline] - pub fn port(&self) -> Option<u16> { - self.port - } - - /// Return the port number for this URL, or the default port number if it is known. - /// - /// This method only knows the default port number - /// of the `http`, `https`, `ws`, `wss`, `ftp`, and `gopher` schemes. - /// - /// For URLs in these schemes, this method always returns `Some(_)`. - /// For other schemes, it is the same as `Url::port()`. - #[inline] - pub fn port_or_known_default(&self) -> Option<u16> { - self.port.or_else(|| parser::default_port(self.scheme())) - } - - /// If the URL has a host, return something that implements `ToSocketAddrs`. - /// - /// If the URL has no port number and the scheme’s default port number is not known - /// (see `Url::port_or_known_default`), - /// the closure is called to obtain a port number. - /// Typically, this closure can match on the result `Url::scheme` - /// to have per-scheme default port numbers, - /// and panic for schemes it’s not prepared to handle. - /// For example: - /// - /// ```rust - /// # use url::Url; - /// # use std::net::TcpStream; - /// # use std::io; - /// - /// fn connect(url: &Url) -> io::Result<TcpStream> { - /// TcpStream::connect(try!(url.with_default_port(default_port))) - /// } - /// - /// fn default_port(url: &Url) -> Result<u16, ()> { - /// match url.scheme() { - /// "git" => Ok(9418), - /// "git+ssh" => Ok(22), - /// "git+https" => Ok(443), - /// "git+http" => Ok(80), - /// _ => Err(()), - /// } - /// } - /// ``` - pub fn with_default_port<F>(&self, f: F) -> io::Result<HostAndPort<&str>> - where F: FnOnce(&Url) -> Result<u16, ()> { - Ok(HostAndPort { - host: try!(self.host() - .ok_or(()) - .or_else(|()| io_error("URL has no host"))), - port: try!(self.port_or_known_default() - .ok_or(()) - .or_else(|()| f(self)) - .or_else(|()| io_error("URL has no port number"))) - }) - } - - /// Return the path for this URL, as a percent-encoded ASCII string. - /// For cannot-be-a-base URLs, this is an arbitrary string that doesn’t start with '/'. - /// For other URLs, this starts with a '/' slash - /// and continues with slash-separated path segments. - pub fn path(&self) -> &str { - match (self.query_start, self.fragment_start) { - (None, None) => self.slice(self.path_start..), - (Some(next_component_start), _) | - (None, Some(next_component_start)) => { - self.slice(self.path_start..next_component_start) - } - } - } - - /// Unless this URL is cannot-be-a-base, - /// return an iterator of '/' slash-separated path segments, - /// each as a percent-encoded ASCII string. - /// - /// Return `None` for cannot-be-a-base URLs. - /// - /// When `Some` is returned, the iterator always contains at least one string - /// (which may be empty). - pub fn path_segments(&self) -> Option<str::Split<char>> { - let path = self.path(); - if path.starts_with('/') { - Some(path[1..].split('/')) - } else { - None - } - } - - /// Return this URL’s query string, if any, as a percent-encoded ASCII string. - pub fn query(&self) -> Option<&str> { - match (self.query_start, self.fragment_start) { - (None, _) => None, - (Some(query_start), None) => { - debug_assert!(self.byte_at(query_start) == b'?'); - Some(self.slice(query_start + 1..)) - } - (Some(query_start), Some(fragment_start)) => { - debug_assert!(self.byte_at(query_start) == b'?'); - Some(self.slice(query_start + 1..fragment_start)) - } - } - } - - /// Parse the URL’s query string, if any, as `application/x-www-form-urlencoded` - /// and return an iterator of (key, value) pairs. - #[inline] - pub fn query_pairs(&self) -> form_urlencoded::Parse { - form_urlencoded::parse(self.query().unwrap_or("").as_bytes()) - } - - /// Return this URL’s fragment identifier, if any. - /// - /// **Note:** the parser did *not* percent-encode this component, - /// but the input may have been percent-encoded already. - pub fn fragment(&self) -> Option<&str> { - self.fragment_start.map(|start| { - debug_assert!(self.byte_at(start) == b'#'); - self.slice(start + 1..) - }) - } - - fn mutate<F: FnOnce(&mut Parser) -> R, R>(&mut self, f: F) -> R { - let mut parser = Parser::for_setter(mem::replace(&mut self.serialization, String::new())); - let result = f(&mut parser); - self.serialization = parser.serialization; - result - } - - /// Change this URL’s fragment identifier. - pub fn set_fragment(&mut self, fragment: Option<&str>) { - // Remove any previous fragment - if let Some(start) = self.fragment_start { - debug_assert!(self.byte_at(start) == b'#'); - self.serialization.truncate(start as usize); - } - // Write the new one - if let Some(input) = fragment { - self.fragment_start = Some(to_u32(self.serialization.len()).unwrap()); - self.serialization.push('#'); - self.mutate(|parser| parser.parse_fragment(parser::Input::new(input))) - } else { - self.fragment_start = None - } - } - - fn take_fragment(&mut self) -> Option<String> { - self.fragment_start.take().map(|start| { - debug_assert!(self.byte_at(start) == b'#'); - let fragment = self.slice(start + 1..).to_owned(); - self.serialization.truncate(start as usize); - fragment - }) - } - - fn restore_already_parsed_fragment(&mut self, fragment: Option<String>) { - if let Some(ref fragment) = fragment { - assert!(self.fragment_start.is_none()); - self.fragment_start = Some(to_u32(self.serialization.len()).unwrap()); - self.serialization.push('#'); - self.serialization.push_str(fragment); - } - } - - /// Change this URL’s query string. - pub fn set_query(&mut self, query: Option<&str>) { - let fragment = self.take_fragment(); - - // Remove any previous query - if let Some(start) = self.query_start.take() { - debug_assert!(self.byte_at(start) == b'?'); - self.serialization.truncate(start as usize); - } - // Write the new query, if any - if let Some(input) = query { - self.query_start = Some(to_u32(self.serialization.len()).unwrap()); - self.serialization.push('?'); - let scheme_end = self.scheme_end; - self.mutate(|parser| parser.parse_query(scheme_end, parser::Input::new(input))); - } - - self.restore_already_parsed_fragment(fragment); - } - - /// Manipulate this URL’s query string, viewed as a sequence of name/value pairs - /// in `application/x-www-form-urlencoded` syntax. - /// - /// The return value has a method-chaining API: - /// - /// ```rust - /// # use url::Url; - /// let mut url = Url::parse("https://example.net?lang=fr#nav").unwrap(); - /// assert_eq!(url.query(), Some("lang=fr")); - /// - /// url.query_pairs_mut().append_pair("foo", "bar"); - /// assert_eq!(url.query(), Some("lang=fr&foo=bar")); - /// assert_eq!(url.as_str(), "https://example.net/?lang=fr&foo=bar#nav"); - /// - /// url.query_pairs_mut() - /// .clear() - /// .append_pair("foo", "bar & baz") - /// .append_pair("saisons", "Été+hiver"); - /// assert_eq!(url.query(), Some("foo=bar+%26+baz&saisons=%C3%89t%C3%A9%2Bhiver")); - /// assert_eq!(url.as_str(), - /// "https://example.net/?foo=bar+%26+baz&saisons=%C3%89t%C3%A9%2Bhiver#nav"); - /// ``` - /// - /// Note: `url.query_pairs_mut().clear();` is equivalent to `url.set_query(Some(""))`, - /// not `url.set_query(None)`. - /// - /// The state of `Url` is unspecified if this return value is leaked without being dropped. - pub fn query_pairs_mut(&mut self) -> form_urlencoded::Serializer<UrlQuery> { - let fragment = self.take_fragment(); - - let query_start; - if let Some(start) = self.query_start { - debug_assert!(self.byte_at(start) == b'?'); - query_start = start as usize; - } else { - query_start = self.serialization.len(); - self.query_start = Some(to_u32(query_start).unwrap()); - self.serialization.push('?'); - } - - let query = UrlQuery { url: self, fragment: fragment }; - form_urlencoded::Serializer::for_suffix(query, query_start + "?".len()) - } - - fn take_after_path(&mut self) -> String { - match (self.query_start, self.fragment_start) { - (Some(i), _) | (None, Some(i)) => { - let after_path = self.slice(i..).to_owned(); - self.serialization.truncate(i as usize); - after_path - }, - (None, None) => String::new(), - } - } - - /// Change this URL’s path. - pub fn set_path(&mut self, mut path: &str) { - let after_path = self.take_after_path(); - let old_after_path_pos = to_u32(self.serialization.len()).unwrap(); - let cannot_be_a_base = self.cannot_be_a_base(); - let scheme_type = SchemeType::from(self.scheme()); - self.serialization.truncate(self.path_start as usize); - self.mutate(|parser| { - if cannot_be_a_base { - if path.starts_with('/') { - parser.serialization.push_str("%2F"); - path = &path[1..]; - } - parser.parse_cannot_be_a_base_path(parser::Input::new(path)); - } else { - let mut has_host = true; // FIXME - parser.parse_path_start(scheme_type, &mut has_host, parser::Input::new(path)); - } - }); - self.restore_after_path(old_after_path_pos, &after_path); - } - - /// Return an object with methods to manipulate this URL’s path segments. - /// - /// Return `Err(())` if this URl is cannot-be-a-base. - pub fn path_segments_mut(&mut self) -> Result<PathSegmentsMut, ()> { - if self.cannot_be_a_base() { - Err(()) - } else { - Ok(path_segments::new(self)) - } - } - - fn restore_after_path(&mut self, old_after_path_position: u32, after_path: &str) { - let new_after_path_position = to_u32(self.serialization.len()).unwrap(); - let adjust = |index: &mut u32| { - *index -= old_after_path_position; - *index += new_after_path_position; - }; - if let Some(ref mut index) = self.query_start { adjust(index) } - if let Some(ref mut index) = self.fragment_start { adjust(index) } - self.serialization.push_str(after_path) - } - - /// Change this URL’s port number. - /// - /// If this URL is cannot-be-a-base, does not have a host, or has the `file` scheme; - /// do nothing and return `Err`. - pub fn set_port(&mut self, mut port: Option<u16>) -> Result<(), ()> { - if !self.has_host() || self.scheme() == "file" { - return Err(()) - } - if port.is_some() && port == parser::default_port(self.scheme()) { - port = None - } - self.set_port_internal(port); - Ok(()) - } - - fn set_port_internal(&mut self, port: Option<u16>) { - match (self.port, port) { - (None, None) => {} - (Some(_), None) => { - self.serialization.drain(self.host_end as usize .. self.path_start as usize); - let offset = self.path_start - self.host_end; - self.path_start = self.host_end; - if let Some(ref mut index) = self.query_start { *index -= offset } - if let Some(ref mut index) = self.fragment_start { *index -= offset } - } - (Some(old), Some(new)) if old == new => {} - (_, Some(new)) => { - let path_and_after = self.slice(self.path_start..).to_owned(); - self.serialization.truncate(self.host_end as usize); - write!(&mut self.serialization, ":{}", new).unwrap(); - let old_path_start = self.path_start; - let new_path_start = to_u32(self.serialization.len()).unwrap(); - self.path_start = new_path_start; - let adjust = |index: &mut u32| { - *index -= old_path_start; - *index += new_path_start; - }; - if let Some(ref mut index) = self.query_start { adjust(index) } - if let Some(ref mut index) = self.fragment_start { adjust(index) } - self.serialization.push_str(&path_and_after); - } - } - self.port = port; - } - - /// Change this URL’s host. - /// - /// If this URL is cannot-be-a-base or there is an error parsing the given `host`, - /// do nothing and return `Err`. - /// - /// Removing the host (calling this with `None`) - /// will also remove any username, password, and port number. - pub fn set_host(&mut self, host: Option<&str>) -> Result<(), ParseError> { - if self.cannot_be_a_base() { - return Err(ParseError::SetHostOnCannotBeABaseUrl) - } - - if let Some(host) = host { - self.set_host_internal(try!(Host::parse(host)), None) - } else if self.has_host() { - debug_assert!(self.byte_at(self.scheme_end) == b':'); - debug_assert!(self.byte_at(self.path_start) == b'/'); - let new_path_start = self.scheme_end + 1; - self.serialization.drain(self.path_start as usize..new_path_start as usize); - let offset = self.path_start - new_path_start; - self.path_start = new_path_start; - self.username_end = new_path_start; - self.host_start = new_path_start; - self.host_end = new_path_start; - self.port = None; - if let Some(ref mut index) = self.query_start { *index -= offset } - if let Some(ref mut index) = self.fragment_start { *index -= offset } - } - Ok(()) - } - - /// opt_new_port: None means leave unchanged, Some(None) means remove any port number. - fn set_host_internal(&mut self, host: Host<String>, opt_new_port: Option<Option<u16>>) { - let old_suffix_pos = if opt_new_port.is_some() { self.path_start } else { self.host_end }; - let suffix = self.slice(old_suffix_pos..).to_owned(); - self.serialization.truncate(self.host_start as usize); - if !self.has_authority() { - debug_assert!(self.slice(self.scheme_end..self.host_start) == ":"); - debug_assert!(self.username_end == self.host_start); - self.serialization.push('/'); - self.serialization.push('/'); - self.username_end += 2; - self.host_start += 2; - } - write!(&mut self.serialization, "{}", host).unwrap(); - self.host_end = to_u32(self.serialization.len()).unwrap(); - self.host = host.into(); - - if let Some(new_port) = opt_new_port { - self.port = new_port; - if let Some(port) = new_port { - write!(&mut self.serialization, ":{}", port).unwrap(); - } - } - let new_suffix_pos = to_u32(self.serialization.len()).unwrap(); - self.serialization.push_str(&suffix); - - let adjust = |index: &mut u32| { - *index -= old_suffix_pos; - *index += new_suffix_pos; - }; - adjust(&mut self.path_start); - if let Some(ref mut index) = self.query_start { adjust(index) } - if let Some(ref mut index) = self.fragment_start { adjust(index) } - } - - /// Change this URL’s host to the given IP address. - /// - /// If this URL is cannot-be-a-base, do nothing and return `Err`. - /// - /// Compared to `Url::set_host`, this skips the host parser. - pub fn set_ip_host(&mut self, address: IpAddr) -> Result<(), ()> { - if self.cannot_be_a_base() { - return Err(()) - } - - let address = match address { - IpAddr::V4(address) => Host::Ipv4(address), - IpAddr::V6(address) => Host::Ipv6(address), - }; - self.set_host_internal(address, None); - Ok(()) - } - - /// Change this URL’s password. - /// - /// If this URL is cannot-be-a-base or does not have a host, do nothing and return `Err`. - pub fn set_password(&mut self, password: Option<&str>) -> Result<(), ()> { - if !self.has_host() { - return Err(()) - } - if let Some(password) = password { - let host_and_after = self.slice(self.host_start..).to_owned(); - self.serialization.truncate(self.username_end as usize); - self.serialization.push(':'); - self.serialization.extend(utf8_percent_encode(password, USERINFO_ENCODE_SET)); - self.serialization.push('@'); - - let old_host_start = self.host_start; - let new_host_start = to_u32(self.serialization.len()).unwrap(); - let adjust = |index: &mut u32| { - *index -= old_host_start; - *index += new_host_start; - }; - self.host_start = new_host_start; - adjust(&mut self.host_end); - adjust(&mut self.path_start); - if let Some(ref mut index) = self.query_start { adjust(index) } - if let Some(ref mut index) = self.fragment_start { adjust(index) } - - self.serialization.push_str(&host_and_after); - } else if self.byte_at(self.username_end) == b':' { // If there is a password to remove - let has_username_or_password = self.byte_at(self.host_start - 1) == b'@'; - debug_assert!(has_username_or_password); - let username_start = self.scheme_end + 3; - let empty_username = username_start == self.username_end; - let start = self.username_end; // Remove the ':' - let end = if empty_username { - self.host_start // Remove the '@' as well - } else { - self.host_start - 1 // Keep the '@' to separate the username from the host - }; - self.serialization.drain(start as usize .. end as usize); - let offset = end - start; - self.host_start -= offset; - self.host_end -= offset; - self.path_start -= offset; - if let Some(ref mut index) = self.query_start { *index -= offset } - if let Some(ref mut index) = self.fragment_start { *index -= offset } - } - Ok(()) - } - - /// Change this URL’s username. - /// - /// If this URL is cannot-be-a-base or does not have a host, do nothing and return `Err`. - pub fn set_username(&mut self, username: &str) -> Result<(), ()> { - if !self.has_host() { - return Err(()) - } - let username_start = self.scheme_end + 3; - debug_assert!(self.slice(self.scheme_end..username_start) == "://"); - if self.slice(username_start..self.username_end) == username { - return Ok(()) - } - let after_username = self.slice(self.username_end..).to_owned(); - self.serialization.truncate(username_start as usize); - self.serialization.extend(utf8_percent_encode(username, USERINFO_ENCODE_SET)); - - let mut removed_bytes = self.username_end; - self.username_end = to_u32(self.serialization.len()).unwrap(); - let mut added_bytes = self.username_end; - - let new_username_is_empty = self.username_end == username_start; - match (new_username_is_empty, after_username.chars().next()) { - (true, Some('@')) => { - removed_bytes += 1; - self.serialization.push_str(&after_username[1..]); - } - (false, Some('@')) | (_, Some(':')) | (true, _) => { - self.serialization.push_str(&after_username); - } - (false, _) => { - added_bytes += 1; - self.serialization.push('@'); - self.serialization.push_str(&after_username); - } - } - - let adjust = |index: &mut u32| { - *index -= removed_bytes; - *index += added_bytes; - }; - adjust(&mut self.host_start); - adjust(&mut self.host_end); - adjust(&mut self.path_start); - if let Some(ref mut index) = self.query_start { adjust(index) } - if let Some(ref mut index) = self.fragment_start { adjust(index) } - Ok(()) - } - - /// Change this URL’s scheme. - /// - /// Do nothing and return `Err` if: - /// * The new scheme is not in `[a-zA-Z][a-zA-Z0-9+.-]+` - /// * This URL is cannot-be-a-base and the new scheme is one of - /// `http`, `https`, `ws`, `wss`, `ftp`, or `gopher` - pub fn set_scheme(&mut self, scheme: &str) -> Result<(), ()> { - let mut parser = Parser::for_setter(String::new()); - let remaining = try!(parser.parse_scheme(parser::Input::new(scheme))); - if !remaining.is_empty() || - (!self.has_host() && SchemeType::from(&parser.serialization).is_special()) { - return Err(()) - } - let old_scheme_end = self.scheme_end; - let new_scheme_end = to_u32(parser.serialization.len()).unwrap(); - let adjust = |index: &mut u32| { - *index -= old_scheme_end; - *index += new_scheme_end; - }; - - self.scheme_end = new_scheme_end; - adjust(&mut self.username_end); - adjust(&mut self.host_start); - adjust(&mut self.host_end); - adjust(&mut self.path_start); - if let Some(ref mut index) = self.query_start { adjust(index) } - if let Some(ref mut index) = self.fragment_start { adjust(index) } - - parser.serialization.push_str(self.slice(old_scheme_end..)); - self.serialization = parser.serialization; - Ok(()) - } - - /// Convert a file name as `std::path::Path` into an URL in the `file` scheme. - /// - /// This returns `Err` if the given path is not absolute or, - /// on Windows, if the prefix is not a disk prefix (e.g. `C:`). - pub fn from_file_path<P: AsRef<Path>>(path: P) -> Result<Url, ()> { - let mut serialization = "file://".to_owned(); - let path_start = serialization.len() as u32; - try!(path_to_file_url_segments(path.as_ref(), &mut serialization)); - Ok(Url { - serialization: serialization, - scheme_end: "file".len() as u32, - username_end: path_start, - host_start: path_start, - host_end: path_start, - host: HostInternal::None, - port: None, - path_start: path_start, - query_start: None, - fragment_start: None, - }) - } - - /// Convert a directory name as `std::path::Path` into an URL in the `file` scheme. - /// - /// This returns `Err` if the given path is not absolute or, - /// on Windows, if the prefix is not a disk prefix (e.g. `C:`). - /// - /// Compared to `from_file_path`, this ensure that URL’s the path has a trailing slash - /// so that the entire path is considered when using this URL as a base URL. - /// - /// For example: - /// - /// * `"index.html"` parsed with `Url::from_directory_path(Path::new("/var/www"))` - /// as the base URL is `file:///var/www/index.html` - /// * `"index.html"` parsed with `Url::from_file_path(Path::new("/var/www"))` - /// as the base URL is `file:///var/index.html`, which might not be what was intended. - /// - /// Note that `std::path` does not consider trailing slashes significant - /// and usually does not include them (e.g. in `Path::parent()`). - pub fn from_directory_path<P: AsRef<Path>>(path: P) -> Result<Url, ()> { - let mut url = try!(Url::from_file_path(path)); - if !url.serialization.ends_with('/') { - url.serialization.push('/') - } - Ok(url) - } - - /// Assuming the URL is in the `file` scheme or similar, - /// convert its path to an absolute `std::path::Path`. - /// - /// **Note:** This does not actually check the URL’s `scheme`, - /// and may give nonsensical results for other schemes. - /// It is the user’s responsibility to check the URL’s scheme before calling this. - /// - /// ``` - /// # use url::Url; - /// # let url = Url::parse("file:///etc/passwd").unwrap(); - /// let path = url.to_file_path(); - /// ``` - /// - /// Returns `Err` if the host is neither empty nor `"localhost"`, - /// or if `Path::new_opt()` returns `None`. - /// (That is, if the percent-decoded path contains a NUL byte or, - /// for a Windows path, is not UTF-8.) - #[inline] - pub fn to_file_path(&self) -> Result<PathBuf, ()> { - // FIXME: Figure out what to do w.r.t host. - if matches!(self.host(), None | Some(Host::Domain("localhost"))) { - if let Some(segments) = self.path_segments() { - return file_url_segments_to_pathbuf(segments) - } - } - Err(()) - } - - // Private helper methods: - - #[inline] - fn slice<R>(&self, range: R) -> &str where R: RangeArg { - range.slice_of(&self.serialization) - } - - #[inline] - fn byte_at(&self, i: u32) -> u8 { - self.serialization.as_bytes()[i as usize] - } -} - -/// Return an error if `Url::host` or `Url::port_or_known_default` return `None`. -impl ToSocketAddrs for Url { - type Iter = SocketAddrs; - - fn to_socket_addrs(&self) -> io::Result<Self::Iter> { - try!(self.with_default_port(|_| Err(()))).to_socket_addrs() - } -} - -/// Parse a string as an URL, without a base URL or encoding override. -impl str::FromStr for Url { - type Err = ParseError; - - #[inline] - fn from_str(input: &str) -> Result<Url, ::ParseError> { - Url::parse(input) - } -} - -/// Display the serialization of this URL. -impl fmt::Display for Url { - #[inline] - fn fmt(&self, formatter: &mut fmt::Formatter) -> fmt::Result { - fmt::Display::fmt(&self.serialization, formatter) - } -} - -/// Debug the serialization of this URL. -impl fmt::Debug for Url { - #[inline] - fn fmt(&self, formatter: &mut fmt::Formatter) -> fmt::Result { - fmt::Debug::fmt(&self.serialization, formatter) - } -} - -/// URLs compare like their serialization. -impl Eq for Url {} - -/// URLs compare like their serialization. -impl PartialEq for Url { - #[inline] - fn eq(&self, other: &Self) -> bool { - self.serialization == other.serialization - } -} - -/// URLs compare like their serialization. -impl Ord for Url { - #[inline] - fn cmp(&self, other: &Self) -> cmp::Ordering { - self.serialization.cmp(&other.serialization) - } -} - -/// URLs compare like their serialization. -impl PartialOrd for Url { - #[inline] - fn partial_cmp(&self, other: &Self) -> Option<cmp::Ordering> { - self.serialization.partial_cmp(&other.serialization) - } -} - -/// URLs hash like their serialization. -impl hash::Hash for Url { - #[inline] - fn hash<H>(&self, state: &mut H) where H: hash::Hasher { - hash::Hash::hash(&self.serialization, state) - } -} - -/// Return the serialization of this URL. -impl AsRef<str> for Url { - #[inline] - fn as_ref(&self) -> &str { - &self.serialization - } -} - -trait RangeArg { - fn slice_of<'a>(&self, s: &'a str) -> &'a str; -} - -impl RangeArg for Range<u32> { - #[inline] - fn slice_of<'a>(&self, s: &'a str) -> &'a str { - &s[self.start as usize .. self.end as usize] - } -} - -impl RangeArg for RangeFrom<u32> { - #[inline] - fn slice_of<'a>(&self, s: &'a str) -> &'a str { - &s[self.start as usize ..] - } -} - -impl RangeArg for RangeTo<u32> { - #[inline] - fn slice_of<'a>(&self, s: &'a str) -> &'a str { - &s[.. self.end as usize] - } -} - -#[cfg(feature="rustc-serialize")] -impl rustc_serialize::Encodable for Url { - fn encode<S: rustc_serialize::Encoder>(&self, encoder: &mut S) -> Result<(), S::Error> { - encoder.emit_str(self.as_str()) - } -} - - -#[cfg(feature="rustc-serialize")] -impl rustc_serialize::Decodable for Url { - fn decode<D: rustc_serialize::Decoder>(decoder: &mut D) -> Result<Url, D::Error> { - Url::parse(&*try!(decoder.read_str())).map_err(|error| { - decoder.error(&format!("URL parsing error: {}", error)) - }) - } -} - -/// Serializes this URL into a `serde` stream. -/// -/// This implementation is only available if the `serde` Cargo feature is enabled. -#[cfg(feature="serde")] -impl serde::Serialize for Url { - fn serialize<S>(&self, serializer: &mut S) -> Result<(), S::Error> where S: serde::Serializer { - format!("{}", self).serialize(serializer) - } -} - -/// Deserializes this URL from a `serde` stream. -/// -/// This implementation is only available if the `serde` Cargo feature is enabled. -#[cfg(feature="serde")] -impl serde::Deserialize for Url { - fn deserialize<D>(deserializer: &mut D) -> Result<Url, D::Error> where D: serde::Deserializer { - let string_representation: String = try!(serde::Deserialize::deserialize(deserializer)); - Ok(Url::parse(&string_representation).unwrap()) - } -} - -#[cfg(unix)] -fn path_to_file_url_segments(path: &Path, serialization: &mut String) -> Result<(), ()> { - use std::os::unix::prelude::OsStrExt; - if !path.is_absolute() { - return Err(()) - } - let mut empty = true; - // skip the root component - for component in path.components().skip(1) { - empty = false; - serialization.push('/'); - serialization.extend(percent_encode( - component.as_os_str().as_bytes(), PATH_SEGMENT_ENCODE_SET)); - } - if empty { - // An URL’s path must not be empty. - serialization.push('/'); - } - Ok(()) -} - -#[cfg(windows)] -fn path_to_file_url_segments(path: &Path, serialization: &mut String) -> Result<(), ()> { - path_to_file_url_segments_windows(path, serialization) -} - -// Build this unconditionally to alleviate https://github.com/servo/rust-url/issues/102 -#[cfg_attr(not(windows), allow(dead_code))] -fn path_to_file_url_segments_windows(path: &Path, serialization: &mut String) -> Result<(), ()> { - use std::path::{Prefix, Component}; - if !path.is_absolute() { - return Err(()) - } - let mut components = path.components(); - let disk = match components.next() { - Some(Component::Prefix(ref p)) => match p.kind() { - Prefix::Disk(byte) => byte, - Prefix::VerbatimDisk(byte) => byte, - _ => return Err(()), - }, - - // FIXME: do something with UNC and other prefixes? - _ => return Err(()) - }; - - // Start with the prefix, e.g. "C:" - serialization.push('/'); - serialization.push(disk as char); - serialization.push(':'); - - for component in components { - if component == Component::RootDir { continue } - // FIXME: somehow work with non-unicode? - let component = try!(component.as_os_str().to_str().ok_or(())); - serialization.push('/'); - serialization.extend(percent_encode(component.as_bytes(), PATH_SEGMENT_ENCODE_SET)); - } - Ok(()) -} - -#[cfg(unix)] -fn file_url_segments_to_pathbuf(segments: str::Split<char>) -> Result<PathBuf, ()> { - use std::ffi::OsStr; - use std::os::unix::prelude::OsStrExt; - use std::path::PathBuf; - - let mut bytes = Vec::new(); - for segment in segments { - bytes.push(b'/'); - bytes.extend(percent_decode(segment.as_bytes())); - } - let os_str = OsStr::from_bytes(&bytes); - let path = PathBuf::from(os_str); - debug_assert!(path.is_absolute(), - "to_file_path() failed to produce an absolute Path"); - Ok(path) -} - -#[cfg(windows)] -fn file_url_segments_to_pathbuf(segments: str::Split<char>) -> Result<PathBuf, ()> { - file_url_segments_to_pathbuf_windows(segments) -} - -// Build this unconditionally to alleviate https://github.com/servo/rust-url/issues/102 -#[cfg_attr(not(windows), allow(dead_code))] -fn file_url_segments_to_pathbuf_windows(mut segments: str::Split<char>) -> Result<PathBuf, ()> { - let first = try!(segments.next().ok_or(())); - if first.len() != 2 || !first.starts_with(parser::ascii_alpha) - || first.as_bytes()[1] != b':' { - return Err(()) - } - let mut string = first.to_owned(); - for segment in segments { - string.push('\\'); - - // Currently non-unicode windows paths cannot be represented - match String::from_utf8(percent_decode(segment.as_bytes()).collect()) { - Ok(s) => string.push_str(&s), - Err(..) => return Err(()), - } - } - let path = PathBuf::from(string); - debug_assert!(path.is_absolute(), - "to_file_path() failed to produce an absolute Path"); - Ok(path) -} - -fn io_error<T>(reason: &str) -> io::Result<T> { - Err(io::Error::new(io::ErrorKind::InvalidData, reason)) -} - -/// Implementation detail of `Url::query_pairs_mut`. Typically not used directly. -pub struct UrlQuery<'a> { - url: &'a mut Url, - fragment: Option<String>, -} - -impl<'a> Drop for UrlQuery<'a> { - fn drop(&mut self) { - self.url.restore_already_parsed_fragment(self.fragment.take()) - } -} diff --git a/third_party/rust/url/src/origin.rs b/third_party/rust/url/src/origin.rs deleted file mode 100644 index 2217c94fe..000000000 --- a/third_party/rust/url/src/origin.rs +++ /dev/null @@ -1,114 +0,0 @@ -// Copyright 2016 The rust-url developers. -// -// Licensed under the Apache License, Version 2.0 <LICENSE-APACHE or -// http://www.apache.org/licenses/LICENSE-2.0> or the MIT license -// <LICENSE-MIT or http://opensource.org/licenses/MIT>, at your -// option. This file may not be copied, modified, or distributed -// except according to those terms. - -#[cfg(feature = "heapsize")] use heapsize::HeapSizeOf; -use host::Host; -use idna::domain_to_unicode; -use parser::default_port; -use std::sync::atomic::{AtomicUsize, ATOMIC_USIZE_INIT, Ordering}; -use Url; - -pub fn url_origin(url: &Url) -> Origin { - let scheme = url.scheme(); - match scheme { - "blob" => { - let result = Url::parse(url.path()); - match result { - Ok(ref url) => url_origin(url), - Err(_) => Origin::new_opaque() - } - }, - "ftp" | "gopher" | "http" | "https" | "ws" | "wss" => { - Origin::Tuple(scheme.to_owned(), url.host().unwrap().to_owned(), - url.port_or_known_default().unwrap()) - }, - // TODO: Figure out what to do if the scheme is a file - "file" => Origin::new_opaque(), - _ => Origin::new_opaque() - } -} - -/// The origin of an URL -#[derive(PartialEq, Eq, Clone, Debug)] -pub enum Origin { - /// A globally unique identifier - Opaque(OpaqueOrigin), - - /// Consists of the URL's scheme, host and port - Tuple(String, Host<String>, u16) -} - -#[cfg(feature = "heapsize")] -impl HeapSizeOf for Origin { - fn heap_size_of_children(&self) -> usize { - match *self { - Origin::Tuple(ref scheme, ref host, _) => { - scheme.heap_size_of_children() + - host.heap_size_of_children() - }, - _ => 0, - } - } -} - - -impl Origin { - /// Creates a new opaque origin that is only equal to itself. - pub fn new_opaque() -> Origin { - static COUNTER: AtomicUsize = ATOMIC_USIZE_INIT; - Origin::Opaque(OpaqueOrigin(COUNTER.fetch_add(1, Ordering::SeqCst))) - } - - /// Return whether this origin is a (scheme, host, port) tuple - /// (as opposed to an opaque origin). - pub fn is_tuple(&self) -> bool { - matches!(*self, Origin::Tuple(..)) - } - - /// https://html.spec.whatwg.org/multipage/#ascii-serialisation-of-an-origin - pub fn ascii_serialization(&self) -> String { - match *self { - Origin::Opaque(_) => "null".to_owned(), - Origin::Tuple(ref scheme, ref host, port) => { - if default_port(scheme) == Some(port) { - format!("{}://{}", scheme, host) - } else { - format!("{}://{}:{}", scheme, host, port) - } - } - } - } - - /// https://html.spec.whatwg.org/multipage/#unicode-serialisation-of-an-origin - pub fn unicode_serialization(&self) -> String { - match *self { - Origin::Opaque(_) => "null".to_owned(), - Origin::Tuple(ref scheme, ref host, port) => { - let host = match *host { - Host::Domain(ref domain) => { - let (domain, _errors) = domain_to_unicode(domain); - Host::Domain(domain) - } - _ => host.clone() - }; - if default_port(scheme) == Some(port) { - format!("{}://{}", scheme, host) - } else { - format!("{}://{}:{}", scheme, host, port) - } - } - } - } -} - -/// Opaque identifier for URLs that have file or other schemes -#[derive(Eq, PartialEq, Clone, Debug)] -pub struct OpaqueOrigin(usize); - -#[cfg(feature = "heapsize")] -known_heap_size!(0, OpaqueOrigin); diff --git a/third_party/rust/url/src/parser.rs b/third_party/rust/url/src/parser.rs deleted file mode 100644 index 2945432fc..000000000 --- a/third_party/rust/url/src/parser.rs +++ /dev/null @@ -1,1179 +0,0 @@ -// Copyright 2013-2016 The rust-url developers. -// -// Licensed under the Apache License, Version 2.0 <LICENSE-APACHE or -// http://www.apache.org/licenses/LICENSE-2.0> or the MIT license -// <LICENSE-MIT or http://opensource.org/licenses/MIT>, at your -// option. This file may not be copied, modified, or distributed -// except according to those terms. - -use std::ascii::AsciiExt; -use std::error::Error; -use std::fmt::{self, Formatter, Write}; -use std::str; - -use Url; -use encoding::EncodingOverride; -use host::{Host, HostInternal}; -use percent_encoding::{ - utf8_percent_encode, percent_encode, - SIMPLE_ENCODE_SET, DEFAULT_ENCODE_SET, USERINFO_ENCODE_SET, QUERY_ENCODE_SET, - PATH_SEGMENT_ENCODE_SET -}; - -pub type ParseResult<T> = Result<T, ParseError>; - -macro_rules! simple_enum_error { - ($($name: ident => $description: expr,)+) => { - /// Errors that can occur during parsing. - #[derive(PartialEq, Eq, Clone, Copy, Debug)] - pub enum ParseError { - $( - $name, - )+ - } - - impl Error for ParseError { - fn description(&self) -> &str { - match *self { - $( - ParseError::$name => $description, - )+ - } - } - } - } -} - -simple_enum_error! { - EmptyHost => "empty host", - IdnaError => "invalid international domain name", - InvalidPort => "invalid port number", - InvalidIpv4Address => "invalid IPv4 address", - InvalidIpv6Address => "invalid IPv6 address", - InvalidDomainCharacter => "invalid domain character", - RelativeUrlWithoutBase => "relative URL without a base", - RelativeUrlWithCannotBeABaseBase => "relative URL with a cannot-be-a-base base", - SetHostOnCannotBeABaseUrl => "a cannot-be-a-base URL doesn’t have a host to set", - Overflow => "URLs more than 4 GB are not supported", -} - -impl fmt::Display for ParseError { - fn fmt(&self, fmt: &mut Formatter) -> fmt::Result { - self.description().fmt(fmt) - } -} - -impl From<::idna::uts46::Errors> for ParseError { - fn from(_: ::idna::uts46::Errors) -> ParseError { ParseError::IdnaError } -} - -#[derive(Copy, Clone)] -pub enum SchemeType { - File, - SpecialNotFile, - NotSpecial, -} - -impl SchemeType { - pub fn is_special(&self) -> bool { - !matches!(*self, SchemeType::NotSpecial) - } - - pub fn is_file(&self) -> bool { - matches!(*self, SchemeType::File) - } - - pub fn from(s: &str) -> Self { - match s { - "http" | "https" | "ws" | "wss" | "ftp" | "gopher" => SchemeType::SpecialNotFile, - "file" => SchemeType::File, - _ => SchemeType::NotSpecial, - } - } -} - -pub fn default_port(scheme: &str) -> Option<u16> { - match scheme { - "http" | "ws" => Some(80), - "https" | "wss" => Some(443), - "ftp" => Some(21), - "gopher" => Some(70), - _ => None, - } -} - -#[derive(Clone)] -pub struct Input<'i> { - chars: str::Chars<'i>, -} - -impl<'i> Input<'i> { - pub fn new(input: &'i str) -> Self { - Input::with_log(input, None) - } - - pub fn with_log(original_input: &'i str, log_syntax_violation: Option<&Fn(&'static str)>) - -> Self { - let input = original_input.trim_matches(c0_control_or_space); - if let Some(log) = log_syntax_violation { - if input.len() < original_input.len() { - log("leading or trailing control or space character are ignored in URLs") - } - if input.chars().any(|c| matches!(c, '\t' | '\n' | '\r')) { - log("tabs or newlines are ignored in URLs") - } - } - Input { chars: input.chars() } - } - - #[inline] - pub fn is_empty(&self) -> bool { - self.clone().next().is_none() - } - - #[inline] - fn starts_with<P: Pattern>(&self, p: P) -> bool { - p.split_prefix(&mut self.clone()) - } - - #[inline] - pub fn split_prefix<P: Pattern>(&self, p: P) -> Option<Self> { - let mut remaining = self.clone(); - if p.split_prefix(&mut remaining) { - Some(remaining) - } else { - None - } - } - - #[inline] - fn split_first(&self) -> (Option<char>, Self) { - let mut remaining = self.clone(); - (remaining.next(), remaining) - } - - #[inline] - fn count_matching<F: Fn(char) -> bool>(&self, f: F) -> (u32, Self) { - let mut count = 0; - let mut remaining = self.clone(); - loop { - let mut input = remaining.clone(); - if matches!(input.next(), Some(c) if f(c)) { - remaining = input; - count += 1; - } else { - return (count, remaining) - } - } - } - - #[inline] - fn next_utf8(&mut self) -> Option<(char, &'i str)> { - loop { - let utf8 = self.chars.as_str(); - match self.chars.next() { - Some(c) => { - if !matches!(c, '\t' | '\n' | '\r') { - return Some((c, &utf8[..c.len_utf8()])) - } - } - None => return None - } - } - } -} - -pub trait Pattern { - fn split_prefix<'i>(self, input: &mut Input<'i>) -> bool; -} - -impl Pattern for char { - fn split_prefix<'i>(self, input: &mut Input<'i>) -> bool { input.next() == Some(self) } -} - -impl<'a> Pattern for &'a str { - fn split_prefix<'i>(self, input: &mut Input<'i>) -> bool { - for c in self.chars() { - if input.next() != Some(c) { - return false - } - } - true - } -} - -impl<F: FnMut(char) -> bool> Pattern for F { - fn split_prefix<'i>(self, input: &mut Input<'i>) -> bool { input.next().map_or(false, self) } -} - -impl<'i> Iterator for Input<'i> { - type Item = char; - fn next(&mut self) -> Option<char> { - self.chars.by_ref().filter(|&c| !matches!(c, '\t' | '\n' | '\r')).next() - } -} - -pub struct Parser<'a> { - pub serialization: String, - pub base_url: Option<&'a Url>, - pub query_encoding_override: EncodingOverride, - pub log_syntax_violation: Option<&'a Fn(&'static str)>, - pub context: Context, -} - -#[derive(PartialEq, Eq, Copy, Clone)] -pub enum Context { - UrlParser, - Setter, - PathSegmentSetter, -} - -impl<'a> Parser<'a> { - pub fn for_setter(serialization: String) -> Parser<'a> { - Parser { - serialization: serialization, - base_url: None, - query_encoding_override: EncodingOverride::utf8(), - log_syntax_violation: None, - context: Context::Setter, - } - } - - fn syntax_violation(&self, reason: &'static str) { - if let Some(log) = self.log_syntax_violation { - log(reason) - } - } - - fn syntax_violation_if<F: Fn() -> bool>(&self, reason: &'static str, test: F) { - // Skip test if not logging. - if let Some(log) = self.log_syntax_violation { - if test() { - log(reason) - } - } - } - - /// https://url.spec.whatwg.org/#concept-basic-url-parser - pub fn parse_url(mut self, input: &str) -> ParseResult<Url> { - let input = Input::with_log(input, self.log_syntax_violation); - if let Ok(remaining) = self.parse_scheme(input.clone()) { - return self.parse_with_scheme(remaining) - } - - // No-scheme state - if let Some(base_url) = self.base_url { - if input.starts_with('#') { - self.fragment_only(base_url, input) - } else if base_url.cannot_be_a_base() { - Err(ParseError::RelativeUrlWithCannotBeABaseBase) - } else { - let scheme_type = SchemeType::from(base_url.scheme()); - if scheme_type.is_file() { - self.parse_file(input, Some(base_url)) - } else { - self.parse_relative(input, scheme_type, base_url) - } - } - } else { - Err(ParseError::RelativeUrlWithoutBase) - } - } - - pub fn parse_scheme<'i>(&mut self, mut input: Input<'i>) -> Result<Input<'i>, ()> { - if input.is_empty() || !input.starts_with(ascii_alpha) { - return Err(()) - } - debug_assert!(self.serialization.is_empty()); - while let Some(c) = input.next() { - match c { - 'a'...'z' | 'A'...'Z' | '0'...'9' | '+' | '-' | '.' => { - self.serialization.push(c.to_ascii_lowercase()) - } - ':' => return Ok(input), - _ => { - self.serialization.clear(); - return Err(()) - } - } - } - // EOF before ':' - if self.context == Context::Setter { - Ok(input) - } else { - self.serialization.clear(); - Err(()) - } - } - - fn parse_with_scheme(mut self, input: Input) -> ParseResult<Url> { - let scheme_end = try!(to_u32(self.serialization.len())); - let scheme_type = SchemeType::from(&self.serialization); - self.serialization.push(':'); - match scheme_type { - SchemeType::File => { - self.syntax_violation_if("expected // after file:", || !input.starts_with("//")); - let base_file_url = self.base_url.and_then(|base| { - if base.scheme() == "file" { Some(base) } else { None } - }); - self.serialization.clear(); - self.parse_file(input, base_file_url) - } - SchemeType::SpecialNotFile => { - // special relative or authority state - let (slashes_count, remaining) = input.count_matching(|c| matches!(c, '/' | '\\')); - if let Some(base_url) = self.base_url { - if slashes_count < 2 && - base_url.scheme() == &self.serialization[..scheme_end as usize] { - // "Cannot-be-a-base" URLs only happen with "not special" schemes. - debug_assert!(!base_url.cannot_be_a_base()); - self.serialization.clear(); - return self.parse_relative(input, scheme_type, base_url) - } - } - // special authority slashes state - self.syntax_violation_if("expected //", || { - input.clone().take_while(|&c| matches!(c, '/' | '\\')) - .collect::<String>() != "//" - }); - self.after_double_slash(remaining, scheme_type, scheme_end) - } - SchemeType::NotSpecial => self.parse_non_special(input, scheme_type, scheme_end) - } - } - - /// Scheme other than file, http, https, ws, ws, ftp, gopher. - fn parse_non_special(mut self, input: Input, scheme_type: SchemeType, scheme_end: u32) - -> ParseResult<Url> { - // path or authority state ( - if let Some(input) = input.split_prefix("//") { - return self.after_double_slash(input, scheme_type, scheme_end) - } - // Anarchist URL (no authority) - let path_start = try!(to_u32(self.serialization.len())); - let username_end = path_start; - let host_start = path_start; - let host_end = path_start; - let host = HostInternal::None; - let port = None; - let remaining = if let Some(input) = input.split_prefix('/') { - let path_start = self.serialization.len(); - self.serialization.push('/'); - self.parse_path(scheme_type, &mut false, path_start, input) - } else { - self.parse_cannot_be_a_base_path(input) - }; - self.with_query_and_fragment(scheme_end, username_end, host_start, - host_end, host, port, path_start, remaining) - } - - fn parse_file(mut self, input: Input, mut base_file_url: Option<&Url>) -> ParseResult<Url> { - // file state - debug_assert!(self.serialization.is_empty()); - let (first_char, input_after_first_char) = input.split_first(); - match first_char { - None => { - if let Some(base_url) = base_file_url { - // Copy everything except the fragment - let before_fragment = match base_url.fragment_start { - Some(i) => &base_url.serialization[..i as usize], - None => &*base_url.serialization, - }; - self.serialization.push_str(before_fragment); - Ok(Url { - serialization: self.serialization, - fragment_start: None, - ..*base_url - }) - } else { - self.serialization.push_str("file:///"); - let scheme_end = "file".len() as u32; - let path_start = "file://".len() as u32; - Ok(Url { - serialization: self.serialization, - scheme_end: scheme_end, - username_end: path_start, - host_start: path_start, - host_end: path_start, - host: HostInternal::None, - port: None, - path_start: path_start, - query_start: None, - fragment_start: None, - }) - } - }, - Some('?') => { - if let Some(base_url) = base_file_url { - // Copy everything up to the query string - let before_query = match (base_url.query_start, base_url.fragment_start) { - (None, None) => &*base_url.serialization, - (Some(i), _) | - (None, Some(i)) => base_url.slice(..i) - }; - self.serialization.push_str(before_query); - let (query_start, fragment_start) = - try!(self.parse_query_and_fragment(base_url.scheme_end, input)); - Ok(Url { - serialization: self.serialization, - query_start: query_start, - fragment_start: fragment_start, - ..*base_url - }) - } else { - self.serialization.push_str("file:///"); - let scheme_end = "file".len() as u32; - let path_start = "file://".len() as u32; - let (query_start, fragment_start) = - try!(self.parse_query_and_fragment(scheme_end, input)); - Ok(Url { - serialization: self.serialization, - scheme_end: scheme_end, - username_end: path_start, - host_start: path_start, - host_end: path_start, - host: HostInternal::None, - port: None, - path_start: path_start, - query_start: query_start, - fragment_start: fragment_start, - }) - } - }, - Some('#') => { - if let Some(base_url) = base_file_url { - self.fragment_only(base_url, input) - } else { - self.serialization.push_str("file:///"); - let scheme_end = "file".len() as u32; - let path_start = "file://".len() as u32; - let fragment_start = "file:///".len() as u32; - self.parse_fragment(input_after_first_char); - Ok(Url { - serialization: self.serialization, - scheme_end: scheme_end, - username_end: path_start, - host_start: path_start, - host_end: path_start, - host: HostInternal::None, - port: None, - path_start: path_start, - query_start: None, - fragment_start: Some(fragment_start), - }) - } - } - Some('/') | Some('\\') => { - self.syntax_violation_if("backslash", || first_char == Some('\\')); - // file slash state - let (next_char, input_after_next_char) = input_after_first_char.split_first(); - self.syntax_violation_if("backslash", || next_char == Some('\\')); - if matches!(next_char, Some('/') | Some('\\')) { - // file host state - self.serialization.push_str("file://"); - let scheme_end = "file".len() as u32; - let host_start = "file://".len() as u32; - let (path_start, host, remaining) = - try!(self.parse_file_host(input_after_next_char)); - let host_end = try!(to_u32(self.serialization.len())); - let mut has_host = !matches!(host, HostInternal::None); - let remaining = if path_start { - self.parse_path_start(SchemeType::File, &mut has_host, remaining) - } else { - let path_start = self.serialization.len(); - self.serialization.push('/'); - self.parse_path(SchemeType::File, &mut has_host, path_start, remaining) - }; - // FIXME: deal with has_host - let (query_start, fragment_start) = - try!(self.parse_query_and_fragment(scheme_end, remaining)); - Ok(Url { - serialization: self.serialization, - scheme_end: scheme_end, - username_end: host_start, - host_start: host_start, - host_end: host_end, - host: host, - port: None, - path_start: host_end, - query_start: query_start, - fragment_start: fragment_start, - }) - } else { - self.serialization.push_str("file:///"); - let scheme_end = "file".len() as u32; - let path_start = "file://".len(); - if let Some(base_url) = base_file_url { - let first_segment = base_url.path_segments().unwrap().next().unwrap(); - // FIXME: *normalized* drive letter - if is_windows_drive_letter(first_segment) { - self.serialization.push_str(first_segment); - self.serialization.push('/'); - } - } - let remaining = self.parse_path( - SchemeType::File, &mut false, path_start, input_after_first_char); - let (query_start, fragment_start) = - try!(self.parse_query_and_fragment(scheme_end, remaining)); - let path_start = path_start as u32; - Ok(Url { - serialization: self.serialization, - scheme_end: scheme_end, - username_end: path_start, - host_start: path_start, - host_end: path_start, - host: HostInternal::None, - port: None, - path_start: path_start, - query_start: query_start, - fragment_start: fragment_start, - }) - } - } - _ => { - if starts_with_windows_drive_letter_segment(&input) { - base_file_url = None; - } - if let Some(base_url) = base_file_url { - let before_query = match (base_url.query_start, base_url.fragment_start) { - (None, None) => &*base_url.serialization, - (Some(i), _) | - (None, Some(i)) => base_url.slice(..i) - }; - self.serialization.push_str(before_query); - self.pop_path(SchemeType::File, base_url.path_start as usize); - let remaining = self.parse_path( - SchemeType::File, &mut true, base_url.path_start as usize, input); - self.with_query_and_fragment( - base_url.scheme_end, base_url.username_end, base_url.host_start, - base_url.host_end, base_url.host, base_url.port, base_url.path_start, remaining) - } else { - self.serialization.push_str("file:///"); - let scheme_end = "file".len() as u32; - let path_start = "file://".len(); - let remaining = self.parse_path( - SchemeType::File, &mut false, path_start, input); - let (query_start, fragment_start) = - try!(self.parse_query_and_fragment(scheme_end, remaining)); - let path_start = path_start as u32; - Ok(Url { - serialization: self.serialization, - scheme_end: scheme_end, - username_end: path_start, - host_start: path_start, - host_end: path_start, - host: HostInternal::None, - port: None, - path_start: path_start, - query_start: query_start, - fragment_start: fragment_start, - }) - } - } - } - } - - fn parse_relative(mut self, input: Input, scheme_type: SchemeType, base_url: &Url) - -> ParseResult<Url> { - // relative state - debug_assert!(self.serialization.is_empty()); - let (first_char, input_after_first_char) = input.split_first(); - match first_char { - None => { - // Copy everything except the fragment - let before_fragment = match base_url.fragment_start { - Some(i) => &base_url.serialization[..i as usize], - None => &*base_url.serialization, - }; - self.serialization.push_str(before_fragment); - Ok(Url { - serialization: self.serialization, - fragment_start: None, - ..*base_url - }) - }, - Some('?') => { - // Copy everything up to the query string - let before_query = match (base_url.query_start, base_url.fragment_start) { - (None, None) => &*base_url.serialization, - (Some(i), _) | - (None, Some(i)) => base_url.slice(..i) - }; - self.serialization.push_str(before_query); - let (query_start, fragment_start) = - try!(self.parse_query_and_fragment(base_url.scheme_end, input)); - Ok(Url { - serialization: self.serialization, - query_start: query_start, - fragment_start: fragment_start, - ..*base_url - }) - }, - Some('#') => self.fragment_only(base_url, input), - Some('/') | Some('\\') => { - let (slashes_count, remaining) = input.count_matching(|c| matches!(c, '/' | '\\')); - if slashes_count >= 2 { - self.syntax_violation_if("expected //", || { - input.clone().take_while(|&c| matches!(c, '/' | '\\')) - .collect::<String>() != "//" - }); - let scheme_end = base_url.scheme_end; - debug_assert!(base_url.byte_at(scheme_end) == b':'); - self.serialization.push_str(base_url.slice(..scheme_end + 1)); - return self.after_double_slash(remaining, scheme_type, scheme_end) - } - let path_start = base_url.path_start; - debug_assert!(base_url.byte_at(path_start) == b'/'); - self.serialization.push_str(base_url.slice(..path_start + 1)); - let remaining = self.parse_path( - scheme_type, &mut true, path_start as usize, input_after_first_char); - self.with_query_and_fragment( - base_url.scheme_end, base_url.username_end, base_url.host_start, - base_url.host_end, base_url.host, base_url.port, base_url.path_start, remaining) - } - _ => { - let before_query = match (base_url.query_start, base_url.fragment_start) { - (None, None) => &*base_url.serialization, - (Some(i), _) | - (None, Some(i)) => base_url.slice(..i) - }; - self.serialization.push_str(before_query); - // FIXME spec says just "remove last entry", not the "pop" algorithm - self.pop_path(scheme_type, base_url.path_start as usize); - let remaining = self.parse_path( - scheme_type, &mut true, base_url.path_start as usize, input); - self.with_query_and_fragment( - base_url.scheme_end, base_url.username_end, base_url.host_start, - base_url.host_end, base_url.host, base_url.port, base_url.path_start, remaining) - } - } - } - - fn after_double_slash(mut self, input: Input, scheme_type: SchemeType, scheme_end: u32) - -> ParseResult<Url> { - self.serialization.push('/'); - self.serialization.push('/'); - // authority state - let (username_end, remaining) = try!(self.parse_userinfo(input, scheme_type)); - // host state - let host_start = try!(to_u32(self.serialization.len())); - let (host_end, host, port, remaining) = - try!(self.parse_host_and_port(remaining, scheme_end, scheme_type)); - // path state - let path_start = try!(to_u32(self.serialization.len())); - let remaining = self.parse_path_start( - scheme_type, &mut true, remaining); - self.with_query_and_fragment(scheme_end, username_end, host_start, - host_end, host, port, path_start, remaining) - } - - /// Return (username_end, remaining) - fn parse_userinfo<'i>(&mut self, mut input: Input<'i>, scheme_type: SchemeType) - -> ParseResult<(u32, Input<'i>)> { - let mut last_at = None; - let mut remaining = input.clone(); - let mut char_count = 0; - while let Some(c) = remaining.next() { - match c { - '@' => { - if last_at.is_some() { - self.syntax_violation("unencoded @ sign in username or password") - } else { - self.syntax_violation( - "embedding authentification information (username or password) \ - in an URL is not recommended") - } - last_at = Some((char_count, remaining.clone())) - }, - '/' | '?' | '#' => break, - '\\' if scheme_type.is_special() => break, - _ => (), - } - char_count += 1; - } - let (mut userinfo_char_count, remaining) = match last_at { - None => return Ok((try!(to_u32(self.serialization.len())), input)), - Some((0, remaining)) => return Ok((try!(to_u32(self.serialization.len())), remaining)), - Some(x) => x - }; - - let mut username_end = None; - while userinfo_char_count > 0 { - let (c, utf8_c) = input.next_utf8().unwrap(); - userinfo_char_count -= 1; - if c == ':' && username_end.is_none() { - // Start parsing password - username_end = Some(try!(to_u32(self.serialization.len()))); - self.serialization.push(':'); - } else { - self.check_url_code_point(c, &input); - self.serialization.extend(utf8_percent_encode(utf8_c, USERINFO_ENCODE_SET)); - } - } - let username_end = match username_end { - Some(i) => i, - None => try!(to_u32(self.serialization.len())), - }; - self.serialization.push('@'); - Ok((username_end, remaining)) - } - - fn parse_host_and_port<'i>(&mut self, input: Input<'i>, - scheme_end: u32, scheme_type: SchemeType) - -> ParseResult<(u32, HostInternal, Option<u16>, Input<'i>)> { - let (host, remaining) = try!( - Parser::parse_host(input, scheme_type)); - write!(&mut self.serialization, "{}", host).unwrap(); - let host_end = try!(to_u32(self.serialization.len())); - let (port, remaining) = if let Some(remaining) = remaining.split_prefix(':') { - let scheme = || default_port(&self.serialization[..scheme_end as usize]); - try!(Parser::parse_port(remaining, scheme, self.context)) - } else { - (None, remaining) - }; - if let Some(port) = port { - write!(&mut self.serialization, ":{}", port).unwrap() - } - Ok((host_end, host.into(), port, remaining)) - } - - pub fn parse_host<'i>(mut input: Input<'i>, scheme_type: SchemeType) - -> ParseResult<(Host<String>, Input<'i>)> { - // Undo the Input abstraction here to avoid allocating in the common case - // where the host part of the input does not contain any tab or newline - let input_str = input.chars.as_str(); - let mut inside_square_brackets = false; - let mut has_ignored_chars = false; - let mut non_ignored_chars = 0; - let mut bytes = 0; - for c in input_str.chars() { - match c { - ':' if !inside_square_brackets => break, - '\\' if scheme_type.is_special() => break, - '/' | '?' | '#' => break, - '\t' | '\n' | '\r' => { - has_ignored_chars = true; - } - '[' => { - inside_square_brackets = true; - non_ignored_chars += 1 - } - ']' => { - inside_square_brackets = false; - non_ignored_chars += 1 - } - _ => non_ignored_chars += 1 - } - bytes += c.len_utf8(); - } - let replaced: String; - let host_str; - { - let host_input = input.by_ref().take(non_ignored_chars); - if has_ignored_chars { - replaced = host_input.collect(); - host_str = &*replaced - } else { - for _ in host_input {} - host_str = &input_str[..bytes] - } - } - if scheme_type.is_special() && host_str.is_empty() { - return Err(ParseError::EmptyHost) - } - let host = try!(Host::parse(host_str)); - Ok((host, input)) - } - - pub fn parse_file_host<'i>(&mut self, input: Input<'i>) - -> ParseResult<(bool, HostInternal, Input<'i>)> { - // Undo the Input abstraction here to avoid allocating in the common case - // where the host part of the input does not contain any tab or newline - let input_str = input.chars.as_str(); - let mut has_ignored_chars = false; - let mut non_ignored_chars = 0; - let mut bytes = 0; - for c in input_str.chars() { - match c { - '/' | '\\' | '?' | '#' => break, - '\t' | '\n' | '\r' => has_ignored_chars = true, - _ => non_ignored_chars += 1, - } - bytes += c.len_utf8(); - } - let replaced: String; - let host_str; - let mut remaining = input.clone(); - { - let host_input = remaining.by_ref().take(non_ignored_chars); - if has_ignored_chars { - replaced = host_input.collect(); - host_str = &*replaced - } else { - for _ in host_input {} - host_str = &input_str[..bytes] - } - } - if is_windows_drive_letter(host_str) { - return Ok((false, HostInternal::None, input)) - } - let host = if host_str.is_empty() { - HostInternal::None - } else { - match try!(Host::parse(host_str)) { - Host::Domain(ref d) if d == "localhost" => HostInternal::None, - host => { - write!(&mut self.serialization, "{}", host).unwrap(); - host.into() - } - } - }; - Ok((true, host, remaining)) - } - - pub fn parse_port<'i, P>(mut input: Input<'i>, default_port: P, - context: Context) - -> ParseResult<(Option<u16>, Input<'i>)> - where P: Fn() -> Option<u16> { - let mut port: u32 = 0; - let mut has_any_digit = false; - while let (Some(c), remaining) = input.split_first() { - if let Some(digit) = c.to_digit(10) { - port = port * 10 + digit; - if port > ::std::u16::MAX as u32 { - return Err(ParseError::InvalidPort) - } - has_any_digit = true; - } else if context == Context::UrlParser && !matches!(c, '/' | '\\' | '?' | '#') { - return Err(ParseError::InvalidPort) - } else { - break - } - input = remaining; - } - let mut opt_port = Some(port as u16); - if !has_any_digit || opt_port == default_port() { - opt_port = None; - } - return Ok((opt_port, input)) - } - - pub fn parse_path_start<'i>(&mut self, scheme_type: SchemeType, has_host: &mut bool, - mut input: Input<'i>) - -> Input<'i> { - // Path start state - match input.split_first() { - (Some('/'), remaining) => input = remaining, - (Some('\\'), remaining) => if scheme_type.is_special() { - self.syntax_violation("backslash"); - input = remaining - }, - _ => {} - } - let path_start = self.serialization.len(); - self.serialization.push('/'); - self.parse_path(scheme_type, has_host, path_start, input) - } - - pub fn parse_path<'i>(&mut self, scheme_type: SchemeType, has_host: &mut bool, - path_start: usize, mut input: Input<'i>) - -> Input<'i> { - // Relative path state - debug_assert!(self.serialization.ends_with("/")); - loop { - let segment_start = self.serialization.len(); - let mut ends_with_slash = false; - loop { - let input_before_c = input.clone(); - let (c, utf8_c) = if let Some(x) = input.next_utf8() { x } else { break }; - match c { - '/' if self.context != Context::PathSegmentSetter => { - ends_with_slash = true; - break - }, - '\\' if self.context != Context::PathSegmentSetter && - scheme_type.is_special() => { - self.syntax_violation("backslash"); - ends_with_slash = true; - break - }, - '?' | '#' if self.context == Context::UrlParser => { - input = input_before_c; - break - }, - _ => { - self.check_url_code_point(c, &input); - if c == '%' { - let after_percent_sign = input.clone(); - if matches!(input.next(), Some('2')) && - matches!(input.next(), Some('E') | Some('e')) { - self.serialization.push('.'); - continue - } - input = after_percent_sign - } - if self.context == Context::PathSegmentSetter { - self.serialization.extend(utf8_percent_encode( - utf8_c, PATH_SEGMENT_ENCODE_SET)); - } else { - self.serialization.extend(utf8_percent_encode( - utf8_c, DEFAULT_ENCODE_SET)); - } - } - } - } - match &self.serialization[segment_start..] { - ".." => { - debug_assert!(self.serialization.as_bytes()[segment_start - 1] == b'/'); - self.serialization.truncate(segment_start - 1); // Truncate "/.." - self.pop_path(scheme_type, path_start); - if !self.serialization[path_start..].ends_with("/") { - self.serialization.push('/') - } - }, - "." => { - self.serialization.truncate(segment_start); - }, - _ => { - if scheme_type.is_file() && is_windows_drive_letter( - &self.serialization[path_start + 1..] - ) { - if self.serialization.ends_with('|') { - self.serialization.pop(); - self.serialization.push(':'); - } - if *has_host { - self.syntax_violation("file: with host and Windows drive letter"); - *has_host = false; // FIXME account for this in callers - } - } - if ends_with_slash { - self.serialization.push('/') - } - } - } - if !ends_with_slash { - break - } - } - input - } - - /// https://url.spec.whatwg.org/#pop-a-urls-path - fn pop_path(&mut self, scheme_type: SchemeType, path_start: usize) { - if self.serialization.len() > path_start { - let slash_position = self.serialization[path_start..].rfind('/').unwrap(); - // + 1 since rfind returns the position before the slash. - let segment_start = path_start + slash_position + 1; - // Don’t pop a Windows drive letter - // FIXME: *normalized* Windows drive letter - if !( - scheme_type.is_file() && - is_windows_drive_letter(&self.serialization[segment_start..]) - ) { - self.serialization.truncate(segment_start); - } - } - - } - - pub fn parse_cannot_be_a_base_path<'i>(&mut self, mut input: Input<'i>) -> Input<'i> { - loop { - let input_before_c = input.clone(); - match input.next_utf8() { - Some(('?', _)) | Some(('#', _)) if self.context == Context::UrlParser => { - return input_before_c - } - Some((c, utf8_c)) => { - self.check_url_code_point(c, &input); - self.serialization.extend(utf8_percent_encode( - utf8_c, SIMPLE_ENCODE_SET)); - } - None => return input - } - } - } - - fn with_query_and_fragment(mut self, scheme_end: u32, username_end: u32, - host_start: u32, host_end: u32, host: HostInternal, - port: Option<u16>, path_start: u32, remaining: Input) - -> ParseResult<Url> { - let (query_start, fragment_start) = - try!(self.parse_query_and_fragment(scheme_end, remaining)); - Ok(Url { - serialization: self.serialization, - scheme_end: scheme_end, - username_end: username_end, - host_start: host_start, - host_end: host_end, - host: host, - port: port, - path_start: path_start, - query_start: query_start, - fragment_start: fragment_start - }) - } - - /// Return (query_start, fragment_start) - fn parse_query_and_fragment(&mut self, scheme_end: u32, mut input: Input) - -> ParseResult<(Option<u32>, Option<u32>)> { - let mut query_start = None; - match input.next() { - Some('#') => {} - Some('?') => { - query_start = Some(try!(to_u32(self.serialization.len()))); - self.serialization.push('?'); - let remaining = self.parse_query(scheme_end, input); - if let Some(remaining) = remaining { - input = remaining - } else { - return Ok((query_start, None)) - } - } - None => return Ok((None, None)), - _ => panic!("Programming error. parse_query_and_fragment() called without ? or # {:?}") - } - - let fragment_start = try!(to_u32(self.serialization.len())); - self.serialization.push('#'); - self.parse_fragment(input); - Ok((query_start, Some(fragment_start))) - } - - pub fn parse_query<'i>(&mut self, scheme_end: u32, mut input: Input<'i>) - -> Option<Input<'i>> { - let mut query = String::new(); // FIXME: use a streaming decoder instead - let mut remaining = None; - while let Some(c) = input.next() { - if c == '#' && self.context == Context::UrlParser { - remaining = Some(input); - break - } else { - self.check_url_code_point(c, &input); - query.push(c); - } - } - - let encoding = match &self.serialization[..scheme_end as usize] { - "http" | "https" | "file" | "ftp" | "gopher" => self.query_encoding_override, - _ => EncodingOverride::utf8(), - }; - let query_bytes = encoding.encode(query.into()); - self.serialization.extend(percent_encode(&query_bytes, QUERY_ENCODE_SET)); - remaining - } - - fn fragment_only(mut self, base_url: &Url, mut input: Input) -> ParseResult<Url> { - let before_fragment = match base_url.fragment_start { - Some(i) => base_url.slice(..i), - None => &*base_url.serialization, - }; - debug_assert!(self.serialization.is_empty()); - self.serialization.reserve(before_fragment.len() + input.chars.as_str().len()); - self.serialization.push_str(before_fragment); - self.serialization.push('#'); - let next = input.next(); - debug_assert!(next == Some('#')); - self.parse_fragment(input); - Ok(Url { - serialization: self.serialization, - fragment_start: Some(try!(to_u32(before_fragment.len()))), - ..*base_url - }) - } - - pub fn parse_fragment(&mut self, mut input: Input) { - while let Some(c) = input.next() { - if c == '\0' { - self.syntax_violation("NULL characters are ignored in URL fragment identifiers") - } else { - self.check_url_code_point(c, &input); - self.serialization.push(c); // No percent-encoding here. - } - } - } - - fn check_url_code_point(&self, c: char, input: &Input) { - if let Some(log) = self.log_syntax_violation { - if c == '%' { - let mut input = input.clone(); - if !matches!((input.next(), input.next()), (Some(a), Some(b)) - if is_ascii_hex_digit(a) && is_ascii_hex_digit(b)) { - log("expected 2 hex digits after %") - } - } else if !is_url_code_point(c) { - log("non-URL code point") - } - } - } -} - -#[inline] -fn is_ascii_hex_digit(c: char) -> bool { - matches!(c, 'a'...'f' | 'A'...'F' | '0'...'9') -} - -// Non URL code points: -// U+0000 to U+0020 (space) -// " # % < > [ \ ] ^ ` { | } -// U+007F to U+009F -// surrogates -// U+FDD0 to U+FDEF -// Last two of each plane: U+__FFFE to U+__FFFF for __ in 00 to 10 hex -#[inline] -fn is_url_code_point(c: char) -> bool { - matches!(c, - 'a'...'z' | - 'A'...'Z' | - '0'...'9' | - '!' | '$' | '&' | '\'' | '(' | ')' | '*' | '+' | ',' | '-' | - '.' | '/' | ':' | ';' | '=' | '?' | '@' | '_' | '~' | - '\u{A0}'...'\u{D7FF}' | '\u{E000}'...'\u{FDCF}' | '\u{FDF0}'...'\u{FFFD}' | - '\u{10000}'...'\u{1FFFD}' | '\u{20000}'...'\u{2FFFD}' | - '\u{30000}'...'\u{3FFFD}' | '\u{40000}'...'\u{4FFFD}' | - '\u{50000}'...'\u{5FFFD}' | '\u{60000}'...'\u{6FFFD}' | - '\u{70000}'...'\u{7FFFD}' | '\u{80000}'...'\u{8FFFD}' | - '\u{90000}'...'\u{9FFFD}' | '\u{A0000}'...'\u{AFFFD}' | - '\u{B0000}'...'\u{BFFFD}' | '\u{C0000}'...'\u{CFFFD}' | - '\u{D0000}'...'\u{DFFFD}' | '\u{E1000}'...'\u{EFFFD}' | - '\u{F0000}'...'\u{FFFFD}' | '\u{100000}'...'\u{10FFFD}') -} - -/// https://url.spec.whatwg.org/#c0-controls-and-space -#[inline] -fn c0_control_or_space(ch: char) -> bool { - ch <= ' ' // U+0000 to U+0020 -} - -/// https://url.spec.whatwg.org/#ascii-alpha -#[inline] -pub fn ascii_alpha(ch: char) -> bool { - matches!(ch, 'a'...'z' | 'A'...'Z') -} - -#[inline] -pub fn to_u32(i: usize) -> ParseResult<u32> { - if i <= ::std::u32::MAX as usize { - Ok(i as u32) - } else { - Err(ParseError::Overflow) - } -} - -/// Wether the scheme is file:, the path has a single segment, and that segment -/// is a Windows drive letter -fn is_windows_drive_letter(segment: &str) -> bool { - segment.len() == 2 - && starts_with_windows_drive_letter(segment) -} - -fn starts_with_windows_drive_letter(s: &str) -> bool { - ascii_alpha(s.as_bytes()[0] as char) - && matches!(s.as_bytes()[1], b':' | b'|') -} - -fn starts_with_windows_drive_letter_segment(input: &Input) -> bool { - let mut input = input.clone(); - matches!((input.next(), input.next(), input.next()), (Some(a), Some(b), Some(c)) - if ascii_alpha(a) && matches!(b, ':' | '|') && matches!(c, '/' | '\\' | '?' | '#')) -} diff --git a/third_party/rust/url/src/path_segments.rs b/third_party/rust/url/src/path_segments.rs deleted file mode 100644 index 437a84ee7..000000000 --- a/third_party/rust/url/src/path_segments.rs +++ /dev/null @@ -1,187 +0,0 @@ -// Copyright 2016 The rust-url developers. -// -// Licensed under the Apache License, Version 2.0 <LICENSE-APACHE or -// http://www.apache.org/licenses/LICENSE-2.0> or the MIT license -// <LICENSE-MIT or http://opensource.org/licenses/MIT>, at your -// option. This file may not be copied, modified, or distributed -// except according to those terms. - -use parser::{self, SchemeType, to_u32}; -use std::str; -use Url; - -/// Exposes methods to manipulate the path of an URL that is not cannot-be-base. -/// -/// The path always starts with a `/` slash, and is made of slash-separated segments. -/// There is always at least one segment (which may be the empty string). -/// -/// Examples: -/// -/// ```rust -/// # use url::Url; -/// let mut url = Url::parse("mailto:me@example.com").unwrap(); -/// assert!(url.path_segments_mut().is_err()); -/// -/// let mut url = Url::parse("http://example.net/foo/index.html").unwrap(); -/// url.path_segments_mut().unwrap().pop().push("img").push("2/100%.png"); -/// assert_eq!(url.as_str(), "http://example.net/foo/img/2%2F100%25.png"); -/// ``` -pub struct PathSegmentsMut<'a> { - url: &'a mut Url, - after_first_slash: usize, - after_path: String, - old_after_path_position: u32, -} - -// Not re-exported outside the crate -pub fn new(url: &mut Url) -> PathSegmentsMut { - let after_path = url.take_after_path(); - let old_after_path_position = to_u32(url.serialization.len()).unwrap(); - debug_assert!(url.byte_at(url.path_start) == b'/'); - PathSegmentsMut { - after_first_slash: url.path_start as usize + "/".len(), - url: url, - old_after_path_position: old_after_path_position, - after_path: after_path, - } -} - -impl<'a> Drop for PathSegmentsMut<'a> { - fn drop(&mut self) { - self.url.restore_after_path(self.old_after_path_position, &self.after_path) - } -} - -impl<'a> PathSegmentsMut<'a> { - /// Remove all segments in the path, leaving the minimal `url.path() == "/"`. - /// - /// Returns `&mut Self` so that method calls can be chained. - /// - /// Example: - /// - /// ```rust - /// # use url::Url; - /// let mut url = Url::parse("https://github.com/servo/rust-url/").unwrap(); - /// url.path_segments_mut().unwrap().clear().push("logout"); - /// assert_eq!(url.as_str(), "https://github.com/logout"); - /// ``` - pub fn clear(&mut self) -> &mut Self { - self.url.serialization.truncate(self.after_first_slash); - self - } - - /// Remove the last segment of this URL’s path if it is empty, - /// except if these was only one segment to begin with. - /// - /// In other words, remove one path trailing slash, if any, - /// unless it is also the initial slash (so this does nothing if `url.path() == "/")`. - /// - /// Returns `&mut Self` so that method calls can be chained. - /// - /// Example: - /// - /// ```rust - /// # use url::Url; - /// let mut url = Url::parse("https://github.com/servo/rust-url/").unwrap(); - /// url.path_segments_mut().unwrap().push("pulls"); - /// assert_eq!(url.as_str(), "https://github.com/servo/rust-url//pulls"); - /// - /// let mut url = Url::parse("https://github.com/servo/rust-url/").unwrap(); - /// url.path_segments_mut().unwrap().pop_if_empty().push("pulls"); - /// assert_eq!(url.as_str(), "https://github.com/servo/rust-url/pulls"); - /// ``` - pub fn pop_if_empty(&mut self) -> &mut Self { - if self.url.serialization[self.after_first_slash..].ends_with('/') { - self.url.serialization.pop(); - } - self - } - - /// Remove the last segment of this URL’s path. - /// - /// If the path only has one segment, make it empty such that `url.path() == "/"`. - /// - /// Returns `&mut Self` so that method calls can be chained. - pub fn pop(&mut self) -> &mut Self { - let last_slash = self.url.serialization[self.after_first_slash..].rfind('/').unwrap_or(0); - self.url.serialization.truncate(self.after_first_slash + last_slash); - self - } - - /// Append the given segment at the end of this URL’s path. - /// - /// See the documentation for `.extend()`. - /// - /// Returns `&mut Self` so that method calls can be chained. - pub fn push(&mut self, segment: &str) -> &mut Self { - self.extend(Some(segment)) - } - - /// Append each segment from the given iterator at the end of this URL’s path. - /// - /// Each segment is percent-encoded like in `Url::parse` or `Url::join`, - /// except that `%` and `/` characters are also encoded (to `%25` and `%2F`). - /// This is unlike `Url::parse` where `%` is left as-is in case some of the input - /// is already percent-encoded, and `/` denotes a path segment separator.) - /// - /// Note that, in addition to slashes between new segments, - /// this always adds a slash between the existing path and the new segments - /// *except* if the existing path is `"/"`. - /// If the previous last segment was empty (if the path had a trailing slash) - /// the path after `.extend()` will contain two consecutive slashes. - /// If that is undesired, call `.pop_if_empty()` first. - /// - /// To obtain a behavior similar to `Url::join`, call `.pop()` unconditionally first. - /// - /// Returns `&mut Self` so that method calls can be chained. - /// - /// Example: - /// - /// ```rust - /// # use url::Url; - /// let mut url = Url::parse("https://github.com/").unwrap(); - /// let org = "servo"; - /// let repo = "rust-url"; - /// let issue_number = "188"; - /// url.path_segments_mut().unwrap().extend(&[org, repo, "issues", issue_number]); - /// assert_eq!(url.as_str(), "https://github.com/servo/rust-url/issues/188"); - /// ``` - /// - /// In order to make sure that parsing the serialization of an URL gives the same URL, - /// a segment is ignored if it is `"."` or `".."`: - /// - /// ```rust - /// # use url::Url; - /// let mut url = Url::parse("https://github.com/servo").unwrap(); - /// url.path_segments_mut().unwrap().extend(&["..", "rust-url", ".", "pulls"]); - /// assert_eq!(url.as_str(), "https://github.com/servo/rust-url/pulls"); - /// ``` - pub fn extend<I>(&mut self, segments: I) -> &mut Self - where I: IntoIterator, I::Item: AsRef<str> { - let scheme_type = SchemeType::from(self.url.scheme()); - let path_start = self.url.path_start as usize; - self.url.mutate(|parser| { - parser.context = parser::Context::PathSegmentSetter; - for segment in segments { - let segment = segment.as_ref(); - if matches!(segment, "." | "..") { - continue - } - if parser.serialization.len() > path_start + 1 { - parser.serialization.push('/'); - } - let mut has_host = true; // FIXME account for this? - parser.parse_path(scheme_type, &mut has_host, path_start, - parser::Input::new(segment)); - } - }); - self - } - - /// For internal testing, not part of the public API. - #[doc(hidden)] - pub fn assert_url_invariants(&mut self) -> &mut Self { - self.url.assert_invariants(); - self - } -} diff --git a/third_party/rust/url/src/percent_encoding.rs b/third_party/rust/url/src/percent_encoding.rs deleted file mode 100644 index a4fb6177a..000000000 --- a/third_party/rust/url/src/percent_encoding.rs +++ /dev/null @@ -1,344 +0,0 @@ -// Copyright 2013-2016 The rust-url developers. -// -// Licensed under the Apache License, Version 2.0 <LICENSE-APACHE or -// http://www.apache.org/licenses/LICENSE-2.0> or the MIT license -// <LICENSE-MIT or http://opensource.org/licenses/MIT>, at your -// option. This file may not be copied, modified, or distributed -// except according to those terms. - -use encoding; -use std::ascii::AsciiExt; -use std::borrow::Cow; -use std::fmt; -use std::slice; -use std::str; - -/// Represents a set of characters / bytes that should be percent-encoded. -/// -/// See [encode sets specification](http://url.spec.whatwg.org/#simple-encode-set). -/// -/// Different characters need to be encoded in different parts of an URL. -/// For example, a literal `?` question mark in an URL’s path would indicate -/// the start of the query string. -/// A question mark meant to be part of the path therefore needs to be percent-encoded. -/// In the query string however, a question mark does not have any special meaning -/// and does not need to be percent-encoded. -/// -/// A few sets are defined in this module. -/// Use the [`define_encode_set!`](../macro.define_encode_set!.html) macro to define different ones. -pub trait EncodeSet: Clone { - /// Called with UTF-8 bytes rather than code points. - /// Should return true for all non-ASCII bytes. - fn contains(&self, byte: u8) -> bool; -} - -/// Define a new struct -/// that implements the [`EncodeSet`](percent_encoding/trait.EncodeSet.html) trait, -/// for use in [`percent_decode()`](percent_encoding/fn.percent_encode.html) -/// and related functions. -/// -/// Parameters are characters to include in the set in addition to those of the base set. -/// See [encode sets specification](http://url.spec.whatwg.org/#simple-encode-set). -/// -/// Example -/// ======= -/// -/// ```rust -/// #[macro_use] extern crate url; -/// use url::percent_encoding::{utf8_percent_encode, SIMPLE_ENCODE_SET}; -/// define_encode_set! { -/// /// This encode set is used in the URL parser for query strings. -/// pub QUERY_ENCODE_SET = [SIMPLE_ENCODE_SET] | {' ', '"', '#', '<', '>'} -/// } -/// # fn main() { -/// assert_eq!(utf8_percent_encode("foo bar", QUERY_ENCODE_SET).collect::<String>(), "foo%20bar"); -/// # } -/// ``` -#[macro_export] -macro_rules! define_encode_set { - ($(#[$attr: meta])* pub $name: ident = [$base_set: expr] | {$($ch: pat),*}) => { - $(#[$attr])* - #[derive(Copy, Clone)] - #[allow(non_camel_case_types)] - pub struct $name; - - impl $crate::percent_encoding::EncodeSet for $name { - #[inline] - fn contains(&self, byte: u8) -> bool { - match byte as char { - $( - $ch => true, - )* - _ => $base_set.contains(byte) - } - } - } - } -} - -/// This encode set is used for the path of cannot-be-a-base URLs. -#[derive(Copy, Clone)] -#[allow(non_camel_case_types)] -pub struct SIMPLE_ENCODE_SET; - -impl EncodeSet for SIMPLE_ENCODE_SET { - #[inline] - fn contains(&self, byte: u8) -> bool { - byte < 0x20 || byte > 0x7E - } -} - -define_encode_set! { - /// This encode set is used in the URL parser for query strings. - pub QUERY_ENCODE_SET = [SIMPLE_ENCODE_SET] | {' ', '"', '#', '<', '>'} -} - -define_encode_set! { - /// This encode set is used for path components. - pub DEFAULT_ENCODE_SET = [QUERY_ENCODE_SET] | {'`', '?', '{', '}'} -} - -define_encode_set! { - /// This encode set is used for on '/'-separated path segment - pub PATH_SEGMENT_ENCODE_SET = [DEFAULT_ENCODE_SET] | {'%', '/'} -} - -define_encode_set! { - /// This encode set is used for username and password. - pub USERINFO_ENCODE_SET = [DEFAULT_ENCODE_SET] | { - '/', ':', ';', '=', '@', '[', '\\', ']', '^', '|' - } -} - -/// Return the percent-encoding of the given bytes. -/// -/// This is unconditional, unlike `percent_encode()` which uses an encode set. -pub fn percent_encode_byte(byte: u8) -> &'static str { - let index = usize::from(byte) * 3; - &"\ - %00%01%02%03%04%05%06%07%08%09%0A%0B%0C%0D%0E%0F\ - %10%11%12%13%14%15%16%17%18%19%1A%1B%1C%1D%1E%1F\ - %20%21%22%23%24%25%26%27%28%29%2A%2B%2C%2D%2E%2F\ - %30%31%32%33%34%35%36%37%38%39%3A%3B%3C%3D%3E%3F\ - %40%41%42%43%44%45%46%47%48%49%4A%4B%4C%4D%4E%4F\ - %50%51%52%53%54%55%56%57%58%59%5A%5B%5C%5D%5E%5F\ - %60%61%62%63%64%65%66%67%68%69%6A%6B%6C%6D%6E%6F\ - %70%71%72%73%74%75%76%77%78%79%7A%7B%7C%7D%7E%7F\ - %80%81%82%83%84%85%86%87%88%89%8A%8B%8C%8D%8E%8F\ - %90%91%92%93%94%95%96%97%98%99%9A%9B%9C%9D%9E%9F\ - %A0%A1%A2%A3%A4%A5%A6%A7%A8%A9%AA%AB%AC%AD%AE%AF\ - %B0%B1%B2%B3%B4%B5%B6%B7%B8%B9%BA%BB%BC%BD%BE%BF\ - %C0%C1%C2%C3%C4%C5%C6%C7%C8%C9%CA%CB%CC%CD%CE%CF\ - %D0%D1%D2%D3%D4%D5%D6%D7%D8%D9%DA%DB%DC%DD%DE%DF\ - %E0%E1%E2%E3%E4%E5%E6%E7%E8%E9%EA%EB%EC%ED%EE%EF\ - %F0%F1%F2%F3%F4%F5%F6%F7%F8%F9%FA%FB%FC%FD%FE%FF\ - "[index..index + 3] -} - -/// Percent-encode the given bytes with the given encode set. -/// -/// The encode set define which bytes (in addition to non-ASCII and controls) -/// need to be percent-encoded. -/// The choice of this set depends on context. -/// For example, `?` needs to be encoded in an URL path but not in a query string. -/// -/// The return value is an iterator of `&str` slices (so it has a `.collect::<String>()` method) -/// that also implements `Display` and `Into<Cow<str>>`. -/// The latter returns `Cow::Borrowed` when none of the bytes in `input` -/// are in the given encode set. -#[inline] -pub fn percent_encode<E: EncodeSet>(input: &[u8], encode_set: E) -> PercentEncode<E> { - PercentEncode { - bytes: input, - encode_set: encode_set, - } -} - -/// Percent-encode the UTF-8 encoding of the given string. -/// -/// See `percent_encode()` for how to use the return value. -#[inline] -pub fn utf8_percent_encode<E: EncodeSet>(input: &str, encode_set: E) -> PercentEncode<E> { - percent_encode(input.as_bytes(), encode_set) -} - -/// The return type of `percent_encode()` and `utf8_percent_encode()`. -#[derive(Clone)] -pub struct PercentEncode<'a, E: EncodeSet> { - bytes: &'a [u8], - encode_set: E, -} - -impl<'a, E: EncodeSet> Iterator for PercentEncode<'a, E> { - type Item = &'a str; - - fn next(&mut self) -> Option<&'a str> { - if let Some((&first_byte, remaining)) = self.bytes.split_first() { - if self.encode_set.contains(first_byte) { - self.bytes = remaining; - Some(percent_encode_byte(first_byte)) - } else { - assert!(first_byte.is_ascii()); - for (i, &byte) in remaining.iter().enumerate() { - if self.encode_set.contains(byte) { - // 1 for first_byte + i for previous iterations of this loop - let (unchanged_slice, remaining) = self.bytes.split_at(1 + i); - self.bytes = remaining; - return Some(unsafe { str::from_utf8_unchecked(unchanged_slice) }) - } else { - assert!(byte.is_ascii()); - } - } - let unchanged_slice = self.bytes; - self.bytes = &[][..]; - Some(unsafe { str::from_utf8_unchecked(unchanged_slice) }) - } - } else { - None - } - } - - fn size_hint(&self) -> (usize, Option<usize>) { - if self.bytes.is_empty() { - (0, Some(0)) - } else { - (1, Some(self.bytes.len())) - } - } -} - -impl<'a, E: EncodeSet> fmt::Display for PercentEncode<'a, E> { - fn fmt(&self, formatter: &mut fmt::Formatter) -> fmt::Result { - for c in (*self).clone() { - try!(formatter.write_str(c)) - } - Ok(()) - } -} - -impl<'a, E: EncodeSet> From<PercentEncode<'a, E>> for Cow<'a, str> { - fn from(mut iter: PercentEncode<'a, E>) -> Self { - match iter.next() { - None => "".into(), - Some(first) => { - match iter.next() { - None => first.into(), - Some(second) => { - let mut string = first.to_owned(); - string.push_str(second); - string.extend(iter); - string.into() - } - } - } - } - } -} - -/// Percent-decode the given bytes. -/// -/// The return value is an iterator of decoded `u8` bytes -/// that also implements `Into<Cow<u8>>` -/// (which returns `Cow::Borrowed` when `input` contains no percent-encoded sequence) -/// and has `decode_utf8()` and `decode_utf8_lossy()` methods. -#[inline] -pub fn percent_decode<'a>(input: &'a [u8]) -> PercentDecode<'a> { - PercentDecode { - bytes: input.iter() - } -} - -/// The return type of `percent_decode()`. -#[derive(Clone)] -pub struct PercentDecode<'a> { - bytes: slice::Iter<'a, u8>, -} - -fn after_percent_sign(iter: &mut slice::Iter<u8>) -> Option<u8> { - let initial_iter = iter.clone(); - let h = iter.next().and_then(|&b| (b as char).to_digit(16)); - let l = iter.next().and_then(|&b| (b as char).to_digit(16)); - if let (Some(h), Some(l)) = (h, l) { - Some(h as u8 * 0x10 + l as u8) - } else { - *iter = initial_iter; - None - } -} - -impl<'a> Iterator for PercentDecode<'a> { - type Item = u8; - - fn next(&mut self) -> Option<u8> { - self.bytes.next().map(|&byte| { - if byte == b'%' { - after_percent_sign(&mut self.bytes).unwrap_or(byte) - } else { - byte - } - }) - } - - fn size_hint(&self) -> (usize, Option<usize>) { - let bytes = self.bytes.len(); - (bytes / 3, Some(bytes)) - } -} - -impl<'a> From<PercentDecode<'a>> for Cow<'a, [u8]> { - fn from(iter: PercentDecode<'a>) -> Self { - match iter.if_any() { - Some(vec) => Cow::Owned(vec), - None => Cow::Borrowed(iter.bytes.as_slice()), - } - } -} - -impl<'a> PercentDecode<'a> { - /// If the percent-decoding is different from the input, return it as a new bytes vector. - pub fn if_any(&self) -> Option<Vec<u8>> { - let mut bytes_iter = self.bytes.clone(); - while bytes_iter.find(|&&b| b == b'%').is_some() { - if let Some(decoded_byte) = after_percent_sign(&mut bytes_iter) { - let initial_bytes = self.bytes.as_slice(); - let unchanged_bytes_len = initial_bytes.len() - bytes_iter.len() - 3; - let mut decoded = initial_bytes[..unchanged_bytes_len].to_owned(); - decoded.push(decoded_byte); - decoded.extend(PercentDecode { - bytes: bytes_iter - }); - return Some(decoded) - } - } - // Nothing to decode - None - } - - /// Decode the result of percent-decoding as UTF-8. - /// - /// This is return `Err` when the percent-decoded bytes are not well-formed in UTF-8. - pub fn decode_utf8(self) -> Result<Cow<'a, str>, str::Utf8Error> { - match self.clone().into() { - Cow::Borrowed(bytes) => { - match str::from_utf8(bytes) { - Ok(s) => Ok(s.into()), - Err(e) => Err(e), - } - } - Cow::Owned(bytes) => { - match String::from_utf8(bytes) { - Ok(s) => Ok(s.into()), - Err(e) => Err(e.utf8_error()), - } - } - } - } - - /// Decode the result of percent-decoding as UTF-8, lossily. - /// - /// Invalid UTF-8 percent-encoded byte sequences will be replaced � U+FFFD, - /// the replacement character. - pub fn decode_utf8_lossy(self) -> Cow<'a, str> { - encoding::decode_utf8_lossy(self.clone().into()) - } -} diff --git a/third_party/rust/url/src/quirks.rs b/third_party/rust/url/src/quirks.rs deleted file mode 100644 index 9a7537f47..000000000 --- a/third_party/rust/url/src/quirks.rs +++ /dev/null @@ -1,217 +0,0 @@ -// Copyright 2016 The rust-url developers. -// -// Licensed under the Apache License, Version 2.0 <LICENSE-APACHE or -// http://www.apache.org/licenses/LICENSE-2.0> or the MIT license -// <LICENSE-MIT or http://opensource.org/licenses/MIT>, at your -// option. This file may not be copied, modified, or distributed -// except according to those terms. - -//! Getters and setters for URL components implemented per https://url.spec.whatwg.org/#api -//! -//! Unless you need to be interoperable with web browsers, -//! you probably want to use `Url` method instead. - -use {Url, Position, Host, ParseError, idna}; -use parser::{Parser, SchemeType, default_port, Context, Input}; - -/// https://url.spec.whatwg.org/#dom-url-domaintoascii -pub fn domain_to_ascii(domain: &str) -> String { - match Host::parse(domain) { - Ok(Host::Domain(domain)) => domain, - _ => String::new(), - } -} - -/// https://url.spec.whatwg.org/#dom-url-domaintounicode -pub fn domain_to_unicode(domain: &str) -> String { - match Host::parse(domain) { - Ok(Host::Domain(ref domain)) => { - let (unicode, _errors) = idna::domain_to_unicode(domain); - unicode - } - _ => String::new(), - } -} - -/// Getter for https://url.spec.whatwg.org/#dom-url-href -pub fn href(url: &Url) -> &str { - url.as_str() -} - -/// Setter for https://url.spec.whatwg.org/#dom-url-href -pub fn set_href(url: &mut Url, value: &str) -> Result<(), ParseError> { - *url = try!(Url::parse(value)); - Ok(()) -} - -/// Getter for https://url.spec.whatwg.org/#dom-url-origin -pub fn origin(url: &Url) -> String { - url.origin().unicode_serialization() -} - -/// Getter for https://url.spec.whatwg.org/#dom-url-protocol -#[inline] -pub fn protocol(url: &Url) -> &str { - &url.as_str()[..url.scheme().len() + ":".len()] -} - -/// Setter for https://url.spec.whatwg.org/#dom-url-protocol -pub fn set_protocol(url: &mut Url, mut new_protocol: &str) -> Result<(), ()> { - // The scheme state in the spec ignores everything after the first `:`, - // but `set_scheme` errors if there is more. - if let Some(position) = new_protocol.find(':') { - new_protocol = &new_protocol[..position]; - } - url.set_scheme(new_protocol) -} - -/// Getter for https://url.spec.whatwg.org/#dom-url-username -#[inline] -pub fn username(url: &Url) -> &str { - url.username() -} - -/// Setter for https://url.spec.whatwg.org/#dom-url-username -pub fn set_username(url: &mut Url, new_username: &str) -> Result<(), ()> { - url.set_username(new_username) -} - -/// Getter for https://url.spec.whatwg.org/#dom-url-password -#[inline] -pub fn password(url: &Url) -> &str { - url.password().unwrap_or("") -} - -/// Setter for https://url.spec.whatwg.org/#dom-url-password -pub fn set_password(url: &mut Url, new_password: &str) -> Result<(), ()> { - url.set_password(if new_password.is_empty() { None } else { Some(new_password) }) -} - -/// Getter for https://url.spec.whatwg.org/#dom-url-host -#[inline] -pub fn host(url: &Url) -> &str { - &url[Position::BeforeHost..Position::AfterPort] -} - -/// Setter for https://url.spec.whatwg.org/#dom-url-host -pub fn set_host(url: &mut Url, new_host: &str) -> Result<(), ()> { - if url.cannot_be_a_base() { - return Err(()) - } - let host; - let opt_port; - { - let scheme = url.scheme(); - let result = Parser::parse_host(Input::new(new_host), SchemeType::from(scheme)); - match result { - Ok((h, remaining)) => { - host = h; - opt_port = if let Some(remaining) = remaining.split_prefix(':') { - Parser::parse_port(remaining, || default_port(scheme), Context::Setter) - .ok().map(|(port, _remaining)| port) - } else { - None - }; - } - Err(_) => return Err(()) - } - } - url.set_host_internal(host, opt_port); - Ok(()) -} - -/// Getter for https://url.spec.whatwg.org/#dom-url-hostname -#[inline] -pub fn hostname(url: &Url) -> &str { - url.host_str().unwrap_or("") -} - -/// Setter for https://url.spec.whatwg.org/#dom-url-hostname -pub fn set_hostname(url: &mut Url, new_hostname: &str) -> Result<(), ()> { - if url.cannot_be_a_base() { - return Err(()) - } - let result = Parser::parse_host(Input::new(new_hostname), SchemeType::from(url.scheme())); - if let Ok((host, _remaining)) = result { - url.set_host_internal(host, None); - Ok(()) - } else { - Err(()) - } -} - -/// Getter for https://url.spec.whatwg.org/#dom-url-port -#[inline] -pub fn port(url: &Url) -> &str { - &url[Position::BeforePort..Position::AfterPort] -} - -/// Setter for https://url.spec.whatwg.org/#dom-url-port -pub fn set_port(url: &mut Url, new_port: &str) -> Result<(), ()> { - let result; - { - // has_host implies !cannot_be_a_base - let scheme = url.scheme(); - if !url.has_host() || scheme == "file" { - return Err(()) - } - result = Parser::parse_port(Input::new(new_port), || default_port(scheme), Context::Setter) - } - if let Ok((new_port, _remaining)) = result { - url.set_port_internal(new_port); - Ok(()) - } else { - Err(()) - } -} - -/// Getter for https://url.spec.whatwg.org/#dom-url-pathname -#[inline] -pub fn pathname(url: &Url) -> &str { - url.path() -} - -/// Setter for https://url.spec.whatwg.org/#dom-url-pathname -pub fn set_pathname(url: &mut Url, new_pathname: &str) { - if !url.cannot_be_a_base() { - url.set_path(new_pathname) - } -} - -/// Getter for https://url.spec.whatwg.org/#dom-url-search -pub fn search(url: &Url) -> &str { - trim(&url[Position::AfterPath..Position::AfterQuery]) -} - -/// Setter for https://url.spec.whatwg.org/#dom-url-search -pub fn set_search(url: &mut Url, new_search: &str) { - url.set_query(match new_search { - "" => None, - _ if new_search.starts_with('?') => Some(&new_search[1..]), - _ => Some(new_search), - }) -} - -/// Getter for https://url.spec.whatwg.org/#dom-url-hash -pub fn hash(url: &Url) -> &str { - trim(&url[Position::AfterQuery..]) -} - -/// Setter for https://url.spec.whatwg.org/#dom-url-hash -pub fn set_hash(url: &mut Url, new_hash: &str) { - if url.scheme() != "javascript" { - url.set_fragment(match new_hash { - "" => None, - _ if new_hash.starts_with('#') => Some(&new_hash[1..]), - _ => Some(new_hash), - }) - } -} - -fn trim(s: &str) -> &str { - if s.len() == 1 { - "" - } else { - s - } -} diff --git a/third_party/rust/url/src/slicing.rs b/third_party/rust/url/src/slicing.rs deleted file mode 100644 index 926f3c796..000000000 --- a/third_party/rust/url/src/slicing.rs +++ /dev/null @@ -1,182 +0,0 @@ -// Copyright 2016 The rust-url developers. -// -// Licensed under the Apache License, Version 2.0 <LICENSE-APACHE or -// http://www.apache.org/licenses/LICENSE-2.0> or the MIT license -// <LICENSE-MIT or http://opensource.org/licenses/MIT>, at your -// option. This file may not be copied, modified, or distributed -// except according to those terms. - -use std::ops::{Range, RangeFrom, RangeTo, RangeFull, Index}; -use Url; - -impl Index<RangeFull> for Url { - type Output = str; - fn index(&self, _: RangeFull) -> &str { - &self.serialization - } -} - -impl Index<RangeFrom<Position>> for Url { - type Output = str; - fn index(&self, range: RangeFrom<Position>) -> &str { - &self.serialization[self.index(range.start)..] - } -} - -impl Index<RangeTo<Position>> for Url { - type Output = str; - fn index(&self, range: RangeTo<Position>) -> &str { - &self.serialization[..self.index(range.end)] - } -} - -impl Index<Range<Position>> for Url { - type Output = str; - fn index(&self, range: Range<Position>) -> &str { - &self.serialization[self.index(range.start)..self.index(range.end)] - } -} - -/// Indicates a position within a URL based on its components. -/// -/// A range of positions can be used for slicing `Url`: -/// -/// ```rust -/// # use url::{Url, Position}; -/// # fn something(some_url: Url) { -/// let serialization: &str = &some_url[..]; -/// let serialization_without_fragment: &str = &some_url[..Position::AfterQuery]; -/// let authority: &str = &some_url[Position::BeforeUsername..Position::AfterPort]; -/// let data_url_payload: &str = &some_url[Position::BeforePath..Position::AfterQuery]; -/// let scheme_relative: &str = &some_url[Position::BeforeUsername..]; -/// # } -/// ``` -/// -/// In a pseudo-grammar (where `[`…`]?` makes a sub-sequence optional), -/// URL components and delimiters that separate them are: -/// -/// ```notrust -/// url = -/// scheme ":" -/// [ "//" [ username [ ":" password ]? "@" ]? host [ ":" port ]? ]? -/// path [ "?" query ]? [ "#" fragment ]? -/// ``` -/// -/// When a given component is not present, -/// its "before" and "after" position are the same -/// (so that `&some_url[BeforeFoo..AfterFoo]` is the empty string) -/// and component ordering is preserved -/// (so that a missing query "is between" a path and a fragment). -/// -/// The end of a component and the start of the next are either the same or separate -/// by a delimiter. -/// (Not that the initial `/` of a path is considered part of the path here, not a delimiter.) -/// For example, `&url[..BeforeFragment]` would include a `#` delimiter (if present in `url`), -/// so `&url[..AfterQuery]` might be desired instead. -/// -/// `BeforeScheme` and `AfterFragment` are always the start and end of the entire URL, -/// so `&url[BeforeScheme..X]` is the same as `&url[..X]` -/// and `&url[X..AfterFragment]` is the same as `&url[X..]`. -#[derive(Copy, Clone, Debug)] -pub enum Position { - BeforeScheme, - AfterScheme, - BeforeUsername, - AfterUsername, - BeforePassword, - AfterPassword, - BeforeHost, - AfterHost, - BeforePort, - AfterPort, - BeforePath, - AfterPath, - BeforeQuery, - AfterQuery, - BeforeFragment, - AfterFragment -} - -impl Url { - #[inline] - fn index(&self, position: Position) -> usize { - match position { - Position::BeforeScheme => 0, - - Position::AfterScheme => self.scheme_end as usize, - - Position::BeforeUsername => if self.has_authority() { - self.scheme_end as usize + "://".len() - } else { - debug_assert!(self.byte_at(self.scheme_end) == b':'); - debug_assert!(self.scheme_end + ":".len() as u32 == self.username_end); - self.scheme_end as usize + ":".len() - }, - - Position::AfterUsername => self.username_end as usize, - - Position::BeforePassword => if self.has_authority() && - self.byte_at(self.username_end) == b':' { - self.username_end as usize + ":".len() - } else { - debug_assert!(self.username_end == self.host_start); - self.username_end as usize - }, - - Position::AfterPassword => if self.has_authority() && - self.byte_at(self.username_end) == b':' { - debug_assert!(self.byte_at(self.host_start - "@".len() as u32) == b'@'); - self.host_start as usize - "@".len() - } else { - debug_assert!(self.username_end == self.host_start); - self.host_start as usize - }, - - Position::BeforeHost => self.host_start as usize, - - Position::AfterHost => self.host_end as usize, - - Position::BeforePort => if self.port.is_some() { - debug_assert!(self.byte_at(self.host_end) == b':'); - self.host_end as usize + ":".len() - } else { - self.host_end as usize - }, - - Position::AfterPort => self.path_start as usize, - - Position::BeforePath => self.path_start as usize, - - Position::AfterPath => match (self.query_start, self.fragment_start) { - (Some(q), _) => q as usize, - (None, Some(f)) => f as usize, - (None, None) => self.serialization.len(), - }, - - Position::BeforeQuery => match (self.query_start, self.fragment_start) { - (Some(q), _) => { - debug_assert!(self.byte_at(q) == b'?'); - q as usize + "?".len() - } - (None, Some(f)) => f as usize, - (None, None) => self.serialization.len(), - }, - - Position::AfterQuery => match self.fragment_start { - None => self.serialization.len(), - Some(f) => f as usize, - }, - - Position::BeforeFragment => match self.fragment_start { - Some(f) => { - debug_assert!(self.byte_at(f) == b'#'); - f as usize + "#".len() - } - None => self.serialization.len(), - }, - - Position::AfterFragment => self.serialization.len(), - } - } -} - diff --git a/third_party/rust/url/tests/data.rs b/third_party/rust/url/tests/data.rs deleted file mode 100644 index b8945aa48..000000000 --- a/third_party/rust/url/tests/data.rs +++ /dev/null @@ -1,193 +0,0 @@ -// Copyright 2013-2014 The rust-url developers. -// -// Licensed under the Apache License, Version 2.0 <LICENSE-APACHE or -// http://www.apache.org/licenses/LICENSE-2.0> or the MIT license -// <LICENSE-MIT or http://opensource.org/licenses/MIT>, at your -// option. This file may not be copied, modified, or distributed -// except according to those terms. - -//! Data-driven tests - -extern crate rustc_serialize; -extern crate test; -extern crate url; - -use rustc_serialize::json::{self, Json}; -use url::{Url, quirks}; - - -fn run_parsing(input: String, base: String, expected: Result<ExpectedAttributes, ()>) { - let base = match Url::parse(&base) { - Ok(base) => base, - Err(message) => panic!("Error parsing base {:?}: {}", base, message) - }; - let (url, expected) = match (base.join(&input), expected) { - (Ok(url), Ok(expected)) => (url, expected), - (Err(_), Err(())) => return, - (Err(message), Ok(_)) => panic!("Error parsing URL {:?}: {}", input, message), - (Ok(_), Err(())) => panic!("Expected a parse error for URL {:?}", input), - }; - - url.assert_invariants(); - - macro_rules! assert_eq { - ($expected: expr, $got: expr) => { - { - let expected = $expected; - let got = $got; - assert!(expected == got, "{:?} != {} {:?} for URL {:?}", - got, stringify!($expected), expected, url); - } - } - } - - macro_rules! assert_attributes { - ($($attr: ident)+) => { - { - $( - assert_eq!(expected.$attr, quirks::$attr(&url)); - )+; - } - } - } - - assert_attributes!(href protocol username password host hostname port pathname search hash); - - if let Some(expected_origin) = expected.origin { - assert_eq!(expected_origin, quirks::origin(&url)); - } -} - -struct ExpectedAttributes { - href: String, - origin: Option<String>, - protocol: String, - username: String, - password: String, - host: String, - hostname: String, - port: String, - pathname: String, - search: String, - hash: String, -} - -trait JsonExt { - fn take(&mut self, key: &str) -> Option<Json>; - fn object(self) -> json::Object; - fn string(self) -> String; - fn take_string(&mut self, key: &str) -> String; -} - -impl JsonExt for Json { - fn take(&mut self, key: &str) -> Option<Json> { - self.as_object_mut().unwrap().remove(key) - } - - fn object(self) -> json::Object { - if let Json::Object(o) = self { o } else { panic!("Not a Json::Object") } - } - - fn string(self) -> String { - if let Json::String(s) = self { s } else { panic!("Not a Json::String") } - } - - fn take_string(&mut self, key: &str) -> String { - self.take(key).unwrap().string() - } -} - -fn collect_parsing<F: FnMut(String, test::TestFn)>(add_test: &mut F) { - // Copied form https://github.com/w3c/web-platform-tests/blob/master/url/ - let mut json = Json::from_str(include_str!("urltestdata.json")) - .expect("JSON parse error in urltestdata.json"); - for entry in json.as_array_mut().unwrap() { - if entry.is_string() { - continue // ignore comments - } - let base = entry.take_string("base"); - let input = entry.take_string("input"); - let expected = if entry.find("failure").is_some() { - Err(()) - } else { - Ok(ExpectedAttributes { - href: entry.take_string("href"), - origin: entry.take("origin").map(Json::string), - protocol: entry.take_string("protocol"), - username: entry.take_string("username"), - password: entry.take_string("password"), - host: entry.take_string("host"), - hostname: entry.take_string("hostname"), - port: entry.take_string("port"), - pathname: entry.take_string("pathname"), - search: entry.take_string("search"), - hash: entry.take_string("hash"), - }) - }; - add_test(format!("{:?} @ base {:?}", input, base), - test::TestFn::dyn_test_fn(move || run_parsing(input, base, expected))); - } -} - -fn collect_setters<F>(add_test: &mut F) where F: FnMut(String, test::TestFn) { - let mut json = Json::from_str(include_str!("setters_tests.json")) - .expect("JSON parse error in setters_tests.json"); - - macro_rules! setter { - ($attr: expr, $setter: ident) => {{ - let mut tests = json.take($attr).unwrap(); - for mut test in tests.as_array_mut().unwrap().drain(..) { - let comment = test.take("comment").map(Json::string).unwrap_or(String::new()); - let href = test.take_string("href"); - let new_value = test.take_string("new_value"); - let name = format!("{:?}.{} = {:?} {}", href, $attr, new_value, comment); - let mut expected = test.take("expected").unwrap(); - add_test(name, test::TestFn::dyn_test_fn(move || { - let mut url = Url::parse(&href).unwrap(); - url.assert_invariants(); - let _ = quirks::$setter(&mut url, &new_value); - assert_attributes!(url, expected, - href protocol username password host hostname port pathname search hash); - url.assert_invariants(); - })) - } - }} - } - macro_rules! assert_attributes { - ($url: expr, $expected: expr, $($attr: ident)+) => { - $( - if let Some(value) = $expected.take(stringify!($attr)) { - assert_eq!(quirks::$attr(&$url), value.string()) - } - )+ - } - } - setter!("protocol", set_protocol); - setter!("username", set_username); - setter!("password", set_password); - setter!("hostname", set_hostname); - setter!("host", set_host); - setter!("port", set_port); - setter!("pathname", set_pathname); - setter!("search", set_search); - setter!("hash", set_hash); -} - -fn main() { - let mut tests = Vec::new(); - { - let mut add_one = |name: String, run: test::TestFn| { - tests.push(test::TestDescAndFn { - desc: test::TestDesc { - name: test::DynTestName(name), - ignore: false, - should_panic: test::ShouldPanic::No, - }, - testfn: run, - }) - }; - collect_parsing(&mut add_one); - collect_setters(&mut add_one); - } - test::test_main(&std::env::args().collect::<Vec<_>>(), tests) -} diff --git a/third_party/rust/url/tests/setters_tests.json b/third_party/rust/url/tests/setters_tests.json deleted file mode 100644 index 669cc084a..000000000 --- a/third_party/rust/url/tests/setters_tests.json +++ /dev/null @@ -1,1148 +0,0 @@ -{ - "comment": [ - "## Tests for setters of https://url.spec.whatwg.org/#urlutils-members", - "", - "This file contains a JSON object.", - "Other than 'comment', each key is an attribute of the `URL` interface", - "defined in WHATWG’s URL Standard.", - "The values are arrays of test case objects for that attribute.", - "", - "To run a test case for the attribute `attr`:", - "", - "* Create a new `URL` object with the value for the 'href' key", - " the constructor single parameter. (Without a base URL.)", - " This must not throw.", - "* Set the attribute `attr` to (invoke its setter with)", - " with the value of for 'new_value' key.", - "* The value for the 'expected' key is another object.", - " For each `key` / `value` pair of that object,", - " get the attribute `key` (invoke its getter).", - " The returned string must be equal to `value`.", - "", - "Note: the 'href' setter is already covered by urltestdata.json." - ], - "protocol": [ - { - "comment": "The empty string is not a valid scheme. Setter leaves the URL unchanged.", - "href": "a://example.net", - "new_value": "", - "expected": { - "href": "a://example.net/", - "protocol": "a:" - } - }, - { - "href": "a://example.net", - "new_value": "b", - "expected": { - "href": "b://example.net/", - "protocol": "b:" - } - }, - { - "comment": "Upper-case ASCII is lower-cased", - "href": "a://example.net", - "new_value": "B", - "expected": { - "href": "b://example.net/", - "protocol": "b:" - } - }, - { - "comment": "Non-ASCII is rejected", - "href": "a://example.net", - "new_value": "é", - "expected": { - "href": "a://example.net/", - "protocol": "a:" - } - }, - { - "comment": "No leading digit", - "href": "a://example.net", - "new_value": "0b", - "expected": { - "href": "a://example.net/", - "protocol": "a:" - } - }, - { - "comment": "No leading punctuation", - "href": "a://example.net", - "new_value": "+b", - "expected": { - "href": "a://example.net/", - "protocol": "a:" - } - }, - { - "href": "a://example.net", - "new_value": "bC0+-.", - "expected": { - "href": "bc0+-.://example.net/", - "protocol": "bc0+-.:" - } - }, - { - "comment": "Only some punctuation is acceptable", - "href": "a://example.net", - "new_value": "b,c", - "expected": { - "href": "a://example.net/", - "protocol": "a:" - } - }, - { - "comment": "Non-ASCII is rejected", - "href": "a://example.net", - "new_value": "bé", - "expected": { - "href": "a://example.net/", - "protocol": "a:" - } - }, - { - "comment": "Spec deviation: from special scheme to not is not problematic. https://github.com/whatwg/url/issues/104", - "href": "http://example.net", - "new_value": "b", - "expected": { - "href": "b://example.net/", - "protocol": "b:" - } - }, - { - "comment": "Cannot-be-a-base URL doesn’t have a host, but URL in a special scheme must.", - "href": "mailto:me@example.net", - "new_value": "http", - "expected": { - "href": "mailto:me@example.net", - "protocol": "mailto:" - } - }, - { - "comment": "Spec deviation: from non-special scheme with a host to special is not problematic. https://github.com/whatwg/url/issues/104", - "href": "ssh://me@example.net", - "new_value": "http", - "expected": { - "href": "http://me@example.net/", - "protocol": "http:" - } - }, - { - "comment": "Stuff after the first ':' is ignored", - "href": "http://example.net", - "new_value": "https:foo : bar", - "expected": { - "href": "https://example.net/", - "protocol": "https:" - } - }, - { - "comment": "Stuff after the first ':' is ignored", - "href": "data:text/html,<p>Test", - "new_value": "view-source+data:foo : bar", - "expected": { - "href": "view-source+data:text/html,<p>Test", - "protocol": "view-source+data:" - } - } - ], - "username": [ - { - "comment": "No host means no username", - "href": "file:///home/you/index.html", - "new_value": "me", - "expected": { - "href": "file:///home/you/index.html", - "username": "" - } - }, - { - "comment": "No host means no username", - "href": "unix:/run/foo.socket", - "new_value": "me", - "expected": { - "href": "unix:/run/foo.socket", - "username": "" - } - }, - { - "comment": "Cannot-be-a-base means no username", - "href": "mailto:you@example.net", - "new_value": "me", - "expected": { - "href": "mailto:you@example.net", - "username": "" - } - }, - { - "href": "http://example.net", - "new_value": "me", - "expected": { - "href": "http://me@example.net/", - "username": "me" - } - }, - { - "href": "http://:secret@example.net", - "new_value": "me", - "expected": { - "href": "http://me:secret@example.net/", - "username": "me" - } - }, - { - "href": "http://me@example.net", - "new_value": "", - "expected": { - "href": "http://example.net/", - "username": "" - } - }, - { - "href": "http://me:secret@example.net", - "new_value": "", - "expected": { - "href": "http://:secret@example.net/", - "username": "" - } - }, - { - "comment": "UTF-8 percent encoding with the userinfo encode set.", - "href": "http://example.net", - "new_value": "\u0000\u0001\t\n\r\u001f !\"#$%&'()*+,-./09:;<=>?@AZ[\\]^_`az{|}~\u007f\u0080\u0081Éé", - "expected": { - "href": "http://%00%01%09%0A%0D%1F%20!%22%23$%&'()*+,-.%2F09%3A%3B%3C%3D%3E%3F%40AZ%5B%5C%5D%5E_%60az%7B%7C%7D~%7F%C2%80%C2%81%C3%89%C3%A9@example.net/", - "username": "%00%01%09%0A%0D%1F%20!%22%23$%&'()*+,-.%2F09%3A%3B%3C%3D%3E%3F%40AZ%5B%5C%5D%5E_%60az%7B%7C%7D~%7F%C2%80%C2%81%C3%89%C3%A9" - } - }, - { - "comment": "Bytes already percent-encoded are left as-is.", - "href": "http://example.net", - "new_value": "%c3%89té", - "expected": { - "href": "http://%c3%89t%C3%A9@example.net/", - "username": "%c3%89t%C3%A9" - } - } - ], - "password": [ - { - "comment": "No host means no password", - "href": "file:///home/me/index.html", - "new_value": "secret", - "expected": { - "href": "file:///home/me/index.html", - "password": "" - } - }, - { - "comment": "No host means no password", - "href": "unix:/run/foo.socket", - "new_value": "secret", - "expected": { - "href": "unix:/run/foo.socket", - "password": "" - } - }, - { - "comment": "Cannot-be-a-base means no password", - "href": "mailto:me@example.net", - "new_value": "secret", - "expected": { - "href": "mailto:me@example.net", - "password": "" - } - }, - { - "href": "http://example.net", - "new_value": "secret", - "expected": { - "href": "http://:secret@example.net/", - "password": "secret" - } - }, - { - "href": "http://me@example.net", - "new_value": "secret", - "expected": { - "href": "http://me:secret@example.net/", - "password": "secret" - } - }, - { - "href": "http://:secret@example.net", - "new_value": "", - "expected": { - "href": "http://example.net/", - "password": "" - } - }, - { - "href": "http://me:secret@example.net", - "new_value": "", - "expected": { - "href": "http://me@example.net/", - "password": "" - } - }, - { - "comment": "UTF-8 percent encoding with the userinfo encode set.", - "href": "http://example.net", - "new_value": "\u0000\u0001\t\n\r\u001f !\"#$%&'()*+,-./09:;<=>?@AZ[\\]^_`az{|}~\u007f\u0080\u0081Éé", - "expected": { - "href": "http://:%00%01%09%0A%0D%1F%20!%22%23$%&'()*+,-.%2F09%3A%3B%3C%3D%3E%3F%40AZ%5B%5C%5D%5E_%60az%7B%7C%7D~%7F%C2%80%C2%81%C3%89%C3%A9@example.net/", - "password": "%00%01%09%0A%0D%1F%20!%22%23$%&'()*+,-.%2F09%3A%3B%3C%3D%3E%3F%40AZ%5B%5C%5D%5E_%60az%7B%7C%7D~%7F%C2%80%C2%81%C3%89%C3%A9" - } - }, - { - "comment": "Bytes already percent-encoded are left as-is.", - "href": "http://example.net", - "new_value": "%c3%89té", - "expected": { - "href": "http://:%c3%89t%C3%A9@example.net/", - "password": "%c3%89t%C3%A9" - } - } - ], - "host": [ - { - "comment": "Cannot-be-a-base means no host", - "href": "mailto:me@example.net", - "new_value": "example.com", - "expected": { - "href": "mailto:me@example.net", - "host": "" - } - }, - { - "comment": "Cannot-be-a-base means no password", - "href": "data:text/plain,Stuff", - "new_value": "example.net", - "expected": { - "href": "data:text/plain,Stuff", - "host": "" - } - }, - { - "href": "http://example.net", - "new_value": "example.com:8080", - "expected": { - "href": "http://example.com:8080/", - "host": "example.com:8080", - "hostname": "example.com", - "port": "8080" - } - }, - { - "comment": "Port number is unchanged if not specified in the new value", - "href": "http://example.net:8080", - "new_value": "example.com", - "expected": { - "href": "http://example.com:8080/", - "host": "example.com:8080", - "hostname": "example.com", - "port": "8080" - } - }, - { - "comment": "Port number is removed if empty in the new value: https://github.com/whatwg/url/pull/113", - "href": "http://example.net:8080", - "new_value": "example.com:", - "expected": { - "href": "http://example.com/", - "host": "example.com", - "hostname": "example.com", - "port": "" - } - }, - { - "comment": "The empty host is not valid for special schemes", - "href": "http://example.net", - "new_value": "", - "expected": { - "href": "http://example.net/", - "host": "example.net" - } - }, - { - "comment": "The empty host is OK for non-special schemes", - "href": "view-source+http://example.net/foo", - "new_value": "", - "expected": { - "href": "view-source+http:///foo", - "host": "" - } - }, - { - "comment": "Path-only URLs can gain a host", - "href": "a:/foo", - "new_value": "example.net", - "expected": { - "href": "a://example.net/foo", - "host": "example.net" - } - }, - { - "comment": "Path-only URLs can gain a host", - "href": "a:/foo", - "new_value": "example.net", - "expected": { - "href": "a://example.net/foo", - "host": "example.net" - } - }, - { - "comment": "IPv4 address syntax is normalized", - "href": "http://example.net", - "new_value": "0x7F000001:8080", - "expected": { - "href": "http://127.0.0.1:8080/", - "host": "127.0.0.1:8080", - "hostname": "127.0.0.1", - "port": "8080" - } - }, - { - "comment": "IPv6 address syntax is normalized", - "href": "http://example.net", - "new_value": "[::0:01]:2", - "expected": { - "href": "http://[::1]:2/", - "host": "[::1]:2", - "hostname": "[::1]", - "port": "2" - } - }, - { - "comment": "Default port number is removed", - "href": "http://example.net", - "new_value": "example.com:80", - "expected": { - "href": "http://example.com/", - "host": "example.com", - "hostname": "example.com", - "port": "" - } - }, - { - "comment": "Default port number is removed", - "href": "https://example.net", - "new_value": "example.com:443", - "expected": { - "href": "https://example.com/", - "host": "example.com", - "hostname": "example.com", - "port": "" - } - }, - { - "comment": "Default port number is only removed for the relevant scheme", - "href": "https://example.net", - "new_value": "example.com:80", - "expected": { - "href": "https://example.com:80/", - "host": "example.com:80", - "hostname": "example.com", - "port": "80" - } - }, - { - "comment": "Stuff after a / delimiter is ignored", - "href": "http://example.net/path", - "new_value": "example.com/stuff", - "expected": { - "href": "http://example.com/path", - "host": "example.com", - "hostname": "example.com", - "port": "" - } - }, - { - "comment": "Stuff after a / delimiter is ignored", - "href": "http://example.net/path", - "new_value": "example.com:8080/stuff", - "expected": { - "href": "http://example.com:8080/path", - "host": "example.com:8080", - "hostname": "example.com", - "port": "8080" - } - }, - { - "comment": "Stuff after a ? delimiter is ignored", - "href": "http://example.net/path", - "new_value": "example.com?stuff", - "expected": { - "href": "http://example.com/path", - "host": "example.com", - "hostname": "example.com", - "port": "" - } - }, - { - "comment": "Stuff after a ? delimiter is ignored", - "href": "http://example.net/path", - "new_value": "example.com:8080?stuff", - "expected": { - "href": "http://example.com:8080/path", - "host": "example.com:8080", - "hostname": "example.com", - "port": "8080" - } - }, - { - "comment": "Stuff after a # delimiter is ignored", - "href": "http://example.net/path", - "new_value": "example.com#stuff", - "expected": { - "href": "http://example.com/path", - "host": "example.com", - "hostname": "example.com", - "port": "" - } - }, - { - "comment": "Stuff after a # delimiter is ignored", - "href": "http://example.net/path", - "new_value": "example.com:8080#stuff", - "expected": { - "href": "http://example.com:8080/path", - "host": "example.com:8080", - "hostname": "example.com", - "port": "8080" - } - }, - { - "comment": "Stuff after a \\ delimiter is ignored for special schemes", - "href": "http://example.net/path", - "new_value": "example.com\\stuff", - "expected": { - "href": "http://example.com/path", - "host": "example.com", - "hostname": "example.com", - "port": "" - } - }, - { - "comment": "Stuff after a \\ delimiter is ignored for special schemes", - "href": "http://example.net/path", - "new_value": "example.com:8080\\stuff", - "expected": { - "href": "http://example.com:8080/path", - "host": "example.com:8080", - "hostname": "example.com", - "port": "8080" - } - }, - { - "comment": "\\ is not a delimiter for non-special schemes, and it’s invalid in a domain", - "href": "view-source+http://example.net/path", - "new_value": "example.com\\stuff", - "expected": { - "href": "view-source+http://example.net/path", - "host": "example.net", - "hostname": "example.net", - "port": "" - } - }, - { - "comment": "Anything other than ASCII digit stops the port parser in a setter but is not an error", - "href": "view-source+http://example.net/path", - "new_value": "example.com:8080stuff2", - "expected": { - "href": "view-source+http://example.com:8080/path", - "host": "example.com:8080", - "hostname": "example.com", - "port": "8080" - } - }, - { - "comment": "Anything other than ASCII digit stops the port parser in a setter but is not an error", - "href": "http://example.net/path", - "new_value": "example.com:8080stuff2", - "expected": { - "href": "http://example.com:8080/path", - "host": "example.com:8080", - "hostname": "example.com", - "port": "8080" - } - }, - { - "comment": "Anything other than ASCII digit stops the port parser in a setter but is not an error", - "href": "http://example.net/path", - "new_value": "example.com:8080+2", - "expected": { - "href": "http://example.com:8080/path", - "host": "example.com:8080", - "hostname": "example.com", - "port": "8080" - } - }, - { - "comment": "Port numbers are 16 bit integers", - "href": "http://example.net/path", - "new_value": "example.com:65535", - "expected": { - "href": "http://example.com:65535/path", - "host": "example.com:65535", - "hostname": "example.com", - "port": "65535" - } - }, - { - "comment": "Port numbers are 16 bit integers, overflowing is an error. Hostname is still set, though.", - "href": "http://example.net/path", - "new_value": "example.com:65536", - "expected": { - "href": "http://example.com/path", - "host": "example.com", - "hostname": "example.com", - "port": "" - } - } - ], - "hostname": [ - { - "comment": "Cannot-be-a-base means no host", - "href": "mailto:me@example.net", - "new_value": "example.com", - "expected": { - "href": "mailto:me@example.net", - "host": "" - } - }, - { - "comment": "Cannot-be-a-base means no password", - "href": "data:text/plain,Stuff", - "new_value": "example.net", - "expected": { - "href": "data:text/plain,Stuff", - "host": "" - } - }, - { - "href": "http://example.net:8080", - "new_value": "example.com", - "expected": { - "href": "http://example.com:8080/", - "host": "example.com:8080", - "hostname": "example.com", - "port": "8080" - } - }, - { - "comment": "The empty host is not valid for special schemes", - "href": "http://example.net", - "new_value": "", - "expected": { - "href": "http://example.net/", - "host": "example.net" - } - }, - { - "comment": "The empty host is OK for non-special schemes", - "href": "view-source+http://example.net/foo", - "new_value": "", - "expected": { - "href": "view-source+http:///foo", - "host": "" - } - }, - { - "comment": "Path-only URLs can gain a host", - "href": "a:/foo", - "new_value": "example.net", - "expected": { - "href": "a://example.net/foo", - "host": "example.net" - } - }, - { - "comment": "Path-only URLs can gain a host", - "href": "a:/foo", - "new_value": "example.net", - "expected": { - "href": "a://example.net/foo", - "host": "example.net" - } - }, - { - "comment": "IPv4 address syntax is normalized", - "href": "http://example.net:8080", - "new_value": "0x7F000001", - "expected": { - "href": "http://127.0.0.1:8080/", - "host": "127.0.0.1:8080", - "hostname": "127.0.0.1", - "port": "8080" - } - }, - { - "comment": "IPv6 address syntax is normalized", - "href": "http://example.net", - "new_value": "[::0:01]", - "expected": { - "href": "http://[::1]/", - "host": "[::1]", - "hostname": "[::1]", - "port": "" - } - }, - { - "comment": "Stuff after a : delimiter is ignored", - "href": "http://example.net/path", - "new_value": "example.com:8080", - "expected": { - "href": "http://example.com/path", - "host": "example.com", - "hostname": "example.com", - "port": "" - } - }, - { - "comment": "Stuff after a : delimiter is ignored", - "href": "http://example.net:8080/path", - "new_value": "example.com:", - "expected": { - "href": "http://example.com:8080/path", - "host": "example.com:8080", - "hostname": "example.com", - "port": "8080" - } - }, - { - "comment": "Stuff after a / delimiter is ignored", - "href": "http://example.net/path", - "new_value": "example.com/stuff", - "expected": { - "href": "http://example.com/path", - "host": "example.com", - "hostname": "example.com", - "port": "" - } - }, - { - "comment": "Stuff after a ? delimiter is ignored", - "href": "http://example.net/path", - "new_value": "example.com?stuff", - "expected": { - "href": "http://example.com/path", - "host": "example.com", - "hostname": "example.com", - "port": "" - } - }, - { - "comment": "Stuff after a # delimiter is ignored", - "href": "http://example.net/path", - "new_value": "example.com#stuff", - "expected": { - "href": "http://example.com/path", - "host": "example.com", - "hostname": "example.com", - "port": "" - } - }, - { - "comment": "Stuff after a \\ delimiter is ignored for special schemes", - "href": "http://example.net/path", - "new_value": "example.com\\stuff", - "expected": { - "href": "http://example.com/path", - "host": "example.com", - "hostname": "example.com", - "port": "" - } - }, - { - "comment": "\\ is not a delimiter for non-special schemes, and it’s invalid in a domain", - "href": "view-source+http://example.net/path", - "new_value": "example.com\\stuff", - "expected": { - "href": "view-source+http://example.net/path", - "host": "example.net", - "hostname": "example.net", - "port": "" - } - } - ], - "port": [ - { - "href": "http://example.net", - "new_value": "8080", - "expected": { - "href": "http://example.net:8080/", - "host": "example.net:8080", - "hostname": "example.net", - "port": "8080" - } - }, - { - "comment": "Port number is removed if empty in the new value: https://github.com/whatwg/url/pull/113", - "href": "http://example.net:8080", - "new_value": "", - "expected": { - "href": "http://example.net/", - "host": "example.net", - "hostname": "example.net", - "port": "" - } - }, - { - "comment": "Default port number is removed", - "href": "http://example.net:8080", - "new_value": "80", - "expected": { - "href": "http://example.net/", - "host": "example.net", - "hostname": "example.net", - "port": "" - } - }, - { - "comment": "Default port number is removed", - "href": "https://example.net:4433", - "new_value": "443", - "expected": { - "href": "https://example.net/", - "host": "example.net", - "hostname": "example.net", - "port": "" - } - }, - { - "comment": "Default port number is only removed for the relevant scheme", - "href": "https://example.net", - "new_value": "80", - "expected": { - "href": "https://example.net:80/", - "host": "example.net:80", - "hostname": "example.net", - "port": "80" - } - }, - { - "comment": "Stuff after a / delimiter is ignored", - "href": "http://example.net/path", - "new_value": "8080/stuff", - "expected": { - "href": "http://example.net:8080/path", - "host": "example.net:8080", - "hostname": "example.net", - "port": "8080" - } - }, - { - "comment": "Stuff after a ? delimiter is ignored", - "href": "http://example.net/path", - "new_value": "8080?stuff", - "expected": { - "href": "http://example.net:8080/path", - "host": "example.net:8080", - "hostname": "example.net", - "port": "8080" - } - }, - { - "comment": "Stuff after a # delimiter is ignored", - "href": "http://example.net/path", - "new_value": "8080#stuff", - "expected": { - "href": "http://example.net:8080/path", - "host": "example.net:8080", - "hostname": "example.net", - "port": "8080" - } - }, - { - "comment": "Stuff after a \\ delimiter is ignored for special schemes", - "href": "http://example.net/path", - "new_value": "8080\\stuff", - "expected": { - "href": "http://example.net:8080/path", - "host": "example.net:8080", - "hostname": "example.net", - "port": "8080" - } - }, - { - "comment": "Anything other than ASCII digit stops the port parser in a setter but is not an error", - "href": "view-source+http://example.net/path", - "new_value": "8080stuff2", - "expected": { - "href": "view-source+http://example.net:8080/path", - "host": "example.net:8080", - "hostname": "example.net", - "port": "8080" - } - }, - { - "comment": "Anything other than ASCII digit stops the port parser in a setter but is not an error", - "href": "http://example.net/path", - "new_value": "8080stuff2", - "expected": { - "href": "http://example.net:8080/path", - "host": "example.net:8080", - "hostname": "example.net", - "port": "8080" - } - }, - { - "comment": "Anything other than ASCII digit stops the port parser in a setter but is not an error", - "href": "http://example.net/path", - "new_value": "8080+2", - "expected": { - "href": "http://example.net:8080/path", - "host": "example.net:8080", - "hostname": "example.net", - "port": "8080" - } - }, - { - "comment": "Port numbers are 16 bit integers", - "href": "http://example.net/path", - "new_value": "65535", - "expected": { - "href": "http://example.net:65535/path", - "host": "example.net:65535", - "hostname": "example.net", - "port": "65535" - } - }, - { - "comment": "Port numbers are 16 bit integers, overflowing is an error", - "href": "http://example.net:8080/path", - "new_value": "65536", - "expected": { - "href": "http://example.net:8080/path", - "host": "example.net:8080", - "hostname": "example.net", - "port": "8080" - } - } - ], - "pathname": [ - { - "comment": "Cannot-be-a-base don’t have a path", - "href": "mailto:me@example.net", - "new_value": "/foo", - "expected": { - "href": "mailto:me@example.net", - "pathname": "me@example.net" - } - }, - { - "href": "unix:/run/foo.socket?timeout=10", - "new_value": "/var/log/../run/bar.socket", - "expected": { - "href": "unix:/var/run/bar.socket?timeout=10", - "pathname": "/var/run/bar.socket" - } - }, - { - "href": "https://example.net#nav", - "new_value": "home", - "expected": { - "href": "https://example.net/home#nav", - "pathname": "/home" - } - }, - { - "href": "https://example.net#nav", - "new_value": "../home", - "expected": { - "href": "https://example.net/home#nav", - "pathname": "/home" - } - }, - { - "comment": "\\ is a segment delimiter for 'special' URLs", - "href": "http://example.net/home?lang=fr#nav", - "new_value": "\\a\\%2E\\b\\%2e.\\c", - "expected": { - "href": "http://example.net/a/c?lang=fr#nav", - "pathname": "/a/c" - } - }, - { - "comment": "\\ is *not* a segment delimiter for non-'special' URLs", - "href": "view-source+http://example.net/home?lang=fr#nav", - "new_value": "\\a\\%2E\\b\\%2e.\\c", - "expected": { - "href": "view-source+http://example.net/\\a\\.\\b\\..\\c?lang=fr#nav", - "pathname": "/\\a\\.\\b\\..\\c" - } - }, - { - "comment": "UTF-8 percent encoding with the default encode set. Tabs and newlines are removed. Leading or training C0 controls and space are removed.", - "href": "a:/", - "new_value": "\u0000\u0001\t\n\r\u001f !\u0000\u0001\t\n\r\u001f !\"#$%&'()*+,-./09:;<=>?@AZ[\\]^_`az{|}~\u007f\u0080\u0081Éé", - "expected": { - "href": "a:/!%00%01%1F%20!%22%23$%&'()*+,-./09:;%3C=%3E%3F@AZ[\\]^_%60az%7B|%7D~%7F%C2%80%C2%81%C3%89%C3%A9", - "pathname": "/!%00%01%1F%20!%22%23$%&'()*+,-./09:;%3C=%3E%3F@AZ[\\]^_%60az%7B|%7D~%7F%C2%80%C2%81%C3%89%C3%A9" - } - }, - { - "comment": "Bytes already percent-encoded are left as-is, except %2E.", - "href": "http://example.net", - "new_value": "%2e%2E%c3%89té", - "expected": { - "href": "http://example.net/..%c3%89t%C3%A9", - "pathname": "/..%c3%89t%C3%A9" - } - } - ], - "search": [ - { - "href": "https://example.net#nav", - "new_value": "lang=fr", - "expected": { - "href": "https://example.net/?lang=fr#nav", - "search": "?lang=fr" - } - }, - { - "href": "https://example.net?lang=en-US#nav", - "new_value": "lang=fr", - "expected": { - "href": "https://example.net/?lang=fr#nav", - "search": "?lang=fr" - } - }, - { - "href": "https://example.net?lang=en-US#nav", - "new_value": "?lang=fr", - "expected": { - "href": "https://example.net/?lang=fr#nav", - "search": "?lang=fr" - } - }, - { - "href": "https://example.net?lang=en-US#nav", - "new_value": "??lang=fr", - "expected": { - "href": "https://example.net/??lang=fr#nav", - "search": "??lang=fr" - } - }, - { - "href": "https://example.net?lang=en-US#nav", - "new_value": "?", - "expected": { - "href": "https://example.net/?#nav", - "search": "" - } - }, - { - "href": "https://example.net?lang=en-US#nav", - "new_value": "", - "expected": { - "href": "https://example.net/#nav", - "search": "" - } - }, - { - "href": "https://example.net?lang=en-US", - "new_value": "", - "expected": { - "href": "https://example.net/", - "search": "" - } - }, - { - "href": "https://example.net", - "new_value": "", - "expected": { - "href": "https://example.net/", - "search": "" - } - }, - { - "comment": "UTF-8 percent encoding with the query encode set. Tabs and newlines are removed. Leading or training C0 controls and space are removed.", - "href": "a:/", - "new_value": "\u0000\u0001\t\n\r\u001f !\u0000\u0001\t\n\r\u001f !\"#$%&'()*+,-./09:;<=>?@AZ[\\]^_`az{|}~\u007f\u0080\u0081Éé", - "expected": { - "href": "a:/?!%00%01%1F%20!%22%23$%&'()*+,-./09:;%3C=%3E?@AZ[\\]^_`az{|}~%7F%C2%80%C2%81%C3%89%C3%A9", - "search": "?!%00%01%1F%20!%22%23$%&'()*+,-./09:;%3C=%3E?@AZ[\\]^_`az{|}~%7F%C2%80%C2%81%C3%89%C3%A9" - } - }, - { - "comment": "Bytes already percent-encoded are left as-is", - "href": "http://example.net", - "new_value": "%c3%89té", - "expected": { - "href": "http://example.net/?%c3%89t%C3%A9", - "search": "?%c3%89t%C3%A9" - } - } - ], - "hash": [ - { - "href": "https://example.net", - "new_value": "main", - "expected": { - "href": "https://example.net/#main", - "hash": "#main" - } - }, - { - "href": "https://example.net#nav", - "new_value": "main", - "expected": { - "href": "https://example.net/#main", - "hash": "#main" - } - }, - { - "href": "https://example.net?lang=en-US", - "new_value": "##nav", - "expected": { - "href": "https://example.net/?lang=en-US##nav", - "hash": "##nav" - } - }, - { - "href": "https://example.net?lang=en-US#nav", - "new_value": "#main", - "expected": { - "href": "https://example.net/?lang=en-US#main", - "hash": "#main" - } - }, - { - "href": "https://example.net?lang=en-US#nav", - "new_value": "#", - "expected": { - "href": "https://example.net/?lang=en-US#", - "hash": "" - } - }, - { - "href": "https://example.net?lang=en-US#nav", - "new_value": "", - "expected": { - "href": "https://example.net/?lang=en-US", - "hash": "" - } - }, - { - "comment": "No percent-encoding at all (!); nuls, tabs, and newlines are removed. Leading or training C0 controls and space are removed.", - "href": "a:/", - "new_value": "\u0000\u0001\t\n\r\u001f !\u0000\u0001\t\n\r\u001f !\"#$%&'()*+,-./09:;<=>?@AZ[\\]^_`az{|}~\u007f\u0080\u0081Éé", - "expected": { - "href": "a:/#!\u0001\u001f !\"#$%&'()*+,-./09:;<=>?@AZ[\\]^_`az{|}~\u007f\u0080\u0081Éé", - "hash": "#!\u0001\u001f !\"#$%&'()*+,-./09:;<=>?@AZ[\\]^_`az{|}~\u007f\u0080\u0081Éé" - } - }, - { - "comment": "Bytes already percent-encoded are left as-is", - "href": "http://example.net", - "new_value": "%c3%89té", - "expected": { - "href": "http://example.net/#%c3%89té", - "hash": "#%c3%89té" - } - } - ] -} diff --git a/third_party/rust/url/tests/unit.rs b/third_party/rust/url/tests/unit.rs deleted file mode 100644 index 7cea1000c..000000000 --- a/third_party/rust/url/tests/unit.rs +++ /dev/null @@ -1,303 +0,0 @@ -// Copyright 2013-2014 The rust-url developers. -// -// Licensed under the Apache License, Version 2.0 <LICENSE-APACHE or -// http://www.apache.org/licenses/LICENSE-2.0> or the MIT license -// <LICENSE-MIT or http://opensource.org/licenses/MIT>, at your -// option. This file may not be copied, modified, or distributed -// except according to those terms. - -//! Unit tests - -extern crate url; - -use std::borrow::Cow; -use std::net::{Ipv4Addr, Ipv6Addr}; -use std::path::{Path, PathBuf}; -use url::{Host, Url, form_urlencoded}; - -macro_rules! assert_from_file_path { - ($path: expr) => { assert_from_file_path!($path, $path) }; - ($path: expr, $url_path: expr) => {{ - let url = Url::from_file_path(Path::new($path)).unwrap(); - assert_eq!(url.host(), None); - assert_eq!(url.path(), $url_path); - assert_eq!(url.to_file_path(), Ok(PathBuf::from($path))); - }}; -} - - - -#[test] -fn new_file_paths() { - if cfg!(unix) { - assert_eq!(Url::from_file_path(Path::new("relative")), Err(())); - assert_eq!(Url::from_file_path(Path::new("../relative")), Err(())); - } - if cfg!(windows) { - assert_eq!(Url::from_file_path(Path::new("relative")), Err(())); - assert_eq!(Url::from_file_path(Path::new(r"..\relative")), Err(())); - assert_eq!(Url::from_file_path(Path::new(r"\drive-relative")), Err(())); - assert_eq!(Url::from_file_path(Path::new(r"\\ucn\")), Err(())); - } - - if cfg!(unix) { - assert_from_file_path!("/foo/bar"); - assert_from_file_path!("/foo/ba\0r", "/foo/ba%00r"); - assert_from_file_path!("/foo/ba%00r", "/foo/ba%2500r"); - } -} - -#[test] -#[cfg(unix)] -fn new_path_bad_utf8() { - use std::ffi::OsStr; - use std::os::unix::prelude::*; - - let url = Url::from_file_path(Path::new(OsStr::from_bytes(b"/foo/ba\x80r"))).unwrap(); - let os_str = OsStr::from_bytes(b"/foo/ba\x80r"); - assert_eq!(url.to_file_path(), Ok(PathBuf::from(os_str))); -} - -#[test] -fn new_path_windows_fun() { - if cfg!(windows) { - assert_from_file_path!(r"C:\foo\bar", "/C:/foo/bar"); - assert_from_file_path!("C:\\foo\\ba\0r", "/C:/foo/ba%00r"); - - // Invalid UTF-8 - assert!(Url::parse("file:///C:/foo/ba%80r").unwrap().to_file_path().is_err()); - - // test windows canonicalized path - let path = PathBuf::from(r"\\?\C:\foo\bar"); - assert!(Url::from_file_path(path).is_ok()); - } -} - - -#[test] -fn new_directory_paths() { - if cfg!(unix) { - assert_eq!(Url::from_directory_path(Path::new("relative")), Err(())); - assert_eq!(Url::from_directory_path(Path::new("../relative")), Err(())); - - let url = Url::from_directory_path(Path::new("/foo/bar")).unwrap(); - assert_eq!(url.host(), None); - assert_eq!(url.path(), "/foo/bar/"); - } - if cfg!(windows) { - assert_eq!(Url::from_directory_path(Path::new("relative")), Err(())); - assert_eq!(Url::from_directory_path(Path::new(r"..\relative")), Err(())); - assert_eq!(Url::from_directory_path(Path::new(r"\drive-relative")), Err(())); - assert_eq!(Url::from_directory_path(Path::new(r"\\ucn\")), Err(())); - - let url = Url::from_directory_path(Path::new(r"C:\foo\bar")).unwrap(); - assert_eq!(url.host(), None); - assert_eq!(url.path(), "/C:/foo/bar/"); - } -} - -#[test] -fn from_str() { - assert!("http://testing.com/this".parse::<Url>().is_ok()); -} - -#[test] -fn issue_124() { - let url: Url = "file:a".parse().unwrap(); - assert_eq!(url.path(), "/a"); - let url: Url = "file:...".parse().unwrap(); - assert_eq!(url.path(), "/..."); - let url: Url = "file:..".parse().unwrap(); - assert_eq!(url.path(), "/"); -} - -#[test] -fn test_equality() { - use std::hash::{Hash, Hasher, SipHasher}; - - fn check_eq(a: &Url, b: &Url) { - assert_eq!(a, b); - - let mut h1 = SipHasher::new(); - a.hash(&mut h1); - let mut h2 = SipHasher::new(); - b.hash(&mut h2); - assert_eq!(h1.finish(), h2.finish()); - } - - fn url(s: &str) -> Url { - let rv = s.parse().unwrap(); - check_eq(&rv, &rv); - rv - } - - // Doesn't care if default port is given. - let a: Url = url("https://example.com/"); - let b: Url = url("https://example.com:443/"); - check_eq(&a, &b); - - // Different ports - let a: Url = url("http://example.com/"); - let b: Url = url("http://example.com:8080/"); - assert!(a != b, "{:?} != {:?}", a, b); - - // Different scheme - let a: Url = url("http://example.com/"); - let b: Url = url("https://example.com/"); - assert!(a != b); - - // Different host - let a: Url = url("http://foo.com/"); - let b: Url = url("http://bar.com/"); - assert!(a != b); - - // Missing path, automatically substituted. Semantically the same. - let a: Url = url("http://foo.com"); - let b: Url = url("http://foo.com/"); - check_eq(&a, &b); -} - -#[test] -fn host() { - fn assert_host(input: &str, host: Host<&str>) { - assert_eq!(Url::parse(input).unwrap().host(), Some(host)); - } - assert_host("http://www.mozilla.org", Host::Domain("www.mozilla.org")); - assert_host("http://1.35.33.49", Host::Ipv4(Ipv4Addr::new(1, 35, 33, 49))); - assert_host("http://[2001:0db8:85a3:08d3:1319:8a2e:0370:7344]", Host::Ipv6(Ipv6Addr::new( - 0x2001, 0x0db8, 0x85a3, 0x08d3, 0x1319, 0x8a2e, 0x0370, 0x7344))); - assert_host("http://1.35.+33.49", Host::Domain("1.35.+33.49")); - assert_host("http://[::]", Host::Ipv6(Ipv6Addr::new(0, 0, 0, 0, 0, 0, 0, 0))); - assert_host("http://[::1]", Host::Ipv6(Ipv6Addr::new(0, 0, 0, 0, 0, 0, 0, 1))); - assert_host("http://0x1.0X23.0x21.061", Host::Ipv4(Ipv4Addr::new(1, 35, 33, 49))); - assert_host("http://0x1232131", Host::Ipv4(Ipv4Addr::new(1, 35, 33, 49))); - assert_host("http://111", Host::Ipv4(Ipv4Addr::new(0, 0, 0, 111))); - assert_host("http://2..2.3", Host::Domain("2..2.3")); - assert!(Url::parse("http://42.0x1232131").is_err()); - assert!(Url::parse("http://192.168.0.257").is_err()); -} - -#[test] -fn host_serialization() { - // libstd’s `Display for Ipv6Addr` serializes 0:0:0:0:0:0:_:_ and 0:0:0:0:0:ffff:_:_ - // using IPv4-like syntax, as suggested in https://tools.ietf.org/html/rfc5952#section-4 - // but https://url.spec.whatwg.org/#concept-ipv6-serializer specifies not to. - - // Not [::0.0.0.2] / [::ffff:0.0.0.2] - assert_eq!(Url::parse("http://[0::2]").unwrap().host_str(), Some("[::2]")); - assert_eq!(Url::parse("http://[0::ffff:0:2]").unwrap().host_str(), Some("[::ffff:0:2]")); -} - -#[test] -fn test_idna() { - assert!("http://goșu.ro".parse::<Url>().is_ok()); - assert_eq!(Url::parse("http://☃.net/").unwrap().host(), Some(Host::Domain("xn--n3h.net"))); -} - -#[test] -fn test_serialization() { - let data = [ - ("http://example.com/", "http://example.com/"), - ("http://addslash.com", "http://addslash.com/"), - ("http://@emptyuser.com/", "http://emptyuser.com/"), - ("http://:@emptypass.com/", "http://:@emptypass.com/"), - ("http://user@user.com/", "http://user@user.com/"), - ("http://user:pass@userpass.com/", "http://user:pass@userpass.com/"), - ("http://slashquery.com/path/?q=something", "http://slashquery.com/path/?q=something"), - ("http://noslashquery.com/path?q=something", "http://noslashquery.com/path?q=something") - ]; - for &(input, result) in &data { - let url = Url::parse(input).unwrap(); - assert_eq!(url.as_str(), result); - } -} - -#[test] -fn test_form_urlencoded() { - let pairs: &[(Cow<str>, Cow<str>)] = &[ - ("foo".into(), "é&".into()), - ("bar".into(), "".into()), - ("foo".into(), "#".into()) - ]; - let encoded = form_urlencoded::Serializer::new(String::new()).extend_pairs(pairs).finish(); - assert_eq!(encoded, "foo=%C3%A9%26&bar=&foo=%23"); - assert_eq!(form_urlencoded::parse(encoded.as_bytes()).collect::<Vec<_>>(), pairs.to_vec()); -} - -#[test] -fn test_form_serialize() { - let encoded = form_urlencoded::Serializer::new(String::new()) - .append_pair("foo", "é&") - .append_pair("bar", "") - .append_pair("foo", "#") - .finish(); - assert_eq!(encoded, "foo=%C3%A9%26&bar=&foo=%23"); -} - -#[test] -/// https://github.com/servo/rust-url/issues/25 -fn issue_25() { - let filename = if cfg!(windows) { r"C:\run\pg.sock" } else { "/run/pg.sock" }; - let mut url = Url::from_file_path(filename).unwrap(); - url.assert_invariants(); - url.set_scheme("postgres").unwrap(); - url.assert_invariants(); - url.set_host(Some("")).unwrap(); - url.assert_invariants(); - url.set_username("me").unwrap(); - url.assert_invariants(); - let expected = format!("postgres://me@/{}run/pg.sock", if cfg!(windows) { "C:/" } else { "" }); - assert_eq!(url.as_str(), expected); -} - -#[test] -/// https://github.com/servo/rust-url/issues/61 -fn issue_61() { - let mut url = Url::parse("http://mozilla.org").unwrap(); - url.set_scheme("https").unwrap(); - assert_eq!(url.port(), None); - assert_eq!(url.port_or_known_default(), Some(443)); - url.assert_invariants(); -} - -#[test] -#[cfg(not(windows))] -/// https://github.com/servo/rust-url/issues/197 -fn issue_197() { - let mut url = Url::from_file_path("/").expect("Failed to parse path"); - url.assert_invariants(); - assert_eq!(url, Url::parse("file:///").expect("Failed to parse path + protocol")); - url.path_segments_mut().expect("path_segments_mut").pop_if_empty(); -} - -#[test] -/// https://github.com/servo/rust-url/issues/222 -fn append_trailing_slash() { - let mut url: Url = "http://localhost:6767/foo/bar?a=b".parse().unwrap(); - url.assert_invariants(); - url.path_segments_mut().unwrap().push(""); - url.assert_invariants(); - assert_eq!(url.to_string(), "http://localhost:6767/foo/bar/?a=b"); -} - -#[test] -/// https://github.com/servo/rust-url/issues/227 -fn extend_query_pairs_then_mutate() { - let mut url: Url = "http://localhost:6767/foo/bar".parse().unwrap(); - url.query_pairs_mut().extend_pairs(vec![ ("auth", "my-token") ].into_iter()); - url.assert_invariants(); - assert_eq!(url.to_string(), "http://localhost:6767/foo/bar?auth=my-token"); - url.path_segments_mut().unwrap().push("some_other_path"); - url.assert_invariants(); - assert_eq!(url.to_string(), "http://localhost:6767/foo/bar/some_other_path?auth=my-token"); -} - -#[test] -/// https://github.com/servo/rust-url/issues/222 -fn append_empty_segment_then_mutate() { - let mut url: Url = "http://localhost:6767/foo/bar?a=b".parse().unwrap(); - url.assert_invariants(); - url.path_segments_mut().unwrap().push("").pop(); - url.assert_invariants(); - assert_eq!(url.to_string(), "http://localhost:6767/foo/bar?a=b"); -} diff --git a/third_party/rust/url/tests/urltestdata.json b/third_party/rust/url/tests/urltestdata.json deleted file mode 100644 index ee5416ecf..000000000 --- a/third_party/rust/url/tests/urltestdata.json +++ /dev/null @@ -1,4277 +0,0 @@ -[ - "# Based on http://trac.webkit.org/browser/trunk/LayoutTests/fast/url/script-tests/segments.js", - { - "input": "http://example\t.\norg", - "base": "http://example.org/foo/bar", - "href": "http://example.org/", - "origin": "http://example.org", - "protocol": "http:", - "username": "", - "password": "", - "host": "example.org", - "hostname": "example.org", - "port": "", - "pathname": "/", - "search": "", - "hash": "" - }, - { - "input": "http://user:pass@foo:21/bar;par?b#c", - "base": "http://example.org/foo/bar", - "href": "http://user:pass@foo:21/bar;par?b#c", - "origin": "http://foo:21", - "protocol": "http:", - "username": "user", - "password": "pass", - "host": "foo:21", - "hostname": "foo", - "port": "21", - "pathname": "/bar;par", - "search": "?b", - "hash": "#c" - }, - { - "input": "http:foo.com", - "base": "http://example.org/foo/bar", - "href": "http://example.org/foo/foo.com", - "origin": "http://example.org", - "protocol": "http:", - "username": "", - "password": "", - "host": "example.org", - "hostname": "example.org", - "port": "", - "pathname": "/foo/foo.com", - "search": "", - "hash": "" - }, - { - "input": "\t :foo.com \n", - "base": "http://example.org/foo/bar", - "href": "http://example.org/foo/:foo.com", - "origin": "http://example.org", - "protocol": "http:", - "username": "", - "password": "", - "host": "example.org", - "hostname": "example.org", - "port": "", - "pathname": "/foo/:foo.com", - "search": "", - "hash": "" - }, - { - "input": " foo.com ", - "base": "http://example.org/foo/bar", - "href": "http://example.org/foo/foo.com", - "origin": "http://example.org", - "protocol": "http:", - "username": "", - "password": "", - "host": "example.org", - "hostname": "example.org", - "port": "", - "pathname": "/foo/foo.com", - "search": "", - "hash": "" - }, - { - "input": "a:\t foo.com", - "base": "http://example.org/foo/bar", - "href": "a: foo.com", - "origin": "null", - "protocol": "a:", - "username": "", - "password": "", - "host": "", - "hostname": "", - "port": "", - "pathname": " foo.com", - "search": "", - "hash": "" - }, - { - "input": "http://f:21/ b ? d # e ", - "base": "http://example.org/foo/bar", - "href": "http://f:21/%20b%20?%20d%20# e", - "origin": "http://f:21", - "protocol": "http:", - "username": "", - "password": "", - "host": "f:21", - "hostname": "f", - "port": "21", - "pathname": "/%20b%20", - "search": "?%20d%20", - "hash": "# e" - }, - { - "input": "http://f:/c", - "base": "http://example.org/foo/bar", - "href": "http://f/c", - "origin": "http://f", - "protocol": "http:", - "username": "", - "password": "", - "host": "f", - "hostname": "f", - "port": "", - "pathname": "/c", - "search": "", - "hash": "" - }, - { - "input": "http://f:0/c", - "base": "http://example.org/foo/bar", - "href": "http://f:0/c", - "origin": "http://f:0", - "protocol": "http:", - "username": "", - "password": "", - "host": "f:0", - "hostname": "f", - "port": "0", - "pathname": "/c", - "search": "", - "hash": "" - }, - { - "input": "http://f:00000000000000/c", - "base": "http://example.org/foo/bar", - "href": "http://f:0/c", - "origin": "http://f:0", - "protocol": "http:", - "username": "", - "password": "", - "host": "f:0", - "hostname": "f", - "port": "0", - "pathname": "/c", - "search": "", - "hash": "" - }, - { - "input": "http://f:00000000000000000000080/c", - "base": "http://example.org/foo/bar", - "href": "http://f/c", - "origin": "http://f", - "protocol": "http:", - "username": "", - "password": "", - "host": "f", - "hostname": "f", - "port": "", - "pathname": "/c", - "search": "", - "hash": "" - }, - { - "input": "http://f:b/c", - "base": "http://example.org/foo/bar", - "failure": true - }, - { - "input": "http://f: /c", - "base": "http://example.org/foo/bar", - "failure": true - }, - { - "input": "http://f:\n/c", - "base": "http://example.org/foo/bar", - "href": "http://f/c", - "origin": "http://f", - "protocol": "http:", - "username": "", - "password": "", - "host": "f", - "hostname": "f", - "port": "", - "pathname": "/c", - "search": "", - "hash": "" - }, - { - "input": "http://f:fifty-two/c", - "base": "http://example.org/foo/bar", - "failure": true - }, - { - "input": "http://f:999999/c", - "base": "http://example.org/foo/bar", - "failure": true - }, - { - "input": "http://f: 21 / b ? d # e ", - "base": "http://example.org/foo/bar", - "failure": true - }, - { - "input": "", - "base": "http://example.org/foo/bar", - "href": "http://example.org/foo/bar", - "origin": "http://example.org", - "protocol": "http:", - "username": "", - "password": "", - "host": "example.org", - "hostname": "example.org", - "port": "", - "pathname": "/foo/bar", - "search": "", - "hash": "" - }, - { - "input": " \t", - "base": "http://example.org/foo/bar", - "href": "http://example.org/foo/bar", - "origin": "http://example.org", - "protocol": "http:", - "username": "", - "password": "", - "host": "example.org", - "hostname": "example.org", - "port": "", - "pathname": "/foo/bar", - "search": "", - "hash": "" - }, - { - "input": ":foo.com/", - "base": "http://example.org/foo/bar", - "href": "http://example.org/foo/:foo.com/", - "origin": "http://example.org", - "protocol": "http:", - "username": "", - "password": "", - "host": "example.org", - "hostname": "example.org", - "port": "", - "pathname": "/foo/:foo.com/", - "search": "", - "hash": "" - }, - { - "input": ":foo.com\\", - "base": "http://example.org/foo/bar", - "href": "http://example.org/foo/:foo.com/", - "origin": "http://example.org", - "protocol": "http:", - "username": "", - "password": "", - "host": "example.org", - "hostname": "example.org", - "port": "", - "pathname": "/foo/:foo.com/", - "search": "", - "hash": "" - }, - { - "input": ":", - "base": "http://example.org/foo/bar", - "href": "http://example.org/foo/:", - "origin": "http://example.org", - "protocol": "http:", - "username": "", - "password": "", - "host": "example.org", - "hostname": "example.org", - "port": "", - "pathname": "/foo/:", - "search": "", - "hash": "" - }, - { - "input": ":a", - "base": "http://example.org/foo/bar", - "href": "http://example.org/foo/:a", - "origin": "http://example.org", - "protocol": "http:", - "username": "", - "password": "", - "host": "example.org", - "hostname": "example.org", - "port": "", - "pathname": "/foo/:a", - "search": "", - "hash": "" - }, - { - "input": ":/", - "base": "http://example.org/foo/bar", - "href": "http://example.org/foo/:/", - "origin": "http://example.org", - "protocol": "http:", - "username": "", - "password": "", - "host": "example.org", - "hostname": "example.org", - "port": "", - "pathname": "/foo/:/", - "search": "", - "hash": "" - }, - { - "input": ":\\", - "base": "http://example.org/foo/bar", - "href": "http://example.org/foo/:/", - "origin": "http://example.org", - "protocol": "http:", - "username": "", - "password": "", - "host": "example.org", - "hostname": "example.org", - "port": "", - "pathname": "/foo/:/", - "search": "", - "hash": "" - }, - { - "input": ":#", - "base": "http://example.org/foo/bar", - "href": "http://example.org/foo/:#", - "origin": "http://example.org", - "protocol": "http:", - "username": "", - "password": "", - "host": "example.org", - "hostname": "example.org", - "port": "", - "pathname": "/foo/:", - "search": "", - "hash": "" - }, - { - "input": "#", - "base": "http://example.org/foo/bar", - "href": "http://example.org/foo/bar#", - "origin": "http://example.org", - "protocol": "http:", - "username": "", - "password": "", - "host": "example.org", - "hostname": "example.org", - "port": "", - "pathname": "/foo/bar", - "search": "", - "hash": "" - }, - { - "input": "#/", - "base": "http://example.org/foo/bar", - "href": "http://example.org/foo/bar#/", - "origin": "http://example.org", - "protocol": "http:", - "username": "", - "password": "", - "host": "example.org", - "hostname": "example.org", - "port": "", - "pathname": "/foo/bar", - "search": "", - "hash": "#/" - }, - { - "input": "#\\", - "base": "http://example.org/foo/bar", - "href": "http://example.org/foo/bar#\\", - "origin": "http://example.org", - "protocol": "http:", - "username": "", - "password": "", - "host": "example.org", - "hostname": "example.org", - "port": "", - "pathname": "/foo/bar", - "search": "", - "hash": "#\\" - }, - { - "input": "#;?", - "base": "http://example.org/foo/bar", - "href": "http://example.org/foo/bar#;?", - "origin": "http://example.org", - "protocol": "http:", - "username": "", - "password": "", - "host": "example.org", - "hostname": "example.org", - "port": "", - "pathname": "/foo/bar", - "search": "", - "hash": "#;?" - }, - { - "input": "?", - "base": "http://example.org/foo/bar", - "href": "http://example.org/foo/bar?", - "origin": "http://example.org", - "protocol": "http:", - "username": "", - "password": "", - "host": "example.org", - "hostname": "example.org", - "port": "", - "pathname": "/foo/bar", - "search": "", - "hash": "" - }, - { - "input": "/", - "base": "http://example.org/foo/bar", - "href": "http://example.org/", - "origin": "http://example.org", - "protocol": "http:", - "username": "", - "password": "", - "host": "example.org", - "hostname": "example.org", - "port": "", - "pathname": "/", - "search": "", - "hash": "" - }, - { - "input": ":23", - "base": "http://example.org/foo/bar", - "href": "http://example.org/foo/:23", - "origin": "http://example.org", - "protocol": "http:", - "username": "", - "password": "", - "host": "example.org", - "hostname": "example.org", - "port": "", - "pathname": "/foo/:23", - "search": "", - "hash": "" - }, - { - "input": "/:23", - "base": "http://example.org/foo/bar", - "href": "http://example.org/:23", - "origin": "http://example.org", - "protocol": "http:", - "username": "", - "password": "", - "host": "example.org", - "hostname": "example.org", - "port": "", - "pathname": "/:23", - "search": "", - "hash": "" - }, - { - "input": "::", - "base": "http://example.org/foo/bar", - "href": "http://example.org/foo/::", - "origin": "http://example.org", - "protocol": "http:", - "username": "", - "password": "", - "host": "example.org", - "hostname": "example.org", - "port": "", - "pathname": "/foo/::", - "search": "", - "hash": "" - }, - { - "input": "::23", - "base": "http://example.org/foo/bar", - "href": "http://example.org/foo/::23", - "origin": "http://example.org", - "protocol": "http:", - "username": "", - "password": "", - "host": "example.org", - "hostname": "example.org", - "port": "", - "pathname": "/foo/::23", - "search": "", - "hash": "" - }, - { - "input": "foo://", - "base": "http://example.org/foo/bar", - "href": "foo:///", - "origin": "null", - "protocol": "foo:", - "username": "", - "password": "", - "host": "", - "hostname": "", - "port": "", - "pathname": "/", - "search": "", - "hash": "" - }, - { - "input": "http://a:b@c:29/d", - "base": "http://example.org/foo/bar", - "href": "http://a:b@c:29/d", - "origin": "http://c:29", - "protocol": "http:", - "username": "a", - "password": "b", - "host": "c:29", - "hostname": "c", - "port": "29", - "pathname": "/d", - "search": "", - "hash": "" - }, - { - "input": "http::@c:29", - "base": "http://example.org/foo/bar", - "href": "http://example.org/foo/:@c:29", - "origin": "http://example.org", - "protocol": "http:", - "username": "", - "password": "", - "host": "example.org", - "hostname": "example.org", - "port": "", - "pathname": "/foo/:@c:29", - "search": "", - "hash": "" - }, - { - "input": "http://&a:foo(b]c@d:2/", - "base": "http://example.org/foo/bar", - "href": "http://&a:foo(b%5Dc@d:2/", - "origin": "http://d:2", - "protocol": "http:", - "username": "&a", - "password": "foo(b%5Dc", - "host": "d:2", - "hostname": "d", - "port": "2", - "pathname": "/", - "search": "", - "hash": "" - }, - { - "input": "http://::@c@d:2", - "base": "http://example.org/foo/bar", - "href": "http://:%3A%40c@d:2/", - "origin": "http://d:2", - "protocol": "http:", - "username": "", - "password": "%3A%40c", - "host": "d:2", - "hostname": "d", - "port": "2", - "pathname": "/", - "search": "", - "hash": "" - }, - { - "input": "http://foo.com:b@d/", - "base": "http://example.org/foo/bar", - "href": "http://foo.com:b@d/", - "origin": "http://d", - "protocol": "http:", - "username": "foo.com", - "password": "b", - "host": "d", - "hostname": "d", - "port": "", - "pathname": "/", - "search": "", - "hash": "" - }, - { - "input": "http://foo.com/\\@", - "base": "http://example.org/foo/bar", - "href": "http://foo.com//@", - "origin": "http://foo.com", - "protocol": "http:", - "username": "", - "password": "", - "host": "foo.com", - "hostname": "foo.com", - "port": "", - "pathname": "//@", - "search": "", - "hash": "" - }, - { - "input": "http:\\\\foo.com\\", - "base": "http://example.org/foo/bar", - "href": "http://foo.com/", - "origin": "http://foo.com", - "protocol": "http:", - "username": "", - "password": "", - "host": "foo.com", - "hostname": "foo.com", - "port": "", - "pathname": "/", - "search": "", - "hash": "" - }, - { - "input": "http:\\\\a\\b:c\\d@foo.com\\", - "base": "http://example.org/foo/bar", - "href": "http://a/b:c/d@foo.com/", - "origin": "http://a", - "protocol": "http:", - "username": "", - "password": "", - "host": "a", - "hostname": "a", - "port": "", - "pathname": "/b:c/d@foo.com/", - "search": "", - "hash": "" - }, - { - "input": "foo:/", - "base": "http://example.org/foo/bar", - "href": "foo:/", - "origin": "null", - "protocol": "foo:", - "username": "", - "password": "", - "host": "", - "hostname": "", - "port": "", - "pathname": "/", - "search": "", - "hash": "" - }, - { - "input": "foo:/bar.com/", - "base": "http://example.org/foo/bar", - "href": "foo:/bar.com/", - "origin": "null", - "protocol": "foo:", - "username": "", - "password": "", - "host": "", - "hostname": "", - "port": "", - "pathname": "/bar.com/", - "search": "", - "hash": "" - }, - { - "input": "foo://///////", - "base": "http://example.org/foo/bar", - "href": "foo://///////", - "origin": "null", - "protocol": "foo:", - "username": "", - "password": "", - "host": "", - "hostname": "", - "port": "", - "pathname": "///////", - "search": "", - "hash": "" - }, - { - "input": "foo://///////bar.com/", - "base": "http://example.org/foo/bar", - "href": "foo://///////bar.com/", - "origin": "null", - "protocol": "foo:", - "username": "", - "password": "", - "host": "", - "hostname": "", - "port": "", - "pathname": "///////bar.com/", - "search": "", - "hash": "" - }, - { - "input": "foo:////://///", - "base": "http://example.org/foo/bar", - "href": "foo:////://///", - "origin": "null", - "protocol": "foo:", - "username": "", - "password": "", - "host": "", - "hostname": "", - "port": "", - "pathname": "//://///", - "search": "", - "hash": "" - }, - { - "input": "c:/foo", - "base": "http://example.org/foo/bar", - "href": "c:/foo", - "origin": "null", - "protocol": "c:", - "username": "", - "password": "", - "host": "", - "hostname": "", - "port": "", - "pathname": "/foo", - "search": "", - "hash": "" - }, - { - "input": "//foo/bar", - "base": "http://example.org/foo/bar", - "href": "http://foo/bar", - "origin": "http://foo", - "protocol": "http:", - "username": "", - "password": "", - "host": "foo", - "hostname": "foo", - "port": "", - "pathname": "/bar", - "search": "", - "hash": "" - }, - { - "input": "http://foo/path;a??e#f#g", - "base": "http://example.org/foo/bar", - "href": "http://foo/path;a??e#f#g", - "origin": "http://foo", - "protocol": "http:", - "username": "", - "password": "", - "host": "foo", - "hostname": "foo", - "port": "", - "pathname": "/path;a", - "search": "??e", - "hash": "#f#g" - }, - { - "input": "http://foo/abcd?efgh?ijkl", - "base": "http://example.org/foo/bar", - "href": "http://foo/abcd?efgh?ijkl", - "origin": "http://foo", - "protocol": "http:", - "username": "", - "password": "", - "host": "foo", - "hostname": "foo", - "port": "", - "pathname": "/abcd", - "search": "?efgh?ijkl", - "hash": "" - }, - { - "input": "http://foo/abcd#foo?bar", - "base": "http://example.org/foo/bar", - "href": "http://foo/abcd#foo?bar", - "origin": "http://foo", - "protocol": "http:", - "username": "", - "password": "", - "host": "foo", - "hostname": "foo", - "port": "", - "pathname": "/abcd", - "search": "", - "hash": "#foo?bar" - }, - { - "input": "[61:24:74]:98", - "base": "http://example.org/foo/bar", - "href": "http://example.org/foo/[61:24:74]:98", - "origin": "http://example.org", - "protocol": "http:", - "username": "", - "password": "", - "host": "example.org", - "hostname": "example.org", - "port": "", - "pathname": "/foo/[61:24:74]:98", - "search": "", - "hash": "" - }, - { - "input": "http:[61:27]/:foo", - "base": "http://example.org/foo/bar", - "href": "http://example.org/foo/[61:27]/:foo", - "origin": "http://example.org", - "protocol": "http:", - "username": "", - "password": "", - "host": "example.org", - "hostname": "example.org", - "port": "", - "pathname": "/foo/[61:27]/:foo", - "search": "", - "hash": "" - }, - { - "input": "http://[1::2]:3:4", - "base": "http://example.org/foo/bar", - "failure": true - }, - { - "input": "http://2001::1", - "base": "http://example.org/foo/bar", - "failure": true - }, - { - "input": "http://2001::1]", - "base": "http://example.org/foo/bar", - "failure": true - }, - { - "input": "http://2001::1]:80", - "base": "http://example.org/foo/bar", - "failure": true - }, - { - "input": "http://[2001::1]", - "base": "http://example.org/foo/bar", - "href": "http://[2001::1]/", - "origin": "http://[2001::1]", - "protocol": "http:", - "username": "", - "password": "", - "host": "[2001::1]", - "hostname": "[2001::1]", - "port": "", - "pathname": "/", - "search": "", - "hash": "" - }, - { - "input": "http://[2001::1]:80", - "base": "http://example.org/foo/bar", - "href": "http://[2001::1]/", - "origin": "http://[2001::1]", - "protocol": "http:", - "username": "", - "password": "", - "host": "[2001::1]", - "hostname": "[2001::1]", - "port": "", - "pathname": "/", - "search": "", - "hash": "" - }, - { - "input": "http:/example.com/", - "base": "http://example.org/foo/bar", - "href": "http://example.org/example.com/", - "origin": "http://example.org", - "protocol": "http:", - "username": "", - "password": "", - "host": "example.org", - "hostname": "example.org", - "port": "", - "pathname": "/example.com/", - "search": "", - "hash": "" - }, - { - "input": "ftp:/example.com/", - "base": "http://example.org/foo/bar", - "href": "ftp://example.com/", - "origin": "ftp://example.com", - "protocol": "ftp:", - "username": "", - "password": "", - "host": "example.com", - "hostname": "example.com", - "port": "", - "pathname": "/", - "search": "", - "hash": "" - }, - { - "input": "https:/example.com/", - "base": "http://example.org/foo/bar", - "href": "https://example.com/", - "origin": "https://example.com", - "protocol": "https:", - "username": "", - "password": "", - "host": "example.com", - "hostname": "example.com", - "port": "", - "pathname": "/", - "search": "", - "hash": "" - }, - { - "input": "madeupscheme:/example.com/", - "base": "http://example.org/foo/bar", - "href": "madeupscheme:/example.com/", - "origin": "null", - "protocol": "madeupscheme:", - "username": "", - "password": "", - "host": "", - "hostname": "", - "port": "", - "pathname": "/example.com/", - "search": "", - "hash": "" - }, - { - "input": "file:/example.com/", - "base": "http://example.org/foo/bar", - "href": "file:///example.com/", - "protocol": "file:", - "username": "", - "password": "", - "host": "", - "hostname": "", - "port": "", - "pathname": "/example.com/", - "search": "", - "hash": "" - }, - { - "input": "ftps:/example.com/", - "base": "http://example.org/foo/bar", - "href": "ftps:/example.com/", - "origin": "null", - "protocol": "ftps:", - "username": "", - "password": "", - "host": "", - "hostname": "", - "port": "", - "pathname": "/example.com/", - "search": "", - "hash": "" - }, - { - "input": "gopher:/example.com/", - "base": "http://example.org/foo/bar", - "href": "gopher://example.com/", - "origin": "gopher://example.com", - "protocol": "gopher:", - "username": "", - "password": "", - "host": "example.com", - "hostname": "example.com", - "port": "", - "pathname": "/", - "search": "", - "hash": "" - }, - { - "input": "ws:/example.com/", - "base": "http://example.org/foo/bar", - "href": "ws://example.com/", - "origin": "ws://example.com", - "protocol": "ws:", - "username": "", - "password": "", - "host": "example.com", - "hostname": "example.com", - "port": "", - "pathname": "/", - "search": "", - "hash": "" - }, - { - "input": "wss:/example.com/", - "base": "http://example.org/foo/bar", - "href": "wss://example.com/", - "origin": "wss://example.com", - "protocol": "wss:", - "username": "", - "password": "", - "host": "example.com", - "hostname": "example.com", - "port": "", - "pathname": "/", - "search": "", - "hash": "" - }, - { - "input": "data:/example.com/", - "base": "http://example.org/foo/bar", - "href": "data:/example.com/", - "origin": "null", - "protocol": "data:", - "username": "", - "password": "", - "host": "", - "hostname": "", - "port": "", - "pathname": "/example.com/", - "search": "", - "hash": "" - }, - { - "input": "javascript:/example.com/", - "base": "http://example.org/foo/bar", - "href": "javascript:/example.com/", - "origin": "null", - "protocol": "javascript:", - "username": "", - "password": "", - "host": "", - "hostname": "", - "port": "", - "pathname": "/example.com/", - "search": "", - "hash": "" - }, - { - "input": "mailto:/example.com/", - "base": "http://example.org/foo/bar", - "href": "mailto:/example.com/", - "origin": "null", - "protocol": "mailto:", - "username": "", - "password": "", - "host": "", - "hostname": "", - "port": "", - "pathname": "/example.com/", - "search": "", - "hash": "" - }, - { - "input": "http:example.com/", - "base": "http://example.org/foo/bar", - "href": "http://example.org/foo/example.com/", - "origin": "http://example.org", - "protocol": "http:", - "username": "", - "password": "", - "host": "example.org", - "hostname": "example.org", - "port": "", - "pathname": "/foo/example.com/", - "search": "", - "hash": "" - }, - { - "input": "ftp:example.com/", - "base": "http://example.org/foo/bar", - "href": "ftp://example.com/", - "origin": "ftp://example.com", - "protocol": "ftp:", - "username": "", - "password": "", - "host": "example.com", - "hostname": "example.com", - "port": "", - "pathname": "/", - "search": "", - "hash": "" - }, - { - "input": "https:example.com/", - "base": "http://example.org/foo/bar", - "href": "https://example.com/", - "origin": "https://example.com", - "protocol": "https:", - "username": "", - "password": "", - "host": "example.com", - "hostname": "example.com", - "port": "", - "pathname": "/", - "search": "", - "hash": "" - }, - { - "input": "madeupscheme:example.com/", - "base": "http://example.org/foo/bar", - "href": "madeupscheme:example.com/", - "origin": "null", - "protocol": "madeupscheme:", - "username": "", - "password": "", - "host": "", - "hostname": "", - "port": "", - "pathname": "example.com/", - "search": "", - "hash": "" - }, - { - "input": "ftps:example.com/", - "base": "http://example.org/foo/bar", - "href": "ftps:example.com/", - "origin": "null", - "protocol": "ftps:", - "username": "", - "password": "", - "host": "", - "hostname": "", - "port": "", - "pathname": "example.com/", - "search": "", - "hash": "" - }, - { - "input": "gopher:example.com/", - "base": "http://example.org/foo/bar", - "href": "gopher://example.com/", - "origin": "gopher://example.com", - "protocol": "gopher:", - "username": "", - "password": "", - "host": "example.com", - "hostname": "example.com", - "port": "", - "pathname": "/", - "search": "", - "hash": "" - }, - { - "input": "ws:example.com/", - "base": "http://example.org/foo/bar", - "href": "ws://example.com/", - "origin": "ws://example.com", - "protocol": "ws:", - "username": "", - "password": "", - "host": "example.com", - "hostname": "example.com", - "port": "", - "pathname": "/", - "search": "", - "hash": "" - }, - { - "input": "wss:example.com/", - "base": "http://example.org/foo/bar", - "href": "wss://example.com/", - "origin": "wss://example.com", - "protocol": "wss:", - "username": "", - "password": "", - "host": "example.com", - "hostname": "example.com", - "port": "", - "pathname": "/", - "search": "", - "hash": "" - }, - { - "input": "data:example.com/", - "base": "http://example.org/foo/bar", - "href": "data:example.com/", - "origin": "null", - "protocol": "data:", - "username": "", - "password": "", - "host": "", - "hostname": "", - "port": "", - "pathname": "example.com/", - "search": "", - "hash": "" - }, - { - "input": "javascript:example.com/", - "base": "http://example.org/foo/bar", - "href": "javascript:example.com/", - "origin": "null", - "protocol": "javascript:", - "username": "", - "password": "", - "host": "", - "hostname": "", - "port": "", - "pathname": "example.com/", - "search": "", - "hash": "" - }, - { - "input": "mailto:example.com/", - "base": "http://example.org/foo/bar", - "href": "mailto:example.com/", - "origin": "null", - "protocol": "mailto:", - "username": "", - "password": "", - "host": "", - "hostname": "", - "port": "", - "pathname": "example.com/", - "search": "", - "hash": "" - }, - { - "input": "/a/b/c", - "base": "http://example.org/foo/bar", - "href": "http://example.org/a/b/c", - "origin": "http://example.org", - "protocol": "http:", - "username": "", - "password": "", - "host": "example.org", - "hostname": "example.org", - "port": "", - "pathname": "/a/b/c", - "search": "", - "hash": "" - }, - { - "input": "/a/ /c", - "base": "http://example.org/foo/bar", - "href": "http://example.org/a/%20/c", - "origin": "http://example.org", - "protocol": "http:", - "username": "", - "password": "", - "host": "example.org", - "hostname": "example.org", - "port": "", - "pathname": "/a/%20/c", - "search": "", - "hash": "" - }, - { - "input": "/a%2fc", - "base": "http://example.org/foo/bar", - "href": "http://example.org/a%2fc", - "origin": "http://example.org", - "protocol": "http:", - "username": "", - "password": "", - "host": "example.org", - "hostname": "example.org", - "port": "", - "pathname": "/a%2fc", - "search": "", - "hash": "" - }, - { - "input": "/a/%2f/c", - "base": "http://example.org/foo/bar", - "href": "http://example.org/a/%2f/c", - "origin": "http://example.org", - "protocol": "http:", - "username": "", - "password": "", - "host": "example.org", - "hostname": "example.org", - "port": "", - "pathname": "/a/%2f/c", - "search": "", - "hash": "" - }, - { - "input": "#β", - "base": "http://example.org/foo/bar", - "href": "http://example.org/foo/bar#β", - "origin": "http://example.org", - "protocol": "http:", - "username": "", - "password": "", - "host": "example.org", - "hostname": "example.org", - "port": "", - "pathname": "/foo/bar", - "search": "", - "hash": "#β" - }, - { - "input": "data:text/html,test#test", - "base": "http://example.org/foo/bar", - "href": "data:text/html,test#test", - "origin": "null", - "protocol": "data:", - "username": "", - "password": "", - "host": "", - "hostname": "", - "port": "", - "pathname": "text/html,test", - "search": "", - "hash": "#test" - }, - "# Based on http://trac.webkit.org/browser/trunk/LayoutTests/fast/url/file.html", - { - "input": "file:c:\\foo\\bar.html", - "base": "file:///tmp/mock/path", - "href": "file:///c:/foo/bar.html", - "protocol": "file:", - "username": "", - "password": "", - "host": "", - "hostname": "", - "port": "", - "pathname": "/c:/foo/bar.html", - "search": "", - "hash": "" - }, - { - "input": " File:c|////foo\\bar.html", - "base": "file:///tmp/mock/path", - "href": "file:///c:////foo/bar.html", - "protocol": "file:", - "username": "", - "password": "", - "host": "", - "hostname": "", - "port": "", - "pathname": "/c:////foo/bar.html", - "search": "", - "hash": "" - }, - { - "input": "C|/foo/bar", - "base": "file:///tmp/mock/path", - "href": "file:///C:/foo/bar", - "protocol": "file:", - "username": "", - "password": "", - "host": "", - "hostname": "", - "port": "", - "pathname": "/C:/foo/bar", - "search": "", - "hash": "" - }, - { - "input": "/C|\\foo\\bar", - "base": "file:///tmp/mock/path", - "href": "file:///C:/foo/bar", - "protocol": "file:", - "username": "", - "password": "", - "host": "", - "hostname": "", - "port": "", - "pathname": "/C:/foo/bar", - "search": "", - "hash": "" - }, - { - "input": "//C|/foo/bar", - "base": "file:///tmp/mock/path", - "href": "file:///C:/foo/bar", - "protocol": "file:", - "username": "", - "password": "", - "host": "", - "hostname": "", - "port": "", - "pathname": "/C:/foo/bar", - "search": "", - "hash": "" - }, - { - "input": "//server/file", - "base": "file:///tmp/mock/path", - "href": "file://server/file", - "protocol": "file:", - "username": "", - "password": "", - "host": "server", - "hostname": "server", - "port": "", - "pathname": "/file", - "search": "", - "hash": "" - }, - { - "input": "\\\\server\\file", - "base": "file:///tmp/mock/path", - "href": "file://server/file", - "protocol": "file:", - "username": "", - "password": "", - "host": "server", - "hostname": "server", - "port": "", - "pathname": "/file", - "search": "", - "hash": "" - }, - { - "input": "/\\server/file", - "base": "file:///tmp/mock/path", - "href": "file://server/file", - "protocol": "file:", - "username": "", - "password": "", - "host": "server", - "hostname": "server", - "port": "", - "pathname": "/file", - "search": "", - "hash": "" - }, - { - "input": "file:///foo/bar.txt", - "base": "file:///tmp/mock/path", - "href": "file:///foo/bar.txt", - "protocol": "file:", - "username": "", - "password": "", - "host": "", - "hostname": "", - "port": "", - "pathname": "/foo/bar.txt", - "search": "", - "hash": "" - }, - { - "input": "file:///home/me", - "base": "file:///tmp/mock/path", - "href": "file:///home/me", - "protocol": "file:", - "username": "", - "password": "", - "host": "", - "hostname": "", - "port": "", - "pathname": "/home/me", - "search": "", - "hash": "" - }, - { - "input": "//", - "base": "file:///tmp/mock/path", - "href": "file:///", - "protocol": "file:", - "username": "", - "password": "", - "host": "", - "hostname": "", - "port": "", - "pathname": "/", - "search": "", - "hash": "" - }, - { - "input": "///", - "base": "file:///tmp/mock/path", - "href": "file:///", - "protocol": "file:", - "username": "", - "password": "", - "host": "", - "hostname": "", - "port": "", - "pathname": "/", - "search": "", - "hash": "" - }, - { - "input": "///test", - "base": "file:///tmp/mock/path", - "href": "file:///test", - "protocol": "file:", - "username": "", - "password": "", - "host": "", - "hostname": "", - "port": "", - "pathname": "/test", - "search": "", - "hash": "" - }, - { - "input": "file://test", - "base": "file:///tmp/mock/path", - "href": "file://test/", - "protocol": "file:", - "username": "", - "password": "", - "host": "test", - "hostname": "test", - "port": "", - "pathname": "/", - "search": "", - "hash": "" - }, - { - "input": "file://localhost", - "base": "file:///tmp/mock/path", - "href": "file:///", - "protocol": "file:", - "username": "", - "password": "", - "host": "", - "hostname": "", - "port": "", - "pathname": "/", - "search": "", - "hash": "" - }, - { - "input": "file://localhost/", - "base": "file:///tmp/mock/path", - "href": "file:///", - "protocol": "file:", - "username": "", - "password": "", - "host": "", - "hostname": "", - "port": "", - "pathname": "/", - "search": "", - "hash": "" - }, - { - "input": "file://localhost/test", - "base": "file:///tmp/mock/path", - "href": "file:///test", - "protocol": "file:", - "username": "", - "password": "", - "host": "", - "hostname": "", - "port": "", - "pathname": "/test", - "search": "", - "hash": "" - }, - { - "input": "test", - "base": "file:///tmp/mock/path", - "href": "file:///tmp/mock/test", - "protocol": "file:", - "username": "", - "password": "", - "host": "", - "hostname": "", - "port": "", - "pathname": "/tmp/mock/test", - "search": "", - "hash": "" - }, - { - "input": "file:test", - "base": "file:///tmp/mock/path", - "href": "file:///tmp/mock/test", - "protocol": "file:", - "username": "", - "password": "", - "host": "", - "hostname": "", - "port": "", - "pathname": "/tmp/mock/test", - "search": "", - "hash": "" - }, - "# Based on http://trac.webkit.org/browser/trunk/LayoutTests/fast/url/script-tests/path.js", - { - "input": "http://example.com/././foo", - "base": "about:blank", - "href": "http://example.com/foo", - "origin": "http://example.com", - "protocol": "http:", - "username": "", - "password": "", - "host": "example.com", - "hostname": "example.com", - "port": "", - "pathname": "/foo", - "search": "", - "hash": "" - }, - { - "input": "http://example.com/./.foo", - "base": "about:blank", - "href": "http://example.com/.foo", - "origin": "http://example.com", - "protocol": "http:", - "username": "", - "password": "", - "host": "example.com", - "hostname": "example.com", - "port": "", - "pathname": "/.foo", - "search": "", - "hash": "" - }, - { - "input": "http://example.com/foo/.", - "base": "about:blank", - "href": "http://example.com/foo/", - "origin": "http://example.com", - "protocol": "http:", - "username": "", - "password": "", - "host": "example.com", - "hostname": "example.com", - "port": "", - "pathname": "/foo/", - "search": "", - "hash": "" - }, - { - "input": "http://example.com/foo/./", - "base": "about:blank", - "href": "http://example.com/foo/", - "origin": "http://example.com", - "protocol": "http:", - "username": "", - "password": "", - "host": "example.com", - "hostname": "example.com", - "port": "", - "pathname": "/foo/", - "search": "", - "hash": "" - }, - { - "input": "http://example.com/foo/bar/..", - "base": "about:blank", - "href": "http://example.com/foo/", - "origin": "http://example.com", - "protocol": "http:", - "username": "", - "password": "", - "host": "example.com", - "hostname": "example.com", - "port": "", - "pathname": "/foo/", - "search": "", - "hash": "" - }, - { - "input": "http://example.com/foo/bar/../", - "base": "about:blank", - "href": "http://example.com/foo/", - "origin": "http://example.com", - "protocol": "http:", - "username": "", - "password": "", - "host": "example.com", - "hostname": "example.com", - "port": "", - "pathname": "/foo/", - "search": "", - "hash": "" - }, - { - "input": "http://example.com/foo/..bar", - "base": "about:blank", - "href": "http://example.com/foo/..bar", - "origin": "http://example.com", - "protocol": "http:", - "username": "", - "password": "", - "host": "example.com", - "hostname": "example.com", - "port": "", - "pathname": "/foo/..bar", - "search": "", - "hash": "" - }, - { - "input": "http://example.com/foo/bar/../ton", - "base": "about:blank", - "href": "http://example.com/foo/ton", - "origin": "http://example.com", - "protocol": "http:", - "username": "", - "password": "", - "host": "example.com", - "hostname": "example.com", - "port": "", - "pathname": "/foo/ton", - "search": "", - "hash": "" - }, - { - "input": "http://example.com/foo/bar/../ton/../../a", - "base": "about:blank", - "href": "http://example.com/a", - "origin": "http://example.com", - "protocol": "http:", - "username": "", - "password": "", - "host": "example.com", - "hostname": "example.com", - "port": "", - "pathname": "/a", - "search": "", - "hash": "" - }, - { - "input": "http://example.com/foo/../../..", - "base": "about:blank", - "href": "http://example.com/", - "origin": "http://example.com", - "protocol": "http:", - "username": "", - "password": "", - "host": "example.com", - "hostname": "example.com", - "port": "", - "pathname": "/", - "search": "", - "hash": "" - }, - { - "input": "http://example.com/foo/../../../ton", - "base": "about:blank", - "href": "http://example.com/ton", - "origin": "http://example.com", - "protocol": "http:", - "username": "", - "password": "", - "host": "example.com", - "hostname": "example.com", - "port": "", - "pathname": "/ton", - "search": "", - "hash": "" - }, - { - "input": "http://example.com/foo/%2e", - "base": "about:blank", - "href": "http://example.com/foo/", - "origin": "http://example.com", - "protocol": "http:", - "username": "", - "password": "", - "host": "example.com", - "hostname": "example.com", - "port": "", - "pathname": "/foo/", - "search": "", - "hash": "" - }, - { - "input": "http://example.com/foo/%2e%2", - "base": "about:blank", - "href": "http://example.com/foo/.%2", - "origin": "http://example.com", - "protocol": "http:", - "username": "", - "password": "", - "host": "example.com", - "hostname": "example.com", - "port": "", - "pathname": "/foo/.%2", - "search": "", - "hash": "" - }, - { - "input": "http://example.com/foo/%2e./%2e%2e/.%2e/%2e.bar", - "base": "about:blank", - "href": "http://example.com/..bar", - "origin": "http://example.com", - "protocol": "http:", - "username": "", - "password": "", - "host": "example.com", - "hostname": "example.com", - "port": "", - "pathname": "/..bar", - "search": "", - "hash": "" - }, - { - "input": "http://example.com////../..", - "base": "about:blank", - "href": "http://example.com//", - "origin": "http://example.com", - "protocol": "http:", - "username": "", - "password": "", - "host": "example.com", - "hostname": "example.com", - "port": "", - "pathname": "//", - "search": "", - "hash": "" - }, - { - "input": "http://example.com/foo/bar//../..", - "base": "about:blank", - "href": "http://example.com/foo/", - "origin": "http://example.com", - "protocol": "http:", - "username": "", - "password": "", - "host": "example.com", - "hostname": "example.com", - "port": "", - "pathname": "/foo/", - "search": "", - "hash": "" - }, - { - "input": "http://example.com/foo/bar//..", - "base": "about:blank", - "href": "http://example.com/foo/bar/", - "origin": "http://example.com", - "protocol": "http:", - "username": "", - "password": "", - "host": "example.com", - "hostname": "example.com", - "port": "", - "pathname": "/foo/bar/", - "search": "", - "hash": "" - }, - { - "input": "http://example.com/foo", - "base": "about:blank", - "href": "http://example.com/foo", - "origin": "http://example.com", - "protocol": "http:", - "username": "", - "password": "", - "host": "example.com", - "hostname": "example.com", - "port": "", - "pathname": "/foo", - "search": "", - "hash": "" - }, - { - "input": "http://example.com/%20foo", - "base": "about:blank", - "href": "http://example.com/%20foo", - "origin": "http://example.com", - "protocol": "http:", - "username": "", - "password": "", - "host": "example.com", - "hostname": "example.com", - "port": "", - "pathname": "/%20foo", - "search": "", - "hash": "" - }, - { - "input": "http://example.com/foo%", - "base": "about:blank", - "href": "http://example.com/foo%", - "origin": "http://example.com", - "protocol": "http:", - "username": "", - "password": "", - "host": "example.com", - "hostname": "example.com", - "port": "", - "pathname": "/foo%", - "search": "", - "hash": "" - }, - { - "input": "http://example.com/foo%2", - "base": "about:blank", - "href": "http://example.com/foo%2", - "origin": "http://example.com", - "protocol": "http:", - "username": "", - "password": "", - "host": "example.com", - "hostname": "example.com", - "port": "", - "pathname": "/foo%2", - "search": "", - "hash": "" - }, - { - "input": "http://example.com/foo%2zbar", - "base": "about:blank", - "href": "http://example.com/foo%2zbar", - "origin": "http://example.com", - "protocol": "http:", - "username": "", - "password": "", - "host": "example.com", - "hostname": "example.com", - "port": "", - "pathname": "/foo%2zbar", - "search": "", - "hash": "" - }, - { - "input": "http://example.com/foo%2©zbar", - "base": "about:blank", - "href": "http://example.com/foo%2%C3%82%C2%A9zbar", - "origin": "http://example.com", - "protocol": "http:", - "username": "", - "password": "", - "host": "example.com", - "hostname": "example.com", - "port": "", - "pathname": "/foo%2%C3%82%C2%A9zbar", - "search": "", - "hash": "" - }, - { - "input": "http://example.com/foo%41%7a", - "base": "about:blank", - "href": "http://example.com/foo%41%7a", - "origin": "http://example.com", - "protocol": "http:", - "username": "", - "password": "", - "host": "example.com", - "hostname": "example.com", - "port": "", - "pathname": "/foo%41%7a", - "search": "", - "hash": "" - }, - { - "input": "http://example.com/foo\t\u0091%91", - "base": "about:blank", - "href": "http://example.com/foo%C2%91%91", - "origin": "http://example.com", - "protocol": "http:", - "username": "", - "password": "", - "host": "example.com", - "hostname": "example.com", - "port": "", - "pathname": "/foo%C2%91%91", - "search": "", - "hash": "" - }, - { - "input": "http://example.com/foo%00%51", - "base": "about:blank", - "href": "http://example.com/foo%00%51", - "origin": "http://example.com", - "protocol": "http:", - "username": "", - "password": "", - "host": "example.com", - "hostname": "example.com", - "port": "", - "pathname": "/foo%00%51", - "search": "", - "hash": "" - }, - { - "input": "http://example.com/(%28:%3A%29)", - "base": "about:blank", - "href": "http://example.com/(%28:%3A%29)", - "origin": "http://example.com", - "protocol": "http:", - "username": "", - "password": "", - "host": "example.com", - "hostname": "example.com", - "port": "", - "pathname": "/(%28:%3A%29)", - "search": "", - "hash": "" - }, - { - "input": "http://example.com/%3A%3a%3C%3c", - "base": "about:blank", - "href": "http://example.com/%3A%3a%3C%3c", - "origin": "http://example.com", - "protocol": "http:", - "username": "", - "password": "", - "host": "example.com", - "hostname": "example.com", - "port": "", - "pathname": "/%3A%3a%3C%3c", - "search": "", - "hash": "" - }, - { - "input": "http://example.com/foo\tbar", - "base": "about:blank", - "href": "http://example.com/foobar", - "origin": "http://example.com", - "protocol": "http:", - "username": "", - "password": "", - "host": "example.com", - "hostname": "example.com", - "port": "", - "pathname": "/foobar", - "search": "", - "hash": "" - }, - { - "input": "http://example.com\\\\foo\\\\bar", - "base": "about:blank", - "href": "http://example.com//foo//bar", - "origin": "http://example.com", - "protocol": "http:", - "username": "", - "password": "", - "host": "example.com", - "hostname": "example.com", - "port": "", - "pathname": "//foo//bar", - "search": "", - "hash": "" - }, - { - "input": "http://example.com/%7Ffp3%3Eju%3Dduvgw%3Dd", - "base": "about:blank", - "href": "http://example.com/%7Ffp3%3Eju%3Dduvgw%3Dd", - "origin": "http://example.com", - "protocol": "http:", - "username": "", - "password": "", - "host": "example.com", - "hostname": "example.com", - "port": "", - "pathname": "/%7Ffp3%3Eju%3Dduvgw%3Dd", - "search": "", - "hash": "" - }, - { - "input": "http://example.com/@asdf%40", - "base": "about:blank", - "href": "http://example.com/@asdf%40", - "origin": "http://example.com", - "protocol": "http:", - "username": "", - "password": "", - "host": "example.com", - "hostname": "example.com", - "port": "", - "pathname": "/@asdf%40", - "search": "", - "hash": "" - }, - { - "input": "http://example.com/你好你好", - "base": "about:blank", - "href": "http://example.com/%E4%BD%A0%E5%A5%BD%E4%BD%A0%E5%A5%BD", - "origin": "http://example.com", - "protocol": "http:", - "username": "", - "password": "", - "host": "example.com", - "hostname": "example.com", - "port": "", - "pathname": "/%E4%BD%A0%E5%A5%BD%E4%BD%A0%E5%A5%BD", - "search": "", - "hash": "" - }, - { - "input": "http://example.com/‥/foo", - "base": "about:blank", - "href": "http://example.com/%E2%80%A5/foo", - "origin": "http://example.com", - "protocol": "http:", - "username": "", - "password": "", - "host": "example.com", - "hostname": "example.com", - "port": "", - "pathname": "/%E2%80%A5/foo", - "search": "", - "hash": "" - }, - { - "input": "http://example.com//foo", - "base": "about:blank", - "href": "http://example.com/%EF%BB%BF/foo", - "origin": "http://example.com", - "protocol": "http:", - "username": "", - "password": "", - "host": "example.com", - "hostname": "example.com", - "port": "", - "pathname": "/%EF%BB%BF/foo", - "search": "", - "hash": "" - }, - { - "input": "http://example.com//foo//bar", - "base": "about:blank", - "href": "http://example.com/%E2%80%AE/foo/%E2%80%AD/bar", - "origin": "http://example.com", - "protocol": "http:", - "username": "", - "password": "", - "host": "example.com", - "hostname": "example.com", - "port": "", - "pathname": "/%E2%80%AE/foo/%E2%80%AD/bar", - "search": "", - "hash": "" - }, - "# Based on http://trac.webkit.org/browser/trunk/LayoutTests/fast/url/script-tests/relative.js", - { - "input": "http://www.google.com/foo?bar=baz#", - "base": "about:blank", - "href": "http://www.google.com/foo?bar=baz#", - "origin": "http://www.google.com", - "protocol": "http:", - "username": "", - "password": "", - "host": "www.google.com", - "hostname": "www.google.com", - "port": "", - "pathname": "/foo", - "search": "?bar=baz", - "hash": "" - }, - { - "input": "http://www.google.com/foo?bar=baz# »", - "base": "about:blank", - "href": "http://www.google.com/foo?bar=baz# »", - "origin": "http://www.google.com", - "protocol": "http:", - "username": "", - "password": "", - "host": "www.google.com", - "hostname": "www.google.com", - "port": "", - "pathname": "/foo", - "search": "?bar=baz", - "hash": "# »" - }, - { - "input": "data:test# »", - "base": "about:blank", - "href": "data:test# »", - "origin": "null", - "protocol": "data:", - "username": "", - "password": "", - "host": "", - "hostname": "", - "port": "", - "pathname": "test", - "search": "", - "hash": "# »" - }, - { - "input": "http://[www.google.com]/", - "base": "about:blank", - "failure": true - }, - { - "input": "http://www.google.com", - "base": "about:blank", - "href": "http://www.google.com/", - "origin": "http://www.google.com", - "protocol": "http:", - "username": "", - "password": "", - "host": "www.google.com", - "hostname": "www.google.com", - "port": "", - "pathname": "/", - "search": "", - "hash": "" - }, - { - "input": "http://192.0x00A80001", - "base": "about:blank", - "href": "http://192.168.0.1/", - "origin": "http://192.168.0.1", - "protocol": "http:", - "username": "", - "password": "", - "host": "192.168.0.1", - "hostname": "192.168.0.1", - "port": "", - "pathname": "/", - "search": "", - "hash": "" - }, - { - "input": "http://www/foo%2Ehtml", - "base": "about:blank", - "href": "http://www/foo.html", - "origin": "http://www", - "protocol": "http:", - "username": "", - "password": "", - "host": "www", - "hostname": "www", - "port": "", - "pathname": "/foo.html", - "search": "", - "hash": "" - }, - { - "input": "http://www/foo/%2E/html", - "base": "about:blank", - "href": "http://www/foo/html", - "origin": "http://www", - "protocol": "http:", - "username": "", - "password": "", - "host": "www", - "hostname": "www", - "port": "", - "pathname": "/foo/html", - "search": "", - "hash": "" - }, - { - "input": "http://user:pass@/", - "base": "about:blank", - "failure": true - }, - { - "input": "http://%25DOMAIN:foobar@foodomain.com/", - "base": "about:blank", - "href": "http://%25DOMAIN:foobar@foodomain.com/", - "origin": "http://foodomain.com", - "protocol": "http:", - "username": "%25DOMAIN", - "password": "foobar", - "host": "foodomain.com", - "hostname": "foodomain.com", - "port": "", - "pathname": "/", - "search": "", - "hash": "" - }, - { - "input": "http:\\\\www.google.com\\foo", - "base": "about:blank", - "href": "http://www.google.com/foo", - "origin": "http://www.google.com", - "protocol": "http:", - "username": "", - "password": "", - "host": "www.google.com", - "hostname": "www.google.com", - "port": "", - "pathname": "/foo", - "search": "", - "hash": "" - }, - { - "input": "http://foo:80/", - "base": "about:blank", - "href": "http://foo/", - "origin": "http://foo", - "protocol": "http:", - "username": "", - "password": "", - "host": "foo", - "hostname": "foo", - "port": "", - "pathname": "/", - "search": "", - "hash": "" - }, - { - "input": "http://foo:81/", - "base": "about:blank", - "href": "http://foo:81/", - "origin": "http://foo:81", - "protocol": "http:", - "username": "", - "password": "", - "host": "foo:81", - "hostname": "foo", - "port": "81", - "pathname": "/", - "search": "", - "hash": "" - }, - { - "input": "httpa://foo:80/", - "base": "about:blank", - "href": "httpa://foo:80/", - "origin": "null", - "protocol": "httpa:", - "username": "", - "password": "", - "host": "foo:80", - "hostname": "foo", - "port": "80", - "pathname": "/", - "search": "", - "hash": "" - }, - { - "input": "http://foo:-80/", - "base": "about:blank", - "failure": true - }, - { - "input": "https://foo:443/", - "base": "about:blank", - "href": "https://foo/", - "origin": "https://foo", - "protocol": "https:", - "username": "", - "password": "", - "host": "foo", - "hostname": "foo", - "port": "", - "pathname": "/", - "search": "", - "hash": "" - }, - { - "input": "https://foo:80/", - "base": "about:blank", - "href": "https://foo:80/", - "origin": "https://foo:80", - "protocol": "https:", - "username": "", - "password": "", - "host": "foo:80", - "hostname": "foo", - "port": "80", - "pathname": "/", - "search": "", - "hash": "" - }, - { - "input": "ftp://foo:21/", - "base": "about:blank", - "href": "ftp://foo/", - "origin": "ftp://foo", - "protocol": "ftp:", - "username": "", - "password": "", - "host": "foo", - "hostname": "foo", - "port": "", - "pathname": "/", - "search": "", - "hash": "" - }, - { - "input": "ftp://foo:80/", - "base": "about:blank", - "href": "ftp://foo:80/", - "origin": "ftp://foo:80", - "protocol": "ftp:", - "username": "", - "password": "", - "host": "foo:80", - "hostname": "foo", - "port": "80", - "pathname": "/", - "search": "", - "hash": "" - }, - { - "input": "gopher://foo:70/", - "base": "about:blank", - "href": "gopher://foo/", - "origin": "gopher://foo", - "protocol": "gopher:", - "username": "", - "password": "", - "host": "foo", - "hostname": "foo", - "port": "", - "pathname": "/", - "search": "", - "hash": "" - }, - { - "input": "gopher://foo:443/", - "base": "about:blank", - "href": "gopher://foo:443/", - "origin": "gopher://foo:443", - "protocol": "gopher:", - "username": "", - "password": "", - "host": "foo:443", - "hostname": "foo", - "port": "443", - "pathname": "/", - "search": "", - "hash": "" - }, - { - "input": "ws://foo:80/", - "base": "about:blank", - "href": "ws://foo/", - "origin": "ws://foo", - "protocol": "ws:", - "username": "", - "password": "", - "host": "foo", - "hostname": "foo", - "port": "", - "pathname": "/", - "search": "", - "hash": "" - }, - { - "input": "ws://foo:81/", - "base": "about:blank", - "href": "ws://foo:81/", - "origin": "ws://foo:81", - "protocol": "ws:", - "username": "", - "password": "", - "host": "foo:81", - "hostname": "foo", - "port": "81", - "pathname": "/", - "search": "", - "hash": "" - }, - { - "input": "ws://foo:443/", - "base": "about:blank", - "href": "ws://foo:443/", - "origin": "ws://foo:443", - "protocol": "ws:", - "username": "", - "password": "", - "host": "foo:443", - "hostname": "foo", - "port": "443", - "pathname": "/", - "search": "", - "hash": "" - }, - { - "input": "ws://foo:815/", - "base": "about:blank", - "href": "ws://foo:815/", - "origin": "ws://foo:815", - "protocol": "ws:", - "username": "", - "password": "", - "host": "foo:815", - "hostname": "foo", - "port": "815", - "pathname": "/", - "search": "", - "hash": "" - }, - { - "input": "wss://foo:80/", - "base": "about:blank", - "href": "wss://foo:80/", - "origin": "wss://foo:80", - "protocol": "wss:", - "username": "", - "password": "", - "host": "foo:80", - "hostname": "foo", - "port": "80", - "pathname": "/", - "search": "", - "hash": "" - }, - { - "input": "wss://foo:81/", - "base": "about:blank", - "href": "wss://foo:81/", - "origin": "wss://foo:81", - "protocol": "wss:", - "username": "", - "password": "", - "host": "foo:81", - "hostname": "foo", - "port": "81", - "pathname": "/", - "search": "", - "hash": "" - }, - { - "input": "wss://foo:443/", - "base": "about:blank", - "href": "wss://foo/", - "origin": "wss://foo", - "protocol": "wss:", - "username": "", - "password": "", - "host": "foo", - "hostname": "foo", - "port": "", - "pathname": "/", - "search": "", - "hash": "" - }, - { - "input": "wss://foo:815/", - "base": "about:blank", - "href": "wss://foo:815/", - "origin": "wss://foo:815", - "protocol": "wss:", - "username": "", - "password": "", - "host": "foo:815", - "hostname": "foo", - "port": "815", - "pathname": "/", - "search": "", - "hash": "" - }, - { - "input": "http:/example.com/", - "base": "about:blank", - "href": "http://example.com/", - "origin": "http://example.com", - "protocol": "http:", - "username": "", - "password": "", - "host": "example.com", - "hostname": "example.com", - "port": "", - "pathname": "/", - "search": "", - "hash": "" - }, - { - "input": "ftp:/example.com/", - "base": "about:blank", - "href": "ftp://example.com/", - "origin": "ftp://example.com", - "protocol": "ftp:", - "username": "", - "password": "", - "host": "example.com", - "hostname": "example.com", - "port": "", - "pathname": "/", - "search": "", - "hash": "" - }, - { - "input": "https:/example.com/", - "base": "about:blank", - "href": "https://example.com/", - "origin": "https://example.com", - "protocol": "https:", - "username": "", - "password": "", - "host": "example.com", - "hostname": "example.com", - "port": "", - "pathname": "/", - "search": "", - "hash": "" - }, - { - "input": "madeupscheme:/example.com/", - "base": "about:blank", - "href": "madeupscheme:/example.com/", - "origin": "null", - "protocol": "madeupscheme:", - "username": "", - "password": "", - "host": "", - "hostname": "", - "port": "", - "pathname": "/example.com/", - "search": "", - "hash": "" - }, - { - "input": "file:/example.com/", - "base": "about:blank", - "href": "file:///example.com/", - "protocol": "file:", - "username": "", - "password": "", - "host": "", - "hostname": "", - "port": "", - "pathname": "/example.com/", - "search": "", - "hash": "" - }, - { - "input": "ftps:/example.com/", - "base": "about:blank", - "href": "ftps:/example.com/", - "origin": "null", - "protocol": "ftps:", - "username": "", - "password": "", - "host": "", - "hostname": "", - "port": "", - "pathname": "/example.com/", - "search": "", - "hash": "" - }, - { - "input": "gopher:/example.com/", - "base": "about:blank", - "href": "gopher://example.com/", - "origin": "gopher://example.com", - "protocol": "gopher:", - "username": "", - "password": "", - "host": "example.com", - "hostname": "example.com", - "port": "", - "pathname": "/", - "search": "", - "hash": "" - }, - { - "input": "ws:/example.com/", - "base": "about:blank", - "href": "ws://example.com/", - "origin": "ws://example.com", - "protocol": "ws:", - "username": "", - "password": "", - "host": "example.com", - "hostname": "example.com", - "port": "", - "pathname": "/", - "search": "", - "hash": "" - }, - { - "input": "wss:/example.com/", - "base": "about:blank", - "href": "wss://example.com/", - "origin": "wss://example.com", - "protocol": "wss:", - "username": "", - "password": "", - "host": "example.com", - "hostname": "example.com", - "port": "", - "pathname": "/", - "search": "", - "hash": "" - }, - { - "input": "data:/example.com/", - "base": "about:blank", - "href": "data:/example.com/", - "origin": "null", - "protocol": "data:", - "username": "", - "password": "", - "host": "", - "hostname": "", - "port": "", - "pathname": "/example.com/", - "search": "", - "hash": "" - }, - { - "input": "javascript:/example.com/", - "base": "about:blank", - "href": "javascript:/example.com/", - "origin": "null", - "protocol": "javascript:", - "username": "", - "password": "", - "host": "", - "hostname": "", - "port": "", - "pathname": "/example.com/", - "search": "", - "hash": "" - }, - { - "input": "mailto:/example.com/", - "base": "about:blank", - "href": "mailto:/example.com/", - "origin": "null", - "protocol": "mailto:", - "username": "", - "password": "", - "host": "", - "hostname": "", - "port": "", - "pathname": "/example.com/", - "search": "", - "hash": "" - }, - { - "input": "http:example.com/", - "base": "about:blank", - "href": "http://example.com/", - "origin": "http://example.com", - "protocol": "http:", - "username": "", - "password": "", - "host": "example.com", - "hostname": "example.com", - "port": "", - "pathname": "/", - "search": "", - "hash": "" - }, - { - "input": "ftp:example.com/", - "base": "about:blank", - "href": "ftp://example.com/", - "origin": "ftp://example.com", - "protocol": "ftp:", - "username": "", - "password": "", - "host": "example.com", - "hostname": "example.com", - "port": "", - "pathname": "/", - "search": "", - "hash": "" - }, - { - "input": "https:example.com/", - "base": "about:blank", - "href": "https://example.com/", - "origin": "https://example.com", - "protocol": "https:", - "username": "", - "password": "", - "host": "example.com", - "hostname": "example.com", - "port": "", - "pathname": "/", - "search": "", - "hash": "" - }, - { - "input": "madeupscheme:example.com/", - "base": "about:blank", - "href": "madeupscheme:example.com/", - "origin": "null", - "protocol": "madeupscheme:", - "username": "", - "password": "", - "host": "", - "hostname": "", - "port": "", - "pathname": "example.com/", - "search": "", - "hash": "" - }, - { - "input": "ftps:example.com/", - "base": "about:blank", - "href": "ftps:example.com/", - "origin": "null", - "protocol": "ftps:", - "username": "", - "password": "", - "host": "", - "hostname": "", - "port": "", - "pathname": "example.com/", - "search": "", - "hash": "" - }, - { - "input": "gopher:example.com/", - "base": "about:blank", - "href": "gopher://example.com/", - "origin": "gopher://example.com", - "protocol": "gopher:", - "username": "", - "password": "", - "host": "example.com", - "hostname": "example.com", - "port": "", - "pathname": "/", - "search": "", - "hash": "" - }, - { - "input": "ws:example.com/", - "base": "about:blank", - "href": "ws://example.com/", - "origin": "ws://example.com", - "protocol": "ws:", - "username": "", - "password": "", - "host": "example.com", - "hostname": "example.com", - "port": "", - "pathname": "/", - "search": "", - "hash": "" - }, - { - "input": "wss:example.com/", - "base": "about:blank", - "href": "wss://example.com/", - "origin": "wss://example.com", - "protocol": "wss:", - "username": "", - "password": "", - "host": "example.com", - "hostname": "example.com", - "port": "", - "pathname": "/", - "search": "", - "hash": "" - }, - { - "input": "data:example.com/", - "base": "about:blank", - "href": "data:example.com/", - "origin": "null", - "protocol": "data:", - "username": "", - "password": "", - "host": "", - "hostname": "", - "port": "", - "pathname": "example.com/", - "search": "", - "hash": "" - }, - { - "input": "javascript:example.com/", - "base": "about:blank", - "href": "javascript:example.com/", - "origin": "null", - "protocol": "javascript:", - "username": "", - "password": "", - "host": "", - "hostname": "", - "port": "", - "pathname": "example.com/", - "search": "", - "hash": "" - }, - { - "input": "mailto:example.com/", - "base": "about:blank", - "href": "mailto:example.com/", - "origin": "null", - "protocol": "mailto:", - "username": "", - "password": "", - "host": "", - "hostname": "", - "port": "", - "pathname": "example.com/", - "search": "", - "hash": "" - }, - "# Based on http://trac.webkit.org/browser/trunk/LayoutTests/fast/url/segments-userinfo-vs-host.html", - { - "input": "http:@www.example.com", - "base": "about:blank", - "href": "http://www.example.com/", - "origin": "http://www.example.com", - "protocol": "http:", - "username": "", - "password": "", - "host": "www.example.com", - "hostname": "www.example.com", - "port": "", - "pathname": "/", - "search": "", - "hash": "" - }, - { - "input": "http:/@www.example.com", - "base": "about:blank", - "href": "http://www.example.com/", - "origin": "http://www.example.com", - "protocol": "http:", - "username": "", - "password": "", - "host": "www.example.com", - "hostname": "www.example.com", - "port": "", - "pathname": "/", - "search": "", - "hash": "" - }, - { - "input": "http://@www.example.com", - "base": "about:blank", - "href": "http://www.example.com/", - "origin": "http://www.example.com", - "protocol": "http:", - "username": "", - "password": "", - "host": "www.example.com", - "hostname": "www.example.com", - "port": "", - "pathname": "/", - "search": "", - "hash": "" - }, - { - "input": "http:a:b@www.example.com", - "base": "about:blank", - "href": "http://a:b@www.example.com/", - "origin": "http://www.example.com", - "protocol": "http:", - "username": "a", - "password": "b", - "host": "www.example.com", - "hostname": "www.example.com", - "port": "", - "pathname": "/", - "search": "", - "hash": "" - }, - { - "input": "http:/a:b@www.example.com", - "base": "about:blank", - "href": "http://a:b@www.example.com/", - "origin": "http://www.example.com", - "protocol": "http:", - "username": "a", - "password": "b", - "host": "www.example.com", - "hostname": "www.example.com", - "port": "", - "pathname": "/", - "search": "", - "hash": "" - }, - { - "input": "http://a:b@www.example.com", - "base": "about:blank", - "href": "http://a:b@www.example.com/", - "origin": "http://www.example.com", - "protocol": "http:", - "username": "a", - "password": "b", - "host": "www.example.com", - "hostname": "www.example.com", - "port": "", - "pathname": "/", - "search": "", - "hash": "" - }, - { - "input": "http://@pple.com", - "base": "about:blank", - "href": "http://pple.com/", - "origin": "http://pple.com", - "protocol": "http:", - "username": "", - "password": "", - "host": "pple.com", - "hostname": "pple.com", - "port": "", - "pathname": "/", - "search": "", - "hash": "" - }, - { - "input": "http::b@www.example.com", - "base": "about:blank", - "href": "http://:b@www.example.com/", - "origin": "http://www.example.com", - "protocol": "http:", - "username": "", - "password": "b", - "host": "www.example.com", - "hostname": "www.example.com", - "port": "", - "pathname": "/", - "search": "", - "hash": "" - }, - { - "input": "http:/:b@www.example.com", - "base": "about:blank", - "href": "http://:b@www.example.com/", - "origin": "http://www.example.com", - "protocol": "http:", - "username": "", - "password": "b", - "host": "www.example.com", - "hostname": "www.example.com", - "port": "", - "pathname": "/", - "search": "", - "hash": "" - }, - { - "input": "http://:b@www.example.com", - "base": "about:blank", - "href": "http://:b@www.example.com/", - "origin": "http://www.example.com", - "protocol": "http:", - "username": "", - "password": "b", - "host": "www.example.com", - "hostname": "www.example.com", - "port": "", - "pathname": "/", - "search": "", - "hash": "" - }, - { - "input": "http:/:@/www.example.com", - "base": "about:blank", - "failure": true - }, - { - "input": "http://user@/www.example.com", - "base": "about:blank", - "failure": true - }, - { - "input": "http:@/www.example.com", - "base": "about:blank", - "failure": true - }, - { - "input": "http:/@/www.example.com", - "base": "about:blank", - "failure": true - }, - { - "input": "http://@/www.example.com", - "base": "about:blank", - "failure": true - }, - { - "input": "https:@/www.example.com", - "base": "about:blank", - "failure": true - }, - { - "input": "http:a:b@/www.example.com", - "base": "about:blank", - "failure": true - }, - { - "input": "http:/a:b@/www.example.com", - "base": "about:blank", - "failure": true - }, - { - "input": "http://a:b@/www.example.com", - "base": "about:blank", - "failure": true - }, - { - "input": "http::@/www.example.com", - "base": "about:blank", - "failure": true - }, - { - "input": "http:a:@www.example.com", - "base": "about:blank", - "href": "http://a:@www.example.com/", - "origin": "http://www.example.com", - "protocol": "http:", - "username": "a", - "password": "", - "host": "www.example.com", - "hostname": "www.example.com", - "port": "", - "pathname": "/", - "search": "", - "hash": "" - }, - { - "input": "http:/a:@www.example.com", - "base": "about:blank", - "href": "http://a:@www.example.com/", - "origin": "http://www.example.com", - "protocol": "http:", - "username": "a", - "password": "", - "host": "www.example.com", - "hostname": "www.example.com", - "port": "", - "pathname": "/", - "search": "", - "hash": "" - }, - { - "input": "http://a:@www.example.com", - "base": "about:blank", - "href": "http://a:@www.example.com/", - "origin": "http://www.example.com", - "protocol": "http:", - "username": "a", - "password": "", - "host": "www.example.com", - "hostname": "www.example.com", - "port": "", - "pathname": "/", - "search": "", - "hash": "" - }, - { - "input": "http://www.@pple.com", - "base": "about:blank", - "href": "http://www.@pple.com/", - "origin": "http://pple.com", - "protocol": "http:", - "username": "www.", - "password": "", - "host": "pple.com", - "hostname": "pple.com", - "port": "", - "pathname": "/", - "search": "", - "hash": "" - }, - { - "input": "http:@:www.example.com", - "base": "about:blank", - "failure": true - }, - { - "input": "http:/@:www.example.com", - "base": "about:blank", - "failure": true - }, - { - "input": "http://@:www.example.com", - "base": "about:blank", - "failure": true - }, - { - "input": "http://:@www.example.com", - "base": "about:blank", - "href": "http://:@www.example.com/", - "origin": "http://www.example.com", - "protocol": "http:", - "username": "", - "password": "", - "host": "www.example.com", - "hostname": "www.example.com", - "port": "", - "pathname": "/", - "search": "", - "hash": "" - }, - "# Others", - { - "input": "/", - "base": "http://www.example.com/test", - "href": "http://www.example.com/", - "origin": "http://www.example.com", - "protocol": "http:", - "username": "", - "password": "", - "host": "www.example.com", - "hostname": "www.example.com", - "port": "", - "pathname": "/", - "search": "", - "hash": "" - }, - { - "input": "/test.txt", - "base": "http://www.example.com/test", - "href": "http://www.example.com/test.txt", - "origin": "http://www.example.com", - "protocol": "http:", - "username": "", - "password": "", - "host": "www.example.com", - "hostname": "www.example.com", - "port": "", - "pathname": "/test.txt", - "search": "", - "hash": "" - }, - { - "input": ".", - "base": "http://www.example.com/test", - "href": "http://www.example.com/", - "origin": "http://www.example.com", - "protocol": "http:", - "username": "", - "password": "", - "host": "www.example.com", - "hostname": "www.example.com", - "port": "", - "pathname": "/", - "search": "", - "hash": "" - }, - { - "input": "..", - "base": "http://www.example.com/test", - "href": "http://www.example.com/", - "origin": "http://www.example.com", - "protocol": "http:", - "username": "", - "password": "", - "host": "www.example.com", - "hostname": "www.example.com", - "port": "", - "pathname": "/", - "search": "", - "hash": "" - }, - { - "input": "test.txt", - "base": "http://www.example.com/test", - "href": "http://www.example.com/test.txt", - "origin": "http://www.example.com", - "protocol": "http:", - "username": "", - "password": "", - "host": "www.example.com", - "hostname": "www.example.com", - "port": "", - "pathname": "/test.txt", - "search": "", - "hash": "" - }, - { - "input": "./test.txt", - "base": "http://www.example.com/test", - "href": "http://www.example.com/test.txt", - "origin": "http://www.example.com", - "protocol": "http:", - "username": "", - "password": "", - "host": "www.example.com", - "hostname": "www.example.com", - "port": "", - "pathname": "/test.txt", - "search": "", - "hash": "" - }, - { - "input": "../test.txt", - "base": "http://www.example.com/test", - "href": "http://www.example.com/test.txt", - "origin": "http://www.example.com", - "protocol": "http:", - "username": "", - "password": "", - "host": "www.example.com", - "hostname": "www.example.com", - "port": "", - "pathname": "/test.txt", - "search": "", - "hash": "" - }, - { - "input": "../aaa/test.txt", - "base": "http://www.example.com/test", - "href": "http://www.example.com/aaa/test.txt", - "origin": "http://www.example.com", - "protocol": "http:", - "username": "", - "password": "", - "host": "www.example.com", - "hostname": "www.example.com", - "port": "", - "pathname": "/aaa/test.txt", - "search": "", - "hash": "" - }, - { - "input": "../../test.txt", - "base": "http://www.example.com/test", - "href": "http://www.example.com/test.txt", - "origin": "http://www.example.com", - "protocol": "http:", - "username": "", - "password": "", - "host": "www.example.com", - "hostname": "www.example.com", - "port": "", - "pathname": "/test.txt", - "search": "", - "hash": "" - }, - { - "input": "中/test.txt", - "base": "http://www.example.com/test", - "href": "http://www.example.com/%E4%B8%AD/test.txt", - "origin": "http://www.example.com", - "protocol": "http:", - "username": "", - "password": "", - "host": "www.example.com", - "hostname": "www.example.com", - "port": "", - "pathname": "/%E4%B8%AD/test.txt", - "search": "", - "hash": "" - }, - { - "input": "http://www.example2.com", - "base": "http://www.example.com/test", - "href": "http://www.example2.com/", - "origin": "http://www.example2.com", - "protocol": "http:", - "username": "", - "password": "", - "host": "www.example2.com", - "hostname": "www.example2.com", - "port": "", - "pathname": "/", - "search": "", - "hash": "" - }, - { - "input": "//www.example2.com", - "base": "http://www.example.com/test", - "href": "http://www.example2.com/", - "origin": "http://www.example2.com", - "protocol": "http:", - "username": "", - "password": "", - "host": "www.example2.com", - "hostname": "www.example2.com", - "port": "", - "pathname": "/", - "search": "", - "hash": "" - }, - { - "input": "file:...", - "base": "http://www.example.com/test", - "href": "file:///...", - "protocol": "file:", - "username": "", - "password": "", - "host": "", - "hostname": "", - "port": "", - "pathname": "/...", - "search": "", - "hash": "" - }, - { - "input": "file:..", - "base": "http://www.example.com/test", - "href": "file:///", - "protocol": "file:", - "username": "", - "password": "", - "host": "", - "hostname": "", - "port": "", - "pathname": "/", - "search": "", - "hash": "" - }, - { - "input": "file:a", - "base": "http://www.example.com/test", - "href": "file:///a", - "protocol": "file:", - "username": "", - "password": "", - "host": "", - "hostname": "", - "port": "", - "pathname": "/a", - "search": "", - "hash": "" - }, - "# Based on http://trac.webkit.org/browser/trunk/LayoutTests/fast/url/host.html", - "Basic canonicalization, uppercase should be converted to lowercase", - { - "input": "http://ExAmPlE.CoM", - "base": "http://other.com/", - "href": "http://example.com/", - "origin": "http://example.com", - "protocol": "http:", - "username": "", - "password": "", - "host": "example.com", - "hostname": "example.com", - "port": "", - "pathname": "/", - "search": "", - "hash": "" - }, - { - "input": "http://example example.com", - "base": "http://other.com/", - "failure": true - }, - { - "input": "http://Goo%20 goo%7C|.com", - "base": "http://other.com/", - "failure": true - }, - { - "input": "http://[]", - "base": "http://other.com/", - "failure": true - }, - { - "input": "http://[:]", - "base": "http://other.com/", - "failure": true - }, - "U+3000 is mapped to U+0020 (space) which is disallowed", - { - "input": "http://GOO\u00a0\u3000goo.com", - "base": "http://other.com/", - "failure": true - }, - "Other types of space (no-break, zero-width, zero-width-no-break) are name-prepped away to nothing. U+200B, U+2060, and U+FEFF, are ignored", - { - "input": "http://GOO\u200b\u2060\ufeffgoo.com", - "base": "http://other.com/", - "href": "http://googoo.com/", - "origin": "http://googoo.com", - "protocol": "http:", - "username": "", - "password": "", - "host": "googoo.com", - "hostname": "googoo.com", - "port": "", - "pathname": "/", - "search": "", - "hash": "" - }, - "Ideographic full stop (full-width period for Chinese, etc.) should be treated as a dot. U+3002 is mapped to U+002E (dot)", - { - "input": "http://www.foo。bar.com", - "base": "http://other.com/", - "href": "http://www.foo.bar.com/", - "origin": "http://www.foo.bar.com", - "protocol": "http:", - "username": "", - "password": "", - "host": "www.foo.bar.com", - "hostname": "www.foo.bar.com", - "port": "", - "pathname": "/", - "search": "", - "hash": "" - }, - "Invalid unicode characters should fail... U+FDD0 is disallowed; %ef%b7%90 is U+FDD0", - { - "input": "http://\ufdd0zyx.com", - "base": "http://other.com/", - "failure": true - }, - "This is the same as previous but escaped", - { - "input": "http://%ef%b7%90zyx.com", - "base": "http://other.com/", - "failure": true - }, - "Test name prepping, fullwidth input should be converted to ASCII and NOT IDN-ized. This is 'Go' in fullwidth UTF-8/UTF-16.", - { - "input": "http://Go.com", - "base": "http://other.com/", - "href": "http://go.com/", - "origin": "http://go.com", - "protocol": "http:", - "username": "", - "password": "", - "host": "go.com", - "hostname": "go.com", - "port": "", - "pathname": "/", - "search": "", - "hash": "" - }, - "URL spec forbids the following. https://www.w3.org/Bugs/Public/show_bug.cgi?id=24257", - { - "input": "http://%41.com", - "base": "http://other.com/", - "failure": true - }, - { - "input": "http://%ef%bc%85%ef%bc%94%ef%bc%91.com", - "base": "http://other.com/", - "failure": true - }, - "...%00 in fullwidth should fail (also as escaped UTF-8 input)", - { - "input": "http://%00.com", - "base": "http://other.com/", - "failure": true - }, - { - "input": "http://%ef%bc%85%ef%bc%90%ef%bc%90.com", - "base": "http://other.com/", - "failure": true - }, - "Basic IDN support, UTF-8 and UTF-16 input should be converted to IDN", - { - "input": "http://你好你好", - "base": "http://other.com/", - "href": "http://xn--6qqa088eba/", - "origin": "http://你好你好", - "protocol": "http:", - "username": "", - "password": "", - "host": "xn--6qqa088eba", - "hostname": "xn--6qqa088eba", - "port": "", - "pathname": "/", - "search": "", - "hash": "" - }, - "Invalid escaped characters should fail and the percents should be escaped. https://www.w3.org/Bugs/Public/show_bug.cgi?id=24191", - { - "input": "http://%zz%66%a.com", - "base": "http://other.com/", - "failure": true - }, - "If we get an invalid character that has been escaped.", - { - "input": "http://%25", - "base": "http://other.com/", - "failure": true - }, - { - "input": "http://hello%00", - "base": "http://other.com/", - "failure": true - }, - "Escaped numbers should be treated like IP addresses if they are.", - { - "input": "http://%30%78%63%30%2e%30%32%35%30.01", - "base": "http://other.com/", - "href": "http://192.168.0.1/", - "origin": "http://192.168.0.1", - "protocol": "http:", - "username": "", - "password": "", - "host": "192.168.0.1", - "hostname": "192.168.0.1", - "port": "", - "pathname": "/", - "search": "", - "hash": "" - }, - { - "input": "http://%30%78%63%30%2e%30%32%35%30.01%2e", - "base": "http://other.com/", - "href": "http://192.168.0.1/", - "origin": "http://192.168.0.1", - "protocol": "http:", - "username": "", - "password": "", - "host": "192.168.0.1", - "hostname": "192.168.0.1", - "port": "", - "pathname": "/", - "search": "", - "hash": "" - }, - { - "input": "http://192.168.0.257", - "base": "http://other.com/", - "failure": true - }, - "Invalid escaping should trigger the regular host error handling", - { - "input": "http://%3g%78%63%30%2e%30%32%35%30%2E.01", - "base": "http://other.com/", - "failure": true - }, - "Something that isn't exactly an IP should get treated as a host and spaces escaped", - { - "input": "http://192.168.0.1 hello", - "base": "http://other.com/", - "failure": true - }, - "Fullwidth and escaped UTF-8 fullwidth should still be treated as IP", - { - "input": "http://0Xc0.0250.01", - "base": "http://other.com/", - "href": "http://192.168.0.1/", - "origin": "http://192.168.0.1", - "protocol": "http:", - "username": "", - "password": "", - "host": "192.168.0.1", - "hostname": "192.168.0.1", - "port": "", - "pathname": "/", - "search": "", - "hash": "" - }, - "Broken IPv6", - { - "input": "http://[google.com]", - "base": "http://other.com/", - "failure": true - }, - "Misc Unicode", - { - "input": "http://foo:💩@example.com/bar", - "base": "http://other.com/", - "href": "http://foo:%F0%9F%92%A9@example.com/bar", - "origin": "http://example.com", - "protocol": "http:", - "username": "foo", - "password": "%F0%9F%92%A9", - "host": "example.com", - "hostname": "example.com", - "port": "", - "pathname": "/bar", - "search": "", - "hash": "" - }, - "# resolving a fragment against any scheme succeeds", - { - "input": "#", - "base": "test:test", - "href": "test:test#", - "origin": "null", - "protocol": "test:", - "username": "", - "password": "", - "host": "", - "hostname": "", - "port": "", - "pathname": "test", - "search": "", - "hash": "" - }, - { - "input": "#x", - "base": "mailto:x@x.com", - "href": "mailto:x@x.com#x", - "origin": "null", - "protocol": "mailto:", - "username": "", - "password": "", - "host": "", - "hostname": "", - "port": "", - "pathname": "x@x.com", - "search": "", - "hash": "#x" - }, - { - "input": "#x", - "base": "data:,", - "href": "data:,#x", - "origin": "null", - "protocol": "data:", - "username": "", - "password": "", - "host": "", - "hostname": "", - "port": "", - "pathname": ",", - "search": "", - "hash": "#x" - }, - { - "input": "#x", - "base": "about:blank", - "href": "about:blank#x", - "origin": "null", - "protocol": "about:", - "username": "", - "password": "", - "host": "", - "hostname": "", - "port": "", - "pathname": "blank", - "search": "", - "hash": "#x" - }, - { - "input": "#", - "base": "test:test?test", - "href": "test:test?test#", - "origin": "null", - "protocol": "test:", - "username": "", - "password": "", - "host": "", - "hostname": "", - "port": "", - "pathname": "test", - "search": "?test", - "hash": "" - }, - "# multiple @ in authority state", - { - "input": "https://@test@test@example:800/", - "base": "http://doesnotmatter/", - "href": "https://%40test%40test@example:800/", - "origin": "https://example:800", - "protocol": "https:", - "username": "%40test%40test", - "password": "", - "host": "example:800", - "hostname": "example", - "port": "800", - "pathname": "/", - "search": "", - "hash": "" - }, - { - "input": "https://@@@example", - "base": "http://doesnotmatter/", - "href": "https://%40%40@example/", - "origin": "https://example", - "protocol": "https:", - "username": "%40%40", - "password": "", - "host": "example", - "hostname": "example", - "port": "", - "pathname": "/", - "search": "", - "hash": "" - }, - "non-az-09 characters", - { - "input": "http://`{}:`{}@h/`{}?`{}", - "base": "http://doesnotmatter/", - "href": "http://%60%7B%7D:%60%7B%7D@h/%60%7B%7D?`{}", - "origin": "http://h", - "protocol": "http:", - "username": "%60%7B%7D", - "password": "%60%7B%7D", - "host": "h", - "hostname": "h", - "port": "", - "pathname": "/%60%7B%7D", - "search": "?`{}", - "hash": "" - }, - "# Credentials in base", - { - "input": "/some/path", - "base": "http://user@example.org/smth", - "href": "http://user@example.org/some/path", - "origin": "http://example.org", - "protocol": "http:", - "username": "user", - "password": "", - "host": "example.org", - "hostname": "example.org", - "port": "", - "pathname": "/some/path", - "search": "", - "hash": "" - }, - { - "input": "", - "base": "http://user:pass@example.org:21/smth", - "href": "http://user:pass@example.org:21/smth", - "origin": "http://example.org:21", - "protocol": "http:", - "username": "user", - "password": "pass", - "host": "example.org:21", - "hostname": "example.org", - "port": "21", - "pathname": "/smth", - "search": "", - "hash": "" - }, - { - "input": "/some/path", - "base": "http://user:pass@example.org:21/smth", - "href": "http://user:pass@example.org:21/some/path", - "origin": "http://example.org:21", - "protocol": "http:", - "username": "user", - "password": "pass", - "host": "example.org:21", - "hostname": "example.org", - "port": "21", - "pathname": "/some/path", - "search": "", - "hash": "" - }, - "# a set of tests designed by zcorpan for relative URLs with unknown schemes", - { - "input": "i", - "base": "sc:sd", - "failure": true - }, - { - "input": "i", - "base": "sc:sd/sd", - "failure": true - }, - { - "input": "i", - "base": "sc:/pa/pa", - "href": "sc:/pa/i", - "origin": "null", - "protocol": "sc:", - "username": "", - "password": "", - "host": "", - "hostname": "", - "port": "", - "pathname": "/pa/i", - "search": "", - "hash": "" - }, - { - "input": "i", - "base": "sc://ho/pa", - "href": "sc://ho/i", - "origin": "null", - "protocol": "sc:", - "username": "", - "password": "", - "host": "ho", - "hostname": "ho", - "port": "", - "pathname": "/i", - "search": "", - "hash": "" - }, - { - "input": "i", - "base": "sc:///pa/pa", - "href": "sc:///pa/i", - "origin": "null", - "protocol": "sc:", - "username": "", - "password": "", - "host": "", - "hostname": "", - "port": "", - "pathname": "/pa/i", - "search": "", - "hash": "" - }, - { - "input": "../i", - "base": "sc:sd", - "failure": true - }, - { - "input": "../i", - "base": "sc:sd/sd", - "failure": true - }, - { - "input": "../i", - "base": "sc:/pa/pa", - "href": "sc:/i", - "origin": "null", - "protocol": "sc:", - "username": "", - "password": "", - "host": "", - "hostname": "", - "port": "", - "pathname": "/i", - "search": "", - "hash": "" - }, - { - "input": "../i", - "base": "sc://ho/pa", - "href": "sc://ho/i", - "origin": "null", - "protocol": "sc:", - "username": "", - "password": "", - "host": "ho", - "hostname": "ho", - "port": "", - "pathname": "/i", - "search": "", - "hash": "" - }, - { - "input": "../i", - "base": "sc:///pa/pa", - "href": "sc:///i", - "origin": "null", - "protocol": "sc:", - "username": "", - "password": "", - "host": "", - "hostname": "", - "port": "", - "pathname": "/i", - "search": "", - "hash": "" - }, - { - "input": "/i", - "base": "sc:sd", - "failure": true - }, - { - "input": "/i", - "base": "sc:sd/sd", - "failure": true - }, - { - "input": "/i", - "base": "sc:/pa/pa", - "href": "sc:/i", - "origin": "null", - "protocol": "sc:", - "username": "", - "password": "", - "host": "", - "hostname": "", - "port": "", - "pathname": "/i", - "search": "", - "hash": "" - }, - { - "input": "/i", - "base": "sc://ho/pa", - "href": "sc://ho/i", - "origin": "null", - "protocol": "sc:", - "username": "", - "password": "", - "host": "ho", - "hostname": "ho", - "port": "", - "pathname": "/i", - "search": "", - "hash": "" - }, - { - "input": "/i", - "base": "sc:///pa/pa", - "href": "sc:///i", - "origin": "null", - "protocol": "sc:", - "username": "", - "password": "", - "host": "", - "hostname": "", - "port": "", - "pathname": "/i", - "search": "", - "hash": "" - }, - { - "input": "?i", - "base": "sc:sd", - "failure": true - }, - { - "input": "?i", - "base": "sc:sd/sd", - "failure": true - }, - { - "input": "?i", - "base": "sc:/pa/pa", - "href": "sc:/pa/pa?i", - "origin": "null", - "protocol": "sc:", - "username": "", - "password": "", - "host": "", - "hostname": "", - "port": "", - "pathname": "/pa/pa", - "search": "?i", - "hash": "" - }, - { - "input": "?i", - "base": "sc://ho/pa", - "href": "sc://ho/pa?i", - "origin": "null", - "protocol": "sc:", - "username": "", - "password": "", - "host": "ho", - "hostname": "ho", - "port": "", - "pathname": "/pa", - "search": "?i", - "hash": "" - }, - { - "input": "?i", - "base": "sc:///pa/pa", - "href": "sc:///pa/pa?i", - "origin": "null", - "protocol": "sc:", - "username": "", - "password": "", - "host": "", - "hostname": "", - "port": "", - "pathname": "/pa/pa", - "search": "?i", - "hash": "" - }, - { - "input": "#i", - "base": "sc:sd", - "href": "sc:sd#i", - "origin": "null", - "protocol": "sc:", - "username": "", - "password": "", - "host": "", - "hostname": "", - "port": "", - "pathname": "sd", - "search": "", - "hash": "#i" - }, - { - "input": "#i", - "base": "sc:sd/sd", - "href": "sc:sd/sd#i", - "origin": "null", - "protocol": "sc:", - "username": "", - "password": "", - "host": "", - "hostname": "", - "port": "", - "pathname": "sd/sd", - "search": "", - "hash": "#i" - }, - { - "input": "#i", - "base": "sc:/pa/pa", - "href": "sc:/pa/pa#i", - "origin": "null", - "protocol": "sc:", - "username": "", - "password": "", - "host": "", - "hostname": "", - "port": "", - "pathname": "/pa/pa", - "search": "", - "hash": "#i" - }, - { - "input": "#i", - "base": "sc://ho/pa", - "href": "sc://ho/pa#i", - "origin": "null", - "protocol": "sc:", - "username": "", - "password": "", - "host": "ho", - "hostname": "ho", - "port": "", - "pathname": "/pa", - "search": "", - "hash": "#i" - }, - { - "input": "#i", - "base": "sc:///pa/pa", - "href": "sc:///pa/pa#i", - "origin": "null", - "protocol": "sc:", - "username": "", - "password": "", - "host": "", - "hostname": "", - "port": "", - "pathname": "/pa/pa", - "search": "", - "hash": "#i" - }, - "# make sure that relative URL logic works on known typically non-relative schemes too", - { - "input": "about:/../", - "base": "about:blank", - "href": "about:/", - "origin": "null", - "protocol": "about:", - "username": "", - "password": "", - "host": "", - "hostname": "", - "port": "", - "pathname": "/", - "search": "", - "hash": "" - }, - { - "input": "data:/../", - "base": "about:blank", - "href": "data:/", - "origin": "null", - "protocol": "data:", - "username": "", - "password": "", - "host": "", - "hostname": "", - "port": "", - "pathname": "/", - "search": "", - "hash": "" - }, - { - "input": "javascript:/../", - "base": "about:blank", - "href": "javascript:/", - "origin": "null", - "protocol": "javascript:", - "username": "", - "password": "", - "host": "", - "hostname": "", - "port": "", - "pathname": "/", - "search": "", - "hash": "" - }, - { - "input": "mailto:/../", - "base": "about:blank", - "href": "mailto:/", - "origin": "null", - "protocol": "mailto:", - "username": "", - "password": "", - "host": "", - "hostname": "", - "port": "", - "pathname": "/", - "search": "", - "hash": "" - }, - "# unknown schemes and non-ASCII domains", - { - "input": "sc://ñ.test/", - "base": "about:blank", - "href": "sc://xn--ida.test/", - "origin": "null", - "protocol": "sc:", - "username": "", - "password": "", - "host": "xn--ida.test", - "hostname": "xn--ida.test", - "port": "", - "pathname": "/", - "search": "", - "hash": "" - }, - "# unknown schemes and backslashes", - { - "input": "sc:\\../", - "base": "about:blank", - "href": "sc:\\../", - "origin": "null", - "protocol": "sc:", - "username": "", - "password": "", - "host": "", - "hostname": "", - "port": "", - "pathname": "\\../", - "search": "", - "hash": "" - }, - "# unknown scheme with path looking like a password", - { - "input": "sc::a@example.net", - "base": "about:blank", - "href": "sc::a@example.net", - "origin": "null", - "protocol": "sc:", - "username": "", - "password": "", - "host": "", - "hostname": "", - "port": "", - "pathname": ":a@example.net", - "search": "", - "hash": "" - }, - "# tests from jsdom/whatwg-url designed for code coverage", - { - "input": "http://127.0.0.1:10100/relative_import.html", - "base": "about:blank", - "href": "http://127.0.0.1:10100/relative_import.html", - "origin": "http://127.0.0.1:10100", - "protocol": "http:", - "username": "", - "password": "", - "host": "127.0.0.1:10100", - "hostname": "127.0.0.1", - "port": "10100", - "pathname": "/relative_import.html", - "search": "", - "hash": "" - }, - { - "input": "http://facebook.com/?foo=%7B%22abc%22", - "base": "about:blank", - "href": "http://facebook.com/?foo=%7B%22abc%22", - "origin": "http://facebook.com", - "protocol": "http:", - "username": "", - "password": "", - "host": "facebook.com", - "hostname": "facebook.com", - "port": "", - "pathname": "/", - "search": "?foo=%7B%22abc%22", - "hash": "" - }, - { - "input": "https://localhost:3000/jqueryui@1.2.3", - "base": "about:blank", - "href": "https://localhost:3000/jqueryui@1.2.3", - "origin": "https://localhost:3000", - "protocol": "https:", - "username": "", - "password": "", - "host": "localhost:3000", - "hostname": "localhost", - "port": "3000", - "pathname": "/jqueryui@1.2.3", - "search": "", - "hash": "" - }, - "# tab/LF/CR", - { - "input": "h\tt\nt\rp://h\to\ns\rt:9\t0\n0\r0/p\ta\nt\rh?q\tu\ne\rry#f\tr\na\rg", - "base": "about:blank", - "href": "http://host:9000/path?query#frag", - "origin": "http://host:9000", - "protocol": "http:", - "username": "", - "password": "", - "host": "host:9000", - "hostname": "host", - "port": "9000", - "pathname": "/path", - "search": "?query", - "hash": "#frag" - }, - "# Stringification of URL.searchParams", - { - "input": "?a=b&c=d", - "base": "http://example.org/foo/bar", - "href": "http://example.org/foo/bar?a=b&c=d", - "origin": "http://example.org", - "protocol": "http:", - "username": "", - "password": "", - "host": "example.org", - "hostname": "example.org", - "port": "", - "pathname": "/foo/bar", - "search": "?a=b&c=d", - "searchParams": "a=b&c=d", - "hash": "" - }, - { - "input": "??a=b&c=d", - "base": "http://example.org/foo/bar", - "href": "http://example.org/foo/bar??a=b&c=d", - "origin": "http://example.org", - "protocol": "http:", - "username": "", - "password": "", - "host": "example.org", - "hostname": "example.org", - "port": "", - "pathname": "/foo/bar", - "search": "??a=b&c=d", - "searchParams": "%3Fa=b&c=d", - "hash": "" - } -] |