summaryrefslogtreecommitdiffstats
path: root/third_party/rust/url
diff options
context:
space:
mode:
authorMatt A. Tobin <mattatobin@localhost.localdomain>2018-02-02 04:16:08 -0500
committerMatt A. Tobin <mattatobin@localhost.localdomain>2018-02-02 04:16:08 -0500
commit5f8de423f190bbb79a62f804151bc24824fa32d8 (patch)
tree10027f336435511475e392454359edea8e25895d /third_party/rust/url
parent49ee0794b5d912db1f95dce6eb52d781dc210db5 (diff)
downloadUXP-5f8de423f190bbb79a62f804151bc24824fa32d8.tar
UXP-5f8de423f190bbb79a62f804151bc24824fa32d8.tar.gz
UXP-5f8de423f190bbb79a62f804151bc24824fa32d8.tar.lz
UXP-5f8de423f190bbb79a62f804151bc24824fa32d8.tar.xz
UXP-5f8de423f190bbb79a62f804151bc24824fa32d8.zip
Add m-esr52 at 52.6.0
Diffstat (limited to 'third_party/rust/url')
-rw-r--r--third_party/rust/url/.cargo-checksum.json1
-rw-r--r--third_party/rust/url/.cargo-ok0
-rw-r--r--third_party/rust/url/.gitignore3
-rw-r--r--third_party/rust/url/.travis.yml8
-rw-r--r--third_party/rust/url/Cargo.toml38
-rw-r--r--third_party/rust/url/LICENSE-APACHE201
-rw-r--r--third_party/rust/url/LICENSE-MIT25
-rw-r--r--third_party/rust/url/Makefile5
-rw-r--r--third_party/rust/url/README.md10
-rw-r--r--third_party/rust/url/UPGRADING.md263
-rw-r--r--third_party/rust/url/appveyor.yml13
-rw-r--r--third_party/rust/url/docs/.nojekyll0
-rw-r--r--third_party/rust/url/docs/404.html3
-rw-r--r--third_party/rust/url/docs/index.html3
-rw-r--r--third_party/rust/url/github.pngbin0 -> 7786 bytes
-rw-r--r--third_party/rust/url/rust-url-todo14
-rw-r--r--third_party/rust/url/src/encoding.rs135
-rw-r--r--third_party/rust/url/src/form_urlencoded.rs364
-rw-r--r--third_party/rust/url/src/host.rs418
-rw-r--r--third_party/rust/url/src/lib.rs1456
-rw-r--r--third_party/rust/url/src/origin.rs114
-rw-r--r--third_party/rust/url/src/parser.rs1179
-rw-r--r--third_party/rust/url/src/path_segments.rs187
-rw-r--r--third_party/rust/url/src/percent_encoding.rs344
-rw-r--r--third_party/rust/url/src/quirks.rs217
-rw-r--r--third_party/rust/url/src/slicing.rs182
-rw-r--r--third_party/rust/url/tests/data.rs193
-rw-r--r--third_party/rust/url/tests/setters_tests.json1148
-rw-r--r--third_party/rust/url/tests/unit.rs303
-rw-r--r--third_party/rust/url/tests/urltestdata.json4277
30 files changed, 11104 insertions, 0 deletions
diff --git a/third_party/rust/url/.cargo-checksum.json b/third_party/rust/url/.cargo-checksum.json
new file mode 100644
index 000000000..84a2a4d9b
--- /dev/null
+++ b/third_party/rust/url/.cargo-checksum.json
@@ -0,0 +1 @@
+{"files":{".cargo-ok":"e3b0c44298fc1c149afbf4c8996fb92427ae41e4649b934ca495991b7852b855",".gitignore":"e20a03cb660e0039506f8828204fd93815ebfe051ef62194f8dcf3fc8b7d0e5a",".travis.yml":"2a3033f9edf86bc829de486fc1e74fe0bbe3166ed99b0139754ea29772c19b06","Cargo.toml":"30055a6d4ff3d1bf29a9fa99401e4ffffeecc4b5bade830843a9a5f1634fefd1","LICENSE-APACHE":"a60eea817514531668d7e00765731449fe14d059d3249e0bc93b36de45f759f2","LICENSE-MIT":"20c7855c364d57ea4c97889a5e8d98470a9952dade37bd9248b9a54431670e5e","Makefile":"92b64915724e3b5fec95ec96c5af738bd219b80709e18bf8639d784bc3d9a600","README.md":"eb3f4694003f408cbe3c7f3e9fbbc71241defb940cc55a816981f0f0f144c8eb","UPGRADING.md":"fbcc2d39bdf17db0745793db6626fcd5c909dddd4ce13b27566cfabece22c368","appveyor.yml":"c78486dbfbe6ebbf3d808afb9a19f7ec18c4704ce451c6305f0716999b70a1a6","docs/.nojekyll":"e3b0c44298fc1c149afbf4c8996fb92427ae41e4649b934ca495991b7852b855","docs/404.html":"f61e6271c1ea1aa113b64b356e994595fa548f0433f89948d747503ad22195cd","docs/index.html":"f61e6271c1ea1aa113b64b356e994595fa548f0433f89948d747503ad22195cd","github.png":"b432fd855efe7c430fe6a57ccf83935c1996f03a7cdc8d6e1b34154b8c43f6ec","rust-url-todo":"1192cee7b6cedf2133d97dc6074b593a1d19b0ee13fff6f28d6329855044e575","src/encoding.rs":"7fb43e1c109bf9f2a80a05525082f90e79dba8e8056547571c49fba074406d39","src/form_urlencoded.rs":"172922f2c51eb8dae0182d70e5e0c2969f1b5b7aac026720ced9f84059465999","src/host.rs":"a654dc3c9ce9024b98698e000bc97abaac7f10c49b1635be8125cf72376fd5d1","src/lib.rs":"c3542aabc733f76a3b9c7d24b5c41e60e9eb84d2712660611300d1de0e7c2072","src/origin.rs":"d52010a280d363aed6832f7de5e52c1a62815302e59dcbc9cdc2574e2ac884b9","src/parser.rs":"8ca331ada66f309e91fcc375d8467c929b453979fe0ac5abe190eb8a32074db8","src/path_segments.rs":"0414985c441d0c0292ccc6f56a144b84728ae03382476e6cae1a766f8c333ef8","src/percent_encoding.rs":"44d3321eaa1c77715e9ea1421519289ca73612a31c3d6fce04ff489dfa7db3c5","src/quirks.rs":"3249d1a1f73dd29ec06d626ea2ea4d61e7b2a782543742a5bee422b2f3864b19
","src/slicing.rs":"4e539886b23945a92094625f3e531a4bff40daa44240b5d19ee8577478c4f7fe","tests/data.rs":"d36f0ee509fb00524635a7968e336bb89674a82a4fcb06be189155e4b9d43db5","tests/setters_tests.json":"ebb439306ea748be6d0f93132cb59220c5805afd56357d6017f1eb1e4f0f80b3","tests/unit.rs":"9a05f55c7b381b58ee67ef8ef145220e5df88a403225a1a324a36afc9bb6a7d7","tests/urltestdata.json":"11abe4a459566c3929e3326828f8576cb59ec8fab1d191714c34eac28d5f15f9"},"package":"8527c62d9869a08325c38272b3f85668df22a65890c61a639d233dc0ed0b23a2"} \ No newline at end of file
diff --git a/third_party/rust/url/.cargo-ok b/third_party/rust/url/.cargo-ok
new file mode 100644
index 000000000..e69de29bb
--- /dev/null
+++ b/third_party/rust/url/.cargo-ok
diff --git a/third_party/rust/url/.gitignore b/third_party/rust/url/.gitignore
new file mode 100644
index 000000000..0284c25cc
--- /dev/null
+++ b/third_party/rust/url/.gitignore
@@ -0,0 +1,3 @@
+target
+Cargo.lock
+/.cargo/config
diff --git a/third_party/rust/url/.travis.yml b/third_party/rust/url/.travis.yml
new file mode 100644
index 000000000..810995dfa
--- /dev/null
+++ b/third_party/rust/url/.travis.yml
@@ -0,0 +1,8 @@
+language: rust
+rust:
+ - nightly
+ - beta
+ - stable
+script: make test
+notifications:
+ webhooks: http://build.servo.org:54856/travis
diff --git a/third_party/rust/url/Cargo.toml b/third_party/rust/url/Cargo.toml
new file mode 100644
index 000000000..c3f4d364b
--- /dev/null
+++ b/third_party/rust/url/Cargo.toml
@@ -0,0 +1,38 @@
+[package]
+
+name = "url"
+version = "1.2.1"
+authors = ["The rust-url developers"]
+
+description = "URL library for Rust, based on the WHATWG URL Standard"
+documentation = "http://servo.github.io/rust-url/url/index.html"
+repository = "https://github.com/servo/rust-url"
+readme = "README.md"
+keywords = ["url", "parser"]
+license = "MIT/Apache-2.0"
+
+[[test]]
+name = "unit"
+
+[[test]]
+name = "data"
+harness = false
+
+[lib]
+test = false
+
+[dev-dependencies]
+rustc-test = "0.1"
+rustc-serialize = "0.3"
+
+[features]
+query_encoding = ["encoding"]
+heap_size = ["heapsize"]
+
+[dependencies]
+encoding = {version = "0.2", optional = true}
+heapsize = {version = ">=0.1.1, <0.4", optional = true}
+idna = { version = "0.1.0", path = "./idna" }
+matches = "0.1"
+rustc-serialize = {version = "0.3", optional = true}
+serde = {version = ">=0.6.1, <0.9", optional = true}
diff --git a/third_party/rust/url/LICENSE-APACHE b/third_party/rust/url/LICENSE-APACHE
new file mode 100644
index 000000000..16fe87b06
--- /dev/null
+++ b/third_party/rust/url/LICENSE-APACHE
@@ -0,0 +1,201 @@
+ Apache License
+ Version 2.0, January 2004
+ http://www.apache.org/licenses/
+
+TERMS AND CONDITIONS FOR USE, REPRODUCTION, AND DISTRIBUTION
+
+1. Definitions.
+
+ "License" shall mean the terms and conditions for use, reproduction,
+ and distribution as defined by Sections 1 through 9 of this document.
+
+ "Licensor" shall mean the copyright owner or entity authorized by
+ the copyright owner that is granting the License.
+
+ "Legal Entity" shall mean the union of the acting entity and all
+ other entities that control, are controlled by, or are under common
+ control with that entity. For the purposes of this definition,
+ "control" means (i) the power, direct or indirect, to cause the
+ direction or management of such entity, whether by contract or
+ otherwise, or (ii) ownership of fifty percent (50%) or more of the
+ outstanding shares, or (iii) beneficial ownership of such entity.
+
+ "You" (or "Your") shall mean an individual or Legal Entity
+ exercising permissions granted by this License.
+
+ "Source" form shall mean the preferred form for making modifications,
+ including but not limited to software source code, documentation
+ source, and configuration files.
+
+ "Object" form shall mean any form resulting from mechanical
+ transformation or translation of a Source form, including but
+ not limited to compiled object code, generated documentation,
+ and conversions to other media types.
+
+ "Work" shall mean the work of authorship, whether in Source or
+ Object form, made available under the License, as indicated by a
+ copyright notice that is included in or attached to the work
+ (an example is provided in the Appendix below).
+
+ "Derivative Works" shall mean any work, whether in Source or Object
+ form, that is based on (or derived from) the Work and for which the
+ editorial revisions, annotations, elaborations, or other modifications
+ represent, as a whole, an original work of authorship. For the purposes
+ of this License, Derivative Works shall not include works that remain
+ separable from, or merely link (or bind by name) to the interfaces of,
+ the Work and Derivative Works thereof.
+
+ "Contribution" shall mean any work of authorship, including
+ the original version of the Work and any modifications or additions
+ to that Work or Derivative Works thereof, that is intentionally
+ submitted to Licensor for inclusion in the Work by the copyright owner
+ or by an individual or Legal Entity authorized to submit on behalf of
+ the copyright owner. For the purposes of this definition, "submitted"
+ means any form of electronic, verbal, or written communication sent
+ to the Licensor or its representatives, including but not limited to
+ communication on electronic mailing lists, source code control systems,
+ and issue tracking systems that are managed by, or on behalf of, the
+ Licensor for the purpose of discussing and improving the Work, but
+ excluding communication that is conspicuously marked or otherwise
+ designated in writing by the copyright owner as "Not a Contribution."
+
+ "Contributor" shall mean Licensor and any individual or Legal Entity
+ on behalf of whom a Contribution has been received by Licensor and
+ subsequently incorporated within the Work.
+
+2. Grant of Copyright License. Subject to the terms and conditions of
+ this License, each Contributor hereby grants to You a perpetual,
+ worldwide, non-exclusive, no-charge, royalty-free, irrevocable
+ copyright license to reproduce, prepare Derivative Works of,
+ publicly display, publicly perform, sublicense, and distribute the
+ Work and such Derivative Works in Source or Object form.
+
+3. Grant of Patent License. Subject to the terms and conditions of
+ this License, each Contributor hereby grants to You a perpetual,
+ worldwide, non-exclusive, no-charge, royalty-free, irrevocable
+ (except as stated in this section) patent license to make, have made,
+ use, offer to sell, sell, import, and otherwise transfer the Work,
+ where such license applies only to those patent claims licensable
+ by such Contributor that are necessarily infringed by their
+ Contribution(s) alone or by combination of their Contribution(s)
+ with the Work to which such Contribution(s) was submitted. If You
+ institute patent litigation against any entity (including a
+ cross-claim or counterclaim in a lawsuit) alleging that the Work
+ or a Contribution incorporated within the Work constitutes direct
+ or contributory patent infringement, then any patent licenses
+ granted to You under this License for that Work shall terminate
+ as of the date such litigation is filed.
+
+4. Redistribution. You may reproduce and distribute copies of the
+ Work or Derivative Works thereof in any medium, with or without
+ modifications, and in Source or Object form, provided that You
+ meet the following conditions:
+
+ (a) You must give any other recipients of the Work or
+ Derivative Works a copy of this License; and
+
+ (b) You must cause any modified files to carry prominent notices
+ stating that You changed the files; and
+
+ (c) You must retain, in the Source form of any Derivative Works
+ that You distribute, all copyright, patent, trademark, and
+ attribution notices from the Source form of the Work,
+ excluding those notices that do not pertain to any part of
+ the Derivative Works; and
+
+ (d) If the Work includes a "NOTICE" text file as part of its
+ distribution, then any Derivative Works that You distribute must
+ include a readable copy of the attribution notices contained
+ within such NOTICE file, excluding those notices that do not
+ pertain to any part of the Derivative Works, in at least one
+ of the following places: within a NOTICE text file distributed
+ as part of the Derivative Works; within the Source form or
+ documentation, if provided along with the Derivative Works; or,
+ within a display generated by the Derivative Works, if and
+ wherever such third-party notices normally appear. The contents
+ of the NOTICE file are for informational purposes only and
+ do not modify the License. You may add Your own attribution
+ notices within Derivative Works that You distribute, alongside
+ or as an addendum to the NOTICE text from the Work, provided
+ that such additional attribution notices cannot be construed
+ as modifying the License.
+
+ You may add Your own copyright statement to Your modifications and
+ may provide additional or different license terms and conditions
+ for use, reproduction, or distribution of Your modifications, or
+ for any such Derivative Works as a whole, provided Your use,
+ reproduction, and distribution of the Work otherwise complies with
+ the conditions stated in this License.
+
+5. Submission of Contributions. Unless You explicitly state otherwise,
+ any Contribution intentionally submitted for inclusion in the Work
+ by You to the Licensor shall be under the terms and conditions of
+ this License, without any additional terms or conditions.
+ Notwithstanding the above, nothing herein shall supersede or modify
+ the terms of any separate license agreement you may have executed
+ with Licensor regarding such Contributions.
+
+6. Trademarks. This License does not grant permission to use the trade
+ names, trademarks, service marks, or product names of the Licensor,
+ except as required for reasonable and customary use in describing the
+ origin of the Work and reproducing the content of the NOTICE file.
+
+7. Disclaimer of Warranty. Unless required by applicable law or
+ agreed to in writing, Licensor provides the Work (and each
+ Contributor provides its Contributions) on an "AS IS" BASIS,
+ WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or
+ implied, including, without limitation, any warranties or conditions
+ of TITLE, NON-INFRINGEMENT, MERCHANTABILITY, or FITNESS FOR A
+ PARTICULAR PURPOSE. You are solely responsible for determining the
+ appropriateness of using or redistributing the Work and assume any
+ risks associated with Your exercise of permissions under this License.
+
+8. Limitation of Liability. In no event and under no legal theory,
+ whether in tort (including negligence), contract, or otherwise,
+ unless required by applicable law (such as deliberate and grossly
+ negligent acts) or agreed to in writing, shall any Contributor be
+ liable to You for damages, including any direct, indirect, special,
+ incidental, or consequential damages of any character arising as a
+ result of this License or out of the use or inability to use the
+ Work (including but not limited to damages for loss of goodwill,
+ work stoppage, computer failure or malfunction, or any and all
+ other commercial damages or losses), even if such Contributor
+ has been advised of the possibility of such damages.
+
+9. Accepting Warranty or Additional Liability. While redistributing
+ the Work or Derivative Works thereof, You may choose to offer,
+ and charge a fee for, acceptance of support, warranty, indemnity,
+ or other liability obligations and/or rights consistent with this
+ License. However, in accepting such obligations, You may act only
+ on Your own behalf and on Your sole responsibility, not on behalf
+ of any other Contributor, and only if You agree to indemnify,
+ defend, and hold each Contributor harmless for any liability
+ incurred by, or claims asserted against, such Contributor by reason
+ of your accepting any such warranty or additional liability.
+
+END OF TERMS AND CONDITIONS
+
+APPENDIX: How to apply the Apache License to your work.
+
+ To apply the Apache License to your work, attach the following
+ boilerplate notice, with the fields enclosed by brackets "[]"
+ replaced with your own identifying information. (Don't include
+ the brackets!) The text should be enclosed in the appropriate
+ comment syntax for the file format. We also recommend that a
+ file or class name and description of purpose be included on the
+ same "printed page" as the copyright notice for easier
+ identification within third-party archives.
+
+Copyright [yyyy] [name of copyright owner]
+
+Licensed under the Apache License, Version 2.0 (the "License");
+you may not use this file except in compliance with the License.
+You may obtain a copy of the License at
+
+ http://www.apache.org/licenses/LICENSE-2.0
+
+Unless required by applicable law or agreed to in writing, software
+distributed under the License is distributed on an "AS IS" BASIS,
+WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+See the License for the specific language governing permissions and
+limitations under the License.
diff --git a/third_party/rust/url/LICENSE-MIT b/third_party/rust/url/LICENSE-MIT
new file mode 100644
index 000000000..24de6b418
--- /dev/null
+++ b/third_party/rust/url/LICENSE-MIT
@@ -0,0 +1,25 @@
+Copyright (c) 2013-2016 The rust-url developers
+
+Permission is hereby granted, free of charge, to any
+person obtaining a copy of this software and associated
+documentation files (the "Software"), to deal in the
+Software without restriction, including without
+limitation the rights to use, copy, modify, merge,
+publish, distribute, sublicense, and/or sell copies of
+the Software, and to permit persons to whom the Software
+is furnished to do so, subject to the following
+conditions:
+
+The above copyright notice and this permission notice
+shall be included in all copies or substantial portions
+of the Software.
+
+THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF
+ANY KIND, EXPRESS OR IMPLIED, INCLUDING BUT NOT LIMITED
+TO THE WARRANTIES OF MERCHANTABILITY, FITNESS FOR A
+PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT
+SHALL THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY
+CLAIM, DAMAGES OR OTHER LIABILITY, WHETHER IN AN ACTION
+OF CONTRACT, TORT OR OTHERWISE, ARISING FROM, OUT OF OR
+IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER
+DEALINGS IN THE SOFTWARE.
diff --git a/third_party/rust/url/Makefile b/third_party/rust/url/Makefile
new file mode 100644
index 000000000..c6f1ff0c9
--- /dev/null
+++ b/third_party/rust/url/Makefile
@@ -0,0 +1,5 @@
+test:
+ cargo test --features "query_encoding serde rustc-serialize"
+ [ x$$TRAVIS_RUST_VERSION != xnightly ] || cargo test --features heapsize
+
+.PHONY: test
diff --git a/third_party/rust/url/README.md b/third_party/rust/url/README.md
new file mode 100644
index 000000000..0721254af
--- /dev/null
+++ b/third_party/rust/url/README.md
@@ -0,0 +1,10 @@
+rust-url
+========
+
+[![Travis build Status](https://travis-ci.org/servo/rust-url.svg?branch=master)](https://travis-ci.org/servo/rust-url) [![Appveyor build status](https://ci.appveyor.com/api/projects/status/ulkqx2xcemyod6xa?svg=true)](https://ci.appveyor.com/project/Manishearth/rust-url)
+
+URL library for Rust, based on the [URL Standard](https://url.spec.whatwg.org/).
+
+[Documentation](https://docs.rs/url/)
+
+Please see [UPGRADING.md](https://github.com/servo/rust-url/blob/master/UPGRADING.md) if you are upgrading from 0.x to 1.x.
diff --git a/third_party/rust/url/UPGRADING.md b/third_party/rust/url/UPGRADING.md
new file mode 100644
index 000000000..f156130f6
--- /dev/null
+++ b/third_party/rust/url/UPGRADING.md
@@ -0,0 +1,263 @@
+# Guide to upgrading from url 0.x to 1.x
+
+* The fields of `Url` are now private because the `Url` constructor, parser,
+ and setters maintain invariants that could be violated if you were to set the fields directly.
+ Instead of accessing, for example, `url.scheme`, use the getter method, such as `url.scheme()`.
+ Instead of assigning directly to a field, for example `url.scheme = "https".to_string()`,
+ use the setter method, such as `url.set_scheme("https").unwrap()`.
+ (Some setters validate the new value and return a `Result` that must be used).
+
+* The methods of `Url` now return `&str` instead of `String`,
+ thus reducing allocations and making serialization cheap.
+
+* The `path()` method on `url::Url` instances used to return `Option<&[String]>`;
+ now it returns `&str`.
+ If you would like functionality more similar to the old behavior of `path()`,
+ use `path_segments()` that returns `Option<str::Split<char>>`.
+
+ Before upgrading:
+
+ ```rust
+ let issue_list_url = Url::parse(
+ "https://github.com/rust-lang/rust/issues?labels=E-easy&state=open"
+ ).unwrap();
+ assert_eq!(issue_list_url.path(), Some(&["rust-lang".to_string(),
+ "rust".to_string(),
+ "issues".to_string()][..]));
+ ```
+
+ After upgrading:
+
+ ```rust
+ let issue_list_url = Url::parse(
+ "https://github.com/rust-lang/rust/issues?labels=E-easy&state=open"
+ ).unwrap();
+ assert_eq!(issue_list_url.path(), "/rust-lang/rust/issues");
+ assert_eq!(issue_list_url.path_segments().map(|c| c.collect::<Vec<_>>()),
+ Some(vec!["rust-lang", "rust", "issues"]));
+ ```
+
+* The `path_mut()` method on `url::Url` instances that allowed modification of a URL's path
+ has been replaced by `path_segments_mut()`.
+
+ Before upgrading:
+
+ ```rust
+ let mut url = Url::parse("https://github.com/rust-lang/rust").unwrap();
+ url.path_mut().unwrap().push("issues");
+ ```
+
+ After upgrading:
+
+ ```rust
+ let mut url = Url::parse("https://github.com/rust-lang/rust").unwrap();
+ url.path_segments_mut().unwrap().push("issues");
+ ```
+
+* The `domain_mut()` method on `url::Url` instances that allowed modification of a URL's domain
+ has been replaced by `set_host()` and `set_ip_host()`.
+
+* The `host()` method on `url::Url` instances used to return `Option<&Host>`;
+ now it returns `Option<Host<&str>>`.
+ The `serialize_host()` method that returned `Option<String>`
+ has been replaced by the `host_str()` method that returns `Option<&str>`.
+
+* The `serialize()` method on `url::Url` instances that returned `String`
+ has been replaced by an `as_str()` method that returns `&str`.
+
+ Before upgrading:
+
+ ```rust
+ let this_document = Url::parse("http://servo.github.io/rust-url/url/index.html").unwrap();
+ assert_eq!(this_document.serialize(), "http://servo.github.io/rust-url/url/index.html".to_string());
+ ```
+
+ After upgrading:
+
+ ```rust
+ let this_document = Url::parse("http://servo.github.io/rust-url/url/index.html").unwrap();
+ assert_eq!(this_document.as_str(), "http://servo.github.io/rust-url/url/index.html");
+ ```
+
+* `url::UrlParser` has been replaced by `url::Url::parse()` and `url::Url::join()`.
+
+ Before upgrading:
+
+ ```rust
+ let this_document = Url::parse("http://servo.github.io/rust-url/url/index.html").unwrap();
+ let css_url = UrlParser::new().base_url(&this_document).parse("../main.css").unwrap();
+ assert_eq!(css_url.serialize(), "http://servo.github.io/rust-url/main.css".to_string());
+ ```
+
+ After upgrading:
+
+ ```rust
+ let this_document = Url::parse("http://servo.github.io/rust-url/url/index.html").unwrap();
+ let css_url = this_document.join("../main.css").unwrap();
+ assert_eq!(css_url.as_str(), "http://servo.github.io/rust-url/main.css");
+ ```
+
+* `url::parse_path()` and `url::UrlParser::parse_path()` have been removed without replacement.
+ As a workaround, you can give a base URL that you then ignore to `url::Url::parse()`.
+
+ Before upgrading:
+
+ ```rust
+ let (path, query, fragment) = url::parse_path("/foo/bar/../baz?q=42").unwrap();
+ assert_eq!(path, vec!["foo".to_string(), "baz".to_string()]);
+ assert_eq!(query, Some("q=42".to_string()));
+ assert_eq!(fragment, None);
+ ```
+
+ After upgrading:
+
+ ```rust
+ let base = Url::parse("http://example.com").unwrap();
+ let with_path = base.join("/foo/bar/../baz?q=42").unwrap();
+ assert_eq!(with_path.path(), "/foo/baz");
+ assert_eq!(with_path.query(), Some("q=42"));
+ assert_eq!(with_path.fragment(), None);
+ ```
+
+* The `url::form_urlencoded::serialize()` method
+ has been replaced with the `url::form_urlencoded::Serializer` struct.
+ Instead of calling `serialize()` with key/value pairs,
+ create a new `Serializer` with a new string,
+ call the `extend_pairs()` method on the `Serializer` instance with the key/value pairs as the argument,
+ then call `finish()`.
+
+ Before upgrading:
+
+ ```rust
+ let form = url::form_urlencoded::serialize(form.iter().map(|(k, v)| {
+ (&k[..], &v[..])
+ }));
+ ```
+
+ After upgrading:
+
+ ```rust
+ let form = url::form_urlencoded::Serializer::new(String::new()).extend_pairs(
+ form.iter().map(|(k, v)| { (&k[..], &v[..]) })
+ ).finish();
+ ```
+
+* The `set_query_from_pairs()` method on `url::Url` instances that took key/value pairs
+ has been replaced with `query_pairs_mut()`, which allows you to modify the `url::Url`'s query pairs.
+
+ Before upgrading:
+
+ ```rust
+ let mut url = Url::parse("https://duckduckgo.com/").unwrap();
+ let pairs = vec![
+ ("q", "test"),
+ ("ia", "images"),
+ ];
+ url.set_query_from_pairs(pairs.iter().map(|&(k, v)| {
+ (&k[..], &v[..])
+ }));
+ ```
+
+ After upgrading:
+
+ ```rust
+ let mut url = Url::parse("https://duckduckgo.com/").unwrap();
+ let pairs = vec![
+ ("q", "test"),
+ ("ia", "images"),
+ ];
+ url.query_pairs_mut().clear().extend_pairs(
+ pairs.iter().map(|&(k, v)| { (&k[..], &v[..]) })
+ );
+ ```
+
+* `url::SchemeData`, its variants `Relative` and `NonRelative`,
+ and the struct `url::RelativeSchemeData` have been removed.
+ Instead of matching on these variants
+ to determine if you have a URL in a relative scheme such as HTTP
+ versus a URL in a non-relative scheme such as data,
+ use the `cannot_be_a_base()` method to determine which kind you have.
+
+ Before upgrading:
+
+ ```rust
+ match url.scheme_data {
+ url::SchemeData::Relative(..) => {}
+ url::SchemeData::NonRelative(..) => {
+ return Err(human(format!("`{}` must have relative scheme \
+ data: {}", field, url)))
+ }
+ }
+ ```
+
+ After upgrading:
+
+ ```rust
+ if url.cannot_be_a_base() {
+ return Err(human(format!("`{}` must have relative scheme \
+ data: {}", field, url)))
+ }
+ ```
+
+* The function `url::whatwg_scheme_type_mapper()`, the `SchemeType` enum,
+ and the `scheme_type_mapper()` method on `url::UrlParser` instances have been removed.
+ `SchemeType` had a method for getting the `default_port()`;
+ to replicate this functionality, use the method `port_or_known_default()` on `url::Url` instances.
+ The `port_or_default()` method on `url::Url` instances has been removed;
+ use `port_or_known_default()` instead.
+
+ Before upgrading:
+
+ ```rust
+ let port = match whatwg_scheme_type_mapper(&url.scheme) {
+ SchemeType::Relative(port) => port,
+ _ => return Err(format!("Invalid special scheme: `{}`",
+ raw_url.scheme)),
+ };
+ ```
+
+ After upgrading:
+
+ ```rust
+ let port = match url.port_or_known_default() {
+ Some(port) => port,
+ _ => return Err(format!("Invalid special scheme: `{}`",
+ url.scheme())),
+ };
+ ```
+
+* The following formatting utilities have been removed without replacement;
+ look at their linked previous implementations
+ if you would like to replicate the functionality in your code:
+ * [`url::format::PathFormatter`](https://github.com/servo/rust-url/pull/176/commits/9e759f18726c8e1343162922b87163d4dd08fe3c#diff-0bb16ac13b75e9b568fa4aff61b0e71dL24)
+ * [`url::format::UserInfoFormatter`](https://github.com/servo/rust-url/pull/176/commits/9e759f18726c8e1343162922b87163d4dd08fe3c#diff-0bb16ac13b75e9b568fa4aff61b0e71dL50)
+ * [`url::format::UrlNoFragmentFormatter`](https://github.com/servo/rust-url/pull/176/commits/9e759f18726c8e1343162922b87163d4dd08fe3c#diff-0bb16ac13b75e9b568fa4aff61b0e71dL70)
+
+* `url::percent_encoding::percent_decode()` used to have a return type of `Vec<u8>`;
+ now it returns an iterator of decoded `u8` bytes that also implements `Into<Cow<[u8]>>`.
+ Use `.into().into_owned()` to obtain a `Vec<u8>`.
+ (`.collect()` also works but might not be as efficient.)
+
+* The `url::percent_encoding::EncodeSet` struct and constant instances
+ used with `url::percent_encoding::percent_encode()`
+ have been changed to structs that implement the trait `url::percent_encoding::EncodeSet`.
+ * `SIMPLE_ENCODE_SET`, `QUERY_ENCODE_SET`, `DEFAULT_ENCODE_SET`,
+ and `USERINFO_ENCODE_SET` have the same behavior.
+ * `USERNAME_ENCODE_SET` and `PASSWORD_ENCODE_SET` have been removed;
+ use `USERINFO_ENCODE_SET` instead.
+ * `HTTP_VALUE_ENCODE_SET` has been removed;
+ an implementation of it in the new types can be found [in hyper's source](
+ https://github.com/hyperium/hyper/blob/67436c5bf615cf5a55a71e32b788afef5985570e/src/header/parsing.rs#L131-L138)
+ if you need to replicate this functionality in your code.
+ * `FORM_URLENCODED_ENCODE_SET` has been removed;
+ instead, use the functionality in `url::form_urlencoded`.
+ * `PATH_SEGMENT_ENCODE_SET` has been added for use on '/'-separated path segments.
+
+* `url::percent_encoding::percent_decode_to()` has been removed.
+ Use `url::percent_encoding::percent_decode()` which returns an iterator.
+ You can then use the iterator’s `collect()` method
+ or give it to some data structure’s `extend()` method.
+* A number of `ParseError` variants have changed.
+ [See the documentation for the current set](http://servo.github.io/rust-url/url/enum.ParseError.html).
+* `url::OpaqueOrigin::new()` and `url::Origin::UID(OpaqueOrigin)`
+ have been replaced by `url::Origin::new_opaque()` and `url::Origin::Opaque(OpaqueOrigin)`, respectively.
diff --git a/third_party/rust/url/appveyor.yml b/third_party/rust/url/appveyor.yml
new file mode 100644
index 000000000..5819d38b1
--- /dev/null
+++ b/third_party/rust/url/appveyor.yml
@@ -0,0 +1,13 @@
+install:
+ - ps: Start-FileDownload 'https://static.rust-lang.org/dist/rust-nightly-i686-pc-windows-gnu.exe'
+ - rust-nightly-i686-pc-windows-gnu.exe /VERYSILENT /NORESTART /DIR="C:\Program Files (x86)\Rust"
+ - SET PATH=%PATH%;C:\Program Files (x86)\Rust\bin
+ - rustc -V
+ - cargo -V
+ - git submodule update --init --recursive
+
+build: false
+
+test_script:
+ - cargo build
+ - cargo test --verbose
diff --git a/third_party/rust/url/docs/.nojekyll b/third_party/rust/url/docs/.nojekyll
new file mode 100644
index 000000000..e69de29bb
--- /dev/null
+++ b/third_party/rust/url/docs/.nojekyll
diff --git a/third_party/rust/url/docs/404.html b/third_party/rust/url/docs/404.html
new file mode 100644
index 000000000..b13eac0ee
--- /dev/null
+++ b/third_party/rust/url/docs/404.html
@@ -0,0 +1,3 @@
+<meta http-equiv="refresh" content="0; url=https://docs.rs/url/">
+<link rel="canonical" href="https://docs.rs/url/">
+<a href="https://docs.rs/url/">Moved to docs.rs</a>
diff --git a/third_party/rust/url/docs/index.html b/third_party/rust/url/docs/index.html
new file mode 100644
index 000000000..b13eac0ee
--- /dev/null
+++ b/third_party/rust/url/docs/index.html
@@ -0,0 +1,3 @@
+<meta http-equiv="refresh" content="0; url=https://docs.rs/url/">
+<link rel="canonical" href="https://docs.rs/url/">
+<a href="https://docs.rs/url/">Moved to docs.rs</a>
diff --git a/third_party/rust/url/github.png b/third_party/rust/url/github.png
new file mode 100644
index 000000000..b2c327097
--- /dev/null
+++ b/third_party/rust/url/github.png
Binary files differ
diff --git a/third_party/rust/url/rust-url-todo b/third_party/rust/url/rust-url-todo
new file mode 100644
index 000000000..6aeefbf13
--- /dev/null
+++ b/third_party/rust/url/rust-url-todo
@@ -0,0 +1,14 @@
+* standalone path parsing?
+* Test setters
+ * Test trim C0/space
+ * Test remove tab & newline
+
+
+
+#[test]
+fn test_path_segments() {
+ let mut url = Url::parse("http://example.net").unwrap();
+ url.push_path_segment("foo").unwrap();
+ url.extend_path_segments(&["bar", "b/az"]).unwrap();
+ assert_eq!(url.as_str(), "http://example.net/foo");
+}
diff --git a/third_party/rust/url/src/encoding.rs b/third_party/rust/url/src/encoding.rs
new file mode 100644
index 000000000..0703c788f
--- /dev/null
+++ b/third_party/rust/url/src/encoding.rs
@@ -0,0 +1,135 @@
+// Copyright 2013-2014 The rust-url developers.
+//
+// Licensed under the Apache License, Version 2.0 <LICENSE-APACHE or
+// http://www.apache.org/licenses/LICENSE-2.0> or the MIT license
+// <LICENSE-MIT or http://opensource.org/licenses/MIT>, at your
+// option. This file may not be copied, modified, or distributed
+// except according to those terms.
+
+
+//! Abstraction that conditionally compiles either to rust-encoding,
+//! or to only support UTF-8.
+
+#[cfg(feature = "query_encoding")] extern crate encoding;
+
+use std::borrow::Cow;
+
+#[cfg(feature = "query_encoding")] use self::encoding::types::{DecoderTrap, EncoderTrap};
+#[cfg(feature = "query_encoding")] use self::encoding::label::encoding_from_whatwg_label;
+#[cfg(feature = "query_encoding")] pub use self::encoding::types::EncodingRef;
+
+/// Character encoding applied to names and values (`query_encoding` build).
+///
+/// Wraps an optional `EncodingRef`; UTF-8 is represented as `None`.
+#[cfg(feature = "query_encoding")]
+#[derive(Copy, Clone)]
+pub struct EncodingOverride {
+ /// `None` means UTF-8.
+ encoding: Option<EncodingRef>
+}
+
+#[cfg(feature = "query_encoding")]
+impl EncodingOverride {
+    /// Build an override from an optional encoding; `None` selects UTF-8.
+    pub fn from_opt_encoding(encoding: Option<EncodingRef>) -> Self {
+        match encoding {
+            Some(encoding) => Self::from_encoding(encoding),
+            None => Self::utf8(),
+        }
+    }
+
+    /// Build an override from an encoding.
+    /// An encoding named `"utf-8"` is stored as `None`.
+    pub fn from_encoding(encoding: EncodingRef) -> Self {
+        let is_utf8 = encoding.name() == "utf-8";
+        EncodingOverride {
+            encoding: if is_utf8 { None } else { Some(encoding) }
+        }
+    }
+
+    /// The UTF-8 override.
+    #[inline]
+    pub fn utf8() -> Self {
+        EncodingOverride { encoding: None }
+    }
+
+    /// Look up an encoding by its label, given as bytes.
+    /// Returns `None` when the label is not valid UTF-8 or is not a known label.
+    pub fn lookup(label: &[u8]) -> Option<Self> {
+        // Don't use String::from_utf8_lossy since no encoding label contains U+FFFD
+        // https://encoding.spec.whatwg.org/#names-and-labels
+        match ::std::str::from_utf8(label) {
+            Ok(label) => encoding_from_whatwg_label(label).map(Self::from_encoding),
+            Err(_) => None,
+        }
+    }
+
+    /// https://encoding.spec.whatwg.org/#get-an-output-encoding
+    ///
+    /// UTF-16LE and UTF-16BE are replaced by UTF-8; anything else is kept.
+    pub fn to_output_encoding(self) -> Self {
+        let is_utf16 = match self.encoding {
+            Some(encoding) => matches!(encoding.name(), "utf-16le" | "utf-16be"),
+            None => false,
+        };
+        if is_utf16 {
+            Self::utf8()
+        } else {
+            self
+        }
+    }
+
+    /// Whether this override is UTF-8.
+    pub fn is_utf8(&self) -> bool {
+        match self.encoding {
+            None => true,
+            Some(_) => false,
+        }
+    }
+
+    /// The name of the encoding; `"utf-8"` when no encoding is stored.
+    pub fn name(&self) -> &'static str {
+        self.encoding.map_or("utf-8", |encoding| encoding.name())
+    }
+
+    /// Decode bytes into a string, replacing undecodable input.
+    pub fn decode<'a>(&self, input: Cow<'a, [u8]>) -> Cow<'a, str> {
+        let encoding = match self.encoding {
+            None => return decode_utf8_lossy(input),
+            Some(encoding) => encoding,
+        };
+        // `encoding.decode` never returns `Err` when called with `DecoderTrap::Replace`
+        let decoded = encoding.decode(&input, DecoderTrap::Replace).unwrap();
+        decoded.into()
+    }
+
+    /// Encode a string into bytes, NCR-escaping unencodable characters.
+    pub fn encode<'a>(&self, input: Cow<'a, str>) -> Cow<'a, [u8]> {
+        let encoding = match self.encoding {
+            None => return encode_utf8(input),
+            Some(encoding) => encoding,
+        };
+        // `encoding.encode` never returns `Err` when called with `EncoderTrap::NcrEscape`
+        let encoded = encoding.encode(&input, EncoderTrap::NcrEscape).unwrap();
+        Cow::Owned(encoded)
+    }
+}
+
+
+/// UTF-8-only stand-in used when the `query_encoding` feature is disabled.
+#[cfg(not(feature = "query_encoding"))]
+#[derive(Copy, Clone)]
+pub struct EncodingOverride;
+
+#[cfg(not(feature = "query_encoding"))]
+impl EncodingOverride {
+    /// The UTF-8 override, the only one available in this configuration.
+    #[inline]
+    pub fn utf8() -> Self {
+        EncodingOverride
+    }
+
+    /// Decode bytes as UTF-8, replacing invalid sequences.
+    pub fn decode<'a>(&self, input: Cow<'a, [u8]>) -> Cow<'a, str> {
+        let decoded = decode_utf8_lossy(input);
+        decoded
+    }
+
+    /// Encode a string as its UTF-8 bytes.
+    pub fn encode<'a>(&self, input: Cow<'a, str>) -> Cow<'a, [u8]> {
+        let encoded = encode_utf8(input);
+        encoded
+    }
+}
+
+/// Decode `input` as UTF-8, replacing invalid sequences with U+FFFD.
+///
+/// Borrowed input is handed to `String::from_utf8_lossy`.
+/// Owned input that is already valid UTF-8 is converted in place,
+/// so its `Vec` allocation is reused.
+pub fn decode_utf8_lossy(input: Cow<[u8]>) -> Cow<str> {
+    match input {
+        Cow::Borrowed(bytes) => String::from_utf8_lossy(bytes),
+        Cow::Owned(bytes) => match String::from_utf8(bytes) {
+            // Valid UTF-8: reuse the existing `Vec` allocation, no `unsafe` needed.
+            Ok(text) => Cow::Owned(text),
+            // Invalid UTF-8: take the bytes back and decode them lossily.
+            Err(error) => {
+                Cow::Owned(String::from_utf8_lossy(&error.into_bytes()).into_owned())
+            }
+        },
+    }
+}
+
+/// View or convert a string as its UTF-8 bytes without copying:
+/// a borrowed string stays borrowed, an owned string gives up its buffer.
+pub fn encode_utf8(input: Cow<str>) -> Cow<[u8]> {
+    let owned = match input {
+        Cow::Borrowed(text) => return Cow::Borrowed(text.as_bytes()),
+        Cow::Owned(text) => text,
+    };
+    Cow::Owned(owned.into_bytes())
+}
diff --git a/third_party/rust/url/src/form_urlencoded.rs b/third_party/rust/url/src/form_urlencoded.rs
new file mode 100644
index 000000000..f4a655507
--- /dev/null
+++ b/third_party/rust/url/src/form_urlencoded.rs
@@ -0,0 +1,364 @@
+// Copyright 2013-2016 The rust-url developers.
+//
+// Licensed under the Apache License, Version 2.0 <LICENSE-APACHE or
+// http://www.apache.org/licenses/LICENSE-2.0> or the MIT license
+// <LICENSE-MIT or http://opensource.org/licenses/MIT>, at your
+// option. This file may not be copied, modified, or distributed
+// except according to those terms.
+
+//! Parser and serializer for the [`application/x-www-form-urlencoded` syntax](
+//! http://url.spec.whatwg.org/#application/x-www-form-urlencoded),
+//! as used by HTML forms.
+//!
+//! Converts between a string (such as an URL’s query string)
+//! and a sequence of (name, value) pairs.
+
+use encoding::EncodingOverride;
+use percent_encoding::{percent_encode_byte, percent_decode};
+use std::borrow::{Borrow, Cow};
+use std::str;
+
+
+/// Parse a byte string in the `application/x-www-form-urlencoded` syntax
+/// into an iterator of (name, value) pairs, decoding them as UTF-8.
+///
+/// Use `parse(input.as_bytes())` to parse a `&str` string.
+///
+/// Names and values are percent-decoded. For instance, `%23first=%25try%25` will be
+/// converted to `[("#first", "%try%")]`.
+#[inline]
+pub fn parse(input: &[u8]) -> Parse {
+    let utf8 = EncodingOverride::utf8();
+    Parse {
+        input: input,
+        encoding: utf8,
+    }
+}
+
+
+/// Parse a byte string in the `application/x-www-form-urlencoded` syntax
+/// into an iterator of (name, value) pairs, with a caller-chosen encoding.
+///
+/// Use `parse(input.as_bytes())` to parse a `&str` string.
+///
+/// This function is only available if the `query_encoding` Cargo feature is enabled.
+///
+/// Arguments:
+///
+/// * `encoding_override`: The character encoding each name and value is decoded as
+///   after percent-decoding. Defaults to UTF-8.
+/// * `use_charset`: The *use _charset_ flag*. If in doubt, set to `false`.
+///
+/// Returns `Err(())` when the encoding is not UTF-8 and `input` is not ASCII.
+#[cfg(feature = "query_encoding")]
+pub fn parse_with_encoding<'a>(input: &'a [u8],
+                               encoding_override: Option<::encoding::EncodingRef>,
+                               use_charset: bool)
+                               -> Result<Parse<'a>, ()> {
+    use std::ascii::AsciiExt;
+
+    let mut encoding = EncodingOverride::from_opt_encoding(encoding_override);
+    if !encoding.is_utf8() && !input.is_ascii() {
+        return Err(())
+    }
+    if use_charset {
+        // No '+' in "_charset_" to replace with ' '.
+        let prefix = b"_charset_=";
+        // Skip replacing '+' with ' ' in the value since no encoding label contains either:
+        // https://encoding.spec.whatwg.org/#names-and-labels
+        let from_charset = input
+            .split(|&b| b == b'&')
+            .filter(|sequence| sequence.starts_with(prefix))
+            .filter_map(|sequence| EncodingOverride::lookup(&sequence[prefix.len()..]))
+            .next();
+        // The first `_charset_` pair naming a known encoding wins.
+        if let Some(found) = from_charset {
+            encoding = found;
+        }
+    }
+    Ok(Parse {
+        input: input,
+        encoding: encoding,
+    })
+}
+
+/// The return type of `parse()`.
+///
+/// An iterator over the (name, value) pairs found in `input`.
+#[derive(Copy, Clone)]
+pub struct Parse<'a> {
+ // Bytes that the iterator has not consumed yet.
+ input: &'a [u8],
+ // Encoding used to decode each name and value.
+ encoding: EncodingOverride,
+}
+
+impl<'a> Iterator for Parse<'a> {
+    type Item = (Cow<'a, str>, Cow<'a, str>);
+
+    /// Yield the next decoded (name, value) pair.
+    /// Empty sequences between `&` separators are skipped.
+    fn next(&mut self) -> Option<Self::Item> {
+        while !self.input.is_empty() {
+            let input = self.input;
+            // Cut off everything up to the next '&' and keep the rest for later calls.
+            let (sequence, rest) = match input.iter().position(|&b| b == b'&') {
+                Some(at) => (&input[..at], &input[at + 1..]),
+                None => (input, &[][..]),
+            };
+            self.input = rest;
+            if sequence.is_empty() {
+                continue
+            }
+            // The name ends at the first '='; a missing '=' means an empty value.
+            let (name, value) = match sequence.iter().position(|&b| b == b'=') {
+                Some(at) => (&sequence[..at], &sequence[at + 1..]),
+                None => (sequence, &[][..]),
+            };
+            return Some((decode(name, self.encoding), decode(value, self.encoding)))
+        }
+        None
+    }
+}
+
+/// Decode one name or value: `+` becomes a space, percent-escapes are
+/// resolved, and the resulting bytes are decoded with `encoding`.
+fn decode(input: &[u8], encoding: EncodingOverride) -> Cow<str> {
+    let replaced = replace_plus(input);
+    let unescaped = match percent_decode(&replaced).if_any() {
+        Some(vec) => Cow::Owned(vec),
+        None => replaced,
+    };
+    encoding.decode(unescaped)
+}
+
+/// Replace every b'+' with b' '.
+///
+/// Input without any b'+' is returned borrowed, without allocating.
+fn replace_plus<'a>(input: &'a [u8]) -> Cow<'a, [u8]> {
+    if !input.contains(&b'+') {
+        return Cow::Borrowed(input)
+    }
+    let spaced: Vec<u8> = input
+        .iter()
+        .map(|&byte| if byte == b'+' { b' ' } else { byte })
+        .collect();
+    Cow::Owned(spaced)
+}
+
+impl<'a> Parse<'a> {
+ /// Return a new iterator that yields pairs of `String` instead of pairs of `Cow<str>`.
+ ///
+ /// The returned `ParseIntoOwned` wraps this iterator and continues from its current position.
+ pub fn into_owned(self) -> ParseIntoOwned<'a> {
+ ParseIntoOwned { inner: self }
+ }
+}
+
+/// Like `Parse`, but yields pairs of `String` instead of pairs of `Cow<str>`.
+pub struct ParseIntoOwned<'a> {
+ // The borrowing iterator whose items are converted to owned strings.
+ inner: Parse<'a>
+}
+
+impl<'a> Iterator for ParseIntoOwned<'a> {
+    type Item = (String, String);
+
+    /// Take the next pair from the wrapped `Parse` and make both halves owned.
+    fn next(&mut self) -> Option<Self::Item> {
+        match self.inner.next() {
+            Some((name, value)) => Some((name.into_owned(), value.into_owned())),
+            None => None,
+        }
+    }
+}
+
+/// The [`application/x-www-form-urlencoded` byte serializer](
+/// https://url.spec.whatwg.org/#concept-urlencoded-byte-serializer).
+///
+/// Returns an iterator of `&str` slices; concatenating them gives the serialization.
+pub fn byte_serialize(input: &[u8]) -> ByteSerialize {
+    ByteSerialize { bytes: input }
+}
+
+/// Return value of `byte_serialize()`.
+pub struct ByteSerialize<'a> {
+ // Input bytes that have not been serialized yet.
+ bytes: &'a [u8],
+}
+
+/// Whether the byte serializer emits `byte` as-is:
+/// ASCII letters and digits, and `*`, `-`, `.`, `_`.
+fn byte_serialized_unchanged(byte: u8) -> bool {
+    let is_digit = b'0' <= byte && byte <= b'9';
+    let is_upper = b'A' <= byte && byte <= b'Z';
+    let is_lower = b'a' <= byte && byte <= b'z';
+    let is_punctuation = byte == b'*' || byte == b'-' || byte == b'.' || byte == b'_';
+    is_digit || is_upper || is_lower || is_punctuation
+}
+
+impl<'a> Iterator for ByteSerialize<'a> {
+    type Item = &'a str;
+
+    /// Yield either the replacement for one byte that must change
+    /// (`"+"` for a space, a percent-escape otherwise),
+    /// or the longest run of leading bytes that are emitted unchanged.
+    fn next(&mut self) -> Option<&'a str> {
+        let bytes = self.bytes;
+        let first = match bytes.first() {
+            Some(&byte) => byte,
+            None => return None,
+        };
+        if !byte_serialized_unchanged(first) {
+            self.bytes = &bytes[1..];
+            return Some(match first {
+                b' ' => "+",
+                other => percent_encode_byte(other),
+            })
+        }
+        // `first` is unchanged, so the run is at least one byte long.
+        let run_length = bytes
+            .iter()
+            .position(|&b| !byte_serialized_unchanged(b))
+            .unwrap_or(bytes.len());
+        let (unchanged_slice, remaining) = bytes.split_at(run_length);
+        self.bytes = remaining;
+        // Every byte accepted by `byte_serialized_unchanged` is ASCII,
+        // so the run is valid UTF-8.
+        Some(unsafe { str::from_utf8_unchecked(unchanged_slice) })
+    }
+
+    /// At least one item if any input is left, at most one item per byte.
+    fn size_hint(&self) -> (usize, Option<usize>) {
+        match self.bytes.len() {
+            0 => (0, Some(0)),
+            remaining => (1, Some(remaining)),
+        }
+    }
+}
+
+/// The [`application/x-www-form-urlencoded` serializer](
+/// https://url.spec.whatwg.org/#concept-urlencoded-serializer).
+pub struct Serializer<T: Target> {
+ // The output being written to; `finish()` takes it, leaving `None`.
+ target: Option<T>,
+ // Byte offset in the target string where the serialized pairs start.
+ start_position: usize,
+ // Encoding applied to names and values before byte serialization.
+ encoding: EncodingOverride,
+}
+
+/// An output that a `Serializer` can append to.
+pub trait Target {
+ /// The string that serialized pairs are appended to.
+ fn as_mut_string(&mut self) -> &mut String;
+ /// Consume the target and produce the value returned by `Serializer::finish`.
+ fn finish(self) -> Self::Finished;
+ /// The type returned by `finish`.
+ type Finished;
+}
+
+// An owned `String` is written to directly and handed back by `finish`.
+impl Target for String {
+ fn as_mut_string(&mut self) -> &mut String { self }
+ fn finish(self) -> Self { self }
+ type Finished = Self;
+}
+
+// A borrowed `String` is written to in place; `finish` returns the same borrow.
+impl<'a> Target for &'a mut String {
+ fn as_mut_string(&mut self) -> &mut String { &mut **self }
+ fn finish(self) -> Self { self }
+ type Finished = Self;
+}
+
+// `as_mut_string` here exposes the internal serialization of an `Url`,
+// which should not be exposed to users.
+// We achieve that by not giving users direct access to `UrlQuery`:
+// * Its fields are private
+// (and so it can not be constructed with struct literal syntax outside of this crate),
+// * It has no constructor
+// * It is only visible (on the type level) to users in the return type of
+// `Url::query_pairs_mut` which is `Serializer<UrlQuery>`
+// * `Serializer` keeps its target in a private field
+// * Unlike in other `Target` impls, `UrlQuery::finish` does not return `Self`.
+impl<'a> Target for ::UrlQuery<'a> {
+ fn as_mut_string(&mut self) -> &mut String { &mut self.url.serialization }
+ fn finish(self) -> &'a mut ::Url { self.url }
+ type Finished = &'a mut ::Url;
+}
+
+impl<T: Target> Serializer<T> {
+ /// Create a new `application/x-www-form-urlencoded` serializer for the given target.
+ ///
+ /// If the target is non-empty,
+ /// its content is assumed to already be in `application/x-www-form-urlencoded` syntax.
+ pub fn new(target: T) -> Self {
+ Self::for_suffix(target, 0)
+ }
+
+ /// Create a new `application/x-www-form-urlencoded` serializer
+ /// for a suffix of the given target.
+ ///
+ /// If that suffix is non-empty,
+ /// its content is assumed to already be in `application/x-www-form-urlencoded` syntax.
+ ///
+ /// Panics if `start_position` is not a valid slicing index into the target string.
+ pub fn for_suffix(mut target: T, start_position: usize) -> Self {
+ &target.as_mut_string()[start_position..]; // Panic if out of bounds
+ Serializer {
+ target: Some(target),
+ start_position: start_position,
+ encoding: EncodingOverride::utf8(),
+ }
+ }
+
+ /// Remove any existing name/value pair.
+ ///
+ /// Everything in the target string before the start position is kept.
+ ///
+ /// Panics if called after `.finish()`.
+ pub fn clear(&mut self) -> &mut Self {
+ string(&mut self.target).truncate(self.start_position);
+ self
+ }
+
+ /// Set the character encoding to be used for names and values before percent-encoding.
+ ///
+ /// `None` selects UTF-8. The encoding is first converted to its output encoding.
+ #[cfg(feature = "query_encoding")]
+ pub fn encoding_override(&mut self, new: Option<::encoding::EncodingRef>) -> &mut Self {
+ self.encoding = EncodingOverride::from_opt_encoding(new).to_output_encoding();
+ self
+ }
+
+ /// Serialize and append a name/value pair.
+ ///
+ /// Panics if called after `.finish()`.
+ pub fn append_pair(&mut self, name: &str, value: &str) -> &mut Self {
+ append_pair(string(&mut self.target), self.start_position, self.encoding, name, value);
+ self
+ }
+
+ /// Serialize and append a number of name/value pairs.
+ ///
+ /// This simply calls `append_pair` repeatedly.
+ /// This can be more convenient, so the user doesn’t need to introduce a block
+ /// to limit the scope of `Serializer`’s borrow of its string.
+ ///
+ /// Panics if called after `.finish()`.
+ pub fn extend_pairs<I, K, V>(&mut self, iter: I) -> &mut Self
+ where I: IntoIterator, I::Item: Borrow<(K, V)>, K: AsRef<str>, V: AsRef<str> {
+ // The inner block ends the borrow of `self.target` before `self` is returned.
+ {
+ let string = string(&mut self.target);
+ for pair in iter {
+ let &(ref k, ref v) = pair.borrow();
+ append_pair(string, self.start_position, self.encoding, k.as_ref(), v.as_ref());
+ }
+ }
+ self
+ }
+
+ /// Add a name/value pair whose name is `_charset_`
+ /// and whose value is the character encoding’s name.
+ /// (See the `encoding_override()` method.)
+ ///
+ /// Panics if called after `.finish()`.
+ #[cfg(feature = "query_encoding")]
+ pub fn append_charset(&mut self) -> &mut Self {
+ // The inner block ends the borrow of `self.target` before `self` is returned.
+ {
+ let string = string(&mut self.target);
+ append_separator_if_needed(string, self.start_position);
+ string.push_str("_charset_=");
+ string.push_str(self.encoding.name());
+ }
+ self
+ }
+
+ /// If this serializer was constructed with a string, take and return that string.
+ ///
+ /// ```rust
+ /// use url::form_urlencoded;
+ /// let encoded: String = form_urlencoded::Serializer::new(String::new())
+ /// .append_pair("foo", "bar & baz")
+ /// .append_pair("saison", "Été+hiver")
+ /// .finish();
+ /// assert_eq!(encoded, "foo=bar+%26+baz&saison=%C3%89t%C3%A9%2Bhiver");
+ /// ```
+ ///
+ /// Panics if called more than once.
+ pub fn finish(&mut self) -> T::Finished {
+ // `take()` leaves `None` behind, which makes every later call panic.
+ self.target.take().expect("url::form_urlencoded::Serializer double finish").finish()
+ }
+}
+
+/// Append `&` when the string already has content after `start_position`,
+/// so that the next pair is separated from the previous one.
+fn append_separator_if_needed(string: &mut String, start_position: usize) {
+    let has_pairs = start_position < string.len();
+    if has_pairs {
+        string.push('&');
+    }
+}
+
+/// Borrow the output string of a serializer target.
+///
+/// Panics if the target is `None`, that is, after `finish()` has taken it.
+fn string<T: Target>(target: &mut Option<T>) -> &mut String {
+    let live_target = target.as_mut().expect("url::form_urlencoded::Serializer finished");
+    live_target.as_mut_string()
+}
+
+/// Append `name=value` to `string`, preceded by `&` if pairs are already present.
+/// Both halves are encoded with `encoding` and then byte-serialized.
+fn append_pair(string: &mut String, start_position: usize, encoding: EncodingOverride,
+               name: &str, value: &str) {
+    append_separator_if_needed(string, start_position);
+    let encoded_name = encoding.encode(name.into());
+    string.extend(byte_serialize(&encoded_name));
+    string.push('=');
+    let encoded_value = encoding.encode(value.into());
+    string.extend(byte_serialize(&encoded_value));
+}
diff --git a/third_party/rust/url/src/host.rs b/third_party/rust/url/src/host.rs
new file mode 100644
index 000000000..47b049a27
--- /dev/null
+++ b/third_party/rust/url/src/host.rs
@@ -0,0 +1,418 @@
+// Copyright 2013-2016 The rust-url developers.
+//
+// Licensed under the Apache License, Version 2.0 <LICENSE-APACHE or
+// http://www.apache.org/licenses/LICENSE-2.0> or the MIT license
+// <LICENSE-MIT or http://opensource.org/licenses/MIT>, at your
+// option. This file may not be copied, modified, or distributed
+// except according to those terms.
+
+#[cfg(feature = "heapsize")] use heapsize::HeapSizeOf;
+use std::cmp;
+use std::fmt::{self, Formatter};
+use std::io;
+use std::net::{Ipv4Addr, Ipv6Addr, SocketAddr, SocketAddrV4, SocketAddrV6, ToSocketAddrs};
+use std::vec;
+use parser::{ParseResult, ParseError};
+use percent_encoding::percent_decode;
+use idna;
+
+/// A `Copy` summary of a host: which kind it is, plus the address for IP hosts.
+/// Unlike `Host`, the `Domain` variant carries no string.
+#[derive(Copy, Clone, Debug, Eq, PartialEq)]
+pub enum HostInternal {
+ /// No host.
+ None,
+ /// A domain name; the name itself is not stored here.
+ Domain,
+ /// An IPv4 address.
+ Ipv4(Ipv4Addr),
+ /// An IPv6 address.
+ Ipv6(Ipv6Addr),
+}
+
+#[cfg(feature = "heapsize")]
+known_heap_size!(0, HostInternal);
+
+impl<S> From<Host<S>> for HostInternal {
+    /// Keep the IP address of an IP host; drop the name of a domain host.
+    fn from(host: Host<S>) -> HostInternal {
+        match host {
+            Host::Ipv4(v4) => HostInternal::Ipv4(v4),
+            Host::Ipv6(v6) => HostInternal::Ipv6(v6),
+            Host::Domain(_) => HostInternal::Domain,
+        }
+    }
+}
+
+/// The host name of an URL.
+///
+/// Generic over the string type `S` that holds a domain name; `S` defaults to `String`.
+#[derive(Clone, Debug, Eq, PartialEq, Ord, PartialOrd, Hash)]
+pub enum Host<S=String> {
+ /// A DNS domain name, as '.' dot-separated labels.
+ /// Non-ASCII labels are encoded in punycode per IDNA.
+ Domain(S),
+
+ /// An IPv4 address.
+ /// `Url::host_str` returns the serialization of this address,
+ /// as four decimal integers separated by `.` dots.
+ Ipv4(Ipv4Addr),
+
+ /// An IPv6 address.
+ /// `Url::host_str` returns the serialization of that address between `[` and `]` brackets,
+ /// in the format per [RFC 5952 *A Recommendation
+ /// for IPv6 Address Text Representation*](https://tools.ietf.org/html/rfc5952):
+ /// lowercase hexadecimal with maximal `::` compression.
+ Ipv6(Ipv6Addr),
+}
+
+#[cfg(feature = "heapsize")]
+impl<S: HeapSizeOf> HeapSizeOf for Host<S> {
+    /// Only a domain name can own heap memory; IP hosts report zero.
+    fn heap_size_of_children(&self) -> usize {
+        if let Host::Domain(ref name) = *self {
+            name.heap_size_of_children()
+        } else {
+            0
+        }
+    }
+}
+
+impl<'a> Host<&'a str> {
+    /// Return a copy of `self` that owns an allocated `String` but does not borrow an `&Url`.
+    pub fn to_owned(&self) -> Host<String> {
+        match *self {
+            Host::Ipv4(v4) => Host::Ipv4(v4),
+            Host::Ipv6(v6) => Host::Ipv6(v6),
+            Host::Domain(name) => Host::Domain(name.to_owned()),
+        }
+    }
+}
+
+impl Host<String> {
+    /// Parse a host: either an IPv6 address in [] square brackets, or a domain.
+    ///
+    /// A domain that parses as an IPv4 address is returned as `Host::Ipv4`.
+    ///
+    /// https://url.spec.whatwg.org/#host-parsing
+    pub fn parse(input: &str) -> Result<Self, ParseError> {
+        if input.starts_with("[") {
+            return if input.ends_with("]") {
+                parse_ipv6addr(&input[1..input.len() - 1]).map(Host::Ipv6)
+            } else {
+                Err(ParseError::InvalidIpv6Address)
+            }
+        }
+        let decoded = percent_decode(input.as_bytes()).decode_utf8_lossy();
+        let domain = try!(idna::domain_to_ascii(&decoded));
+        // Characters that must not remain in a domain after IDNA processing.
+        let is_forbidden = |c: char| matches!(c,
+            '\0' | '\t' | '\n' | '\r' | ' ' | '#' | '%' | '/' | ':' | '?' | '@' | '[' | '\\' | ']'
+        );
+        if domain.chars().any(is_forbidden) {
+            return Err(ParseError::InvalidDomainCharacter)
+        }
+        match try!(parse_ipv4addr(&domain)) {
+            Some(address) => Ok(Host::Ipv4(address)),
+            None => Ok(Host::Domain(domain.into())),
+        }
+    }
+}
+
+impl<S: AsRef<str>> fmt::Display for Host<S> {
+    /// Write the domain or IPv4 address as-is, and an IPv6 address between `[` and `]`.
+    fn fmt(&self, f: &mut Formatter) -> fmt::Result {
+        let v6 = match *self {
+            Host::Domain(ref domain) => return domain.as_ref().fmt(f),
+            Host::Ipv4(ref addr) => return addr.fmt(f),
+            Host::Ipv6(ref addr) => addr,
+        };
+        try!(f.write_str("["));
+        try!(write_ipv6(v6, f));
+        f.write_str("]")
+    }
+}
+
+/// A host together with a port number.
+///
+/// This mostly exists because coherence rules don’t allow us to implement
+/// `ToSocketAddrs for (Host<S>, u16)`.
+pub struct HostAndPort<S=String> {
+ /// The host part.
+ pub host: Host<S>,
+ /// The port number.
+ pub port: u16,
+}
+
+impl<'a> HostAndPort<&'a str> {
+    /// Return a copy of `self` that owns an allocated `String` but does not borrow an `&Url`.
+    pub fn to_owned(&self) -> HostAndPort<String> {
+        let host = self.host.to_owned();
+        let port = self.port;
+        HostAndPort { host: host, port: port }
+    }
+}
+
+impl<S: AsRef<str>> ToSocketAddrs for HostAndPort<S> {
+    type Iter = SocketAddrs;
+
+    /// A domain is resolved through the standard library's `(&str, u16)`
+    /// implementation; an IP host gives exactly one address.
+    fn to_socket_addrs(&self) -> io::Result<Self::Iter> {
+        let port = self.port;
+        let state = match self.host {
+            Host::Domain(ref domain) => {
+                // FIXME: use std::net::lookup_host when it’s stable.
+                SocketAddrsState::Domain(try!((domain.as_ref(), port).to_socket_addrs()))
+            }
+            Host::Ipv4(address) => {
+                SocketAddrsState::One(SocketAddr::V4(SocketAddrV4::new(address, port)))
+            }
+            Host::Ipv6(address) => {
+                SocketAddrsState::One(SocketAddr::V6(SocketAddrV6::new(address, port, 0, 0)))
+            }
+        };
+        Ok(SocketAddrs { state: state })
+    }
+}
+
+/// Socket addresses for an URL.
+///
+/// An iterator, returned by `HostAndPort::to_socket_addrs`.
+pub struct SocketAddrs {
+ // What is left to yield.
+ state: SocketAddrsState
+}
+
+// Iteration state of `SocketAddrs`.
+enum SocketAddrsState {
+ // Addresses produced by resolving a domain name.
+ Domain(vec::IntoIter<SocketAddr>),
+ // The single address of an IP host, not yielded yet.
+ One(SocketAddr),
+ // The single address has been yielded.
+ Done,
+}
+
+impl Iterator for SocketAddrs {
+    type Item = SocketAddr;
+
+    /// Yield the next resolved address, or the single IP address exactly once.
+    fn next(&mut self) -> Option<SocketAddr> {
+        let single = match self.state {
+            SocketAddrsState::Domain(ref mut resolved) => return resolved.next(),
+            SocketAddrsState::Done => return None,
+            SocketAddrsState::One(address) => address,
+        };
+        self.state = SocketAddrsState::Done;
+        Some(single)
+    }
+}
+
+/// Write the text form of `addr` (without brackets) to `f`:
+/// lowercase hexadecimal pieces separated by `:`,
+/// with the zero run chosen by `longest_zero_sequence` replaced by `::`.
+fn write_ipv6(addr: &Ipv6Addr, f: &mut Formatter) -> fmt::Result {
+ let segments = addr.segments();
+ // Indices of the run to compress: start inclusive, end exclusive.
+ let (compress_start, compress_end) = longest_zero_sequence(&segments);
+ let mut i = 0;
+ while i < 8 {
+ if i == compress_start {
+ try!(f.write_str(":"));
+ // At the very start no previous piece has written a ':', so write the second one here.
+ if i == 0 {
+ try!(f.write_str(":"));
+ }
+ if compress_end < 8 {
+ // Skip the compressed pieces and continue with the one after the run.
+ i = compress_end;
+ } else {
+ // The run reaches the end of the address; nothing is left to write.
+ break;
+ }
+ }
+ try!(write!(f, "{:x}", segments[i as usize]));
+ // Every piece except the last is followed by a separator.
+ if i < 7 {
+ try!(f.write_str(":"));
+ }
+ i += 1;
+ }
+ Ok(())
+}
+
+/// Find the first longest run of two or more consecutive zero pieces.
+///
+/// Returns `(start, end)` with `start` inclusive and `end` exclusive.
+/// When there is no such run the result is `(-1, -2)`, which matches no piece index.
+///
+/// A lone zero piece is not reported: the URL Standard's IPv6 serializer
+/// (https://url.spec.whatwg.org/#concept-ipv6-serializer) and RFC 5952
+/// only compress runs of at least two pieces.
+fn longest_zero_sequence(pieces: &[u16; 8]) -> (isize, isize) {
+    let mut longest: isize = -1;
+    let mut longest_length: isize = -1;
+    let mut start: isize = -1;
+    // Index 8 is one past the end; visiting it closes a run that reaches the last piece.
+    for i in 0..9 {
+        let is_zero = i < 8 && pieces[i as usize] == 0;
+        if is_zero {
+            if start < 0 {
+                start = i;
+            }
+        } else {
+            if start >= 0 {
+                let length = i - start;
+                // Strictly greater, so the first of several equally long runs wins.
+                if length > longest_length {
+                    longest = start;
+                    longest_length = length;
+                }
+            }
+            start = -1;
+        }
+    }
+    if longest_length < 2 {
+        (-1, -2)
+    } else {
+        (longest, longest + longest_length)
+    }
+}
+
+
+/// Parse one dot-separated part of an IPv4 address.
+///
+/// A `0x`/`0X` prefix selects hexadecimal, a leading `0` followed by more
+/// characters selects octal, anything else is decimal. A part that is empty
+/// once the prefix is removed is zero. Returns `Err(())` for invalid digits,
+/// a leading `+`, or a value that does not fit in `u32`.
+fn parse_ipv4number(mut input: &str) -> Result<u32, ()> {
+    let radix = if input.starts_with("0x") || input.starts_with("0X") {
+        input = &input[2..];
+        16
+    } else if input.len() >= 2 && input.starts_with("0") {
+        input = &input[1..];
+        8
+    } else {
+        10
+    };
+    if input.is_empty() {
+        return Ok(0)
+    }
+    // `from_str_radix` would accept a leading '+'; an IPv4 number must not have one.
+    if input.starts_with("+") {
+        return Err(())
+    }
+    u32::from_str_radix(input, radix).map_err(|_| ())
+}
+
+/// Try to interpret `input` as an IPv4 address.
+///
+/// Returns `Ok(None)` when `input` does not have the shape of an IPv4 address
+/// (empty, more than four parts, an empty part, or a part that is not a number),
+/// and `Err(ParseError::InvalidIpv4Address)` when it has that shape
+/// but one of its numbers is too large.
+fn parse_ipv4addr(input: &str) -> ParseResult<Option<Ipv4Addr>> {
+    if input.is_empty() {
+        return Ok(None)
+    }
+    let mut parts: Vec<&str> = input.split('.').collect();
+    // A single trailing dot is allowed.
+    if parts.last() == Some(&"") {
+        parts.pop();
+    }
+    if parts.len() > 4 {
+        return Ok(None)
+    }
+    let mut numbers: Vec<u32> = Vec::new();
+    for part in parts {
+        if part.is_empty() {
+            return Ok(None)
+        }
+        match parse_ipv4number(part) {
+            Ok(number) => numbers.push(number),
+            Err(()) => return Ok(None),
+        }
+    }
+    // The last number fills all the bytes not taken by the preceding numbers.
+    let last = numbers.pop().expect("a non-empty list of numbers");
+    // Equivalent to: last >= 256 ** (4 − numbers.len())
+    if last > u32::max_value() >> (8 * numbers.len() as u32) {
+        return Err(ParseError::InvalidIpv4Address)
+    }
+    if numbers.iter().any(|&number| number > 255) {
+        return Err(ParseError::InvalidIpv4Address)
+    }
+    // Each preceding number is one byte, placed from the most significant end.
+    let ipv4 = numbers
+        .iter()
+        .enumerate()
+        .fold(last, |address, (counter, &number)| {
+            address + (number << (8 * (3 - counter as u32)))
+        });
+    Ok(Some(Ipv4Addr::from(ipv4)))
+}
+
+
+/// Parse the text of an IPv6 address, without the surrounding `[` and `]`.
+///
+/// Follows the IPv6 parser of the URL Standard
+/// (https://url.spec.whatwg.org/#concept-ipv6-parser): up to eight
+/// hexadecimal pieces of at most four digits, at most one `::` compression,
+/// and optionally a dotted-decimal IPv4 address in place of the last two pieces.
+///
+/// Returns `ParseError::InvalidIpv6Address` for any input that is not a valid address.
+fn parse_ipv6addr(input: &str) -> ParseResult<Ipv6Addr> {
+    let input = input.as_bytes();
+    let len = input.len();
+    let mut is_ip_v4 = false;
+    let mut pieces = [0u16; 8];
+    let mut piece_pointer = 0;
+    let mut compress_pointer = None;
+    let mut i = 0;
+
+    if len < 2 {
+        return Err(ParseError::InvalidIpv6Address)
+    }
+
+    // A leading ':' is only valid as the start of a leading "::".
+    if input[0] == b':' {
+        if input[1] != b':' {
+            return Err(ParseError::InvalidIpv6Address)
+        }
+        i = 2;
+        piece_pointer = 1;
+        compress_pointer = Some(1);
+    }
+
+    while i < len {
+        if piece_pointer == 8 {
+            return Err(ParseError::InvalidIpv6Address)
+        }
+        if input[i] == b':' {
+            // A second "::" is not allowed.
+            if compress_pointer.is_some() {
+                return Err(ParseError::InvalidIpv6Address)
+            }
+            i += 1;
+            piece_pointer += 1;
+            compress_pointer = Some(piece_pointer);
+            continue
+        }
+        // Read up to four hexadecimal digits.
+        let start = i;
+        let end = cmp::min(len, start + 4);
+        let mut value = 0u16;
+        while i < end {
+            match (input[i] as char).to_digit(16) {
+                Some(digit) => {
+                    value = value * 0x10 + digit as u16;
+                    i += 1;
+                },
+                None => break
+            }
+        }
+        if i < len {
+            match input[i] {
+                b'.' => {
+                    if i == start {
+                        return Err(ParseError::InvalidIpv6Address)
+                    }
+                    // The digits just read belong to an IPv4 address: rewind and re-read
+                    // them as decimal below.
+                    i = start;
+                    is_ip_v4 = true;
+                },
+                b':' => {
+                    i += 1;
+                    // A single trailing ':' is invalid.
+                    if i == len {
+                        return Err(ParseError::InvalidIpv6Address)
+                    }
+                },
+                _ => return Err(ParseError::InvalidIpv6Address)
+            }
+        }
+        if is_ip_v4 {
+            break
+        }
+        pieces[piece_pointer] = value;
+        piece_pointer += 1;
+    }
+
+    if is_ip_v4 {
+        // The four IPv4 numbers fill two pieces.
+        if piece_pointer > 6 {
+            return Err(ParseError::InvalidIpv6Address)
+        }
+        let mut numbers_seen = 0;
+        while i < len {
+            if numbers_seen > 0 {
+                // Every number after the first is preceded by a dot,
+                // and there are at most four numbers.
+                if numbers_seen < 4 && input[i] == b'.' {
+                    i += 1;
+                } else {
+                    return Err(ParseError::InvalidIpv6Address)
+                }
+            }
+            let mut ipv4_piece: Option<u16> = None;
+            while i < len {
+                let byte = input[i];
+                if byte < b'0' || byte > b'9' {
+                    break
+                }
+                let digit = (byte - b'0') as u16;
+                let number = match ipv4_piece {
+                    None => digit,
+                    // No leading zero.
+                    Some(0) => return Err(ParseError::InvalidIpv6Address),
+                    Some(so_far) => so_far * 10 + digit,
+                };
+                if number > 255 {
+                    return Err(ParseError::InvalidIpv6Address)
+                }
+                ipv4_piece = Some(number);
+                i += 1;
+            }
+            let number = match ipv4_piece {
+                Some(number) => number,
+                // There was no digit where a number was expected.
+                None => return Err(ParseError::InvalidIpv6Address),
+            };
+            pieces[piece_pointer] = pieces[piece_pointer] * 0x100 + number;
+            numbers_seen += 1;
+            // Two numbers make up one 16-bit piece.
+            if numbers_seen == 2 || numbers_seen == 4 {
+                piece_pointer += 1;
+            }
+        }
+        if numbers_seen != 4 {
+            return Err(ParseError::InvalidIpv6Address)
+        }
+    }
+
+    match compress_pointer {
+        Some(compress_pointer) => {
+            // Move the pieces that followed "::" to the end of the address.
+            // Swapping (rather than assigning and zeroing) keeps a piece intact
+            // when it is already in its final position.
+            let mut swaps = piece_pointer - compress_pointer;
+            piece_pointer = 7;
+            while swaps > 0 {
+                pieces.swap(piece_pointer, compress_pointer + swaps - 1);
+                swaps -= 1;
+                piece_pointer -= 1;
+            }
+        }
+        None => if piece_pointer != 8 {
+            return Err(ParseError::InvalidIpv6Address)
+        }
+    }
+    Ok(Ipv6Addr::new(pieces[0], pieces[1], pieces[2], pieces[3],
+                     pieces[4], pieces[5], pieces[6], pieces[7]))
+}
diff --git a/third_party/rust/url/src/lib.rs b/third_party/rust/url/src/lib.rs
new file mode 100644
index 000000000..9378318b4
--- /dev/null
+++ b/third_party/rust/url/src/lib.rs
@@ -0,0 +1,1456 @@
+// Copyright 2013-2015 The rust-url developers.
+//
+// Licensed under the Apache License, Version 2.0 <LICENSE-APACHE or
+// http://www.apache.org/licenses/LICENSE-2.0> or the MIT license
+// <LICENSE-MIT or http://opensource.org/licenses/MIT>, at your
+// option. This file may not be copied, modified, or distributed
+// except according to those terms.
+
+/*!
+
+rust-url is an implementation of the [URL Standard](http://url.spec.whatwg.org/)
+for the [Rust](http://rust-lang.org/) programming language.
+
+It builds with [Cargo](http://crates.io/).
+To use it in your project, add this to your `Cargo.toml` file:
+
+```Cargo
+[dependencies.url]
+git = "https://github.com/servo/rust-url"
+```
+
+Supporting encodings other than UTF-8 in query strings is an optional feature
+that requires [rust-encoding](https://github.com/lifthrasiir/rust-encoding)
+and is off by default.
+You can enable it with
+[Cargo’s *features* mechanism](http://doc.crates.io/manifest.html#the-[features]-section):
+
+```Cargo
+[dependencies.url]
+git = "https://github.com/servo/rust-url"
+features = ["query_encoding"]
+```
+
+… or by passing `--cfg 'feature="query_encoding"'` to rustc.
+
+
+# URL parsing and data structures
+
+First, URL parsing may fail for various reasons and therefore returns a `Result`.
+
+```
+use url::{Url, ParseError};
+
+assert!(Url::parse("http://[:::1]") == Err(ParseError::InvalidIpv6Address))
+```
+
+Let’s parse a valid URL and look at its components.
+
+```
+use url::{Url, Host};
+
+let issue_list_url = Url::parse(
+ "https://github.com/rust-lang/rust/issues?labels=E-easy&state=open"
+).unwrap();
+
+
+assert!(issue_list_url.scheme() == "https");
+assert!(issue_list_url.username() == "");
+assert!(issue_list_url.password() == None);
+assert!(issue_list_url.host_str() == Some("github.com"));
+assert!(issue_list_url.host() == Some(Host::Domain("github.com")));
+assert!(issue_list_url.port() == None);
+assert!(issue_list_url.path() == "/rust-lang/rust/issues");
+assert!(issue_list_url.path_segments().map(|c| c.collect::<Vec<_>>()) ==
+ Some(vec!["rust-lang", "rust", "issues"]));
+assert!(issue_list_url.query() == Some("labels=E-easy&state=open"));
+assert!(issue_list_url.fragment() == None);
+assert!(!issue_list_url.cannot_be_a_base());
+```
+
+Some URLs are said to be *cannot-be-a-base*:
+they don’t have a username, password, host, or port,
+and their "path" is an arbitrary string rather than slash-separated segments:
+
+```
+use url::Url;
+
+let data_url = Url::parse("data:text/plain,Hello?World#").unwrap();
+
+assert!(data_url.cannot_be_a_base());
+assert!(data_url.scheme() == "data");
+assert!(data_url.path() == "text/plain,Hello");
+assert!(data_url.path_segments().is_none());
+assert!(data_url.query() == Some("World"));
+assert!(data_url.fragment() == Some(""));
+```
+
+
+# Base URL
+
+Many contexts allow URL *references* that can be relative to a *base URL*:
+
+```html
+<link rel="stylesheet" href="../main.css">
+```
+
+ Since parsed URLs are absolute, giving a base is required for parsing relative URLs:
+
+```
+use url::{Url, ParseError};
+
+assert!(Url::parse("../main.css") == Err(ParseError::RelativeUrlWithoutBase))
+```
+
+Use the `join` method on an `Url` to use it as a base URL:
+
+```
+use url::Url;
+
+let this_document = Url::parse("http://servo.github.io/rust-url/url/index.html").unwrap();
+let css_url = this_document.join("../main.css").unwrap();
+ assert_eq!(css_url.as_str(), "http://servo.github.io/rust-url/main.css")
+ ```
+*/
+
+#[cfg(feature="rustc-serialize")] extern crate rustc_serialize;
+#[macro_use] extern crate matches;
+#[cfg(feature="serde")] extern crate serde;
+#[cfg(feature="heapsize")] #[macro_use] extern crate heapsize;
+
+pub extern crate idna;
+
+use encoding::EncodingOverride;
+#[cfg(feature = "heapsize")] use heapsize::HeapSizeOf;
+use host::HostInternal;
+use parser::{Parser, Context, SchemeType, to_u32};
+use percent_encoding::{PATH_SEGMENT_ENCODE_SET, USERINFO_ENCODE_SET,
+ percent_encode, percent_decode, utf8_percent_encode};
+use std::cmp;
+use std::fmt::{self, Write};
+use std::hash;
+use std::io;
+use std::mem;
+use std::net::{ToSocketAddrs, IpAddr};
+use std::ops::{Range, RangeFrom, RangeTo};
+use std::path::{Path, PathBuf};
+use std::str;
+
+pub use origin::{Origin, OpaqueOrigin};
+pub use host::{Host, HostAndPort, SocketAddrs};
+pub use path_segments::PathSegmentsMut;
+pub use parser::ParseError;
+pub use slicing::Position;
+
+mod encoding;
+mod host;
+mod origin;
+mod path_segments;
+mod parser;
+mod slicing;
+
+pub mod form_urlencoded;
+pub mod percent_encoding;
+pub mod quirks;
+
+ /// A parsed URL record.
+ ///
+ /// The URL is stored as a single serialized string plus offsets into that
+ /// string marking where each component begins or ends.
+ #[derive(Clone)]
+ pub struct Url {
+ /// Syntax in pseudo-BNF:
+ ///
+ /// url = scheme ":" [ hierarchical | non-hierarchical ] [ "?" query ]? [ "#" fragment ]?
+ /// non-hierarchical = non-hierarchical-path
+ /// non-hierarchical-path = /* Does not start with "/" */
+ /// hierarchical = authority? hierarchical-path
+ /// authority = "//" userinfo? host [ ":" port ]?
+ /// userinfo = username [ ":" password ]? "@"
+ /// hierarchical-path = [ "/" path-segment ]+
+ serialization: String,
+
+ // Components
+ // The `u32` fields below are positions within `serialization`.
+ scheme_end: u32, // Before ':'
+ username_end: u32, // Before ':' (if a password is given) or '@' (if not)
+ // `serialization[host_start..host_end]` is the host as text.
+ host_start: u32,
+ host_end: u32,
+ // Kind of host; a domain's text is read back from `serialization`.
+ host: HostInternal,
+ // Explicit port number, `None` when the serialization contains none.
+ port: Option<u16>,
+ path_start: u32, // Before initial '/', if any
+ query_start: Option<u32>, // Before '?', unlike Position::QueryStart
+ fragment_start: Option<u32>, // Before '#', unlike Position::FragmentStart
+ }
+
+ #[cfg(feature = "heapsize")]
+ impl HeapSizeOf for Url {
+     /// Report the heap memory owned by this URL.
+     ///
+     /// Only the `serialization` string is measured.
+     fn heap_size_of_children(&self) -> usize {
+         let Url { ref serialization, .. } = *self;
+         serialization.heap_size_of_children()
+     }
+ }
+
+ /// Full configuration for the URL parser.
+ ///
+ /// Obtain a default value from `Url::options()`, adjust it with the
+ /// chaining methods, then call `parse`.
+ #[derive(Copy, Clone)]
+ pub struct ParseOptions<'a> {
+ // Base URL handed to the parser, if any.
+ base_url: Option<&'a Url>,
+ // Encoding override handed to the parser for query strings.
+ encoding_override: encoding::EncodingOverride,
+ // Optional callback invoked on non-fatal parse errors.
+ log_syntax_violation: Option<&'a Fn(&'static str)>,
+ }
+
+ impl<'a> ParseOptions<'a> {
+     /// Replace the base URL (`None` removes it).
+     pub fn base_url(self, new: Option<&'a Url>) -> Self {
+         ParseOptions { base_url: new, ..self }
+     }
+
+     /// Override the character encoding of query strings.
+     /// This is a legacy concept only relevant for HTML.
+     #[cfg(feature = "query_encoding")]
+     pub fn encoding_override(self, new: Option<encoding::EncodingRef>) -> Self {
+         let output_encoding = EncodingOverride::from_opt_encoding(new).to_output_encoding();
+         ParseOptions { encoding_override: output_encoding, ..self }
+     }
+
+     /// Register (or, with `None`, unregister) a function or closure
+     /// that is called on non-fatal parse errors.
+     pub fn log_syntax_violation(self, new: Option<&'a Fn(&'static str)>) -> Self {
+         ParseOptions { log_syntax_violation: new, ..self }
+     }
+
+     /// Parse `input` as a URL using the options accumulated so far.
+     pub fn parse(self, input: &str) -> Result<Url, ::ParseError> {
+         let ParseOptions { base_url, encoding_override, log_syntax_violation } = self;
+         Parser {
+             // The input length is used as the initial capacity of the output string.
+             serialization: String::with_capacity(input.len()),
+             base_url: base_url,
+             query_encoding_override: encoding_override,
+             log_syntax_violation: log_syntax_violation,
+             context: Context::UrlParser,
+         }.parse_url(input)
+     }
+ }
+
+impl Url {
+ /// Parse an absolute URL from a string, using the default `ParseOptions`.
+ #[inline]
+ pub fn parse(input: &str) -> Result<Url, ::ParseError> {
+     let defaults = Url::options();
+     defaults.parse(input)
+ }
+
+ /// Parse `input` as a URL, with `self` serving as the base URL.
+ #[inline]
+ pub fn join(&self, input: &str) -> Result<Url, ::ParseError> {
+     let relative_to_self = Url::options().base_url(Some(self));
+     relative_to_self.parse(input)
+ }
+
+ /// Return a default `ParseOptions` that can fully configure the URL parser.
+ ///
+ /// The default has no base URL, the UTF-8 encoding override,
+ /// and no syntax violation callback.
+ pub fn options<'a>() -> ParseOptions<'a> {
+     let utf8 = EncodingOverride::utf8();
+     ParseOptions {
+         base_url: None,
+         encoding_override: utf8,
+         log_syntax_violation: None,
+     }
+ }
+
+ /// Borrow the serialization of this URL.
+ ///
+ /// This is cheap: the serialization is already stored in the `Url` struct.
+ #[inline]
+ pub fn as_str(&self) -> &str {
+     &self.serialization[..]
+ }
+
+ /// Consume the `Url` and return its serialization.
+ ///
+ /// Ownership of the `String` stored in the `Url` is handed to the caller.
+ #[inline]
+ pub fn into_string(self) -> String {
+     let Url { serialization, .. } = self;
+     serialization
+ }
+
+ /// For internal testing, not part of the public API.
+ ///
+ /// Methods of the `Url` struct assume a number of invariants.
+ /// This checks each of these invariants and panics if one is not met.
+ /// This is for testing rust-url itself.
+ #[doc(hidden)]
+ pub fn assert_invariants(&self) {
+ // Shadow `assert!` and `assert_eq!` locally so that every failure message
+ // includes the serialization of the offending URL.
+ macro_rules! assert {
+ ($x: expr) => {
+ if !$x {
+ panic!("!( {} ) for URL {:?}", stringify!($x), self.serialization)
+ }
+ }
+ }
+
+ macro_rules! assert_eq {
+ ($a: expr, $b: expr) => {
+ {
+ let a = $a;
+ let b = $b;
+ if a != b {
+ panic!("{:?} != {:?} ({} != {}) for URL {:?}",
+ a, b, stringify!($a), stringify!($b), self.serialization)
+ }
+ }
+ }
+ }
+
+ // Scheme: an ASCII letter, then letters, digits, '+', '-' or '.', then ':'.
+ assert!(self.scheme_end >= 1);
+ assert!(matches!(self.byte_at(0), b'a'...b'z' | b'A'...b'Z'));
+ assert!(self.slice(1..self.scheme_end).chars()
+ .all(|c| matches!(c, 'a'...'z' | 'A'...'Z' | '0'...'9' | '+' | '-' | '.')));
+ assert_eq!(self.byte_at(self.scheme_end), b':');
+
+ if self.slice(self.scheme_end + 1 ..).starts_with("//") {
+ // URL with authority
+ match self.byte_at(self.username_end) {
+ // A password follows the username; the host comes after its '@'.
+ b':' => {
+ assert!(self.host_start >= self.username_end + 2);
+ assert_eq!(self.byte_at(self.host_start - 1), b'@');
+ }
+ // Username without password: the host starts right after '@'.
+ b'@' => assert!(self.host_start == self.username_end + 1),
+ // No userinfo: the (empty) username ends right after "://".
+ _ => assert_eq!(self.username_end, self.scheme_end + 3),
+ }
+ assert!(self.host_start >= self.username_end);
+ assert!(self.host_end >= self.host_start);
+ // The host text must agree with the parsed `host` field.
+ let host_str = self.slice(self.host_start..self.host_end);
+ match self.host {
+ HostInternal::None => assert_eq!(host_str, ""),
+ HostInternal::Ipv4(address) => assert_eq!(host_str, address.to_string()),
+ HostInternal::Ipv6(address) => assert_eq!(host_str, format!("[{}]", address)),
+ HostInternal::Domain => {
+ if SchemeType::from(self.scheme()).is_special() {
+ assert!(!host_str.is_empty())
+ }
+ }
+ }
+ // Anything between the host and the path must be ":<port>" matching `self.port`.
+ if self.path_start == self.host_end {
+ assert_eq!(self.port, None);
+ } else {
+ assert_eq!(self.byte_at(self.host_end), b':');
+ let port_str = self.slice(self.host_end + 1..self.path_start);
+ assert_eq!(self.port, Some(port_str.parse::<u16>().expect("Couldn't parse port?")));
+ }
+ assert_eq!(self.byte_at(self.path_start), b'/');
+ } else {
+ // Anarchist URL (no authority)
+ // All authority positions collapse to just after the scheme's ':'.
+ assert_eq!(self.username_end, self.scheme_end + 1);
+ assert_eq!(self.host_start, self.scheme_end + 1);
+ assert_eq!(self.host_end, self.scheme_end + 1);
+ assert_eq!(self.host, HostInternal::None);
+ assert_eq!(self.port, None);
+ assert_eq!(self.path_start, self.scheme_end + 1);
+ }
+ // Query and fragment positions point at their '?' / '#' delimiters,
+ // after the start of the path, with the query before the fragment.
+ if let Some(start) = self.query_start {
+ assert!(start > self.path_start);
+ assert_eq!(self.byte_at(start), b'?');
+ }
+ if let Some(start) = self.fragment_start {
+ assert!(start > self.path_start);
+ assert_eq!(self.byte_at(start), b'#');
+ }
+ if let (Some(query_start), Some(fragment_start)) = (self.query_start, self.fragment_start) {
+ assert!(fragment_start > query_start);
+ }
+
+ // Round trip: re-parsing the serialization must give back the same
+ // string and the same component positions.
+ let other = Url::parse(self.as_str()).expect("Failed to parse myself?");
+ assert_eq!(&self.serialization, &other.serialization);
+ assert_eq!(self.scheme_end, other.scheme_end);
+ assert_eq!(self.username_end, other.username_end);
+ assert_eq!(self.host_start, other.host_start);
+ assert_eq!(self.host_end, other.host_end);
+ assert!(self.host == other.host ||
+ // XXX No host round-trips to empty host.
+ // See https://github.com/whatwg/url/issues/79
+ (self.host_str(), other.host_str()) == (None, Some("")));
+ assert_eq!(self.port, other.port);
+ assert_eq!(self.path_start, other.path_start);
+ assert_eq!(self.query_start, other.query_start);
+ assert_eq!(self.fragment_start, other.fragment_start);
+ }
+
+ /// Compute the origin of this URL (https://url.spec.whatwg.org/#origin).
+ ///
+ /// Note: `file:` URLs get an opaque origin, so for them
+ /// `url.origin() != url.origin()`.
+ ///
+ /// # Examples
+ ///
+ /// URL with `ftp` scheme:
+ ///
+ /// ```rust
+ /// use url::{Host, Origin, Url};
+ ///
+ /// let url = Url::parse("ftp://example.com/foo").unwrap();
+ /// assert_eq!(url.origin(),
+ ///            Origin::Tuple("ftp".into(),
+ ///                          Host::Domain("example.com".into()),
+ ///                          21));
+ /// ```
+ ///
+ /// URL with `blob` scheme:
+ ///
+ /// ```rust
+ /// use url::{Host, Origin, Url};
+ ///
+ /// let url = Url::parse("blob:https://example.com/foo").unwrap();
+ /// assert_eq!(url.origin(),
+ ///            Origin::Tuple("https".into(),
+ ///                          Host::Domain("example.com".into()),
+ ///                          443));
+ /// ```
+ ///
+ /// URL with `file` scheme:
+ ///
+ /// ```rust
+ /// use url::{Host, Origin, Url};
+ ///
+ /// let url = Url::parse("file:///tmp/foo").unwrap();
+ /// assert!(!url.origin().is_tuple());
+ ///
+ /// let other_url = Url::parse("file:///tmp/foo").unwrap();
+ /// assert!(url.origin() != other_url.origin());
+ /// ```
+ ///
+ /// URL with other scheme:
+ ///
+ /// ```rust
+ /// use url::{Host, Origin, Url};
+ ///
+ /// let url = Url::parse("foo:bar").unwrap();
+ /// assert!(!url.origin().is_tuple());
+ /// ```
+ #[inline]
+ pub fn origin(&self) -> Origin {
+     // The computation itself lives in the `origin` module.
+     origin::url_origin(self)
+ }
+
+ /// Return this URL’s scheme, lower-cased, as an ASCII string that excludes the ':' delimiter.
+ ///
+ /// # Examples
+ ///
+ /// ```
+ /// use url::Url;
+ ///
+ /// let url = Url::parse("file:///tmp/foo").unwrap();
+ /// assert_eq!(url.scheme(), "file");
+ /// ```
+ #[inline]
+ pub fn scheme(&self) -> &str {
+     let colon = self.scheme_end;
+     self.slice(..colon)
+ }
+
+ /// Tell whether the URL has an 'authority',
+ /// the part that can hold a username, password, host, and port number.
+ ///
+ /// URLs *without* one are either path-only like `unix:/run/foo.socket`
+ /// or cannot-be-a-base like `data:text/plain,Stuff`.
+ #[inline]
+ pub fn has_authority(&self) -> bool {
+     debug_assert!(self.byte_at(self.scheme_end) == b':');
+     let from_colon = self.slice(self.scheme_end..);
+     from_colon.starts_with("://")
+ }
+
+ /// Tell whether this URL is a cannot-be-a-base URL,
+ /// i.e. whether parsing a relative URL string with this URL as the base returns an error.
+ ///
+ /// That is so when the scheme and its `:` delimiter are not followed by a `/` slash,
+ /// which is typical of `data:` and `mailto:` URLs.
+ #[inline]
+ pub fn cannot_be_a_base(&self) -> bool {
+     let first_path_byte = self.byte_at(self.path_start);
+     first_path_byte != b'/'
+ }
+
+ /// Return this URL’s username (typically the empty string)
+ /// as a percent-encoded ASCII string.
+ ///
+ /// # Examples
+ ///
+ /// ```
+ /// use url::Url;
+ ///
+ /// let url = Url::parse("ftp://rms@example.com").unwrap();
+ /// assert_eq!(url.username(), "rms");
+ ///
+ /// let url = Url::parse("ftp://:secret123@example.com").unwrap();
+ /// assert_eq!(url.username(), "");
+ ///
+ /// let url = Url::parse("https://example.com").unwrap();
+ /// assert_eq!(url.username(), "");
+ /// ```
+ pub fn username(&self) -> &str {
+     // Without an authority there is nowhere for a username to live.
+     if !self.has_authority() {
+         return ""
+     }
+     let username_start = self.scheme_end + ("://".len() as u32);
+     self.slice(username_start..self.username_end)
+ }
+
+ /// Return this URL’s password, if there is one, as a percent-encoded ASCII string.
+ ///
+ /// # Examples
+ ///
+ /// ```
+ /// use url::Url;
+ ///
+ /// let url = Url::parse("ftp://rms:secret123@example.com").unwrap();
+ /// assert_eq!(url.password(), Some("secret123"));
+ ///
+ /// let url = Url::parse("ftp://:secret123@example.com").unwrap();
+ /// assert_eq!(url.password(), Some("secret123"));
+ ///
+ /// let url = Url::parse("ftp://rms@example.com").unwrap();
+ /// assert_eq!(url.password(), None);
+ ///
+ /// let url = Url::parse("https://example.com").unwrap();
+ /// assert_eq!(url.password(), None);
+ /// ```
+ pub fn password(&self) -> Option<&str> {
+     // This ':' is not the one marking a port number since a host can not be empty.
+     // (Except for file: URLs, which do not have port numbers.)
+     let has_password = self.has_authority() && self.byte_at(self.username_end) == b':';
+     if !has_password {
+         return None
+     }
+     // The password sits between the ':' after the username and the '@' before the host.
+     let at_sign = self.host_start - 1;
+     debug_assert!(self.byte_at(at_sign) == b'@');
+     Some(self.slice(self.username_end + 1..at_sign))
+ }
+
+ /// Equivalent to `url.host().is_some()`.
+ pub fn has_host(&self) -> bool {
+     match self.host {
+         HostInternal::None => false,
+         _ => true,
+     }
+ }
+
+ /// Return this URL’s host (domain or IP address) as a string, if it has one.
+ ///
+ /// Non-ASCII domains are punycode-encoded per IDNA.
+ /// IPv6 addresses are given between `[` and `]` brackets.
+ ///
+ /// Cannot-be-a-base URLs (typical of `data:` and `mailto:`) and some `file:` URLs
+ /// don’t have a host.
+ ///
+ /// See also the `host` method.
+ pub fn host_str(&self) -> Option<&str> {
+     match self.host {
+         HostInternal::None => None,
+         _ => Some(self.slice(self.host_start..self.host_end)),
+     }
+ }
+
+ /// Return this URL’s host in parsed form, if it has one.
+ /// Non-ASCII domain labels are punycode-encoded per IDNA.
+ ///
+ /// Cannot-be-a-base URLs (typical of `data:` and `mailto:`) and some `file:` URLs
+ /// don’t have a host.
+ ///
+ /// See also the `host_str` method.
+ pub fn host(&self) -> Option<Host<&str>> {
+     let host = match self.host {
+         HostInternal::None => return None,
+         HostInternal::Ipv4(address) => Host::Ipv4(address),
+         HostInternal::Ipv6(address) => Host::Ipv6(address),
+         // A domain's text is stored only in the serialization.
+         HostInternal::Domain => Host::Domain(self.slice(self.host_start..self.host_end)),
+     };
+     Some(host)
+ }
+
+ /// Return the host when this URL has one and it is a domain name (not an IP address).
+ pub fn domain(&self) -> Option<&str> {
+     if let HostInternal::Domain = self.host {
+         Some(self.slice(self.host_start..self.host_end))
+     } else {
+         None
+     }
+ }
+
+ /// Return this URL’s port number, or `None` if it has none.
+ ///
+ /// See `Url::port_or_known_default` for a variant that falls back
+ /// to the scheme’s default port.
+ #[inline]
+ pub fn port(&self) -> Option<u16> {
+     let Url { port, .. } = *self;
+     port
+ }
+
+ /// Return this URL’s port number, falling back to the default port number if it is known.
+ ///
+ /// The only default port numbers this method knows are those
+ /// of the `http`, `https`, `ws`, `wss`, `ftp`, and `gopher` schemes.
+ ///
+ /// For URLs in these schemes, this method always returns `Some(_)`.
+ /// For other schemes, it is the same as `Url::port()`.
+ #[inline]
+ pub fn port_or_known_default(&self) -> Option<u16> {
+     match self.port {
+         Some(explicit) => Some(explicit),
+         None => parser::default_port(self.scheme()),
+     }
+ }
+
+ /// If the URL has a host, return something that implements `ToSocketAddrs`.
+ ///
+ /// When the URL has no port number and the scheme’s default port number is not known
+ /// (see `Url::port_or_known_default`),
+ /// the closure is called to obtain a port number.
+ /// Typically, this closure can match on the result `Url::scheme`
+ /// to have per-scheme default port numbers,
+ /// and panic for schemes it’s not prepared to handle.
+ /// For example:
+ ///
+ /// ```rust
+ /// # use url::Url;
+ /// # use std::net::TcpStream;
+ /// # use std::io;
+ ///
+ /// fn connect(url: &Url) -> io::Result<TcpStream> {
+ ///     TcpStream::connect(try!(url.with_default_port(default_port)))
+ /// }
+ ///
+ /// fn default_port(url: &Url) -> Result<u16, ()> {
+ ///     match url.scheme() {
+ ///         "git" => Ok(9418),
+ ///         "git+ssh" => Ok(22),
+ ///         "git+https" => Ok(443),
+ ///         "git+http" => Ok(80),
+ ///         _ => Err(()),
+ ///     }
+ /// }
+ /// ```
+ pub fn with_default_port<F>(&self, f: F) -> io::Result<HostAndPort<&str>>
+ where F: FnOnce(&Url) -> Result<u16, ()> {
+     // The host is resolved first, so `f` is never called for a host-less URL.
+     let host = match self.host() {
+         Some(host) => host,
+         None => try!(io_error("URL has no host")),
+     };
+     let port = match self.port_or_known_default() {
+         Some(port) => port,
+         // No explicit or known default port: ask the caller.
+         None => match f(self) {
+             Ok(port) => port,
+             Err(()) => try!(io_error("URL has no port number")),
+         },
+     };
+     Ok(HostAndPort { host: host, port: port })
+ }
+
+ /// Return this URL’s path, as a percent-encoded ASCII string.
+ /// For cannot-be-a-base URLs, this is an arbitrary string that doesn’t start with '/'.
+ /// For other URLs, this starts with a '/' slash
+ /// and continues with slash-separated path segments.
+ pub fn path(&self) -> &str {
+     let start = self.path_start;
+     // The path stops at the query if there is one, else at the fragment, else at the end.
+     match self.query_start.or(self.fragment_start) {
+         Some(end) => self.slice(start..end),
+         None => self.slice(start..),
+     }
+ }
+
+ /// Return an iterator over the '/' slash-separated path segments,
+ /// each as a percent-encoded ASCII string,
+ /// unless this URL is cannot-be-a-base.
+ ///
+ /// Return `None` for cannot-be-a-base URLs.
+ ///
+ /// When `Some` is returned, the iterator always contains at least one string
+ /// (which may be empty).
+ pub fn path_segments(&self) -> Option<str::Split<char>> {
+     let path = self.path();
+     if !path.starts_with('/') {
+         return None
+     }
+     // Skip the leading slash so that it does not produce an empty first segment.
+     let without_leading_slash = &path[1..];
+     Some(without_leading_slash.split('/'))
+ }
+
+ /// Return this URL’s query string, if it has one, as a percent-encoded ASCII string.
+ pub fn query(&self) -> Option<&str> {
+     let question_mark = match self.query_start {
+         Some(start) => start,
+         None => return None,
+     };
+     debug_assert!(self.byte_at(question_mark) == b'?');
+     // The query runs up to the fragment when there is one, else to the end.
+     let query = match self.fragment_start {
+         Some(hash) => self.slice(question_mark + 1..hash),
+         None => self.slice(question_mark + 1..),
+     };
+     Some(query)
+ }
+
+ /// Parse the URL’s query string as `application/x-www-form-urlencoded`
+ /// and return an iterator of (key, value) pairs.
+ ///
+ /// A URL without a query is treated like one with an empty query.
+ #[inline]
+ pub fn query_pairs(&self) -> form_urlencoded::Parse {
+     let query = self.query().unwrap_or("");
+     form_urlencoded::parse(query.as_bytes())
+ }
+
+ /// Return this URL’s fragment identifier, if it has one.
+ ///
+ /// **Note:** the parser did *not* percent-encode this component,
+ /// but the input may have been percent-encoded already.
+ pub fn fragment(&self) -> Option<&str> {
+     match self.fragment_start {
+         Some(hash) => {
+             debug_assert!(self.byte_at(hash) == b'#');
+             Some(self.slice(hash + 1..))
+         }
+         None => None,
+     }
+ }
+
+ /// Run `f` on a setter `Parser` that temporarily owns this URL’s serialization.
+ ///
+ /// The string is moved into the parser, `f` is called,
+ /// and the parser’s string is then moved back into `self`.
+ /// Whatever `f` returns is passed through.
+ fn mutate<F: FnOnce(&mut Parser) -> R, R>(&mut self, f: F) -> R {
+     // Leave an empty string behind while the parser holds the real one.
+     let taken = mem::replace(&mut self.serialization, String::new());
+     let mut parser = Parser::for_setter(taken);
+     let output = f(&mut parser);
+     self.serialization = parser.serialization;
+     output
+ }
+
+ /// Change this URL’s fragment identifier.
+ ///
+ /// `None` removes the fragment, `Some` replaces it with the given input.
+ pub fn set_fragment(&mut self, fragment: Option<&str>) {
+     // Drop the existing fragment, '#' included.
+     if let Some(old_hash) = self.fragment_start {
+         debug_assert!(self.byte_at(old_hash) == b'#');
+         self.serialization.truncate(old_hash as usize);
+     }
+     match fragment {
+         None => self.fragment_start = None,
+         Some(input) => {
+             // The new fragment starts at the current end of the serialization.
+             let new_hash = to_u32(self.serialization.len()).unwrap();
+             self.fragment_start = Some(new_hash);
+             self.serialization.push('#');
+             self.mutate(|parser| parser.parse_fragment(parser::Input::new(input)))
+         }
+     }
+ }
+
+ /// Detach the fragment, if any, from the serialization and return its text without the '#'.
+ ///
+ /// `fragment_start` is reset to `None` in the process.
+ fn take_fragment(&mut self) -> Option<String> {
+     let hash = match self.fragment_start.take() {
+         Some(start) => start,
+         None => return None,
+     };
+     debug_assert!(self.byte_at(hash) == b'#');
+     let fragment = self.slice(hash + 1..).to_owned();
+     self.serialization.truncate(hash as usize);
+     Some(fragment)
+ }
+
+ /// Append a fragment previously removed by `take_fragment`, verbatim.
+ ///
+ /// Does nothing for `None`. Panics if the URL currently has a fragment.
+ fn restore_already_parsed_fragment(&mut self, fragment: Option<String>) {
+     let fragment = match fragment {
+         Some(text) => text,
+         None => return,
+     };
+     assert!(self.fragment_start.is_none());
+     let hash = to_u32(self.serialization.len()).unwrap();
+     self.fragment_start = Some(hash);
+     self.serialization.push('#');
+     self.serialization.push_str(&fragment);
+ }
+
+ /// Change this URL’s query string.
+ ///
+ /// `None` removes the query, `Some` replaces it with the given input.
+ /// An existing fragment is kept.
+ pub fn set_query(&mut self, query: Option<&str>) {
+     // The fragment follows the query, so set it aside while the query is rewritten.
+     let saved_fragment = self.take_fragment();
+
+     // Drop the existing query, '?' included.
+     if let Some(old_question_mark) = self.query_start.take() {
+         debug_assert!(self.byte_at(old_question_mark) == b'?');
+         self.serialization.truncate(old_question_mark as usize);
+     }
+     // Append the replacement, if one was given.
+     if let Some(input) = query {
+         let new_question_mark = to_u32(self.serialization.len()).unwrap();
+         self.query_start = Some(new_question_mark);
+         self.serialization.push('?');
+         let scheme_end = self.scheme_end;
+         self.mutate(|parser| parser.parse_query(scheme_end, parser::Input::new(input)));
+     }
+
+     self.restore_already_parsed_fragment(saved_fragment);
+ }
+
+ /// Manipulate this URL’s query string, viewed as a sequence of name/value pairs
+ /// in `application/x-www-form-urlencoded` syntax.
+ ///
+ /// The return value has a method-chaining API:
+ ///
+ /// ```rust
+ /// # use url::Url;
+ /// let mut url = Url::parse("https://example.net?lang=fr#nav").unwrap();
+ /// assert_eq!(url.query(), Some("lang=fr"));
+ ///
+ /// url.query_pairs_mut().append_pair("foo", "bar");
+ /// assert_eq!(url.query(), Some("lang=fr&foo=bar"));
+ /// assert_eq!(url.as_str(), "https://example.net/?lang=fr&foo=bar#nav");
+ ///
+ /// url.query_pairs_mut()
+ ///     .clear()
+ ///     .append_pair("foo", "bar & baz")
+ ///     .append_pair("saisons", "Été+hiver");
+ /// assert_eq!(url.query(), Some("foo=bar+%26+baz&saisons=%C3%89t%C3%A9%2Bhiver"));
+ /// assert_eq!(url.as_str(),
+ ///            "https://example.net/?foo=bar+%26+baz&saisons=%C3%89t%C3%A9%2Bhiver#nav");
+ /// ```
+ ///
+ /// Note: `url.query_pairs_mut().clear();` is equivalent to `url.set_query(Some(""))`,
+ /// not `url.set_query(None)`.
+ ///
+ /// The state of `Url` is unspecified if this return value is leaked without being dropped.
+ pub fn query_pairs_mut(&mut self) -> form_urlencoded::Serializer<UrlQuery> {
+     // The fragment travels with the returned `UrlQuery` while the query is edited.
+     let saved_fragment = self.take_fragment();
+
+     let question_mark = match self.query_start {
+         Some(start) => {
+             debug_assert!(self.byte_at(start) == b'?');
+             start as usize
+         }
+         None => {
+             // No query yet: start an empty one at the end of the serialization.
+             let end = self.serialization.len();
+             self.query_start = Some(to_u32(end).unwrap());
+             self.serialization.push('?');
+             end
+         }
+     };
+
+     let target = UrlQuery { url: self, fragment: saved_fragment };
+     form_urlencoded::Serializer::for_suffix(target, question_mark + "?".len())
+ }
+
+ /// Cut off and return everything after the path (query and/or fragment, delimiters included).
+ ///
+ /// Returns an empty string when the URL has neither.
+ /// `query_start` and `fragment_start` are left untouched.
+ fn take_after_path(&mut self) -> String {
+     let cut = match self.query_start.or(self.fragment_start) {
+         Some(position) => position,
+         None => return String::new(),
+     };
+     let after_path = self.slice(cut..).to_owned();
+     self.serialization.truncate(cut as usize);
+     after_path
+ }
+
+ /// Change this URL’s path.
+ ///
+ /// The query and fragment, if any, are preserved.
+ /// For a cannot-be-a-base URL, a leading '/' in `path` is written as `%2F`.
+ pub fn set_path(&mut self, mut path: &str) {
+ // Set the query/fragment aside and remember where they used to begin.
+ let after_path = self.take_after_path();
+ let old_after_path_pos = to_u32(self.serialization.len()).unwrap();
+ // These must be read before the old path is truncated away.
+ let cannot_be_a_base = self.cannot_be_a_base();
+ let scheme_type = SchemeType::from(self.scheme());
+ self.serialization.truncate(self.path_start as usize);
+ self.mutate(|parser| {
+ if cannot_be_a_base {
+ if path.starts_with('/') {
+ // Write the leading slash percent-encoded and parse only the rest.
+ parser.serialization.push_str("%2F");
+ path = &path[1..];
+ }
+ parser.parse_cannot_be_a_base_path(parser::Input::new(path));
+ } else {
+ let mut has_host = true; // FIXME
+ parser.parse_path_start(scheme_type, &mut has_host, parser::Input::new(path));
+ }
+ });
+ // Re-append the query/fragment and shift their recorded positions.
+ self.restore_after_path(old_after_path_pos, &after_path);
+ }
+
+ /// Return an object with methods to manipulate this URL’s path segments.
+ ///
+ /// Return `Err(())` if this URL is cannot-be-a-base.
+ pub fn path_segments_mut(&mut self) -> Result<PathSegmentsMut, ()> {
+     if self.cannot_be_a_base() {
+         return Err(())
+     }
+     Ok(path_segments::new(self))
+ }
+
+ /// Re-append `after_path` and move `query_start` / `fragment_start`
+ /// by the distance the end of the path has moved.
+ ///
+ /// `old_after_path_position` is where the appended text used to begin;
+ /// its new beginning is the current end of the serialization.
+ fn restore_after_path(&mut self, old_after_path_position: u32, after_path: &str) {
+     let new_after_path_position = to_u32(self.serialization.len()).unwrap();
+     // Subtract before adding, so the intermediate value never exceeds the inputs.
+     let shift = |index: u32| index - old_after_path_position + new_after_path_position;
+     if let Some(index) = self.query_start {
+         self.query_start = Some(shift(index))
+     }
+     if let Some(index) = self.fragment_start {
+         self.fragment_start = Some(shift(index))
+     }
+     self.serialization.push_str(after_path)
+ }
+
+ /// Change this URL’s port number.
+ ///
+ /// If this URL is cannot-be-a-base, does not have a host, or has the `file` scheme;
+ /// do nothing and return `Err`.
+ ///
+ /// A port equal to the scheme’s known default port is stored as no port.
+ pub fn set_port(&mut self, port: Option<u16>) -> Result<(), ()> {
+     if self.has_host() && self.scheme() != "file" {
+         let is_default = port.is_some() && port == parser::default_port(self.scheme());
+         let effective = if is_default { None } else { port };
+         self.set_port_internal(effective);
+         Ok(())
+     } else {
+         Err(())
+     }
+ }
+
+ /// Rewrite the `:port` part of the serialization to match `port`,
+ /// shift `path_start`, `query_start` and `fragment_start` accordingly,
+ /// and store `port` in `self.port`.
+ ///
+ /// Unlike `set_port`, this performs no host or scheme checks
+ /// and no default-port normalization.
+ fn set_port_internal(&mut self, port: Option<u16>) {
+ match (self.port, port) {
+ // No port before and none wanted: the serialization is already right.
+ (None, None) => {}
+ (Some(_), None) => {
+ // Delete ":<port>", which is everything between the host and the path.
+ self.serialization.drain(self.host_end as usize .. self.path_start as usize);
+ let offset = self.path_start - self.host_end;
+ self.path_start = self.host_end;
+ if let Some(ref mut index) = self.query_start { *index -= offset }
+ if let Some(ref mut index) = self.fragment_start { *index -= offset }
+ }
+ // Same port as before: nothing to rewrite.
+ (Some(old), Some(new)) if old == new => {}
+ (_, Some(new)) => {
+ // Cut at the end of the host, write the new port, then re-append
+ // the path and everything after it.
+ let path_and_after = self.slice(self.path_start..).to_owned();
+ self.serialization.truncate(self.host_end as usize);
+ write!(&mut self.serialization, ":{}", new).unwrap();
+ let old_path_start = self.path_start;
+ let new_path_start = to_u32(self.serialization.len()).unwrap();
+ self.path_start = new_path_start;
+ // Later positions move by the same distance as the start of the path.
+ let adjust = |index: &mut u32| {
+ *index -= old_path_start;
+ *index += new_path_start;
+ };
+ if let Some(ref mut index) = self.query_start { adjust(index) }
+ if let Some(ref mut index) = self.fragment_start { adjust(index) }
+ self.serialization.push_str(&path_and_after);
+ }
+ }
+ self.port = port;
+ }
+
+ /// Change this URL’s host.
+ ///
+ /// If this URL is cannot-be-a-base or there is an error parsing the given `host`,
+ /// do nothing and return `Err`.
+ ///
+ /// Removing the host (calling this with `None`)
+ /// will also remove any username, password, and port number.
+ /// Removing the host of a URL that has none is a no-op.
+ pub fn set_host(&mut self, host: Option<&str>) -> Result<(), ParseError> {
+     if self.cannot_be_a_base() {
+         return Err(ParseError::SetHostOnCannotBeABaseUrl)
+     }
+
+     if let Some(host) = host {
+         self.set_host_internal(try!(Host::parse(host)), None)
+     } else if self.has_host() {
+         debug_assert!(self.byte_at(self.scheme_end) == b':');
+         debug_assert!(self.byte_at(self.path_start) == b'/');
+         // Remove the whole authority ("//", userinfo, host and port):
+         // everything between the scheme's ':' and the start of the path.
+         // The range must run from the lower to the higher position;
+         // `String::drain` panics when its start is greater than its end.
+         let new_path_start = self.scheme_end + 1;
+         self.serialization.drain(new_path_start as usize..self.path_start as usize);
+         let offset = self.path_start - new_path_start;
+         self.path_start = new_path_start;
+         self.username_end = new_path_start;
+         self.host_start = new_path_start;
+         self.host_end = new_path_start;
+         // Keep the parsed host in sync with the serialization, so that
+         // `has_host()` and `host()` report that the host is gone.
+         self.host = HostInternal::None;
+         self.port = None;
+         if let Some(ref mut index) = self.query_start { *index -= offset }
+         if let Some(ref mut index) = self.fragment_start { *index -= offset }
+     }
+     Ok(())
+ }
+
+ /// Replace the host in the serialization with `host`, optionally replacing the port too,
+ /// and update the stored positions to match.
+ ///
+ /// opt_new_port: None means leave unchanged, Some(None) means remove any port number.
+ fn set_host_internal(&mut self, host: Host<String>, opt_new_port: Option<Option<u16>>) {
+ // Text to keep after the new host: from the path onward when the port is
+ // being replaced, otherwise from the end of the old host (old port included).
+ let old_suffix_pos = if opt_new_port.is_some() { self.path_start } else { self.host_end };
+ let suffix = self.slice(old_suffix_pos..).to_owned();
+ self.serialization.truncate(self.host_start as usize);
+ if !self.has_authority() {
+ // The URL had no "//" yet: add it and move the authority positions past it.
+ debug_assert!(self.slice(self.scheme_end..self.host_start) == ":");
+ debug_assert!(self.username_end == self.host_start);
+ self.serialization.push('/');
+ self.serialization.push('/');
+ self.username_end += 2;
+ self.host_start += 2;
+ }
+ write!(&mut self.serialization, "{}", host).unwrap();
+ self.host_end = to_u32(self.serialization.len()).unwrap();
+ self.host = host.into();
+
+ if let Some(new_port) = opt_new_port {
+ self.port = new_port;
+ if let Some(port) = new_port {
+ write!(&mut self.serialization, ":{}", port).unwrap();
+ }
+ }
+ let new_suffix_pos = to_u32(self.serialization.len()).unwrap();
+ self.serialization.push_str(&suffix);
+
+ // Positions inside the suffix move by the distance its start has moved.
+ let adjust = |index: &mut u32| {
+ *index -= old_suffix_pos;
+ *index += new_suffix_pos;
+ };
+ adjust(&mut self.path_start);
+ if let Some(ref mut index) = self.query_start { adjust(index) }
+ if let Some(ref mut index) = self.fragment_start { adjust(index) }
+ }
+
+ /// Set this URL’s host to the given IP address.
+ ///
+ /// If this URL is cannot-be-a-base, do nothing and return `Err`.
+ ///
+ /// Compared to `Url::set_host`, this skips the host parser.
+ pub fn set_ip_host(&mut self, address: IpAddr) -> Result<(), ()> {
+     if !self.cannot_be_a_base() {
+         let host = match address {
+             IpAddr::V4(v4) => Host::Ipv4(v4),
+             IpAddr::V6(v6) => Host::Ipv6(v6),
+         };
+         // `None`: leave the port as it is.
+         self.set_host_internal(host, None);
+         Ok(())
+     } else {
+         Err(())
+     }
+ }
+
+ /// Change this URL’s password.
+ ///
+ /// If this URL is cannot-be-a-base or does not have a host, do nothing and return `Err`.
+ ///
+ /// `Some` sets the password (percent-encoded with `USERINFO_ENCODE_SET`),
+ /// `None` removes an existing one.
+ pub fn set_password(&mut self, password: Option<&str>) -> Result<(), ()> {
+ if !self.has_host() {
+ return Err(())
+ }
+ if let Some(password) = password {
+ // Cut right after the username, write ":<password>@",
+ // then re-append the host and everything after it.
+ let host_and_after = self.slice(self.host_start..).to_owned();
+ self.serialization.truncate(self.username_end as usize);
+ self.serialization.push(':');
+ self.serialization.extend(utf8_percent_encode(password, USERINFO_ENCODE_SET));
+ self.serialization.push('@');
+
+ // Every position from the host onward moves by the same distance.
+ let old_host_start = self.host_start;
+ let new_host_start = to_u32(self.serialization.len()).unwrap();
+ let adjust = |index: &mut u32| {
+ *index -= old_host_start;
+ *index += new_host_start;
+ };
+ self.host_start = new_host_start;
+ adjust(&mut self.host_end);
+ adjust(&mut self.path_start);
+ if let Some(ref mut index) = self.query_start { adjust(index) }
+ if let Some(ref mut index) = self.fragment_start { adjust(index) }
+
+ self.serialization.push_str(&host_and_after);
+ } else if self.byte_at(self.username_end) == b':' { // If there is a password to remove
+ let has_username_or_password = self.byte_at(self.host_start - 1) == b'@';
+ debug_assert!(has_username_or_password);
+ let username_start = self.scheme_end + 3;
+ let empty_username = username_start == self.username_end;
+ let start = self.username_end; // Remove the ':'
+ let end = if empty_username {
+ self.host_start // Remove the '@' as well
+ } else {
+ self.host_start - 1 // Keep the '@' to separate the username from the host
+ };
+ self.serialization.drain(start as usize .. end as usize);
+ // Shift every later position back by the number of bytes removed.
+ let offset = end - start;
+ self.host_start -= offset;
+ self.host_end -= offset;
+ self.path_start -= offset;
+ if let Some(ref mut index) = self.query_start { *index -= offset }
+ if let Some(ref mut index) = self.fragment_start { *index -= offset }
+ }
+ Ok(())
+ }
+
+ /// Change this URL’s username.
+ ///
+ /// The new username is percent-encoded with `USERINFO_ENCODE_SET`. The `@` separator
+ /// is added or removed as needed so that it is present exactly when the URL ends up
+ /// with a username or a password.
+ ///
+ /// If this URL is cannot-be-a-base or does not have a host, do nothing and return `Err`.
+ pub fn set_username(&mut self, username: &str) -> Result<(), ()> {
+ if !self.has_host() {
+ return Err(())
+ }
+ let username_start = self.scheme_end + 3;
+ debug_assert!(self.slice(self.scheme_end..username_start) == "://");
+ // Nothing to do when the stored username already equals the requested text.
+ if self.slice(username_start..self.username_end) == username {
+ return Ok(())
+ }
+ // Save everything after the old username, then write the new one in its place.
+ let after_username = self.slice(self.username_end..).to_owned();
+ self.serialization.truncate(username_start as usize);
+ self.serialization.extend(utf8_percent_encode(username, USERINFO_ENCODE_SET));
+
+ // `removed_bytes` / `added_bytes` start out as the old / new end of the username;
+ // their difference is how far every later index has to move.
+ let mut removed_bytes = self.username_end;
+ self.username_end = to_u32(self.serialization.len()).unwrap();
+ let mut added_bytes = self.username_end;
+
+ let new_username_is_empty = self.username_end == username_start;
+ match (new_username_is_empty, after_username.chars().next()) {
+ // Username removed and no password follows: drop the now useless '@'.
+ (true, Some('@')) => {
+ removed_bytes += 1;
+ self.serialization.push_str(&after_username[1..]);
+ }
+ // The separator situation is unchanged: copy the remainder back verbatim.
+ (false, Some('@')) | (_, Some(':')) | (true, _) => {
+ self.serialization.push_str(&after_username);
+ }
+ // A username was added where there was no userinfo before: insert '@'.
+ (false, _) => {
+ added_bytes += 1;
+ self.serialization.push('@');
+ self.serialization.push_str(&after_username);
+ }
+ }
+
+ let adjust = |index: &mut u32| {
+ *index -= removed_bytes;
+ *index += added_bytes;
+ };
+ adjust(&mut self.host_start);
+ adjust(&mut self.host_end);
+ adjust(&mut self.path_start);
+ if let Some(ref mut index) = self.query_start { adjust(index) }
+ if let Some(ref mut index) = self.fragment_start { adjust(index) }
+ Ok(())
+ }
+
+ /// Change this URL’s scheme.
+ ///
+ /// The new scheme is stored in ASCII lower case.
+ ///
+ /// Do nothing and return `Err` if:
+ /// * The new scheme is not in `[a-zA-Z][a-zA-Z0-9+.-]*`
+ /// (a single trailing `:` is tolerated, anything after it is not)
+ /// * This URL does not have a host and the new scheme is one of
+ /// `http`, `https`, `ws`, `wss`, `ftp`, `gopher`, or `file`
+ pub fn set_scheme(&mut self, scheme: &str) -> Result<(), ()> {
+ // Parse the scheme into a fresh buffer; the rest of the URL is appended to it below.
+ let mut parser = Parser::for_setter(String::new());
+ let remaining = try!(parser.parse_scheme(parser::Input::new(scheme)));
+ if !remaining.is_empty() ||
+ (!self.has_host() && SchemeType::from(&parser.serialization).is_special()) {
+ return Err(())
+ }
+ // Every stored index moves by the difference in scheme length.
+ let old_scheme_end = self.scheme_end;
+ let new_scheme_end = to_u32(parser.serialization.len()).unwrap();
+ let adjust = |index: &mut u32| {
+ *index -= old_scheme_end;
+ *index += new_scheme_end;
+ };
+
+ self.scheme_end = new_scheme_end;
+ adjust(&mut self.username_end);
+ adjust(&mut self.host_start);
+ adjust(&mut self.host_end);
+ adjust(&mut self.path_start);
+ if let Some(ref mut index) = self.query_start { adjust(index) }
+ if let Some(ref mut index) = self.fragment_start { adjust(index) }
+
+ // `self.serialization` is still the old string here, so the old offset is the right one.
+ parser.serialization.push_str(self.slice(old_scheme_end..));
+ self.serialization = parser.serialization;
+ Ok(())
+ }
+
+    /// Build a `file` URL from a file name given as a `std::path::Path`.
+    ///
+    /// `Err` is returned when the path is not absolute or,
+    /// on Windows, when its prefix is not a disk prefix (e.g. `C:`).
+    pub fn from_file_path<P: AsRef<Path>>(path: P) -> Result<Url, ()> {
+        let mut buffer = String::from("file://");
+        // The authority is empty, so username, host and path all begin right after "file://".
+        let after_authority = buffer.len() as u32;
+        try!(path_to_file_url_segments(path.as_ref(), &mut buffer));
+        let url = Url {
+            scheme_end: "file".len() as u32,
+            username_end: after_authority,
+            host_start: after_authority,
+            host_end: after_authority,
+            host: HostInternal::None,
+            port: None,
+            path_start: after_authority,
+            query_start: None,
+            fragment_start: None,
+            serialization: buffer,
+        };
+        Ok(url)
+    }
+
+    /// Build a `file` URL from a directory name given as a `std::path::Path`.
+    ///
+    /// `Err` is returned when the path is not absolute or,
+    /// on Windows, when its prefix is not a disk prefix (e.g. `C:`).
+    ///
+    /// Unlike `from_file_path`, this makes sure the URL’s path ends with a slash,
+    /// so that the whole path is kept when the URL is used as a base URL.
+    ///
+    /// For example:
+    ///
+    /// * `"index.html"` parsed with `Url::from_directory_path(Path::new("/var/www"))`
+    ///   as the base URL is `file:///var/www/index.html`
+    /// * `"index.html"` parsed with `Url::from_file_path(Path::new("/var/www"))`
+    ///   as the base URL is `file:///var/index.html`, which might not be what was intended.
+    ///
+    /// Note that `std::path` does not treat trailing slashes as significant
+    /// and usually leaves them out (e.g. in `Path::parent()`).
+    pub fn from_directory_path<P: AsRef<Path>>(path: P) -> Result<Url, ()> {
+        let mut directory_url = try!(Url::from_file_path(path));
+        let has_trailing_slash = directory_url.serialization.ends_with('/');
+        if !has_trailing_slash {
+            directory_url.serialization.push('/');
+        }
+        Ok(directory_url)
+    }
+
+    /// Assuming the URL is in the `file` scheme or similar,
+    /// turn its path into an absolute `std::path::PathBuf`.
+    ///
+    /// **Note:** the URL’s `scheme` is not checked here,
+    /// so the result may be nonsensical for other schemes.
+    /// Callers are responsible for checking the scheme before calling this.
+    ///
+    /// ```
+    /// # use url::Url;
+    /// # let url = Url::parse("file:///etc/passwd").unwrap();
+    /// let path = url.to_file_path();
+    /// ```
+    ///
+    /// Returns `Err` if the host is neither absent nor the domain `"localhost"`,
+    /// if the URL has no path segments, or if the segments cannot be converted
+    /// into a path for the current platform.
+    #[inline]
+    pub fn to_file_path(&self) -> Result<PathBuf, ()> {
+        // FIXME: Figure out what to do w.r.t host.
+        let host_is_local = matches!(self.host(), None | Some(Host::Domain("localhost")));
+        if !host_is_local {
+            return Err(());
+        }
+        match self.path_segments() {
+            Some(segments) => file_url_segments_to_pathbuf(segments),
+            None => Err(()),
+        }
+    }
+
+ // Private helper methods:
+
+    /// Borrow the part of the serialization selected by `range` (byte offsets).
+    #[inline]
+    fn slice<R>(&self, range: R) -> &str where R: RangeArg {
+        let whole: &str = &self.serialization;
+        range.slice_of(whole)
+    }
+
+    /// Return the byte of the serialization at offset `i`; panics when out of bounds.
+    #[inline]
+    fn byte_at(&self, i: u32) -> u8 {
+        let bytes = self.serialization.as_bytes();
+        bytes[i as usize]
+    }
+}
+
+/// Resolve this URL into socket addresses.
+///
+/// An error is returned if `Url::host` or `Url::port_or_known_default` return `None`.
+impl ToSocketAddrs for Url {
+    type Iter = SocketAddrs;
+
+    fn to_socket_addrs(&self) -> io::Result<Self::Iter> {
+        let host_and_port = try!(self.with_default_port(|_| Err(())));
+        host_and_port.to_socket_addrs()
+    }
+}
+
+/// `str::parse::<Url>()` support: parses without a base URL or encoding override.
+impl str::FromStr for Url {
+    type Err = ParseError;
+
+    #[inline]
+    fn from_str(input: &str) -> Result<Self, Self::Err> {
+        Self::parse(input)
+    }
+}
+
+/// A URL is displayed as its serialization.
+impl fmt::Display for Url {
+    #[inline]
+    fn fmt(&self, formatter: &mut fmt::Formatter) -> fmt::Result {
+        let text: &str = &self.serialization;
+        fmt::Display::fmt(text, formatter)
+    }
+}
+
+/// The debug representation of a URL is that of its serialization (a quoted string).
+impl fmt::Debug for Url {
+    #[inline]
+    fn fmt(&self, formatter: &mut fmt::Formatter) -> fmt::Result {
+        let text: &str = &self.serialization;
+        fmt::Debug::fmt(text, formatter)
+    }
+}
+
+/// URLs compare like their serialization, so equality is a full equivalence relation.
+impl Eq for Url {}
+
+/// Two URLs are equal exactly when their serializations are equal.
+impl PartialEq for Url {
+    #[inline]
+    fn eq(&self, other: &Self) -> bool {
+        let (mine, theirs): (&str, &str) = (&self.serialization, &other.serialization);
+        mine == theirs
+    }
+}
+
+/// URLs are ordered like their serializations.
+impl Ord for Url {
+    #[inline]
+    fn cmp(&self, other: &Self) -> cmp::Ordering {
+        Ord::cmp(&self.serialization, &other.serialization)
+    }
+}
+
+/// URLs are ordered like their serializations; the ordering is total.
+impl PartialOrd for Url {
+    #[inline]
+    fn partial_cmp(&self, other: &Self) -> Option<cmp::Ordering> {
+        // Strings are totally ordered, so this always yields `Some`.
+        Some(Ord::cmp(&self.serialization, &other.serialization))
+    }
+}
+
+/// A URL feeds its serialization, and nothing else, to the hasher.
+impl hash::Hash for Url {
+    #[inline]
+    fn hash<H>(&self, state: &mut H) where H: hash::Hasher {
+        <String as hash::Hash>::hash(&self.serialization, state)
+    }
+}
+
+/// Borrow the serialization of this URL as a string slice.
+impl AsRef<str> for Url {
+    #[inline]
+    fn as_ref(&self) -> &str {
+        let text: &str = &self.serialization;
+        text
+    }
+}
+
+/// A range of `u32` byte offsets that can be used to slice a string.
+///
+/// Slicing panics, like ordinary string indexing, when an offset is out of bounds
+/// or does not fall on a character boundary.
+trait RangeArg {
+    /// Return the part of `s` covered by this range.
+    fn slice_of<'a>(&self, s: &'a str) -> &'a str;
+}
+
+/// `start..end`
+impl RangeArg for Range<u32> {
+    #[inline]
+    fn slice_of<'a>(&self, s: &'a str) -> &'a str {
+        let (from, to) = (self.start as usize, self.end as usize);
+        &s[from..to]
+    }
+}
+
+/// `start..`
+impl RangeArg for RangeFrom<u32> {
+    #[inline]
+    fn slice_of<'a>(&self, s: &'a str) -> &'a str {
+        let from = self.start as usize;
+        &s[from..]
+    }
+}
+
+/// `..end`
+impl RangeArg for RangeTo<u32> {
+    #[inline]
+    fn slice_of<'a>(&self, s: &'a str) -> &'a str {
+        let to = self.end as usize;
+        &s[..to]
+    }
+}
+
+/// Encodes this URL as a string with `rustc-serialize`.
+///
+/// Only available if the `rustc-serialize` Cargo feature is enabled.
+#[cfg(feature="rustc-serialize")]
+impl rustc_serialize::Encodable for Url {
+    fn encode<S: rustc_serialize::Encoder>(&self, encoder: &mut S) -> Result<(), S::Error> {
+        let text = self.as_str();
+        encoder.emit_str(text)
+    }
+}
+
+
+/// Decodes a URL from a string with `rustc-serialize`.
+///
+/// Only available if the `rustc-serialize` Cargo feature is enabled.
+/// A string that does not parse as a URL is reported through the decoder’s error type.
+#[cfg(feature="rustc-serialize")]
+impl rustc_serialize::Decodable for Url {
+    fn decode<D: rustc_serialize::Decoder>(decoder: &mut D) -> Result<Url, D::Error> {
+        let text = try!(decoder.read_str());
+        match Url::parse(&text) {
+            Ok(url) => Ok(url),
+            Err(error) => Err(decoder.error(&format!("URL parsing error: {}", error))),
+        }
+    }
+}
+
+/// Serializes this URL into a `serde` stream, as a string holding its serialization.
+///
+/// This implementation is only available if the `serde` Cargo feature is enabled.
+#[cfg(feature="serde")]
+impl serde::Serialize for Url {
+    fn serialize<S>(&self, serializer: &mut S) -> Result<(), S::Error> where S: serde::Serializer {
+        // The URL already owns its serialization as a `String`; serialize that directly
+        // instead of formatting a temporary copy of it first.
+        serde::Serialize::serialize(&self.serialization, serializer)
+    }
+}
+
+/// Deserializes this URL from a `serde` stream.
+///
+/// This implementation is only available if the `serde` Cargo feature is enabled.
+///
+/// The stream must contain a string. A string that does not parse as a URL is reported
+/// as a deserialization error (`D::Error`) rather than causing a panic.
+#[cfg(feature="serde")]
+impl serde::Deserialize for Url {
+    fn deserialize<D>(deserializer: &mut D) -> Result<Url, D::Error> where D: serde::Deserializer {
+        let string_representation: String = try!(serde::Deserialize::deserialize(deserializer));
+        // Deserialized data is untrusted input: turn a parse failure into an error
+        // for the caller instead of unwrapping it.
+        Url::parse(&string_representation).map_err(|error| {
+            serde::de::Error::invalid_value(&format!("URL parsing error: {}", error))
+        })
+    }
+}
+
+/// Append the components of an absolute Unix `path` to `serialization`,
+/// each one preceded by `/` and percent-encoded with `PATH_SEGMENT_ENCODE_SET`.
+///
+/// Returns `Err` if `path` is not absolute.
+#[cfg(unix)]
+fn path_to_file_url_segments(path: &Path, serialization: &mut String) -> Result<(), ()> {
+    use std::os::unix::prelude::OsStrExt;
+    if !path.is_absolute() {
+        return Err(())
+    }
+    let length_before = serialization.len();
+    // skip the root component
+    for segment in path.components().skip(1) {
+        serialization.push('/');
+        let raw = segment.as_os_str().as_bytes();
+        serialization.extend(percent_encode(raw, PATH_SEGMENT_ENCODE_SET));
+    }
+    if serialization.len() == length_before {
+        // An URL’s path must not be empty.
+        serialization.push('/');
+    }
+    Ok(())
+}
+
+/// On Windows, building the path of a `file` URL is delegated to
+/// `path_to_file_url_segments_windows`.
+#[cfg(windows)]
+fn path_to_file_url_segments(path: &Path, serialization: &mut String) -> Result<(), ()> {
+ path_to_file_url_segments_windows(path, serialization)
+}
+
+/// Append an absolute Windows `path` to `serialization` as `/C:/segment/...`,
+/// percent-encoding each component with `PATH_SEGMENT_ENCODE_SET`.
+///
+/// Returns `Err` if the path is not absolute, does not start with a disk prefix
+/// (plain or verbatim), or has a component that is not valid Unicode.
+// Build this unconditionally to alleviate https://github.com/servo/rust-url/issues/102
+#[cfg_attr(not(windows), allow(dead_code))]
+fn path_to_file_url_segments_windows(path: &Path, serialization: &mut String) -> Result<(), ()> {
+    use std::path::{Prefix, Component};
+    if !path.is_absolute() {
+        return Err(())
+    }
+    let mut components = path.components();
+    let drive_letter = match components.next() {
+        Some(Component::Prefix(ref prefix)) => match prefix.kind() {
+            Prefix::Disk(letter) | Prefix::VerbatimDisk(letter) => letter,
+            _ => return Err(()),
+        },
+
+        // FIXME: do something with UNC and other prefixes?
+        _ => return Err(())
+    };
+
+    // Start with the prefix, e.g. "C:"
+    serialization.push('/');
+    serialization.push(drive_letter as char);
+    serialization.push(':');
+
+    for component in components.filter(|component| *component != Component::RootDir) {
+        // FIXME: somehow work with non-unicode?
+        let text = try!(component.as_os_str().to_str().ok_or(()));
+        serialization.push('/');
+        serialization.extend(percent_encode(text.as_bytes(), PATH_SEGMENT_ENCODE_SET));
+    }
+    Ok(())
+}
+
+/// Rebuild a Unix path from URL path segments: every segment is percent-decoded
+/// and preceded by `/`. The resulting bytes are used as they are, without requiring UTF-8.
+#[cfg(unix)]
+fn file_url_segments_to_pathbuf(segments: str::Split<char>) -> Result<PathBuf, ()> {
+    use std::ffi::OsStr;
+    use std::os::unix::prelude::OsStrExt;
+    use std::path::PathBuf;
+
+    let mut raw_path = Vec::new();
+    for segment in segments {
+        raw_path.push(b'/');
+        raw_path.extend(percent_decode(segment.as_bytes()));
+    }
+    let path = PathBuf::from(OsStr::from_bytes(&raw_path));
+    debug_assert!(path.is_absolute(),
+                  "to_file_path() failed to produce an absolute Path");
+    Ok(path)
+}
+
+/// On Windows, turning URL path segments into a path is delegated to
+/// `file_url_segments_to_pathbuf_windows`.
+#[cfg(windows)]
+fn file_url_segments_to_pathbuf(segments: str::Split<char>) -> Result<PathBuf, ()> {
+ file_url_segments_to_pathbuf_windows(segments)
+}
+
+/// Rebuild a Windows path from URL path segments.
+///
+/// The first segment must be a drive letter followed by `:` (e.g. `C:`); the remaining
+/// segments are percent-decoded and joined with `\`.
+/// Returns `Err` if there is no such first segment or a decoded segment is not UTF-8.
+// Build this unconditionally to alleviate https://github.com/servo/rust-url/issues/102
+#[cfg_attr(not(windows), allow(dead_code))]
+fn file_url_segments_to_pathbuf_windows(mut segments: str::Split<char>) -> Result<PathBuf, ()> {
+    let drive = try!(segments.next().ok_or(()));
+    let is_drive_segment = drive.len() == 2
+        && drive.starts_with(parser::ascii_alpha)
+        && drive.as_bytes()[1] == b':';
+    if !is_drive_segment {
+        return Err(())
+    }
+    let mut windows_path = drive.to_owned();
+    for segment in segments {
+        windows_path.push('\\');
+
+        // Currently non-unicode windows paths cannot be represented
+        let decoded_bytes = percent_decode(segment.as_bytes()).collect();
+        let decoded = try!(String::from_utf8(decoded_bytes).map_err(|_| ()));
+        windows_path.push_str(&decoded);
+    }
+    let path = PathBuf::from(windows_path);
+    debug_assert!(path.is_absolute(),
+                  "to_file_path() failed to produce an absolute Path");
+    Ok(path)
+}
+
+fn io_error<T>(reason: &str) -> io::Result<T> {
+ Err(io::Error::new(io::ErrorKind::InvalidData, reason))
+}
+
+/// Implementation detail of `Url::query_pairs_mut`. Typically not used directly.
+///
+/// When a value of this type is dropped, `fragment` is handed back to `url`.
+pub struct UrlQuery<'a> {
+ // The URL borrowed for the lifetime of this value.
+ url: &'a mut Url,
+ // Presumably the URL's fragment, set aside while the query is edited — confirm
+ // against `Url::query_pairs_mut`.
+ fragment: Option<String>,
+}
+
+/// Dropping a `UrlQuery` hands the saved fragment back to the URL.
+impl<'a> Drop for UrlQuery<'a> {
+    fn drop(&mut self) {
+        let saved_fragment = self.fragment.take();
+        self.url.restore_already_parsed_fragment(saved_fragment)
+    }
+}
diff --git a/third_party/rust/url/src/origin.rs b/third_party/rust/url/src/origin.rs
new file mode 100644
index 000000000..2217c94fe
--- /dev/null
+++ b/third_party/rust/url/src/origin.rs
@@ -0,0 +1,114 @@
+// Copyright 2016 The rust-url developers.
+//
+// Licensed under the Apache License, Version 2.0 <LICENSE-APACHE or
+// http://www.apache.org/licenses/LICENSE-2.0> or the MIT license
+// <LICENSE-MIT or http://opensource.org/licenses/MIT>, at your
+// option. This file may not be copied, modified, or distributed
+// except according to those terms.
+
+#[cfg(feature = "heapsize")] use heapsize::HeapSizeOf;
+use host::Host;
+use idna::domain_to_unicode;
+use parser::default_port;
+use std::sync::atomic::{AtomicUsize, ATOMIC_USIZE_INIT, Ordering};
+use Url;
+
+/// Compute the origin of `url`.
+///
+/// * `blob` URLs take the origin of the URL parsed from their path,
+///   or a fresh opaque origin when that path does not parse.
+/// * `ftp`, `gopher`, `http`, `https`, `ws` and `wss` URLs get a (scheme, host, port) tuple.
+/// * Everything else, `file` included, gets a fresh opaque origin.
+pub fn url_origin(url: &Url) -> Origin {
+    let scheme = url.scheme();
+    match scheme {
+        "blob" => match Url::parse(url.path()) {
+            Ok(ref inner) => url_origin(inner),
+            Err(_) => Origin::new_opaque(),
+        },
+        "ftp" | "gopher" | "http" | "https" | "ws" | "wss" => {
+            let host = url.host().unwrap().to_owned();
+            let port = url.port_or_known_default().unwrap();
+            Origin::Tuple(scheme.to_owned(), host, port)
+        },
+        // TODO: Figure out what to do if the scheme is a file
+        "file" => Origin::new_opaque(),
+        _ => Origin::new_opaque()
+    }
+}
+
+/// The origin of an URL
+///
+/// Two origins are equal when they are the same kind and all their parts are equal.
+#[derive(PartialEq, Eq, Clone, Debug)]
+pub enum Origin {
+ /// A globally unique identifier
+ Opaque(OpaqueOrigin),
+
+ /// Consists of the URL's scheme, host and port
+ Tuple(String, Host<String>, u16)
+}
+
+/// Heap usage of an origin: the scheme and host of a tuple origin, nothing otherwise.
+#[cfg(feature = "heapsize")]
+impl HeapSizeOf for Origin {
+    fn heap_size_of_children(&self) -> usize {
+        if let Origin::Tuple(ref scheme, ref host, _) = *self {
+            let scheme_size = scheme.heap_size_of_children();
+            scheme_size + host.heap_size_of_children()
+        } else {
+            0
+        }
+    }
+}
+
+
+impl Origin {
+    /// Creates a new opaque origin that is only equal to itself.
+    pub fn new_opaque() -> Origin {
+        // Each call takes the next value of a process-wide counter.
+        static COUNTER: AtomicUsize = ATOMIC_USIZE_INIT;
+        let id = COUNTER.fetch_add(1, Ordering::SeqCst);
+        Origin::Opaque(OpaqueOrigin(id))
+    }
+
+    /// Return whether this origin is a (scheme, host, port) tuple
+    /// (as opposed to an opaque origin).
+    pub fn is_tuple(&self) -> bool {
+        match *self {
+            Origin::Tuple(..) => true,
+            Origin::Opaque(_) => false,
+        }
+    }
+
+    /// https://html.spec.whatwg.org/multipage/#ascii-serialisation-of-an-origin
+    ///
+    /// Opaque origins serialize as `null`; the port is left out when it is the
+    /// default port of the scheme.
+    pub fn ascii_serialization(&self) -> String {
+        let (scheme, host, port) = match *self {
+            Origin::Opaque(_) => return "null".to_owned(),
+            Origin::Tuple(ref scheme, ref host, port) => (scheme, host, port),
+        };
+        match default_port(scheme) {
+            Some(known) if known == port => format!("{}://{}", scheme, host),
+            _ => format!("{}://{}:{}", scheme, host, port),
+        }
+    }
+
+    /// https://html.spec.whatwg.org/multipage/#unicode-serialisation-of-an-origin
+    ///
+    /// Same as `ascii_serialization`, except that a domain host is first converted
+    /// with `domain_to_unicode` (conversion errors are ignored).
+    pub fn unicode_serialization(&self) -> String {
+        let (scheme, host, port) = match *self {
+            Origin::Opaque(_) => return "null".to_owned(),
+            Origin::Tuple(ref scheme, ref host, port) => (scheme, host, port),
+        };
+        let unicode_host = match *host {
+            Host::Domain(ref domain) => {
+                let (unicode_domain, _errors) = domain_to_unicode(domain);
+                Host::Domain(unicode_domain)
+            }
+            _ => host.clone()
+        };
+        match default_port(scheme) {
+            Some(known) if known == port => format!("{}://{}", scheme, unicode_host),
+            _ => format!("{}://{}:{}", scheme, unicode_host, port),
+        }
+    }
+}
+
+/// Opaque identifier for URLs that have file or other schemes
+///
+/// Wraps the counter value handed out by `Origin::new_opaque`.
+#[derive(Eq, PartialEq, Clone, Debug)]
+pub struct OpaqueOrigin(usize);
+
+#[cfg(feature = "heapsize")]
+known_heap_size!(0, OpaqueOrigin);
diff --git a/third_party/rust/url/src/parser.rs b/third_party/rust/url/src/parser.rs
new file mode 100644
index 000000000..2945432fc
--- /dev/null
+++ b/third_party/rust/url/src/parser.rs
@@ -0,0 +1,1179 @@
+// Copyright 2013-2016 The rust-url developers.
+//
+// Licensed under the Apache License, Version 2.0 <LICENSE-APACHE or
+// http://www.apache.org/licenses/LICENSE-2.0> or the MIT license
+// <LICENSE-MIT or http://opensource.org/licenses/MIT>, at your
+// option. This file may not be copied, modified, or distributed
+// except according to those terms.
+
+use std::ascii::AsciiExt;
+use std::error::Error;
+use std::fmt::{self, Formatter, Write};
+use std::str;
+
+use Url;
+use encoding::EncodingOverride;
+use host::{Host, HostInternal};
+use percent_encoding::{
+ utf8_percent_encode, percent_encode,
+ SIMPLE_ENCODE_SET, DEFAULT_ENCODE_SET, USERINFO_ENCODE_SET, QUERY_ENCODE_SET,
+ PATH_SEGMENT_ENCODE_SET
+};
+
+/// Result type used throughout the parser: `T` on success, a `ParseError` otherwise.
+pub type ParseResult<T> = Result<T, ParseError>;
+
+// Generates the `ParseError` enum from a list of `Variant => "description",` pairs,
+// together with an `Error` impl whose `description()` returns the matching text.
+macro_rules! simple_enum_error {
+ ($($name: ident => $description: expr,)+) => {
+ /// Errors that can occur during parsing.
+ #[derive(PartialEq, Eq, Clone, Copy, Debug)]
+ pub enum ParseError {
+ $(
+ $name,
+ )+
+ }
+
+ impl Error for ParseError {
+ fn description(&self) -> &str {
+ match *self {
+ $(
+ ParseError::$name => $description,
+ )+
+ }
+ }
+ }
+ }
+}
+
+simple_enum_error! {
+ EmptyHost => "empty host",
+ IdnaError => "invalid international domain name",
+ InvalidPort => "invalid port number",
+ InvalidIpv4Address => "invalid IPv4 address",
+ InvalidIpv6Address => "invalid IPv6 address",
+ InvalidDomainCharacter => "invalid domain character",
+ RelativeUrlWithoutBase => "relative URL without a base",
+ RelativeUrlWithCannotBeABaseBase => "relative URL with a cannot-be-a-base base",
+ SetHostOnCannotBeABaseUrl => "a cannot-be-a-base URL doesn’t have a host to set",
+ Overflow => "URLs more than 4 GB are not supported",
+}
+
+/// A `ParseError` is formatted from its `description()` text.
+impl fmt::Display for ParseError {
+ fn fmt(&self, fmt: &mut Formatter) -> fmt::Result {
+ self.description().fmt(fmt)
+ }
+}
+
+/// Any IDNA processing error becomes `ParseError::IdnaError`; its details are discarded.
+impl From<::idna::uts46::Errors> for ParseError {
+ fn from(_: ::idna::uts46::Errors) -> ParseError { ParseError::IdnaError }
+}
+
+/// Classification of a URL scheme, as needed by the parser.
+#[derive(Copy, Clone)]
+pub enum SchemeType {
+    /// The `file` scheme.
+    File,
+    /// `http`, `https`, `ws`, `wss`, `ftp` or `gopher`.
+    SpecialNotFile,
+    /// Any other scheme.
+    NotSpecial,
+}
+
+impl SchemeType {
+    /// Whether the scheme is special, i.e. `file` or one of the `SpecialNotFile` schemes.
+    pub fn is_special(&self) -> bool {
+        match *self {
+            SchemeType::File | SchemeType::SpecialNotFile => true,
+            SchemeType::NotSpecial => false,
+        }
+    }
+
+    /// Whether the scheme is `file`.
+    pub fn is_file(&self) -> bool {
+        match *self {
+            SchemeType::File => true,
+            SchemeType::SpecialNotFile | SchemeType::NotSpecial => false,
+        }
+    }
+
+    /// Classify a scheme name. The comparison is exact, so the name is expected
+    /// to be in lower case already.
+    pub fn from(s: &str) -> Self {
+        match s {
+            "file" => SchemeType::File,
+            "http" | "https" | "ws" | "wss" | "ftp" | "gopher" => SchemeType::SpecialNotFile,
+            _ => SchemeType::NotSpecial,
+        }
+    }
+}
+
+/// Return the default port of a scheme, or `None` for a scheme that has none.
+///
+/// The comparison is exact, so the name is expected to be in lower case already.
+pub fn default_port(scheme: &str) -> Option<u16> {
+    let port = match scheme {
+        "ftp" => 21,
+        "gopher" => 70,
+        "http" | "ws" => 80,
+        "https" | "wss" => 443,
+        _ => return None,
+    };
+    Some(port)
+}
+
+/// Parser input: a cursor over the characters of the string being parsed.
+///
+/// Cloning is used to look ahead without consuming anything.
+#[derive(Clone)]
+pub struct Input<'i> {
+ // Remaining characters; tabs and newlines are still in here and get skipped on read.
+ chars: str::Chars<'i>,
+}
+
+impl<'i> Input<'i> {
+    /// Create an input that does not report syntax violations.
+    pub fn new(input: &'i str) -> Self {
+        Input::with_log(input, None)
+    }
+
+    /// Create an input over `original_input`, with leading and trailing characters
+    /// matched by `c0_control_or_space` removed.
+    ///
+    /// When a logger is given, it is told about such trimming and about tabs or
+    /// newlines found inside the input.
+    pub fn with_log(original_input: &'i str, log_syntax_violation: Option<&Fn(&'static str)>)
+                    -> Self {
+        let trimmed = original_input.trim_matches(c0_control_or_space);
+        if let Some(log) = log_syntax_violation {
+            // Trimming can only shorten the string, so a different length means it happened.
+            if trimmed.len() != original_input.len() {
+                log("leading or trailing control or space character are ignored in URLs")
+            }
+            if trimmed.chars().any(|c| c == '\t' || c == '\n' || c == '\r') {
+                log("tabs or newlines are ignored in URLs")
+            }
+        }
+        Input { chars: trimmed.chars() }
+    }
+
+    /// Whether nothing is left, ignoring tabs and newlines.
+    #[inline]
+    pub fn is_empty(&self) -> bool {
+        let mut lookahead = self.clone();
+        lookahead.next().is_none()
+    }
+
+    /// Whether the input begins with `p`; nothing is consumed.
+    #[inline]
+    fn starts_with<P: Pattern>(&self, p: P) -> bool {
+        let mut lookahead = self.clone();
+        p.split_prefix(&mut lookahead)
+    }
+
+    /// If the input begins with `p`, return what comes after it.
+    #[inline]
+    pub fn split_prefix<P: Pattern>(&self, p: P) -> Option<Self> {
+        let mut rest = self.clone();
+        match p.split_prefix(&mut rest) {
+            true => Some(rest),
+            false => None,
+        }
+    }
+
+    /// Return the first character, if any, together with the input that follows it.
+    #[inline]
+    fn split_first(&self) -> (Option<char>, Self) {
+        let mut rest = self.clone();
+        let first = rest.next();
+        (first, rest)
+    }
+
+    /// Count the leading characters accepted by `f` and return the input after them.
+    #[inline]
+    fn count_matching<F: Fn(char) -> bool>(&self, f: F) -> (u32, Self) {
+        let mut matched = 0;
+        let mut rest = self.clone();
+        loop {
+            // Advance a copy, and keep it only if the character it yielded matches.
+            let mut probe = rest.clone();
+            match probe.next() {
+                Some(c) if f(c) => {
+                    rest = probe;
+                    matched += 1;
+                }
+                _ => return (matched, rest),
+            }
+        }
+    }
+
+    /// Like `next`, but also return the UTF-8 text of the character as a slice of the input.
+    #[inline]
+    fn next_utf8(&mut self) -> Option<(char, &'i str)> {
+        loop {
+            let before = self.chars.as_str();
+            let c = match self.chars.next() {
+                Some(c) => c,
+                None => return None,
+            };
+            // Tabs and newlines are skipped, as in `next`.
+            if !matches!(c, '\t' | '\n' | '\r') {
+                return Some((c, &before[..c.len_utf8()]))
+            }
+        }
+    }
+}
+
+/// Something that can be matched against the start of an `Input`.
+pub trait Pattern {
+ /// Advance `input` while matching and return whether the pattern matched.
+ /// On a failed match `input` may already have been advanced, so callers
+ /// that need the original position work on a clone.
+ fn split_prefix<'i>(self, input: &mut Input<'i>) -> bool;
+}
+
+/// A character matches when it is the next character of the input.
+impl Pattern for char {
+    fn split_prefix<'i>(self, input: &mut Input<'i>) -> bool {
+        match input.next() {
+            Some(c) => c == self,
+            None => false,
+        }
+    }
+}
+
+/// A string matches when the input yields each of its characters in order.
+impl<'a> Pattern for &'a str {
+    fn split_prefix<'i>(self, input: &mut Input<'i>) -> bool {
+        // `all` stops at the first mismatch, so no further input is consumed after it.
+        self.chars().all(|expected| input.next() == Some(expected))
+    }
+}
+
+/// A predicate matches when the input has a next character and the predicate accepts it.
+impl<F: FnMut(char) -> bool> Pattern for F {
+    fn split_prefix<'i>(mut self, input: &mut Input<'i>) -> bool {
+        match input.next() {
+            Some(c) => self(c),
+            None => false,
+        }
+    }
+}
+
+/// Iterating over an `Input` yields its characters, skipping tabs and newlines.
+impl<'i> Iterator for Input<'i> {
+    type Item = char;
+    fn next(&mut self) -> Option<char> {
+        self.chars.find(|&c| !matches!(c, '\t' | '\n' | '\r'))
+    }
+}
+
+/// State of one run of the URL parser.
+pub struct Parser<'a> {
+ // The URL serialization being built up.
+ pub serialization: String,
+ // Base URL for resolving relative input, if any.
+ pub base_url: Option<&'a Url>,
+ // NOTE(review): presumably the encoding applied to the query string — confirm in `encoding.rs`.
+ pub query_encoding_override: EncodingOverride,
+ // Callback told about syntax violations; `None` disables reporting.
+ pub log_syntax_violation: Option<&'a Fn(&'static str)>,
+ // What the parser is being used for (full parse or a setter).
+ pub context: Context,
+}
+
+/// The purpose a `Parser` is used for; some parsing rules depend on it
+/// (e.g. `parse_scheme` accepts a scheme without a trailing `:` only for `Setter`).
+#[derive(PartialEq, Eq, Copy, Clone)]
+pub enum Context {
+ UrlParser,
+ Setter,
+ PathSegmentSetter,
+}
+
+impl<'a> Parser<'a> {
+    /// Create a parser for use by a `Url` setter: `Setter` context, no base URL,
+    /// no syntax violation logging, UTF-8 query encoding, writing into `serialization`.
+    pub fn for_setter(serialization: String) -> Parser<'a> {
+        Parser {
+            context: Context::Setter,
+            base_url: None,
+            log_syntax_violation: None,
+            query_encoding_override: EncodingOverride::utf8(),
+            serialization: serialization,
+        }
+    }
+
+    /// Report a syntax violation to the logger, if one is installed.
+    fn syntax_violation(&self, reason: &'static str) {
+        match self.log_syntax_violation {
+            Some(log) => log(reason),
+            None => {}
+        }
+    }
+
+    /// Report a syntax violation if `test()` returns true.
+    ///
+    /// `test` is not called at all when no logger is installed.
+    fn syntax_violation_if<F: Fn() -> bool>(&self, reason: &'static str, test: F) {
+        // Skip test if not logging.
+        let log = match self.log_syntax_violation {
+            Some(log) => log,
+            None => return,
+        };
+        if test() {
+            log(reason)
+        }
+    }
+
+    /// https://url.spec.whatwg.org/#concept-basic-url-parser
+    ///
+    /// Parse `input` into a `Url`. Input that starts with a scheme is parsed on its own;
+    /// anything else is resolved against the base URL and fails without one.
+    pub fn parse_url(mut self, input: &str) -> ParseResult<Url> {
+        let input = Input::with_log(input, self.log_syntax_violation);
+        if let Ok(remaining) = self.parse_scheme(input.clone()) {
+            return self.parse_with_scheme(remaining)
+        }
+
+        // No-scheme state
+        let base_url = match self.base_url {
+            Some(base_url) => base_url,
+            None => return Err(ParseError::RelativeUrlWithoutBase),
+        };
+        if input.starts_with('#') {
+            return self.fragment_only(base_url, input)
+        }
+        if base_url.cannot_be_a_base() {
+            return Err(ParseError::RelativeUrlWithCannotBeABaseBase)
+        }
+        let scheme_type = SchemeType::from(base_url.scheme());
+        if scheme_type.is_file() {
+            self.parse_file(input, Some(base_url))
+        } else {
+            self.parse_relative(input, scheme_type, base_url)
+        }
+    }
+
+    /// Parse a scheme from the start of `input` into `self.serialization`, in lower case.
+    ///
+    /// On success, returns the input that follows the `:` terminator. In the `Setter`
+    /// context the `:` may be missing, in which case the returned input is empty.
+    /// On failure `self.serialization` is left empty.
+    pub fn parse_scheme<'i>(&mut self, mut input: Input<'i>) -> Result<Input<'i>, ()> {
+        // An empty input does not start with a letter either.
+        if !input.starts_with(ascii_alpha) {
+            return Err(())
+        }
+        debug_assert!(self.serialization.is_empty());
+        while let Some(c) = input.next() {
+            if c == ':' {
+                return Ok(input)
+            }
+            match c {
+                'a'...'z' | 'A'...'Z' | '0'...'9' | '+' | '-' | '.' => {
+                    self.serialization.push(c.to_ascii_lowercase())
+                }
+                _ => {
+                    self.serialization.clear();
+                    return Err(())
+                }
+            }
+        }
+        // EOF before ':'
+        match self.context {
+            Context::Setter => Ok(input),
+            _ => {
+                self.serialization.clear();
+                Err(())
+            }
+        }
+    }
+
+ /// Continue parsing after a scheme has been written to `self.serialization`.
+ ///
+ /// `input` is what follows the scheme’s `:`. The scheme is classified and parsing
+ /// is handed to the matching state: `parse_file`, `parse_relative`,
+ /// `after_double_slash` or `parse_non_special`.
+ fn parse_with_scheme(mut self, input: Input) -> ParseResult<Url> {
+ // At this point the serialization holds exactly the scheme.
+ let scheme_end = try!(to_u32(self.serialization.len()));
+ let scheme_type = SchemeType::from(&self.serialization);
+ self.serialization.push(':');
+ match scheme_type {
+ SchemeType::File => {
+ self.syntax_violation_if("expected // after file:", || !input.starts_with("//"));
+ // Only a base URL that is itself a `file` URL is passed on.
+ let base_file_url = self.base_url.and_then(|base| {
+ if base.scheme() == "file" { Some(base) } else { None }
+ });
+ // `parse_file` expects to start from an empty serialization.
+ self.serialization.clear();
+ self.parse_file(input, base_file_url)
+ }
+ SchemeType::SpecialNotFile => {
+ // special relative or authority state
+ let (slashes_count, remaining) = input.count_matching(|c| matches!(c, '/' | '\\'));
+ if let Some(base_url) = self.base_url {
+ // Same scheme as the base and fewer than two slashes: resolve relative to the base.
+ if slashes_count < 2 &&
+ base_url.scheme() == &self.serialization[..scheme_end as usize] {
+ // "Cannot-be-a-base" URLs only happen with "not special" schemes.
+ debug_assert!(!base_url.cannot_be_a_base());
+ self.serialization.clear();
+ return self.parse_relative(input, scheme_type, base_url)
+ }
+ }
+ // special authority slashes state
+ self.syntax_violation_if("expected //", || {
+ input.clone().take_while(|&c| matches!(c, '/' | '\\'))
+ .collect::<String>() != "//"
+ });
+ // `remaining` starts after all of the leading slashes and backslashes.
+ self.after_double_slash(remaining, scheme_type, scheme_end)
+ }
+ SchemeType::NotSpecial => self.parse_non_special(input, scheme_type, scheme_end)
+ }
+ }
+
+ /// Scheme other than file, http, https, ws, wss, ftp, gopher.
+ ///
+ /// `input` is what follows the scheme’s `:`. Input starting with `//` has an authority
+ /// and goes to `after_double_slash`; otherwise the URL has no authority and the rest
+ /// is parsed as a path (when it starts with `/`) or as a cannot-be-a-base path.
+ fn parse_non_special(mut self, input: Input, scheme_type: SchemeType, scheme_end: u32)
+ -> ParseResult<Url> {
+ // path or authority state
+ if let Some(input) = input.split_prefix("//") {
+ return self.after_double_slash(input, scheme_type, scheme_end)
+ }
+ // Anarchist URL (no authority)
+ // With no authority, username, host and path all start right after "scheme:".
+ let path_start = try!(to_u32(self.serialization.len()));
+ let username_end = path_start;
+ let host_start = path_start;
+ let host_end = path_start;
+ let host = HostInternal::None;
+ let port = None;
+ let remaining = if let Some(input) = input.split_prefix('/') {
+ // This inner `path_start` is a `usize` for `parse_path`; it shadows the `u32` above
+ // only inside this branch.
+ let path_start = self.serialization.len();
+ self.serialization.push('/');
+ self.parse_path(scheme_type, &mut false, path_start, input)
+ } else {
+ self.parse_cannot_be_a_base_path(input)
+ };
+ self.with_query_and_fragment(scheme_end, username_end, host_start,
+ host_end, host, port, path_start, remaining)
+ }
+
+ fn parse_file(mut self, input: Input, mut base_file_url: Option<&Url>) -> ParseResult<Url> {
+ // file state
+ debug_assert!(self.serialization.is_empty());
+ let (first_char, input_after_first_char) = input.split_first();
+ match first_char {
+ None => {
+ if let Some(base_url) = base_file_url {
+ // Copy everything except the fragment
+ let before_fragment = match base_url.fragment_start {
+ Some(i) => &base_url.serialization[..i as usize],
+ None => &*base_url.serialization,
+ };
+ self.serialization.push_str(before_fragment);
+ Ok(Url {
+ serialization: self.serialization,
+ fragment_start: None,
+ ..*base_url
+ })
+ } else {
+ self.serialization.push_str("file:///");
+ let scheme_end = "file".len() as u32;
+ let path_start = "file://".len() as u32;
+ Ok(Url {
+ serialization: self.serialization,
+ scheme_end: scheme_end,
+ username_end: path_start,
+ host_start: path_start,
+ host_end: path_start,
+ host: HostInternal::None,
+ port: None,
+ path_start: path_start,
+ query_start: None,
+ fragment_start: None,
+ })
+ }
+ },
+ Some('?') => {
+ if let Some(base_url) = base_file_url {
+ // Copy everything up to the query string
+ let before_query = match (base_url.query_start, base_url.fragment_start) {
+ (None, None) => &*base_url.serialization,
+ (Some(i), _) |
+ (None, Some(i)) => base_url.slice(..i)
+ };
+ self.serialization.push_str(before_query);
+ let (query_start, fragment_start) =
+ try!(self.parse_query_and_fragment(base_url.scheme_end, input));
+ Ok(Url {
+ serialization: self.serialization,
+ query_start: query_start,
+ fragment_start: fragment_start,
+ ..*base_url
+ })
+ } else {
+ self.serialization.push_str("file:///");
+ let scheme_end = "file".len() as u32;
+ let path_start = "file://".len() as u32;
+ let (query_start, fragment_start) =
+ try!(self.parse_query_and_fragment(scheme_end, input));
+ Ok(Url {
+ serialization: self.serialization,
+ scheme_end: scheme_end,
+ username_end: path_start,
+ host_start: path_start,
+ host_end: path_start,
+ host: HostInternal::None,
+ port: None,
+ path_start: path_start,
+ query_start: query_start,
+ fragment_start: fragment_start,
+ })
+ }
+ },
+ Some('#') => {
+ if let Some(base_url) = base_file_url {
+ self.fragment_only(base_url, input)
+ } else {
+ self.serialization.push_str("file:///");
+ let scheme_end = "file".len() as u32;
+ let path_start = "file://".len() as u32;
+ let fragment_start = "file:///".len() as u32;
+ self.parse_fragment(input_after_first_char);
+ Ok(Url {
+ serialization: self.serialization,
+ scheme_end: scheme_end,
+ username_end: path_start,
+ host_start: path_start,
+ host_end: path_start,
+ host: HostInternal::None,
+ port: None,
+ path_start: path_start,
+ query_start: None,
+ fragment_start: Some(fragment_start),
+ })
+ }
+ }
+ Some('/') | Some('\\') => {
+ self.syntax_violation_if("backslash", || first_char == Some('\\'));
+ // file slash state
+ let (next_char, input_after_next_char) = input_after_first_char.split_first();
+ self.syntax_violation_if("backslash", || next_char == Some('\\'));
+ if matches!(next_char, Some('/') | Some('\\')) {
+ // file host state
+ self.serialization.push_str("file://");
+ let scheme_end = "file".len() as u32;
+ let host_start = "file://".len() as u32;
+ let (path_start, host, remaining) =
+ try!(self.parse_file_host(input_after_next_char));
+ let host_end = try!(to_u32(self.serialization.len()));
+ let mut has_host = !matches!(host, HostInternal::None);
+ let remaining = if path_start {
+ self.parse_path_start(SchemeType::File, &mut has_host, remaining)
+ } else {
+ let path_start = self.serialization.len();
+ self.serialization.push('/');
+ self.parse_path(SchemeType::File, &mut has_host, path_start, remaining)
+ };
+ // FIXME: deal with has_host
+ let (query_start, fragment_start) =
+ try!(self.parse_query_and_fragment(scheme_end, remaining));
+ Ok(Url {
+ serialization: self.serialization,
+ scheme_end: scheme_end,
+ username_end: host_start,
+ host_start: host_start,
+ host_end: host_end,
+ host: host,
+ port: None,
+ path_start: host_end,
+ query_start: query_start,
+ fragment_start: fragment_start,
+ })
+ } else {
+ self.serialization.push_str("file:///");
+ let scheme_end = "file".len() as u32;
+ let path_start = "file://".len();
+ if let Some(base_url) = base_file_url {
+ let first_segment = base_url.path_segments().unwrap().next().unwrap();
+ // FIXME: *normalized* drive letter
+ if is_windows_drive_letter(first_segment) {
+ self.serialization.push_str(first_segment);
+ self.serialization.push('/');
+ }
+ }
+ let remaining = self.parse_path(
+ SchemeType::File, &mut false, path_start, input_after_first_char);
+ let (query_start, fragment_start) =
+ try!(self.parse_query_and_fragment(scheme_end, remaining));
+ let path_start = path_start as u32;
+ Ok(Url {
+ serialization: self.serialization,
+ scheme_end: scheme_end,
+ username_end: path_start,
+ host_start: path_start,
+ host_end: path_start,
+ host: HostInternal::None,
+ port: None,
+ path_start: path_start,
+ query_start: query_start,
+ fragment_start: fragment_start,
+ })
+ }
+ }
+ _ => {
+ if starts_with_windows_drive_letter_segment(&input) {
+ base_file_url = None;
+ }
+ if let Some(base_url) = base_file_url {
+ let before_query = match (base_url.query_start, base_url.fragment_start) {
+ (None, None) => &*base_url.serialization,
+ (Some(i), _) |
+ (None, Some(i)) => base_url.slice(..i)
+ };
+ self.serialization.push_str(before_query);
+ self.pop_path(SchemeType::File, base_url.path_start as usize);
+ let remaining = self.parse_path(
+ SchemeType::File, &mut true, base_url.path_start as usize, input);
+ self.with_query_and_fragment(
+ base_url.scheme_end, base_url.username_end, base_url.host_start,
+ base_url.host_end, base_url.host, base_url.port, base_url.path_start, remaining)
+ } else {
+ self.serialization.push_str("file:///");
+ let scheme_end = "file".len() as u32;
+ let path_start = "file://".len();
+ let remaining = self.parse_path(
+ SchemeType::File, &mut false, path_start, input);
+ let (query_start, fragment_start) =
+ try!(self.parse_query_and_fragment(scheme_end, remaining));
+ let path_start = path_start as u32;
+ Ok(Url {
+ serialization: self.serialization,
+ scheme_end: scheme_end,
+ username_end: path_start,
+ host_start: path_start,
+ host_end: path_start,
+ host: HostInternal::None,
+ port: None,
+ path_start: path_start,
+ query_start: query_start,
+ fragment_start: fragment_start,
+ })
+ }
+ }
+ }
+ }
+
+ /// Parse `input` as a reference relative to `base_url` ("relative state"),
+ /// consuming the parser and returning the resulting `Url`.
+ ///
+ /// The first character of `input` selects how much of the base is reused:
+ ///
+ /// * end of input: the base without its fragment;
+ /// * `?`: the base up to its query, followed by the new query and fragment;
+ /// * `#`: the base without its fragment, followed by the new fragment;
+ /// * `/` or `\`: either a new authority (two or more slashes) or a path
+ ///   that replaces the whole base path;
+ /// * anything else: a path resolved against the base path with its last
+ ///   segment popped.
+ ///
+ /// `self.serialization` must be empty on entry.
+ fn parse_relative(mut self, input: Input, scheme_type: SchemeType, base_url: &Url)
+ -> ParseResult<Url> {
+ // relative state
+ debug_assert!(self.serialization.is_empty());
+ let (first_char, input_after_first_char) = input.split_first();
+ match first_char {
+ None => {
+ // Copy everything except the fragment
+ let before_fragment = match base_url.fragment_start {
+ Some(i) => &base_url.serialization[..i as usize],
+ None => &*base_url.serialization,
+ };
+ self.serialization.push_str(before_fragment);
+ // Every offset other than `fragment_start` is taken from the base.
+ Ok(Url {
+ serialization: self.serialization,
+ fragment_start: None,
+ ..*base_url
+ })
+ },
+ Some('?') => {
+ // Copy everything up to the query string
+ let before_query = match (base_url.query_start, base_url.fragment_start) {
+ (None, None) => &*base_url.serialization,
+ (Some(i), _) |
+ (None, Some(i)) => base_url.slice(..i)
+ };
+ self.serialization.push_str(before_query);
+ // `input` (not `input_after_first_char`) is passed on: the callee
+ // consumes the leading `?` itself.
+ let (query_start, fragment_start) =
+ try!(self.parse_query_and_fragment(base_url.scheme_end, input));
+ Ok(Url {
+ serialization: self.serialization,
+ query_start: query_start,
+ fragment_start: fragment_start,
+ ..*base_url
+ })
+ },
+ Some('#') => self.fragment_only(base_url, input),
+ Some('/') | Some('\\') => {
+ let (slashes_count, remaining) = input.count_matching(|c| matches!(c, '/' | '\\'));
+ if slashes_count >= 2 {
+ // Two or more slashes introduce an authority: keep only the
+ // base scheme. Anything other than exactly "//" is reported
+ // as a syntax violation but still accepted.
+ self.syntax_violation_if("expected //", || {
+ input.clone().take_while(|&c| matches!(c, '/' | '\\'))
+ .collect::<String>() != "//"
+ });
+ let scheme_end = base_url.scheme_end;
+ debug_assert!(base_url.byte_at(scheme_end) == b':');
+ // `..scheme_end + 1` includes the ':' after the scheme.
+ self.serialization.push_str(base_url.slice(..scheme_end + 1));
+ return self.after_double_slash(remaining, scheme_type, scheme_end)
+ }
+ // A single slash: keep the base up to and including the first
+ // slash of its path, then parse the rest of the input as the path.
+ let path_start = base_url.path_start;
+ debug_assert!(base_url.byte_at(path_start) == b'/');
+ self.serialization.push_str(base_url.slice(..path_start + 1));
+ let remaining = self.parse_path(
+ scheme_type, &mut true, path_start as usize, input_after_first_char);
+ self.with_query_and_fragment(
+ base_url.scheme_end, base_url.username_end, base_url.host_start,
+ base_url.host_end, base_url.host, base_url.port, base_url.path_start, remaining)
+ }
+ _ => {
+ // Copy the base up to its query or fragment, drop the last path
+ // segment, and parse the input as the continuation of that path.
+ let before_query = match (base_url.query_start, base_url.fragment_start) {
+ (None, None) => &*base_url.serialization,
+ (Some(i), _) |
+ (None, Some(i)) => base_url.slice(..i)
+ };
+ self.serialization.push_str(before_query);
+ // FIXME spec says just "remove last entry", not the "pop" algorithm
+ self.pop_path(scheme_type, base_url.path_start as usize);
+ let remaining = self.parse_path(
+ scheme_type, &mut true, base_url.path_start as usize, input);
+ self.with_query_and_fragment(
+ base_url.scheme_end, base_url.username_end, base_url.host_start,
+ base_url.host_end, base_url.host, base_url.port, base_url.path_start, remaining)
+ }
+ }
+ }
+
+ /// Parse everything that follows the `//` after a scheme: userinfo, host,
+ /// port, path, query and fragment.
+ ///
+ /// Appends `//` to `self.serialization` first; the offsets stored in the
+ /// returned `Url` are the serialization lengths observed between the
+ /// individual parsing steps, so the order of the calls below matters.
+ fn after_double_slash(mut self, input: Input, scheme_type: SchemeType, scheme_end: u32)
+ -> ParseResult<Url> {
+ self.serialization.push('/');
+ self.serialization.push('/');
+ // authority state
+ let (username_end, remaining) = try!(self.parse_userinfo(input, scheme_type));
+ // host state
+ let host_start = try!(to_u32(self.serialization.len()));
+ let (host_end, host, port, remaining) =
+ try!(self.parse_host_and_port(remaining, scheme_end, scheme_type));
+ // path state
+ let path_start = try!(to_u32(self.serialization.len()));
+ let remaining = self.parse_path_start(
+ scheme_type, &mut true, remaining);
+ self.with_query_and_fragment(scheme_end, username_end, host_start,
+ host_end, host, port, path_start, remaining)
+ }
+
+ /// Parse an optional `username[:password]@` prefix of `input` and append
+ /// its percent-encoded form to `self.serialization`.
+ ///
+ /// The authority is scanned up to the first `/`, `?` or `#` (or `\` for
+ /// special schemes); the *last* `@` found in that range ends the userinfo.
+ /// Without any `@` nothing is written and `input` is returned untouched.
+ ///
+ /// Return (username_end, remaining)
+ fn parse_userinfo<'i>(&mut self, mut input: Input<'i>, scheme_type: SchemeType)
+ -> ParseResult<(u32, Input<'i>)> {
+ // First pass, on a clone of the input: find the last '@' and remember
+ // how many characters precede it and where the input continues after it.
+ let mut last_at = None;
+ let mut remaining = input.clone();
+ let mut char_count = 0;
+ while let Some(c) = remaining.next() {
+ match c {
+ '@' => {
+ if last_at.is_some() {
+ self.syntax_violation("unencoded @ sign in username or password")
+ } else {
+ self.syntax_violation(
+ "embedding authentification information (username or password) \
+ in an URL is not recommended")
+ }
+ last_at = Some((char_count, remaining.clone()))
+ },
+ '/' | '?' | '#' => break,
+ '\\' if scheme_type.is_special() => break,
+ _ => (),
+ }
+ char_count += 1;
+ }
+ let (mut userinfo_char_count, remaining) = match last_at {
+ // No '@' at all: there is no userinfo.
+ None => return Ok((try!(to_u32(self.serialization.len())), input)),
+ // '@' is the very first character: empty userinfo, just skip the '@'.
+ Some((0, remaining)) => return Ok((try!(to_u32(self.serialization.len())), remaining)),
+ Some(x) => x
+ };
+
+ // Second pass: re-read exactly the userinfo characters from `input`
+ // and serialize them. Only the first ':' separates username from
+ // password; any later ':' is percent-encoded like other characters.
+ let mut username_end = None;
+ while userinfo_char_count > 0 {
+ let (c, utf8_c) = input.next_utf8().unwrap();
+ userinfo_char_count -= 1;
+ if c == ':' && username_end.is_none() {
+ // Start parsing password
+ username_end = Some(try!(to_u32(self.serialization.len())));
+ self.serialization.push(':');
+ } else {
+ self.check_url_code_point(c, &input);
+ self.serialization.extend(utf8_percent_encode(utf8_c, USERINFO_ENCODE_SET));
+ }
+ }
+ // Without a password the username ends where the '@' is about to go.
+ let username_end = match username_end {
+ Some(i) => i,
+ None => try!(to_u32(self.serialization.len())),
+ };
+ self.serialization.push('@');
+ Ok((username_end, remaining))
+ }
+
+ /// Parse a host and an optional `:port` from `input`, appending their
+ /// serialization to `self.serialization`.
+ ///
+ /// A port is written (and returned as `Some`) only when `parse_port`
+ /// yields one; `parse_port` returns `None` for a missing port and for the
+ /// default port of the scheme found in `self.serialization[..scheme_end]`.
+ ///
+ /// Return (host_end, host, port, remaining)
+ fn parse_host_and_port<'i>(&mut self, input: Input<'i>,
+ scheme_end: u32, scheme_type: SchemeType)
+ -> ParseResult<(u32, HostInternal, Option<u16>, Input<'i>)> {
+ let (host, remaining) = try!(
+ Parser::parse_host(input, scheme_type));
+ write!(&mut self.serialization, "{}", host).unwrap();
+ // `host_end` is taken before the port is appended.
+ let host_end = try!(to_u32(self.serialization.len()));
+ let (port, remaining) = if let Some(remaining) = remaining.split_prefix(':') {
+ // Evaluated lazily: the default port is only looked up when needed.
+ let scheme = || default_port(&self.serialization[..scheme_end as usize]);
+ try!(Parser::parse_port(remaining, scheme, self.context))
+ } else {
+ (None, remaining)
+ };
+ if let Some(port) = port {
+ write!(&mut self.serialization, ":{}", port).unwrap()
+ }
+ Ok((host_end, host.into(), port, remaining))
+ }
+
+ /// Parse the host at the start of `input`.
+ ///
+ /// The host ends at the first `/`, `?` or `#`, at a `\` for special
+ /// schemes, or at a `:` that is not inside square brackets (so the colons
+ /// of a bracketed IPv6 literal do not end it).
+ ///
+ /// Returns the parsed host and the input positioned after it, or
+ /// `ParseError::EmptyHost` when a special scheme has an empty host.
+ pub fn parse_host<'i>(mut input: Input<'i>, scheme_type: SchemeType)
+ -> ParseResult<(Host<String>, Input<'i>)> {
+ // Undo the Input abstraction here to avoid allocating in the common case
+ // where the host part of the input does not contain any tab or newline
+ let input_str = input.chars.as_str();
+ let mut inside_square_brackets = false;
+ let mut has_ignored_chars = false;
+ // Number of host characters excluding tab / newline characters.
+ let mut non_ignored_chars = 0;
+ // Byte length of the host in `input_str`, ignored characters included.
+ let mut bytes = 0;
+ for c in input_str.chars() {
+ match c {
+ ':' if !inside_square_brackets => break,
+ '\\' if scheme_type.is_special() => break,
+ '/' | '?' | '#' => break,
+ '\t' | '\n' | '\r' => {
+ has_ignored_chars = true;
+ }
+ '[' => {
+ inside_square_brackets = true;
+ non_ignored_chars += 1
+ }
+ ']' => {
+ inside_square_brackets = false;
+ non_ignored_chars += 1
+ }
+ _ => non_ignored_chars += 1
+ }
+ bytes += c.len_utf8();
+ }
+ let replaced: String;
+ let host_str;
+ {
+ // NOTE(review): this relies on `Input`'s iterator skipping tab and
+ // newline characters, so that taking `non_ignored_chars` items
+ // consumes the whole host -- confirm against `Input`'s definition.
+ let host_input = input.by_ref().take(non_ignored_chars);
+ if has_ignored_chars {
+ // Slow path: build a copy of the host from the iterator's output.
+ replaced = host_input.collect();
+ host_str = &*replaced
+ } else {
+ // Fast path: advance `input` past the host and borrow the bytes.
+ for _ in host_input {}
+ host_str = &input_str[..bytes]
+ }
+ }
+ if scheme_type.is_special() && host_str.is_empty() {
+ return Err(ParseError::EmptyHost)
+ }
+ let host = try!(Host::parse(host_str));
+ Ok((host, input))
+ }
+
+ /// Parse the host of a `file:` URL from the start of `input`.
+ ///
+ /// The host ends at the first `/`, `\`, `?` or `#`.
+ ///
+ /// Returns `(is_host, host, remaining)`:
+ ///
+ /// * if the candidate host is a Windows drive letter, it is not a host at
+ ///   all: returns `(false, HostInternal::None, input)` with the *original*
+ ///   input so that the caller parses it as part of the path;
+ /// * otherwise returns `true`, the host, and the input after the host.
+ ///   An empty host and `localhost` both yield `HostInternal::None` and
+ ///   write nothing; any other host is appended to `self.serialization`.
+ pub fn parse_file_host<'i>(&mut self, input: Input<'i>)
+ -> ParseResult<(bool, HostInternal, Input<'i>)> {
+ // Undo the Input abstraction here to avoid allocating in the common case
+ // where the host part of the input does not contain any tab or newline
+ let input_str = input.chars.as_str();
+ let mut has_ignored_chars = false;
+ // Number of host characters excluding tab / newline characters.
+ let mut non_ignored_chars = 0;
+ // Byte length of the host in `input_str`, ignored characters included.
+ let mut bytes = 0;
+ for c in input_str.chars() {
+ match c {
+ '/' | '\\' | '?' | '#' => break,
+ '\t' | '\n' | '\r' => has_ignored_chars = true,
+ _ => non_ignored_chars += 1,
+ }
+ bytes += c.len_utf8();
+ }
+ let replaced: String;
+ let host_str;
+ // Work on a clone so that the untouched `input` can still be returned
+ // in the drive-letter case below.
+ let mut remaining = input.clone();
+ {
+ let host_input = remaining.by_ref().take(non_ignored_chars);
+ if has_ignored_chars {
+ replaced = host_input.collect();
+ host_str = &*replaced
+ } else {
+ for _ in host_input {}
+ host_str = &input_str[..bytes]
+ }
+ }
+ if is_windows_drive_letter(host_str) {
+ return Ok((false, HostInternal::None, input))
+ }
+ let host = if host_str.is_empty() {
+ HostInternal::None
+ } else {
+ match try!(Host::parse(host_str)) {
+ Host::Domain(ref d) if d == "localhost" => HostInternal::None,
+ host => {
+ write!(&mut self.serialization, "{}", host).unwrap();
+ host.into()
+ }
+ }
+ };
+ Ok((true, host, remaining))
+ }
+
+ /// Parse a run of decimal digits at the start of `input` as a port number.
+ ///
+ /// Parsing stops at the first non-digit. In `Context::UrlParser` that
+ /// character must be one of `/`, `\`, `?` or `#`, otherwise the port is
+ /// rejected with `ParseError::InvalidPort`; values above `u16::MAX` are
+ /// rejected the same way.
+ ///
+ /// Returns `None` as the port when there was no digit at all or when the
+ /// value equals `default_port()` (which is only evaluated if digits were
+ /// seen), together with the input positioned after the digits.
+ pub fn parse_port<'i, P>(mut input: Input<'i>, default_port: P,
+ context: Context)
+ -> ParseResult<(Option<u16>, Input<'i>)>
+ where P: Fn() -> Option<u16> {
+     let mut value: u32 = 0;
+     let mut seen_digit = false;
+     loop {
+         let (c, rest) = match input.split_first() {
+             (Some(c), rest) => (c, rest),
+             _ => break,
+         };
+         match c.to_digit(10) {
+             Some(digit) => {
+                 // Checked after every digit, so `value` can never overflow `u32`.
+                 value = value * 10 + digit;
+                 if value > ::std::u16::MAX as u32 {
+                     return Err(ParseError::InvalidPort)
+                 }
+                 seen_digit = true;
+             }
+             None => {
+                 if context == Context::UrlParser && !matches!(c, '/' | '\\' | '?' | '#') {
+                     return Err(ParseError::InvalidPort)
+                 }
+                 break
+             }
+         }
+         input = rest;
+     }
+     if !seen_digit {
+         return Ok((None, input))
+     }
+     let port = Some(value as u16);
+     if port == default_port() {
+         Ok((None, input))
+     } else {
+         Ok((port, input))
+     }
+ }
+
+ /// Path start state: skip one leading path separator, if present, then
+ /// start a new path in `self.serialization` and parse the rest of `input`
+ /// into it.
+ ///
+ /// A leading `/` is always skipped. A leading `\` is skipped (and reported
+ /// as a syntax violation) only for special schemes. Returns the input left
+ /// over once the path has been parsed.
+ pub fn parse_path_start<'i>(&mut self, scheme_type: SchemeType, has_host: &mut bool,
+ mut input: Input<'i>)
+ -> Input<'i> {
+     // Path start state
+     let (first, after_first) = input.split_first();
+     if first == Some('/') {
+         input = after_first
+     } else if first == Some('\\') && scheme_type.is_special() {
+         self.syntax_violation("backslash");
+         input = after_first
+     }
+     // The path always starts with a slash, whether or not the input had one.
+     let new_path_start = self.serialization.len();
+     self.serialization.push('/');
+     self.parse_path(scheme_type, has_host, new_path_start, input)
+ }
+
+ /// Parse path segments from `input` and append them, percent-encoded, to
+ /// `self.serialization`, which must already end with the `/` that opens
+ /// the first segment to be parsed.
+ ///
+ /// `path_start` is the index in `self.serialization` of the first slash
+ /// of the whole path. `..` segments pop the previous segment, `.` segments
+ /// are dropped, and for `file:` URLs a Windows drive letter written with
+ /// `|` is rewritten to use `:`.
+ ///
+ /// In `Context::UrlParser` parsing stops before `?` or `#`; in
+ /// `Context::PathSegmentSetter` slashes and backslashes are not treated
+ /// as separators and `PATH_SEGMENT_ENCODE_SET` is used instead of
+ /// `DEFAULT_ENCODE_SET`.
+ ///
+ /// `*has_host` is reset to `false` when a Windows drive letter is found
+ /// in a `file:` URL. Returns the unparsed rest of the input.
+ pub fn parse_path<'i>(&mut self, scheme_type: SchemeType, has_host: &mut bool,
+ path_start: usize, mut input: Input<'i>)
+ -> Input<'i> {
+ // Relative path state
+ debug_assert!(self.serialization.ends_with("/"));
+ // Outer loop: one iteration per path segment.
+ loop {
+ let segment_start = self.serialization.len();
+ let mut ends_with_slash = false;
+ // Inner loop: one iteration per character of the current segment.
+ loop {
+ let input_before_c = input.clone();
+ let (c, utf8_c) = if let Some(x) = input.next_utf8() { x } else { break };
+ match c {
+ '/' if self.context != Context::PathSegmentSetter => {
+ ends_with_slash = true;
+ break
+ },
+ '\\' if self.context != Context::PathSegmentSetter &&
+ scheme_type.is_special() => {
+ self.syntax_violation("backslash");
+ ends_with_slash = true;
+ break
+ },
+ '?' | '#' if self.context == Context::UrlParser => {
+ // Leave the delimiter in the input for the caller.
+ input = input_before_c;
+ break
+ },
+ _ => {
+ self.check_url_code_point(c, &input);
+ if c == '%' {
+ // "%2E" / "%2e" is written as a literal '.', so that
+ // encoded dot segments are recognized below.
+ let after_percent_sign = input.clone();
+ if matches!(input.next(), Some('2')) &&
+ matches!(input.next(), Some('E') | Some('e')) {
+ self.serialization.push('.');
+ continue
+ }
+ // Not "%2E": rewind to just after the '%'.
+ input = after_percent_sign
+ }
+ if self.context == Context::PathSegmentSetter {
+ self.serialization.extend(utf8_percent_encode(
+ utf8_c, PATH_SEGMENT_ENCODE_SET));
+ } else {
+ self.serialization.extend(utf8_percent_encode(
+ utf8_c, DEFAULT_ENCODE_SET));
+ }
+ }
+ }
+ }
+ // The segment just written decides what happens to the path.
+ match &self.serialization[segment_start..] {
+ ".." => {
+ debug_assert!(self.serialization.as_bytes()[segment_start - 1] == b'/');
+ self.serialization.truncate(segment_start - 1); // Truncate "/.."
+ self.pop_path(scheme_type, path_start);
+ // Keep the invariant that the path ends with a slash here.
+ if !self.serialization[path_start..].ends_with("/") {
+ self.serialization.push('/')
+ }
+ },
+ "." => {
+ self.serialization.truncate(segment_start);
+ },
+ _ => {
+ // Only true when the whole path so far is a lone drive letter.
+ if scheme_type.is_file() && is_windows_drive_letter(
+ &self.serialization[path_start + 1..]
+ ) {
+ // Normalize "C|" to "C:".
+ if self.serialization.ends_with('|') {
+ self.serialization.pop();
+ self.serialization.push(':');
+ }
+ if *has_host {
+ self.syntax_violation("file: with host and Windows drive letter");
+ *has_host = false; // FIXME account for this in callers
+ }
+ }
+ if ends_with_slash {
+ self.serialization.push('/')
+ }
+ }
+ }
+ if !ends_with_slash {
+ break
+ }
+ }
+ input
+ }
+
+ /// Remove the last segment of the path that starts at `path_start` in
+ /// `self.serialization`, keeping the slash that precedes it.
+ ///
+ /// Does nothing when the serialization is not longer than `path_start`,
+ /// or when the scheme is `file:` and the last segment is a Windows drive
+ /// letter. Panics if the path contains no slash at all.
+ ///
+ /// https://url.spec.whatwg.org/#pop-a-urls-path
+ fn pop_path(&mut self, scheme_type: SchemeType, path_start: usize) {
+ if self.serialization.len() > path_start {
+ let slash_position = self.serialization[path_start..].rfind('/').unwrap();
+ // + 1 since rfind returns the position before the slash.
+ let segment_start = path_start + slash_position + 1;
+ // Don’t pop a Windows drive letter
+ // FIXME: *normalized* Windows drive letter
+ if !(
+ scheme_type.is_file() &&
+ is_windows_drive_letter(&self.serialization[segment_start..])
+ ) {
+ self.serialization.truncate(segment_start);
+ }
+ }
+
+ }
+
+ /// Parse the opaque path of a cannot-be-a-base URL, appending it to
+ /// `self.serialization` percent-encoded with `SIMPLE_ENCODE_SET`.
+ ///
+ /// In `Context::UrlParser` parsing stops at the first `?` or `#`, which
+ /// is left in the returned input; in other contexts those characters are
+ /// part of the path. Returns the unparsed rest of the input.
+ pub fn parse_cannot_be_a_base_path<'i>(&mut self, mut input: Input<'i>) -> Input<'i> {
+ loop {
+ // Kept so that the delimiter can be handed back unconsumed.
+ let input_before_c = input.clone();
+ match input.next_utf8() {
+ Some(('?', _)) | Some(('#', _)) if self.context == Context::UrlParser => {
+ return input_before_c
+ }
+ Some((c, utf8_c)) => {
+ self.check_url_code_point(c, &input);
+ self.serialization.extend(utf8_percent_encode(
+ utf8_c, SIMPLE_ENCODE_SET));
+ }
+ None => return input
+ }
+ }
+ }
+
+ /// Finish parsing: parse the query and fragment left in `remaining`, then
+ /// assemble the `Url` from the finished serialization and the component
+ /// offsets collected by the caller.
+ fn with_query_and_fragment(mut self, scheme_end: u32, username_end: u32,
+ host_start: u32, host_end: u32, host: HostInternal,
+ port: Option<u16>, path_start: u32, remaining: Input)
+ -> ParseResult<Url> {
+     // (query_start, fragment_start)
+     let tail = try!(self.parse_query_and_fragment(scheme_end, remaining));
+     let url = Url {
+         serialization: self.serialization,
+         scheme_end: scheme_end,
+         username_end: username_end,
+         host_start: host_start,
+         host_end: host_end,
+         host: host,
+         port: port,
+         path_start: path_start,
+         query_start: tail.0,
+         fragment_start: tail.1,
+     };
+     Ok(url)
+ }
+
+ /// Parse the optional `?query` and `#fragment` at the start of `input`
+ /// and append them to `self.serialization`.
+ ///
+ /// `input` must be empty or start with `?` or `#`. Anything else is a
+ /// programming error in the caller and panics, reporting the unexpected
+ /// character.
+ ///
+ /// Return (query_start, fragment_start)
+ fn parse_query_and_fragment(&mut self, scheme_end: u32, mut input: Input)
+ -> ParseResult<(Option<u32>, Option<u32>)> {
+     let mut query_start = None;
+     match input.next() {
+         Some('#') => {}
+         Some('?') => {
+             query_start = Some(try!(to_u32(self.serialization.len())));
+             self.serialization.push('?');
+             let remaining = self.parse_query(scheme_end, input);
+             if let Some(remaining) = remaining {
+                 // The query was terminated by '#': a fragment follows.
+                 input = remaining
+             } else {
+                 return Ok((query_start, None))
+             }
+         }
+         None => return Ok((None, None)),
+         // The message used to contain `{:?}` without an argument, so the
+         // offending character was never reported.
+         Some(c) => panic!(
+             "Programming error. parse_query_and_fragment() called without ? or # {:?}", c)
+     }
+
+     let fragment_start = try!(to_u32(self.serialization.len()));
+     self.serialization.push('#');
+     self.parse_fragment(input);
+     Ok((query_start, Some(fragment_start)))
+ }
+
+ /// Parse a query string (the leading `?` already consumed and written)
+ /// and append it, percent-encoded with `QUERY_ENCODE_SET`, to
+ /// `self.serialization`.
+ ///
+ /// In `Context::UrlParser` the query ends at the first `#`; the input
+ /// after that `#` is returned as `Some`. Otherwise the whole input is the
+ /// query and `None` is returned.
+ ///
+ /// `self.query_encoding_override` is applied only when the scheme in
+ /// `self.serialization[..scheme_end]` is one of `http`, `https`, `file`,
+ /// `ftp` or `gopher`; every other scheme is encoded as UTF-8.
+ pub fn parse_query<'i>(&mut self, scheme_end: u32, mut input: Input<'i>)
+ -> Option<Input<'i>> {
+ let mut query = String::new(); // FIXME: use a streaming decoder instead
+ let mut remaining = None;
+ while let Some(c) = input.next() {
+ if c == '#' && self.context == Context::UrlParser {
+ remaining = Some(input);
+ break
+ } else {
+ self.check_url_code_point(c, &input);
+ query.push(c);
+ }
+ }
+
+ let encoding = match &self.serialization[..scheme_end as usize] {
+ "http" | "https" | "file" | "ftp" | "gopher" => self.query_encoding_override,
+ _ => EncodingOverride::utf8(),
+ };
+ // Convert to the target encoding first, then percent-encode the bytes.
+ let query_bytes = encoding.encode(query.into());
+ self.serialization.extend(percent_encode(&query_bytes, QUERY_ENCODE_SET));
+ remaining
+ }
+
+ /// Build a URL that is `base_url` with its fragment replaced by the one
+ /// in `input`.
+ ///
+ /// `input` must start with `#` and `self.serialization` must be empty
+ /// (both checked with `debug_assert!` only).
+ fn fragment_only(mut self, base_url: &Url, mut input: Input) -> ParseResult<Url> {
+ let before_fragment = match base_url.fragment_start {
+ Some(i) => base_url.slice(..i),
+ None => &*base_url.serialization,
+ };
+ debug_assert!(self.serialization.is_empty());
+ // Reserve room for the copied base plus the remaining input up front.
+ self.serialization.reserve(before_fragment.len() + input.chars.as_str().len());
+ self.serialization.push_str(before_fragment);
+ self.serialization.push('#');
+ // Consume the '#' that was written above.
+ let next = input.next();
+ debug_assert!(next == Some('#'));
+ self.parse_fragment(input);
+ Ok(Url {
+ serialization: self.serialization,
+ // The new '#' sits right after the part copied from the base.
+ fragment_start: Some(try!(to_u32(before_fragment.len()))),
+ ..*base_url
+ })
+ }
+
+ /// Append the fragment in `input` (without its leading `#`) to
+ /// `self.serialization`.
+ ///
+ /// NUL characters are dropped and reported as a syntax violation; every
+ /// other character is copied as-is, without percent-encoding.
+ pub fn parse_fragment(&mut self, mut input: Input) {
+ while let Some(c) = input.next() {
+ if c == '\0' {
+ self.syntax_violation("NULL characters are ignored in URL fragment identifiers")
+ } else {
+ self.check_url_code_point(c, &input);
+ self.serialization.push(c); // No percent-encoding here.
+ }
+ }
+ }
+
+ /// Report a syntax violation for `c` if a violation logger is installed.
+ ///
+ /// A `%` must be followed by two ASCII hex digits in `input`; any other
+ /// character must be a URL code point. This only logs: it never fails and
+ /// does not consume `input` (a clone is inspected).
+ ///
+ /// The call sites visible here pass `input` positioned just after `c`.
+ fn check_url_code_point(&self, c: char, input: &Input) {
+ // Skip all the work when nobody is listening.
+ if let Some(log) = self.log_syntax_violation {
+ if c == '%' {
+ let mut input = input.clone();
+ if !matches!((input.next(), input.next()), (Some(a), Some(b))
+ if is_ascii_hex_digit(a) && is_ascii_hex_digit(b)) {
+ log("expected 2 hex digits after %")
+ }
+ } else if !is_url_code_point(c) {
+ log("non-URL code point")
+ }
+ }
+ }
+}
+
+ /// Whether `c` is an ASCII hexadecimal digit (`0-9`, `a-f` or `A-F`).
+ #[inline]
+ fn is_ascii_hex_digit(c: char) -> bool {
+     // `char::is_digit` only ever accepts ASCII digits and letters.
+     c.is_digit(16)
+ }
+
+ // Non URL code points:
+ // U+0000 to U+0020 (space)
+ // " # % < > [ \ ] ^ ` { | }
+ // U+007F to U+009F
+ // surrogates
+ // U+FDD0 to U+FDEF
+ // Last two of each plane: U+__FFFE to U+__FFFF for __ in 00 to 10 hex
+ // U+E0000 to U+E0FFF (the plane 14 range below starts at U+E1000)
+ // NOTE(review): confirm against the URL Standard whether U+E0000 to
+ // U+E0FFF is still meant to be excluded.
+ /// Whether `c` is a URL code point. Only used to report syntax violations.
+ #[inline]
+ fn is_url_code_point(c: char) -> bool {
+ matches!(c,
+ 'a'...'z' |
+ 'A'...'Z' |
+ '0'...'9' |
+ '!' | '$' | '&' | '\'' | '(' | ')' | '*' | '+' | ',' | '-' |
+ '.' | '/' | ':' | ';' | '=' | '?' | '@' | '_' | '~' |
+ '\u{A0}'...'\u{D7FF}' | '\u{E000}'...'\u{FDCF}' | '\u{FDF0}'...'\u{FFFD}' |
+ '\u{10000}'...'\u{1FFFD}' | '\u{20000}'...'\u{2FFFD}' |
+ '\u{30000}'...'\u{3FFFD}' | '\u{40000}'...'\u{4FFFD}' |
+ '\u{50000}'...'\u{5FFFD}' | '\u{60000}'...'\u{6FFFD}' |
+ '\u{70000}'...'\u{7FFFD}' | '\u{80000}'...'\u{8FFFD}' |
+ '\u{90000}'...'\u{9FFFD}' | '\u{A0000}'...'\u{AFFFD}' |
+ '\u{B0000}'...'\u{BFFFD}' | '\u{C0000}'...'\u{CFFFD}' |
+ '\u{D0000}'...'\u{DFFFD}' | '\u{E1000}'...'\u{EFFFD}' |
+ '\u{F0000}'...'\u{FFFFD}' | '\u{100000}'...'\u{10FFFD}')
+ }
+
+ /// Whether `ch` is a C0 control character or a space (U+0000 to U+0020).
+ ///
+ /// https://url.spec.whatwg.org/#c0-controls-and-space
+ #[inline]
+ fn c0_control_or_space(ch: char) -> bool {
+     (ch as u32) <= 0x20
+ }
+
+ /// Whether `ch` is an ASCII letter (`a-z` or `A-Z`).
+ ///
+ /// https://url.spec.whatwg.org/#ascii-alpha
+ #[inline]
+ pub fn ascii_alpha(ch: char) -> bool {
+     let lower = ch >= 'a' && ch <= 'z';
+     let upper = ch >= 'A' && ch <= 'Z';
+     lower || upper
+ }
+
+ /// Convert a `usize` offset to `u32`, failing with `ParseError::Overflow`
+ /// when the value does not fit.
+ #[inline]
+ pub fn to_u32(i: usize) -> ParseResult<u32> {
+     if i > ::std::u32::MAX as usize {
+         return Err(ParseError::Overflow)
+     }
+     Ok(i as u32)
+ }
+
+ /// Whether `segment` is exactly a Windows drive letter: an ASCII letter
+ /// followed by `:` or `|`, and nothing else.
+ ///
+ /// This only looks at the string it is given. Checking that the scheme is
+ /// `file:` and that `segment` is the relevant path segment is up to the
+ /// caller.
+ fn is_windows_drive_letter(segment: &str) -> bool {
+ segment.len() == 2
+ && starts_with_windows_drive_letter(segment)
+ }
+
+ /// Whether `s` starts with a Windows drive letter: an ASCII letter
+ /// followed by `:` or `|`.
+ ///
+ /// Returns `false` for strings shorter than two bytes instead of
+ /// panicking on an out-of-bounds index.
+ fn starts_with_windows_drive_letter(s: &str) -> bool {
+     let bytes = s.as_bytes();
+     bytes.len() >= 2
+     && ascii_alpha(bytes[0] as char)
+     && matches!(bytes[1], b':' | b'|')
+ }
+
+ /// Whether `input` starts with a Windows drive letter (an ASCII letter
+ /// followed by `:` or `|`) that is immediately followed by `/`, `\`, `?`
+ /// or `#`. A drive letter at the very end of the input does not count.
+ ///
+ /// Works on a clone, so `input` itself is not advanced.
+ fn starts_with_windows_drive_letter_segment(input: &Input) -> bool {
+     let mut chars = input.clone();
+     match (chars.next(), chars.next(), chars.next()) {
+         (Some(letter), Some(separator), Some(delimiter)) => {
+             ascii_alpha(letter)
+                 && matches!(separator, ':' | '|')
+                 && matches!(delimiter, '/' | '\\' | '?' | '#')
+         }
+         _ => false,
+     }
+ }
diff --git a/third_party/rust/url/src/path_segments.rs b/third_party/rust/url/src/path_segments.rs
new file mode 100644
index 000000000..437a84ee7
--- /dev/null
+++ b/third_party/rust/url/src/path_segments.rs
@@ -0,0 +1,187 @@
+// Copyright 2016 The rust-url developers.
+//
+// Licensed under the Apache License, Version 2.0 <LICENSE-APACHE or
+// http://www.apache.org/licenses/LICENSE-2.0> or the MIT license
+// <LICENSE-MIT or http://opensource.org/licenses/MIT>, at your
+// option. This file may not be copied, modified, or distributed
+// except according to those terms.
+
+use parser::{self, SchemeType, to_u32};
+use std::str;
+use Url;
+
+ /// Exposes methods to manipulate the path of an URL that is not cannot-be-base.
+ ///
+ /// The path always starts with a `/` slash, and is made of slash-separated segments.
+ /// There is always at least one segment (which may be the empty string).
+ ///
+ /// While this value is alive, whatever followed the path in the URL is held in
+ /// `after_path`; it is handed back to the URL when this value is dropped.
+ ///
+ /// Examples:
+ ///
+ /// ```rust
+ /// # use url::Url;
+ /// let mut url = Url::parse("mailto:me@example.com").unwrap();
+ /// assert!(url.path_segments_mut().is_err());
+ ///
+ /// let mut url = Url::parse("http://example.net/foo/index.html").unwrap();
+ /// url.path_segments_mut().unwrap().pop().push("img").push("2/100%.png");
+ /// assert_eq!(url.as_str(), "http://example.net/foo/img/2%2F100%25.png");
+ /// ```
+ pub struct PathSegmentsMut<'a> {
+ // The URL being edited.
+ url: &'a mut Url,
+ // Index in `url.serialization` just after the first slash of the path.
+ after_first_slash: usize,
+ // Value returned by `url.take_after_path()` when this was created
+ // (presumably the query and fragment -- confirm in `Url`).
+ after_path: String,
+ // Length of `url.serialization` right after `take_after_path()` was called.
+ old_after_path_position: u32,
+ }
+
+ // Not re-exported outside the crate
+ /// Start editing the path of `url`: take whatever follows the path out of
+ /// the URL and remember where it was, so that it can be restored when the
+ /// returned `PathSegmentsMut` is dropped.
+ ///
+ /// Panics if the serialization length does not fit in a `u32`.
+ pub fn new(url: &mut Url) -> PathSegmentsMut {
+     let after_path = url.take_after_path();
+     let old_after_path_position = to_u32(url.serialization.len()).unwrap();
+     debug_assert!(url.byte_at(url.path_start) == b'/');
+     // Computed before `url` is moved into the struct.
+     let after_first_slash = url.path_start as usize + "/".len();
+     PathSegmentsMut {
+         url: url,
+         after_first_slash: after_first_slash,
+         after_path: after_path,
+         old_after_path_position: old_after_path_position,
+     }
+ }
+
+ /// Hands the part of the URL that was taken out in `new` back to the URL
+ /// once path editing is finished.
+ impl<'a> Drop for PathSegmentsMut<'a> {
+ fn drop(&mut self) {
+ self.url.restore_after_path(self.old_after_path_position, &self.after_path)
+ }
+ }
+
+ impl<'a> PathSegmentsMut<'a> {
+ /// Remove all segments in the path, leaving the minimal `url.path() == "/"`.
+ ///
+ /// Returns `&mut Self` so that method calls can be chained.
+ ///
+ /// Example:
+ ///
+ /// ```rust
+ /// # use url::Url;
+ /// let mut url = Url::parse("https://github.com/servo/rust-url/").unwrap();
+ /// url.path_segments_mut().unwrap().clear().push("logout");
+ /// assert_eq!(url.as_str(), "https://github.com/logout");
+ /// ```
+ pub fn clear(&mut self) -> &mut Self {
+ // Keep everything up to and including the first slash of the path.
+ self.url.serialization.truncate(self.after_first_slash);
+ self
+ }
+
+ /// Remove the last segment of this URL’s path if it is empty,
+ /// except if there was only one segment to begin with.
+ ///
+ /// In other words, remove one path trailing slash, if any,
+ /// unless it is also the initial slash (so this does nothing if `url.path() == "/"`).
+ ///
+ /// Returns `&mut Self` so that method calls can be chained.
+ ///
+ /// Example:
+ ///
+ /// ```rust
+ /// # use url::Url;
+ /// let mut url = Url::parse("https://github.com/servo/rust-url/").unwrap();
+ /// url.path_segments_mut().unwrap().push("pulls");
+ /// assert_eq!(url.as_str(), "https://github.com/servo/rust-url//pulls");
+ ///
+ /// let mut url = Url::parse("https://github.com/servo/rust-url/").unwrap();
+ /// url.path_segments_mut().unwrap().pop_if_empty().push("pulls");
+ /// assert_eq!(url.as_str(), "https://github.com/servo/rust-url/pulls");
+ /// ```
+ pub fn pop_if_empty(&mut self) -> &mut Self {
+ // Only looks after the first slash, so the initial slash is never removed.
+ if self.url.serialization[self.after_first_slash..].ends_with('/') {
+ self.url.serialization.pop();
+ }
+ self
+ }
+
+ /// Remove the last segment of this URL’s path.
+ ///
+ /// If the path only has one segment, make it empty such that `url.path() == "/"`.
+ ///
+ /// Returns `&mut Self` so that method calls can be chained.
+ pub fn pop(&mut self) -> &mut Self {
+ // No slash after the first one means a single segment: truncate right
+ // after the first slash (offset 0 from `after_first_slash`).
+ let last_slash = self.url.serialization[self.after_first_slash..].rfind('/').unwrap_or(0);
+ self.url.serialization.truncate(self.after_first_slash + last_slash);
+ self
+ }
+
+ /// Append the given segment at the end of this URL’s path.
+ ///
+ /// See the documentation for `.extend()`.
+ ///
+ /// Returns `&mut Self` so that method calls can be chained.
+ pub fn push(&mut self, segment: &str) -> &mut Self {
+ self.extend(Some(segment))
+ }
+
+ /// Append each segment from the given iterator at the end of this URL’s path.
+ ///
+ /// Each segment is percent-encoded like in `Url::parse` or `Url::join`,
+ /// except that `%` and `/` characters are also encoded (to `%25` and `%2F`).
+ /// (This is unlike `Url::parse` where `%` is left as-is in case some of the input
+ /// is already percent-encoded, and `/` denotes a path segment separator.)
+ ///
+ /// Note that, in addition to slashes between new segments,
+ /// this always adds a slash between the existing path and the new segments
+ /// *except* if the existing path is `"/"`.
+ /// If the previous last segment was empty (if the path had a trailing slash)
+ /// the path after `.extend()` will contain two consecutive slashes.
+ /// If that is undesired, call `.pop_if_empty()` first.
+ ///
+ /// To obtain a behavior similar to `Url::join`, call `.pop()` unconditionally first.
+ ///
+ /// Returns `&mut Self` so that method calls can be chained.
+ ///
+ /// Example:
+ ///
+ /// ```rust
+ /// # use url::Url;
+ /// let mut url = Url::parse("https://github.com/").unwrap();
+ /// let org = "servo";
+ /// let repo = "rust-url";
+ /// let issue_number = "188";
+ /// url.path_segments_mut().unwrap().extend(&[org, repo, "issues", issue_number]);
+ /// assert_eq!(url.as_str(), "https://github.com/servo/rust-url/issues/188");
+ /// ```
+ ///
+ /// In order to make sure that parsing the serialization of an URL gives the same URL,
+ /// a segment is ignored if it is `"."` or `".."`:
+ ///
+ /// ```rust
+ /// # use url::Url;
+ /// let mut url = Url::parse("https://github.com/servo").unwrap();
+ /// url.path_segments_mut().unwrap().extend(&["..", "rust-url", ".", "pulls"]);
+ /// assert_eq!(url.as_str(), "https://github.com/servo/rust-url/pulls");
+ /// ```
+ pub fn extend<I>(&mut self, segments: I) -> &mut Self
+ where I: IntoIterator, I::Item: AsRef<str> {
+ let scheme_type = SchemeType::from(self.url.scheme());
+ let path_start = self.url.path_start as usize;
+ self.url.mutate(|parser| {
+ // In this context the parser does not split on slashes.
+ parser.context = parser::Context::PathSegmentSetter;
+ for segment in segments {
+ let segment = segment.as_ref();
+ if matches!(segment, "." | "..") {
+ continue
+ }
+ // Add a separator unless the path is still just the initial "/".
+ if parser.serialization.len() > path_start + 1 {
+ parser.serialization.push('/');
+ }
+ let mut has_host = true; // FIXME account for this?
+ parser.parse_path(scheme_type, &mut has_host, path_start,
+ parser::Input::new(segment));
+ }
+ });
+ self
+ }
+
+ /// For internal testing, not part of the public API.
+ #[doc(hidden)]
+ pub fn assert_url_invariants(&mut self) -> &mut Self {
+ self.url.assert_invariants();
+ self
+ }
+ }
diff --git a/third_party/rust/url/src/percent_encoding.rs b/third_party/rust/url/src/percent_encoding.rs
new file mode 100644
index 000000000..a4fb6177a
--- /dev/null
+++ b/third_party/rust/url/src/percent_encoding.rs
@@ -0,0 +1,344 @@
+// Copyright 2013-2016 The rust-url developers.
+//
+// Licensed under the Apache License, Version 2.0 <LICENSE-APACHE or
+// http://www.apache.org/licenses/LICENSE-2.0> or the MIT license
+// <LICENSE-MIT or http://opensource.org/licenses/MIT>, at your
+// option. This file may not be copied, modified, or distributed
+// except according to those terms.
+
+use encoding;
+use std::ascii::AsciiExt;
+use std::borrow::Cow;
+use std::fmt;
+use std::slice;
+use std::str;
+
+/// Represents a set of characters / bytes that should be percent-encoded.
+///
+/// See [encode sets specification](http://url.spec.whatwg.org/#simple-encode-set).
+///
+/// Different characters need to be encoded in different parts of an URL.
+/// For example, a literal `?` question mark in an URL’s path would indicate
+/// the start of the query string.
+/// A question mark meant to be part of the path therefore needs to be percent-encoded.
+/// In the query string however, a question mark does not have any special meaning
+/// and does not need to be percent-encoded.
+///
+/// A few sets are defined in this module.
+/// Use the [`define_encode_set!`](../macro.define_encode_set!.html) macro to define different ones.
+pub trait EncodeSet: Clone {
+ /// Returns whether `byte` must be percent-encoded. Called with UTF-8 bytes rather than code points.
+ /// Must return true for all non-ASCII bytes: `PercentEncode` asserts that bytes it leaves unencoded are ASCII.
+ fn contains(&self, byte: u8) -> bool;
+}
+
+/// Define a new struct
+/// that implements the [`EncodeSet`](percent_encoding/trait.EncodeSet.html) trait,
+/// for use in [`percent_encode()`](percent_encoding/fn.percent_encode.html)
+/// and related functions.
+///
+/// Parameters are characters to include in the set in addition to those of the base set.
+/// See [encode sets specification](http://url.spec.whatwg.org/#simple-encode-set).
+///
+/// Example
+/// =======
+///
+/// ```rust
+/// #[macro_use] extern crate url;
+/// use url::percent_encoding::{utf8_percent_encode, SIMPLE_ENCODE_SET};
+/// define_encode_set! {
+/// /// This encode set is used in the URL parser for query strings.
+/// pub QUERY_ENCODE_SET = [SIMPLE_ENCODE_SET] | {' ', '"', '#', '<', '>'}
+/// }
+/// # fn main() {
+/// assert_eq!(utf8_percent_encode("foo bar", QUERY_ENCODE_SET).collect::<String>(), "foo%20bar");
+/// # }
+/// ```
+#[macro_export]
+macro_rules! define_encode_set {
+ ($(#[$attr: meta])* pub $name: ident = [$base_set: expr] | {$($ch: pat),*}) => { // attributes, set name, base set, extra character patterns
+ $(#[$attr])* // forward doc comments and other attributes to the generated struct
+ #[derive(Copy, Clone)]
+ #[allow(non_camel_case_types)]
+ pub struct $name; // unit struct: the set carries no data
+
+ impl $crate::percent_encoding::EncodeSet for $name {
+ #[inline]
+ fn contains(&self, byte: u8) -> bool {
+ match byte as char { // patterns are `char` patterns, so the byte is widened first
+ $(
+ $ch => true,
+ )*
+ _ => $base_set.contains(byte) // anything not listed falls back to the base set
+ }
+ }
+ }
+ }
+}
+
+/// This encode set is used for the path of cannot-be-a-base URLs; it contains every byte outside 0x20 to 0x7E.
+#[derive(Copy, Clone)]
+#[allow(non_camel_case_types)]
+pub struct SIMPLE_ENCODE_SET;
+
+impl EncodeSet for SIMPLE_ENCODE_SET {
+ #[inline]
+ fn contains(&self, byte: u8) -> bool {
+ byte < 0x20 || byte > 0x7E // bytes below space, 0x7F (DEL) and every non-ASCII byte
+ }
+}
+
+define_encode_set! {
+ /// This encode set is used in the URL parser for query strings: `SIMPLE_ENCODE_SET` plus space, `"`, `#`, `<` and `>`.
+ pub QUERY_ENCODE_SET = [SIMPLE_ENCODE_SET] | {' ', '"', '#', '<', '>'}
+}
+
+define_encode_set! {
+ /// This encode set is used for path components: `QUERY_ENCODE_SET` plus backtick, `?`, `{` and `}`.
+ pub DEFAULT_ENCODE_SET = [QUERY_ENCODE_SET] | {'`', '?', '{', '}'}
+}
+
+define_encode_set! {
+ /// This encode set is used for a single '/'-separated path segment: `DEFAULT_ENCODE_SET` plus `%` and `/`.
+ pub PATH_SEGMENT_ENCODE_SET = [DEFAULT_ENCODE_SET] | {'%', '/'}
+}
+
+define_encode_set! {
+ /// This encode set is used for username and password: `DEFAULT_ENCODE_SET` plus the characters listed below.
+ pub USERINFO_ENCODE_SET = [DEFAULT_ENCODE_SET] | {
+ '/', ':', ';', '=', '@', '[', '\\', ']', '^', '|'
+ }
+}
+
+/// Return the percent-encoding of the given bytes.
+///
+/// This is unconditional, unlike `percent_encode()` which uses an encode set.
+pub fn percent_encode_byte(byte: u8) -> &'static str { // returns a three-character slice of the static table below
+ let index = usize::from(byte) * 3; // every table entry is three characters: '%' and two hex digits
+ &"\
+ %00%01%02%03%04%05%06%07%08%09%0A%0B%0C%0D%0E%0F\
+ %10%11%12%13%14%15%16%17%18%19%1A%1B%1C%1D%1E%1F\
+ %20%21%22%23%24%25%26%27%28%29%2A%2B%2C%2D%2E%2F\
+ %30%31%32%33%34%35%36%37%38%39%3A%3B%3C%3D%3E%3F\
+ %40%41%42%43%44%45%46%47%48%49%4A%4B%4C%4D%4E%4F\
+ %50%51%52%53%54%55%56%57%58%59%5A%5B%5C%5D%5E%5F\
+ %60%61%62%63%64%65%66%67%68%69%6A%6B%6C%6D%6E%6F\
+ %70%71%72%73%74%75%76%77%78%79%7A%7B%7C%7D%7E%7F\
+ %80%81%82%83%84%85%86%87%88%89%8A%8B%8C%8D%8E%8F\
+ %90%91%92%93%94%95%96%97%98%99%9A%9B%9C%9D%9E%9F\
+ %A0%A1%A2%A3%A4%A5%A6%A7%A8%A9%AA%AB%AC%AD%AE%AF\
+ %B0%B1%B2%B3%B4%B5%B6%B7%B8%B9%BA%BB%BC%BD%BE%BF\
+ %C0%C1%C2%C3%C4%C5%C6%C7%C8%C9%CA%CB%CC%CD%CE%CF\
+ %D0%D1%D2%D3%D4%D5%D6%D7%D8%D9%DA%DB%DC%DD%DE%DF\
+ %E0%E1%E2%E3%E4%E5%E6%E7%E8%E9%EA%EB%EC%ED%EE%EF\
+ %F0%F1%F2%F3%F4%F5%F6%F7%F8%F9%FA%FB%FC%FD%FE%FF\
+ "[index..index + 3] // the "%XX" entry for `byte`, hex digits in upper case
+}
+
+/// Percent-encode the given bytes with the given encode set.
+///
+/// The encode set defines which bytes (in addition to non-ASCII and controls)
+/// need to be percent-encoded.
+/// The choice of this set depends on context.
+/// For example, `?` needs to be encoded in an URL path but not in a query string.
+///
+/// The return value is an iterator of `&str` slices (so it has a `.collect::<String>()` method)
+/// that also implements `Display` and `Into<Cow<str>>`.
+/// The latter returns `Cow::Borrowed` when none of the bytes in `input`
+/// are in the given encode set.
+#[inline]
+pub fn percent_encode<E: EncodeSet>(input: &[u8], encode_set: E) -> PercentEncode<E> {
+ PercentEncode { // lazy: nothing is encoded until the returned iterator is advanced
+ bytes: input,
+ encode_set: encode_set,
+ }
+}
+
+/// Percent-encode the UTF-8 encoding of the given string.
+///
+/// See `percent_encode()` for how to use the return value.
+#[inline]
+pub fn utf8_percent_encode<E: EncodeSet>(input: &str, encode_set: E) -> PercentEncode<E> {
+ percent_encode(input.as_bytes(), encode_set) // a `&str` is already UTF-8, so its bytes are encoded directly
+}
+
+/// The return type of `percent_encode()` and `utf8_percent_encode()`: an iterator of `&str` slices.
+#[derive(Clone)]
+pub struct PercentEncode<'a, E: EncodeSet> {
+ bytes: &'a [u8], // input bytes that have not been yielded yet
+ encode_set: E, // decides which bytes are percent-encoded
+}
+
+impl<'a, E: EncodeSet> Iterator for PercentEncode<'a, E> {
+ type Item = &'a str; // either one "%XX" sequence or a run of unencoded bytes borrowed from the input
+
+ fn next(&mut self) -> Option<&'a str> {
+ if let Some((&first_byte, remaining)) = self.bytes.split_first() {
+ if self.encode_set.contains(first_byte) {
+ self.bytes = remaining;
+ Some(percent_encode_byte(first_byte)) // one encoded byte per item
+ } else {
+ assert!(first_byte.is_ascii()); // enforces the `EncodeSet` contract that non-ASCII bytes are in the set
+ for (i, &byte) in remaining.iter().enumerate() {
+ if self.encode_set.contains(byte) {
+ // 1 for first_byte + i for previous iterations of this loop
+ let (unchanged_slice, remaining) = self.bytes.split_at(1 + i);
+ self.bytes = remaining; // the byte to encode stays at the front for the next call
+ return Some(unsafe { str::from_utf8_unchecked(unchanged_slice) }) // SAFETY: every byte of the slice was asserted to be ASCII above
+ } else {
+ assert!(byte.is_ascii());
+ }
+ }
+ let unchanged_slice = self.bytes; // no further byte needs encoding: yield everything that is left
+ self.bytes = &[][..];
+ Some(unsafe { str::from_utf8_unchecked(unchanged_slice) }) // SAFETY: `first_byte` and every remaining byte were asserted to be ASCII
+ }
+ } else {
+ None
+ }
+ }
+
+ fn size_hint(&self) -> (usize, Option<usize>) {
+ if self.bytes.is_empty() {
+ (0, Some(0))
+ } else {
+ (1, Some(self.bytes.len())) // at least one item; at most one item per remaining byte
+ }
+ }
+}
+
+impl<'a, E: EncodeSet> fmt::Display for PercentEncode<'a, E> {
+ fn fmt(&self, formatter: &mut fmt::Formatter) -> fmt::Result {
+ for c in (*self).clone() { // iterate over a clone: `fmt` only has `&self` and iteration needs `&mut`
+ try!(formatter.write_str(c))
+ }
+ Ok(())
+ }
+}
+
+impl<'a, E: EncodeSet> From<PercentEncode<'a, E>> for Cow<'a, str> {
+ fn from(mut iter: PercentEncode<'a, E>) -> Self {
+ match iter.next() {
+ None => "".into(), // empty input
+ Some(first) => {
+ match iter.next() {
+ None => first.into(), // a single item is returned borrowed, without allocating
+ Some(second) => {
+ let mut string = first.to_owned(); // two or more items: concatenate into an owned String
+ string.push_str(second);
+ string.extend(iter);
+ string.into()
+ }
+ }
+ }
+ }
+ }
+}
+
+/// Percent-decode the given bytes.
+///
+/// The return value is an iterator of decoded `u8` bytes
+/// that also implements `Into<Cow<u8>>`
+/// (which returns `Cow::Borrowed` when `input` contains no percent-encoded sequence)
+/// and has `decode_utf8()` and `decode_utf8_lossy()` methods.
+#[inline]
+pub fn percent_decode<'a>(input: &'a [u8]) -> PercentDecode<'a> {
+ PercentDecode { // lazy: nothing is decoded until the returned iterator is advanced
+ bytes: input.iter()
+ }
+}
+
+/// The return type of `percent_decode()`: an iterator of decoded `u8` bytes.
+#[derive(Clone)]
+pub struct PercentDecode<'a> {
+ bytes: slice::Iter<'a, u8>, // input bytes that have not been consumed yet
+}
+
+fn after_percent_sign(iter: &mut slice::Iter<u8>) -> Option<u8> { // called once a '%' has been consumed from `iter`
+ let initial_iter = iter.clone(); // saved so that `iter` can be rewound on failure
+ let h = iter.next().and_then(|&b| (b as char).to_digit(16)); // high hex digit, upper or lower case
+ let l = iter.next().and_then(|&b| (b as char).to_digit(16)); // low hex digit
+ if let (Some(h), Some(l)) = (h, l) {
+ Some(h as u8 * 0x10 + l as u8) // both digits are below 16, so the result fits in a u8
+ } else {
+ *iter = initial_iter; // not a valid "%XX" sequence: leave the following bytes unconsumed
+ None
+ }
+}
+
+impl<'a> Iterator for PercentDecode<'a> {
+ type Item = u8;
+
+ fn next(&mut self) -> Option<u8> {
+ self.bytes.next().map(|&byte| {
+ if byte == b'%' {
+ after_percent_sign(&mut self.bytes).unwrap_or(byte) // a '%' not followed by two hex digits is yielded as is
+ } else {
+ byte
+ }
+ })
+ }
+
+ fn size_hint(&self) -> (usize, Option<usize>) {
+ let bytes = self.bytes.len();
+ (bytes / 3, Some(bytes)) // each output byte consumes between one and three input bytes
+ }
+}
+
+impl<'a> From<PercentDecode<'a>> for Cow<'a, [u8]> {
+ fn from(iter: PercentDecode<'a>) -> Self {
+ match iter.if_any() {
+ Some(vec) => Cow::Owned(vec), // at least one "%XX" sequence was decoded
+ None => Cow::Borrowed(iter.bytes.as_slice()), // nothing to decode: borrow the input unchanged
+ }
+ }
+}
+
+impl<'a> PercentDecode<'a> {
+ /// If the percent-decoding is different from the input, return it as a new bytes vector; otherwise return `None`.
+ pub fn if_any(&self) -> Option<Vec<u8>> {
+ let mut bytes_iter = self.bytes.clone(); // scan a copy so that `self` is left untouched
+ while bytes_iter.find(|&&b| b == b'%').is_some() {
+ if let Some(decoded_byte) = after_percent_sign(&mut bytes_iter) {
+ let initial_bytes = self.bytes.as_slice();
+ let unchanged_bytes_len = initial_bytes.len() - bytes_iter.len() - 3; // exclude the three bytes of the "%XX" just consumed
+ let mut decoded = initial_bytes[..unchanged_bytes_len].to_owned(); // prefix before the first valid sequence is copied verbatim
+ decoded.push(decoded_byte);
+ decoded.extend(PercentDecode { // decode the rest with the regular iterator
+ bytes: bytes_iter
+ });
+ return Some(decoded)
+ }
+ }
+ // Nothing to decode
+ None
+ }
+
+ /// Decode the result of percent-decoding as UTF-8.
+ ///
+ /// This returns `Err` when the percent-decoded bytes are not well-formed in UTF-8.
+ pub fn decode_utf8(self) -> Result<Cow<'a, str>, str::Utf8Error> {
+ match self.clone().into() {
+ Cow::Borrowed(bytes) => { // nothing was decoded: validate the input and borrow it
+ match str::from_utf8(bytes) {
+ Ok(s) => Ok(s.into()),
+ Err(e) => Err(e),
+ }
+ }
+ Cow::Owned(bytes) => { // decoded into a new vector: validate and reuse its allocation
+ match String::from_utf8(bytes) {
+ Ok(s) => Ok(s.into()),
+ Err(e) => Err(e.utf8_error()),
+ }
+ }
+ }
+ }
+
+ /// Decode the result of percent-decoding as UTF-8, lossily.
+ ///
+ /// Invalid UTF-8 percent-encoded byte sequences will be replaced with � U+FFFD,
+ /// the replacement character.
+ pub fn decode_utf8_lossy(self) -> Cow<'a, str> {
+ encoding::decode_utf8_lossy(self.clone().into()) // the lossy conversion itself lives in the crate's `encoding` module
+ }
+}
diff --git a/third_party/rust/url/src/quirks.rs b/third_party/rust/url/src/quirks.rs
new file mode 100644
index 000000000..9a7537f47
--- /dev/null
+++ b/third_party/rust/url/src/quirks.rs
@@ -0,0 +1,217 @@
+// Copyright 2016 The rust-url developers.
+//
+// Licensed under the Apache License, Version 2.0 <LICENSE-APACHE or
+// http://www.apache.org/licenses/LICENSE-2.0> or the MIT license
+// <LICENSE-MIT or http://opensource.org/licenses/MIT>, at your
+// option. This file may not be copied, modified, or distributed
+// except according to those terms.
+
+//! Getters and setters for URL components implemented per https://url.spec.whatwg.org/#api
+//!
+//! Unless you need to be interoperable with web browsers,
+//! you probably want to use `Url` methods instead.
+
+use {Url, Position, Host, ParseError, idna};
+use parser::{Parser, SchemeType, default_port, Context, Input};
+
+/// https://url.spec.whatwg.org/#dom-url-domaintoascii
+pub fn domain_to_ascii(domain: &str) -> String {
+ match Host::parse(domain) {
+ Ok(Host::Domain(domain)) => domain,
+ _ => String::new(), // parse errors and non-domain hosts both yield the empty string
+ }
+}
+
+/// https://url.spec.whatwg.org/#dom-url-domaintounicode
+pub fn domain_to_unicode(domain: &str) -> String {
+ match Host::parse(domain) {
+ Ok(Host::Domain(ref domain)) => {
+ let (unicode, _errors) = idna::domain_to_unicode(domain); // conversion errors are deliberately ignored
+ unicode
+ }
+ _ => String::new(), // parse errors and non-domain hosts both yield the empty string
+ }
+}
+
+/// Getter for https://url.spec.whatwg.org/#dom-url-href
+pub fn href(url: &Url) -> &str {
+ url.as_str() // the href is the full serialization
+}
+
+/// Setter for https://url.spec.whatwg.org/#dom-url-href
+pub fn set_href(url: &mut Url, value: &str) -> Result<(), ParseError> {
+ *url = try!(Url::parse(value)); // on a parse error `url` is left unchanged and the error is returned
+ Ok(())
+}
+
+/// Getter for https://url.spec.whatwg.org/#dom-url-origin
+pub fn origin(url: &Url) -> String {
+ url.origin().unicode_serialization() // uses the Unicode serialization of the origin
+}
+
+/// Getter for https://url.spec.whatwg.org/#dom-url-protocol
+#[inline]
+pub fn protocol(url: &Url) -> &str {
+ &url.as_str()[..url.scheme().len() + ":".len()] // the scheme followed by its ':' delimiter
+}
+
+/// Setter for https://url.spec.whatwg.org/#dom-url-protocol
+pub fn set_protocol(url: &mut Url, mut new_protocol: &str) -> Result<(), ()> {
+ // The scheme state in the spec ignores everything after the first `:`,
+ // but `set_scheme` errors if there is more.
+ if let Some(position) = new_protocol.find(':') {
+ new_protocol = &new_protocol[..position]; // keep only what precedes the first ':'
+ }
+ url.set_scheme(new_protocol) // validation of the scheme itself is left to `set_scheme`
+}
+
+/// Getter for https://url.spec.whatwg.org/#dom-url-username
+#[inline]
+pub fn username(url: &Url) -> &str {
+ url.username() // thin wrapper over `Url::username`
+}
+
+/// Setter for https://url.spec.whatwg.org/#dom-url-username
+pub fn set_username(url: &mut Url, new_username: &str) -> Result<(), ()> {
+ url.set_username(new_username) // thin wrapper over `Url::set_username`
+}
+
+/// Getter for https://url.spec.whatwg.org/#dom-url-password
+#[inline]
+pub fn password(url: &Url) -> &str {
+ url.password().unwrap_or("") // an absent password is reported as the empty string
+}
+
+/// Setter for https://url.spec.whatwg.org/#dom-url-password
+pub fn set_password(url: &mut Url, new_password: &str) -> Result<(), ()> {
+ url.set_password(if new_password.is_empty() { None } else { Some(new_password) }) // the empty string removes the password
+}
+
+/// Getter for https://url.spec.whatwg.org/#dom-url-host
+#[inline]
+pub fn host(url: &Url) -> &str {
+ &url[Position::BeforeHost..Position::AfterPort] // the host plus ":port" when a port is present
+}
+
+/// Setter for https://url.spec.whatwg.org/#dom-url-host
+pub fn set_host(url: &mut Url, new_host: &str) -> Result<(), ()> {
+ if url.cannot_be_a_base() { // such URLs are rejected up front
+ return Err(())
+ }
+ let host;
+ let opt_port;
+ { // inner scope: `scheme` borrows `url`, which is mutated below
+ let scheme = url.scheme();
+ let result = Parser::parse_host(Input::new(new_host), SchemeType::from(scheme));
+ match result {
+ Ok((h, remaining)) => {
+ host = h;
+ opt_port = if let Some(remaining) = remaining.split_prefix(':') { // an optional ":port" may follow the host
+ Parser::parse_port(remaining, || default_port(scheme), Context::Setter)
+ .ok().map(|(port, _remaining)| port) // a port that fails to parse is dropped, not reported
+ } else {
+ None
+ };
+ }
+ Err(_) => return Err(()) // an invalid host leaves `url` unchanged
+ }
+ }
+ url.set_host_internal(host, opt_port);
+ Ok(())
+}
+
+/// Getter for https://url.spec.whatwg.org/#dom-url-hostname
+#[inline]
+pub fn hostname(url: &Url) -> &str {
+ url.host_str().unwrap_or("") // a URL without a host reports the empty string
+}
+
+/// Setter for https://url.spec.whatwg.org/#dom-url-hostname
+pub fn set_hostname(url: &mut Url, new_hostname: &str) -> Result<(), ()> {
+ if url.cannot_be_a_base() { // such URLs are rejected up front
+ return Err(())
+ }
+ let result = Parser::parse_host(Input::new(new_hostname), SchemeType::from(url.scheme()));
+ if let Ok((host, _remaining)) = result { // anything left after the host is ignored
+ url.set_host_internal(host, None); // no port is passed, unlike in `set_host`
+ Ok(())
+ } else {
+ Err(())
+ }
+}
+
+/// Getter for https://url.spec.whatwg.org/#dom-url-port
+#[inline]
+pub fn port(url: &Url) -> &str {
+ &url[Position::BeforePort..Position::AfterPort] // the port digits without the ':' delimiter; empty when there is no port
+}
+
+/// Setter for https://url.spec.whatwg.org/#dom-url-port
+pub fn set_port(url: &mut Url, new_port: &str) -> Result<(), ()> {
+ let result;
+ { // inner scope: `scheme` borrows `url`, which is mutated below
+ // has_host implies !cannot_be_a_base
+ let scheme = url.scheme();
+ if !url.has_host() || scheme == "file" { // host-less and `file` URLs are rejected
+ return Err(())
+ }
+ result = Parser::parse_port(Input::new(new_port), || default_port(scheme), Context::Setter)
+ }
+ if let Ok((new_port, _remaining)) = result { // anything left after the port is ignored
+ url.set_port_internal(new_port);
+ Ok(())
+ } else {
+ Err(())
+ }
+}
+
+/// Getter for https://url.spec.whatwg.org/#dom-url-pathname
+#[inline]
+pub fn pathname(url: &Url) -> &str {
+ url.path() // thin wrapper over `Url::path`
+}
+
+/// Setter for https://url.spec.whatwg.org/#dom-url-pathname
+pub fn set_pathname(url: &mut Url, new_pathname: &str) {
+ if !url.cannot_be_a_base() { // silently does nothing for cannot-be-a-base URLs
+ url.set_path(new_pathname)
+ }
+}
+
+/// Getter for https://url.spec.whatwg.org/#dom-url-search
+pub fn search(url: &Url) -> &str {
+ trim(&url[Position::AfterPath..Position::AfterQuery]) // the query with its leading '?'; a lone "?" becomes ""
+}
+
+/// Setter for https://url.spec.whatwg.org/#dom-url-search
+pub fn set_search(url: &mut Url, new_search: &str) {
+ url.set_query(match new_search {
+ "" => None, // the empty string removes the query
+ _ if new_search.starts_with('?') => Some(&new_search[1..]), // a single leading '?' is stripped
+ _ => Some(new_search),
+ })
+}
+
+/// Getter for https://url.spec.whatwg.org/#dom-url-hash
+pub fn hash(url: &Url) -> &str {
+ trim(&url[Position::AfterQuery..]) // the fragment with its leading '#'; a lone "#" becomes ""
+}
+
+/// Setter for https://url.spec.whatwg.org/#dom-url-hash
+pub fn set_hash(url: &mut Url, new_hash: &str) {
+ if url.scheme() != "javascript" { // `javascript:` URLs are left untouched
+ url.set_fragment(match new_hash {
+ "" => None, // the empty string removes the fragment
+ _ if new_hash.starts_with('#') => Some(&new_hash[1..]), // a single leading '#' is stripped
+ _ => Some(new_hash),
+ })
+ }
+}
+
+fn trim(s: &str) -> &str { // helper for `search` and `hash`
+ if s.len() == 1 { // only the "?" or "#" delimiter, with nothing after it
+ ""
+ } else {
+ s
+ }
+}
diff --git a/third_party/rust/url/src/slicing.rs b/third_party/rust/url/src/slicing.rs
new file mode 100644
index 000000000..926f3c796
--- /dev/null
+++ b/third_party/rust/url/src/slicing.rs
@@ -0,0 +1,182 @@
+// Copyright 2016 The rust-url developers.
+//
+// Licensed under the Apache License, Version 2.0 <LICENSE-APACHE or
+// http://www.apache.org/licenses/LICENSE-2.0> or the MIT license
+// <LICENSE-MIT or http://opensource.org/licenses/MIT>, at your
+// option. This file may not be copied, modified, or distributed
+// except according to those terms.
+
+use std::ops::{Range, RangeFrom, RangeTo, RangeFull, Index};
+use Url;
+
+impl Index<RangeFull> for Url {
+ type Output = str;
+ fn index(&self, _: RangeFull) -> &str {
+ &self.serialization // `&url[..]` is the whole serialization
+ }
+}
+
+impl Index<RangeFrom<Position>> for Url {
+ type Output = str;
+ fn index(&self, range: RangeFrom<Position>) -> &str {
+ &self.serialization[self.index(range.start)..] // inner call maps the `Position` to a byte offset
+ }
+}
+
+impl Index<RangeTo<Position>> for Url {
+ type Output = str;
+ fn index(&self, range: RangeTo<Position>) -> &str {
+ &self.serialization[..self.index(range.end)] // inner call maps the `Position` to a byte offset
+ }
+}
+
+impl Index<Range<Position>> for Url {
+ type Output = str;
+ fn index(&self, range: Range<Position>) -> &str {
+ &self.serialization[self.index(range.start)..self.index(range.end)] // both ends are mapped to byte offsets first
+ }
+}
+
+/// Indicates a position within a URL based on its components.
+///
+/// A range of positions can be used for slicing `Url`:
+///
+/// ```rust
+/// # use url::{Url, Position};
+/// # fn something(some_url: Url) {
+/// let serialization: &str = &some_url[..];
+/// let serialization_without_fragment: &str = &some_url[..Position::AfterQuery];
+/// let authority: &str = &some_url[Position::BeforeUsername..Position::AfterPort];
+/// let data_url_payload: &str = &some_url[Position::BeforePath..Position::AfterQuery];
+/// let scheme_relative: &str = &some_url[Position::BeforeUsername..];
+/// # }
+/// ```
+///
+/// In a pseudo-grammar (where `[`…`]?` makes a sub-sequence optional),
+/// URL components and delimiters that separate them are:
+///
+/// ```notrust
+/// url =
+/// scheme ":"
+/// [ "//" [ username [ ":" password ]? "@" ]? host [ ":" port ]? ]?
+/// path [ "?" query ]? [ "#" fragment ]?
+/// ```
+///
+/// When a given component is not present,
+/// its "before" and "after" position are the same
+/// (so that `&some_url[BeforeFoo..AfterFoo]` is the empty string)
+/// and component ordering is preserved
+/// (so that a missing query "is between" a path and a fragment).
+///
+/// The end of a component and the start of the next are either the same or separated
+/// by a delimiter.
+/// (Note that the initial `/` of a path is considered part of the path here, not a delimiter.)
+/// For example, `&url[..BeforeFragment]` would include a `#` delimiter (if present in `url`),
+/// so `&url[..AfterQuery]` might be desired instead.
+///
+/// `BeforeScheme` and `AfterFragment` are always the start and end of the entire URL,
+/// so `&url[BeforeScheme..X]` is the same as `&url[..X]`
+/// and `&url[X..AfterFragment]` is the same as `&url[X..]`.
+#[derive(Copy, Clone, Debug)]
+pub enum Position { // one "before" and one "after" variant per URL component
+ BeforeScheme, // always offset 0
+ AfterScheme,
+ BeforeUsername,
+ AfterUsername,
+ BeforePassword,
+ AfterPassword,
+ BeforeHost,
+ AfterHost,
+ BeforePort,
+ AfterPort, // same offset as `BeforePath`
+ BeforePath,
+ AfterPath,
+ BeforeQuery,
+ AfterQuery,
+ BeforeFragment,
+ AfterFragment // always the end of the serialization
+}
+
+impl Url {
+ #[inline]
+ fn index(&self, position: Position) -> usize { // maps a `Position` to a byte offset into `self.serialization`
+ match position {
+ Position::BeforeScheme => 0,
+
+ Position::AfterScheme => self.scheme_end as usize,
+
+ Position::BeforeUsername => if self.has_authority() {
+ self.scheme_end as usize + "://".len() // skip the "://" delimiter
+ } else {
+ debug_assert!(self.byte_at(self.scheme_end) == b':');
+ debug_assert!(self.scheme_end + ":".len() as u32 == self.username_end);
+ self.scheme_end as usize + ":".len() // no authority: only the ':' after the scheme is skipped
+ },
+
+ Position::AfterUsername => self.username_end as usize,
+
+ Position::BeforePassword => if self.has_authority() &&
+ self.byte_at(self.username_end) == b':' { // a ':' after the username introduces a password
+ self.username_end as usize + ":".len()
+ } else {
+ debug_assert!(self.username_end == self.host_start);
+ self.username_end as usize
+ },
+
+ Position::AfterPassword => if self.has_authority() &&
+ self.byte_at(self.username_end) == b':' {
+ debug_assert!(self.byte_at(self.host_start - "@".len() as u32) == b'@');
+ self.host_start as usize - "@".len() // the password ends just before the '@' delimiter
+ } else {
+ debug_assert!(self.username_end == self.host_start);
+ self.host_start as usize
+ },
+
+ Position::BeforeHost => self.host_start as usize,
+
+ Position::AfterHost => self.host_end as usize,
+
+ Position::BeforePort => if self.port.is_some() {
+ debug_assert!(self.byte_at(self.host_end) == b':');
+ self.host_end as usize + ":".len() // skip the ':' delimiter
+ } else {
+ self.host_end as usize
+ },
+
+ Position::AfterPort => self.path_start as usize, // same offset as `BeforePath`
+
+ Position::BeforePath => self.path_start as usize,
+
+ Position::AfterPath => match (self.query_start, self.fragment_start) { // the path ends where the next present component starts
+ (Some(q), _) => q as usize,
+ (None, Some(f)) => f as usize,
+ (None, None) => self.serialization.len(),
+ },
+
+ Position::BeforeQuery => match (self.query_start, self.fragment_start) {
+ (Some(q), _) => {
+ debug_assert!(self.byte_at(q) == b'?');
+ q as usize + "?".len() // skip the '?' delimiter
+ }
+ (None, Some(f)) => f as usize, // no query: empty position just before the fragment delimiter
+ (None, None) => self.serialization.len(),
+ },
+
+ Position::AfterQuery => match self.fragment_start {
+ None => self.serialization.len(),
+ Some(f) => f as usize, // the '#' delimiter is not included
+ },
+
+ Position::BeforeFragment => match self.fragment_start {
+ Some(f) => {
+ debug_assert!(self.byte_at(f) == b'#');
+ f as usize + "#".len() // skip the '#' delimiter
+ }
+ None => self.serialization.len(),
+ },
+
+ Position::AfterFragment => self.serialization.len(),
+ }
+ }
+}
+
diff --git a/third_party/rust/url/tests/data.rs b/third_party/rust/url/tests/data.rs
new file mode 100644
index 000000000..b8945aa48
--- /dev/null
+++ b/third_party/rust/url/tests/data.rs
@@ -0,0 +1,193 @@
+// Copyright 2013-2014 The rust-url developers.
+//
+// Licensed under the Apache License, Version 2.0 <LICENSE-APACHE or
+// http://www.apache.org/licenses/LICENSE-2.0> or the MIT license
+// <LICENSE-MIT or http://opensource.org/licenses/MIT>, at your
+// option. This file may not be copied, modified, or distributed
+// except according to those terms.
+
+//! Data-driven tests
+
+extern crate rustc_serialize;
+extern crate test;
+extern crate url;
+
+use rustc_serialize::json::{self, Json};
+use url::{Url, quirks};
+
+
+fn run_parsing(input: String, base: String, expected: Result<ExpectedAttributes, ()>) { // one test case: `Err(())` means a parse failure is expected
+ let base = match Url::parse(&base) {
+ Ok(base) => base,
+ Err(message) => panic!("Error parsing base {:?}: {}", base, message)
+ };
+ let (url, expected) = match (base.join(&input), expected) { // `input` is resolved against `base`
+ (Ok(url), Ok(expected)) => (url, expected),
+ (Err(_), Err(())) => return, // failed as expected: the test passes
+ (Err(message), Ok(_)) => panic!("Error parsing URL {:?}: {}", input, message),
+ (Ok(_), Err(())) => panic!("Expected a parse error for URL {:?}", input),
+ };
+
+ url.assert_invariants();
+
+ macro_rules! assert_eq { // shadows the standard macro so that failures also print the URL under test
+ ($expected: expr, $got: expr) => {
+ {
+ let expected = $expected;
+ let got = $got;
+ assert!(expected == got, "{:?} != {} {:?} for URL {:?}",
+ got, stringify!($expected), expected, url);
+ }
+ }
+ }
+
+ macro_rules! assert_attributes { // compares each expected field with the `quirks` getter of the same name
+ ($($attr: ident)+) => {
+ {
+ $(
+ assert_eq!(expected.$attr, quirks::$attr(&url));
+ )+;
+ }
+ }
+ }
+
+ assert_attributes!(href protocol username password host hostname port pathname search hash);
+
+ if let Some(expected_origin) = expected.origin { // the origin is only checked when the test data provides one
+ assert_eq!(expected_origin, quirks::origin(&url));
+ }
+}
+
+struct ExpectedAttributes { // expected getter results for one successful parsing test case
+ href: String,
+ origin: Option<String>, // optional in the test data; only compared when present
+ protocol: String,
+ username: String,
+ password: String,
+ host: String,
+ hostname: String,
+ port: String,
+ pathname: String,
+ search: String,
+ hash: String,
+}
+
+trait JsonExt { // convenience accessors on `Json`; the implementations panic on unexpected shapes
+ fn take(&mut self, key: &str) -> Option<Json>; // remove and return the value stored under `key`
+ fn object(self) -> json::Object; // unwrap a JSON object
+ fn string(self) -> String; // unwrap a JSON string
+ fn take_string(&mut self, key: &str) -> String; // `take` followed by `string`
+}
+
+impl JsonExt for Json {
+ fn take(&mut self, key: &str) -> Option<Json> {
+ self.as_object_mut().unwrap().remove(key) // panics if `self` is not an object
+ }
+
+ fn object(self) -> json::Object {
+ if let Json::Object(o) = self { o } else { panic!("Not a Json::Object") }
+ }
+
+ fn string(self) -> String {
+ if let Json::String(s) = self { s } else { panic!("Not a Json::String") }
+ }
+
+ fn take_string(&mut self, key: &str) -> String {
+ self.take(key).unwrap().string() // panics if the key is missing or the value is not a string
+ }
+}
+
+fn collect_parsing<F: FnMut(String, test::TestFn)>(add_test: &mut F) { // registers one test per entry of urltestdata.json
+ // Copied from https://github.com/w3c/web-platform-tests/blob/master/url/
+ let mut json = Json::from_str(include_str!("urltestdata.json"))
+ .expect("JSON parse error in urltestdata.json");
+ for entry in json.as_array_mut().unwrap() {
+ if entry.is_string() {
+ continue // ignore comments
+ }
+ let base = entry.take_string("base");
+ let input = entry.take_string("input");
+ let expected = if entry.find("failure").is_some() { // a "failure" key marks an input that must not parse
+ Err(())
+ } else {
+ Ok(ExpectedAttributes {
+ href: entry.take_string("href"),
+ origin: entry.take("origin").map(Json::string), // the only optional attribute
+ protocol: entry.take_string("protocol"),
+ username: entry.take_string("username"),
+ password: entry.take_string("password"),
+ host: entry.take_string("host"),
+ hostname: entry.take_string("hostname"),
+ port: entry.take_string("port"),
+ pathname: entry.take_string("pathname"),
+ search: entry.take_string("search"),
+ hash: entry.take_string("hash"),
+ })
+ };
+ add_test(format!("{:?} @ base {:?}", input, base), // the test name shows the input and its base
+ test::TestFn::dyn_test_fn(move || run_parsing(input, base, expected)));
+ }
+}
+
+fn collect_setters<F>(add_test: &mut F) where F: FnMut(String, test::TestFn) { // registers one test per case in setters_tests.json
+ let mut json = Json::from_str(include_str!("setters_tests.json"))
+ .expect("JSON parse error in setters_tests.json");
+
+ macro_rules! setter { // registers every test case listed under the JSON key `$attr`, using `quirks::$setter`
+ ($attr: expr, $setter: ident) => {{
+ let mut tests = json.take($attr).unwrap();
+ for mut test in tests.as_array_mut().unwrap().drain(..) {
+ let comment = test.take("comment").map(Json::string).unwrap_or(String::new()); // the comment is optional
+ let href = test.take_string("href");
+ let new_value = test.take_string("new_value");
+ let name = format!("{:?}.{} = {:?} {}", href, $attr, new_value, comment);
+ let mut expected = test.take("expected").unwrap();
+ add_test(name, test::TestFn::dyn_test_fn(move || {
+ let mut url = Url::parse(&href).unwrap();
+ url.assert_invariants();
+ let _ = quirks::$setter(&mut url, &new_value); // the setter's result is ignored; only the resulting URL is checked
+ assert_attributes!(url, expected,
+ href protocol username password host hostname port pathname search hash);
+ url.assert_invariants();
+ }))
+ }
+ }}
+ }
+ macro_rules! assert_attributes { // checks only the attributes present in the "expected" object
+ ($url: expr, $expected: expr, $($attr: ident)+) => {
+ $(
+ if let Some(value) = $expected.take(stringify!($attr)) {
+ assert_eq!(quirks::$attr(&$url), value.string())
+ }
+ )+
+ }
+ }
+ setter!("protocol", set_protocol);
+ setter!("username", set_username);
+ setter!("password", set_password);
+ setter!("hostname", set_hostname);
+ setter!("host", set_host);
+ setter!("port", set_port);
+ setter!("pathname", set_pathname);
+ setter!("search", set_search);
+ setter!("hash", set_hash);
+}
+
+fn main() { // custom test harness: builds the test list at run time from the JSON files
+ let mut tests = Vec::new();
+ { // inner scope ends the closure's mutable borrow of `tests`
+ let mut add_one = |name: String, run: test::TestFn| {
+ tests.push(test::TestDescAndFn {
+ desc: test::TestDesc {
+ name: test::DynTestName(name),
+ ignore: false,
+ should_panic: test::ShouldPanic::No,
+ },
+ testfn: run,
+ })
+ };
+ collect_parsing(&mut add_one);
+ collect_setters(&mut add_one);
+ }
+ test::test_main(&std::env::args().collect::<Vec<_>>(), tests) // command-line arguments are forwarded to the test runner
+}
diff --git a/third_party/rust/url/tests/setters_tests.json b/third_party/rust/url/tests/setters_tests.json
new file mode 100644
index 000000000..669cc084a
--- /dev/null
+++ b/third_party/rust/url/tests/setters_tests.json
@@ -0,0 +1,1148 @@
+{
+ "comment": [
+ "## Tests for setters of https://url.spec.whatwg.org/#urlutils-members",
+ "",
+ "This file contains a JSON object.",
+ "Other than 'comment', each key is an attribute of the `URL` interface",
+ "defined in WHATWG’s URL Standard.",
+ "The values are arrays of test case objects for that attribute.",
+ "",
+ "To run a test case for the attribute `attr`:",
+ "",
+ "* Create a new `URL` object with the value for the 'href' key",
+ " as the constructor's single parameter. (Without a base URL.)",
+ " This must not throw.",
+ "* Set the attribute `attr` to (invoke its setter with)",
+ " the value for the 'new_value' key.",
+ "* The value for the 'expected' key is another object.",
+ " For each `key` / `value` pair of that object,",
+ " get the attribute `key` (invoke its getter).",
+ " The returned string must be equal to `value`.",
+ "",
+ "Note: the 'href' setter is already covered by urltestdata.json."
+ ],
+ "protocol": [
+ {
+ "comment": "The empty string is not a valid scheme. Setter leaves the URL unchanged.",
+ "href": "a://example.net",
+ "new_value": "",
+ "expected": {
+ "href": "a://example.net/",
+ "protocol": "a:"
+ }
+ },
+ {
+ "href": "a://example.net",
+ "new_value": "b",
+ "expected": {
+ "href": "b://example.net/",
+ "protocol": "b:"
+ }
+ },
+ {
+ "comment": "Upper-case ASCII is lower-cased",
+ "href": "a://example.net",
+ "new_value": "B",
+ "expected": {
+ "href": "b://example.net/",
+ "protocol": "b:"
+ }
+ },
+ {
+ "comment": "Non-ASCII is rejected",
+ "href": "a://example.net",
+ "new_value": "é",
+ "expected": {
+ "href": "a://example.net/",
+ "protocol": "a:"
+ }
+ },
+ {
+ "comment": "No leading digit",
+ "href": "a://example.net",
+ "new_value": "0b",
+ "expected": {
+ "href": "a://example.net/",
+ "protocol": "a:"
+ }
+ },
+ {
+ "comment": "No leading punctuation",
+ "href": "a://example.net",
+ "new_value": "+b",
+ "expected": {
+ "href": "a://example.net/",
+ "protocol": "a:"
+ }
+ },
+ {
+ "href": "a://example.net",
+ "new_value": "bC0+-.",
+ "expected": {
+ "href": "bc0+-.://example.net/",
+ "protocol": "bc0+-.:"
+ }
+ },
+ {
+ "comment": "Only some punctuation is acceptable",
+ "href": "a://example.net",
+ "new_value": "b,c",
+ "expected": {
+ "href": "a://example.net/",
+ "protocol": "a:"
+ }
+ },
+ {
+ "comment": "Non-ASCII is rejected",
+ "href": "a://example.net",
+ "new_value": "bé",
+ "expected": {
+ "href": "a://example.net/",
+ "protocol": "a:"
+ }
+ },
+ {
+ "comment": "Spec deviation: from special scheme to not is not problematic. https://github.com/whatwg/url/issues/104",
+ "href": "http://example.net",
+ "new_value": "b",
+ "expected": {
+ "href": "b://example.net/",
+ "protocol": "b:"
+ }
+ },
+ {
+ "comment": "Cannot-be-a-base URL doesn’t have a host, but URL in a special scheme must.",
+ "href": "mailto:me@example.net",
+ "new_value": "http",
+ "expected": {
+ "href": "mailto:me@example.net",
+ "protocol": "mailto:"
+ }
+ },
+ {
+ "comment": "Spec deviation: from non-special scheme with a host to special is not problematic. https://github.com/whatwg/url/issues/104",
+ "href": "ssh://me@example.net",
+ "new_value": "http",
+ "expected": {
+ "href": "http://me@example.net/",
+ "protocol": "http:"
+ }
+ },
+ {
+ "comment": "Stuff after the first ':' is ignored",
+ "href": "http://example.net",
+ "new_value": "https:foo : bar",
+ "expected": {
+ "href": "https://example.net/",
+ "protocol": "https:"
+ }
+ },
+ {
+ "comment": "Stuff after the first ':' is ignored",
+ "href": "data:text/html,<p>Test",
+ "new_value": "view-source+data:foo : bar",
+ "expected": {
+ "href": "view-source+data:text/html,<p>Test",
+ "protocol": "view-source+data:"
+ }
+ }
+ ],
+ "username": [
+ {
+ "comment": "No host means no username",
+ "href": "file:///home/you/index.html",
+ "new_value": "me",
+ "expected": {
+ "href": "file:///home/you/index.html",
+ "username": ""
+ }
+ },
+ {
+ "comment": "No host means no username",
+ "href": "unix:/run/foo.socket",
+ "new_value": "me",
+ "expected": {
+ "href": "unix:/run/foo.socket",
+ "username": ""
+ }
+ },
+ {
+ "comment": "Cannot-be-a-base means no username",
+ "href": "mailto:you@example.net",
+ "new_value": "me",
+ "expected": {
+ "href": "mailto:you@example.net",
+ "username": ""
+ }
+ },
+ {
+ "href": "http://example.net",
+ "new_value": "me",
+ "expected": {
+ "href": "http://me@example.net/",
+ "username": "me"
+ }
+ },
+ {
+ "href": "http://:secret@example.net",
+ "new_value": "me",
+ "expected": {
+ "href": "http://me:secret@example.net/",
+ "username": "me"
+ }
+ },
+ {
+ "href": "http://me@example.net",
+ "new_value": "",
+ "expected": {
+ "href": "http://example.net/",
+ "username": ""
+ }
+ },
+ {
+ "href": "http://me:secret@example.net",
+ "new_value": "",
+ "expected": {
+ "href": "http://:secret@example.net/",
+ "username": ""
+ }
+ },
+ {
+ "comment": "UTF-8 percent encoding with the userinfo encode set.",
+ "href": "http://example.net",
+ "new_value": "\u0000\u0001\t\n\r\u001f !\"#$%&'()*+,-./09:;<=>?@AZ[\\]^_`az{|}~\u007f\u0080\u0081Éé",
+ "expected": {
+ "href": "http://%00%01%09%0A%0D%1F%20!%22%23$%&'()*+,-.%2F09%3A%3B%3C%3D%3E%3F%40AZ%5B%5C%5D%5E_%60az%7B%7C%7D~%7F%C2%80%C2%81%C3%89%C3%A9@example.net/",
+ "username": "%00%01%09%0A%0D%1F%20!%22%23$%&'()*+,-.%2F09%3A%3B%3C%3D%3E%3F%40AZ%5B%5C%5D%5E_%60az%7B%7C%7D~%7F%C2%80%C2%81%C3%89%C3%A9"
+ }
+ },
+ {
+ "comment": "Bytes already percent-encoded are left as-is.",
+ "href": "http://example.net",
+ "new_value": "%c3%89té",
+ "expected": {
+ "href": "http://%c3%89t%C3%A9@example.net/",
+ "username": "%c3%89t%C3%A9"
+ }
+ }
+ ],
+ "password": [
+ {
+ "comment": "No host means no password",
+ "href": "file:///home/me/index.html",
+ "new_value": "secret",
+ "expected": {
+ "href": "file:///home/me/index.html",
+ "password": ""
+ }
+ },
+ {
+ "comment": "No host means no password",
+ "href": "unix:/run/foo.socket",
+ "new_value": "secret",
+ "expected": {
+ "href": "unix:/run/foo.socket",
+ "password": ""
+ }
+ },
+ {
+ "comment": "Cannot-be-a-base means no password",
+ "href": "mailto:me@example.net",
+ "new_value": "secret",
+ "expected": {
+ "href": "mailto:me@example.net",
+ "password": ""
+ }
+ },
+ {
+ "href": "http://example.net",
+ "new_value": "secret",
+ "expected": {
+ "href": "http://:secret@example.net/",
+ "password": "secret"
+ }
+ },
+ {
+ "href": "http://me@example.net",
+ "new_value": "secret",
+ "expected": {
+ "href": "http://me:secret@example.net/",
+ "password": "secret"
+ }
+ },
+ {
+ "href": "http://:secret@example.net",
+ "new_value": "",
+ "expected": {
+ "href": "http://example.net/",
+ "password": ""
+ }
+ },
+ {
+ "href": "http://me:secret@example.net",
+ "new_value": "",
+ "expected": {
+ "href": "http://me@example.net/",
+ "password": ""
+ }
+ },
+ {
+ "comment": "UTF-8 percent encoding with the userinfo encode set.",
+ "href": "http://example.net",
+ "new_value": "\u0000\u0001\t\n\r\u001f !\"#$%&'()*+,-./09:;<=>?@AZ[\\]^_`az{|}~\u007f\u0080\u0081Éé",
+ "expected": {
+ "href": "http://:%00%01%09%0A%0D%1F%20!%22%23$%&'()*+,-.%2F09%3A%3B%3C%3D%3E%3F%40AZ%5B%5C%5D%5E_%60az%7B%7C%7D~%7F%C2%80%C2%81%C3%89%C3%A9@example.net/",
+ "password": "%00%01%09%0A%0D%1F%20!%22%23$%&'()*+,-.%2F09%3A%3B%3C%3D%3E%3F%40AZ%5B%5C%5D%5E_%60az%7B%7C%7D~%7F%C2%80%C2%81%C3%89%C3%A9"
+ }
+ },
+ {
+ "comment": "Bytes already percent-encoded are left as-is.",
+ "href": "http://example.net",
+ "new_value": "%c3%89té",
+ "expected": {
+ "href": "http://:%c3%89t%C3%A9@example.net/",
+ "password": "%c3%89t%C3%A9"
+ }
+ }
+ ],
+ "host": [
+ {
+ "comment": "Cannot-be-a-base means no host",
+ "href": "mailto:me@example.net",
+ "new_value": "example.com",
+ "expected": {
+ "href": "mailto:me@example.net",
+ "host": ""
+ }
+ },
+ {
+ "comment": "Cannot-be-a-base means no host",
+ "href": "data:text/plain,Stuff",
+ "new_value": "example.net",
+ "expected": {
+ "href": "data:text/plain,Stuff",
+ "host": ""
+ }
+ },
+ {
+ "href": "http://example.net",
+ "new_value": "example.com:8080",
+ "expected": {
+ "href": "http://example.com:8080/",
+ "host": "example.com:8080",
+ "hostname": "example.com",
+ "port": "8080"
+ }
+ },
+ {
+ "comment": "Port number is unchanged if not specified in the new value",
+ "href": "http://example.net:8080",
+ "new_value": "example.com",
+ "expected": {
+ "href": "http://example.com:8080/",
+ "host": "example.com:8080",
+ "hostname": "example.com",
+ "port": "8080"
+ }
+ },
+ {
+ "comment": "Port number is removed if empty in the new value: https://github.com/whatwg/url/pull/113",
+ "href": "http://example.net:8080",
+ "new_value": "example.com:",
+ "expected": {
+ "href": "http://example.com/",
+ "host": "example.com",
+ "hostname": "example.com",
+ "port": ""
+ }
+ },
+ {
+ "comment": "The empty host is not valid for special schemes",
+ "href": "http://example.net",
+ "new_value": "",
+ "expected": {
+ "href": "http://example.net/",
+ "host": "example.net"
+ }
+ },
+ {
+ "comment": "The empty host is OK for non-special schemes",
+ "href": "view-source+http://example.net/foo",
+ "new_value": "",
+ "expected": {
+ "href": "view-source+http:///foo",
+ "host": ""
+ }
+ },
+ {
+ "comment": "Path-only URLs can gain a host",
+ "href": "a:/foo",
+ "new_value": "example.net",
+ "expected": {
+ "href": "a://example.net/foo",
+ "host": "example.net"
+ }
+ },
+ {
+ "comment": "Path-only URLs can gain a host",
+ "href": "a:/foo",
+ "new_value": "example.net",
+ "expected": {
+ "href": "a://example.net/foo",
+ "host": "example.net"
+ }
+ },
+ {
+ "comment": "IPv4 address syntax is normalized",
+ "href": "http://example.net",
+ "new_value": "0x7F000001:8080",
+ "expected": {
+ "href": "http://127.0.0.1:8080/",
+ "host": "127.0.0.1:8080",
+ "hostname": "127.0.0.1",
+ "port": "8080"
+ }
+ },
+ {
+ "comment": "IPv6 address syntax is normalized",
+ "href": "http://example.net",
+ "new_value": "[::0:01]:2",
+ "expected": {
+ "href": "http://[::1]:2/",
+ "host": "[::1]:2",
+ "hostname": "[::1]",
+ "port": "2"
+ }
+ },
+ {
+ "comment": "Default port number is removed",
+ "href": "http://example.net",
+ "new_value": "example.com:80",
+ "expected": {
+ "href": "http://example.com/",
+ "host": "example.com",
+ "hostname": "example.com",
+ "port": ""
+ }
+ },
+ {
+ "comment": "Default port number is removed",
+ "href": "https://example.net",
+ "new_value": "example.com:443",
+ "expected": {
+ "href": "https://example.com/",
+ "host": "example.com",
+ "hostname": "example.com",
+ "port": ""
+ }
+ },
+ {
+ "comment": "Default port number is only removed for the relevant scheme",
+ "href": "https://example.net",
+ "new_value": "example.com:80",
+ "expected": {
+ "href": "https://example.com:80/",
+ "host": "example.com:80",
+ "hostname": "example.com",
+ "port": "80"
+ }
+ },
+ {
+ "comment": "Stuff after a / delimiter is ignored",
+ "href": "http://example.net/path",
+ "new_value": "example.com/stuff",
+ "expected": {
+ "href": "http://example.com/path",
+ "host": "example.com",
+ "hostname": "example.com",
+ "port": ""
+ }
+ },
+ {
+ "comment": "Stuff after a / delimiter is ignored",
+ "href": "http://example.net/path",
+ "new_value": "example.com:8080/stuff",
+ "expected": {
+ "href": "http://example.com:8080/path",
+ "host": "example.com:8080",
+ "hostname": "example.com",
+ "port": "8080"
+ }
+ },
+ {
+ "comment": "Stuff after a ? delimiter is ignored",
+ "href": "http://example.net/path",
+ "new_value": "example.com?stuff",
+ "expected": {
+ "href": "http://example.com/path",
+ "host": "example.com",
+ "hostname": "example.com",
+ "port": ""
+ }
+ },
+ {
+ "comment": "Stuff after a ? delimiter is ignored",
+ "href": "http://example.net/path",
+ "new_value": "example.com:8080?stuff",
+ "expected": {
+ "href": "http://example.com:8080/path",
+ "host": "example.com:8080",
+ "hostname": "example.com",
+ "port": "8080"
+ }
+ },
+ {
+ "comment": "Stuff after a # delimiter is ignored",
+ "href": "http://example.net/path",
+ "new_value": "example.com#stuff",
+ "expected": {
+ "href": "http://example.com/path",
+ "host": "example.com",
+ "hostname": "example.com",
+ "port": ""
+ }
+ },
+ {
+ "comment": "Stuff after a # delimiter is ignored",
+ "href": "http://example.net/path",
+ "new_value": "example.com:8080#stuff",
+ "expected": {
+ "href": "http://example.com:8080/path",
+ "host": "example.com:8080",
+ "hostname": "example.com",
+ "port": "8080"
+ }
+ },
+ {
+ "comment": "Stuff after a \\ delimiter is ignored for special schemes",
+ "href": "http://example.net/path",
+ "new_value": "example.com\\stuff",
+ "expected": {
+ "href": "http://example.com/path",
+ "host": "example.com",
+ "hostname": "example.com",
+ "port": ""
+ }
+ },
+ {
+ "comment": "Stuff after a \\ delimiter is ignored for special schemes",
+ "href": "http://example.net/path",
+ "new_value": "example.com:8080\\stuff",
+ "expected": {
+ "href": "http://example.com:8080/path",
+ "host": "example.com:8080",
+ "hostname": "example.com",
+ "port": "8080"
+ }
+ },
+ {
+ "comment": "\\ is not a delimiter for non-special schemes, and it’s invalid in a domain",
+ "href": "view-source+http://example.net/path",
+ "new_value": "example.com\\stuff",
+ "expected": {
+ "href": "view-source+http://example.net/path",
+ "host": "example.net",
+ "hostname": "example.net",
+ "port": ""
+ }
+ },
+ {
+ "comment": "Anything other than ASCII digit stops the port parser in a setter but is not an error",
+ "href": "view-source+http://example.net/path",
+ "new_value": "example.com:8080stuff2",
+ "expected": {
+ "href": "view-source+http://example.com:8080/path",
+ "host": "example.com:8080",
+ "hostname": "example.com",
+ "port": "8080"
+ }
+ },
+ {
+ "comment": "Anything other than ASCII digit stops the port parser in a setter but is not an error",
+ "href": "http://example.net/path",
+ "new_value": "example.com:8080stuff2",
+ "expected": {
+ "href": "http://example.com:8080/path",
+ "host": "example.com:8080",
+ "hostname": "example.com",
+ "port": "8080"
+ }
+ },
+ {
+ "comment": "Anything other than ASCII digit stops the port parser in a setter but is not an error",
+ "href": "http://example.net/path",
+ "new_value": "example.com:8080+2",
+ "expected": {
+ "href": "http://example.com:8080/path",
+ "host": "example.com:8080",
+ "hostname": "example.com",
+ "port": "8080"
+ }
+ },
+ {
+ "comment": "Port numbers are 16 bit integers",
+ "href": "http://example.net/path",
+ "new_value": "example.com:65535",
+ "expected": {
+ "href": "http://example.com:65535/path",
+ "host": "example.com:65535",
+ "hostname": "example.com",
+ "port": "65535"
+ }
+ },
+ {
+ "comment": "Port numbers are 16 bit integers, overflowing is an error. Hostname is still set, though.",
+ "href": "http://example.net/path",
+ "new_value": "example.com:65536",
+ "expected": {
+ "href": "http://example.com/path",
+ "host": "example.com",
+ "hostname": "example.com",
+ "port": ""
+ }
+ }
+ ],
+ "hostname": [
+ {
+ "comment": "Cannot-be-a-base means no host",
+ "href": "mailto:me@example.net",
+ "new_value": "example.com",
+ "expected": {
+ "href": "mailto:me@example.net",
+ "host": ""
+ }
+ },
+ {
+ "comment": "Cannot-be-a-base means no host",
+ "href": "data:text/plain,Stuff",
+ "new_value": "example.net",
+ "expected": {
+ "href": "data:text/plain,Stuff",
+ "host": ""
+ }
+ },
+ {
+ "href": "http://example.net:8080",
+ "new_value": "example.com",
+ "expected": {
+ "href": "http://example.com:8080/",
+ "host": "example.com:8080",
+ "hostname": "example.com",
+ "port": "8080"
+ }
+ },
+ {
+ "comment": "The empty host is not valid for special schemes",
+ "href": "http://example.net",
+ "new_value": "",
+ "expected": {
+ "href": "http://example.net/",
+ "host": "example.net"
+ }
+ },
+ {
+ "comment": "The empty host is OK for non-special schemes",
+ "href": "view-source+http://example.net/foo",
+ "new_value": "",
+ "expected": {
+ "href": "view-source+http:///foo",
+ "host": ""
+ }
+ },
+ {
+ "comment": "Path-only URLs can gain a host",
+ "href": "a:/foo",
+ "new_value": "example.net",
+ "expected": {
+ "href": "a://example.net/foo",
+ "host": "example.net"
+ }
+ },
+ {
+ "comment": "Path-only URLs can gain a host",
+ "href": "a:/foo",
+ "new_value": "example.net",
+ "expected": {
+ "href": "a://example.net/foo",
+ "host": "example.net"
+ }
+ },
+ {
+ "comment": "IPv4 address syntax is normalized",
+ "href": "http://example.net:8080",
+ "new_value": "0x7F000001",
+ "expected": {
+ "href": "http://127.0.0.1:8080/",
+ "host": "127.0.0.1:8080",
+ "hostname": "127.0.0.1",
+ "port": "8080"
+ }
+ },
+ {
+ "comment": "IPv6 address syntax is normalized",
+ "href": "http://example.net",
+ "new_value": "[::0:01]",
+ "expected": {
+ "href": "http://[::1]/",
+ "host": "[::1]",
+ "hostname": "[::1]",
+ "port": ""
+ }
+ },
+ {
+ "comment": "Stuff after a : delimiter is ignored",
+ "href": "http://example.net/path",
+ "new_value": "example.com:8080",
+ "expected": {
+ "href": "http://example.com/path",
+ "host": "example.com",
+ "hostname": "example.com",
+ "port": ""
+ }
+ },
+ {
+ "comment": "Stuff after a : delimiter is ignored",
+ "href": "http://example.net:8080/path",
+ "new_value": "example.com:",
+ "expected": {
+ "href": "http://example.com:8080/path",
+ "host": "example.com:8080",
+ "hostname": "example.com",
+ "port": "8080"
+ }
+ },
+ {
+ "comment": "Stuff after a / delimiter is ignored",
+ "href": "http://example.net/path",
+ "new_value": "example.com/stuff",
+ "expected": {
+ "href": "http://example.com/path",
+ "host": "example.com",
+ "hostname": "example.com",
+ "port": ""
+ }
+ },
+ {
+ "comment": "Stuff after a ? delimiter is ignored",
+ "href": "http://example.net/path",
+ "new_value": "example.com?stuff",
+ "expected": {
+ "href": "http://example.com/path",
+ "host": "example.com",
+ "hostname": "example.com",
+ "port": ""
+ }
+ },
+ {
+ "comment": "Stuff after a # delimiter is ignored",
+ "href": "http://example.net/path",
+ "new_value": "example.com#stuff",
+ "expected": {
+ "href": "http://example.com/path",
+ "host": "example.com",
+ "hostname": "example.com",
+ "port": ""
+ }
+ },
+ {
+ "comment": "Stuff after a \\ delimiter is ignored for special schemes",
+ "href": "http://example.net/path",
+ "new_value": "example.com\\stuff",
+ "expected": {
+ "href": "http://example.com/path",
+ "host": "example.com",
+ "hostname": "example.com",
+ "port": ""
+ }
+ },
+ {
+ "comment": "\\ is not a delimiter for non-special schemes, and it’s invalid in a domain",
+ "href": "view-source+http://example.net/path",
+ "new_value": "example.com\\stuff",
+ "expected": {
+ "href": "view-source+http://example.net/path",
+ "host": "example.net",
+ "hostname": "example.net",
+ "port": ""
+ }
+ }
+ ],
+ "port": [
+ {
+ "href": "http://example.net",
+ "new_value": "8080",
+ "expected": {
+ "href": "http://example.net:8080/",
+ "host": "example.net:8080",
+ "hostname": "example.net",
+ "port": "8080"
+ }
+ },
+ {
+ "comment": "Port number is removed if empty in the new value: https://github.com/whatwg/url/pull/113",
+ "href": "http://example.net:8080",
+ "new_value": "",
+ "expected": {
+ "href": "http://example.net/",
+ "host": "example.net",
+ "hostname": "example.net",
+ "port": ""
+ }
+ },
+ {
+ "comment": "Default port number is removed",
+ "href": "http://example.net:8080",
+ "new_value": "80",
+ "expected": {
+ "href": "http://example.net/",
+ "host": "example.net",
+ "hostname": "example.net",
+ "port": ""
+ }
+ },
+ {
+ "comment": "Default port number is removed",
+ "href": "https://example.net:4433",
+ "new_value": "443",
+ "expected": {
+ "href": "https://example.net/",
+ "host": "example.net",
+ "hostname": "example.net",
+ "port": ""
+ }
+ },
+ {
+ "comment": "Default port number is only removed for the relevant scheme",
+ "href": "https://example.net",
+ "new_value": "80",
+ "expected": {
+ "href": "https://example.net:80/",
+ "host": "example.net:80",
+ "hostname": "example.net",
+ "port": "80"
+ }
+ },
+ {
+ "comment": "Stuff after a / delimiter is ignored",
+ "href": "http://example.net/path",
+ "new_value": "8080/stuff",
+ "expected": {
+ "href": "http://example.net:8080/path",
+ "host": "example.net:8080",
+ "hostname": "example.net",
+ "port": "8080"
+ }
+ },
+ {
+ "comment": "Stuff after a ? delimiter is ignored",
+ "href": "http://example.net/path",
+ "new_value": "8080?stuff",
+ "expected": {
+ "href": "http://example.net:8080/path",
+ "host": "example.net:8080",
+ "hostname": "example.net",
+ "port": "8080"
+ }
+ },
+ {
+ "comment": "Stuff after a # delimiter is ignored",
+ "href": "http://example.net/path",
+ "new_value": "8080#stuff",
+ "expected": {
+ "href": "http://example.net:8080/path",
+ "host": "example.net:8080",
+ "hostname": "example.net",
+ "port": "8080"
+ }
+ },
+ {
+ "comment": "Stuff after a \\ delimiter is ignored for special schemes",
+ "href": "http://example.net/path",
+ "new_value": "8080\\stuff",
+ "expected": {
+ "href": "http://example.net:8080/path",
+ "host": "example.net:8080",
+ "hostname": "example.net",
+ "port": "8080"
+ }
+ },
+ {
+ "comment": "Anything other than ASCII digit stops the port parser in a setter but is not an error",
+ "href": "view-source+http://example.net/path",
+ "new_value": "8080stuff2",
+ "expected": {
+ "href": "view-source+http://example.net:8080/path",
+ "host": "example.net:8080",
+ "hostname": "example.net",
+ "port": "8080"
+ }
+ },
+ {
+ "comment": "Anything other than ASCII digit stops the port parser in a setter but is not an error",
+ "href": "http://example.net/path",
+ "new_value": "8080stuff2",
+ "expected": {
+ "href": "http://example.net:8080/path",
+ "host": "example.net:8080",
+ "hostname": "example.net",
+ "port": "8080"
+ }
+ },
+ {
+ "comment": "Anything other than ASCII digit stops the port parser in a setter but is not an error",
+ "href": "http://example.net/path",
+ "new_value": "8080+2",
+ "expected": {
+ "href": "http://example.net:8080/path",
+ "host": "example.net:8080",
+ "hostname": "example.net",
+ "port": "8080"
+ }
+ },
+ {
+ "comment": "Port numbers are 16 bit integers",
+ "href": "http://example.net/path",
+ "new_value": "65535",
+ "expected": {
+ "href": "http://example.net:65535/path",
+ "host": "example.net:65535",
+ "hostname": "example.net",
+ "port": "65535"
+ }
+ },
+ {
+ "comment": "Port numbers are 16 bit integers, overflowing is an error",
+ "href": "http://example.net:8080/path",
+ "new_value": "65536",
+ "expected": {
+ "href": "http://example.net:8080/path",
+ "host": "example.net:8080",
+ "hostname": "example.net",
+ "port": "8080"
+ }
+ }
+ ],
+ "pathname": [
+ {
+ "comment": "Cannot-be-a-base URLs don’t have a path",
+ "href": "mailto:me@example.net",
+ "new_value": "/foo",
+ "expected": {
+ "href": "mailto:me@example.net",
+ "pathname": "me@example.net"
+ }
+ },
+ {
+ "href": "unix:/run/foo.socket?timeout=10",
+ "new_value": "/var/log/../run/bar.socket",
+ "expected": {
+ "href": "unix:/var/run/bar.socket?timeout=10",
+ "pathname": "/var/run/bar.socket"
+ }
+ },
+ {
+ "href": "https://example.net#nav",
+ "new_value": "home",
+ "expected": {
+ "href": "https://example.net/home#nav",
+ "pathname": "/home"
+ }
+ },
+ {
+ "href": "https://example.net#nav",
+ "new_value": "../home",
+ "expected": {
+ "href": "https://example.net/home#nav",
+ "pathname": "/home"
+ }
+ },
+ {
+ "comment": "\\ is a segment delimiter for 'special' URLs",
+ "href": "http://example.net/home?lang=fr#nav",
+ "new_value": "\\a\\%2E\\b\\%2e.\\c",
+ "expected": {
+ "href": "http://example.net/a/c?lang=fr#nav",
+ "pathname": "/a/c"
+ }
+ },
+ {
+ "comment": "\\ is *not* a segment delimiter for non-'special' URLs",
+ "href": "view-source+http://example.net/home?lang=fr#nav",
+ "new_value": "\\a\\%2E\\b\\%2e.\\c",
+ "expected": {
+ "href": "view-source+http://example.net/\\a\\.\\b\\..\\c?lang=fr#nav",
+ "pathname": "/\\a\\.\\b\\..\\c"
+ }
+ },
+ {
+ "comment": "UTF-8 percent encoding with the default encode set. Tabs and newlines are removed. Leading or trailing C0 controls and space are removed.",
+ "href": "a:/",
+ "new_value": "\u0000\u0001\t\n\r\u001f !\u0000\u0001\t\n\r\u001f !\"#$%&'()*+,-./09:;<=>?@AZ[\\]^_`az{|}~\u007f\u0080\u0081Éé",
+ "expected": {
+ "href": "a:/!%00%01%1F%20!%22%23$%&'()*+,-./09:;%3C=%3E%3F@AZ[\\]^_%60az%7B|%7D~%7F%C2%80%C2%81%C3%89%C3%A9",
+ "pathname": "/!%00%01%1F%20!%22%23$%&'()*+,-./09:;%3C=%3E%3F@AZ[\\]^_%60az%7B|%7D~%7F%C2%80%C2%81%C3%89%C3%A9"
+ }
+ },
+ {
+ "comment": "Bytes already percent-encoded are left as-is, except %2E.",
+ "href": "http://example.net",
+ "new_value": "%2e%2E%c3%89té",
+ "expected": {
+ "href": "http://example.net/..%c3%89t%C3%A9",
+ "pathname": "/..%c3%89t%C3%A9"
+ }
+ }
+ ],
+ "search": [
+ {
+ "href": "https://example.net#nav",
+ "new_value": "lang=fr",
+ "expected": {
+ "href": "https://example.net/?lang=fr#nav",
+ "search": "?lang=fr"
+ }
+ },
+ {
+ "href": "https://example.net?lang=en-US#nav",
+ "new_value": "lang=fr",
+ "expected": {
+ "href": "https://example.net/?lang=fr#nav",
+ "search": "?lang=fr"
+ }
+ },
+ {
+ "href": "https://example.net?lang=en-US#nav",
+ "new_value": "?lang=fr",
+ "expected": {
+ "href": "https://example.net/?lang=fr#nav",
+ "search": "?lang=fr"
+ }
+ },
+ {
+ "href": "https://example.net?lang=en-US#nav",
+ "new_value": "??lang=fr",
+ "expected": {
+ "href": "https://example.net/??lang=fr#nav",
+ "search": "??lang=fr"
+ }
+ },
+ {
+ "href": "https://example.net?lang=en-US#nav",
+ "new_value": "?",
+ "expected": {
+ "href": "https://example.net/?#nav",
+ "search": ""
+ }
+ },
+ {
+ "href": "https://example.net?lang=en-US#nav",
+ "new_value": "",
+ "expected": {
+ "href": "https://example.net/#nav",
+ "search": ""
+ }
+ },
+ {
+ "href": "https://example.net?lang=en-US",
+ "new_value": "",
+ "expected": {
+ "href": "https://example.net/",
+ "search": ""
+ }
+ },
+ {
+ "href": "https://example.net",
+ "new_value": "",
+ "expected": {
+ "href": "https://example.net/",
+ "search": ""
+ }
+ },
+ {
+ "comment": "UTF-8 percent encoding with the query encode set. Tabs and newlines are removed. Leading or trailing C0 controls and space are removed.",
+ "href": "a:/",
+ "new_value": "\u0000\u0001\t\n\r\u001f !\u0000\u0001\t\n\r\u001f !\"#$%&'()*+,-./09:;<=>?@AZ[\\]^_`az{|}~\u007f\u0080\u0081Éé",
+ "expected": {
+ "href": "a:/?!%00%01%1F%20!%22%23$%&'()*+,-./09:;%3C=%3E?@AZ[\\]^_`az{|}~%7F%C2%80%C2%81%C3%89%C3%A9",
+ "search": "?!%00%01%1F%20!%22%23$%&'()*+,-./09:;%3C=%3E?@AZ[\\]^_`az{|}~%7F%C2%80%C2%81%C3%89%C3%A9"
+ }
+ },
+ {
+ "comment": "Bytes already percent-encoded are left as-is",
+ "href": "http://example.net",
+ "new_value": "%c3%89té",
+ "expected": {
+ "href": "http://example.net/?%c3%89t%C3%A9",
+ "search": "?%c3%89t%C3%A9"
+ }
+ }
+ ],
+ "hash": [
+ {
+ "href": "https://example.net",
+ "new_value": "main",
+ "expected": {
+ "href": "https://example.net/#main",
+ "hash": "#main"
+ }
+ },
+ {
+ "href": "https://example.net#nav",
+ "new_value": "main",
+ "expected": {
+ "href": "https://example.net/#main",
+ "hash": "#main"
+ }
+ },
+ {
+ "href": "https://example.net?lang=en-US",
+ "new_value": "##nav",
+ "expected": {
+ "href": "https://example.net/?lang=en-US##nav",
+ "hash": "##nav"
+ }
+ },
+ {
+ "href": "https://example.net?lang=en-US#nav",
+ "new_value": "#main",
+ "expected": {
+ "href": "https://example.net/?lang=en-US#main",
+ "hash": "#main"
+ }
+ },
+ {
+ "href": "https://example.net?lang=en-US#nav",
+ "new_value": "#",
+ "expected": {
+ "href": "https://example.net/?lang=en-US#",
+ "hash": ""
+ }
+ },
+ {
+ "href": "https://example.net?lang=en-US#nav",
+ "new_value": "",
+ "expected": {
+ "href": "https://example.net/?lang=en-US",
+ "hash": ""
+ }
+ },
+ {
+ "comment": "No percent-encoding at all (!); nuls, tabs, and newlines are removed. Leading or trailing C0 controls and space are removed.",
+ "href": "a:/",
+ "new_value": "\u0000\u0001\t\n\r\u001f !\u0000\u0001\t\n\r\u001f !\"#$%&'()*+,-./09:;<=>?@AZ[\\]^_`az{|}~\u007f\u0080\u0081Éé",
+ "expected": {
+ "href": "a:/#!\u0001\u001f !\"#$%&'()*+,-./09:;<=>?@AZ[\\]^_`az{|}~\u007f\u0080\u0081Éé",
+ "hash": "#!\u0001\u001f !\"#$%&'()*+,-./09:;<=>?@AZ[\\]^_`az{|}~\u007f\u0080\u0081Éé"
+ }
+ },
+ {
+ "comment": "Bytes already percent-encoded are left as-is",
+ "href": "http://example.net",
+ "new_value": "%c3%89té",
+ "expected": {
+ "href": "http://example.net/#%c3%89té",
+ "hash": "#%c3%89té"
+ }
+ }
+ ]
+}
diff --git a/third_party/rust/url/tests/unit.rs b/third_party/rust/url/tests/unit.rs
new file mode 100644
index 000000000..7cea1000c
--- /dev/null
+++ b/third_party/rust/url/tests/unit.rs
@@ -0,0 +1,303 @@
+// Copyright 2013-2014 The rust-url developers.
+//
+// Licensed under the Apache License, Version 2.0 <LICENSE-APACHE or
+// http://www.apache.org/licenses/LICENSE-2.0> or the MIT license
+// <LICENSE-MIT or http://opensource.org/licenses/MIT>, at your
+// option. This file may not be copied, modified, or distributed
+// except according to those terms.
+
+//! Unit tests
+
+extern crate url;
+
+use std::borrow::Cow;
+use std::net::{Ipv4Addr, Ipv6Addr};
+use std::path::{Path, PathBuf};
+use url::{Host, Url, form_urlencoded};
+
+ /// Converts a file system path to a URL with `Url::from_file_path` and checks
+ /// that the URL has no host, that its path equals the expected URL path, and
+ /// that `to_file_path` yields the original file system path again.
+ ///
+ /// When only the file system path is given, the URL path is expected to be
+ /// identical to it.
+ macro_rules! assert_from_file_path {
+     ($fs_path: expr, $expected_url_path: expr) => {{
+         let converted = Url::from_file_path(Path::new($fs_path)).unwrap();
+         assert_eq!(converted.host(), None);
+         assert_eq!(converted.path(), $expected_url_path);
+         assert_eq!(converted.to_file_path(), Ok(PathBuf::from($fs_path)));
+     }};
+     ($fs_path: expr) => { assert_from_file_path!($fs_path, $fs_path) };
+ }
+
+
+
+ #[test]
+ /// `Url::from_file_path` rejects the non-absolute paths listed for the current
+ /// platform, and on Unix converts absolute paths in both directions.
+ fn new_file_paths() {
+     if cfg!(unix) {
+         for &rejected in &["relative", "../relative"] {
+             assert_eq!(Url::from_file_path(Path::new(rejected)), Err(()));
+         }
+     }
+     if cfg!(windows) {
+         let rejected_paths = [r"relative", r"..\relative", r"\drive-relative", r"\\ucn\"];
+         for &rejected in &rejected_paths {
+             assert_eq!(Url::from_file_path(Path::new(rejected)), Err(()));
+         }
+     }
+
+     if cfg!(unix) {
+         assert_from_file_path!("/foo/bar");
+         // A NUL byte and a literal `%` both show up percent-encoded in the URL path.
+         assert_from_file_path!("/foo/ba\0r", "/foo/ba%00r");
+         assert_from_file_path!("/foo/ba%00r", "/foo/ba%2500r");
+     }
+ }
+
+ #[test]
+ #[cfg(unix)]
+ /// A Unix path containing a byte that is not valid UTF-8 (`0x80`) converts to
+ /// a URL and back to the very same path.
+ fn new_path_bad_utf8() {
+     use std::ffi::OsStr;
+     use std::os::unix::ffi::OsStrExt;
+
+     let raw_path = OsStr::from_bytes(b"/foo/ba\x80r");
+     let url = Url::from_file_path(Path::new(raw_path)).unwrap();
+     assert_eq!(url.to_file_path(), Ok(PathBuf::from(raw_path)));
+ }
+
+ #[test]
+ /// Windows-only checks for drive-letter paths; does nothing on other platforms.
+ fn new_path_windows_fun() {
+     if !cfg!(windows) {
+         return;
+     }
+
+     assert_from_file_path!(r"C:\foo\bar", "/C:/foo/bar");
+     assert_from_file_path!("C:\\foo\\ba\0r", "/C:/foo/ba%00r");
+
+     // Invalid UTF-8
+     let bad_utf8 = Url::parse("file:///C:/foo/ba%80r").unwrap();
+     assert!(bad_utf8.to_file_path().is_err());
+
+     // test windows canonicalized path
+     let canonicalized = PathBuf::from(r"\\?\C:\foo\bar");
+     assert!(Url::from_file_path(canonicalized).is_ok());
+ }
+
+
+ #[test]
+ /// `Url::from_directory_path` rejects the non-absolute paths listed for the
+ /// current platform and appends a trailing slash to an absolute directory path.
+ fn new_directory_paths() {
+     if cfg!(unix) {
+         for &rejected in &["relative", "../relative"] {
+             assert_eq!(Url::from_directory_path(Path::new(rejected)), Err(()));
+         }
+
+         let dir_url = Url::from_directory_path(Path::new("/foo/bar")).unwrap();
+         assert_eq!(dir_url.host(), None);
+         assert_eq!(dir_url.path(), "/foo/bar/");
+     }
+     if cfg!(windows) {
+         let rejected_paths = [r"relative", r"..\relative", r"\drive-relative", r"\\ucn\"];
+         for &rejected in &rejected_paths {
+             assert_eq!(Url::from_directory_path(Path::new(rejected)), Err(()));
+         }
+
+         let dir_url = Url::from_directory_path(Path::new(r"C:\foo\bar")).unwrap();
+         assert_eq!(dir_url.host(), None);
+         assert_eq!(dir_url.path(), "/C:/foo/bar/");
+     }
+ }
+
+ #[test]
+ /// A `Url` can be obtained through `str::parse`.
+ fn from_str() {
+     let parsed = "http://testing.com/this".parse::<Url>();
+     assert!(parsed.is_ok());
+ }
+
+ #[test]
+ /// `file:` URLs without slashes get an absolute path; a lone `..` collapses to `/`.
+ fn issue_124() {
+     let cases = [
+         ("file:a", "/a"),
+         ("file:...", "/..."),
+         ("file:..", "/"),
+     ];
+     for &(input, expected_path) in &cases {
+         let url: Url = input.parse().unwrap();
+         assert_eq!(url.path(), expected_path);
+     }
+ }
+
+ #[test]
+ /// Checks `PartialEq` and `Hash` for `Url`: URLs that compare equal must also
+ /// hash identically, and URLs differing in port, scheme or host are unequal.
+ fn test_equality() {
+     // `std::hash::SipHasher` is deprecated; `DefaultHasher::new()` likewise
+     // gives a fresh hasher, so two hashes computed with it are comparable.
+     use std::collections::hash_map::DefaultHasher;
+     use std::hash::{Hash, Hasher};
+
+     /// Hashes a URL with a freshly created hasher.
+     fn hash_of(url: &Url) -> u64 {
+         let mut hasher = DefaultHasher::new();
+         url.hash(&mut hasher);
+         hasher.finish()
+     }
+
+     /// Asserts that two URLs are equal and produce the same hash.
+     fn check_eq(a: &Url, b: &Url) {
+         assert_eq!(a, b);
+         assert_eq!(hash_of(a), hash_of(b));
+     }
+
+     /// Parses a URL and checks that it is equal to itself.
+     fn url(s: &str) -> Url {
+         let rv = s.parse().unwrap();
+         check_eq(&rv, &rv);
+         rv
+     }
+
+     // Doesn't care if default port is given.
+     let a: Url = url("https://example.com/");
+     let b: Url = url("https://example.com:443/");
+     check_eq(&a, &b);
+
+     // Different ports
+     let a: Url = url("http://example.com/");
+     let b: Url = url("http://example.com:8080/");
+     assert!(a != b, "{:?} != {:?}", a, b);
+
+     // Different scheme
+     let a: Url = url("http://example.com/");
+     let b: Url = url("https://example.com/");
+     assert!(a != b);
+
+     // Different host
+     let a: Url = url("http://foo.com/");
+     let b: Url = url("http://bar.com/");
+     assert!(a != b);
+
+     // Missing path, automatically substituted. Semantically the same.
+     let a: Url = url("http://foo.com");
+     let b: Url = url("http://foo.com/");
+     check_eq(&a, &b);
+ }
+
+ #[test]
+ /// Host parsing: domains, IPv4 in its various numeric notations, and IPv6.
+ fn host() {
+     /// Parses `input` and asserts that its host equals `host`.
+     fn assert_host(input: &str, host: Host<&str>) {
+         let parsed = Url::parse(input).unwrap();
+         assert_eq!(parsed.host(), Some(host));
+     }
+
+     let dotted_quad = Ipv4Addr::new(1, 35, 33, 49);
+
+     assert_host("http://www.mozilla.org", Host::Domain("www.mozilla.org"));
+     assert_host("http://1.35.33.49", Host::Ipv4(dotted_quad));
+     assert_host(
+         "http://[2001:0db8:85a3:08d3:1319:8a2e:0370:7344]",
+         Host::Ipv6(Ipv6Addr::new(0x2001, 0x0db8, 0x85a3, 0x08d3, 0x1319, 0x8a2e, 0x0370, 0x7344)),
+     );
+     // A `+` sign keeps the host from being treated as an IPv4 address.
+     assert_host("http://1.35.+33.49", Host::Domain("1.35.+33.49"));
+     assert_host("http://[::]", Host::Ipv6(Ipv6Addr::new(0, 0, 0, 0, 0, 0, 0, 0)));
+     assert_host("http://[::1]", Host::Ipv6(Ipv6Addr::new(0, 0, 0, 0, 0, 0, 0, 1)));
+     // Hexadecimal and octal parts, and a single number, yield the same address.
+     assert_host("http://0x1.0X23.0x21.061", Host::Ipv4(dotted_quad));
+     assert_host("http://0x1232131", Host::Ipv4(dotted_quad));
+     assert_host("http://111", Host::Ipv4(Ipv4Addr::new(0, 0, 0, 111)));
+     assert_host("http://2..2.3", Host::Domain("2..2.3"));
+
+     for &invalid in &["http://42.0x1232131", "http://192.168.0.257"] {
+         assert!(Url::parse(invalid).is_err());
+     }
+ }
+
+ #[test]
+ /// IPv6 hosts are serialized without any embedded IPv4-like notation.
+ fn host_serialization() {
+     // libstd’s `Display for Ipv6Addr` writes 0:0:0:0:0:0:_:_ and 0:0:0:0:0:ffff:_:_
+     // with IPv4-like syntax (see https://tools.ietf.org/html/rfc5952#section-4),
+     // whereas https://url.spec.whatwg.org/#concept-ipv6-serializer specifies not to.
+
+     // Not [::0.0.0.2] / [::ffff:0.0.0.2]
+     let cases = [
+         ("http://[0::2]", "[::2]"),
+         ("http://[0::ffff:0:2]", "[::ffff:0:2]"),
+     ];
+     for &(input, serialized) in &cases {
+         assert_eq!(Url::parse(input).unwrap().host_str(), Some(serialized));
+     }
+ }
+
+ #[test]
+ /// Non-ASCII domain names are accepted, and the host is exposed in its
+ /// `xn--` encoded form.
+ fn test_idna() {
+     let accepted = "http://goșu.ro".parse::<Url>();
+     assert!(accepted.is_ok());
+
+     let snowman = Url::parse("http://☃.net/").unwrap();
+     assert_eq!(snowman.host(), Some(Host::Domain("xn--n3h.net")));
+ }
+
+ #[test]
+ /// Parses each input and compares `as_str()` against the expected serialization.
+ fn test_serialization() {
+     // (input, expected serialization)
+     let cases = [
+         ("http://example.com/", "http://example.com/"),
+         ("http://addslash.com", "http://addslash.com/"),
+         ("http://@emptyuser.com/", "http://emptyuser.com/"),
+         ("http://:@emptypass.com/", "http://:@emptypass.com/"),
+         ("http://user@user.com/", "http://user@user.com/"),
+         ("http://user:pass@userpass.com/", "http://user:pass@userpass.com/"),
+         ("http://slashquery.com/path/?q=something", "http://slashquery.com/path/?q=something"),
+         ("http://noslashquery.com/path?q=something", "http://noslashquery.com/path?q=something")
+     ];
+     for case in cases.iter() {
+         let (input, expected) = *case;
+         let parsed = Url::parse(input).unwrap();
+         assert_eq!(parsed.as_str(), expected);
+     }
+ }
+
+ #[test]
+ /// Serializing pairs with `extend_pairs` and parsing the result gives the
+ /// original pairs back.
+ fn test_form_urlencoded() {
+     let pairs: &[(Cow<str>, Cow<str>)] = &[
+         (Cow::from("foo"), Cow::from("é&")),
+         (Cow::from("bar"), Cow::from("")),
+         (Cow::from("foo"), Cow::from("#"))
+     ];
+
+     let mut serializer = form_urlencoded::Serializer::new(String::new());
+     serializer.extend_pairs(pairs);
+     let encoded = serializer.finish();
+     assert_eq!(encoded, "foo=%C3%A9%26&bar=&foo=%23");
+
+     let decoded = form_urlencoded::parse(encoded.as_bytes()).collect::<Vec<_>>();
+     assert_eq!(decoded, pairs.to_vec());
+ }
+
+ #[test]
+ /// Pairs appended one at a time with `append_pair` are serialized in order.
+ fn test_form_serialize() {
+     let mut serializer = form_urlencoded::Serializer::new(String::new());
+     for &(name, value) in &[("foo", "é&"), ("bar", ""), ("foo", "#")] {
+         serializer.append_pair(name, value);
+     }
+     let encoded = serializer.finish();
+     assert_eq!(encoded, "foo=%C3%A9%26&bar=&foo=%23");
+ }
+
+ #[test]
+ /// https://github.com/servo/rust-url/issues/25
+ ///
+ /// Turns a file URL into a `postgres:` URL with an empty host and a username,
+ /// checking the URL invariants after every mutation.
+ fn issue_25() {
+     // The socket path and the drive prefix expected in the final URL.
+     let (filename, drive_prefix) = if cfg!(windows) {
+         (r"C:\run\pg.sock", "C:/")
+     } else {
+         ("/run/pg.sock", "")
+     };
+
+     let mut url = Url::from_file_path(filename).unwrap();
+     url.assert_invariants();
+
+     url.set_scheme("postgres").unwrap();
+     url.assert_invariants();
+
+     url.set_host(Some("")).unwrap();
+     url.assert_invariants();
+
+     url.set_username("me").unwrap();
+     url.assert_invariants();
+
+     let expected = format!("postgres://me@/{}run/pg.sock", drive_prefix);
+     assert_eq!(url.as_str(), expected);
+ }
+
+ #[test]
+ /// https://github.com/servo/rust-url/issues/61
+ ///
+ /// After switching the scheme to `https`, no explicit port is reported and
+ /// the known default port is 443.
+ fn issue_61() {
+     let mut mozilla = Url::parse("http://mozilla.org").unwrap();
+     mozilla.set_scheme("https").unwrap();
+
+     let explicit_port = mozilla.port();
+     assert_eq!(explicit_port, None);
+
+     let effective_port = mozilla.port_or_known_default();
+     assert_eq!(effective_port, Some(443));
+
+     mozilla.assert_invariants();
+ }
+
+ #[test]
+ #[cfg(not(windows))]
+ /// https://github.com/servo/rust-url/issues/197
+ ///
+ /// The root path converts to `file:///`, and `pop_if_empty` can be called on
+ /// its path segments.
+ fn issue_197() {
+     let mut root = Url::from_file_path("/").expect("Failed to parse path");
+     root.assert_invariants();
+
+     let expected = Url::parse("file:///").expect("Failed to parse path + protocol");
+     assert_eq!(root, expected);
+
+     root.path_segments_mut().expect("path_segments_mut").pop_if_empty();
+ }
+
+ #[test]
+ /// https://github.com/servo/rust-url/issues/222
+ ///
+ /// Pushing an empty path segment adds a trailing slash in front of the query.
+ fn append_trailing_slash() {
+     let mut url = "http://localhost:6767/foo/bar?a=b".parse::<Url>().unwrap();
+     url.assert_invariants();
+
+     url.path_segments_mut().unwrap().push("");
+     url.assert_invariants();
+
+     let serialized = url.to_string();
+     assert_eq!(serialized, "http://localhost:6767/foo/bar/?a=b");
+ }
+
+ #[test]
+ /// https://github.com/servo/rust-url/issues/227
+ ///
+ /// Adds a query pair, then pushes a path segment; the query stays after the
+ /// extended path.
+ fn extend_query_pairs_then_mutate() {
+     let mut url = "http://localhost:6767/foo/bar".parse::<Url>().unwrap();
+
+     let auth_pairs = vec![ ("auth", "my-token") ];
+     url.query_pairs_mut().extend_pairs(auth_pairs.into_iter());
+     url.assert_invariants();
+     assert_eq!(url.to_string(), "http://localhost:6767/foo/bar?auth=my-token");
+
+     url.path_segments_mut().unwrap().push("some_other_path");
+     url.assert_invariants();
+     assert_eq!(url.to_string(), "http://localhost:6767/foo/bar/some_other_path?auth=my-token");
+ }
+
+ #[test]
+ /// https://github.com/servo/rust-url/issues/222
+ ///
+ /// Pushing an empty path segment and popping it again leaves the URL unchanged.
+ fn append_empty_segment_then_mutate() {
+     let mut url = "http://localhost:6767/foo/bar?a=b".parse::<Url>().unwrap();
+     url.assert_invariants();
+
+     {
+         // Scoped so the segments handle is released before the URL is inspected.
+         let mut segments = url.path_segments_mut().unwrap();
+         segments.push("");
+         segments.pop();
+     }
+     url.assert_invariants();
+
+     let serialized = url.to_string();
+     assert_eq!(serialized, "http://localhost:6767/foo/bar?a=b");
+ }
diff --git a/third_party/rust/url/tests/urltestdata.json b/third_party/rust/url/tests/urltestdata.json
new file mode 100644
index 000000000..ee5416ecf
--- /dev/null
+++ b/third_party/rust/url/tests/urltestdata.json
@@ -0,0 +1,4277 @@
+[
+ "# Based on http://trac.webkit.org/browser/trunk/LayoutTests/fast/url/script-tests/segments.js",
+ {
+ "input": "http://example\t.\norg",
+ "base": "http://example.org/foo/bar",
+ "href": "http://example.org/",
+ "origin": "http://example.org",
+ "protocol": "http:",
+ "username": "",
+ "password": "",
+ "host": "example.org",
+ "hostname": "example.org",
+ "port": "",
+ "pathname": "/",
+ "search": "",
+ "hash": ""
+ },
+ {
+ "input": "http://user:pass@foo:21/bar;par?b#c",
+ "base": "http://example.org/foo/bar",
+ "href": "http://user:pass@foo:21/bar;par?b#c",
+ "origin": "http://foo:21",
+ "protocol": "http:",
+ "username": "user",
+ "password": "pass",
+ "host": "foo:21",
+ "hostname": "foo",
+ "port": "21",
+ "pathname": "/bar;par",
+ "search": "?b",
+ "hash": "#c"
+ },
+ {
+ "input": "http:foo.com",
+ "base": "http://example.org/foo/bar",
+ "href": "http://example.org/foo/foo.com",
+ "origin": "http://example.org",
+ "protocol": "http:",
+ "username": "",
+ "password": "",
+ "host": "example.org",
+ "hostname": "example.org",
+ "port": "",
+ "pathname": "/foo/foo.com",
+ "search": "",
+ "hash": ""
+ },
+ {
+ "input": "\t :foo.com \n",
+ "base": "http://example.org/foo/bar",
+ "href": "http://example.org/foo/:foo.com",
+ "origin": "http://example.org",
+ "protocol": "http:",
+ "username": "",
+ "password": "",
+ "host": "example.org",
+ "hostname": "example.org",
+ "port": "",
+ "pathname": "/foo/:foo.com",
+ "search": "",
+ "hash": ""
+ },
+ {
+ "input": " foo.com ",
+ "base": "http://example.org/foo/bar",
+ "href": "http://example.org/foo/foo.com",
+ "origin": "http://example.org",
+ "protocol": "http:",
+ "username": "",
+ "password": "",
+ "host": "example.org",
+ "hostname": "example.org",
+ "port": "",
+ "pathname": "/foo/foo.com",
+ "search": "",
+ "hash": ""
+ },
+ {
+ "input": "a:\t foo.com",
+ "base": "http://example.org/foo/bar",
+ "href": "a: foo.com",
+ "origin": "null",
+ "protocol": "a:",
+ "username": "",
+ "password": "",
+ "host": "",
+ "hostname": "",
+ "port": "",
+ "pathname": " foo.com",
+ "search": "",
+ "hash": ""
+ },
+ {
+ "input": "http://f:21/ b ? d # e ",
+ "base": "http://example.org/foo/bar",
+ "href": "http://f:21/%20b%20?%20d%20# e",
+ "origin": "http://f:21",
+ "protocol": "http:",
+ "username": "",
+ "password": "",
+ "host": "f:21",
+ "hostname": "f",
+ "port": "21",
+ "pathname": "/%20b%20",
+ "search": "?%20d%20",
+ "hash": "# e"
+ },
+ {
+ "input": "http://f:/c",
+ "base": "http://example.org/foo/bar",
+ "href": "http://f/c",
+ "origin": "http://f",
+ "protocol": "http:",
+ "username": "",
+ "password": "",
+ "host": "f",
+ "hostname": "f",
+ "port": "",
+ "pathname": "/c",
+ "search": "",
+ "hash": ""
+ },
+ {
+ "input": "http://f:0/c",
+ "base": "http://example.org/foo/bar",
+ "href": "http://f:0/c",
+ "origin": "http://f:0",
+ "protocol": "http:",
+ "username": "",
+ "password": "",
+ "host": "f:0",
+ "hostname": "f",
+ "port": "0",
+ "pathname": "/c",
+ "search": "",
+ "hash": ""
+ },
+ {
+ "input": "http://f:00000000000000/c",
+ "base": "http://example.org/foo/bar",
+ "href": "http://f:0/c",
+ "origin": "http://f:0",
+ "protocol": "http:",
+ "username": "",
+ "password": "",
+ "host": "f:0",
+ "hostname": "f",
+ "port": "0",
+ "pathname": "/c",
+ "search": "",
+ "hash": ""
+ },
+ {
+ "input": "http://f:00000000000000000000080/c",
+ "base": "http://example.org/foo/bar",
+ "href": "http://f/c",
+ "origin": "http://f",
+ "protocol": "http:",
+ "username": "",
+ "password": "",
+ "host": "f",
+ "hostname": "f",
+ "port": "",
+ "pathname": "/c",
+ "search": "",
+ "hash": ""
+ },
+ {
+ "input": "http://f:b/c",
+ "base": "http://example.org/foo/bar",
+ "failure": true
+ },
+ {
+ "input": "http://f: /c",
+ "base": "http://example.org/foo/bar",
+ "failure": true
+ },
+ {
+ "input": "http://f:\n/c",
+ "base": "http://example.org/foo/bar",
+ "href": "http://f/c",
+ "origin": "http://f",
+ "protocol": "http:",
+ "username": "",
+ "password": "",
+ "host": "f",
+ "hostname": "f",
+ "port": "",
+ "pathname": "/c",
+ "search": "",
+ "hash": ""
+ },
+ {
+ "input": "http://f:fifty-two/c",
+ "base": "http://example.org/foo/bar",
+ "failure": true
+ },
+ {
+ "input": "http://f:999999/c",
+ "base": "http://example.org/foo/bar",
+ "failure": true
+ },
+ {
+ "input": "http://f: 21 / b ? d # e ",
+ "base": "http://example.org/foo/bar",
+ "failure": true
+ },
+ {
+ "input": "",
+ "base": "http://example.org/foo/bar",
+ "href": "http://example.org/foo/bar",
+ "origin": "http://example.org",
+ "protocol": "http:",
+ "username": "",
+ "password": "",
+ "host": "example.org",
+ "hostname": "example.org",
+ "port": "",
+ "pathname": "/foo/bar",
+ "search": "",
+ "hash": ""
+ },
+ {
+ "input": " \t",
+ "base": "http://example.org/foo/bar",
+ "href": "http://example.org/foo/bar",
+ "origin": "http://example.org",
+ "protocol": "http:",
+ "username": "",
+ "password": "",
+ "host": "example.org",
+ "hostname": "example.org",
+ "port": "",
+ "pathname": "/foo/bar",
+ "search": "",
+ "hash": ""
+ },
+ {
+ "input": ":foo.com/",
+ "base": "http://example.org/foo/bar",
+ "href": "http://example.org/foo/:foo.com/",
+ "origin": "http://example.org",
+ "protocol": "http:",
+ "username": "",
+ "password": "",
+ "host": "example.org",
+ "hostname": "example.org",
+ "port": "",
+ "pathname": "/foo/:foo.com/",
+ "search": "",
+ "hash": ""
+ },
+ {
+ "input": ":foo.com\\",
+ "base": "http://example.org/foo/bar",
+ "href": "http://example.org/foo/:foo.com/",
+ "origin": "http://example.org",
+ "protocol": "http:",
+ "username": "",
+ "password": "",
+ "host": "example.org",
+ "hostname": "example.org",
+ "port": "",
+ "pathname": "/foo/:foo.com/",
+ "search": "",
+ "hash": ""
+ },
+ {
+ "input": ":",
+ "base": "http://example.org/foo/bar",
+ "href": "http://example.org/foo/:",
+ "origin": "http://example.org",
+ "protocol": "http:",
+ "username": "",
+ "password": "",
+ "host": "example.org",
+ "hostname": "example.org",
+ "port": "",
+ "pathname": "/foo/:",
+ "search": "",
+ "hash": ""
+ },
+ {
+ "input": ":a",
+ "base": "http://example.org/foo/bar",
+ "href": "http://example.org/foo/:a",
+ "origin": "http://example.org",
+ "protocol": "http:",
+ "username": "",
+ "password": "",
+ "host": "example.org",
+ "hostname": "example.org",
+ "port": "",
+ "pathname": "/foo/:a",
+ "search": "",
+ "hash": ""
+ },
+ {
+ "input": ":/",
+ "base": "http://example.org/foo/bar",
+ "href": "http://example.org/foo/:/",
+ "origin": "http://example.org",
+ "protocol": "http:",
+ "username": "",
+ "password": "",
+ "host": "example.org",
+ "hostname": "example.org",
+ "port": "",
+ "pathname": "/foo/:/",
+ "search": "",
+ "hash": ""
+ },
+ {
+ "input": ":\\",
+ "base": "http://example.org/foo/bar",
+ "href": "http://example.org/foo/:/",
+ "origin": "http://example.org",
+ "protocol": "http:",
+ "username": "",
+ "password": "",
+ "host": "example.org",
+ "hostname": "example.org",
+ "port": "",
+ "pathname": "/foo/:/",
+ "search": "",
+ "hash": ""
+ },
+ {
+ "input": ":#",
+ "base": "http://example.org/foo/bar",
+ "href": "http://example.org/foo/:#",
+ "origin": "http://example.org",
+ "protocol": "http:",
+ "username": "",
+ "password": "",
+ "host": "example.org",
+ "hostname": "example.org",
+ "port": "",
+ "pathname": "/foo/:",
+ "search": "",
+ "hash": ""
+ },
+ {
+ "input": "#",
+ "base": "http://example.org/foo/bar",
+ "href": "http://example.org/foo/bar#",
+ "origin": "http://example.org",
+ "protocol": "http:",
+ "username": "",
+ "password": "",
+ "host": "example.org",
+ "hostname": "example.org",
+ "port": "",
+ "pathname": "/foo/bar",
+ "search": "",
+ "hash": ""
+ },
+ {
+ "input": "#/",
+ "base": "http://example.org/foo/bar",
+ "href": "http://example.org/foo/bar#/",
+ "origin": "http://example.org",
+ "protocol": "http:",
+ "username": "",
+ "password": "",
+ "host": "example.org",
+ "hostname": "example.org",
+ "port": "",
+ "pathname": "/foo/bar",
+ "search": "",
+ "hash": "#/"
+ },
+ {
+ "input": "#\\",
+ "base": "http://example.org/foo/bar",
+ "href": "http://example.org/foo/bar#\\",
+ "origin": "http://example.org",
+ "protocol": "http:",
+ "username": "",
+ "password": "",
+ "host": "example.org",
+ "hostname": "example.org",
+ "port": "",
+ "pathname": "/foo/bar",
+ "search": "",
+ "hash": "#\\"
+ },
+ {
+ "input": "#;?",
+ "base": "http://example.org/foo/bar",
+ "href": "http://example.org/foo/bar#;?",
+ "origin": "http://example.org",
+ "protocol": "http:",
+ "username": "",
+ "password": "",
+ "host": "example.org",
+ "hostname": "example.org",
+ "port": "",
+ "pathname": "/foo/bar",
+ "search": "",
+ "hash": "#;?"
+ },
+ {
+ "input": "?",
+ "base": "http://example.org/foo/bar",
+ "href": "http://example.org/foo/bar?",
+ "origin": "http://example.org",
+ "protocol": "http:",
+ "username": "",
+ "password": "",
+ "host": "example.org",
+ "hostname": "example.org",
+ "port": "",
+ "pathname": "/foo/bar",
+ "search": "",
+ "hash": ""
+ },
+ {
+ "input": "/",
+ "base": "http://example.org/foo/bar",
+ "href": "http://example.org/",
+ "origin": "http://example.org",
+ "protocol": "http:",
+ "username": "",
+ "password": "",
+ "host": "example.org",
+ "hostname": "example.org",
+ "port": "",
+ "pathname": "/",
+ "search": "",
+ "hash": ""
+ },
+ {
+ "input": ":23",
+ "base": "http://example.org/foo/bar",
+ "href": "http://example.org/foo/:23",
+ "origin": "http://example.org",
+ "protocol": "http:",
+ "username": "",
+ "password": "",
+ "host": "example.org",
+ "hostname": "example.org",
+ "port": "",
+ "pathname": "/foo/:23",
+ "search": "",
+ "hash": ""
+ },
+ {
+ "input": "/:23",
+ "base": "http://example.org/foo/bar",
+ "href": "http://example.org/:23",
+ "origin": "http://example.org",
+ "protocol": "http:",
+ "username": "",
+ "password": "",
+ "host": "example.org",
+ "hostname": "example.org",
+ "port": "",
+ "pathname": "/:23",
+ "search": "",
+ "hash": ""
+ },
+ {
+ "input": "::",
+ "base": "http://example.org/foo/bar",
+ "href": "http://example.org/foo/::",
+ "origin": "http://example.org",
+ "protocol": "http:",
+ "username": "",
+ "password": "",
+ "host": "example.org",
+ "hostname": "example.org",
+ "port": "",
+ "pathname": "/foo/::",
+ "search": "",
+ "hash": ""
+ },
+ {
+ "input": "::23",
+ "base": "http://example.org/foo/bar",
+ "href": "http://example.org/foo/::23",
+ "origin": "http://example.org",
+ "protocol": "http:",
+ "username": "",
+ "password": "",
+ "host": "example.org",
+ "hostname": "example.org",
+ "port": "",
+ "pathname": "/foo/::23",
+ "search": "",
+ "hash": ""
+ },
+ {
+ "input": "foo://",
+ "base": "http://example.org/foo/bar",
+ "href": "foo:///",
+ "origin": "null",
+ "protocol": "foo:",
+ "username": "",
+ "password": "",
+ "host": "",
+ "hostname": "",
+ "port": "",
+ "pathname": "/",
+ "search": "",
+ "hash": ""
+ },
+ {
+ "input": "http://a:b@c:29/d",
+ "base": "http://example.org/foo/bar",
+ "href": "http://a:b@c:29/d",
+ "origin": "http://c:29",
+ "protocol": "http:",
+ "username": "a",
+ "password": "b",
+ "host": "c:29",
+ "hostname": "c",
+ "port": "29",
+ "pathname": "/d",
+ "search": "",
+ "hash": ""
+ },
+ {
+ "input": "http::@c:29",
+ "base": "http://example.org/foo/bar",
+ "href": "http://example.org/foo/:@c:29",
+ "origin": "http://example.org",
+ "protocol": "http:",
+ "username": "",
+ "password": "",
+ "host": "example.org",
+ "hostname": "example.org",
+ "port": "",
+ "pathname": "/foo/:@c:29",
+ "search": "",
+ "hash": ""
+ },
+ {
+ "input": "http://&a:foo(b]c@d:2/",
+ "base": "http://example.org/foo/bar",
+ "href": "http://&a:foo(b%5Dc@d:2/",
+ "origin": "http://d:2",
+ "protocol": "http:",
+ "username": "&a",
+ "password": "foo(b%5Dc",
+ "host": "d:2",
+ "hostname": "d",
+ "port": "2",
+ "pathname": "/",
+ "search": "",
+ "hash": ""
+ },
+ {
+ "input": "http://::@c@d:2",
+ "base": "http://example.org/foo/bar",
+ "href": "http://:%3A%40c@d:2/",
+ "origin": "http://d:2",
+ "protocol": "http:",
+ "username": "",
+ "password": "%3A%40c",
+ "host": "d:2",
+ "hostname": "d",
+ "port": "2",
+ "pathname": "/",
+ "search": "",
+ "hash": ""
+ },
+ {
+ "input": "http://foo.com:b@d/",
+ "base": "http://example.org/foo/bar",
+ "href": "http://foo.com:b@d/",
+ "origin": "http://d",
+ "protocol": "http:",
+ "username": "foo.com",
+ "password": "b",
+ "host": "d",
+ "hostname": "d",
+ "port": "",
+ "pathname": "/",
+ "search": "",
+ "hash": ""
+ },
+ {
+ "input": "http://foo.com/\\@",
+ "base": "http://example.org/foo/bar",
+ "href": "http://foo.com//@",
+ "origin": "http://foo.com",
+ "protocol": "http:",
+ "username": "",
+ "password": "",
+ "host": "foo.com",
+ "hostname": "foo.com",
+ "port": "",
+ "pathname": "//@",
+ "search": "",
+ "hash": ""
+ },
+ {
+ "input": "http:\\\\foo.com\\",
+ "base": "http://example.org/foo/bar",
+ "href": "http://foo.com/",
+ "origin": "http://foo.com",
+ "protocol": "http:",
+ "username": "",
+ "password": "",
+ "host": "foo.com",
+ "hostname": "foo.com",
+ "port": "",
+ "pathname": "/",
+ "search": "",
+ "hash": ""
+ },
+ {
+ "input": "http:\\\\a\\b:c\\d@foo.com\\",
+ "base": "http://example.org/foo/bar",
+ "href": "http://a/b:c/d@foo.com/",
+ "origin": "http://a",
+ "protocol": "http:",
+ "username": "",
+ "password": "",
+ "host": "a",
+ "hostname": "a",
+ "port": "",
+ "pathname": "/b:c/d@foo.com/",
+ "search": "",
+ "hash": ""
+ },
+ {
+ "input": "foo:/",
+ "base": "http://example.org/foo/bar",
+ "href": "foo:/",
+ "origin": "null",
+ "protocol": "foo:",
+ "username": "",
+ "password": "",
+ "host": "",
+ "hostname": "",
+ "port": "",
+ "pathname": "/",
+ "search": "",
+ "hash": ""
+ },
+ {
+ "input": "foo:/bar.com/",
+ "base": "http://example.org/foo/bar",
+ "href": "foo:/bar.com/",
+ "origin": "null",
+ "protocol": "foo:",
+ "username": "",
+ "password": "",
+ "host": "",
+ "hostname": "",
+ "port": "",
+ "pathname": "/bar.com/",
+ "search": "",
+ "hash": ""
+ },
+ {
+ "input": "foo://///////",
+ "base": "http://example.org/foo/bar",
+ "href": "foo://///////",
+ "origin": "null",
+ "protocol": "foo:",
+ "username": "",
+ "password": "",
+ "host": "",
+ "hostname": "",
+ "port": "",
+ "pathname": "///////",
+ "search": "",
+ "hash": ""
+ },
+ {
+ "input": "foo://///////bar.com/",
+ "base": "http://example.org/foo/bar",
+ "href": "foo://///////bar.com/",
+ "origin": "null",
+ "protocol": "foo:",
+ "username": "",
+ "password": "",
+ "host": "",
+ "hostname": "",
+ "port": "",
+ "pathname": "///////bar.com/",
+ "search": "",
+ "hash": ""
+ },
+ {
+ "input": "foo:////://///",
+ "base": "http://example.org/foo/bar",
+ "href": "foo:////://///",
+ "origin": "null",
+ "protocol": "foo:",
+ "username": "",
+ "password": "",
+ "host": "",
+ "hostname": "",
+ "port": "",
+ "pathname": "//://///",
+ "search": "",
+ "hash": ""
+ },
+ {
+ "input": "c:/foo",
+ "base": "http://example.org/foo/bar",
+ "href": "c:/foo",
+ "origin": "null",
+ "protocol": "c:",
+ "username": "",
+ "password": "",
+ "host": "",
+ "hostname": "",
+ "port": "",
+ "pathname": "/foo",
+ "search": "",
+ "hash": ""
+ },
+ {
+ "input": "//foo/bar",
+ "base": "http://example.org/foo/bar",
+ "href": "http://foo/bar",
+ "origin": "http://foo",
+ "protocol": "http:",
+ "username": "",
+ "password": "",
+ "host": "foo",
+ "hostname": "foo",
+ "port": "",
+ "pathname": "/bar",
+ "search": "",
+ "hash": ""
+ },
+ {
+ "input": "http://foo/path;a??e#f#g",
+ "base": "http://example.org/foo/bar",
+ "href": "http://foo/path;a??e#f#g",
+ "origin": "http://foo",
+ "protocol": "http:",
+ "username": "",
+ "password": "",
+ "host": "foo",
+ "hostname": "foo",
+ "port": "",
+ "pathname": "/path;a",
+ "search": "??e",
+ "hash": "#f#g"
+ },
+ {
+ "input": "http://foo/abcd?efgh?ijkl",
+ "base": "http://example.org/foo/bar",
+ "href": "http://foo/abcd?efgh?ijkl",
+ "origin": "http://foo",
+ "protocol": "http:",
+ "username": "",
+ "password": "",
+ "host": "foo",
+ "hostname": "foo",
+ "port": "",
+ "pathname": "/abcd",
+ "search": "?efgh?ijkl",
+ "hash": ""
+ },
+ {
+ "input": "http://foo/abcd#foo?bar",
+ "base": "http://example.org/foo/bar",
+ "href": "http://foo/abcd#foo?bar",
+ "origin": "http://foo",
+ "protocol": "http:",
+ "username": "",
+ "password": "",
+ "host": "foo",
+ "hostname": "foo",
+ "port": "",
+ "pathname": "/abcd",
+ "search": "",
+ "hash": "#foo?bar"
+ },
+ {
+ "input": "[61:24:74]:98",
+ "base": "http://example.org/foo/bar",
+ "href": "http://example.org/foo/[61:24:74]:98",
+ "origin": "http://example.org",
+ "protocol": "http:",
+ "username": "",
+ "password": "",
+ "host": "example.org",
+ "hostname": "example.org",
+ "port": "",
+ "pathname": "/foo/[61:24:74]:98",
+ "search": "",
+ "hash": ""
+ },
+ {
+ "input": "http:[61:27]/:foo",
+ "base": "http://example.org/foo/bar",
+ "href": "http://example.org/foo/[61:27]/:foo",
+ "origin": "http://example.org",
+ "protocol": "http:",
+ "username": "",
+ "password": "",
+ "host": "example.org",
+ "hostname": "example.org",
+ "port": "",
+ "pathname": "/foo/[61:27]/:foo",
+ "search": "",
+ "hash": ""
+ },
+ {
+ "input": "http://[1::2]:3:4",
+ "base": "http://example.org/foo/bar",
+ "failure": true
+ },
+ {
+ "input": "http://2001::1",
+ "base": "http://example.org/foo/bar",
+ "failure": true
+ },
+ {
+ "input": "http://2001::1]",
+ "base": "http://example.org/foo/bar",
+ "failure": true
+ },
+ {
+ "input": "http://2001::1]:80",
+ "base": "http://example.org/foo/bar",
+ "failure": true
+ },
+ {
+ "input": "http://[2001::1]",
+ "base": "http://example.org/foo/bar",
+ "href": "http://[2001::1]/",
+ "origin": "http://[2001::1]",
+ "protocol": "http:",
+ "username": "",
+ "password": "",
+ "host": "[2001::1]",
+ "hostname": "[2001::1]",
+ "port": "",
+ "pathname": "/",
+ "search": "",
+ "hash": ""
+ },
+ {
+ "input": "http://[2001::1]:80",
+ "base": "http://example.org/foo/bar",
+ "href": "http://[2001::1]/",
+ "origin": "http://[2001::1]",
+ "protocol": "http:",
+ "username": "",
+ "password": "",
+ "host": "[2001::1]",
+ "hostname": "[2001::1]",
+ "port": "",
+ "pathname": "/",
+ "search": "",
+ "hash": ""
+ },
+ {
+ "input": "http:/example.com/",
+ "base": "http://example.org/foo/bar",
+ "href": "http://example.org/example.com/",
+ "origin": "http://example.org",
+ "protocol": "http:",
+ "username": "",
+ "password": "",
+ "host": "example.org",
+ "hostname": "example.org",
+ "port": "",
+ "pathname": "/example.com/",
+ "search": "",
+ "hash": ""
+ },
+ {
+ "input": "ftp:/example.com/",
+ "base": "http://example.org/foo/bar",
+ "href": "ftp://example.com/",
+ "origin": "ftp://example.com",
+ "protocol": "ftp:",
+ "username": "",
+ "password": "",
+ "host": "example.com",
+ "hostname": "example.com",
+ "port": "",
+ "pathname": "/",
+ "search": "",
+ "hash": ""
+ },
+ {
+ "input": "https:/example.com/",
+ "base": "http://example.org/foo/bar",
+ "href": "https://example.com/",
+ "origin": "https://example.com",
+ "protocol": "https:",
+ "username": "",
+ "password": "",
+ "host": "example.com",
+ "hostname": "example.com",
+ "port": "",
+ "pathname": "/",
+ "search": "",
+ "hash": ""
+ },
+ {
+ "input": "madeupscheme:/example.com/",
+ "base": "http://example.org/foo/bar",
+ "href": "madeupscheme:/example.com/",
+ "origin": "null",
+ "protocol": "madeupscheme:",
+ "username": "",
+ "password": "",
+ "host": "",
+ "hostname": "",
+ "port": "",
+ "pathname": "/example.com/",
+ "search": "",
+ "hash": ""
+ },
+ {
+ "input": "file:/example.com/",
+ "base": "http://example.org/foo/bar",
+ "href": "file:///example.com/",
+ "protocol": "file:",
+ "username": "",
+ "password": "",
+ "host": "",
+ "hostname": "",
+ "port": "",
+ "pathname": "/example.com/",
+ "search": "",
+ "hash": ""
+ },
+ {
+ "input": "ftps:/example.com/",
+ "base": "http://example.org/foo/bar",
+ "href": "ftps:/example.com/",
+ "origin": "null",
+ "protocol": "ftps:",
+ "username": "",
+ "password": "",
+ "host": "",
+ "hostname": "",
+ "port": "",
+ "pathname": "/example.com/",
+ "search": "",
+ "hash": ""
+ },
+ {
+ "input": "gopher:/example.com/",
+ "base": "http://example.org/foo/bar",
+ "href": "gopher://example.com/",
+ "origin": "gopher://example.com",
+ "protocol": "gopher:",
+ "username": "",
+ "password": "",
+ "host": "example.com",
+ "hostname": "example.com",
+ "port": "",
+ "pathname": "/",
+ "search": "",
+ "hash": ""
+ },
+ {
+ "input": "ws:/example.com/",
+ "base": "http://example.org/foo/bar",
+ "href": "ws://example.com/",
+ "origin": "ws://example.com",
+ "protocol": "ws:",
+ "username": "",
+ "password": "",
+ "host": "example.com",
+ "hostname": "example.com",
+ "port": "",
+ "pathname": "/",
+ "search": "",
+ "hash": ""
+ },
+ {
+ "input": "wss:/example.com/",
+ "base": "http://example.org/foo/bar",
+ "href": "wss://example.com/",
+ "origin": "wss://example.com",
+ "protocol": "wss:",
+ "username": "",
+ "password": "",
+ "host": "example.com",
+ "hostname": "example.com",
+ "port": "",
+ "pathname": "/",
+ "search": "",
+ "hash": ""
+ },
+ {
+ "input": "data:/example.com/",
+ "base": "http://example.org/foo/bar",
+ "href": "data:/example.com/",
+ "origin": "null",
+ "protocol": "data:",
+ "username": "",
+ "password": "",
+ "host": "",
+ "hostname": "",
+ "port": "",
+ "pathname": "/example.com/",
+ "search": "",
+ "hash": ""
+ },
+ {
+ "input": "javascript:/example.com/",
+ "base": "http://example.org/foo/bar",
+ "href": "javascript:/example.com/",
+ "origin": "null",
+ "protocol": "javascript:",
+ "username": "",
+ "password": "",
+ "host": "",
+ "hostname": "",
+ "port": "",
+ "pathname": "/example.com/",
+ "search": "",
+ "hash": ""
+ },
+ {
+ "input": "mailto:/example.com/",
+ "base": "http://example.org/foo/bar",
+ "href": "mailto:/example.com/",
+ "origin": "null",
+ "protocol": "mailto:",
+ "username": "",
+ "password": "",
+ "host": "",
+ "hostname": "",
+ "port": "",
+ "pathname": "/example.com/",
+ "search": "",
+ "hash": ""
+ },
+ {
+ "input": "http:example.com/",
+ "base": "http://example.org/foo/bar",
+ "href": "http://example.org/foo/example.com/",
+ "origin": "http://example.org",
+ "protocol": "http:",
+ "username": "",
+ "password": "",
+ "host": "example.org",
+ "hostname": "example.org",
+ "port": "",
+ "pathname": "/foo/example.com/",
+ "search": "",
+ "hash": ""
+ },
+ {
+ "input": "ftp:example.com/",
+ "base": "http://example.org/foo/bar",
+ "href": "ftp://example.com/",
+ "origin": "ftp://example.com",
+ "protocol": "ftp:",
+ "username": "",
+ "password": "",
+ "host": "example.com",
+ "hostname": "example.com",
+ "port": "",
+ "pathname": "/",
+ "search": "",
+ "hash": ""
+ },
+ {
+ "input": "https:example.com/",
+ "base": "http://example.org/foo/bar",
+ "href": "https://example.com/",
+ "origin": "https://example.com",
+ "protocol": "https:",
+ "username": "",
+ "password": "",
+ "host": "example.com",
+ "hostname": "example.com",
+ "port": "",
+ "pathname": "/",
+ "search": "",
+ "hash": ""
+ },
+ {
+ "input": "madeupscheme:example.com/",
+ "base": "http://example.org/foo/bar",
+ "href": "madeupscheme:example.com/",
+ "origin": "null",
+ "protocol": "madeupscheme:",
+ "username": "",
+ "password": "",
+ "host": "",
+ "hostname": "",
+ "port": "",
+ "pathname": "example.com/",
+ "search": "",
+ "hash": ""
+ },
+ {
+ "input": "ftps:example.com/",
+ "base": "http://example.org/foo/bar",
+ "href": "ftps:example.com/",
+ "origin": "null",
+ "protocol": "ftps:",
+ "username": "",
+ "password": "",
+ "host": "",
+ "hostname": "",
+ "port": "",
+ "pathname": "example.com/",
+ "search": "",
+ "hash": ""
+ },
+ {
+ "input": "gopher:example.com/",
+ "base": "http://example.org/foo/bar",
+ "href": "gopher://example.com/",
+ "origin": "gopher://example.com",
+ "protocol": "gopher:",
+ "username": "",
+ "password": "",
+ "host": "example.com",
+ "hostname": "example.com",
+ "port": "",
+ "pathname": "/",
+ "search": "",
+ "hash": ""
+ },
+ {
+ "input": "ws:example.com/",
+ "base": "http://example.org/foo/bar",
+ "href": "ws://example.com/",
+ "origin": "ws://example.com",
+ "protocol": "ws:",
+ "username": "",
+ "password": "",
+ "host": "example.com",
+ "hostname": "example.com",
+ "port": "",
+ "pathname": "/",
+ "search": "",
+ "hash": ""
+ },
+ {
+ "input": "wss:example.com/",
+ "base": "http://example.org/foo/bar",
+ "href": "wss://example.com/",
+ "origin": "wss://example.com",
+ "protocol": "wss:",
+ "username": "",
+ "password": "",
+ "host": "example.com",
+ "hostname": "example.com",
+ "port": "",
+ "pathname": "/",
+ "search": "",
+ "hash": ""
+ },
+ {
+ "input": "data:example.com/",
+ "base": "http://example.org/foo/bar",
+ "href": "data:example.com/",
+ "origin": "null",
+ "protocol": "data:",
+ "username": "",
+ "password": "",
+ "host": "",
+ "hostname": "",
+ "port": "",
+ "pathname": "example.com/",
+ "search": "",
+ "hash": ""
+ },
+ {
+ "input": "javascript:example.com/",
+ "base": "http://example.org/foo/bar",
+ "href": "javascript:example.com/",
+ "origin": "null",
+ "protocol": "javascript:",
+ "username": "",
+ "password": "",
+ "host": "",
+ "hostname": "",
+ "port": "",
+ "pathname": "example.com/",
+ "search": "",
+ "hash": ""
+ },
+ {
+ "input": "mailto:example.com/",
+ "base": "http://example.org/foo/bar",
+ "href": "mailto:example.com/",
+ "origin": "null",
+ "protocol": "mailto:",
+ "username": "",
+ "password": "",
+ "host": "",
+ "hostname": "",
+ "port": "",
+ "pathname": "example.com/",
+ "search": "",
+ "hash": ""
+ },
+ {
+ "input": "/a/b/c",
+ "base": "http://example.org/foo/bar",
+ "href": "http://example.org/a/b/c",
+ "origin": "http://example.org",
+ "protocol": "http:",
+ "username": "",
+ "password": "",
+ "host": "example.org",
+ "hostname": "example.org",
+ "port": "",
+ "pathname": "/a/b/c",
+ "search": "",
+ "hash": ""
+ },
+ {
+ "input": "/a/ /c",
+ "base": "http://example.org/foo/bar",
+ "href": "http://example.org/a/%20/c",
+ "origin": "http://example.org",
+ "protocol": "http:",
+ "username": "",
+ "password": "",
+ "host": "example.org",
+ "hostname": "example.org",
+ "port": "",
+ "pathname": "/a/%20/c",
+ "search": "",
+ "hash": ""
+ },
+ {
+ "input": "/a%2fc",
+ "base": "http://example.org/foo/bar",
+ "href": "http://example.org/a%2fc",
+ "origin": "http://example.org",
+ "protocol": "http:",
+ "username": "",
+ "password": "",
+ "host": "example.org",
+ "hostname": "example.org",
+ "port": "",
+ "pathname": "/a%2fc",
+ "search": "",
+ "hash": ""
+ },
+ {
+ "input": "/a/%2f/c",
+ "base": "http://example.org/foo/bar",
+ "href": "http://example.org/a/%2f/c",
+ "origin": "http://example.org",
+ "protocol": "http:",
+ "username": "",
+ "password": "",
+ "host": "example.org",
+ "hostname": "example.org",
+ "port": "",
+ "pathname": "/a/%2f/c",
+ "search": "",
+ "hash": ""
+ },
+ {
+ "input": "#β",
+ "base": "http://example.org/foo/bar",
+ "href": "http://example.org/foo/bar#β",
+ "origin": "http://example.org",
+ "protocol": "http:",
+ "username": "",
+ "password": "",
+ "host": "example.org",
+ "hostname": "example.org",
+ "port": "",
+ "pathname": "/foo/bar",
+ "search": "",
+ "hash": "#β"
+ },
+ {
+ "input": "data:text/html,test#test",
+ "base": "http://example.org/foo/bar",
+ "href": "data:text/html,test#test",
+ "origin": "null",
+ "protocol": "data:",
+ "username": "",
+ "password": "",
+ "host": "",
+ "hostname": "",
+ "port": "",
+ "pathname": "text/html,test",
+ "search": "",
+ "hash": "#test"
+ },
+ "# Based on http://trac.webkit.org/browser/trunk/LayoutTests/fast/url/file.html",
+ {
+ "input": "file:c:\\foo\\bar.html",
+ "base": "file:///tmp/mock/path",
+ "href": "file:///c:/foo/bar.html",
+ "protocol": "file:",
+ "username": "",
+ "password": "",
+ "host": "",
+ "hostname": "",
+ "port": "",
+ "pathname": "/c:/foo/bar.html",
+ "search": "",
+ "hash": ""
+ },
+ {
+ "input": " File:c|////foo\\bar.html",
+ "base": "file:///tmp/mock/path",
+ "href": "file:///c:////foo/bar.html",
+ "protocol": "file:",
+ "username": "",
+ "password": "",
+ "host": "",
+ "hostname": "",
+ "port": "",
+ "pathname": "/c:////foo/bar.html",
+ "search": "",
+ "hash": ""
+ },
+ {
+ "input": "C|/foo/bar",
+ "base": "file:///tmp/mock/path",
+ "href": "file:///C:/foo/bar",
+ "protocol": "file:",
+ "username": "",
+ "password": "",
+ "host": "",
+ "hostname": "",
+ "port": "",
+ "pathname": "/C:/foo/bar",
+ "search": "",
+ "hash": ""
+ },
+ {
+ "input": "/C|\\foo\\bar",
+ "base": "file:///tmp/mock/path",
+ "href": "file:///C:/foo/bar",
+ "protocol": "file:",
+ "username": "",
+ "password": "",
+ "host": "",
+ "hostname": "",
+ "port": "",
+ "pathname": "/C:/foo/bar",
+ "search": "",
+ "hash": ""
+ },
+ {
+ "input": "//C|/foo/bar",
+ "base": "file:///tmp/mock/path",
+ "href": "file:///C:/foo/bar",
+ "protocol": "file:",
+ "username": "",
+ "password": "",
+ "host": "",
+ "hostname": "",
+ "port": "",
+ "pathname": "/C:/foo/bar",
+ "search": "",
+ "hash": ""
+ },
+ {
+ "input": "//server/file",
+ "base": "file:///tmp/mock/path",
+ "href": "file://server/file",
+ "protocol": "file:",
+ "username": "",
+ "password": "",
+ "host": "server",
+ "hostname": "server",
+ "port": "",
+ "pathname": "/file",
+ "search": "",
+ "hash": ""
+ },
+ {
+ "input": "\\\\server\\file",
+ "base": "file:///tmp/mock/path",
+ "href": "file://server/file",
+ "protocol": "file:",
+ "username": "",
+ "password": "",
+ "host": "server",
+ "hostname": "server",
+ "port": "",
+ "pathname": "/file",
+ "search": "",
+ "hash": ""
+ },
+ {
+ "input": "/\\server/file",
+ "base": "file:///tmp/mock/path",
+ "href": "file://server/file",
+ "protocol": "file:",
+ "username": "",
+ "password": "",
+ "host": "server",
+ "hostname": "server",
+ "port": "",
+ "pathname": "/file",
+ "search": "",
+ "hash": ""
+ },
+ {
+ "input": "file:///foo/bar.txt",
+ "base": "file:///tmp/mock/path",
+ "href": "file:///foo/bar.txt",
+ "protocol": "file:",
+ "username": "",
+ "password": "",
+ "host": "",
+ "hostname": "",
+ "port": "",
+ "pathname": "/foo/bar.txt",
+ "search": "",
+ "hash": ""
+ },
+ {
+ "input": "file:///home/me",
+ "base": "file:///tmp/mock/path",
+ "href": "file:///home/me",
+ "protocol": "file:",
+ "username": "",
+ "password": "",
+ "host": "",
+ "hostname": "",
+ "port": "",
+ "pathname": "/home/me",
+ "search": "",
+ "hash": ""
+ },
+ {
+ "input": "//",
+ "base": "file:///tmp/mock/path",
+ "href": "file:///",
+ "protocol": "file:",
+ "username": "",
+ "password": "",
+ "host": "",
+ "hostname": "",
+ "port": "",
+ "pathname": "/",
+ "search": "",
+ "hash": ""
+ },
+ {
+ "input": "///",
+ "base": "file:///tmp/mock/path",
+ "href": "file:///",
+ "protocol": "file:",
+ "username": "",
+ "password": "",
+ "host": "",
+ "hostname": "",
+ "port": "",
+ "pathname": "/",
+ "search": "",
+ "hash": ""
+ },
+ {
+ "input": "///test",
+ "base": "file:///tmp/mock/path",
+ "href": "file:///test",
+ "protocol": "file:",
+ "username": "",
+ "password": "",
+ "host": "",
+ "hostname": "",
+ "port": "",
+ "pathname": "/test",
+ "search": "",
+ "hash": ""
+ },
+ {
+ "input": "file://test",
+ "base": "file:///tmp/mock/path",
+ "href": "file://test/",
+ "protocol": "file:",
+ "username": "",
+ "password": "",
+ "host": "test",
+ "hostname": "test",
+ "port": "",
+ "pathname": "/",
+ "search": "",
+ "hash": ""
+ },
+ {
+ "input": "file://localhost",
+ "base": "file:///tmp/mock/path",
+ "href": "file:///",
+ "protocol": "file:",
+ "username": "",
+ "password": "",
+ "host": "",
+ "hostname": "",
+ "port": "",
+ "pathname": "/",
+ "search": "",
+ "hash": ""
+ },
+ {
+ "input": "file://localhost/",
+ "base": "file:///tmp/mock/path",
+ "href": "file:///",
+ "protocol": "file:",
+ "username": "",
+ "password": "",
+ "host": "",
+ "hostname": "",
+ "port": "",
+ "pathname": "/",
+ "search": "",
+ "hash": ""
+ },
+ {
+ "input": "file://localhost/test",
+ "base": "file:///tmp/mock/path",
+ "href": "file:///test",
+ "protocol": "file:",
+ "username": "",
+ "password": "",
+ "host": "",
+ "hostname": "",
+ "port": "",
+ "pathname": "/test",
+ "search": "",
+ "hash": ""
+ },
+ {
+ "input": "test",
+ "base": "file:///tmp/mock/path",
+ "href": "file:///tmp/mock/test",
+ "protocol": "file:",
+ "username": "",
+ "password": "",
+ "host": "",
+ "hostname": "",
+ "port": "",
+ "pathname": "/tmp/mock/test",
+ "search": "",
+ "hash": ""
+ },
+ {
+ "input": "file:test",
+ "base": "file:///tmp/mock/path",
+ "href": "file:///tmp/mock/test",
+ "protocol": "file:",
+ "username": "",
+ "password": "",
+ "host": "",
+ "hostname": "",
+ "port": "",
+ "pathname": "/tmp/mock/test",
+ "search": "",
+ "hash": ""
+ },
+ "# Based on http://trac.webkit.org/browser/trunk/LayoutTests/fast/url/script-tests/path.js",
+ {
+ "input": "http://example.com/././foo",
+ "base": "about:blank",
+ "href": "http://example.com/foo",
+ "origin": "http://example.com",
+ "protocol": "http:",
+ "username": "",
+ "password": "",
+ "host": "example.com",
+ "hostname": "example.com",
+ "port": "",
+ "pathname": "/foo",
+ "search": "",
+ "hash": ""
+ },
+ {
+ "input": "http://example.com/./.foo",
+ "base": "about:blank",
+ "href": "http://example.com/.foo",
+ "origin": "http://example.com",
+ "protocol": "http:",
+ "username": "",
+ "password": "",
+ "host": "example.com",
+ "hostname": "example.com",
+ "port": "",
+ "pathname": "/.foo",
+ "search": "",
+ "hash": ""
+ },
+ {
+ "input": "http://example.com/foo/.",
+ "base": "about:blank",
+ "href": "http://example.com/foo/",
+ "origin": "http://example.com",
+ "protocol": "http:",
+ "username": "",
+ "password": "",
+ "host": "example.com",
+ "hostname": "example.com",
+ "port": "",
+ "pathname": "/foo/",
+ "search": "",
+ "hash": ""
+ },
+ {
+ "input": "http://example.com/foo/./",
+ "base": "about:blank",
+ "href": "http://example.com/foo/",
+ "origin": "http://example.com",
+ "protocol": "http:",
+ "username": "",
+ "password": "",
+ "host": "example.com",
+ "hostname": "example.com",
+ "port": "",
+ "pathname": "/foo/",
+ "search": "",
+ "hash": ""
+ },
+ {
+ "input": "http://example.com/foo/bar/..",
+ "base": "about:blank",
+ "href": "http://example.com/foo/",
+ "origin": "http://example.com",
+ "protocol": "http:",
+ "username": "",
+ "password": "",
+ "host": "example.com",
+ "hostname": "example.com",
+ "port": "",
+ "pathname": "/foo/",
+ "search": "",
+ "hash": ""
+ },
+ {
+ "input": "http://example.com/foo/bar/../",
+ "base": "about:blank",
+ "href": "http://example.com/foo/",
+ "origin": "http://example.com",
+ "protocol": "http:",
+ "username": "",
+ "password": "",
+ "host": "example.com",
+ "hostname": "example.com",
+ "port": "",
+ "pathname": "/foo/",
+ "search": "",
+ "hash": ""
+ },
+ {
+ "input": "http://example.com/foo/..bar",
+ "base": "about:blank",
+ "href": "http://example.com/foo/..bar",
+ "origin": "http://example.com",
+ "protocol": "http:",
+ "username": "",
+ "password": "",
+ "host": "example.com",
+ "hostname": "example.com",
+ "port": "",
+ "pathname": "/foo/..bar",
+ "search": "",
+ "hash": ""
+ },
+ {
+ "input": "http://example.com/foo/bar/../ton",
+ "base": "about:blank",
+ "href": "http://example.com/foo/ton",
+ "origin": "http://example.com",
+ "protocol": "http:",
+ "username": "",
+ "password": "",
+ "host": "example.com",
+ "hostname": "example.com",
+ "port": "",
+ "pathname": "/foo/ton",
+ "search": "",
+ "hash": ""
+ },
+ {
+ "input": "http://example.com/foo/bar/../ton/../../a",
+ "base": "about:blank",
+ "href": "http://example.com/a",
+ "origin": "http://example.com",
+ "protocol": "http:",
+ "username": "",
+ "password": "",
+ "host": "example.com",
+ "hostname": "example.com",
+ "port": "",
+ "pathname": "/a",
+ "search": "",
+ "hash": ""
+ },
+ {
+ "input": "http://example.com/foo/../../..",
+ "base": "about:blank",
+ "href": "http://example.com/",
+ "origin": "http://example.com",
+ "protocol": "http:",
+ "username": "",
+ "password": "",
+ "host": "example.com",
+ "hostname": "example.com",
+ "port": "",
+ "pathname": "/",
+ "search": "",
+ "hash": ""
+ },
+ {
+ "input": "http://example.com/foo/../../../ton",
+ "base": "about:blank",
+ "href": "http://example.com/ton",
+ "origin": "http://example.com",
+ "protocol": "http:",
+ "username": "",
+ "password": "",
+ "host": "example.com",
+ "hostname": "example.com",
+ "port": "",
+ "pathname": "/ton",
+ "search": "",
+ "hash": ""
+ },
+ {
+ "input": "http://example.com/foo/%2e",
+ "base": "about:blank",
+ "href": "http://example.com/foo/",
+ "origin": "http://example.com",
+ "protocol": "http:",
+ "username": "",
+ "password": "",
+ "host": "example.com",
+ "hostname": "example.com",
+ "port": "",
+ "pathname": "/foo/",
+ "search": "",
+ "hash": ""
+ },
+ {
+ "input": "http://example.com/foo/%2e%2",
+ "base": "about:blank",
+ "href": "http://example.com/foo/.%2",
+ "origin": "http://example.com",
+ "protocol": "http:",
+ "username": "",
+ "password": "",
+ "host": "example.com",
+ "hostname": "example.com",
+ "port": "",
+ "pathname": "/foo/.%2",
+ "search": "",
+ "hash": ""
+ },
+ {
+ "input": "http://example.com/foo/%2e./%2e%2e/.%2e/%2e.bar",
+ "base": "about:blank",
+ "href": "http://example.com/..bar",
+ "origin": "http://example.com",
+ "protocol": "http:",
+ "username": "",
+ "password": "",
+ "host": "example.com",
+ "hostname": "example.com",
+ "port": "",
+ "pathname": "/..bar",
+ "search": "",
+ "hash": ""
+ },
+ {
+ "input": "http://example.com////../..",
+ "base": "about:blank",
+ "href": "http://example.com//",
+ "origin": "http://example.com",
+ "protocol": "http:",
+ "username": "",
+ "password": "",
+ "host": "example.com",
+ "hostname": "example.com",
+ "port": "",
+ "pathname": "//",
+ "search": "",
+ "hash": ""
+ },
+ {
+ "input": "http://example.com/foo/bar//../..",
+ "base": "about:blank",
+ "href": "http://example.com/foo/",
+ "origin": "http://example.com",
+ "protocol": "http:",
+ "username": "",
+ "password": "",
+ "host": "example.com",
+ "hostname": "example.com",
+ "port": "",
+ "pathname": "/foo/",
+ "search": "",
+ "hash": ""
+ },
+ {
+ "input": "http://example.com/foo/bar//..",
+ "base": "about:blank",
+ "href": "http://example.com/foo/bar/",
+ "origin": "http://example.com",
+ "protocol": "http:",
+ "username": "",
+ "password": "",
+ "host": "example.com",
+ "hostname": "example.com",
+ "port": "",
+ "pathname": "/foo/bar/",
+ "search": "",
+ "hash": ""
+ },
+ {
+ "input": "http://example.com/foo",
+ "base": "about:blank",
+ "href": "http://example.com/foo",
+ "origin": "http://example.com",
+ "protocol": "http:",
+ "username": "",
+ "password": "",
+ "host": "example.com",
+ "hostname": "example.com",
+ "port": "",
+ "pathname": "/foo",
+ "search": "",
+ "hash": ""
+ },
+ {
+ "input": "http://example.com/%20foo",
+ "base": "about:blank",
+ "href": "http://example.com/%20foo",
+ "origin": "http://example.com",
+ "protocol": "http:",
+ "username": "",
+ "password": "",
+ "host": "example.com",
+ "hostname": "example.com",
+ "port": "",
+ "pathname": "/%20foo",
+ "search": "",
+ "hash": ""
+ },
+ {
+ "input": "http://example.com/foo%",
+ "base": "about:blank",
+ "href": "http://example.com/foo%",
+ "origin": "http://example.com",
+ "protocol": "http:",
+ "username": "",
+ "password": "",
+ "host": "example.com",
+ "hostname": "example.com",
+ "port": "",
+ "pathname": "/foo%",
+ "search": "",
+ "hash": ""
+ },
+ {
+ "input": "http://example.com/foo%2",
+ "base": "about:blank",
+ "href": "http://example.com/foo%2",
+ "origin": "http://example.com",
+ "protocol": "http:",
+ "username": "",
+ "password": "",
+ "host": "example.com",
+ "hostname": "example.com",
+ "port": "",
+ "pathname": "/foo%2",
+ "search": "",
+ "hash": ""
+ },
+ {
+ "input": "http://example.com/foo%2zbar",
+ "base": "about:blank",
+ "href": "http://example.com/foo%2zbar",
+ "origin": "http://example.com",
+ "protocol": "http:",
+ "username": "",
+ "password": "",
+ "host": "example.com",
+ "hostname": "example.com",
+ "port": "",
+ "pathname": "/foo%2zbar",
+ "search": "",
+ "hash": ""
+ },
+ {
+ "input": "http://example.com/foo%2©zbar",
+ "base": "about:blank",
+ "href": "http://example.com/foo%2%C3%82%C2%A9zbar",
+ "origin": "http://example.com",
+ "protocol": "http:",
+ "username": "",
+ "password": "",
+ "host": "example.com",
+ "hostname": "example.com",
+ "port": "",
+ "pathname": "/foo%2%C3%82%C2%A9zbar",
+ "search": "",
+ "hash": ""
+ },
+ {
+ "input": "http://example.com/foo%41%7a",
+ "base": "about:blank",
+ "href": "http://example.com/foo%41%7a",
+ "origin": "http://example.com",
+ "protocol": "http:",
+ "username": "",
+ "password": "",
+ "host": "example.com",
+ "hostname": "example.com",
+ "port": "",
+ "pathname": "/foo%41%7a",
+ "search": "",
+ "hash": ""
+ },
+ {
+ "input": "http://example.com/foo\t\u0091%91",
+ "base": "about:blank",
+ "href": "http://example.com/foo%C2%91%91",
+ "origin": "http://example.com",
+ "protocol": "http:",
+ "username": "",
+ "password": "",
+ "host": "example.com",
+ "hostname": "example.com",
+ "port": "",
+ "pathname": "/foo%C2%91%91",
+ "search": "",
+ "hash": ""
+ },
+ {
+ "input": "http://example.com/foo%00%51",
+ "base": "about:blank",
+ "href": "http://example.com/foo%00%51",
+ "origin": "http://example.com",
+ "protocol": "http:",
+ "username": "",
+ "password": "",
+ "host": "example.com",
+ "hostname": "example.com",
+ "port": "",
+ "pathname": "/foo%00%51",
+ "search": "",
+ "hash": ""
+ },
+ {
+ "input": "http://example.com/(%28:%3A%29)",
+ "base": "about:blank",
+ "href": "http://example.com/(%28:%3A%29)",
+ "origin": "http://example.com",
+ "protocol": "http:",
+ "username": "",
+ "password": "",
+ "host": "example.com",
+ "hostname": "example.com",
+ "port": "",
+ "pathname": "/(%28:%3A%29)",
+ "search": "",
+ "hash": ""
+ },
+ {
+ "input": "http://example.com/%3A%3a%3C%3c",
+ "base": "about:blank",
+ "href": "http://example.com/%3A%3a%3C%3c",
+ "origin": "http://example.com",
+ "protocol": "http:",
+ "username": "",
+ "password": "",
+ "host": "example.com",
+ "hostname": "example.com",
+ "port": "",
+ "pathname": "/%3A%3a%3C%3c",
+ "search": "",
+ "hash": ""
+ },
+ {
+ "input": "http://example.com/foo\tbar",
+ "base": "about:blank",
+ "href": "http://example.com/foobar",
+ "origin": "http://example.com",
+ "protocol": "http:",
+ "username": "",
+ "password": "",
+ "host": "example.com",
+ "hostname": "example.com",
+ "port": "",
+ "pathname": "/foobar",
+ "search": "",
+ "hash": ""
+ },
+ {
+ "input": "http://example.com\\\\foo\\\\bar",
+ "base": "about:blank",
+ "href": "http://example.com//foo//bar",
+ "origin": "http://example.com",
+ "protocol": "http:",
+ "username": "",
+ "password": "",
+ "host": "example.com",
+ "hostname": "example.com",
+ "port": "",
+ "pathname": "//foo//bar",
+ "search": "",
+ "hash": ""
+ },
+ {
+ "input": "http://example.com/%7Ffp3%3Eju%3Dduvgw%3Dd",
+ "base": "about:blank",
+ "href": "http://example.com/%7Ffp3%3Eju%3Dduvgw%3Dd",
+ "origin": "http://example.com",
+ "protocol": "http:",
+ "username": "",
+ "password": "",
+ "host": "example.com",
+ "hostname": "example.com",
+ "port": "",
+ "pathname": "/%7Ffp3%3Eju%3Dduvgw%3Dd",
+ "search": "",
+ "hash": ""
+ },
+ {
+ "input": "http://example.com/@asdf%40",
+ "base": "about:blank",
+ "href": "http://example.com/@asdf%40",
+ "origin": "http://example.com",
+ "protocol": "http:",
+ "username": "",
+ "password": "",
+ "host": "example.com",
+ "hostname": "example.com",
+ "port": "",
+ "pathname": "/@asdf%40",
+ "search": "",
+ "hash": ""
+ },
+ {
+ "input": "http://example.com/你好你好",
+ "base": "about:blank",
+ "href": "http://example.com/%E4%BD%A0%E5%A5%BD%E4%BD%A0%E5%A5%BD",
+ "origin": "http://example.com",
+ "protocol": "http:",
+ "username": "",
+ "password": "",
+ "host": "example.com",
+ "hostname": "example.com",
+ "port": "",
+ "pathname": "/%E4%BD%A0%E5%A5%BD%E4%BD%A0%E5%A5%BD",
+ "search": "",
+ "hash": ""
+ },
+ {
+ "input": "http://example.com/‥/foo",
+ "base": "about:blank",
+ "href": "http://example.com/%E2%80%A5/foo",
+ "origin": "http://example.com",
+ "protocol": "http:",
+ "username": "",
+ "password": "",
+ "host": "example.com",
+ "hostname": "example.com",
+ "port": "",
+ "pathname": "/%E2%80%A5/foo",
+ "search": "",
+ "hash": ""
+ },
+ {
+ "input": "http://example.com//foo",
+ "base": "about:blank",
+ "href": "http://example.com/%EF%BB%BF/foo",
+ "origin": "http://example.com",
+ "protocol": "http:",
+ "username": "",
+ "password": "",
+ "host": "example.com",
+ "hostname": "example.com",
+ "port": "",
+ "pathname": "/%EF%BB%BF/foo",
+ "search": "",
+ "hash": ""
+ },
+ {
+ "input": "http://example.com/‮/foo/‭/bar",
+ "base": "about:blank",
+ "href": "http://example.com/%E2%80%AE/foo/%E2%80%AD/bar",
+ "origin": "http://example.com",
+ "protocol": "http:",
+ "username": "",
+ "password": "",
+ "host": "example.com",
+ "hostname": "example.com",
+ "port": "",
+ "pathname": "/%E2%80%AE/foo/%E2%80%AD/bar",
+ "search": "",
+ "hash": ""
+ },
+ "# Based on http://trac.webkit.org/browser/trunk/LayoutTests/fast/url/script-tests/relative.js",
+ {
+ "input": "http://www.google.com/foo?bar=baz#",
+ "base": "about:blank",
+ "href": "http://www.google.com/foo?bar=baz#",
+ "origin": "http://www.google.com",
+ "protocol": "http:",
+ "username": "",
+ "password": "",
+ "host": "www.google.com",
+ "hostname": "www.google.com",
+ "port": "",
+ "pathname": "/foo",
+ "search": "?bar=baz",
+ "hash": ""
+ },
+ {
+ "input": "http://www.google.com/foo?bar=baz# »",
+ "base": "about:blank",
+ "href": "http://www.google.com/foo?bar=baz# »",
+ "origin": "http://www.google.com",
+ "protocol": "http:",
+ "username": "",
+ "password": "",
+ "host": "www.google.com",
+ "hostname": "www.google.com",
+ "port": "",
+ "pathname": "/foo",
+ "search": "?bar=baz",
+ "hash": "# »"
+ },
+ {
+ "input": "data:test# »",
+ "base": "about:blank",
+ "href": "data:test# »",
+ "origin": "null",
+ "protocol": "data:",
+ "username": "",
+ "password": "",
+ "host": "",
+ "hostname": "",
+ "port": "",
+ "pathname": "test",
+ "search": "",
+ "hash": "# »"
+ },
+ {
+ "input": "http://[www.google.com]/",
+ "base": "about:blank",
+ "failure": true
+ },
+ {
+ "input": "http://www.google.com",
+ "base": "about:blank",
+ "href": "http://www.google.com/",
+ "origin": "http://www.google.com",
+ "protocol": "http:",
+ "username": "",
+ "password": "",
+ "host": "www.google.com",
+ "hostname": "www.google.com",
+ "port": "",
+ "pathname": "/",
+ "search": "",
+ "hash": ""
+ },
+ {
+ "input": "http://192.0x00A80001",
+ "base": "about:blank",
+ "href": "http://192.168.0.1/",
+ "origin": "http://192.168.0.1",
+ "protocol": "http:",
+ "username": "",
+ "password": "",
+ "host": "192.168.0.1",
+ "hostname": "192.168.0.1",
+ "port": "",
+ "pathname": "/",
+ "search": "",
+ "hash": ""
+ },
+ {
+ "input": "http://www/foo%2Ehtml",
+ "base": "about:blank",
+ "href": "http://www/foo.html",
+ "origin": "http://www",
+ "protocol": "http:",
+ "username": "",
+ "password": "",
+ "host": "www",
+ "hostname": "www",
+ "port": "",
+ "pathname": "/foo.html",
+ "search": "",
+ "hash": ""
+ },
+ {
+ "input": "http://www/foo/%2E/html",
+ "base": "about:blank",
+ "href": "http://www/foo/html",
+ "origin": "http://www",
+ "protocol": "http:",
+ "username": "",
+ "password": "",
+ "host": "www",
+ "hostname": "www",
+ "port": "",
+ "pathname": "/foo/html",
+ "search": "",
+ "hash": ""
+ },
+ {
+ "input": "http://user:pass@/",
+ "base": "about:blank",
+ "failure": true
+ },
+ {
+ "input": "http://%25DOMAIN:foobar@foodomain.com/",
+ "base": "about:blank",
+ "href": "http://%25DOMAIN:foobar@foodomain.com/",
+ "origin": "http://foodomain.com",
+ "protocol": "http:",
+ "username": "%25DOMAIN",
+ "password": "foobar",
+ "host": "foodomain.com",
+ "hostname": "foodomain.com",
+ "port": "",
+ "pathname": "/",
+ "search": "",
+ "hash": ""
+ },
+ {
+ "input": "http:\\\\www.google.com\\foo",
+ "base": "about:blank",
+ "href": "http://www.google.com/foo",
+ "origin": "http://www.google.com",
+ "protocol": "http:",
+ "username": "",
+ "password": "",
+ "host": "www.google.com",
+ "hostname": "www.google.com",
+ "port": "",
+ "pathname": "/foo",
+ "search": "",
+ "hash": ""
+ },
+ {
+ "input": "http://foo:80/",
+ "base": "about:blank",
+ "href": "http://foo/",
+ "origin": "http://foo",
+ "protocol": "http:",
+ "username": "",
+ "password": "",
+ "host": "foo",
+ "hostname": "foo",
+ "port": "",
+ "pathname": "/",
+ "search": "",
+ "hash": ""
+ },
+ {
+ "input": "http://foo:81/",
+ "base": "about:blank",
+ "href": "http://foo:81/",
+ "origin": "http://foo:81",
+ "protocol": "http:",
+ "username": "",
+ "password": "",
+ "host": "foo:81",
+ "hostname": "foo",
+ "port": "81",
+ "pathname": "/",
+ "search": "",
+ "hash": ""
+ },
+ {
+ "input": "httpa://foo:80/",
+ "base": "about:blank",
+ "href": "httpa://foo:80/",
+ "origin": "null",
+ "protocol": "httpa:",
+ "username": "",
+ "password": "",
+ "host": "foo:80",
+ "hostname": "foo",
+ "port": "80",
+ "pathname": "/",
+ "search": "",
+ "hash": ""
+ },
+ {
+ "input": "http://foo:-80/",
+ "base": "about:blank",
+ "failure": true
+ },
+ {
+ "input": "https://foo:443/",
+ "base": "about:blank",
+ "href": "https://foo/",
+ "origin": "https://foo",
+ "protocol": "https:",
+ "username": "",
+ "password": "",
+ "host": "foo",
+ "hostname": "foo",
+ "port": "",
+ "pathname": "/",
+ "search": "",
+ "hash": ""
+ },
+ {
+ "input": "https://foo:80/",
+ "base": "about:blank",
+ "href": "https://foo:80/",
+ "origin": "https://foo:80",
+ "protocol": "https:",
+ "username": "",
+ "password": "",
+ "host": "foo:80",
+ "hostname": "foo",
+ "port": "80",
+ "pathname": "/",
+ "search": "",
+ "hash": ""
+ },
+ {
+ "input": "ftp://foo:21/",
+ "base": "about:blank",
+ "href": "ftp://foo/",
+ "origin": "ftp://foo",
+ "protocol": "ftp:",
+ "username": "",
+ "password": "",
+ "host": "foo",
+ "hostname": "foo",
+ "port": "",
+ "pathname": "/",
+ "search": "",
+ "hash": ""
+ },
+ {
+ "input": "ftp://foo:80/",
+ "base": "about:blank",
+ "href": "ftp://foo:80/",
+ "origin": "ftp://foo:80",
+ "protocol": "ftp:",
+ "username": "",
+ "password": "",
+ "host": "foo:80",
+ "hostname": "foo",
+ "port": "80",
+ "pathname": "/",
+ "search": "",
+ "hash": ""
+ },
+ {
+ "input": "gopher://foo:70/",
+ "base": "about:blank",
+ "href": "gopher://foo/",
+ "origin": "gopher://foo",
+ "protocol": "gopher:",
+ "username": "",
+ "password": "",
+ "host": "foo",
+ "hostname": "foo",
+ "port": "",
+ "pathname": "/",
+ "search": "",
+ "hash": ""
+ },
+ {
+ "input": "gopher://foo:443/",
+ "base": "about:blank",
+ "href": "gopher://foo:443/",
+ "origin": "gopher://foo:443",
+ "protocol": "gopher:",
+ "username": "",
+ "password": "",
+ "host": "foo:443",
+ "hostname": "foo",
+ "port": "443",
+ "pathname": "/",
+ "search": "",
+ "hash": ""
+ },
+ {
+ "input": "ws://foo:80/",
+ "base": "about:blank",
+ "href": "ws://foo/",
+ "origin": "ws://foo",
+ "protocol": "ws:",
+ "username": "",
+ "password": "",
+ "host": "foo",
+ "hostname": "foo",
+ "port": "",
+ "pathname": "/",
+ "search": "",
+ "hash": ""
+ },
+ {
+ "input": "ws://foo:81/",
+ "base": "about:blank",
+ "href": "ws://foo:81/",
+ "origin": "ws://foo:81",
+ "protocol": "ws:",
+ "username": "",
+ "password": "",
+ "host": "foo:81",
+ "hostname": "foo",
+ "port": "81",
+ "pathname": "/",
+ "search": "",
+ "hash": ""
+ },
+ {
+ "input": "ws://foo:443/",
+ "base": "about:blank",
+ "href": "ws://foo:443/",
+ "origin": "ws://foo:443",
+ "protocol": "ws:",
+ "username": "",
+ "password": "",
+ "host": "foo:443",
+ "hostname": "foo",
+ "port": "443",
+ "pathname": "/",
+ "search": "",
+ "hash": ""
+ },
+ {
+ "input": "ws://foo:815/",
+ "base": "about:blank",
+ "href": "ws://foo:815/",
+ "origin": "ws://foo:815",
+ "protocol": "ws:",
+ "username": "",
+ "password": "",
+ "host": "foo:815",
+ "hostname": "foo",
+ "port": "815",
+ "pathname": "/",
+ "search": "",
+ "hash": ""
+ },
+ {
+ "input": "wss://foo:80/",
+ "base": "about:blank",
+ "href": "wss://foo:80/",
+ "origin": "wss://foo:80",
+ "protocol": "wss:",
+ "username": "",
+ "password": "",
+ "host": "foo:80",
+ "hostname": "foo",
+ "port": "80",
+ "pathname": "/",
+ "search": "",
+ "hash": ""
+ },
+ {
+ "input": "wss://foo:81/",
+ "base": "about:blank",
+ "href": "wss://foo:81/",
+ "origin": "wss://foo:81",
+ "protocol": "wss:",
+ "username": "",
+ "password": "",
+ "host": "foo:81",
+ "hostname": "foo",
+ "port": "81",
+ "pathname": "/",
+ "search": "",
+ "hash": ""
+ },
+ {
+ "input": "wss://foo:443/",
+ "base": "about:blank",
+ "href": "wss://foo/",
+ "origin": "wss://foo",
+ "protocol": "wss:",
+ "username": "",
+ "password": "",
+ "host": "foo",
+ "hostname": "foo",
+ "port": "",
+ "pathname": "/",
+ "search": "",
+ "hash": ""
+ },
+ {
+ "input": "wss://foo:815/",
+ "base": "about:blank",
+ "href": "wss://foo:815/",
+ "origin": "wss://foo:815",
+ "protocol": "wss:",
+ "username": "",
+ "password": "",
+ "host": "foo:815",
+ "hostname": "foo",
+ "port": "815",
+ "pathname": "/",
+ "search": "",
+ "hash": ""
+ },
+ {
+ "input": "http:/example.com/",
+ "base": "about:blank",
+ "href": "http://example.com/",
+ "origin": "http://example.com",
+ "protocol": "http:",
+ "username": "",
+ "password": "",
+ "host": "example.com",
+ "hostname": "example.com",
+ "port": "",
+ "pathname": "/",
+ "search": "",
+ "hash": ""
+ },
+ {
+ "input": "ftp:/example.com/",
+ "base": "about:blank",
+ "href": "ftp://example.com/",
+ "origin": "ftp://example.com",
+ "protocol": "ftp:",
+ "username": "",
+ "password": "",
+ "host": "example.com",
+ "hostname": "example.com",
+ "port": "",
+ "pathname": "/",
+ "search": "",
+ "hash": ""
+ },
+ {
+ "input": "https:/example.com/",
+ "base": "about:blank",
+ "href": "https://example.com/",
+ "origin": "https://example.com",
+ "protocol": "https:",
+ "username": "",
+ "password": "",
+ "host": "example.com",
+ "hostname": "example.com",
+ "port": "",
+ "pathname": "/",
+ "search": "",
+ "hash": ""
+ },
+ {
+ "input": "madeupscheme:/example.com/",
+ "base": "about:blank",
+ "href": "madeupscheme:/example.com/",
+ "origin": "null",
+ "protocol": "madeupscheme:",
+ "username": "",
+ "password": "",
+ "host": "",
+ "hostname": "",
+ "port": "",
+ "pathname": "/example.com/",
+ "search": "",
+ "hash": ""
+ },
+ {
+ "input": "file:/example.com/",
+ "base": "about:blank",
+ "href": "file:///example.com/",
+ "protocol": "file:",
+ "username": "",
+ "password": "",
+ "host": "",
+ "hostname": "",
+ "port": "",
+ "pathname": "/example.com/",
+ "search": "",
+ "hash": ""
+ },
+ {
+ "input": "ftps:/example.com/",
+ "base": "about:blank",
+ "href": "ftps:/example.com/",
+ "origin": "null",
+ "protocol": "ftps:",
+ "username": "",
+ "password": "",
+ "host": "",
+ "hostname": "",
+ "port": "",
+ "pathname": "/example.com/",
+ "search": "",
+ "hash": ""
+ },
+ {
+ "input": "gopher:/example.com/",
+ "base": "about:blank",
+ "href": "gopher://example.com/",
+ "origin": "gopher://example.com",
+ "protocol": "gopher:",
+ "username": "",
+ "password": "",
+ "host": "example.com",
+ "hostname": "example.com",
+ "port": "",
+ "pathname": "/",
+ "search": "",
+ "hash": ""
+ },
+ {
+ "input": "ws:/example.com/",
+ "base": "about:blank",
+ "href": "ws://example.com/",
+ "origin": "ws://example.com",
+ "protocol": "ws:",
+ "username": "",
+ "password": "",
+ "host": "example.com",
+ "hostname": "example.com",
+ "port": "",
+ "pathname": "/",
+ "search": "",
+ "hash": ""
+ },
+ {
+ "input": "wss:/example.com/",
+ "base": "about:blank",
+ "href": "wss://example.com/",
+ "origin": "wss://example.com",
+ "protocol": "wss:",
+ "username": "",
+ "password": "",
+ "host": "example.com",
+ "hostname": "example.com",
+ "port": "",
+ "pathname": "/",
+ "search": "",
+ "hash": ""
+ },
+ {
+ "input": "data:/example.com/",
+ "base": "about:blank",
+ "href": "data:/example.com/",
+ "origin": "null",
+ "protocol": "data:",
+ "username": "",
+ "password": "",
+ "host": "",
+ "hostname": "",
+ "port": "",
+ "pathname": "/example.com/",
+ "search": "",
+ "hash": ""
+ },
+ {
+ "input": "javascript:/example.com/",
+ "base": "about:blank",
+ "href": "javascript:/example.com/",
+ "origin": "null",
+ "protocol": "javascript:",
+ "username": "",
+ "password": "",
+ "host": "",
+ "hostname": "",
+ "port": "",
+ "pathname": "/example.com/",
+ "search": "",
+ "hash": ""
+ },
+ {
+ "input": "mailto:/example.com/",
+ "base": "about:blank",
+ "href": "mailto:/example.com/",
+ "origin": "null",
+ "protocol": "mailto:",
+ "username": "",
+ "password": "",
+ "host": "",
+ "hostname": "",
+ "port": "",
+ "pathname": "/example.com/",
+ "search": "",
+ "hash": ""
+ },
+ {
+ "input": "http:example.com/",
+ "base": "about:blank",
+ "href": "http://example.com/",
+ "origin": "http://example.com",
+ "protocol": "http:",
+ "username": "",
+ "password": "",
+ "host": "example.com",
+ "hostname": "example.com",
+ "port": "",
+ "pathname": "/",
+ "search": "",
+ "hash": ""
+ },
+ {
+ "input": "ftp:example.com/",
+ "base": "about:blank",
+ "href": "ftp://example.com/",
+ "origin": "ftp://example.com",
+ "protocol": "ftp:",
+ "username": "",
+ "password": "",
+ "host": "example.com",
+ "hostname": "example.com",
+ "port": "",
+ "pathname": "/",
+ "search": "",
+ "hash": ""
+ },
+ {
+ "input": "https:example.com/",
+ "base": "about:blank",
+ "href": "https://example.com/",
+ "origin": "https://example.com",
+ "protocol": "https:",
+ "username": "",
+ "password": "",
+ "host": "example.com",
+ "hostname": "example.com",
+ "port": "",
+ "pathname": "/",
+ "search": "",
+ "hash": ""
+ },
+ {
+ "input": "madeupscheme:example.com/",
+ "base": "about:blank",
+ "href": "madeupscheme:example.com/",
+ "origin": "null",
+ "protocol": "madeupscheme:",
+ "username": "",
+ "password": "",
+ "host": "",
+ "hostname": "",
+ "port": "",
+ "pathname": "example.com/",
+ "search": "",
+ "hash": ""
+ },
+ {
+ "input": "ftps:example.com/",
+ "base": "about:blank",
+ "href": "ftps:example.com/",
+ "origin": "null",
+ "protocol": "ftps:",
+ "username": "",
+ "password": "",
+ "host": "",
+ "hostname": "",
+ "port": "",
+ "pathname": "example.com/",
+ "search": "",
+ "hash": ""
+ },
+ {
+ "input": "gopher:example.com/",
+ "base": "about:blank",
+ "href": "gopher://example.com/",
+ "origin": "gopher://example.com",
+ "protocol": "gopher:",
+ "username": "",
+ "password": "",
+ "host": "example.com",
+ "hostname": "example.com",
+ "port": "",
+ "pathname": "/",
+ "search": "",
+ "hash": ""
+ },
+ {
+ "input": "ws:example.com/",
+ "base": "about:blank",
+ "href": "ws://example.com/",
+ "origin": "ws://example.com",
+ "protocol": "ws:",
+ "username": "",
+ "password": "",
+ "host": "example.com",
+ "hostname": "example.com",
+ "port": "",
+ "pathname": "/",
+ "search": "",
+ "hash": ""
+ },
+ {
+ "input": "wss:example.com/",
+ "base": "about:blank",
+ "href": "wss://example.com/",
+ "origin": "wss://example.com",
+ "protocol": "wss:",
+ "username": "",
+ "password": "",
+ "host": "example.com",
+ "hostname": "example.com",
+ "port": "",
+ "pathname": "/",
+ "search": "",
+ "hash": ""
+ },
+ {
+ "input": "data:example.com/",
+ "base": "about:blank",
+ "href": "data:example.com/",
+ "origin": "null",
+ "protocol": "data:",
+ "username": "",
+ "password": "",
+ "host": "",
+ "hostname": "",
+ "port": "",
+ "pathname": "example.com/",
+ "search": "",
+ "hash": ""
+ },
+ {
+ "input": "javascript:example.com/",
+ "base": "about:blank",
+ "href": "javascript:example.com/",
+ "origin": "null",
+ "protocol": "javascript:",
+ "username": "",
+ "password": "",
+ "host": "",
+ "hostname": "",
+ "port": "",
+ "pathname": "example.com/",
+ "search": "",
+ "hash": ""
+ },
+ {
+ "input": "mailto:example.com/",
+ "base": "about:blank",
+ "href": "mailto:example.com/",
+ "origin": "null",
+ "protocol": "mailto:",
+ "username": "",
+ "password": "",
+ "host": "",
+ "hostname": "",
+ "port": "",
+ "pathname": "example.com/",
+ "search": "",
+ "hash": ""
+ },
+ "# Based on http://trac.webkit.org/browser/trunk/LayoutTests/fast/url/segments-userinfo-vs-host.html",
+ {
+ "input": "http:@www.example.com",
+ "base": "about:blank",
+ "href": "http://www.example.com/",
+ "origin": "http://www.example.com",
+ "protocol": "http:",
+ "username": "",
+ "password": "",
+ "host": "www.example.com",
+ "hostname": "www.example.com",
+ "port": "",
+ "pathname": "/",
+ "search": "",
+ "hash": ""
+ },
+ {
+ "input": "http:/@www.example.com",
+ "base": "about:blank",
+ "href": "http://www.example.com/",
+ "origin": "http://www.example.com",
+ "protocol": "http:",
+ "username": "",
+ "password": "",
+ "host": "www.example.com",
+ "hostname": "www.example.com",
+ "port": "",
+ "pathname": "/",
+ "search": "",
+ "hash": ""
+ },
+ {
+ "input": "http://@www.example.com",
+ "base": "about:blank",
+ "href": "http://www.example.com/",
+ "origin": "http://www.example.com",
+ "protocol": "http:",
+ "username": "",
+ "password": "",
+ "host": "www.example.com",
+ "hostname": "www.example.com",
+ "port": "",
+ "pathname": "/",
+ "search": "",
+ "hash": ""
+ },
+ {
+ "input": "http:a:b@www.example.com",
+ "base": "about:blank",
+ "href": "http://a:b@www.example.com/",
+ "origin": "http://www.example.com",
+ "protocol": "http:",
+ "username": "a",
+ "password": "b",
+ "host": "www.example.com",
+ "hostname": "www.example.com",
+ "port": "",
+ "pathname": "/",
+ "search": "",
+ "hash": ""
+ },
+ {
+ "input": "http:/a:b@www.example.com",
+ "base": "about:blank",
+ "href": "http://a:b@www.example.com/",
+ "origin": "http://www.example.com",
+ "protocol": "http:",
+ "username": "a",
+ "password": "b",
+ "host": "www.example.com",
+ "hostname": "www.example.com",
+ "port": "",
+ "pathname": "/",
+ "search": "",
+ "hash": ""
+ },
+ {
+ "input": "http://a:b@www.example.com",
+ "base": "about:blank",
+ "href": "http://a:b@www.example.com/",
+ "origin": "http://www.example.com",
+ "protocol": "http:",
+ "username": "a",
+ "password": "b",
+ "host": "www.example.com",
+ "hostname": "www.example.com",
+ "port": "",
+ "pathname": "/",
+ "search": "",
+ "hash": ""
+ },
+ {
+ "input": "http://@pple.com",
+ "base": "about:blank",
+ "href": "http://pple.com/",
+ "origin": "http://pple.com",
+ "protocol": "http:",
+ "username": "",
+ "password": "",
+ "host": "pple.com",
+ "hostname": "pple.com",
+ "port": "",
+ "pathname": "/",
+ "search": "",
+ "hash": ""
+ },
+ {
+ "input": "http::b@www.example.com",
+ "base": "about:blank",
+ "href": "http://:b@www.example.com/",
+ "origin": "http://www.example.com",
+ "protocol": "http:",
+ "username": "",
+ "password": "b",
+ "host": "www.example.com",
+ "hostname": "www.example.com",
+ "port": "",
+ "pathname": "/",
+ "search": "",
+ "hash": ""
+ },
+ {
+ "input": "http:/:b@www.example.com",
+ "base": "about:blank",
+ "href": "http://:b@www.example.com/",
+ "origin": "http://www.example.com",
+ "protocol": "http:",
+ "username": "",
+ "password": "b",
+ "host": "www.example.com",
+ "hostname": "www.example.com",
+ "port": "",
+ "pathname": "/",
+ "search": "",
+ "hash": ""
+ },
+ {
+ "input": "http://:b@www.example.com",
+ "base": "about:blank",
+ "href": "http://:b@www.example.com/",
+ "origin": "http://www.example.com",
+ "protocol": "http:",
+ "username": "",
+ "password": "b",
+ "host": "www.example.com",
+ "hostname": "www.example.com",
+ "port": "",
+ "pathname": "/",
+ "search": "",
+ "hash": ""
+ },
+ {
+ "input": "http:/:@/www.example.com",
+ "base": "about:blank",
+ "failure": true
+ },
+ {
+ "input": "http://user@/www.example.com",
+ "base": "about:blank",
+ "failure": true
+ },
+ {
+ "input": "http:@/www.example.com",
+ "base": "about:blank",
+ "failure": true
+ },
+ {
+ "input": "http:/@/www.example.com",
+ "base": "about:blank",
+ "failure": true
+ },
+ {
+ "input": "http://@/www.example.com",
+ "base": "about:blank",
+ "failure": true
+ },
+ {
+ "input": "https:@/www.example.com",
+ "base": "about:blank",
+ "failure": true
+ },
+ {
+ "input": "http:a:b@/www.example.com",
+ "base": "about:blank",
+ "failure": true
+ },
+ {
+ "input": "http:/a:b@/www.example.com",
+ "base": "about:blank",
+ "failure": true
+ },
+ {
+ "input": "http://a:b@/www.example.com",
+ "base": "about:blank",
+ "failure": true
+ },
+ {
+ "input": "http::@/www.example.com",
+ "base": "about:blank",
+ "failure": true
+ },
+ {
+ "input": "http:a:@www.example.com",
+ "base": "about:blank",
+ "href": "http://a:@www.example.com/",
+ "origin": "http://www.example.com",
+ "protocol": "http:",
+ "username": "a",
+ "password": "",
+ "host": "www.example.com",
+ "hostname": "www.example.com",
+ "port": "",
+ "pathname": "/",
+ "search": "",
+ "hash": ""
+ },
+ {
+ "input": "http:/a:@www.example.com",
+ "base": "about:blank",
+ "href": "http://a:@www.example.com/",
+ "origin": "http://www.example.com",
+ "protocol": "http:",
+ "username": "a",
+ "password": "",
+ "host": "www.example.com",
+ "hostname": "www.example.com",
+ "port": "",
+ "pathname": "/",
+ "search": "",
+ "hash": ""
+ },
+ {
+ "input": "http://a:@www.example.com",
+ "base": "about:blank",
+ "href": "http://a:@www.example.com/",
+ "origin": "http://www.example.com",
+ "protocol": "http:",
+ "username": "a",
+ "password": "",
+ "host": "www.example.com",
+ "hostname": "www.example.com",
+ "port": "",
+ "pathname": "/",
+ "search": "",
+ "hash": ""
+ },
+ {
+ "input": "http://www.@pple.com",
+ "base": "about:blank",
+ "href": "http://www.@pple.com/",
+ "origin": "http://pple.com",
+ "protocol": "http:",
+ "username": "www.",
+ "password": "",
+ "host": "pple.com",
+ "hostname": "pple.com",
+ "port": "",
+ "pathname": "/",
+ "search": "",
+ "hash": ""
+ },
+ {
+ "input": "http:@:www.example.com",
+ "base": "about:blank",
+ "failure": true
+ },
+ {
+ "input": "http:/@:www.example.com",
+ "base": "about:blank",
+ "failure": true
+ },
+ {
+ "input": "http://@:www.example.com",
+ "base": "about:blank",
+ "failure": true
+ },
+ {
+ "input": "http://:@www.example.com",
+ "base": "about:blank",
+ "href": "http://:@www.example.com/",
+ "origin": "http://www.example.com",
+ "protocol": "http:",
+ "username": "",
+ "password": "",
+ "host": "www.example.com",
+ "hostname": "www.example.com",
+ "port": "",
+ "pathname": "/",
+ "search": "",
+ "hash": ""
+ },
+ "# Others",
+ {
+ "input": "/",
+ "base": "http://www.example.com/test",
+ "href": "http://www.example.com/",
+ "origin": "http://www.example.com",
+ "protocol": "http:",
+ "username": "",
+ "password": "",
+ "host": "www.example.com",
+ "hostname": "www.example.com",
+ "port": "",
+ "pathname": "/",
+ "search": "",
+ "hash": ""
+ },
+ {
+ "input": "/test.txt",
+ "base": "http://www.example.com/test",
+ "href": "http://www.example.com/test.txt",
+ "origin": "http://www.example.com",
+ "protocol": "http:",
+ "username": "",
+ "password": "",
+ "host": "www.example.com",
+ "hostname": "www.example.com",
+ "port": "",
+ "pathname": "/test.txt",
+ "search": "",
+ "hash": ""
+ },
+ {
+ "input": ".",
+ "base": "http://www.example.com/test",
+ "href": "http://www.example.com/",
+ "origin": "http://www.example.com",
+ "protocol": "http:",
+ "username": "",
+ "password": "",
+ "host": "www.example.com",
+ "hostname": "www.example.com",
+ "port": "",
+ "pathname": "/",
+ "search": "",
+ "hash": ""
+ },
+ {
+ "input": "..",
+ "base": "http://www.example.com/test",
+ "href": "http://www.example.com/",
+ "origin": "http://www.example.com",
+ "protocol": "http:",
+ "username": "",
+ "password": "",
+ "host": "www.example.com",
+ "hostname": "www.example.com",
+ "port": "",
+ "pathname": "/",
+ "search": "",
+ "hash": ""
+ },
+ {
+ "input": "test.txt",
+ "base": "http://www.example.com/test",
+ "href": "http://www.example.com/test.txt",
+ "origin": "http://www.example.com",
+ "protocol": "http:",
+ "username": "",
+ "password": "",
+ "host": "www.example.com",
+ "hostname": "www.example.com",
+ "port": "",
+ "pathname": "/test.txt",
+ "search": "",
+ "hash": ""
+ },
+ {
+ "input": "./test.txt",
+ "base": "http://www.example.com/test",
+ "href": "http://www.example.com/test.txt",
+ "origin": "http://www.example.com",
+ "protocol": "http:",
+ "username": "",
+ "password": "",
+ "host": "www.example.com",
+ "hostname": "www.example.com",
+ "port": "",
+ "pathname": "/test.txt",
+ "search": "",
+ "hash": ""
+ },
+ {
+ "input": "../test.txt",
+ "base": "http://www.example.com/test",
+ "href": "http://www.example.com/test.txt",
+ "origin": "http://www.example.com",
+ "protocol": "http:",
+ "username": "",
+ "password": "",
+ "host": "www.example.com",
+ "hostname": "www.example.com",
+ "port": "",
+ "pathname": "/test.txt",
+ "search": "",
+ "hash": ""
+ },
+ {
+ "input": "../aaa/test.txt",
+ "base": "http://www.example.com/test",
+ "href": "http://www.example.com/aaa/test.txt",
+ "origin": "http://www.example.com",
+ "protocol": "http:",
+ "username": "",
+ "password": "",
+ "host": "www.example.com",
+ "hostname": "www.example.com",
+ "port": "",
+ "pathname": "/aaa/test.txt",
+ "search": "",
+ "hash": ""
+ },
+ {
+ "input": "../../test.txt",
+ "base": "http://www.example.com/test",
+ "href": "http://www.example.com/test.txt",
+ "origin": "http://www.example.com",
+ "protocol": "http:",
+ "username": "",
+ "password": "",
+ "host": "www.example.com",
+ "hostname": "www.example.com",
+ "port": "",
+ "pathname": "/test.txt",
+ "search": "",
+ "hash": ""
+ },
+ {
+ "input": "中/test.txt",
+ "base": "http://www.example.com/test",
+ "href": "http://www.example.com/%E4%B8%AD/test.txt",
+ "origin": "http://www.example.com",
+ "protocol": "http:",
+ "username": "",
+ "password": "",
+ "host": "www.example.com",
+ "hostname": "www.example.com",
+ "port": "",
+ "pathname": "/%E4%B8%AD/test.txt",
+ "search": "",
+ "hash": ""
+ },
+ {
+ "input": "http://www.example2.com",
+ "base": "http://www.example.com/test",
+ "href": "http://www.example2.com/",
+ "origin": "http://www.example2.com",
+ "protocol": "http:",
+ "username": "",
+ "password": "",
+ "host": "www.example2.com",
+ "hostname": "www.example2.com",
+ "port": "",
+ "pathname": "/",
+ "search": "",
+ "hash": ""
+ },
+ {
+ "input": "//www.example2.com",
+ "base": "http://www.example.com/test",
+ "href": "http://www.example2.com/",
+ "origin": "http://www.example2.com",
+ "protocol": "http:",
+ "username": "",
+ "password": "",
+ "host": "www.example2.com",
+ "hostname": "www.example2.com",
+ "port": "",
+ "pathname": "/",
+ "search": "",
+ "hash": ""
+ },
+ {
+ "input": "file:...",
+ "base": "http://www.example.com/test",
+ "href": "file:///...",
+ "protocol": "file:",
+ "username": "",
+ "password": "",
+ "host": "",
+ "hostname": "",
+ "port": "",
+ "pathname": "/...",
+ "search": "",
+ "hash": ""
+ },
+ {
+ "input": "file:..",
+ "base": "http://www.example.com/test",
+ "href": "file:///",
+ "protocol": "file:",
+ "username": "",
+ "password": "",
+ "host": "",
+ "hostname": "",
+ "port": "",
+ "pathname": "/",
+ "search": "",
+ "hash": ""
+ },
+ {
+ "input": "file:a",
+ "base": "http://www.example.com/test",
+ "href": "file:///a",
+ "protocol": "file:",
+ "username": "",
+ "password": "",
+ "host": "",
+ "hostname": "",
+ "port": "",
+ "pathname": "/a",
+ "search": "",
+ "hash": ""
+ },
+ "# Based on http://trac.webkit.org/browser/trunk/LayoutTests/fast/url/host.html",
+ "Basic canonicalization, uppercase should be converted to lowercase",
+ {
+ "input": "http://ExAmPlE.CoM",
+ "base": "http://other.com/",
+ "href": "http://example.com/",
+ "origin": "http://example.com",
+ "protocol": "http:",
+ "username": "",
+ "password": "",
+ "host": "example.com",
+ "hostname": "example.com",
+ "port": "",
+ "pathname": "/",
+ "search": "",
+ "hash": ""
+ },
+ {
+ "input": "http://example example.com",
+ "base": "http://other.com/",
+ "failure": true
+ },
+ {
+ "input": "http://Goo%20 goo%7C|.com",
+ "base": "http://other.com/",
+ "failure": true
+ },
+ {
+ "input": "http://[]",
+ "base": "http://other.com/",
+ "failure": true
+ },
+ {
+ "input": "http://[:]",
+ "base": "http://other.com/",
+ "failure": true
+ },
+ "U+3000 is mapped to U+0020 (space) which is disallowed",
+ {
+ "input": "http://GOO\u00a0\u3000goo.com",
+ "base": "http://other.com/",
+ "failure": true
+ },
+ "Other types of space (no-break, zero-width, zero-width-no-break) are name-prepped away to nothing. U+200B, U+2060, and U+FEFF, are ignored",
+ {
+ "input": "http://GOO\u200b\u2060\ufeffgoo.com",
+ "base": "http://other.com/",
+ "href": "http://googoo.com/",
+ "origin": "http://googoo.com",
+ "protocol": "http:",
+ "username": "",
+ "password": "",
+ "host": "googoo.com",
+ "hostname": "googoo.com",
+ "port": "",
+ "pathname": "/",
+ "search": "",
+ "hash": ""
+ },
+ "Ideographic full stop (full-width period for Chinese, etc.) should be treated as a dot. U+3002 is mapped to U+002E (dot)",
+ {
+ "input": "http://www.foo。bar.com",
+ "base": "http://other.com/",
+ "href": "http://www.foo.bar.com/",
+ "origin": "http://www.foo.bar.com",
+ "protocol": "http:",
+ "username": "",
+ "password": "",
+ "host": "www.foo.bar.com",
+ "hostname": "www.foo.bar.com",
+ "port": "",
+ "pathname": "/",
+ "search": "",
+ "hash": ""
+ },
+ "Invalid unicode characters should fail... U+FDD0 is disallowed; %ef%b7%90 is U+FDD0",
+ {
+ "input": "http://\ufdd0zyx.com",
+ "base": "http://other.com/",
+ "failure": true
+ },
+ "This is the same as previous but escaped",
+ {
+ "input": "http://%ef%b7%90zyx.com",
+ "base": "http://other.com/",
+ "failure": true
+ },
+ "Test name prepping, fullwidth input should be converted to ASCII and NOT IDN-ized. This is 'Go' in fullwidth UTF-8/UTF-16.",
+ {
+ "input": "http://\uff27\uff4f.com",
+ "base": "http://other.com/",
+ "href": "http://go.com/",
+ "origin": "http://go.com",
+ "protocol": "http:",
+ "username": "",
+ "password": "",
+ "host": "go.com",
+ "hostname": "go.com",
+ "port": "",
+ "pathname": "/",
+ "search": "",
+ "hash": ""
+ },
+ "URL spec forbids the following. https://www.w3.org/Bugs/Public/show_bug.cgi?id=24257",
+ {
+ "input": "http://\uff05\uff14\uff11.com",
+ "base": "http://other.com/",
+ "failure": true
+ },
+ {
+ "input": "http://%ef%bc%85%ef%bc%94%ef%bc%91.com",
+ "base": "http://other.com/",
+ "failure": true
+ },
+ "...%00 in fullwidth should fail (also as escaped UTF-8 input)",
+ {
+ "input": "http://\uff05\uff10\uff10.com",
+ "base": "http://other.com/",
+ "failure": true
+ },
+ {
+ "input": "http://%ef%bc%85%ef%bc%90%ef%bc%90.com",
+ "base": "http://other.com/",
+ "failure": true
+ },
+ "Basic IDN support, UTF-8 and UTF-16 input should be converted to IDN",
+ {
+ "input": "http://你好你好",
+ "base": "http://other.com/",
+ "href": "http://xn--6qqa088eba/",
+ "origin": "http://你好你好",
+ "protocol": "http:",
+ "username": "",
+ "password": "",
+ "host": "xn--6qqa088eba",
+ "hostname": "xn--6qqa088eba",
+ "port": "",
+ "pathname": "/",
+ "search": "",
+ "hash": ""
+ },
+ "Invalid escaped characters should fail and the percents should be escaped. https://www.w3.org/Bugs/Public/show_bug.cgi?id=24191",
+ {
+ "input": "http://%zz%66%a.com",
+ "base": "http://other.com/",
+ "failure": true
+ },
+ "If we get an invalid character that has been escaped.",
+ {
+ "input": "http://%25",
+ "base": "http://other.com/",
+ "failure": true
+ },
+ {
+ "input": "http://hello%00",
+ "base": "http://other.com/",
+ "failure": true
+ },
+ "Escaped numbers should be treated like IP addresses if they are.",
+ {
+ "input": "http://%30%78%63%30%2e%30%32%35%30.01",
+ "base": "http://other.com/",
+ "href": "http://192.168.0.1/",
+ "origin": "http://192.168.0.1",
+ "protocol": "http:",
+ "username": "",
+ "password": "",
+ "host": "192.168.0.1",
+ "hostname": "192.168.0.1",
+ "port": "",
+ "pathname": "/",
+ "search": "",
+ "hash": ""
+ },
+ {
+ "input": "http://%30%78%63%30%2e%30%32%35%30.01%2e",
+ "base": "http://other.com/",
+ "href": "http://192.168.0.1/",
+ "origin": "http://192.168.0.1",
+ "protocol": "http:",
+ "username": "",
+ "password": "",
+ "host": "192.168.0.1",
+ "hostname": "192.168.0.1",
+ "port": "",
+ "pathname": "/",
+ "search": "",
+ "hash": ""
+ },
+ {
+ "input": "http://192.168.0.257",
+ "base": "http://other.com/",
+ "failure": true
+ },
+ "Invalid escaping should trigger the regular host error handling",
+ {
+ "input": "http://%3g%78%63%30%2e%30%32%35%30%2E.01",
+ "base": "http://other.com/",
+ "failure": true
+ },
+ "Something that isn't exactly an IP should get treated as a host and spaces escaped",
+ {
+ "input": "http://192.168.0.1 hello",
+ "base": "http://other.com/",
+ "failure": true
+ },
+ "Fullwidth and escaped UTF-8 fullwidth should still be treated as IP",
+ {
+ "input": "http://\uff10\uff38\uff43\uff10\uff0e\uff10\uff12\uff15\uff10\uff0e\uff10\uff11",
+ "base": "http://other.com/",
+ "href": "http://192.168.0.1/",
+ "origin": "http://192.168.0.1",
+ "protocol": "http:",
+ "username": "",
+ "password": "",
+ "host": "192.168.0.1",
+ "hostname": "192.168.0.1",
+ "port": "",
+ "pathname": "/",
+ "search": "",
+ "hash": ""
+ },
+ "Broken IPv6",
+ {
+ "input": "http://[google.com]",
+ "base": "http://other.com/",
+ "failure": true
+ },
+ "Misc Unicode",
+ {
+ "input": "http://foo:💩@example.com/bar",
+ "base": "http://other.com/",
+ "href": "http://foo:%F0%9F%92%A9@example.com/bar",
+ "origin": "http://example.com",
+ "protocol": "http:",
+ "username": "foo",
+ "password": "%F0%9F%92%A9",
+ "host": "example.com",
+ "hostname": "example.com",
+ "port": "",
+ "pathname": "/bar",
+ "search": "",
+ "hash": ""
+ },
+ "# resolving a fragment against any scheme succeeds",
+ {
+ "input": "#",
+ "base": "test:test",
+ "href": "test:test#",
+ "origin": "null",
+ "protocol": "test:",
+ "username": "",
+ "password": "",
+ "host": "",
+ "hostname": "",
+ "port": "",
+ "pathname": "test",
+ "search": "",
+ "hash": ""
+ },
+ {
+ "input": "#x",
+ "base": "mailto:x@x.com",
+ "href": "mailto:x@x.com#x",
+ "origin": "null",
+ "protocol": "mailto:",
+ "username": "",
+ "password": "",
+ "host": "",
+ "hostname": "",
+ "port": "",
+ "pathname": "x@x.com",
+ "search": "",
+ "hash": "#x"
+ },
+ {
+ "input": "#x",
+ "base": "data:,",
+ "href": "data:,#x",
+ "origin": "null",
+ "protocol": "data:",
+ "username": "",
+ "password": "",
+ "host": "",
+ "hostname": "",
+ "port": "",
+ "pathname": ",",
+ "search": "",
+ "hash": "#x"
+ },
+ {
+ "input": "#x",
+ "base": "about:blank",
+ "href": "about:blank#x",
+ "origin": "null",
+ "protocol": "about:",
+ "username": "",
+ "password": "",
+ "host": "",
+ "hostname": "",
+ "port": "",
+ "pathname": "blank",
+ "search": "",
+ "hash": "#x"
+ },
+ {
+ "input": "#",
+ "base": "test:test?test",
+ "href": "test:test?test#",
+ "origin": "null",
+ "protocol": "test:",
+ "username": "",
+ "password": "",
+ "host": "",
+ "hostname": "",
+ "port": "",
+ "pathname": "test",
+ "search": "?test",
+ "hash": ""
+ },
+ "# multiple @ in authority state",
+ {
+ "input": "https://@test@test@example:800/",
+ "base": "http://doesnotmatter/",
+ "href": "https://%40test%40test@example:800/",
+ "origin": "https://example:800",
+ "protocol": "https:",
+ "username": "%40test%40test",
+ "password": "",
+ "host": "example:800",
+ "hostname": "example",
+ "port": "800",
+ "pathname": "/",
+ "search": "",
+ "hash": ""
+ },
+ {
+ "input": "https://@@@example",
+ "base": "http://doesnotmatter/",
+ "href": "https://%40%40@example/",
+ "origin": "https://example",
+ "protocol": "https:",
+ "username": "%40%40",
+ "password": "",
+ "host": "example",
+ "hostname": "example",
+ "port": "",
+ "pathname": "/",
+ "search": "",
+ "hash": ""
+ },
+ "non-az-09 characters",
+ {
+ "input": "http://`{}:`{}@h/`{}?`{}",
+ "base": "http://doesnotmatter/",
+ "href": "http://%60%7B%7D:%60%7B%7D@h/%60%7B%7D?`{}",
+ "origin": "http://h",
+ "protocol": "http:",
+ "username": "%60%7B%7D",
+ "password": "%60%7B%7D",
+ "host": "h",
+ "hostname": "h",
+ "port": "",
+ "pathname": "/%60%7B%7D",
+ "search": "?`{}",
+ "hash": ""
+ },
+ "# Credentials in base",
+ {
+ "input": "/some/path",
+ "base": "http://user@example.org/smth",
+ "href": "http://user@example.org/some/path",
+ "origin": "http://example.org",
+ "protocol": "http:",
+ "username": "user",
+ "password": "",
+ "host": "example.org",
+ "hostname": "example.org",
+ "port": "",
+ "pathname": "/some/path",
+ "search": "",
+ "hash": ""
+ },
+ {
+ "input": "",
+ "base": "http://user:pass@example.org:21/smth",
+ "href": "http://user:pass@example.org:21/smth",
+ "origin": "http://example.org:21",
+ "protocol": "http:",
+ "username": "user",
+ "password": "pass",
+ "host": "example.org:21",
+ "hostname": "example.org",
+ "port": "21",
+ "pathname": "/smth",
+ "search": "",
+ "hash": ""
+ },
+ {
+ "input": "/some/path",
+ "base": "http://user:pass@example.org:21/smth",
+ "href": "http://user:pass@example.org:21/some/path",
+ "origin": "http://example.org:21",
+ "protocol": "http:",
+ "username": "user",
+ "password": "pass",
+ "host": "example.org:21",
+ "hostname": "example.org",
+ "port": "21",
+ "pathname": "/some/path",
+ "search": "",
+ "hash": ""
+ },
+ "# a set of tests designed by zcorpan for relative URLs with unknown schemes",
+ {
+ "input": "i",
+ "base": "sc:sd",
+ "failure": true
+ },
+ {
+ "input": "i",
+ "base": "sc:sd/sd",
+ "failure": true
+ },
+ {
+ "input": "i",
+ "base": "sc:/pa/pa",
+ "href": "sc:/pa/i",
+ "origin": "null",
+ "protocol": "sc:",
+ "username": "",
+ "password": "",
+ "host": "",
+ "hostname": "",
+ "port": "",
+ "pathname": "/pa/i",
+ "search": "",
+ "hash": ""
+ },
+ {
+ "input": "i",
+ "base": "sc://ho/pa",
+ "href": "sc://ho/i",
+ "origin": "null",
+ "protocol": "sc:",
+ "username": "",
+ "password": "",
+ "host": "ho",
+ "hostname": "ho",
+ "port": "",
+ "pathname": "/i",
+ "search": "",
+ "hash": ""
+ },
+ {
+ "input": "i",
+ "base": "sc:///pa/pa",
+ "href": "sc:///pa/i",
+ "origin": "null",
+ "protocol": "sc:",
+ "username": "",
+ "password": "",
+ "host": "",
+ "hostname": "",
+ "port": "",
+ "pathname": "/pa/i",
+ "search": "",
+ "hash": ""
+ },
+ {
+ "input": "../i",
+ "base": "sc:sd",
+ "failure": true
+ },
+ {
+ "input": "../i",
+ "base": "sc:sd/sd",
+ "failure": true
+ },
+ {
+ "input": "../i",
+ "base": "sc:/pa/pa",
+ "href": "sc:/i",
+ "origin": "null",
+ "protocol": "sc:",
+ "username": "",
+ "password": "",
+ "host": "",
+ "hostname": "",
+ "port": "",
+ "pathname": "/i",
+ "search": "",
+ "hash": ""
+ },
+ {
+ "input": "../i",
+ "base": "sc://ho/pa",
+ "href": "sc://ho/i",
+ "origin": "null",
+ "protocol": "sc:",
+ "username": "",
+ "password": "",
+ "host": "ho",
+ "hostname": "ho",
+ "port": "",
+ "pathname": "/i",
+ "search": "",
+ "hash": ""
+ },
+ {
+ "input": "../i",
+ "base": "sc:///pa/pa",
+ "href": "sc:///i",
+ "origin": "null",
+ "protocol": "sc:",
+ "username": "",
+ "password": "",
+ "host": "",
+ "hostname": "",
+ "port": "",
+ "pathname": "/i",
+ "search": "",
+ "hash": ""
+ },
+ {
+ "input": "/i",
+ "base": "sc:sd",
+ "failure": true
+ },
+ {
+ "input": "/i",
+ "base": "sc:sd/sd",
+ "failure": true
+ },
+ {
+ "input": "/i",
+ "base": "sc:/pa/pa",
+ "href": "sc:/i",
+ "origin": "null",
+ "protocol": "sc:",
+ "username": "",
+ "password": "",
+ "host": "",
+ "hostname": "",
+ "port": "",
+ "pathname": "/i",
+ "search": "",
+ "hash": ""
+ },
+ {
+ "input": "/i",
+ "base": "sc://ho/pa",
+ "href": "sc://ho/i",
+ "origin": "null",
+ "protocol": "sc:",
+ "username": "",
+ "password": "",
+ "host": "ho",
+ "hostname": "ho",
+ "port": "",
+ "pathname": "/i",
+ "search": "",
+ "hash": ""
+ },
+ {
+ "input": "/i",
+ "base": "sc:///pa/pa",
+ "href": "sc:///i",
+ "origin": "null",
+ "protocol": "sc:",
+ "username": "",
+ "password": "",
+ "host": "",
+ "hostname": "",
+ "port": "",
+ "pathname": "/i",
+ "search": "",
+ "hash": ""
+ },
+ {
+ "input": "?i",
+ "base": "sc:sd",
+ "failure": true
+ },
+ {
+ "input": "?i",
+ "base": "sc:sd/sd",
+ "failure": true
+ },
+ {
+ "input": "?i",
+ "base": "sc:/pa/pa",
+ "href": "sc:/pa/pa?i",
+ "origin": "null",
+ "protocol": "sc:",
+ "username": "",
+ "password": "",
+ "host": "",
+ "hostname": "",
+ "port": "",
+ "pathname": "/pa/pa",
+ "search": "?i",
+ "hash": ""
+ },
+ {
+ "input": "?i",
+ "base": "sc://ho/pa",
+ "href": "sc://ho/pa?i",
+ "origin": "null",
+ "protocol": "sc:",
+ "username": "",
+ "password": "",
+ "host": "ho",
+ "hostname": "ho",
+ "port": "",
+ "pathname": "/pa",
+ "search": "?i",
+ "hash": ""
+ },
+ {
+ "input": "?i",
+ "base": "sc:///pa/pa",
+ "href": "sc:///pa/pa?i",
+ "origin": "null",
+ "protocol": "sc:",
+ "username": "",
+ "password": "",
+ "host": "",
+ "hostname": "",
+ "port": "",
+ "pathname": "/pa/pa",
+ "search": "?i",
+ "hash": ""
+ },
+ {
+ "input": "#i",
+ "base": "sc:sd",
+ "href": "sc:sd#i",
+ "origin": "null",
+ "protocol": "sc:",
+ "username": "",
+ "password": "",
+ "host": "",
+ "hostname": "",
+ "port": "",
+ "pathname": "sd",
+ "search": "",
+ "hash": "#i"
+ },
+ {
+ "input": "#i",
+ "base": "sc:sd/sd",
+ "href": "sc:sd/sd#i",
+ "origin": "null",
+ "protocol": "sc:",
+ "username": "",
+ "password": "",
+ "host": "",
+ "hostname": "",
+ "port": "",
+ "pathname": "sd/sd",
+ "search": "",
+ "hash": "#i"
+ },
+ {
+ "input": "#i",
+ "base": "sc:/pa/pa",
+ "href": "sc:/pa/pa#i",
+ "origin": "null",
+ "protocol": "sc:",
+ "username": "",
+ "password": "",
+ "host": "",
+ "hostname": "",
+ "port": "",
+ "pathname": "/pa/pa",
+ "search": "",
+ "hash": "#i"
+ },
+ {
+ "input": "#i",
+ "base": "sc://ho/pa",
+ "href": "sc://ho/pa#i",
+ "origin": "null",
+ "protocol": "sc:",
+ "username": "",
+ "password": "",
+ "host": "ho",
+ "hostname": "ho",
+ "port": "",
+ "pathname": "/pa",
+ "search": "",
+ "hash": "#i"
+ },
+ {
+ "input": "#i",
+ "base": "sc:///pa/pa",
+ "href": "sc:///pa/pa#i",
+ "origin": "null",
+ "protocol": "sc:",
+ "username": "",
+ "password": "",
+ "host": "",
+ "hostname": "",
+ "port": "",
+ "pathname": "/pa/pa",
+ "search": "",
+ "hash": "#i"
+ },
+ "# make sure that relative URL logic works on known typically non-relative schemes too",
+ {
+ "input": "about:/../",
+ "base": "about:blank",
+ "href": "about:/",
+ "origin": "null",
+ "protocol": "about:",
+ "username": "",
+ "password": "",
+ "host": "",
+ "hostname": "",
+ "port": "",
+ "pathname": "/",
+ "search": "",
+ "hash": ""
+ },
+ {
+ "input": "data:/../",
+ "base": "about:blank",
+ "href": "data:/",
+ "origin": "null",
+ "protocol": "data:",
+ "username": "",
+ "password": "",
+ "host": "",
+ "hostname": "",
+ "port": "",
+ "pathname": "/",
+ "search": "",
+ "hash": ""
+ },
+ {
+ "input": "javascript:/../",
+ "base": "about:blank",
+ "href": "javascript:/",
+ "origin": "null",
+ "protocol": "javascript:",
+ "username": "",
+ "password": "",
+ "host": "",
+ "hostname": "",
+ "port": "",
+ "pathname": "/",
+ "search": "",
+ "hash": ""
+ },
+ {
+ "input": "mailto:/../",
+ "base": "about:blank",
+ "href": "mailto:/",
+ "origin": "null",
+ "protocol": "mailto:",
+ "username": "",
+ "password": "",
+ "host": "",
+ "hostname": "",
+ "port": "",
+ "pathname": "/",
+ "search": "",
+ "hash": ""
+ },
+ "# unknown schemes and non-ASCII domains",
+ {
+ "input": "sc://ñ.test/",
+ "base": "about:blank",
+ "href": "sc://xn--ida.test/",
+ "origin": "null",
+ "protocol": "sc:",
+ "username": "",
+ "password": "",
+ "host": "xn--ida.test",
+ "hostname": "xn--ida.test",
+ "port": "",
+ "pathname": "/",
+ "search": "",
+ "hash": ""
+ },
+ "# unknown schemes and backslashes",
+ {
+ "input": "sc:\\../",
+ "base": "about:blank",
+ "href": "sc:\\../",
+ "origin": "null",
+ "protocol": "sc:",
+ "username": "",
+ "password": "",
+ "host": "",
+ "hostname": "",
+ "port": "",
+ "pathname": "\\../",
+ "search": "",
+ "hash": ""
+ },
+ "# unknown scheme with path looking like a password",
+ {
+ "input": "sc::a@example.net",
+ "base": "about:blank",
+ "href": "sc::a@example.net",
+ "origin": "null",
+ "protocol": "sc:",
+ "username": "",
+ "password": "",
+ "host": "",
+ "hostname": "",
+ "port": "",
+ "pathname": ":a@example.net",
+ "search": "",
+ "hash": ""
+ },
+ "# tests from jsdom/whatwg-url designed for code coverage",
+ {
+ "input": "http://127.0.0.1:10100/relative_import.html",
+ "base": "about:blank",
+ "href": "http://127.0.0.1:10100/relative_import.html",
+ "origin": "http://127.0.0.1:10100",
+ "protocol": "http:",
+ "username": "",
+ "password": "",
+ "host": "127.0.0.1:10100",
+ "hostname": "127.0.0.1",
+ "port": "10100",
+ "pathname": "/relative_import.html",
+ "search": "",
+ "hash": ""
+ },
+ {
+ "input": "http://facebook.com/?foo=%7B%22abc%22",
+ "base": "about:blank",
+ "href": "http://facebook.com/?foo=%7B%22abc%22",
+ "origin": "http://facebook.com",
+ "protocol": "http:",
+ "username": "",
+ "password": "",
+ "host": "facebook.com",
+ "hostname": "facebook.com",
+ "port": "",
+ "pathname": "/",
+ "search": "?foo=%7B%22abc%22",
+ "hash": ""
+ },
+ {
+ "input": "https://localhost:3000/jqueryui@1.2.3",
+ "base": "about:blank",
+ "href": "https://localhost:3000/jqueryui@1.2.3",
+ "origin": "https://localhost:3000",
+ "protocol": "https:",
+ "username": "",
+ "password": "",
+ "host": "localhost:3000",
+ "hostname": "localhost",
+ "port": "3000",
+ "pathname": "/jqueryui@1.2.3",
+ "search": "",
+ "hash": ""
+ },
+ "# tab/LF/CR",
+ {
+ "input": "h\tt\nt\rp://h\to\ns\rt:9\t0\n0\r0/p\ta\nt\rh?q\tu\ne\rry#f\tr\na\rg",
+ "base": "about:blank",
+ "href": "http://host:9000/path?query#frag",
+ "origin": "http://host:9000",
+ "protocol": "http:",
+ "username": "",
+ "password": "",
+ "host": "host:9000",
+ "hostname": "host",
+ "port": "9000",
+ "pathname": "/path",
+ "search": "?query",
+ "hash": "#frag"
+ },
+ "# Stringification of URL.searchParams",
+ {
+ "input": "?a=b&c=d",
+ "base": "http://example.org/foo/bar",
+ "href": "http://example.org/foo/bar?a=b&c=d",
+ "origin": "http://example.org",
+ "protocol": "http:",
+ "username": "",
+ "password": "",
+ "host": "example.org",
+ "hostname": "example.org",
+ "port": "",
+ "pathname": "/foo/bar",
+ "search": "?a=b&c=d",
+ "searchParams": "a=b&c=d",
+ "hash": ""
+ },
+ {
+ "input": "??a=b&c=d",
+ "base": "http://example.org/foo/bar",
+ "href": "http://example.org/foo/bar??a=b&c=d",
+ "origin": "http://example.org",
+ "protocol": "http:",
+ "username": "",
+ "password": "",
+ "host": "example.org",
+ "hostname": "example.org",
+ "port": "",
+ "pathname": "/foo/bar",
+ "search": "??a=b&c=d",
+ "searchParams": "%3Fa=b&c=d",
+ "hash": ""
+ }
+]