Skip to content

Commit

Permalink
Add (de)serialization of internal representation, to avoid re-parsing.
Browse files Browse the repository at this point in the history
Fixes #252, closes #254.
  • Loading branch information
Manishearth authored and SimonSapin committed Dec 19, 2016
1 parent cf8ca41 commit 78ccfaf
Show file tree
Hide file tree
Showing 7 changed files with 122 additions and 23 deletions.
3 changes: 2 additions & 1 deletion Cargo.toml
Original file line number Diff line number Diff line change
Expand Up @@ -27,6 +27,7 @@ test = false
[dev-dependencies]
rustc-test = "0.1"
rustc-serialize = "0.3"
bincode = {version = "0.6.0", features = ["serde"]}

[features]
query_encoding = ["encoding"]
Expand All @@ -38,4 +39,4 @@ heapsize = {version = ">=0.1.1, <0.4", optional = true}
idna = { version = "0.1.0", path = "./idna" }
matches = "0.1"
rustc-serialize = {version = "0.3", optional = true}
serde = {version = ">=0.6.1, <0.9", optional = true}
serde = {version = "0.8.20", optional = true}
3 changes: 1 addition & 2 deletions Makefile
Original file line number Diff line number Diff line change
@@ -1,6 +1,5 @@
test:
cargo test --features "query_encoding serde rustc-serialize"
[ x$$TRAVIS_RUST_VERSION != xnightly ] || cargo test --features heapsize
cargo test --features "query_encoding serde rustc-serialize heapsize"
(cd idna && cargo test)

.PHONY: test
32 changes: 32 additions & 0 deletions src/host.rs
Original file line number Diff line number Diff line change
Expand Up @@ -27,6 +27,38 @@ pub enum HostInternal {
#[cfg(feature = "heapsize")]
known_heap_size!(0, HostInternal);

#[cfg(feature="serde")]
impl ::serde::Serialize for HostInternal {
fn serialize<S>(&self, serializer: &mut S) -> Result<(), S::Error> where S: ::serde::Serializer {
// This doesn’t use `derive` because that involves
// large dependencies (that take a long time to build), and
// either Macros 1.1 which are not stable yet or a cumbersome build script.
//
// Implementing `Serializer` correctly for an enum is tricky,
// so let’s use existing enums that already do.
use std::net::IpAddr;
match *self {
HostInternal::None => None,
HostInternal::Domain => Some(None),
HostInternal::Ipv4(addr) => Some(Some(IpAddr::V4(addr))),
HostInternal::Ipv6(addr) => Some(Some(IpAddr::V6(addr))),
}.serialize(serializer)
}
}

#[cfg(feature="serde")]
impl ::serde::Deserialize for HostInternal {
fn deserialize<D>(deserializer: &mut D) -> Result<Self, D::Error> where D: ::serde::Deserializer {
use std::net::IpAddr;
Ok(match try!(::serde::Deserialize::deserialize(deserializer)) {
None => HostInternal::None,
Some(None) => HostInternal::Domain,
Some(Some(IpAddr::V4(addr))) => HostInternal::Ipv4(addr),
Some(Some(IpAddr::V6(addr))) => HostInternal::Ipv6(addr),
})
}
}

impl<S> From<Host<S>> for HostInternal {
fn from(host: Host<S>) -> HostInternal {
match host {
Expand Down
65 changes: 61 additions & 4 deletions src/lib.rs
Original file line number Diff line number Diff line change
Expand Up @@ -318,11 +318,12 @@ impl Url {
/// This checks each of these invariants and panic if one is not met.
/// This is for testing rust-url itself.
#[doc(hidden)]
pub fn assert_invariants(&self) {
pub fn check_invariants(&self) -> Result<(), String> {
macro_rules! assert {
($x: expr) => {
if !$x {
panic!("!( {} ) for URL {:?}", stringify!($x), self.serialization)
return Err(format!("!( {} ) for URL {:?}",
stringify!($x), self.serialization))
}
}
}
Expand All @@ -333,8 +334,9 @@ impl Url {
let a = $a;
let b = $b;
if a != b {
panic!("{:?} != {:?} ({} != {}) for URL {:?}",
a, b, stringify!($a), stringify!($b), self.serialization)
return Err(format!("{:?} != {:?} ({} != {}) for URL {:?}",
a, b, stringify!($a), stringify!($b),
self.serialization))
}
}
}
Expand Down Expand Up @@ -415,6 +417,7 @@ impl Url {
assert_eq!(self.path_start, other.path_start);
assert_eq!(self.query_start, other.query_start);
assert_eq!(self.fragment_start, other.fragment_start);
Ok(())
}

/// Return the origin of this URL (https://url.spec.whatwg.org/#origin)
Expand Down Expand Up @@ -1341,6 +1344,60 @@ impl Url {
Ok(url)
}

/// Serialize with Serde using the internal representation of the `Url` struct.
///
/// The corresponding `deserialize_internal` method sacrifices some invariant-checking
/// for speed, compared to the `Deserialize` trait impl.
///
/// This method is only available if the `serde` Cargo feature is enabled.
#[cfg(feature = "serde")]
#[deny(unused)]
pub fn serialize_internal<S>(&self, serializer: &mut S) -> Result<(), S::Error> where S: serde::Serializer {
use serde::Serialize;
// Destructuring first lets us ensure that adding or removing fields forces this method
// to be updated
let Url { ref serialization, ref scheme_end,
ref username_end, ref host_start,
ref host_end, ref host, ref port,
ref path_start, ref query_start,
ref fragment_start} = *self;
(serialization, scheme_end, username_end,
host_start, host_end, host, port, path_start,
query_start, fragment_start).serialize(serializer)
}

/// Serialize with Serde using the internal representation of the `Url` struct.
///
/// The corresponding `deserialize_internal` method sacrifices some invariant-checking
/// for speed, compared to the `Deserialize` trait impl.
///
/// This method is only available if the `serde` Cargo feature is enabled.
#[cfg(feature = "serde")]
#[deny(unused)]
pub fn deserialize_internal<D>(deserializer: &mut D) -> Result<Self, D::Error> where D: serde::Deserializer {
use serde::{Deserialize, Error};
let (serialization, scheme_end, username_end,
host_start, host_end, host, port, path_start,
query_start, fragment_start) = try!(Deserialize::deserialize(deserializer));
let url = Url {
serialization: serialization,
scheme_end: scheme_end,
username_end: username_end,
host_start: host_start,
host_end: host_end,
host: host,
port: port,
path_start: path_start,
query_start: query_start,
fragment_start: fragment_start
};
if cfg!(debug_assertions) {
try!(url.check_invariants().map_err(|ref reason| Error::invalid_value(&reason)))
}
Ok(url)
}


/// Assuming the URL is in the `file` scheme or similar,
/// convert its path to an absolute `std::path::Path`.
///
Expand Down
2 changes: 1 addition & 1 deletion src/path_segments.rs
Original file line number Diff line number Diff line change
Expand Up @@ -181,7 +181,7 @@ impl<'a> PathSegmentsMut<'a> {
/// For internal testing, not part of the public API.
#[doc(hidden)]
pub fn assert_url_invariants(&mut self) -> &mut Self {
self.url.assert_invariants();
self.url.check_invariants();
self
}
}
16 changes: 13 additions & 3 deletions tests/data.rs
Original file line number Diff line number Diff line change
Expand Up @@ -15,6 +15,16 @@ extern crate url;
use rustc_serialize::json::{self, Json};
use url::{Url, quirks};

fn check_invariants(url: &Url) {
url.check_invariants().unwrap();
#[cfg(feature="serde")] {
extern crate bincode;
let bytes = bincode::serde::serialize(url, bincode::SizeLimit::Infinite).unwrap();
let new_url: Url = bincode::serde::deserialize(&bytes).unwrap();
assert_eq!(url, &new_url);
}
}


fn run_parsing(input: String, base: String, expected: Result<ExpectedAttributes, ()>) {
let base = match Url::parse(&base) {
Expand All @@ -28,7 +38,7 @@ fn run_parsing(input: String, base: String, expected: Result<ExpectedAttributes,
(Ok(_), Err(())) => panic!("Expected a parse error for URL {:?}", input),
};

url.assert_invariants();
check_invariants(&url);

macro_rules! assert_eq {
($expected: expr, $got: expr) => {
Expand Down Expand Up @@ -144,11 +154,11 @@ fn collect_setters<F>(add_test: &mut F) where F: FnMut(String, test::TestFn) {
let mut expected = test.take("expected").unwrap();
add_test(name, test::TestFn::dyn_test_fn(move || {
let mut url = Url::parse(&href).unwrap();
url.assert_invariants();
check_invariants(&url);
let _ = quirks::$setter(&mut url, &new_value);
assert_attributes!(url, expected,
href protocol username password host hostname port pathname search hash);
url.assert_invariants();
check_invariants(&url);
}))
}
}}
Expand Down
24 changes: 12 additions & 12 deletions tests/unit.rs
Original file line number Diff line number Diff line change
Expand Up @@ -250,13 +250,13 @@ fn test_form_serialize() {
fn issue_25() {
let filename = if cfg!(windows) { r"C:\run\pg.sock" } else { "/run/pg.sock" };
let mut url = Url::from_file_path(filename).unwrap();
url.assert_invariants();
url.check_invariants().unwrap();
url.set_scheme("postgres").unwrap();
url.assert_invariants();
url.check_invariants().unwrap();
url.set_host(Some("")).unwrap();
url.assert_invariants();
url.check_invariants().unwrap();
url.set_username("me").unwrap();
url.assert_invariants();
url.check_invariants().unwrap();
let expected = format!("postgres://me@/{}run/pg.sock", if cfg!(windows) { "C:/" } else { "" });
assert_eq!(url.as_str(), expected);
}
Expand All @@ -268,15 +268,15 @@ fn issue_61() {
url.set_scheme("https").unwrap();
assert_eq!(url.port(), None);
assert_eq!(url.port_or_known_default(), Some(443));
url.assert_invariants();
url.check_invariants().unwrap();
}

#[test]
#[cfg(not(windows))]
/// https://github.com/servo/rust-url/issues/197
fn issue_197() {
let mut url = Url::from_file_path("/").expect("Failed to parse path");
url.assert_invariants();
url.check_invariants().unwrap();
assert_eq!(url, Url::parse("file:///").expect("Failed to parse path + protocol"));
url.path_segments_mut().expect("path_segments_mut").pop_if_empty();
}
Expand All @@ -290,9 +290,9 @@ fn issue_241() {
/// https://github.com/servo/rust-url/issues/222
fn append_trailing_slash() {
let mut url: Url = "http://localhost:6767/foo/bar?a=b".parse().unwrap();
url.assert_invariants();
url.check_invariants().unwrap();
url.path_segments_mut().unwrap().push("");
url.assert_invariants();
url.check_invariants().unwrap();
assert_eq!(url.to_string(), "http://localhost:6767/foo/bar/?a=b");
}

Expand All @@ -301,20 +301,20 @@ fn append_trailing_slash() {
fn extend_query_pairs_then_mutate() {
let mut url: Url = "http://localhost:6767/foo/bar".parse().unwrap();
url.query_pairs_mut().extend_pairs(vec![ ("auth", "my-token") ].into_iter());
url.assert_invariants();
url.check_invariants().unwrap();
assert_eq!(url.to_string(), "http://localhost:6767/foo/bar?auth=my-token");
url.path_segments_mut().unwrap().push("some_other_path");
url.assert_invariants();
url.check_invariants().unwrap();
assert_eq!(url.to_string(), "http://localhost:6767/foo/bar/some_other_path?auth=my-token");
}

#[test]
/// https://github.com/servo/rust-url/issues/222
fn append_empty_segment_then_mutate() {
let mut url: Url = "http://localhost:6767/foo/bar?a=b".parse().unwrap();
url.assert_invariants();
url.check_invariants().unwrap();
url.path_segments_mut().unwrap().push("").pop();
url.assert_invariants();
url.check_invariants().unwrap();
assert_eq!(url.to_string(), "http://localhost:6767/foo/bar?a=b");
}

Expand Down

0 comments on commit 78ccfaf

Please sign in to comment.