Skip to content

Commit a9d108a

Browse files
committed
Speed up noop registry updates with GitHub
This commit adds supports to registry index updates to use GitHub's HTTP API [1] which is purportedly [2] much faster than doing a git clone, and emprically that appears to be the case. This logic kicks in by looking at the URL of a registry's index, and if it looks exactly like `github.com/$user/$repo` then we'll attempt to use GitHub's API, otherwise we always fall back to a git update. This behavior may *slow down* registry updates which actually need to download information as an extra HTTP request is performed to figure out that we need to perform a git fetch, but hopefully that won't actually be the case much of the time! [1]: https://developer.github.com/v3/repos/commits/#get-the-sha-1-of-a-commit-reference [2]: https://developer.github.com/changes/2016-02-24-commit-reference-sha-api/
1 parent c917e94 commit a9d108a

File tree

1 file changed

+69
-2
lines changed

1 file changed

+69
-2
lines changed

src/cargo/sources/registry/remote.rs

+69-2
Original file line numberDiff line numberDiff line change
@@ -2,10 +2,11 @@ use std::io::SeekFrom;
22
use std::io::prelude::*;
33
use std::path::Path;
44

5-
use curl::easy::Easy;
5+
use curl::easy::{Easy, List};
66
use git2;
7-
use rustc_serialize::json;
87
use rustc_serialize::hex::ToHex;
8+
use rustc_serialize::json;
9+
use url::Url;
910

1011
use core::{PackageId, SourceId};
1112
use ops;
@@ -70,11 +71,30 @@ impl<'cfg> RegistryData for RemoteRegistry<'cfg> {
7071

7172
try!(self.config.shell().status("Updating",
7273
format!("registry `{}`", self.source_id.url())));
74+
7375
let repo = try!(git2::Repository::open(path).or_else(|_| {
7476
let _ = lock.remove_siblings();
7577
git2::Repository::init(path)
7678
}));
7779

80+
if self.source_id.url().host_str() == Some("github.com") {
81+
if let Ok(oid) = repo.refname_to_id("refs/heads/master") {
82+
let handle = match self.handle {
83+
Some(ref mut handle) => handle,
84+
None => {
85+
self.handle = Some(try!(ops::http_handle(self.config)));
86+
self.handle.as_mut().unwrap()
87+
}
88+
};
89+
debug!("attempting github fast path for {}",
90+
self.source_id.url());
91+
if github_up_to_date(handle, &self.source_id.url(), &oid) {
92+
return Ok(())
93+
}
94+
debug!("fast path failed, falling back to a git fetch");
95+
}
96+
}
97+
7898
// git fetch origin
7999
let url = self.source_id.url().to_string();
80100
let refspec = "refs/heads/*:refs/remotes/origin/*";
@@ -151,3 +171,50 @@ impl<'cfg> RegistryData for RemoteRegistry<'cfg> {
151171
Ok(dst)
152172
}
153173
}
174+
175+
/// Updating the index is done pretty regularly so we want it to be as fast as
176+
/// possible. For registries hosted on github (like the crates.io index) there's
177+
/// a fast path available to use [1] to tell us that there's no updates to be
178+
/// made.
179+
///
180+
/// This function will attempt to hit that fast path and verify that the `oid`
181+
/// is actually the current `master` branch of the repository. If `true` is
182+
/// returned then no update needs to be performed, but if `false` is returned
183+
/// then the standard update logic still needs to happen.
184+
///
185+
/// [1]: https://developer.github.com/v3/repos/commits/#get-the-sha-1-of-a-commit-reference
186+
///
187+
/// Note that this function should never cause an actual failure because it's
188+
/// just a fast path. As a result all errors are ignored in this function and we
189+
/// just return a `bool`. Any real errors will be reported through the normal
190+
/// update path above.
191+
fn github_up_to_date(handle: &mut Easy, url: &Url, oid: &git2::Oid) -> bool {
192+
macro_rules! try {
193+
($e:expr) => (match $e {
194+
Some(e) => e,
195+
None => return false,
196+
})
197+
}
198+
199+
// This expects github urls in the form `github.com/user/repo` and nothing
200+
// else
201+
let mut pieces = try!(url.path_segments());
202+
let username = try!(pieces.next());
203+
let repo = try!(pieces.next());
204+
if pieces.next().is_some() {
205+
return false
206+
}
207+
208+
let url = format!("https://api.github.com/repos/{}/{}/commits/master",
209+
username, repo);
210+
try!(handle.get(true).ok());
211+
try!(handle.url(&url).ok());
212+
try!(handle.useragent("cargo").ok());
213+
let mut headers = List::new();
214+
try!(headers.append("Accept: application/vnd.github.3.sha").ok());
215+
try!(headers.append(&format!("If-None-Match: \"{}\"", oid)).ok());
216+
try!(handle.http_headers(headers).ok());
217+
try!(handle.perform().ok());
218+
219+
try!(handle.response_code().ok()) == 304
220+
}

0 commit comments

Comments
 (0)