Skip to content

Commit 36053de

Browse files
committed
SHA-256 support
1 parent 4231106 commit 36053de

File tree

1 file changed

+96
-26
lines changed

1 file changed

+96
-26
lines changed

src/cargo/sources/git/utils.rs

+96-26
Original file line numberDiff line numberDiff line change
@@ -7,14 +7,15 @@ use crate::util::{network, Config, IntoUrl, MetricsCounter, Progress};
77
use anyhow::{anyhow, Context as _};
88
use cargo_util::{paths, ProcessBuilder};
99
use curl::easy::List;
10-
use git2::{self, ErrorClass, ObjectType};
10+
use git2::{self, ErrorClass, ObjectType, Oid};
1111
use log::{debug, info};
1212
use serde::ser;
1313
use serde::Serialize;
1414
use std::env;
1515
use std::fmt;
1616
use std::path::{Path, PathBuf};
1717
use std::process::Command;
18+
use std::str;
1819
use std::time::{Duration, Instant};
1920
use url::Url;
2021

@@ -781,11 +782,15 @@ pub fn fetch(
781782

782783
// If we're fetching from GitHub, attempt GitHub's special fast path for
783784
// testing if we've already got an up-to-date copy of the repository
784-
match github_up_to_date(repo, url, reference, config) {
785-
Ok(true) => return Ok(()),
786-
Ok(false) => {}
787-
Err(e) => debug!("failed to check github {:?}", e),
788-
}
785+
let oid_to_fetch = match github_fast_path(repo, url, reference, config) {
786+
Ok(FastPathRev::UpToDate) => return Ok(()),
787+
Ok(FastPathRev::NeedsFetch(rev)) => Some(rev),
788+
Ok(FastPathRev::Indeterminate) => None,
789+
Err(e) => {
790+
debug!("failed to check github {:?}", e);
791+
None
792+
}
793+
};
789794

790795
// We reuse repositories quite a lot, so before we go through and update the
791796
// repo check to see if it's a little too old and could benefit from a gc.
@@ -815,11 +820,10 @@ pub fn fetch(
815820
}
816821

817822
GitReference::Rev(rev) => {
818-
let is_github = || Url::parse(url).map_or(false, |url| is_github(&url));
819823
if rev.starts_with("refs/") {
820824
refspecs.push(format!("+{0}:{0}", rev));
821-
} else if is_github() && is_long_hash(rev) {
822-
refspecs.push(format!("+{0}:refs/commit/{0}", rev));
825+
} else if let Some(oid_to_fetch) = oid_to_fetch {
826+
refspecs.push(format!("+{0}:refs/commit/{0}", oid_to_fetch));
823827
} else {
824828
// We don't know what the rev will point to. To handle this
825829
// situation we fetch all branches and tags, and then we pray
@@ -1016,45 +1020,79 @@ fn init(path: &Path, bare: bool) -> CargoResult<git2::Repository> {
10161020
Ok(git2::Repository::init_opts(&path, &opts)?)
10171021
}
10181022

1023+
enum FastPathRev {
1024+
/// The local rev (determined by `reference.resolve(repo)`) is already up to
1025+
/// date with what this rev resolves to on GitHub's server.
1026+
UpToDate,
1027+
/// The following SHA must be fetched in order for the local rev to become
1028+
/// up to date.
1029+
NeedsFetch(Oid),
1030+
/// Don't know whether local rev is up to date. We'll fetch _all_ branches
1031+
/// and tags from the server and see what happens.
1032+
Indeterminate,
1033+
}
1034+
10191035
/// Updating the index is done pretty regularly so we want it to be as fast as
10201036
/// possible. For registries hosted on GitHub (like the crates.io index) there's
10211037
/// a fast path available to use [1] to tell us that there's no updates to be
10221038
/// made.
10231039
///
10241040
/// This function will attempt to hit that fast path and verify that the `oid`
1025-
/// is actually the current branch of the repository. If `true` is returned then
1026-
/// no update needs to be performed, but if `false` is returned then the
1027-
/// standard update logic still needs to happen.
1041+
/// is actually the current branch of the repository.
10281042
///
10291043
/// [1]: https://developer.github.com/v3/repos/commits/#get-the-sha-1-of-a-commit-reference
10301044
///
10311045
/// Note that this function should never cause an actual failure because it's
10321046
/// just a fast path. As a result all errors are ignored in this function and we
10331047
/// just return a `bool`. Any real errors will be reported through the normal
10341048
/// update path above.
1035-
fn github_up_to_date(
1049+
fn github_fast_path(
10361050
repo: &mut git2::Repository,
10371051
url: &str,
10381052
reference: &GitReference,
10391053
config: &Config,
1040-
) -> CargoResult<bool> {
1054+
) -> CargoResult<FastPathRev> {
10411055
let url = Url::parse(url)?;
10421056
if !is_github(&url) {
1043-
return Ok(false);
1057+
return Ok(FastPathRev::Indeterminate);
10441058
}
10451059

1060+
let local_object = reference.resolve(repo).ok();
1061+
10461062
let github_branch_name = match reference {
10471063
GitReference::Branch(branch) => branch,
10481064
GitReference::Tag(tag) => tag,
10491065
GitReference::DefaultBranch => "HEAD",
10501066
GitReference::Rev(rev) => {
10511067
if rev.starts_with("refs/") {
10521068
rev
1053-
} else if is_long_hash(rev) {
1054-
return Ok(reference.resolve(repo).is_ok());
1069+
} else if looks_like_commit_hash(rev) {
1070+
// `revparse_single` (used by `resolve`) is the only way to turn
1071+
// short hash -> long hash, but it also parses other things,
1072+
// like branch and tag names, which might coincidentally be
1073+
// valid hex.
1074+
//
1075+
// We only return early if `rev` is a prefix of the object found
1076+
// by `revparse_single`. Don't bother talking to GitHub in that
1077+
// case, since commit hashes are permanent. If a commit with the
1078+
// requested hash is already present in the local clone, its
1079+
// contents must be the same as what is on the server for that
1080+
// hash.
1081+
//
1082+
// If `rev` is not found locally by `revparse_single`, we'll
1083+
// need GitHub to resolve it and get a hash. If `rev` is found
1084+
// but is not a short hash of the found object, it's probably a
1085+
// branch and we also need to get a hash from GitHub, in case
1086+
// the branch has moved.
1087+
if let Some(local_object) = local_object {
1088+
if is_short_hash_of(rev, local_object) {
1089+
return Ok(FastPathRev::UpToDate);
1090+
}
1091+
}
1092+
rev
10551093
} else {
10561094
debug!("can't use github fast path with `rev = \"{}\"`", rev);
1057-
return Ok(false);
1095+
return Ok(FastPathRev::Indeterminate);
10581096
}
10591097
}
10601098
};
@@ -1087,18 +1125,50 @@ fn github_up_to_date(
10871125
handle.get(true)?;
10881126
handle.url(&url)?;
10891127
handle.useragent("cargo")?;
1090-
let mut headers = List::new();
1091-
headers.append("Accept: application/vnd.github.3.sha")?;
1092-
headers.append(&format!("If-None-Match: \"{}\"", reference.resolve(repo)?))?;
1093-
handle.http_headers(headers)?;
1094-
handle.perform()?;
1095-
Ok(handle.response_code()? == 304)
1128+
handle.http_headers({
1129+
let mut headers = List::new();
1130+
headers.append("Accept: application/vnd.github.3.sha")?;
1131+
if let Some(local_object) = local_object {
1132+
headers.append(&format!("If-None-Match: \"{}\"", local_object))?;
1133+
}
1134+
headers
1135+
})?;
1136+
1137+
let mut response_body = Vec::new();
1138+
let mut transfer = handle.transfer();
1139+
transfer.write_function(|data| {
1140+
response_body.extend_from_slice(data);
1141+
Ok(data.len())
1142+
})?;
1143+
transfer.perform()?;
1144+
drop(transfer); // end borrow of handle so that response_code can be called
1145+
1146+
let response_code = handle.response_code()?;
1147+
if response_code == 304 {
1148+
Ok(FastPathRev::UpToDate)
1149+
} else if response_code == 200 {
1150+
let oid_to_fetch = str::from_utf8(&response_body)?.parse::<Oid>()?;
1151+
Ok(FastPathRev::NeedsFetch(oid_to_fetch))
1152+
} else {
1153+
// Usually response_code == 404 if the repository does not exist, and
1154+
// response_code == 422 if exists but GitHub is unable to resolve the
1155+
// requested rev.
1156+
Ok(FastPathRev::Indeterminate)
1157+
}
10961158
}
10971159

10981160
fn is_github(url: &Url) -> bool {
10991161
url.host_str() == Some("github.com")
11001162
}
11011163

1102-
fn is_long_hash(rev: &str) -> bool {
1103-
rev.len() == 40 && rev.chars().all(|ch| ch.is_ascii_hexdigit())
1164+
fn looks_like_commit_hash(rev: &str) -> bool {
1165+
rev.len() >= 7 && rev.chars().all(|ch| ch.is_ascii_hexdigit())
1166+
}
1167+
1168+
fn is_short_hash_of(rev: &str, oid: Oid) -> bool {
1169+
let long_hash = oid.to_string();
1170+
match long_hash.get(..rev.len()) {
1171+
Some(truncated_long_hash) => truncated_long_hash.eq_ignore_ascii_case(rev),
1172+
None => false,
1173+
}
11041174
}

0 commit comments

Comments
 (0)