@@ -7,14 +7,15 @@ use crate::util::{network, Config, IntoUrl, MetricsCounter, Progress};
7
7
use anyhow:: { anyhow, Context as _} ;
8
8
use cargo_util:: { paths, ProcessBuilder } ;
9
9
use curl:: easy:: List ;
10
- use git2:: { self , ErrorClass , ObjectType } ;
10
+ use git2:: { self , ErrorClass , ObjectType , Oid } ;
11
11
use log:: { debug, info} ;
12
12
use serde:: ser;
13
13
use serde:: Serialize ;
14
14
use std:: env;
15
15
use std:: fmt;
16
16
use std:: path:: { Path , PathBuf } ;
17
17
use std:: process:: Command ;
18
+ use std:: str;
18
19
use std:: time:: { Duration , Instant } ;
19
20
use url:: Url ;
20
21
@@ -781,11 +782,15 @@ pub fn fetch(
781
782
782
783
// If we're fetching from GitHub, attempt GitHub's special fast path for
783
784
// testing if we've already got an up-to-date copy of the repository
784
- match github_up_to_date ( repo, url, reference, config) {
785
- Ok ( true ) => return Ok ( ( ) ) ,
786
- Ok ( false ) => { }
787
- Err ( e) => debug ! ( "failed to check github {:?}" , e) ,
788
- }
785
+ let oid_to_fetch = match github_fast_path ( repo, url, reference, config) {
786
+ Ok ( FastPathRev :: UpToDate ) => return Ok ( ( ) ) ,
787
+ Ok ( FastPathRev :: NeedsFetch ( rev) ) => Some ( rev) ,
788
+ Ok ( FastPathRev :: Indeterminate ) => None ,
789
+ Err ( e) => {
790
+ debug ! ( "failed to check github {:?}" , e) ;
791
+ None
792
+ }
793
+ } ;
789
794
790
795
// We reuse repositories quite a lot, so before we go through and update the
791
796
// repo check to see if it's a little too old and could benefit from a gc.
@@ -815,11 +820,10 @@ pub fn fetch(
815
820
}
816
821
817
822
GitReference :: Rev ( rev) => {
818
- let is_github = || Url :: parse ( url) . map_or ( false , |url| is_github ( & url) ) ;
819
823
if rev. starts_with ( "refs/" ) {
820
824
refspecs. push ( format ! ( "+{0}:{0}" , rev) ) ;
821
- } else if is_github ( ) && is_long_hash ( rev ) {
822
- refspecs. push ( format ! ( "+{0}:refs/commit/{0}" , rev ) ) ;
825
+ } else if let Some ( oid_to_fetch ) = oid_to_fetch {
826
+ refspecs. push ( format ! ( "+{0}:refs/commit/{0}" , oid_to_fetch ) ) ;
823
827
} else {
824
828
// We don't know what the rev will point to. To handle this
825
829
// situation we fetch all branches and tags, and then we pray
@@ -1016,45 +1020,79 @@ fn init(path: &Path, bare: bool) -> CargoResult<git2::Repository> {
1016
1020
Ok ( git2:: Repository :: init_opts ( & path, & opts) ?)
1017
1021
}
1018
1022
1023
+ enum FastPathRev {
1024
+ /// The local rev (determined by `reference.resolve(repo)`) is already up to
1025
+ /// date with what this rev resolves to on GitHub's server.
1026
+ UpToDate ,
1027
+ /// The following SHA must be fetched in order for the local rev to become
1028
+ /// up to date.
1029
+ NeedsFetch ( Oid ) ,
1030
+ /// Don't know whether local rev is up to date. We'll fetch _all_ branches
1031
+ /// and tags from the server and see what happens.
1032
+ Indeterminate ,
1033
+ }
1034
+
1019
1035
/// Updating the index is done pretty regularly so we want it to be as fast as
1020
1036
/// possible. For registries hosted on GitHub (like the crates.io index) there's
1021
1037
/// a fast path available to use [1] to tell us that there's no updates to be
1022
1038
/// made.
1023
1039
///
1024
1040
/// This function will attempt to hit that fast path and verify that the `oid`
1025
- /// is actually the current branch of the repository. If `true` is returned then
1026
- /// no update needs to be performed, but if `false` is returned then the
1027
- /// standard update logic still needs to happen.
1041
+ /// is actually the current branch of the repository.
1028
1042
///
1029
1043
/// [1]: https://developer.github.com/v3/repos/commits/#get-the-sha-1-of-a-commit-reference
1030
1044
///
1031
1045
/// Note that this function should never cause an actual failure because it's
1032
1046
/// just a fast path. As a result all errors are ignored in this function and we
1033
1047
/// just return a `bool`. Any real errors will be reported through the normal
1034
1048
/// update path above.
1035
- fn github_up_to_date (
1049
+ fn github_fast_path (
1036
1050
repo : & mut git2:: Repository ,
1037
1051
url : & str ,
1038
1052
reference : & GitReference ,
1039
1053
config : & Config ,
1040
- ) -> CargoResult < bool > {
1054
+ ) -> CargoResult < FastPathRev > {
1041
1055
let url = Url :: parse ( url) ?;
1042
1056
if !is_github ( & url) {
1043
- return Ok ( false ) ;
1057
+ return Ok ( FastPathRev :: Indeterminate ) ;
1044
1058
}
1045
1059
1060
+ let local_object = reference. resolve ( repo) . ok ( ) ;
1061
+
1046
1062
let github_branch_name = match reference {
1047
1063
GitReference :: Branch ( branch) => branch,
1048
1064
GitReference :: Tag ( tag) => tag,
1049
1065
GitReference :: DefaultBranch => "HEAD" ,
1050
1066
GitReference :: Rev ( rev) => {
1051
1067
if rev. starts_with ( "refs/" ) {
1052
1068
rev
1053
- } else if is_long_hash ( rev) {
1054
- return Ok ( reference. resolve ( repo) . is_ok ( ) ) ;
1069
+ } else if looks_like_commit_hash ( rev) {
1070
+ // `revparse_single` (used by `resolve`) is the only way to turn
1071
+ // short hash -> long hash, but it also parses other things,
1072
+ // like branch and tag names, which might coincidentally be
1073
+ // valid hex.
1074
+ //
1075
+ // We only return early if `rev` is a prefix of the object found
1076
+ // by `revparse_single`. Don't bother talking to GitHub in that
1077
+ // case, since commit hashes are permanent. If a commit with the
1078
+ // requested hash is already present in the local clone, its
1079
+ // contents must be the same as what is on the server for that
1080
+ // hash.
1081
+ //
1082
+ // If `rev` is not found locally by `revparse_single`, we'll
1083
+ // need GitHub to resolve it and get a hash. If `rev` is found
1084
+ // but is not a short hash of the found object, it's probably a
1085
+ // branch and we also need to get a hash from GitHub, in case
1086
+ // the branch has moved.
1087
+ if let Some ( local_object) = local_object {
1088
+ if is_short_hash_of ( rev, local_object) {
1089
+ return Ok ( FastPathRev :: UpToDate ) ;
1090
+ }
1091
+ }
1092
+ rev
1055
1093
} else {
1056
1094
debug ! ( "can't use github fast path with `rev = \" {}\" `" , rev) ;
1057
- return Ok ( false ) ;
1095
+ return Ok ( FastPathRev :: Indeterminate ) ;
1058
1096
}
1059
1097
}
1060
1098
} ;
@@ -1087,18 +1125,50 @@ fn github_up_to_date(
1087
1125
handle. get ( true ) ?;
1088
1126
handle. url ( & url) ?;
1089
1127
handle. useragent ( "cargo" ) ?;
1090
- let mut headers = List :: new ( ) ;
1091
- headers. append ( "Accept: application/vnd.github.3.sha" ) ?;
1092
- headers. append ( & format ! ( "If-None-Match: \" {}\" " , reference. resolve( repo) ?) ) ?;
1093
- handle. http_headers ( headers) ?;
1094
- handle. perform ( ) ?;
1095
- Ok ( handle. response_code ( ) ? == 304 )
1128
+ handle. http_headers ( {
1129
+ let mut headers = List :: new ( ) ;
1130
+ headers. append ( "Accept: application/vnd.github.3.sha" ) ?;
1131
+ if let Some ( local_object) = local_object {
1132
+ headers. append ( & format ! ( "If-None-Match: \" {}\" " , local_object) ) ?;
1133
+ }
1134
+ headers
1135
+ } ) ?;
1136
+
1137
+ let mut response_body = Vec :: new ( ) ;
1138
+ let mut transfer = handle. transfer ( ) ;
1139
+ transfer. write_function ( |data| {
1140
+ response_body. extend_from_slice ( data) ;
1141
+ Ok ( data. len ( ) )
1142
+ } ) ?;
1143
+ transfer. perform ( ) ?;
1144
+ drop ( transfer) ; // end borrow of handle so that response_code can be called
1145
+
1146
+ let response_code = handle. response_code ( ) ?;
1147
+ if response_code == 304 {
1148
+ Ok ( FastPathRev :: UpToDate )
1149
+ } else if response_code == 200 {
1150
+ let oid_to_fetch = str:: from_utf8 ( & response_body) ?. parse :: < Oid > ( ) ?;
1151
+ Ok ( FastPathRev :: NeedsFetch ( oid_to_fetch) )
1152
+ } else {
1153
+ // Usually response_code == 404 if the repository does not exist, and
1154
+ // response_code == 422 if exists but GitHub is unable to resolve the
1155
+ // requested rev.
1156
+ Ok ( FastPathRev :: Indeterminate )
1157
+ }
1096
1158
}
1097
1159
1098
1160
fn is_github ( url : & Url ) -> bool {
1099
1161
url. host_str ( ) == Some ( "github.com" )
1100
1162
}
1101
1163
1102
- fn is_long_hash ( rev : & str ) -> bool {
1103
- rev. len ( ) == 40 && rev. chars ( ) . all ( |ch| ch. is_ascii_hexdigit ( ) )
1164
+ fn looks_like_commit_hash ( rev : & str ) -> bool {
1165
+ rev. len ( ) >= 7 && rev. chars ( ) . all ( |ch| ch. is_ascii_hexdigit ( ) )
1166
+ }
1167
+
1168
+ fn is_short_hash_of ( rev : & str , oid : Oid ) -> bool {
1169
+ let long_hash = oid. to_string ( ) ;
1170
+ match long_hash. get ( ..rev. len ( ) ) {
1171
+ Some ( truncated_long_hash) => truncated_long_hash. eq_ignore_ascii_case ( rev) ,
1172
+ None => false ,
1173
+ }
1104
1174
}
0 commit comments