Skip to content

Commit 7dc5506

Browse files
committed
Stabilize sparse-registry
1 parent 247b22f commit 7dc5506

File tree

10 files changed

+347
-344
lines changed

10 files changed

+347
-344
lines changed

src/cargo/core/features.rs

+12-2
Original file line numberDiff line numberDiff line change
@@ -681,7 +681,7 @@ unstable_cli_options!(
681681
no_index_update: bool = ("Do not update the registry index even if the cache is outdated"),
682682
panic_abort_tests: bool = ("Enable support to run tests with -Cpanic=abort"),
683683
host_config: bool = ("Enable the [host] section in the .cargo/config.toml file"),
684-
sparse_registry: bool = ("Support plain-HTTP-based crate registries"),
684+
sparse_registry: bool = ("Use the sparse protocol when accessing crates.io"),
685685
registry_auth: bool = ("Authentication for alternative registries, and generate registry authentication tokens using asymmetric cryptography"),
686686
target_applies_to_host: bool = ("Enable the `target-applies-to-host` key in the .cargo/config.toml file"),
687687
rustdoc_map: bool = ("Allow passing external documentation mappings to rustdoc"),
@@ -751,6 +751,11 @@ const STABILISED_MULTITARGET: &str = "Multiple `--target` options are now always
751751
const STABILIZED_TERMINAL_WIDTH: &str =
752752
"The -Zterminal-width option is now always enabled for terminal output.";
753753

754+
const STABILISED_SPARSE_REGISTRY: &str = "This flag currently still sets the default protocol\
755+
to `sparse` when accessing crates.io. However, this will be removed in the future. \n\
756+
The stable equivalent is to set the config value `registries.crates-io.protocol = 'sparse'`\n\
757+
or environment variable `CARGO_REGISTRIES_CRATES_IO_PROTOCOL=sparse`";
758+
754759
fn deserialize_build_std<'de, D>(deserializer: D) -> Result<Option<Vec<String>>, D::Error>
755760
where
756761
D: serde::Deserializer<'de>,
@@ -948,7 +953,12 @@ impl CliUnstable {
948953
"multitarget" => stabilized_warn(k, "1.64", STABILISED_MULTITARGET),
949954
"rustdoc-map" => self.rustdoc_map = parse_empty(k, v)?,
950955
"terminal-width" => stabilized_warn(k, "1.68", STABILIZED_TERMINAL_WIDTH),
951-
"sparse-registry" => self.sparse_registry = parse_empty(k, v)?,
956+
"sparse-registry" => {
957+
// Once sparse-registry becomes the default for crates.io, `sparse_registry` should
958+
// be removed entirely from `CliUnstable`.
959+
stabilized_warn(k, "1.68", STABILISED_SPARSE_REGISTRY);
960+
self.sparse_registry = parse_empty(k, v)?;
961+
}
952962
"registry-auth" => self.registry_auth = parse_empty(k, v)?,
953963
"namespaced-features" => stabilized_warn(k, "1.60", STABILISED_NAMESPACED_FEATURES),
954964
"weak-dep-features" => stabilized_warn(k, "1.60", STABILIZED_WEAK_DEP_FEATURES),

src/cargo/sources/registry/http_remote.rs

-3
Original file line numberDiff line numberDiff line change
@@ -157,9 +157,6 @@ impl<'cfg> HttpRegistry<'cfg> {
157157
config: &'cfg Config,
158158
name: &str,
159159
) -> CargoResult<HttpRegistry<'cfg>> {
160-
if !config.cli_unstable().sparse_registry {
161-
anyhow::bail!("usage of sparse registries requires `-Z sparse-registry`");
162-
}
163160
let url = source_id.url().as_str();
164161
// Ensure the url ends with a slash so we can concatenate paths.
165162
if !url.ends_with('/') {

src/doc/src/reference/config.md

+14
Original file line numberDiff line numberDiff line change
@@ -892,6 +892,20 @@ commands like [`cargo publish`] that require authentication.
892892

893893
Can be overridden with the `--token` command-line option.
894894

895+
##### `registries.crates-io.protocol`
896+
* Type: string
897+
* Default: `git`
898+
* Environment: `CARGO_REGISTRIES_CRATES_IO_PROTOCOL`
899+
900+
Specifies the protocol used to access crates.io. Allowed values are `git` or `sparse`.
901+
902+
`git` causes Cargo to clone the entire index of all packages ever published to [crates.io] from <https://github.com/rust-lang/crates.io-index/>.
903+
This can have performance implications due to the size of the index.
904+
`sparse` is a newer protocol which uses HTTPS to download only what is necessary from <https://index.crates.io/>.
905+
This can result in a significant performance improvement for resolving new dependencies in most situations.
906+
907+
More information about registry protocols may be found in the [Registries chapter](registries.md).
908+
895909
#### `[registry]`
896910

897911
The `[registry]` table controls the default registry used when one is not

src/doc/src/reference/registries.md

+20-1
Original file line numberDiff line numberDiff line change
@@ -22,7 +22,9 @@ table has a key for each registry, for example:
2222
my-registry = { index = "https://my-intranet:8080/git/index" }
2323
```
2424

25-
The `index` key should be a URL to a git repository with the registry's index.
25+
The `index` key should be a URL to a git repository with the registry's index or a
26+
Cargo sparse registry URL with the `sparse+` prefix.
27+
2628
A crate can then depend on a crate from another registry by specifying the
2729
`registry` key and a value of the registry's name in that dependency's entry
2830
in `Cargo.toml`:
@@ -98,13 +100,30 @@ has a separate table for each registry, for example:
98100
token = "854DvwSlUwEHtIo3kWy6x7UCPKHfzCmy"
99101
```
100102

103+
### Registry Protocols
104+
Cargo supports two remote registry protocols: `git` and `sparse`. If the registry
105+
index URL starts with `sparse+`, Cargo uses the sparse protocol. Otherwise
106+
Cargo uses the `git` protocol.
107+
108+
The `git` protocol stores index metadata in a git repository and requires Cargo to clone
109+
the entire repo.
110+
111+
The `sparse` protocol fetches individual metadata files using plain HTTP requests.
112+
Since Cargo only downloads the metadata for relevant crates, the `sparse` protocol can
113+
save significant time and bandwidth.
114+
115+
The [crates.io] registry supports both protocols. The protocol for crates.io is
116+
controlled via the [`registries.crates-io.protocol`] config key.
117+
101118
[Source Replacement]: source-replacement.md
102119
[Running a Registry]: running-a-registry.md
103120
[`cargo publish`]: ../commands/cargo-publish.md
104121
[`cargo package`]: ../commands/cargo-package.md
105122
[`cargo login`]: ../commands/cargo-login.md
106123
[config]: config.md
107124
[crates.io]: https://crates.io/
125+
[`registries.crates-io.protocol`]: config.md#registriescrates-ioprotocol
126+
108127

109128
<script>
110129
(function() {

src/doc/src/reference/registry-index.md

+57-5
Original file line numberDiff line numberDiff line change
@@ -6,11 +6,10 @@ introduced them. Older versions of Cargo may not be able to use packages that
66
make use of new features. However, the format for older packages should not
77
change, so older versions of Cargo should be able to use them.
88

9-
The index is stored in a git repository so that Cargo can efficiently fetch
10-
incremental updates to the index. In the root of the repository is a file
11-
named `config.json` which contains JSON information used by Cargo for
12-
accessing the registry. This is an example of what the [crates.io] config file
13-
looks like:
9+
### Index Configuration
10+
The root of the index contains a file named `config.json` which contains JSON
11+
information used by Cargo for accessing the registry. This is an example of
12+
what the [crates.io] config file looks like:
1413

1514
```javascript
1615
{
@@ -37,11 +36,15 @@ The keys are:
3736
is not specified, commands such as [`cargo publish`] will not work. The web
3837
API is described below.
3938

39+
40+
### Download Endpoint
4041
The download endpoint should send the `.crate` file for the requested package.
4142
Cargo supports https, http, and file URLs, HTTP redirects, HTTP1 and HTTP2.
4243
The exact specifics of TLS support depend on the platform that Cargo is
4344
running on, the version of Cargo, and how it was compiled.
4445

46+
47+
### Index files
4548
The rest of the index repository contains one file for each package, where the
4649
filename is the name of the package in lowercase. Each version of the package
4750
has a separate line in the file. The files are organized in a tier of
@@ -202,6 +205,55 @@ explaining the format of the entry.
202205
The JSON objects should not be modified after they are added except for the
203206
`yanked` field whose value may change at any time.
204207

208+
### Index Protocols
209+
Cargo supports two remote registry protocols: `git` and `sparse`. The `git` protocol
210+
stores index files in a git repository and the `sparse` protocol fetches individual
211+
files over HTTP.
212+
213+
#### Git Protocol
214+
The git protocol has no protocol prefix in the index url. For example the git index URL
215+
for [crates.io] is `https://github.com/rust-lang/crates.io-index`.
216+
217+
Cargo caches the git repository on disk so that it can efficiently incrementally fetch
218+
updates.
219+
220+
#### Sparse Protocol
221+
The sparse protocol uses the `sparse+` protocol prefix in the registry URL. For example,
222+
the sparse index URL for [crates.io] is `sparse+https://index.crates.io/`.
223+
224+
The sparse protocol downloads each index file using an individual HTTP request. Since
225+
this results in a large number of small HTTP requests, performance is signficiantly
226+
improved with a server that supports pipelining and HTTP/2.
227+
228+
##### Caching
229+
Cargo caches the crate metadata files, and captures the `ETag` or `Last-Modified`
230+
HTTP header from the server for each entry. When refreshing crate metadata, Cargo
231+
sends the `If-None-Match` or `If-Modified-Since` header to allow the server to respond
232+
with HTTP 304 "Not Modified" if the local cache is valid, saving time and bandwidth.
233+
If both `ETag` and `Last-Modified` headers are present, Cargo uses the `ETag` only.
234+
235+
##### Cache Invalidation
236+
If a registry is using some kind of CDN or proxy which caches access to the index files,
237+
then it is recommended that registries implement some form of cache invalidation when
238+
the files are updated. If these caches are not updated, then users may not be able to
239+
access new crates until the cache is cleared.
240+
241+
##### Nonexistent Crates
242+
For crates that do not exist, the registry should respond with a 404 "Not Found", 410 "Gone"
243+
or 451 "Unavailable For Legal Reasons" code.
244+
245+
##### Sparse Limitations
246+
Since the URL of the registry is stored in the lockfile, it's not recommended to offer
247+
a registry with both protocols. Discussion about a transition plan is ongoing in issue
248+
[#10964]. The [crates.io] registry is an exception, since Cargo internally substitues
249+
the equivalent git URL when the sparse protocol is used.
250+
251+
If a registry does offer both protocols, it's currently recommended to choose one protocol
252+
as the canonical protocol and use [source replacement] for the other protocol.
253+
254+
205255
[`cargo publish`]: ../commands/cargo-publish.md
206256
[alphanumeric]: ../../std/primitive.char.html#method.is_alphanumeric
207257
[crates.io]: https://crates.io/
258+
[source replacement]: ../reference/source-replacement.md
259+
[#10964]: https://github.com/rust-lang/cargo/issues/10964

src/doc/src/reference/unstable.md

+5-27
Original file line numberDiff line numberDiff line change
@@ -97,7 +97,6 @@ Each new feature described below should explain how to use it.
9797
* Registries
9898
* [credential-process](#credential-process) — Adds support for fetching registry tokens from an external authentication program.
9999
* [`cargo logout`](#cargo-logout) — Adds the `logout` command to remove the currently saved registry token.
100-
* [sparse-registry](#sparse-registry) — Adds support for fetching from static-file HTTP registries (`sparse+`)
101100
* [publish-timeout](#publish-timeout) — Controls the timeout between uploading the crate and being available in the index
102101
* [registry-auth](#registry-auth) — Adds support for authenticated registries, and generate registry authentication tokens using asymmetric cryptography.
103102

@@ -792,32 +791,6 @@ fn main() {
792791
}
793792
```
794793

795-
### sparse-registry
796-
* Tracking Issue: [9069](https://github.com/rust-lang/cargo/issues/9069)
797-
* RFC: [#2789](https://github.com/rust-lang/rfcs/pull/2789)
798-
799-
The `sparse-registry` feature allows cargo to interact with remote registries served
800-
over plain HTTP rather than git. These registries can be identified by urls starting with
801-
`sparse+http://` or `sparse+https://`.
802-
803-
When fetching index metadata over HTTP, Cargo only downloads the metadata for relevant
804-
crates, which can save significant time and bandwidth.
805-
806-
The format of the sparse index is identical to a checkout of a git-based index.
807-
808-
The `registries.crates-io.protocol` config option can be used to set the default protocol
809-
for crates.io. This option requires `-Z sparse-registry` to be enabled.
810-
811-
* `sparse` — Use sparse index.
812-
* `git` — Use git index.
813-
* If the option is unset, it will be sparse index if `-Z sparse-registry` is enabled,
814-
otherwise it will be git index.
815-
816-
Cargo locally caches the crate metadata files, and captures an `ETag` or `Last-Modified`
817-
HTTP header from the server for each entry. When refreshing crate metadata, Cargo will
818-
send the `If-None-Match` or `If-Modified-Since` header to allow the server to respond
819-
with HTTP 304 if the local cache is valid, saving time and bandwidth.
820-
821794
### publish-timeout
822795
* Tracking Issue: [11222](https://github.com/rust-lang/cargo/issues/11222)
823796

@@ -1456,3 +1429,8 @@ for more information.
14561429
The `-Z terminal-width` option has been stabilized in the 1.68 release.
14571430
The terminal width is always passed to the compiler when running from a
14581431
terminal where Cargo can automatically detect the width.
1432+
1433+
### sparse-registry
1434+
1435+
Sparse registry support has been stabilized in the 1.68 release.
1436+
See [Registry Protocols](registries.md#registry-protocols) for more information.

tests/testsuite/alt_registry.rs

+3-9
Original file line numberDiff line numberDiff line change
@@ -1335,9 +1335,7 @@ fn sparse_lockfile() {
13351335
.file("src/lib.rs", "")
13361336
.build();
13371337

1338-
p.cargo("-Zsparse-registry generate-lockfile")
1339-
.masquerade_as_nightly_cargo(&["sparse-registry"])
1340-
.run();
1338+
p.cargo("generate-lockfile").run();
13411339
assert_match_exact(
13421340
&p.read_lockfile(),
13431341
r#"# This file is automatically @generated by Cargo.
@@ -1383,9 +1381,7 @@ fn publish_with_transitive_dep() {
13831381
)
13841382
.file("src/lib.rs", "")
13851383
.build();
1386-
p1.cargo("publish -Zsparse-registry --registry Alt-1")
1387-
.masquerade_as_nightly_cargo(&["sparse-registry"])
1388-
.run();
1384+
p1.cargo("publish --registry Alt-1").run();
13891385

13901386
let p2 = project()
13911387
.file(
@@ -1402,7 +1398,5 @@ fn publish_with_transitive_dep() {
14021398
)
14031399
.file("src/lib.rs", "")
14041400
.build();
1405-
p2.cargo("publish -Zsparse-registry")
1406-
.masquerade_as_nightly_cargo(&["sparse-registry"])
1407-
.run();
1401+
p2.cargo("publish").run();
14081402
}

tests/testsuite/publish.rs

+8-20
Original file line numberDiff line numberDiff line change
@@ -195,8 +195,8 @@ fn simple_publish_with_asymmetric() {
195195
.file("src/main.rs", "fn main() {}")
196196
.build();
197197

198-
p.cargo("publish --no-verify -Zregistry-auth -Zsparse-registry --registry dummy-registry")
199-
.masquerade_as_nightly_cargo(&["registry-auth", "sparse-registry"])
198+
p.cargo("publish --no-verify -Zregistry-auth --registry dummy-registry")
199+
.masquerade_as_nightly_cargo(&["registry-auth"])
200200
.with_stderr(
201201
"\
202202
[UPDATING] `dummy-registry` index
@@ -2518,8 +2518,7 @@ fn wait_for_first_publish() {
25182518
.file("src/lib.rs", "")
25192519
.build();
25202520

2521-
p.cargo("publish --no-verify -Z sparse-registry")
2522-
.masquerade_as_nightly_cargo(&["sparse-registry"])
2521+
p.cargo("publish --no-verify")
25232522
.replace_crates_io(registry.index_url())
25242523
.with_status(0)
25252524
.with_stderr(
@@ -2556,10 +2555,7 @@ See [..]
25562555
.file("src/main.rs", "fn main() {}")
25572556
.build();
25582557

2559-
p.cargo("build -Z sparse-registry")
2560-
.masquerade_as_nightly_cargo(&["sparse-registry"])
2561-
.with_status(0)
2562-
.run();
2558+
p.cargo("build").with_status(0).run();
25632559
}
25642560

25652561
/// A separate test is needed for package names with - or _ as they hit
@@ -2602,8 +2598,7 @@ fn wait_for_first_publish_underscore() {
26022598
.file("src/lib.rs", "")
26032599
.build();
26042600

2605-
p.cargo("publish --no-verify -Z sparse-registry")
2606-
.masquerade_as_nightly_cargo(&["sparse-registry"])
2601+
p.cargo("publish --no-verify")
26072602
.replace_crates_io(registry.index_url())
26082603
.with_status(0)
26092604
.with_stderr(
@@ -2640,10 +2635,7 @@ See [..]
26402635
.file("src/main.rs", "fn main() {}")
26412636
.build();
26422637

2643-
p.cargo("build -Z sparse-registry")
2644-
.masquerade_as_nightly_cargo(&["sparse-registry"])
2645-
.with_status(0)
2646-
.run();
2638+
p.cargo("build").with_status(0).run();
26472639
}
26482640

26492641
#[cargo_test]
@@ -2696,8 +2688,7 @@ fn wait_for_subsequent_publish() {
26962688
.file("src/lib.rs", "")
26972689
.build();
26982690

2699-
p.cargo("publish --no-verify -Z sparse-registry")
2700-
.masquerade_as_nightly_cargo(&["sparse-registry"])
2691+
p.cargo("publish --no-verify")
27012692
.replace_crates_io(registry.index_url())
27022693
.with_status(0)
27032694
.with_stderr(
@@ -2734,10 +2725,7 @@ See [..]
27342725
.file("src/main.rs", "fn main() {}")
27352726
.build();
27362727

2737-
p.cargo("build -Z sparse-registry")
2738-
.masquerade_as_nightly_cargo(&["sparse-registry"])
2739-
.with_status(0)
2740-
.run();
2728+
p.cargo("build").with_status(0).run();
27412729
}
27422730

27432731
#[cargo_test]

0 commit comments

Comments
 (0)