Skip to content

Commit 8d8f06b

Browse files
committed
avoid excessive initialization when copying to a Vec
It now keeps track of initialized bytes to avoid reinitialization. It also keeps track of read sizes to avoid initializing more bytes than the reader needs. This is important when passing a huge vector to a Read that only has a few bytes to offer and doesn't implement read_buf().
1 parent 9c20ddd commit 8d8f06b

File tree

1 file changed

+47
-17
lines changed

1 file changed

+47
-17
lines changed

library/std/src/io/copy.rs

+47-17
Original file line numberDiff line numberDiff line change
@@ -1,6 +1,7 @@
11
use super::{BorrowedBuf, BufReader, BufWriter, Read, Result, Write, DEFAULT_BUF_SIZE};
22
use crate::alloc::Allocator;
33
use crate::cmp;
4+
use crate::cmp::min;
45
use crate::collections::VecDeque;
56
use crate::io::IoSlice;
67
use crate::mem::MaybeUninit;
@@ -271,28 +272,57 @@ impl<A: Allocator> BufferedWriterSpec for Vec<u8, A> {
271272
}
272273
}
273274

275+
// don't immediately offer the vec's whole spare capacity, otherwise
276+
// we might have to fully initialize it if the reader doesn't have a custom read_buf() impl
277+
let mut max_read_size = DEFAULT_BUF_SIZE;
278+
274279
loop {
275280
self.reserve(DEFAULT_BUF_SIZE);
276-
let mut buf: BorrowedBuf<'_> = self.spare_capacity_mut().into();
277-
match reader.read_buf(buf.unfilled()) {
278-
Ok(()) => {}
279-
Err(e) if e.is_interrupted() => continue,
280-
Err(e) => return Err(e),
281-
};
281+
let mut initialized_spare_capacity = 0;
282282

283-
let read = buf.filled().len();
284-
if read == 0 {
285-
break;
286-
}
283+
loop {
284+
let buf = self.spare_capacity_mut();
285+
let read_size = min(max_read_size, buf.len());
286+
let mut buf = BorrowedBuf::from(&mut buf[..read_size]);
287+
// SAFETY: init is either 0 or the init_len from the previous iteration.
288+
unsafe {
289+
buf.set_init(initialized_spare_capacity);
290+
}
291+
match reader.read_buf(buf.unfilled()) {
292+
Ok(()) => {
293+
let bytes_read = buf.len();
287294

288-
// SAFETY: BorrowedBuf guarantees all of its filled bytes are init
289-
// and the number of read bytes can't exceed the spare capacity since
290-
// that's what the buffer is borrowing from.
291-
unsafe { self.set_len(self.len() + read) };
292-
bytes += read as u64;
293-
}
295+
// EOF
296+
if bytes_read == 0 {
297+
return Ok(bytes);
298+
}
294299

295-
Ok(bytes)
300+
// the reader is returning short reads but it doesn't call ensure_init()
301+
if buf.init_len() < buf.capacity() {
302+
max_read_size = usize::MAX;
303+
}
304+
// the reader hasn't returned short reads so far
305+
if bytes_read == buf.capacity() {
306+
max_read_size *= 2;
307+
}
308+
309+
initialized_spare_capacity = buf.init_len() - bytes_read;
310+
bytes += bytes_read as u64;
311+
// SAFETY: BorrowedBuf guarantees all of its filled bytes are init
312+
// and the number of read bytes can't exceed the spare capacity since
313+
// that's what the buffer is borrowing from.
314+
unsafe { self.set_len(self.len() + bytes_read) };
315+
316+
// spare capacity full, reserve more
317+
if self.len() == self.capacity() {
318+
break;
319+
}
320+
}
321+
Err(e) if e.is_interrupted() => continue,
322+
Err(e) => return Err(e),
323+
}
324+
}
325+
}
296326
}
297327
}
298328

0 commit comments

Comments
 (0)