Skip to content

Commit e092502

Browse files
committed
Auto merge of #116785 - nnethercote:spec-Bytes-read, r=the8472
Specialize `Bytes<R>::next` when `R` is a `BufReader`. This reduces the runtime for a simple program using `Bytes::next` to iterate through a file from 220ms to 70ms on my Linux box. r? `@the8472`
2 parents 4578435 + 181ce63 commit e092502

File tree

2 files changed

+60
-15
lines changed

2 files changed

+60
-15
lines changed

library/std/src/io/buffered/bufreader.rs

+20-5
Original file line numberDiff line numberDiff line change
@@ -2,7 +2,8 @@ mod buffer;
22

33
use crate::fmt;
44
use crate::io::{
5-
self, BorrowedCursor, BufRead, IoSliceMut, Read, Seek, SeekFrom, SizeHint, DEFAULT_BUF_SIZE,
5+
self, uninlined_slow_read_byte, BorrowedCursor, BufRead, IoSliceMut, Read, Seek, SeekFrom,
6+
SizeHint, SpecReadByte, DEFAULT_BUF_SIZE,
67
};
78
use buffer::Buffer;
89

@@ -259,6 +260,22 @@ impl<R: ?Sized + Seek> BufReader<R> {
259260
}
260261
}
261262

263+
impl<R> SpecReadByte for BufReader<R>
264+
where
265+
Self: Read,
266+
{
267+
#[inline]
268+
fn spec_read_byte(&mut self) -> Option<io::Result<u8>> {
269+
let mut byte = 0;
270+
if self.buf.consume_with(1, |claimed| byte = claimed[0]) {
271+
return Some(Ok(byte));
272+
}
273+
274+
// Fallback case, only reached once per buffer refill.
275+
uninlined_slow_read_byte(self)
276+
}
277+
}
278+
262279
#[stable(feature = "rust1", since = "1.0.0")]
263280
impl<R: ?Sized + Read> Read for BufReader<R> {
264281
fn read(&mut self, buf: &mut [u8]) -> io::Result<usize> {
@@ -269,10 +286,8 @@ impl<R: ?Sized + Read> Read for BufReader<R> {
269286
self.discard_buffer();
270287
return self.inner.read(buf);
271288
}
272-
let nread = {
273-
let mut rem = self.fill_buf()?;
274-
rem.read(buf)?
275-
};
289+
let mut rem = self.fill_buf()?;
290+
let nread = rem.read(buf)?;
276291
self.consume(nread);
277292
Ok(nread)
278293
}

library/std/src/io/mod.rs

+40-10
Original file line numberDiff line numberDiff line change
@@ -2777,17 +2777,10 @@ pub struct Bytes<R> {
27772777
impl<R: Read> Iterator for Bytes<R> {
27782778
type Item = Result<u8>;
27792779

2780-
#[inline]
2780+
// Not `#[inline]`. This function gets inlined even without it, but having
2781+
// the inline annotation can result in worse code generation. See #116785.
27812782
fn next(&mut self) -> Option<Result<u8>> {
2782-
let mut byte = 0;
2783-
loop {
2784-
return match self.inner.read(slice::from_mut(&mut byte)) {
2785-
Ok(0) => None,
2786-
Ok(..) => Some(Ok(byte)),
2787-
Err(ref e) if e.is_interrupted() => continue,
2788-
Err(e) => Some(Err(e)),
2789-
};
2790-
}
2783+
SpecReadByte::spec_read_byte(&mut self.inner)
27912784
}
27922785

27932786
#[inline]
@@ -2796,6 +2789,43 @@ impl<R: Read> Iterator for Bytes<R> {
27962789
}
27972790
}
27982791

2792+
/// For the specialization of `Bytes::next`.
2793+
trait SpecReadByte {
2794+
fn spec_read_byte(&mut self) -> Option<Result<u8>>;
2795+
}
2796+
2797+
impl<R> SpecReadByte for R
2798+
where
2799+
Self: Read,
2800+
{
2801+
#[inline]
2802+
default fn spec_read_byte(&mut self) -> Option<Result<u8>> {
2803+
inlined_slow_read_byte(self)
2804+
}
2805+
}
2806+
2807+
/// Read a single byte in a slow, generic way. This is used by the default
2808+
/// `spec_read_byte`.
2809+
#[inline]
2810+
fn inlined_slow_read_byte<R: Read>(reader: &mut R) -> Option<Result<u8>> {
2811+
let mut byte = 0;
2812+
loop {
2813+
return match reader.read(slice::from_mut(&mut byte)) {
2814+
Ok(0) => None,
2815+
Ok(..) => Some(Ok(byte)),
2816+
Err(ref e) if e.is_interrupted() => continue,
2817+
Err(e) => Some(Err(e)),
2818+
};
2819+
}
2820+
}
2821+
2822+
// Used by `BufReader::spec_read_byte`, for which the `inline(ever)` is
2823+
// important.
2824+
#[inline(never)]
2825+
fn uninlined_slow_read_byte<R: Read>(reader: &mut R) -> Option<Result<u8>> {
2826+
inlined_slow_read_byte(reader)
2827+
}
2828+
27992829
trait SizeHint {
28002830
fn lower_bound(&self) -> usize;
28012831

0 commit comments

Comments
 (0)