Skip to content

Commit

Permalink
Specialize Bytes<R>::next when R is a BufReader.
Browse files Browse the repository at this point in the history
This reduces the runtime for a simple program using `Bytes::next` to
iterate through a file from 220ms to 70ms on my Linux box.
  • Loading branch information
nnethercote committed Oct 19, 2023
1 parent cc705b8 commit 42f7720
Show file tree
Hide file tree
Showing 2 changed files with 53 additions and 12 deletions.
24 changes: 19 additions & 5 deletions library/std/src/io/buffered/bufreader.rs
Original file line number Diff line number Diff line change
Expand Up @@ -2,7 +2,8 @@ mod buffer;

use crate::fmt;
use crate::io::{
self, BorrowedCursor, BufRead, IoSliceMut, Read, Seek, SeekFrom, SizeHint, DEFAULT_BUF_SIZE,
self, BorrowedCursor, BufRead, IoSliceMut, Read, Seek, SeekFrom, SizeHint, SpecReadByte,
DEFAULT_BUF_SIZE,
};
use buffer::Buffer;

Expand Down Expand Up @@ -259,6 +260,21 @@ impl<R: ?Sized + Seek> BufReader<R> {
}
}

// Specialized `SpecReadByte` implementation for `BufReader`, reached from
// `Bytes::next` via `SpecReadByte::spec_read_byte`.
//
// The fast path takes a single byte through `self.buf.consume_with` without
// going through `Read::read`; anything else is delegated to the shared,
// non-specializable `slow_read_byte`.
impl<R> SpecReadByte for BufReader<R>
where
Self: Read,
{
#[inline]
fn spec_read_byte(&mut self) -> Option<io::Result<u8>> {
let mut byte = 0;
// Fast path: ask the internal buffer for exactly one byte. The closure
// copies that byte out of the claimed slice.
// NOTE(review): presumably `consume_with` returns `true` only when the
// requested byte was available (and then consumed) — confirm against
// `Buffer::consume_with`.
if self.buf.consume_with(1, |claimed| byte = claimed[0]) {
return Some(Ok(byte));
}

// Slow path: `consume_with` returned `false`, so fall back to the generic
// one-byte read, which also covers end of input and errors.
self.slow_read_byte()
}
}

#[stable(feature = "rust1", since = "1.0.0")]
impl<R: ?Sized + Read> Read for BufReader<R> {
fn read(&mut self, buf: &mut [u8]) -> io::Result<usize> {
Expand All @@ -269,10 +285,8 @@ impl<R: ?Sized + Read> Read for BufReader<R> {
self.discard_buffer();
return self.inner.read(buf);
}
let nread = {
let mut rem = self.fill_buf()?;
rem.read(buf)?
};
let mut rem = self.fill_buf()?;
let nread = rem.read(buf)?;
self.consume(nread);
Ok(nread)
}
Expand Down
41 changes: 34 additions & 7 deletions library/std/src/io/mod.rs
Original file line number Diff line number Diff line change
Expand Up @@ -2777,23 +2777,50 @@ pub struct Bytes<R> {
impl<R: Read> Iterator for Bytes<R> {
type Item = Result<u8>;

#[inline]
// Not `#[inline]`. This function gets inlined even without it, but having
// the inline annotation can result in worse code generation. See #116785.
//
// Delegates to `SpecReadByte::spec_read_byte` on the wrapped reader so that
// reader types with a specialized implementation (e.g. `BufReader`) can
// supply their own single-byte path.
fn next(&mut self) -> Option<Result<u8>> {
SpecReadByte::spec_read_byte(&mut self.inner)
}

// Forwards to the `SizeHint` implementation of the wrapped reader.
#[inline]
fn size_hint(&self) -> (usize, Option<usize>) {
SizeHint::size_hint(&self.inner)
}
}

// Trait for specialization of `Bytes::next`.
//
// Both methods share the return convention of `Bytes::next`: `None` when the
// reader has no more bytes to give, `Some(Ok(byte))` for a byte that was
// read, and `Some(Err(e))` for an I/O error.
trait SpecReadByte {
// Specializable method for reading a single byte.
fn spec_read_byte(&mut self) -> Option<Result<u8>>;

// Non-specializable method for reading a single byte. This is used by the
// default `spec_read_byte` and can also be called on a slow path of a
// specialized `spec_read_byte` method.
fn slow_read_byte(&mut self) -> Option<Result<u8>>;
}

impl<R> SpecReadByte for R
where
Self: Read,
{
// Default (overridable) implementation: there is no fast path for an
// arbitrary reader, so go straight to the generic one-byte read.
#[inline]
default fn spec_read_byte(&mut self) -> Option<Result<u8>> {
self.slow_read_byte()
}

// Generic single-byte read: issues a `read` into a one-byte slice and maps
// the outcome onto the iterator-style return value.
// NOTE(review): `#[inline(never)]` presumably keeps this slow path out of
// line so callers' inlined fast paths stay small — confirm intent.
#[inline(never)]
fn slow_read_byte(&mut self) -> Option<Result<u8>> {
let mut byte = 0;
// Loop only to retry after an interrupted read; every other outcome
// returns immediately.
loop {
return match self.inner.read(slice::from_mut(&mut byte)) {
return match self.read(slice::from_mut(&mut byte)) {
// Zero bytes read: report the end of the byte stream.
Ok(0) => None,
// A byte was written into `byte`.
Ok(..) => Some(Ok(byte)),
// Interrupted reads are retried rather than surfaced to the caller.
Err(ref e) if e.is_interrupted() => continue,
// Any other error is handed to the caller as an item.
Err(e) => Some(Err(e)),
};
}
}

#[inline]
fn size_hint(&self) -> (usize, Option<usize>) {
SizeHint::size_hint(&self.inner)
}
}

trait SizeHint {
Expand Down

0 comments on commit 42f7720

Please sign in to comment.