//! [![github]](https://github.com/dtolnay/itoa) [![crates-io]](https://crates.io/crates/itoa) [![docs-rs]](https://docs.rs/itoa)
//!
//! [github]: https://img.shields.io/badge/github-8da0cb?style=for-the-badge&labelColor=555555&logo=github
//! [crates-io]: https://img.shields.io/badge/crates.io-fc8d62?style=for-the-badge&labelColor=555555&logo=rust
//! [docs-rs]: https://img.shields.io/badge/docs.rs-66c2a5?style=for-the-badge&labelColor=555555&logo=docs.rs
//!
//! <br>
//!
//! This crate provides fast functions for printing integer primitives to an
//! [`io::Write`] or a [`fmt::Write`]. The implementation comes straight from
//! [libcore] but avoids the performance penalty of going through
//! [`fmt::Formatter`].
//!
//! See also [`dtoa`] for printing floating point primitives.
//!
//! [`io::Write`]: https://doc.rust-lang.org/std/io/trait.Write.html
//! [`fmt::Write`]: https://doc.rust-lang.org/core/fmt/trait.Write.html
//! [libcore]: https://github.com/rust-lang/rust/blob/b8214dc6c6fc20d0a660fb5700dca9ebf51ebe89/src/libcore/fmt/num.rs#L201-L254
//! [`fmt::Formatter`]: https://doc.rust-lang.org/std/fmt/struct.Formatter.html
//! [`dtoa`]: https://github.com/dtolnay/dtoa
//!
//! <br>
//!
//! # Performance (lower is better)
//!
//! ![performance](https://raw.githubusercontent.com/dtolnay/itoa/master/performance.png)
//!
//! <br>
//!
//! # Example
//!
//! ```
//! fn main() {
//!     let mut buffer = itoa::Buffer::new();
//!     let printed = buffer.format(128u64);
//!     assert_eq!(printed, "128");
//! }
//! ```
#![doc(html_root_url = "https://docs.rs/itoa/0.4.8")]
// Build against `core` only unless the `std` feature is enabled.
#![cfg_attr(not(feature = "std"), no_std)]
#![allow(
    clippy::cast_lossless,
    clippy::cast_possible_truncation,
    clippy::expl_impl_clone_on_copy,
    clippy::missing_errors_doc,
    clippy::must_use_candidate,
    clippy::semicolon_if_nothing_returned, // https://github.com/rust-lang/rust-clippy/issues/7768
    clippy::transmute_ptr_to_ptr,
    clippy::unreadable_literal
)]
mod udiv128;
2018-03-16 21:14:54 -04:00
#[cfg(feature = "std")]
2021-12-12 00:07:41 -05:00
use std::{mem, ptr, slice, str};
2016-06-25 17:32:23 -04:00
2018-03-16 21:14:54 -04:00
#[cfg(not(feature = "std"))]
2021-12-12 00:07:14 -05:00
use core::{mem, ptr, slice, str};
2018-03-16 21:14:54 -04:00
use self::mem::MaybeUninit;
/// A safe API for formatting integers to text.
2018-09-08 15:05:53 -04:00
///
/// # Example
///
2019-04-30 04:20:42 -04:00
/// ```
2018-09-08 15:05:53 -04:00
/// let mut buffer = itoa::Buffer::new();
/// let printed = buffer.format(1234);
/// assert_eq!(printed, "1234");
/// ```
#[derive(Copy)]
pub struct Buffer {
bytes: [MaybeUninit<u8>; I128_MAX_LEN],
}
impl Default for Buffer {
#[inline]
fn default() -> Buffer {
Buffer::new()
}
}
impl Clone for Buffer {
#[inline]
fn clone(&self) -> Self {
Buffer::new()
}
}
impl Buffer {
/// This is a cheap operation; you don't need to worry about reusing buffers
/// for efficiency.
#[inline]
pub fn new() -> Buffer {
let bytes = [MaybeUninit::<u8>::uninit(); I128_MAX_LEN];
Buffer { bytes }
}
/// Print an integer into this buffer and return a reference to its string representation
2018-09-08 15:05:53 -04:00
/// within the buffer.
pub fn format<I: Integer>(&mut self, i: I) -> &str {
i.write(self)
}
}
// Seal to prevent downstream implementations of the Integer trait.
//
// `Integer` has `private::Sealed` as a supertrait, and this module is not
// `pub`, so code outside this crate cannot name `Sealed` and therefore cannot
// implement `Integer` for its own types.
mod private {
pub trait Sealed {}
}
/// An integer that can be written into an [`itoa::Buffer`][Buffer].
2018-03-18 03:22:56 -04:00
///
/// This trait is sealed and cannot be implemented for types outside of itoa.
pub trait Integer: private::Sealed {
2018-03-18 03:20:35 -04:00
// Not public API.
#[doc(hidden)]
2019-05-01 22:10:39 -04:00
fn write(self, buf: &mut Buffer) -> &str;
2016-06-25 17:32:23 -04:00
}
// Crate-internal counterpart of `Integer`: formats `self` into a scratch
// buffer of type `Buf` and returns the bytes that make up the text, borrowed
// from that buffer.
trait IntegerPrivate<Buf> {
    fn write_to(self, buf: &mut Buf) -> &[u8];
}
// The two ASCII digits of every value in `0..100`, concatenated in order.
// The pair for `k` starts at byte offset `2 * k`, so the table must be exactly
// 200 bytes long with nothing else inside the literal.
const DEC_DIGITS_LUT: &[u8] = b"\
      0001020304050607080910111213141516171819\
      2021222324252627282930313233343536373839\
      4041424344454647484950515253545556575859\
      6061626364656667686970717273747576777879\
      8081828384858687888990919293949596979899";
// Adaptation of the original implementation at
// https://github.com/rust-lang/rust/blob/b8214dc6c6fc20d0a660fb5700dca9ebf51ebe89/src/libcore/fmt/num.rs#L188-L266
//
// Implements the public `Integer` trait (and the `Sealed` marker) for `$t` by
// forwarding to the type's `IntegerPrivate::write_to`, which works on an
// array of exactly `$max_len` bytes.
macro_rules! impl_IntegerCommon {
    ($max_len:expr, $t:ident) => {
        impl Integer for $t {
            #[inline]
            fn write(self, buf: &mut Buffer) -> &str {
                debug_assert!($max_len <= I128_MAX_LEN);
                // SAFETY: `$max_len <= I128_MAX_LEN` (checked above in debug
                // builds), so the first `$max_len` elements of `buf.bytes`
                // form a valid, properly aligned `[MaybeUninit<u8>; $max_len]`
                // that is exclusively borrowed for as long as `buf` is.
                let buf = unsafe {
                    &mut *(&mut buf.bytes as *mut [MaybeUninit<u8>; I128_MAX_LEN]
                        as *mut [MaybeUninit<u8>; $max_len])
                };
                let bytes = self.write_to(buf);
                // SAFETY: the `write_to` implementations in this file only
                // emit ASCII digits and an optional leading '-', which is
                // valid UTF-8.
                unsafe { str::from_utf8_unchecked(bytes) }
            }
        }

        impl private::Sealed for $t {}
    };
}
// Implements `Integer` and `IntegerPrivate` for each listed `$t`, doing the
// digit arithmetic in the unsigned type `$conv_fn`.
//
// Digits are produced from least to most significant and written backwards
// from the end of the buffer; the returned slice is the used tail of `buf`.
// Every invocation must pass a `$max_len` that is at least the longest decimal
// rendering of `$t` (including the '-' sign for signed types).
macro_rules! impl_Integer {
    ($($max_len:expr => $t:ident),* as $conv_fn:ident) => {$(
        impl_IntegerCommon!($max_len, $t);

        impl IntegerPrivate<[MaybeUninit<u8>; $max_len]> for $t {
            #[allow(unused_comparisons)]
            #[inline]
            fn write_to(self, buf: &mut [MaybeUninit<u8>; $max_len]) -> &[u8] {
                let is_nonnegative = self >= 0;
                let mut n = if is_nonnegative {
                    self as $conv_fn
                } else {
                    // Take the absolute value in the unsigned domain: two's
                    // complement negation is bitwise NOT followed by adding 1.
                    // This also handles `$t::MIN`, which has no positive
                    // counterpart in `$t`.
                    (!(self as $conv_fn)).wrapping_add(1)
                };
                // `curr` is the index of the first byte written so far.
                let mut curr = buf.len() as isize;
                let buf_ptr = buf.as_mut_ptr() as *mut u8;
                let lut_ptr = DEC_DIGITS_LUT.as_ptr();

                // SAFETY: every LUT offset used below is `2 * k` for some
                // `k < 100`, so each two-byte read stays inside the 200-byte
                // table. `curr` only decreases by the number of characters
                // emitted, which cannot exceed `$max_len` as long as
                // `$max_len` covers the longest rendering of `$t`, so every
                // write stays inside `buf`.
                unsafe {
                    // need at least 16 bits for the 4-characters-at-a-time to work.
                    if mem::size_of::<$t>() >= 2 {
                        // eagerly decode 4 characters at a time
                        while n >= 10000 {
                            let rem = (n % 10000) as isize;
                            n /= 10000;

                            let d1 = (rem / 100) << 1;
                            let d2 = (rem % 100) << 1;
                            curr -= 4;
                            ptr::copy_nonoverlapping(lut_ptr.offset(d1), buf_ptr.offset(curr), 2);
                            ptr::copy_nonoverlapping(lut_ptr.offset(d2), buf_ptr.offset(curr + 2), 2);
                        }
                    }

                    // if we reach here numbers are <= 9999, so at most 4 chars long
                    let mut n = n as isize; // possibly reduce 64bit math

                    // decode 2 more chars, if > 2 chars
                    if n >= 100 {
                        let d1 = (n % 100) << 1;
                        n /= 100;
                        curr -= 2;
                        ptr::copy_nonoverlapping(lut_ptr.offset(d1), buf_ptr.offset(curr), 2);
                    }

                    // decode last 1 or 2 chars
                    if n < 10 {
                        curr -= 1;
                        *buf_ptr.offset(curr) = (n as u8) + b'0';
                    } else {
                        let d1 = n << 1;
                        curr -= 2;
                        ptr::copy_nonoverlapping(lut_ptr.offset(d1), buf_ptr.offset(curr), 2);
                    }

                    if !is_nonnegative {
                        curr -= 1;
                        *buf_ptr.offset(curr) = b'-';
                    }
                }

                let len = buf.len() - curr as usize;
                // SAFETY: bytes `curr..buf.len()` were all initialized by the
                // writes above and lie inside `buf`.
                unsafe { slice::from_raw_parts(buf_ptr.offset(curr), len) }
            }
        }
    )*};
}
// Number of bytes needed for the longest decimal rendering of each primitive,
// including the leading '-' for the signed types. The value with the longest
// rendering is shown next to each constant.
const I8_MAX_LEN: usize = 4; // "-128"
const U8_MAX_LEN: usize = 3; // "255"
const I16_MAX_LEN: usize = 6; // "-32768"
const U16_MAX_LEN: usize = 5; // "65535"
const I32_MAX_LEN: usize = 11; // "-2147483648"
const U32_MAX_LEN: usize = 10; // "4294967295"
const I64_MAX_LEN: usize = 20; // "-9223372036854775808"
const U64_MAX_LEN: usize = 20; // "18446744073709551615"
impl_Integer!(
I8_MAX_LEN => i8,
U8_MAX_LEN => u8,
I16_MAX_LEN => i16,
U16_MAX_LEN => u16,
I32_MAX_LEN => i32,
2018-09-08 15:11:06 -04:00
U32_MAX_LEN => u32
as u32);
impl_Integer!(I64_MAX_LEN => i64, U64_MAX_LEN => u64 as u64);
2016-06-25 17:32:23 -04:00
#[cfg(target_pointer_width = "16")]
impl_Integer!(I16_MAX_LEN => isize, U16_MAX_LEN => usize as u16);
2016-06-25 17:32:23 -04:00
#[cfg(target_pointer_width = "32")]
2018-03-22 04:18:40 -04:00
impl_Integer!(I32_MAX_LEN => isize, U32_MAX_LEN => usize as u32);
2016-06-25 17:32:23 -04:00
#[cfg(target_pointer_width = "64")]
impl_Integer!(I64_MAX_LEN => isize, U64_MAX_LEN => usize as u64);
2017-09-16 16:18:37 -04:00
// Implements `Integer` and `IntegerPrivate` for the 128-bit types.
//
// The value is split into base-10^19 "limbs". Each limb fits in a `u64` and is
// printed by the `u64` implementation of `write_to` directly into the right
// place in `buf`; gaps left by limbs shorter than 19 digits are filled with
// '0'. Every invocation must pass a `$max_len` of at least 39 (40 for the
// signed type, to leave room for '-').
macro_rules! impl_Integer128 {
    ($($max_len:expr => $t:ident),*) => {$(
        impl_IntegerCommon!($max_len, $t);

        impl IntegerPrivate<[MaybeUninit<u8>; $max_len]> for $t {
            #[allow(unused_comparisons)]
            #[inline]
            fn write_to(self, buf: &mut [MaybeUninit<u8>; $max_len]) -> &[u8] {
                let is_nonnegative = self >= 0;
                let n = if is_nonnegative {
                    self as u128
                } else {
                    // Take the absolute value in the unsigned domain: two's
                    // complement negation is bitwise NOT followed by adding 1.
                    (!(self as u128)).wrapping_add(1)
                };
                // `curr` is the index of the first byte written so far.
                let mut curr = buf.len() as isize;
                let buf_ptr = buf.as_mut_ptr() as *mut u8;

                // SAFETY: with `$max_len >= 39`, both `U64_MAX_LEN`-byte
                // windows handed to the `u64` formatter (`buf1`, `buf2`) lie
                // inside `buf`, as do the zero-fill ranges and the final
                // digit/sign bytes; `curr` never drops below 0. The returned
                // slice covers only bytes that were written above.
                unsafe {
                    // Divide by 10^19 which is the highest power of 10 less than 2^64.
                    let (n, rem) = udiv128::udivmod_1e19(n);
                    let buf1 = buf_ptr.offset(curr - U64_MAX_LEN as isize) as *mut [MaybeUninit<u8>; U64_MAX_LEN];
                    curr -= rem.write_to(&mut *buf1).len() as isize;

                    if n != 0 {
                        // Memset the base10 leading zeros of rem.
                        let target = buf.len() as isize - 19;
                        ptr::write_bytes(buf_ptr.offset(target), b'0', (curr - target) as usize);
                        curr = target;

                        // Divide by 10^19 again.
                        let (n, rem) = udiv128::udivmod_1e19(n);
                        let buf2 = buf_ptr.offset(curr - U64_MAX_LEN as isize) as *mut [MaybeUninit<u8>; U64_MAX_LEN];
                        curr -= rem.write_to(&mut *buf2).len() as isize;

                        if n != 0 {
                            // Memset the leading zeros.
                            let target = buf.len() as isize - 38;
                            ptr::write_bytes(buf_ptr.offset(target), b'0', (curr - target) as usize);
                            curr = target;

                            // There is at most one digit left
                            // because u128::max / 10^19 / 10^19 is 3.
                            curr -= 1;
                            *buf_ptr.offset(curr) = (n as u8) + b'0';
                        }
                    }

                    if !is_nonnegative {
                        curr -= 1;
                        *buf_ptr.offset(curr) = b'-';
                    }

                    let len = buf.len() - curr as usize;
                    slice::from_raw_parts(buf_ptr.offset(curr), len)
                }
            }
        }
    )*};
}
// Longest rendering of a u128: "340282366920938463463374607431768211455".
const U128_MAX_LEN: usize = 39;
// Longest rendering of an i128: "-170141183460469231731687303715884105728".
// This is also the size of the byte array inside `Buffer`.
const I128_MAX_LEN: usize = 40;
impl_Integer128!(I128_MAX_LEN => i128, U128_MAX_LEN => u128);