#[cfg(any(feature = "alloc", feature = "std", test))]
use alloc::string::String;
use core::cmp;
#[cfg(any(feature = "alloc", feature = "std", test))]
use core::str;
use crate::encode::add_padding;
use crate::engine::{Config, Engine};
/// The output mechanism for ChunkedEncoder's encoded bytes.
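///
/// As an illustrative sketch only (`VecSink` here is hypothetical, not part of the crate),
/// a sink that collects the encoded output into a byte vector could look like this:
///
/// ```ignore
/// // Hypothetical sink that appends each encoded chunk to a Vec<u8>.
/// struct VecSink<'a> {
///     bytes: &'a mut Vec<u8>,
/// }
///
/// impl<'a> Sink for VecSink<'a> {
///     type Error = ();
///
///     fn write_encoded_bytes(&mut self, encoded: &[u8]) -> Result<(), Self::Error> {
///         self.bytes.extend_from_slice(encoded);
///         Ok(())
///     }
/// }
/// ```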
pub trait Sink {
type Error;
/// Handle a chunk of encoded base64 data (as UTF-8 bytes).
fn write_encoded_bytes(&mut self, encoded: &[u8]) -> Result<(), Self::Error>;
}
const BUF_SIZE: usize = 1024;
/// A base64 encoder that emits encoded bytes in chunks without heap allocation.
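///
/// A usage sketch (assuming the `STANDARD` alphabet, the `PAD` config, and the `StringSink`
/// defined later in this module; any other `Engine`/`Sink` pair works the same way):
///
/// ```ignore
/// let engine = GeneralPurpose::new(&STANDARD, PAD);
/// let encoder = ChunkedEncoder::new(&engine);
///
/// let mut output = String::new();
/// let mut sink = StringSink::new(&mut output);
/// // encode() walks the input in buffer-sized chunks, calling the sink once per chunk;
/// // afterwards, `output` holds the complete padded base64 of the input.
/// encoder.encode(b"some arbitrary input", &mut sink).unwrap();
/// ```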
pub struct ChunkedEncoder<'e, E: Engine + ?Sized> {
engine: &'e E,
max_input_chunk_len: usize,
}
impl<'e, E: Engine + ?Sized> ChunkedEncoder<'e, E> {
/// Create a new `ChunkedEncoder` that encodes with the given engine.
pub fn new(engine: &'e E) -> ChunkedEncoder<'e, E> {
ChunkedEncoder {
engine,
max_input_chunk_len: max_input_length(BUF_SIZE, engine.config().encode_padding()),
}
}
/// Encode `bytes`, handing the encoded output to `sink` in chunks of at most `BUF_SIZE` bytes.
pub fn encode<S: Sink>(&self, bytes: &[u8], sink: &mut S) -> Result<(), S::Error> {
let mut encode_buf: [u8; BUF_SIZE] = [0; BUF_SIZE];
let mut input_index = 0;
while input_index < bytes.len() {
// either a full-size input chunk, or whatever input remains on the last iteration
let input_chunk_len = cmp::min(self.max_input_chunk_len, bytes.len() - input_index);
let chunk = &bytes[input_index..(input_index + input_chunk_len)];
let mut b64_bytes_written = self.engine.internal_encode(chunk, &mut encode_buf);
input_index += input_chunk_len;
let more_input_left = input_index < bytes.len();
if self.engine.config().encode_padding() && !more_input_left {
// no more input, add padding if needed. Buffer will have room because
// max_input_length leaves room for it.
b64_bytes_written +=
add_padding(b64_bytes_written, &mut encode_buf[b64_bytes_written..]);
}
sink.write_encoded_bytes(&encode_buf[0..b64_bytes_written])?;
}
Ok(())
}
}
/// Calculate the longest input that can be encoded for the given output buffer size.
///
/// If the config requires padding, two bytes of buffer space will be set aside so that the last
/// chunk of input can be encoded safely.
///
/// The input length will always be a multiple of 3 so that no encoding state has to be carried over
/// between chunks.
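///
/// For example, with the `BUF_SIZE` of 1024 used by `encode`: without padding,
/// `1024 / 4 * 3 = 768` input bytes fit per chunk; with padding, two output bytes are
/// reserved first, so `(1024 - 2) / 4 * 3 = 765` (integer division). The
/// `max_input_length_*` tests below exercise exactly these values.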
fn max_input_length(encoded_buf_len: usize, padded: bool) -> usize {
let effective_buf_len = if padded {
// make room for padding
encoded_buf_len
.checked_sub(2)
.expect("Don't use a tiny buffer")
} else {
encoded_buf_len
};
// Padding, if any, was already reserved above, so this is plain base64 expansion:
// 3 input bytes per 4 output bytes, rounded down to whole groups.
(effective_buf_len / 4) * 3
}
// A really simple sink that just appends to a string
#[cfg(any(feature = "alloc", feature = "std", test))]
pub(crate) struct StringSink<'a> {
string: &'a mut String,
}
#[cfg(any(feature = "alloc", feature = "std", test))]
impl<'a> StringSink<'a> {
pub(crate) fn new(s: &mut String) -> StringSink {
StringSink { string: s }
}
}
#[cfg(any(feature = "alloc", feature = "std", test))]
impl<'a> Sink for StringSink<'a> {
type Error = ();
fn write_encoded_bytes(&mut self, s: &[u8]) -> Result<(), Self::Error> {
self.string.push_str(str::from_utf8(s).unwrap());
Ok(())
}
}
#[cfg(test)]
pub mod tests {
use rand::{
distributions::{Distribution, Uniform},
Rng, SeedableRng,
};
use crate::{
alphabet::STANDARD,
engine::general_purpose::{GeneralPurpose, GeneralPurposeConfig, PAD},
tests::random_engine,
};
use super::*;
#[test]
fn chunked_encode_empty() {
assert_eq!("", chunked_encode_str(&[], PAD));
}
#[test]
fn chunked_encode_intermediate_fast_loop() {
// > 8 bytes input, will enter the pretty fast loop
assert_eq!("Zm9vYmFyYmF6cXV4", chunked_encode_str(b"foobarbazqux", PAD));
}
#[test]
fn chunked_encode_fast_loop() {
// > 32 bytes input, will enter the uber fast loop
assert_eq!(
"Zm9vYmFyYmF6cXV4cXV1eGNvcmdlZ3JhdWx0Z2FycGx5eg==",
chunked_encode_str(b"foobarbazquxquuxcorgegraultgarplyz", PAD)
);
}
#[test]
fn chunked_encode_slow_loop_only() {
// < 8 bytes input, slow loop only
assert_eq!("Zm9vYmFy", chunked_encode_str(b"foobar", PAD));
}
#[test]
fn chunked_encode_matches_normal_encode_random_string_sink() {
let helper = StringSinkTestHelper;
chunked_encode_matches_normal_encode_random(&helper);
}
#[test]
fn max_input_length_no_pad() {
assert_eq!(768, max_input_length(1024, false));
}
#[test]
fn max_input_length_with_pad_decrements_one_triple() {
assert_eq!(765, max_input_length(1024, true));
}
#[test]
fn max_input_length_with_pad_one_byte_short() {
assert_eq!(765, max_input_length(1025, true));
}
#[test]
fn max_input_length_with_pad_fits_exactly() {
assert_eq!(768, max_input_length(1026, true));
}
#[test]
fn max_input_length_cant_use_extra_single_encoded_byte() {
assert_eq!(300, max_input_length(401, false));
}
pub fn chunked_encode_matches_normal_encode_random<S: SinkTestHelper>(sink_test_helper: &S) {
let mut input_buf: Vec<u8> = Vec::new();
let mut output_buf = String::new();
let mut rng = rand::rngs::SmallRng::from_entropy();
let input_len_range = Uniform::new(1, 10_000);
for _ in 0..5_000 {
input_buf.clear();
output_buf.clear();
let buf_len = input_len_range.sample(&mut rng);
for _ in 0..buf_len {
input_buf.push(rng.gen());
}
let engine = random_engine(&mut rng);
let chunk_encoded_string = sink_test_helper.encode_to_string(&engine, &input_buf);
engine.encode_string(&input_buf, &mut output_buf);
assert_eq!(output_buf, chunk_encoded_string, "input len={}", buf_len);
}
}
fn chunked_encode_str(bytes: &[u8], config: GeneralPurposeConfig) -> String {
let mut s = String::new();
let mut sink = StringSink::new(&mut s);
let engine = GeneralPurpose::new(&STANDARD, config);
let encoder = ChunkedEncoder::new(&engine);
encoder.encode(bytes, &mut sink).unwrap();
s
}
// An abstraction around sinks so that the same tests can easily be run against any sink implementation
pub trait SinkTestHelper {
fn encode_to_string<E: Engine>(&self, engine: &E, bytes: &[u8]) -> String;
}
struct StringSinkTestHelper;
impl SinkTestHelper for StringSinkTestHelper {
fn encode_to_string<E: Engine>(&self, engine: &E, bytes: &[u8]) -> String {
let encoder = ChunkedEncoder::new(engine);
let mut s = String::new();
let mut sink = StringSink::new(&mut s);
encoder.encode(bytes, &mut sink).unwrap();
s
}
}
}