From 0b9607324e6c3415617e30da2c2617d85fe66422 Mon Sep 17 00:00:00 2001 From: zleyyij <75810274+zleyyij@users.noreply.github.com> Date: Tue, 21 May 2024 01:27:43 -0600 Subject: [PATCH] Add documentation throughout the codebase. (#61) * doc: added documentation throughout the codebase authored-by: zleyyij --- src/blocks/block.rs | 17 +++++ src/blocks/literals_section.rs | 90 ++++++++++++++++-------- src/blocks/mod.rs | 7 ++ src/blocks/sequence_section.rs | 37 +++++++++- src/decoding/bit_reader.rs | 1 + src/decoding/bit_reader_reverse.rs | 12 +++- src/decoding/block_decoder.rs | 5 +- src/decoding/decodebuffer.rs | 42 +++++------ src/decoding/dictionary.rs | 28 +++++++- src/decoding/literals_section_decoder.rs | 8 +++ src/decoding/mod.rs | 3 + src/decoding/ringbuffer.rs | 26 ++++++- src/decoding/scratch.rs | 12 +++- src/decoding/sequence_execution.rs | 12 ++-- src/decoding/sequence_section_decoder.rs | 28 ++++++++ src/frame.rs | 76 +++++++++++++++++++- src/frame_decoder.rs | 6 +- src/fse/fse_decoder.rs | 58 +++++++++++++-- src/fse/mod.rs | 14 ++++ src/huff0/huff0_decoder.rs | 68 +++++++++++++++++- src/huff0/mod.rs | 4 ++ src/io.rs | 1 + src/io_nostd.rs | 2 + src/streaming_decoder.rs | 35 +++++++-- 24 files changed, 509 insertions(+), 83 deletions(-) diff --git a/src/blocks/block.rs b/src/blocks/block.rs index 078eb44e..c8e63b74 100644 --- a/src/blocks/block.rs +++ b/src/blocks/block.rs @@ -1,8 +1,16 @@ +//! Block header definitions. + +/// There are 4 different kinds of blocks, and the type of block influences the meaning of `Block_Size`. #[derive(Debug, Clone, Copy, PartialEq, Eq)] pub enum BlockType { + /// An uncompressed block. Raw, + /// A single byte, repeated `Block_Size` times (Run Length Encoding). RLE, + /// A Zstandard compressed block. `Block_Size` is the length of the compressed data. Compressed, + /// This is not a valid block, and this value should not be used. + /// If this value is present, it should be considered corrupted data. 
Reserved, } @@ -17,9 +25,18 @@ impl core::fmt::Display for BlockType { } } +/// A representation of a single block header. As well as containing a frame header, +/// each Zstandard frame contains one or more blocks. pub struct BlockHeader { + /// Whether this block is the last block in the frame. + /// It may be followed by an optional `Content_Checksum` if it is. pub last_block: bool, pub block_type: BlockType, + /// The size of the decompressed data. If the block type + /// is [BlockType::Reserved] or [BlockType::Compressed], + /// this value is set to zero and should not be referenced. pub decompressed_size: u32, + /// The size of the block. If the block is [BlockType::RLE], + /// this value will be 1. pub content_size: u32, } diff --git a/src/blocks/literals_section.rs b/src/blocks/literals_section.rs index 7e7d4909..10501ecf 100644 --- a/src/blocks/literals_section.rs +++ b/src/blocks/literals_section.rs @@ -1,16 +1,44 @@ +//! Utilities and representations for the first half of a block, the literals section. +//! It contains data that is then copied from by the sequences section. use super::super::decoding::bit_reader::{BitReader, GetBitsError}; +/// A compressed block consists of two sections, a literals section, and a sequences section. +/// This is the first of those two sections. A literal is just any arbitrary data, and it is copied by the sequences section pub struct LiteralsSection { + /// - If this block is of type [LiteralsSectionType::Raw], then the data is `regenerated_bytes` + /// bytes long, and it contains the raw literals data to be used during the second section, + /// the sequences section. + /// - If this block is of type [LiteralsSectionType::RLE], + /// then the literal consists of a single byte repeated `regenerated_size` times. + /// - For types [LiteralsSectionType::Compressed] or [LiteralsSectionType::Treeless], + /// then this is the size of the decompressed data. 
pub regenerated_size: u32, + /// - For types [LiteralsSectionType::Raw] and [LiteralsSectionType::RLE], this value is not present. + /// - For types [LiteralsSectionType::Compressed] and [LiteralsSectionType::Treeless], this value will + /// be set to the size of the compressed data. pub compressed_size: Option, + /// This value will be either 1 stream or 4 streams if the literal is of type + /// [LiteralsSectionType::Compressed] or [LiteralsSectionType::Treeless], and it + /// is not used for RLE or uncompressed literals. pub num_streams: Option, + /// The type of the literal section. pub ls_type: LiteralsSectionType, } +/// The way which a literal section is encoded. pub enum LiteralsSectionType { + /// Literals are stored uncompressed. Raw, + /// Literals consist of a single byte value repeated [LiteralsSection::regenerated_size] times. RLE, + /// This is a standard Huffman-compressed block, starting with a Huffman tree description. + /// In this mode, there are at least *2* different literals represented in the Huffman tree + /// description. Compressed, + /// This is a Huffman-compressed block, + /// using the Huffman tree from the previous [LiteralsSectionType::Compressed] block + /// in the sequence. If this mode is triggered without any previous Huffman-tables in the + /// frame (or dictionary), it should be treated as data corruption. Treeless, } @@ -77,6 +105,7 @@ impl Default for LiteralsSection { } impl LiteralsSection { + /// Create a new [LiteralsSection]. pub fn new() -> LiteralsSection { LiteralsSection { regenerated_size: 0, @@ -86,25 +115,26 @@ impl LiteralsSection { } } + /// Given the first byte of a header, determine the size of the whole header, from 1 to 5 bytes. 
pub fn header_bytes_needed(&self, first_byte: u8) -> Result { - let ls_type = Self::section_type(first_byte)?; + let ls_type: LiteralsSectionType = Self::section_type(first_byte)?; let size_format = (first_byte >> 2) & 0x3; match ls_type { LiteralsSectionType::RLE | LiteralsSectionType::Raw => { match size_format { 0 | 2 => { - //size_format actually only uses one bit - //regenerated_size uses 5 bits + // size_format actually only uses one bit + // regenerated_size uses 5 bits Ok(1) } 1 => { - //size_format uses 2 bit - //regenerated_size uses 12 bits + // size_format uses 2 bit + // regenerated_size uses 12 bits Ok(2) } 3 => { - //size_format uses 2 bit - //regenerated_size uses 20 bits + // size_format uses 2 bit + // regenerated_size uses 20 bits Ok(3) } _ => panic!( @@ -115,16 +145,16 @@ impl LiteralsSection { LiteralsSectionType::Compressed | LiteralsSectionType::Treeless => { match size_format { 0 | 1 => { - //Only differ in num_streams - //both regenerated and compressed sizes use 10 bit + // Only differ in num_streams + // both regenerated and compressed sizes use 10 bit Ok(3) } 2 => { - //both regenerated and compressed sizes use 14 bit + // both regenerated and compressed sizes use 14 bit Ok(4) } 3 => { - //both regenerated and compressed sizes use 18 bit + // both regenerated and compressed sizes use 18 bit Ok(5) } @@ -136,10 +166,11 @@ impl LiteralsSection { } } + /// Parse the header into `self`, and returns the number of bytes read. pub fn parse_from_header(&mut self, raw: &[u8]) -> Result { - let mut br = BitReader::new(raw); - let t = br.get_bits(2)? as u8; - self.ls_type = Self::section_type(t)?; + let mut br: BitReader<'_> = BitReader::new(raw); + let block_type = br.get_bits(2)? as u8; + self.ls_type = Self::section_type(block_type)?; let size_format = br.get_bits(2)? 
as u8; let byte_needed = self.header_bytes_needed(raw[0])?; @@ -155,20 +186,20 @@ impl LiteralsSection { self.compressed_size = None; match size_format { 0 | 2 => { - //size_format actually only uses one bit - //regenerated_size uses 5 bits + // size_format actually only uses one bit + // regenerated_size uses 5 bits self.regenerated_size = u32::from(raw[0]) >> 3; Ok(1) } 1 => { - //size_format uses 2 bit - //regenerated_size uses 12 bits + // size_format uses 2 bit + // regenerated_size uses 12 bits self.regenerated_size = (u32::from(raw[0]) >> 4) + (u32::from(raw[1]) << 4); Ok(2) } 3 => { - //size_format uses 2 bit - //regenerated_size uses 20 bits + // size_format uses 2 bit + // regenerated_size uses 20 bits self.regenerated_size = (u32::from(raw[0]) >> 4) + (u32::from(raw[1]) << 4) + (u32::from(raw[2]) << 12); @@ -194,10 +225,10 @@ impl LiteralsSection { match size_format { 0 | 1 => { - //Differ in num_streams see above - //both regenerated and compressed sizes use 10 bit + // Differ in num_streams see above + // both regenerated and compressed sizes use 10 bit - //4 from the first, six from the second byte + // 4 from the first, six from the second byte self.regenerated_size = (u32::from(raw[0]) >> 4) + ((u32::from(raw[1]) & 0x3f) << 4); @@ -207,27 +238,27 @@ impl LiteralsSection { Ok(3) } 2 => { - //both regenerated and compressed sizes use 14 bit + // both regenerated and compressed sizes use 14 bit - //4 from first, full second, 2 from the third byte + // 4 from first, full second, 2 from the third byte self.regenerated_size = (u32::from(raw[0]) >> 4) + (u32::from(raw[1]) << 4) + ((u32::from(raw[2]) & 0x3) << 12); - //6 from the third, full last byte + // 6 from the third, full last byte self.compressed_size = Some((u32::from(raw[2]) >> 2) + (u32::from(raw[3]) << 6)); Ok(4) } 3 => { - //both regenerated and compressed sizes use 18 bit + // both regenerated and compressed sizes use 18 bit - //4 from first, full second, six from third byte + // 4 from first, 
full second, six from third byte self.regenerated_size = (u32::from(raw[0]) >> 4) + (u32::from(raw[1]) << 4) + ((u32::from(raw[2]) & 0x3F) << 12); - //2 from third, full fourth, full fifth byte + // 2 from third, full fourth, full fifth byte self.compressed_size = Some( (u32::from(raw[2]) >> 6) + (u32::from(raw[3]) << 2) @@ -244,6 +275,7 @@ impl LiteralsSection { } } + /// Given the first two bits of a header, determine the type of a header. fn section_type(raw: u8) -> Result { let t = raw & 0x3; match t { diff --git a/src/blocks/mod.rs b/src/blocks/mod.rs index d12a1866..c4787b87 100644 --- a/src/blocks/mod.rs +++ b/src/blocks/mod.rs @@ -1,3 +1,10 @@ +//! In a Zstandard frame, there's a frame header, followed by one or more *blocks*. +//! +//! A block contains data, and a header describing how that data is encoded, as well +//! as other misc metadata. +//! +//! + pub mod block; pub mod literals_section; pub mod sequence_section; diff --git a/src/blocks/sequence_section.rs b/src/blocks/sequence_section.rs index bc28425e..653ecf7c 100644 --- a/src/blocks/sequence_section.rs +++ b/src/blocks/sequence_section.rs @@ -1,12 +1,32 @@ +//! Utilities and representations for the second half of a block, the sequence section. +//! This section copies literals from the literals section into the decompressed output. + pub struct SequencesHeader { pub num_sequences: u32, pub modes: Option, } +/// A sequence represents potentially redundant data, and it can be broken up into 2 steps: +/// - A copy step, where data is copied from the literals section to the decompressed output +/// - A *match* copy step that copies data from within the previously decompressed output. +/// +/// #[derive(Clone, Copy)] pub struct Sequence { + /// Literal length, or the number of bytes to be copied from the literals section + /// in the copy step. pub ll: u32, + /// The length of the match to make during the match copy step. 
pub ml: u32, + /// How far back to go in the decompressed data to read from the match copy step. + /// If this value is greater than 3, then the offset is `of -3`. If `of` is from 1-3, + /// then it has special handling: + /// + /// The first 3 values define 3 different repeated offsets, with 1 referring to the most + /// recent, 2 the second recent, and so on. When the current sequence has a literal length of 0, + /// then the repeated offsets are shifted by 1. So an offset value of 1 refers to 2, 2 refers to 3, + /// and 3 refers to the most recent offset minus one. If that value is equal to zero, the data + /// is considered corrupted. pub of: u32, } @@ -16,16 +36,27 @@ impl core::fmt::Display for Sequence { } } +/// This byte defines the compression mode of each symbol type #[derive(Copy, Clone)] pub struct CompressionModes(u8); +/// The compression mode used for symbol compression pub enum ModeType { + /// A predefined FSE distribution table is used, and no distribution table + /// will be present. Predefined, + /// The table consists of a single byte, which contains the symbol's value. RLE, + /// Standard FSE compression, a distribution table will be present. This + /// mode should not be used when only one symbol is present. FSECompressed, + /// The table used in the previous compressed block with at least one sequence + /// will be used again. If this is the first block, the table in the dictionary will + /// be used. Repeat, } impl CompressionModes { + /// Deserialize a two bit mode value into a [ModeType] pub fn decode_mode(m: u8) -> ModeType { match m { 0 => ModeType::Predefined, @@ -35,15 +66,17 @@ impl CompressionModes { _ => panic!("This can never happen"), } } - + /// Read the compression mode of the literal lengths field. pub fn ll_mode(self) -> ModeType { Self::decode_mode(self.0 >> 6) } + /// Read the compression mode of the offset value field. 
pub fn of_mode(self) -> ModeType { Self::decode_mode((self.0 >> 4) & 0x3) } + /// Read the compression mode of the match lengths field. pub fn ml_mode(self) -> ModeType { Self::decode_mode((self.0 >> 2) & 0x3) } @@ -79,6 +112,7 @@ impl core::fmt::Display for SequencesHeaderParseError { } impl SequencesHeader { + /// Create a new [SequencesHeader]. pub fn new() -> SequencesHeader { SequencesHeader { num_sequences: 0, @@ -86,6 +120,7 @@ impl SequencesHeader { } } + /// Attempt to deserialize the provided buffer into `self`, returning the number of bytes read. pub fn parse_from_header(&mut self, source: &[u8]) -> Result { let mut bytes_read = 0; if source.is_empty() { diff --git a/src/decoding/bit_reader.rs b/src/decoding/bit_reader.rs index 26228aa6..85058211 100644 --- a/src/decoding/bit_reader.rs +++ b/src/decoding/bit_reader.rs @@ -1,3 +1,4 @@ +/// Interact with a provided source at a bit level. pub struct BitReader<'s> { idx: usize, //index counts bits already read source: &'s [u8], diff --git a/src/decoding/bit_reader_reverse.rs b/src/decoding/bit_reader_reverse.rs index 5bc5a2a7..cc0e0915 100644 --- a/src/decoding/bit_reader_reverse.rs +++ b/src/decoding/bit_reader_reverse.rs @@ -2,15 +2,21 @@ pub use super::bit_reader::GetBitsError; use byteorder::ByteOrder; use byteorder::LittleEndian; +/// Zstandard encodes some types of data in a way that the data must be read +/// back to front to decode it properly. `BitReaderReversed` provides a +/// convenient interface to do that. pub struct BitReaderReversed<'s> { idx: isize, //index counts bits already read source: &'s [u8], - + /// The reader doesn't read directly from the source, + /// it reads bits from here, and the container is + /// "refilled" as it's emptied. bit_container: u64, bits_in_container: u8, } impl<'s> BitReaderReversed<'s> { + /// How many bits are left to read by the reader. 
pub fn bits_remaining(&self) -> isize { self.idx + self.bits_in_container as isize } @@ -102,6 +108,8 @@ impl<'s> BitReaderReversed<'s> { (self.idx - 1) / 8 } + /// Read `n` number of bits from the source. Returns an error if the reader + /// requests more bits than remain for reading. #[inline(always)] pub fn get_bits(&mut self, n: u8) -> Result { if n == 0 { @@ -162,7 +170,7 @@ impl<'s> BitReaderReversed<'s> { return Ok((0, 0, 0)); } if sum > 56 { - // try and get the values separatly + // try and get the values separately return Ok((self.get_bits(n1)?, self.get_bits(n2)?, self.get_bits(n3)?)); } let sum = sum as u8; diff --git a/src/decoding/block_decoder.rs b/src/decoding/block_decoder.rs index 9d48b21e..2d421fda 100644 --- a/src/decoding/block_decoder.rs +++ b/src/decoding/block_decoder.rs @@ -264,6 +264,7 @@ impl From for DecodeBlockContentError { } } +/// Create a new [BlockDecoder]. pub fn new() -> BlockDecoder { BlockDecoder { internal_state: DecoderState::ReadyToDecodeNextHeader, @@ -474,14 +475,14 @@ impl BlockDecoder { let decompressed_size = match btype { BlockType::Raw => block_size, BlockType::RLE => block_size, - BlockType::Reserved => 0, //should be catched above, this is an error state + BlockType::Reserved => 0, //should be caught above, this is an error state BlockType::Compressed => 0, //unknown but will be smaller than 128kb (or window_size if that is smaller than 128kb) }; let content_size = match btype { BlockType::Raw => block_size, BlockType::Compressed => block_size, BlockType::RLE => 1, - BlockType::Reserved => 0, //should be catched above, this is an error state + BlockType::Reserved => 0, //should be caught above, this is an error state }; let last_block = self.is_last(); diff --git a/src/decoding/decodebuffer.rs b/src/decoding/decodebuffer.rs index 6e98d150..04a43e8b 100644 --- a/src/decoding/decodebuffer.rs +++ b/src/decoding/decodebuffer.rs @@ -5,7 +5,7 @@ use core::hash::Hasher; use super::ringbuffer::RingBuffer; -pub struct 
Decodebuffer { +pub struct DecodeBuffer { buffer: RingBuffer, pub dict_content: Vec, @@ -17,32 +17,32 @@ pub struct Decodebuffer { #[derive(Debug)] #[non_exhaustive] -pub enum DecodebufferError { +pub enum DecodeBufferError { NotEnoughBytesInDictionary { got: usize, need: usize }, OffsetTooBig { offset: usize, buf_len: usize }, } #[cfg(feature = "std")] -impl std::error::Error for DecodebufferError {} +impl std::error::Error for DecodeBufferError {} -impl core::fmt::Display for DecodebufferError { +impl core::fmt::Display for DecodeBufferError { fn fmt(&self, f: &mut core::fmt::Formatter<'_>) -> core::fmt::Result { match self { - DecodebufferError::NotEnoughBytesInDictionary { got, need } => { + DecodeBufferError::NotEnoughBytesInDictionary { got, need } => { write!( f, "Need {} bytes from the dictionary but it is only {} bytes long", need, got, ) } - DecodebufferError::OffsetTooBig { offset, buf_len } => { + DecodeBufferError::OffsetTooBig { offset, buf_len } => { write!(f, "offset: {} bigger than buffer: {}", offset, buf_len,) } } } } -impl Read for Decodebuffer { +impl Read for DecodeBuffer { fn read(&mut self, target: &mut [u8]) -> Result { let max_amount = self.can_drain_to_window_size().unwrap_or(0); let amount = max_amount.min(target.len()); @@ -57,9 +57,9 @@ impl Read for Decodebuffer { } } -impl Decodebuffer { - pub fn new(window_size: usize) -> Decodebuffer { - Decodebuffer { +impl DecodeBuffer { + pub fn new(window_size: usize) -> DecodeBuffer { + DecodeBuffer { buffer: RingBuffer::new(), dict_content: Vec::new(), window_size, @@ -94,7 +94,7 @@ impl Decodebuffer { self.total_output_counter += data.len() as u64; } - pub fn repeat(&mut self, offset: usize, match_length: usize) -> Result<(), DecodebufferError> { + pub fn repeat(&mut self, offset: usize, match_length: usize) -> Result<(), DecodeBufferError> { if offset > self.buffer.len() { self.repeat_from_dict(offset, match_length) } else { @@ -163,13 +163,13 @@ impl Decodebuffer { &mut self, offset: 
usize, match_length: usize, - ) -> Result<(), DecodebufferError> { + ) -> Result<(), DecodeBufferError> { if self.total_output_counter <= self.window_size as u64 { // at least part of that repeat is from the dictionary content let bytes_from_dict = offset - self.buffer.len(); if bytes_from_dict > self.dict_content.len() { - return Err(DecodebufferError::NotEnoughBytesInDictionary { + return Err(DecodeBufferError::NotEnoughBytesInDictionary { got: self.dict_content.len(), need: bytes_from_dict, }); @@ -189,14 +189,14 @@ impl Decodebuffer { } Ok(()) } else { - Err(DecodebufferError::OffsetTooBig { + Err(DecodeBufferError::OffsetTooBig { offset, buf_len: self.buffer.len(), }) } } - // Check if and how many bytes can currently be drawn from the buffer + /// Check if and how many bytes can currently be drawn from the buffer pub fn can_drain_to_window_size(&self) -> Option { if self.buffer.len() > self.window_size { Some(self.buffer.len() - self.window_size) @@ -210,8 +210,8 @@ impl Decodebuffer { self.buffer.len() } - //drain as much as possible while retaining enough so that decoding si still possible with the required window_size - //At best call only if can_drain_to_window_size reports a 'high' number of bytes to reduce allocations + /// Drain as much as possible while retaining enough so that decoding si still possible with the required window_size + /// At best call only if can_drain_to_window_size reports a 'high' number of bytes to reduce allocations pub fn drain_to_window_size(&mut self) -> Option> { //TODO investigate if it is possible to return the std::vec::Drain iterator directly without collecting here match self.can_drain_to_window_size() { @@ -238,7 +238,7 @@ impl Decodebuffer { } } - //drain the buffer completely + /// drain the buffer completely pub fn drain(&mut self) -> Vec { let (slice1, slice2) = self.buffer.as_slices(); #[cfg(feature = "hash")] @@ -350,7 +350,7 @@ fn write_all_bytes(mut sink: impl Write, buf: &[u8]) -> (usize, Result<(), Error 
#[cfg(test)] mod tests { - use super::Decodebuffer; + use super::DecodeBuffer; use crate::io::{Error, ErrorKind, Write}; extern crate std; @@ -385,7 +385,7 @@ mod tests { write_len: 10, }; - let mut decode_buf = Decodebuffer::new(100); + let mut decode_buf = DecodeBuffer::new(100); decode_buf.push(b"0123456789"); decode_buf.repeat(10, 90).unwrap(); let repeats = 1000; @@ -435,7 +435,7 @@ mod tests { block_every: 5, }; - let mut decode_buf = Decodebuffer::new(100); + let mut decode_buf = DecodeBuffer::new(100); decode_buf.push(b"0123456789"); decode_buf.repeat(10, 90).unwrap(); let repeats = 1000; diff --git a/src/decoding/dictionary.rs b/src/decoding/dictionary.rs index 35c05ffc..2d930c61 100644 --- a/src/decoding/dictionary.rs +++ b/src/decoding/dictionary.rs @@ -6,11 +6,34 @@ use crate::decoding::scratch::HuffmanScratch; use crate::fse::FSETableError; use crate::huff0::HuffmanTableError; +/// Zstandard includes support for "raw content" dictionaries, that store bytes optionally used +/// during sequence execution. +/// +/// pub struct Dictionary { + /// A 4 byte value used by decoders to check if they can use + /// the correct dictionary. This value must not be zero. pub id: u32, + /// A dictionary can contain an entropy table, either FSE or + /// Huffman. pub fse: FSEScratch, + /// A dictionary can contain an entropy table, either FSE or + /// Huffman. pub huf: HuffmanScratch, + /// The content of a dictionary acts as a "past" in front of data + /// to compress or decompress, + /// so it can be referenced in sequence commands. + /// As long as the amount of data decoded from this frame is less than or + /// equal to Window_Size, sequence commands may specify offsets longer than + /// the total length of decoded output so far to reference back to the + /// dictionary, even parts of the dictionary with offsets larger than Window_Size. 
+ /// After the total output has surpassed Window_Size however, + /// this is no longer allowed and the dictionary is no longer accessible pub dict_content: Vec, + /// The 3 most recent offsets are stored so that they can be used + /// during sequence execution, see + /// + /// for more. pub offset_hist: [u32; 3], } @@ -61,11 +84,12 @@ impl From for DictionaryDecodeError { } } +/// This 4 byte (little endian) magic number refers to the start of a dictionary pub const MAGIC_NUM: [u8; 4] = [0x37, 0xA4, 0x30, 0xEC]; impl Dictionary { - /// parses the dictionary and set the tables - /// it returns the dict_id for checking with the frame's dict_id + /// Parses the dictionary from `raw` and set the tables + /// it returns the dict_id for checking with the frame's `dict_id`` pub fn decode_dict(raw: &[u8]) -> Result { let mut new_dict = Dictionary { id: 0, diff --git a/src/decoding/literals_section_decoder.rs b/src/decoding/literals_section_decoder.rs index dbb81ae3..6948b6a7 100644 --- a/src/decoding/literals_section_decoder.rs +++ b/src/decoding/literals_section_decoder.rs @@ -1,3 +1,6 @@ +//! This module contains the [decompress_literals] function, used to take a +//! parsed literals header and a source and decompress it. + use super::super::blocks::literals_section::{LiteralsSection, LiteralsSectionType}; use super::bit_reader_reverse::{BitReaderReversed, GetBitsError}; use super::scratch::HuffmanScratch; @@ -105,6 +108,7 @@ impl From for DecompressLiteralsError { } } +/// Decode and decompress the provided literals section into `target`, returning the number of bytes read. pub fn decode_literals( section: &LiteralsSection, scratch: &mut HuffmanScratch, @@ -129,6 +133,10 @@ pub fn decode_literals( } } +/// Decompress the provided literals section and source into the provided `target`. +/// This function is used when the literals section is `Compressed` or `Treeless` +/// +/// Returns the number of bytes read. 
fn decompress_literals( section: &LiteralsSection, scratch: &mut HuffmanScratch, diff --git a/src/decoding/mod.rs b/src/decoding/mod.rs index b89df351..a9f9b7ae 100644 --- a/src/decoding/mod.rs +++ b/src/decoding/mod.rs @@ -1,3 +1,6 @@ +//! Structures and utilities used for reading from data, decoding that data +//! and storing the output. + pub mod bit_reader; pub mod bit_reader_reverse; pub mod block_decoder; diff --git a/src/decoding/ringbuffer.rs b/src/decoding/ringbuffer.rs index 8303edf5..e364d902 100644 --- a/src/decoding/ringbuffer.rs +++ b/src/decoding/ringbuffer.rs @@ -37,16 +37,19 @@ impl RingBuffer { } } + /// Return the number of bytes in the buffer. pub fn len(&self) -> usize { let (x, y) = self.data_slice_lengths(); x + y } + /// Return the amount of available space (in bytes) of the buffer. pub fn free(&self) -> usize { let (x, y) = self.free_slice_lengths(); (x + y).saturating_sub(1) } + /// Empty the buffer and reset the head and tail. pub fn clear(&mut self) { // SAFETY: Upholds invariant 2, trivially // SAFETY: Upholds invariant 3; 0 is always valid @@ -54,10 +57,12 @@ impl RingBuffer { self.tail = 0; } + /// Whether the buffer is empty pub fn is_empty(&self) -> bool { self.head == self.tail } + /// Ensure that there's space for `amount` elements in the buffer. pub fn reserve(&mut self, amount: usize) { let free = self.free(); if free >= amount { @@ -131,6 +136,8 @@ impl RingBuffer { self.tail = (self.tail + 1) % self.cap; } + /// Fetch the byte stored at the selected index from the buffer, returning it, or + /// `None` if the index is out of bounds. #[allow(dead_code)] pub fn get(&self, idx: usize) -> Option { if idx < self.len() { @@ -142,7 +149,7 @@ impl RingBuffer { None } } - + /// Append the provided data to the end of `self`. 
pub fn extend(&mut self, data: &[u8]) { let len = data.len(); let ptr = data.as_ptr(); @@ -178,6 +185,8 @@ impl RingBuffer { self.tail = (self.tail + len) % self.cap; } + /// Advance head past `amount` elements, effectively removing + /// them from the buffer. pub fn drop_first_n(&mut self, amount: usize) { debug_assert!(amount <= self.len()); let amount = usize::min(amount, self.len()); @@ -186,6 +195,8 @@ impl RingBuffer { self.head = (self.head + amount) % self.cap; } + /// Return the size of the two contiguous occupied sections of memory used + /// by the buffer. // SAFETY: other code relies on this pointing to initialized halves of the buffer only fn data_slice_lengths(&self) -> (usize, usize) { let len_after_head; @@ -203,6 +214,7 @@ impl RingBuffer { } // SAFETY: other code relies on this pointing to initialized halves of the buffer only + /// Return pointers to the head and tail, and the length of each section. fn data_slice_parts(&self) -> ((*const u8, usize), (*const u8, usize)) { let (len_after_head, len_to_tail) = self.data_slice_lengths(); @@ -211,6 +223,8 @@ impl RingBuffer { (self.buf.as_ptr(), len_to_tail), ) } + + /// Return references to each part of the ring buffer. pub fn as_slices(&self) -> (&[u8], &[u8]) { let (s1, s2) = self.data_slice_parts(); unsafe { @@ -223,6 +237,7 @@ impl RingBuffer { // SAFETY: other code relies on this producing the lengths of free zones // at the beginning/end of the buffer. Everything else must be initialized + /// Returns the size of the two unoccupied sections of memory used by the buffer. fn free_slice_lengths(&self) -> (usize, usize) { let len_to_head; let len_after_tail; @@ -238,6 +253,8 @@ impl RingBuffer { (len_to_head, len_after_tail) } + /// Returns mutable references to the available space and the size of that available space, + /// for the two sections in the buffer. 
// SAFETY: Other code relies on this pointing to the free zones, data after the first and before the second must // be valid fn free_slice_parts(&self) -> ((*mut u8, usize), (*mut u8, usize)) { @@ -249,6 +266,7 @@ impl RingBuffer { ) } + /// Copies elements from the provided range to the end of the buffer. #[allow(dead_code)] pub fn extend_from_within(&mut self, start: usize, len: usize) { if start + len > self.len() { @@ -268,6 +286,9 @@ impl RingBuffer { unsafe { self.extend_from_within_unchecked(start, len) } } + /// Copies data from the provided range to the end of the buffer, without + /// first verifying that the unoccupied capacity is available. + /// /// SAFETY: /// For this to be safe two requirements need to hold: /// 1. start + len <= self.len() so we do not copy uninitialised memory @@ -326,6 +347,9 @@ impl RingBuffer { } #[allow(dead_code)] + /// This function is functionally the same as [RingBuffer::extend_from_within_unchecked], + /// but it does not contain any branching operations. + /// /// SAFETY: /// Needs start + len <= self.len() /// And more then len reserved space diff --git a/src/decoding/scratch.rs b/src/decoding/scratch.rs index 35d5c61e..37a27a36 100644 --- a/src/decoding/scratch.rs +++ b/src/decoding/scratch.rs @@ -1,14 +1,20 @@ +//! Structures that wrap around various decoders to make decoding easier. + use super::super::blocks::sequence_section::Sequence; -use super::decodebuffer::Decodebuffer; +use super::decodebuffer::DecodeBuffer; use crate::decoding::dictionary::Dictionary; use crate::fse::FSETable; use crate::huff0::HuffmanTable; use alloc::vec::Vec; +/// A block level decoding buffer. pub struct DecoderScratch { + /// The decoder used for Huffman blocks. pub huf: HuffmanScratch, + /// The decoder used for FSE blocks. 
pub fse: FSEScratch, - pub buffer: Decodebuffer, + + pub buffer: DecodeBuffer, pub offset_hist: [u32; 3], pub literals_buffer: Vec, @@ -30,7 +36,7 @@ impl DecoderScratch { match_lengths: FSETable::new(), ml_rle: None, }, - buffer: Decodebuffer::new(window_size), + buffer: DecodeBuffer::new(window_size), offset_hist: [1, 4, 8], block_content_buffer: Vec::new(), diff --git a/src/decoding/sequence_execution.rs b/src/decoding/sequence_execution.rs index 2e731216..1a212284 100644 --- a/src/decoding/sequence_execution.rs +++ b/src/decoding/sequence_execution.rs @@ -1,9 +1,9 @@ -use super::{decodebuffer::DecodebufferError, scratch::DecoderScratch}; +use super::{decodebuffer::DecodeBufferError, scratch::DecoderScratch}; #[derive(Debug)] #[non_exhaustive] pub enum ExecuteSequencesError { - DecodebufferError(DecodebufferError), + DecodebufferError(DecodeBufferError), NotEnoughBytesForSequence { wanted: usize, have: usize }, ZeroOffset, } @@ -38,12 +38,13 @@ impl std::error::Error for ExecuteSequencesError { } } -impl From for ExecuteSequencesError { - fn from(val: DecodebufferError) -> Self { +impl From for ExecuteSequencesError { + fn from(val: DecodeBufferError) -> Self { Self::DecodebufferError(val) } } +/// Take the provided decoder and execute the sequences stored within pub fn execute_sequences(scratch: &mut DecoderScratch) -> Result<(), ExecuteSequencesError> { let mut literals_copy_counter = 0; let old_buffer_size = scratch.buffer.len(); @@ -95,6 +96,9 @@ pub fn execute_sequences(scratch: &mut DecoderScratch) -> Result<(), ExecuteSequ Ok(()) } +/// Update the most recently used offsets to reflect the provided offset value, and return the +/// "actual" offset needed because offsets are not stored in a raw way, some transformations are needed +/// before you get a functional number. 
fn do_offset_history(offset_value: u32, lit_len: u32, scratch: &mut [u32; 3]) -> u32 { let actual_offset = if lit_len > 0 { match offset_value { diff --git a/src/decoding/sequence_section_decoder.rs b/src/decoding/sequence_section_decoder.rs index e2b4fd39..08252c33 100644 --- a/src/decoding/sequence_section_decoder.rs +++ b/src/decoding/sequence_section_decoder.rs @@ -98,6 +98,7 @@ impl From for DecodeSequenceError { } } +/// Decode the provided source as a series of sequences into the supplied `target`. pub fn decode_sequences( section: &SequencesHeader, source: &[u8], @@ -307,6 +308,10 @@ fn decode_sequences_without_rle( } } +/// Look up the provided state value from a literal length table predefined +/// by the Zstandard reference document. Returns a tuple of (value, number of bits). +/// +/// fn lookup_ll_code(code: u8) -> (u32, u8) { match code { 0..=15 => (u32::from(code), 0), @@ -334,6 +339,10 @@ fn lookup_ll_code(code: u8) -> (u32, u8) { } } +/// Look up the provided state value from a match length table predefined +/// by the Zstandard reference document. Returns a tuple of (value, number of bits). +/// +/// fn lookup_ml_code(code: u8) -> (u32, u8) { match code { 0..=31 => (u32::from(code) + 3, 0), @@ -362,8 +371,12 @@ fn lookup_ml_code(code: u8) -> (u32, u8) { } } +// This info is buried in the symbol compression mode table +/// "The maximum allowed accuracy log for literals length and match length tables is 9" pub const LL_MAX_LOG: u8 = 9; +/// "The maximum allowed accuracy log for literals length and match length tables is 9" pub const ML_MAX_LOG: u8 = 9; +/// "The maximum accuracy log for the offset table is 8." pub const OF_MAX_LOG: u8 = 8; fn maybe_update_fse_tables( @@ -475,19 +488,34 @@ fn maybe_update_fse_tables( Ok(bytes_read) } +// The default Literal Length decoding table uses an accuracy logarithm of 6 bits. 
 const LL_DEFAULT_ACC_LOG: u8 = 6;
+/// If [ModeType::Predefined] is selected for a symbol type, its FSE decoding
+/// table is generated using a predefined distribution table.
+///
+/// https://github.com/facebook/zstd/blob/dev/doc/zstd_compression_format.md#literals-length
 const LITERALS_LENGTH_DEFAULT_DISTRIBUTION: [i32; 36] = [
     4, 3, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 1, 1, 1, 2, 2, 2, 2, 2, 2, 2, 2, 2, 3, 2, 1, 1, 1, 1, 1,
     -1, -1, -1, -1,
 ];
 
+// The default Match Length decoding table uses an accuracy logarithm of 6 bits.
 const ML_DEFAULT_ACC_LOG: u8 = 6;
+/// If [ModeType::Predefined] is selected for a symbol type, its FSE decoding
+/// table is generated using a predefined distribution table.
+///
+/// https://github.com/facebook/zstd/blob/dev/doc/zstd_compression_format.md#match-length
 const MATCH_LENGTH_DEFAULT_DISTRIBUTION: [i32; 53] = [
     1, 4, 3, 2, 2, 2, 2, 2, 2, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1,
     1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, -1, -1, -1, -1, -1, -1, -1,
 ];
 
+// The default Offset decoding table uses an accuracy logarithm of 5 bits.
 const OF_DEFAULT_ACC_LOG: u8 = 5;
+/// If [ModeType::Predefined] is selected for a symbol type, its FSE decoding
+/// table is generated using a predefined distribution table.
+///
+/// https://github.com/facebook/zstd/blob/dev/doc/zstd_compression_format.md#offset-codes
 const OFFSET_DEFAULT_DISTRIBUTION: [i32; 29] = [
     1, 1, 1, 1, 1, 1, 2, 2, 2, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, -1, -1, -1, -1, -1,
 ];
diff --git a/src/frame.rs b/src/frame.rs
index 5870e1bc..b7a23498 100644
--- a/src/frame.rs
+++ b/src/frame.rs
@@ -3,21 +3,54 @@ use core::fmt;
 #[cfg(feature = "std")]
 use std::error::Error as StdError;
 
+/// This magic number is included at the start of a single Zstandard frame
 pub const MAGIC_NUM: u32 = 0xFD2F_B528;
+/// The minimum window size is defined as 1 KB
 pub const MIN_WINDOW_SIZE: u64 = 1024;
+/// The maximum window size is 3.75TB
 pub const MAX_WINDOW_SIZE: u64 = (1 << 41) + 7 * (1 << 38);
 
+/// Zstandard compressed data is made of one or more [Frame]s. Each frame is independent and can be
+/// decompressed independently of other frames.
+///
+/// There are two frame formats defined by Zstandard: Zstandard frames and Skippable frames.
+/// Zstandard frames contain compressed data, while skippable frames contain custom user metadata.
+///
+/// This structure contains the header of the frame.
+///
+///
 pub struct Frame {
     pub header: FrameHeader,
 }
 
+/// A frame header has a variable size, with a minimum of 2 bytes, and a maximum of 14 bytes.
 pub struct FrameHeader {
     pub descriptor: FrameDescriptor,
+    /// The `Window_Descriptor` field contains the minimum size of a memory buffer needed to
+    /// decompress the entire frame.
+    ///
+    /// This byte is not included in the frame header when the `Single_Segment_flag` is set.
+    ///
+    /// Bits 7-3 refer to the `Exponent`, where bits 2-0 refer to the `Mantissa`.
+    ///
+    /// To determine the size of a window, the following formula can be used:
+    /// ```text
+    /// windowLog = 10 + Exponent;
+    /// windowBase = 1 << windowLog;
+    /// windowAdd = (windowBase / 8) * Mantissa;
+    /// Window_Size = windowBase + windowAdd;
+    /// ```
+    ///
     window_descriptor: u8,
+    /// The `Dictionary_ID` field contains the ID of the dictionary to be used to decode the frame.
+    /// When this value is not present, it's up to the decoder to know which dictionary to use.
     dict_id: Option<u32>,
+    /// The size of the original/uncompressed content.
    frame_content_size: u64,
 }
 
+/// The first byte is called the `Frame Header Descriptor`, and it describes what other fields
+/// are present.
 pub struct FrameDescriptor(u8);
 
 #[derive(Debug)]
@@ -42,27 +75,61 @@ impl fmt::Display for FrameDescriptorError {
 impl StdError for FrameDescriptorError {}
 
 impl FrameDescriptor {
+    /// Read the `Frame_Content_Size_flag` from the frame header descriptor.
+    ///
+    /// This is a 2 bit flag, specifying if the `Frame_Content_Size` field is present
+    /// within the header. It notates the number of bytes used by `Frame_Content_Size`.
+    ///
+    /// When this value is 0, `FCS_Field_Size` depends on Single_Segment_flag.
+    /// If the `Single_Segment_flag` field is set in the frame header descriptor,
+    /// the size of the `Frame_Content_Size` field of the header is 1 byte.
+    /// Otherwise, `FCS_Field_Size` is 0, and the `Frame_Content_Size` is not provided.
+    ///
+    /// | Flag Value (decimal) | Size of the `Frame_Content_Size` field in bytes |
+    /// | -- | -- |
+    /// | 0 | 0 or 1 (see above) |
+    /// | 1 | 2 |
+    /// | 2 | 4 |
+    /// | 3 | 8 |
     pub fn frame_content_size_flag(&self) -> u8 {
         self.0 >> 6
     }
 
+    /// This bit is reserved for some future feature, a compliant decoder **must ensure**
+    /// that this value is set to zero.
     pub fn reserved_flag(&self) -> bool {
         ((self.0 >> 3) & 0x1) == 1
     }
 
+    /// If this flag is set, data must be regenerated within a single continuous memory segment.
+ /// + /// In this case, the `Window_Descriptor` byte is skipped, but `Frame_Content_Size` is present. + /// The decoder must allocate a memory segment equal to or larger than `Frame_Content_Size`. pub fn single_segment_flag(&self) -> bool { ((self.0 >> 5) & 0x1) == 1 } + /// If this flag is set, a 32 bit `Content_Checksum` will be present at the end of the frame. pub fn content_checksum_flag(&self) -> bool { ((self.0 >> 2) & 0x1) == 1 } + /// This is a two bit flag telling if a dictionary ID is provided within the header. It also + /// specifies the size of this field + /// + /// | Value (Decimal) | `DID_Field_Size` (bytes) | + /// | -- | -- | + /// | 0 | 0 | + /// | 1 | 1 | + /// | 2 | 2 | + /// | 3 | 4 | pub fn dict_id_flag(&self) -> u8 { self.0 & 0x3 } - // Deriving info from the flags + /// Read the size of the `Frame_Content_size` field from the frame header descriptor, returning + /// the size in bytes. + /// If this value is zero, then the `Frame_Content_Size` field is not present within the header. pub fn frame_content_size_bytes(&self) -> Result { match self.frame_content_size_flag() { 0 => { @@ -79,6 +146,9 @@ impl FrameDescriptor { } } + /// Read the size of the `Dictionary_ID` field from the frame header descriptor, returning the size in bytes. + /// If this value is zero, then the dictionary id is not present within the header, + /// and "It's up to the decoder to know which dictionary to use." pub fn dictionary_id_bytes(&self) -> Result { match self.dict_id_flag() { 0 => Ok(0), @@ -153,6 +223,7 @@ impl From for FrameHeaderError { } impl FrameHeader { + /// Read the size of the window from the header, returning the size in bytes. pub fn window_size(&self) -> Result { if self.descriptor.single_segment_flag() { Ok(self.frame_content_size()) @@ -178,10 +249,12 @@ impl FrameHeader { } } + /// The ID (if provided) of the dictionary required to decode this frame. 
pub fn dictionary_id(&self) -> Option { self.dict_id } + /// Obtain the uncompressed size (in bytes) of the frame contents. pub fn frame_content_size(&self) -> u64 { self.frame_content_size } @@ -249,6 +322,7 @@ impl From for ReadFrameHeaderError { } } +/// Read a single serialized frame from the reader and return a tuple containing the parsed frame and the number of bytes read. pub fn read_frame_header(mut r: impl Read) -> Result<(Frame, u8), ReadFrameHeaderError> { use ReadFrameHeaderError as err; let mut buf = [0u8; 4]; diff --git a/src/frame_decoder.rs b/src/frame_decoder.rs index a0be962e..610ced4e 100644 --- a/src/frame_decoder.rs +++ b/src/frame_decoder.rs @@ -1,3 +1,7 @@ +//! Zstandard compressed data is made of one or more [Frame]s. Each frame is independent and can be +//! decompressed independently of other frames. This module contains structures +//! and utilities that can be used to decode a frame. + use super::frame; use crate::decoding::dictionary::Dictionary; use crate::decoding::scratch::DecoderScratch; @@ -13,7 +17,7 @@ use std::error::Error as StdError; /// over how many bytes/blocks will be decoded at a time (so you don't have to decode a 10GB file into memory all at once). /// It reads bytes as needed from a provided source and can be read from to collect partial results. 
/// -/// If you want to just read the whole frame with an io::Read without having to deal with manually calling decode_blocks +/// If you want to just read the whole frame with an `io::Read` without having to deal with manually calling [FrameDecoder::decode_blocks] /// you can use the provided StreamingDecoder with wraps this FrameDecoder /// /// Workflow is as follows: diff --git a/src/fse/fse_decoder.rs b/src/fse/fse_decoder.rs index eb1de877..6b8aa5a8 100644 --- a/src/fse/fse_decoder.rs +++ b/src/fse/fse_decoder.rs @@ -2,11 +2,31 @@ use crate::decoding::bit_reader::BitReader; use crate::decoding::bit_reader_reverse::{BitReaderReversed, GetBitsError}; use alloc::vec::Vec; +/// FSE decoding involves a decoding table that describes the probabilities of +/// all literals from 0 to the highest present one +/// +/// pub struct FSETable { + /// The actual table containing the decoded symbol and the compression data + /// connected to that symbol. pub decode: Vec, //used to decode symbols, and calculate the next state - + /// The size of the table is stored in logarithm base 2 format, + /// with the **size of the table** being equal to `(1 << accuracy_log)`. + /// This value is used so that the decoder knows how many bits to read from the bitstream. pub accuracy_log: u8, + /// In this context, probability refers to the likelihood that a symbol occurs in the given data. + /// Given this info, the encoder can assign shorter codes to symbols that appear more often, + /// and longer codes that appear less often, then the decoder can use the probability + /// to determine what code was assigned to what symbol. + /// + /// The probability of a single symbol is a value representing the proportion of times the symbol + /// would fall within the data. + /// + /// If a symbol probability is set to `-1`, it means that the probability of a symbol + /// occurring in the data is less than one. 
pub symbol_probabilities: Vec, //used while building the decode Vector + /// The number of times each symbol occurs (The first entry being 0x0, the second being 0x1) and so on + /// up until the highest possible symbol (255). symbol_counter: Vec, } @@ -87,7 +107,9 @@ impl From for FSETableError { } pub struct FSEDecoder<'table> { + /// An FSE state value represents an index in the FSE table. pub state: Entry, + /// A reference to the table used for decoding. table: &'table FSETable, } @@ -125,13 +147,20 @@ impl From for FSEDecoderError { } } +/// A single entry in an FSE table. #[derive(Copy, Clone)] pub struct Entry { + /// This value is used as an offset value, and it is added + /// to a value read from the stream to determine the next state value. pub base_line: u32, + /// How many bits should be read from the stream when decoding this entry. pub num_bits: u8, + /// The byte that should be put in the decode output when encountering this state. pub symbol: u8, } +/// This value is added to the first 4 bits of the stream to determine the +/// `Accuracy_Log` const ACC_LOG_OFFSET: u8 = 5; fn highest_bit_set(x: u32) -> u32 { @@ -140,6 +169,7 @@ fn highest_bit_set(x: u32) -> u32 { } impl<'t> FSEDecoder<'t> { + /// Initialize a new Finite State Entropy decoder. pub fn new(table: &'t FSETable) -> FSEDecoder<'_> { FSEDecoder { state: table.decode.first().copied().unwrap_or(Entry { @@ -151,10 +181,13 @@ impl<'t> FSEDecoder<'t> { } } + /// Returns the byte associated with the symbol the internal cursor is pointing at. pub fn decode_symbol(&self) -> u8 { self.state.symbol } + /// Initialize internal state and prepare for decoding. After this, `decode_symbol` can be called + /// to read the first symbol and `update_state` can be called to prepare to read the next symbol. 
pub fn init_state(&mut self, bits: &mut BitReaderReversed<'_>) -> Result<(), FSEDecoderError> { if self.table.accuracy_log == 0 { return Err(FSEDecoderError::TableIsUninitialized); @@ -164,6 +197,7 @@ impl<'t> FSEDecoder<'t> { Ok(()) } + /// Advance the internal state to decode the next symbol in the bitstream. pub fn update_state( &mut self, bits: &mut BitReaderReversed<'_>, @@ -180,6 +214,7 @@ impl<'t> FSEDecoder<'t> { } impl FSETable { + /// Initialize a new empty Finite State Entropy decoding table. pub fn new() -> FSETable { FSETable { symbol_probabilities: Vec::with_capacity(256), //will never be more than 256 symbols because u8 @@ -189,6 +224,7 @@ impl FSETable { } } + /// Reset `self` and update `self`'s state to mirror the provided table. pub fn reinit_from(&mut self, other: &Self) { self.reset(); self.symbol_counter.extend_from_slice(&other.symbol_counter); @@ -198,6 +234,7 @@ impl FSETable { self.accuracy_log = other.accuracy_log; } + /// Empty the table and clear all internal state. pub fn reset(&mut self) { self.symbol_counter.clear(); self.symbol_probabilities.clear(); @@ -205,7 +242,7 @@ impl FSETable { self.accuracy_log = 0; } - //returns how many BYTEs (not bits) were read while building the decoder + /// returns how many BYTEs (not bits) were read while building the decoder pub fn build_decoder(&mut self, source: &[u8], max_log: u8) -> Result { self.accuracy_log = 0; @@ -215,6 +252,7 @@ impl FSETable { Ok(bytes_read) } + /// Given the provided accuracy log, build a decoding table from that log. pub fn build_from_probabilities( &mut self, acc_log: u8, @@ -229,6 +267,8 @@ impl FSETable { Ok(()) } + /// Build the actual decoding table after probabilities have been read into the table. + /// After this function is called, the decoding process can begin. 
fn build_decoding_table(&mut self) { self.decode.clear(); @@ -303,6 +343,8 @@ impl FSETable { } } + /// Read the accuracy log and the probability table from the source and return the number of bytes + /// read. If the size of the table is larger than the provided `max_log`, return an error. fn read_probabilities(&mut self, source: &[u8], max_log: u8) -> Result { self.symbol_probabilities.clear(); //just clear, we will fill a probability for each entry anyways. No need to force new allocs here @@ -318,11 +360,11 @@ impl FSETable { return Err(FSETableError::AccLogIsZero); } - let probablility_sum = 1 << self.accuracy_log; + let probability_sum = 1 << self.accuracy_log; let mut probability_counter = 0; - while probability_counter < probablility_sum { - let max_remaining_value = probablility_sum - probability_counter + 1; + while probability_counter < probability_sum { + let max_remaining_value = probability_sum - probability_counter + 1; let bits_to_read = highest_bit_set(max_remaining_value); let unchecked_value = br.get_bits(bits_to_read as usize)? as u32; @@ -366,10 +408,10 @@ impl FSETable { } } - if probability_counter != probablility_sum { + if probability_counter != probability_sum { return Err(FSETableError::ProbabilityCounterMismatch { got: probability_counter, - expected_sum: probablility_sum, + expected_sum: probability_sum, symbol_probabilities: self.symbol_probabilities.clone(), }); } @@ -389,6 +431,8 @@ impl FSETable { } //utility functions for building the decoding table from probabilities +/// Calculate the position of the next entry of the table given the current +/// position and size of the table. fn next_position(mut p: usize, table_size: usize) -> usize { p += (table_size >> 1) + (table_size >> 3) + 3; p &= table_size - 1; diff --git a/src/fse/mod.rs b/src/fse/mod.rs index ba4beb51..e25489fa 100644 --- a/src/fse/mod.rs +++ b/src/fse/mod.rs @@ -1,2 +1,16 @@ +//! FSE, short for Finite State Entropy, is an encoding technique +//! 
that assigns shorter codes to symbols that appear more frequently in data, +//! and longer codes to less frequent symbols. +//! +//! FSE works by mutating a state and using that state to index into a table. +//! +//! Zstandard uses two different kinds of entropy encoding: FSE, and Huffman coding. +//! Huffman is used to compress literals, +//! while FSE is used for all other symbols (literal length code, match length code, offset code). +//! +//! https://github.com/facebook/zstd/blob/dev/doc/zstd_compression_format.md#fse +//! +//! + mod fse_decoder; pub use fse_decoder::*; diff --git a/src/huff0/huff0_decoder.rs b/src/huff0/huff0_decoder.rs index 49f40622..40820d0a 100644 --- a/src/huff0/huff0_decoder.rs +++ b/src/huff0/huff0_decoder.rs @@ -1,3 +1,5 @@ +//! Utilities for decoding Huff0 encoded huffman data. + use crate::decoding::bit_reader_reverse::{BitReaderReversed, GetBitsError}; use crate::fse::{FSEDecoder, FSEDecoderError, FSETable, FSETableError}; use alloc::vec::Vec; @@ -6,13 +8,19 @@ use std::error::Error as StdError; pub struct HuffmanTable { decode: Vec, - + /// The weight of a symbol is the number of occurences in a table. + /// This value is used in constructing a binary tree referred to as + /// a huffman tree. weights: Vec, + /// The maximum size in bits a prefix code in the encoded data can be. + /// This value is used so that the decoder knows how many bits + /// to read from the bitstream before checking the table. This + /// value must be 11 or lower. pub max_num_bits: u8, bits: Vec, bit_ranks: Vec, rank_indexes: Vec, - + /// In some cases, the list of weights is compressed using FSE compression. fse_table: FSETable, } @@ -163,8 +171,10 @@ impl From for HuffmanTableError { } } +/// An interface around a huffman table used to decode data. pub struct HuffmanDecoder<'table> { table: &'table HuffmanTable, + /// State is used to index into the table. 
pub state: u64, } @@ -197,24 +207,35 @@ impl From for HuffmanDecoderError { } } +/// A single entry in the table contains the decoded symbol/literal and the +/// size of the prefix code. #[derive(Copy, Clone)] pub struct Entry { + /// The byte that the prefix code replaces during encoding. symbol: u8, + /// The number of bits the prefix code occupies. num_bits: u8, } +/// The Zstandard specification limits the maximum length of a code to 11 bits. const MAX_MAX_NUM_BITS: u8 = 11; +/// Assert that the provided value is greater than zero, and returns the +/// 32 - the number of leading zeros fn highest_bit_set(x: u32) -> u32 { assert!(x > 0); u32::BITS - x.leading_zeros() } impl<'t> HuffmanDecoder<'t> { + /// Create a new decoder with the provided table pub fn new(table: &'t HuffmanTable) -> HuffmanDecoder<'t> { HuffmanDecoder { table, state: 0 } } + /// Re-initialize the decoder, using the new table if one is provided. + /// This might used for treeless blocks, because they re-use the table from old + /// data. pub fn reset(mut self, new_table: Option<&'t HuffmanTable>) { self.state = 0; if let Some(next_table) = new_table { @@ -222,10 +243,15 @@ impl<'t> HuffmanDecoder<'t> { } } + /// Decode the symbol the internal state (cursor) is pointed at and return the + /// decoded literal. pub fn decode_symbol(&mut self) -> u8 { self.table.decode[self.state as usize].symbol } + /// Initialize internal state and prepare to decode data. Then, `decode_symbol` can be called + /// to read the byte the internal cursor is pointing at, and `next_state` can be called to advance + /// the cursor until the max number of bits has been read. pub fn init_state( &mut self, br: &mut BitReaderReversed<'_>, @@ -236,14 +262,21 @@ impl<'t> HuffmanDecoder<'t> { Ok(num_bits) } + /// Advance the internal cursor to the next symbol. After this, you can call `decode_symbol` + /// to read from the new position. 
pub fn next_state( &mut self, br: &mut BitReaderReversed<'_>, ) -> Result { + // self.state stores a small section, or a window of the bit stream. The table can be indexed via this state, + // telling you how many bits identify the current symbol. let num_bits = self.table.decode[self.state as usize].num_bits; + // New bits are read from the stream let new_bits = br.get_bits(num_bits)?; + // Shift and mask out the bits that identify the current symbol self.state <<= num_bits; self.state &= self.table.decode.len() as u64 - 1; + // The new bits are appended at the end of the current state. self.state |= new_bits; Ok(num_bits) } @@ -256,6 +289,7 @@ impl Default for HuffmanTable { } impl HuffmanTable { + /// Create a new, empty table. pub fn new() -> HuffmanTable { HuffmanTable { decode: Vec::new(), @@ -269,6 +303,8 @@ impl HuffmanTable { } } + /// Completely empty the table then repopulate as a replica + /// of `other`. pub fn reinit_from(&mut self, other: &Self) { self.reset(); self.decode.extend_from_slice(&other.decode); @@ -279,6 +315,7 @@ impl HuffmanTable { self.fse_table.reinit_from(&other.fse_table); } + /// Completely empty the table of all data. pub fn reset(&mut self) { self.decode.clear(); self.weights.clear(); @@ -289,6 +326,9 @@ impl HuffmanTable { self.fse_table.reset(); } + /// Read from `source` and parse it into a huffman table. + /// + /// Returns the number of bytes read. pub fn build_decoder(&mut self, source: &[u8]) -> Result { self.decode.clear(); @@ -297,6 +337,13 @@ impl HuffmanTable { Ok(bytes_used) } + /// Read weights from the provided source. + /// + /// The huffman table is represented in the encoded data as a list of weights + /// at the most basic level. After the header, weights are read, then the table + /// can be built using that list of weights. + /// + /// Returns the number of bytes read. 
fn read_weights(&mut self, source: &[u8]) -> Result { use HuffmanTableError as err; @@ -307,6 +354,9 @@ impl HuffmanTable { let mut bits_read = 8; match header { + // If the header byte is less than 128, the series of weights + // is compressed using two interleaved FSE streams that share + // a distribution table. 0..=127 => { let fse_stream = &source[1..]; if header as usize > fse_stream.len() { @@ -331,6 +381,9 @@ impl HuffmanTable { "Building fse table for huffman weights used: {}", bytes_used_by_fse_header ); + // Huffman headers are compressed using two interleaved + // FSE bitstreams, where the first state (decoder) handles + // even symbols, and the second handles odd symbols. let mut dec1 = FSEDecoder::new(&self.fse_table); let mut dec2 = FSEDecoder::new(&self.fse_table); @@ -368,6 +421,7 @@ impl HuffmanTable { self.weights.clear(); + // The two decoders take turns decoding a single symbol and updating their state. loop { let w = dec1.decode_symbol(); self.weights.push(w); @@ -396,6 +450,12 @@ impl HuffmanTable { } } } + // If the header byte is greater than or equal to 128, + // weights are directly represented, where each weight is + // encoded directly as a 4 bit field. The weights will + // always be encoded with full bytes, meaning if there's + // an odd number of weights, the last weight will still + // occupy a full byte. _ => { // weights are directly encoded let weights_raw = &source[1..]; @@ -434,6 +494,10 @@ impl HuffmanTable { Ok(bytes_read as u32) } + /// Once the weights have been read from the data, you can decode the weights + /// into a table, and use that table to decode the actual compressed data. + /// + /// This function populates the rest of the table from the series of weights. 
fn build_table_from_weights(&mut self) -> Result<(), HuffmanTableError> { use HuffmanTableError as err; diff --git a/src/huff0/mod.rs b/src/huff0/mod.rs index 445c7fab..3d847d65 100644 --- a/src/huff0/mod.rs +++ b/src/huff0/mod.rs @@ -1,2 +1,6 @@ +/// Huffman coding is a method of encoding where symbols are assigned a code, +/// and more commonly used symbols get shorter codes, and less commonly +/// used symbols get longer codes. Codes are prefix free, meaning no two codes +/// will start with the same sequence of bits. mod huff0_decoder; pub use huff0_decoder::*; diff --git a/src/io.rs b/src/io.rs index 6970cd13..7a90969a 100644 --- a/src/io.rs +++ b/src/io.rs @@ -1,2 +1,3 @@ +//! Re-exports of std values for when the std is available. #[cfg(feature = "std")] pub use std::io::{Error, ErrorKind, Read, Write}; diff --git a/src/io_nostd.rs b/src/io_nostd.rs index 0fc76e90..880ff499 100644 --- a/src/io_nostd.rs +++ b/src/io_nostd.rs @@ -1,3 +1,5 @@ +//! Manual implementations of representations for `#![no_std]` + use alloc::boxed::Box; #[non_exhaustive] diff --git a/src/streaming_decoder.rs b/src/streaming_decoder.rs index 3021e3f2..b2cca276 100644 --- a/src/streaming_decoder.rs +++ b/src/streaming_decoder.rs @@ -3,19 +3,40 @@ use core::borrow::BorrowMut; use crate::frame_decoder::{BlockDecodingStrategy, FrameDecoder, FrameDecoderError}; use crate::io::{Error, ErrorKind, Read}; -/// High level decoder that implements a io::Read that can be used with -/// io::Read::read_to_end / io::Read::read_exact or passing this to another library / module as a source for the decoded content +/// High level Zstandard frame decoder that can be used to decompress a given Zstandard frame. /// -/// The lower level FrameDecoder by comparison allows for finer grained control but need sto have it's decode_blocks method called continously -/// to decode the zstd-frame. 
+/// This decoder implements `io::Read`, so you can interact with it by calling +/// `io::Read::read_to_end` / `io::Read::read_exact` or passing this to another library / module as a source for the decoded content +/// +/// If you need more control over how decompression takes place, you can use +/// the lower level [FrameDecoder], which allows for greater control over how +/// decompression takes place but the implementor must call +/// [FrameDecoder::decode_blocks] repeatedly to decode the entire frame. /// /// ## Caveat -/// [StreamingDecoder] expects the underlying stream to only contain a single frame. +/// [StreamingDecoder] expects the underlying stream to only contain a single frame, +/// yet the specification states that a single archive may contain multiple frames. +/// /// To decode all the frames in a finite stream, the calling code needs to recreate -/// the instance of the decoder -/// and handle +/// the instance of the decoder and handle /// [crate::frame::ReadFrameHeaderError::SkipFrame] /// errors by skipping forward the `length` amount of bytes, see +/// +/// ```no_run +/// // `read_to_end` is not implemented by the no_std implementation. +/// #[cfg(feature = "std")] +/// { +/// use std::fs::File; +/// use std::io::Read; +/// use ruzstd::{StreamingDecoder}; +/// +/// // Read a Zstandard archive from the filesystem then decompress it into a vec. +/// let mut f: File = todo!("Read a .zstd archive from somewhere"); +/// let mut decoder = StreamingDecoder::new(f).unwrap(); +/// let mut result = Vec::new(); +/// Read::read_to_end(&mut decoder, &mut result).unwrap(); +/// } +/// ``` pub struct StreamingDecoder> { pub decoder: DEC, source: READ,