diff --git a/.github/workflows/ci.yml b/.github/workflows/ci.yml
index ab1c320..167cf2c 100644
--- a/.github/workflows/ci.yml
+++ b/.github/workflows/ci.yml
@@ -36,11 +36,16 @@ jobs:
         uses: actions/setup-dotnet@v5
         with:
           global-json-file: global.json
+          # global.json pins the build SDK; the 8.0.x and 9.0.x SDKs are installed
+          # alongside it so the runtimes for the net8.0 and net9.0 targets exist.
           dotnet-version: |
             8.0.x
             9.0.x
 
       - name: NuGet package cache
+        # actions/cache can fail on Windows before restore even runs; keep the
+        # optimization on Unix runners and let Windows restore normally.
+        if: runner.os != 'Windows'
         uses: actions/cache@v5
         with:
           path: ~/.nuget/packages
@@ -80,9 +85,23 @@ jobs:
       - uses: actions/setup-dotnet@v5
         with:
           global-json-file: global.json
+          # dotnet format loads every target framework, so install the 8.0.x and
+          # 9.0.x SDKs (and their runtimes) in addition to the global.json SDK.
+          dotnet-version: |
+            8.0.x
+            9.0.x
+
+      - name: Restore
+        run: dotnet restore IcebergSharp.slnx
+
+      - name: Verify whitespace formatting
+        run: dotnet format whitespace IcebergSharp.slnx --verify-no-changes --no-restore
+
+      - name: Verify code style
+        run: dotnet format style IcebergSharp.slnx --verify-no-changes --severity info --no-restore
 
-      - name: Verify formatting
-        run: dotnet format IcebergSharp.slnx --verify-no-changes --severity info
+      - name: Verify analyzer fixes
+        run: dotnet format analyzers IcebergSharp.slnx --verify-no-changes --severity info --no-restore
 
   pack:
     name: pack (dry run)
diff --git a/.gitignore b/.gitignore
index 455a0dd..3e522cf 100644
--- a/.gitignore
+++ b/.gitignore
@@ -8,6 +8,7 @@ publish/
 *.suo
 *.userosscache
 *.sln.docstates
+*.lscache
 
 # IDE
 .vs/
diff --git a/CHANGELOG.md b/CHANGELOG.md
index cda90bf..376f1fa 100644
--- a/CHANGELOG.md
+++ b/CHANGELOG.md
@@ -14,5 +14,17 @@ the 0.x line may include breaking changes; they will always be called out under
 - Phase 0 scaffolding: solution layout, CI, license, scope and roadmap.
 - Phase 1 core types and metadata: `Schema`, `IcebergType` hierarchy,
   `TableMetadata` JSON parser, and fixture-based round-trip tests.
+- Phase 2 Avro manifest reading: stream-based manifest-list and manifest readers,
+  Avro OCF `null` / `deflate` codecs, dynamic schema parsing, and Phase 2 smoke
+  coverage from metadata to manifests.
+
+### Changed
+- CI now enforces whitespace, style, and analyzer fixes explicitly with
+  `dotnet format --verify-no-changes`.
+
+### Fixed
+- Hardened Avro decoding and schema parsing against truncated schema JSON,
+  oversized encoded lengths, invalid block headers, and invalid logical-type
+  annotations.
 
 [Unreleased]: https://github.com/AndreaBozzo/IcebergSharp/commits/main
diff --git a/README.md b/README.md
index 3070eea..b78db55 100644
--- a/README.md
+++ b/README.md
@@ -31,8 +31,10 @@ doesn't expose Iceberg's metadata to them. There's no native client that gives a
 no embedded query engine — just metadata and Arrow batches you can hand to
 DuckDB.NET, ML.NET, or Power BI.
 
-> **Status:** Phase 0 — repository scaffolding only. No public API yet. See the
-> [roadmap](#roadmap) for what is coming and when.
+> **Status:** Phase 2 development. Core Iceberg metadata parsing and stream-based
+> Avro manifest / manifest-list readers are implemented and covered by unit
+> tests. Catalog, scan planning, file IO, and Parquet data reads are still on the
+> roadmap.
 
 ---
 
@@ -133,6 +135,13 @@ var lastWeek = table.NewScan()
 See [docs/compatibility-matrix.md](docs/compatibility-matrix.md) for the up-to-date
 matrix of supported catalogs, table-format versions, and storage backends.
 
+Current implemented surface:
+
+- `IcebergSharp.Core`: Iceberg v1/v2 table metadata, schemas, partition specs,
+  sort orders, snapshots, and manifest domain models.
+- `IcebergSharp.Avro`: stream-based Avro OCF readers for Iceberg manifest lists
+  and manifests, including `null` and `deflate` codecs.
+
 Target servers for v1:
 
 - Apache Polaris (reference implementation)
@@ -148,8 +157,8 @@ Target servers for v1:
 | Phase | Weeks | Deliverable |
 | --- | --- | --- |
 | 0. Scaffolding | done | Repo, CI, license, solution layout |
-| 1. Core types & metadata | 1-2 | `Schema`, `TableMetadata`, JSON parser |
-| 2. Avro manifest reader | 3-4 | Custom mini Avro OCF reader for manifests |
+| 1. Core types & metadata | done | `Schema`, `TableMetadata`, JSON parser |
+| 2. Avro manifest reader | in progress | Custom mini Avro OCF reader for manifests |
 | 3. REST catalog client | 5-6 | OAuth2 / Bearer / SigV4, dynamic discovery |
 | 4. Scan planning & pruning | 7-8 | Partition + stats pruning, residual filters |
 | 5. Parquet + schema evolution | 9-10 | Field-id resolution, add/drop/rename column |
@@ -180,9 +189,9 @@ column stats, and streams Parquet rows with field-id resolution.
 
 ## Contributing
 
-See [CONTRIBUTING.md](CONTRIBUTING.md). The project is in early development — the
-fastest way to help is to try the prerelease packages once Phase 1 ships and report
-incompatibilities against your specific catalog.
+See [CONTRIBUTING.md](CONTRIBUTING.md). The project is in early development; the
+fastest way to help right now is to try the metadata and manifest readers against
+real Iceberg tables and report incompatible schemas, codecs, or manifest shapes.
 
 ---
 
diff --git a/docs/compatibility-matrix.md b/docs/compatibility-matrix.md
index cf6a16d..e941ad0 100644
--- a/docs/compatibility-matrix.md
+++ b/docs/compatibility-matrix.md
@@ -1,6 +1,7 @@
 # Compatibility matrix
 
-> Last updated: Phase 0 — entries marked _planned_ are targets, not validated yet.
+> Last updated: Phase 2 development. Entries marked _planned_ are targets, not
+> validated yet.
 
 ## Catalogs
 
@@ -18,8 +19,8 @@
 
 | Spec version | Status |
 | --- | --- |
-| v1 | 🟡 planned for Phase 1 |
-| v2 | 🟡 planned for Phase 1 (primary target) |
+| v1 | ✅ metadata JSON + Avro manifests covered by unit fixtures |
+| v2 | ✅ metadata JSON + Avro manifests covered by unit fixtures |
 | v3 | 🟢 stretch goal — depends on spec stability |
 
 ## Storage backends
@@ -36,6 +37,7 @@
 
 | Format | Read | Write |
 | --- | --- | --- |
+| Iceberg manifest Avro OCF | ✅ `null` + `deflate` codecs | ⛔ out of scope for v1 |
 | Parquet | 🟡 planned for Phase 5 | ⛔ out of scope for v1 |
 | ORC | ⛔ out of scope for v1 | ⛔ out of scope for v1 |
 | Avro (data files, not manifests) | ⛔ out of scope for v1 | ⛔ out of scope for v1 |
@@ -44,6 +46,9 @@
 
 | Feature | Status |
 | --- | --- |
+| Table metadata JSON parsing | ✅ validated with v1/v2 fixtures |
+| Manifest-list reading | ✅ stream-based Avro OCF reader |
+| Manifest reading | ✅ stream-based Avro OCF reader |
 | Schema evolution (add / drop / rename / promote) | 🟡 planned for Phase 5 |
 | Partition spec evolution | 🟡 planned for Phase 4 |
 | Snapshot isolation / time travel | 🟡 planned for Phase 4 |
diff --git a/src/IcebergSharp.Avro/Internal/Codec/DeflateCodec.cs b/src/IcebergSharp.Avro/Internal/Codec/DeflateCodec.cs
new file mode 100644
index 0000000..b5917cb
--- /dev/null
+++ b/src/IcebergSharp.Avro/Internal/Codec/DeflateCodec.cs
@@ -0,0 +1,56 @@
+using System.Buffers;
+using System.IO.Compression;
+
+namespace IcebergSharp.Avro.Internal.Codec;
+
+/// <summary>
+/// Avro's <c>deflate</c> codec is raw DEFLATE (no zlib header). Wraps
+/// <see cref="DeflateStream"/> in decompress mode over the source bytes.
+/// </summary>
+internal sealed class DeflateCodec : IBlockCodec
+{
+    public static DeflateCodec Instance { get; } = new();
+    private DeflateCodec() { }
+
+    public string Name => "deflate";
+
+    /// <summary>Inflates <paramref name="source"/> into <paramref name="destination"/>, swapping in a larger pooled array whenever it fills up.</summary>
+    /// <returns>The number of decompressed bytes at the start of <paramref name="destination"/>.</returns>
+    public int Decode(ReadOnlySpan<byte> source, ref byte[] destination)
+    {
+        // DeflateStream reads from a Stream, so stage the span in a pooled array first.
+        var sourceArr = ArrayPool<byte>.Shared.Rent(source.Length);
+        try
+        {
+            source.CopyTo(sourceArr);
+            using var src = new MemoryStream(sourceArr, 0, source.Length, writable: false);
+            using var deflate = new DeflateStream(src, CompressionMode.Decompress, leaveOpen: false);
+
+            var totalWritten = 0;
+            while (true)
+            {
+                if (totalWritten >= destination.Length)
+                {
+                    // Double from a non-zero floor: with an empty buffer, Rent(0) leaves no room and the
+                    // zero-byte Read would look like end of stream. checked() surfaces size overflow.
+                    var grown = ArrayPool<byte>.Shared.Rent(checked(Math.Max(destination.Length, 128) * 2));
+                    Buffer.BlockCopy(destination, 0, grown, 0, totalWritten);
+                    ArrayPool<byte>.Shared.Return(destination);
+                    destination = grown;
+                }
+
+                var n = deflate.Read(destination, totalWritten, destination.Length - totalWritten);
+                if (n == 0)
+                {
+                    return totalWritten;
+                }
+
+                totalWritten += n;
+            }
+        }
+        finally
+        {
+            ArrayPool<byte>.Shared.Return(sourceArr);
+        }
+    }
+}
diff --git a/src/IcebergSharp.Avro/Internal/Codec/IBlockCodec.cs b/src/IcebergSharp.Avro/Internal/Codec/IBlockCodec.cs
new file mode 100644
index 0000000..66543f6
--- /dev/null
+++ b/src/IcebergSharp.Avro/Internal/Codec/IBlockCodec.cs
@@ -0,0 +1,14 @@
+namespace IcebergSharp.Avro.Internal.Codec;
+
+internal interface IBlockCodec
+{
+    /// <summary>Codec name as it appears in the OCF header (<c>null</c>, <c>deflate</c>).</summary>
+    string Name { get; }
+
+    /// <summary>
+    /// Decodes <paramref name="source"/> into <paramref name="destination"/>. If the buffer is too small, the
+    /// codec returns it to the shared array pool and assigns a larger rented array through the <c>ref</c>.
+    /// </summary>
+    /// <returns>The number of valid bytes at the start of <paramref name="destination"/>.</returns>
+    int Decode(ReadOnlySpan<byte> source, ref byte[] destination);
+}
diff --git a/src/IcebergSharp.Avro/Internal/Codec/NullCodec.cs b/src/IcebergSharp.Avro/Internal/Codec/NullCodec.cs
new file mode 100644
index 0000000..4325f2d
--- /dev/null
+++ b/src/IcebergSharp.Avro/Internal/Codec/NullCodec.cs
@@ -0,0 +1,23 @@
+using System.Buffers;
+
+namespace IcebergSharp.Avro.Internal.Codec;
+
+internal sealed class NullCodec : IBlockCodec
+{
+    public static NullCodec Instance { get; } = new();
+    private NullCodec() { }
+
+    public string Name => "null";
+
+    /// <summary>Copies the block verbatim, renting a larger <paramref name="destination"/> only when it cannot hold <paramref name="source"/>; returns the byte count.</summary>
+    public int Decode(ReadOnlySpan<byte> source, ref byte[] destination)
+    {
+        if (source.Length > destination.Length)
+        {
+            ArrayPool<byte>.Shared.Return(destination);
+            destination = ArrayPool<byte>.Shared.Rent(source.Length);
+        }
+        source.CopyTo(destination);
+        return source.Length;
+    }
+}
diff --git a/src/IcebergSharp.Avro/Internal/Decode/AvroToIcebergType.cs b/src/IcebergSharp.Avro/Internal/Decode/AvroToIcebergType.cs
new file mode 100644
index 0000000..7206c4e
--- /dev/null
+++ b/src/IcebergSharp.Avro/Internal/Decode/AvroToIcebergType.cs
@@ -0,0 +1,68 @@
+using IcebergSharp.Avro.Internal.Schema;
+using IcebergSharp.Types;
+
+namespace IcebergSharp.Avro.Internal.Decode;
+
+/// <summary>
+/// Recovers the <see cref="IcebergType"/> behind an <see cref="AvroSchema"/> node.
+/// Intended for partition columns only: the partition record inside a manifest
+/// has a dynamic schema, and Phase 4 wants Iceberg types attached to the boxed
+/// partition values.
+/// </summary>
+internal static class AvroToIcebergType
+{
+    /// <summary>Resolves <paramref name="schema"/>, looking through a nullable union first.</summary>
+    /// <exception cref="NotSupportedException">The carrier is neither a primitive nor a fixed schema.</exception>
+    public static IcebergType Resolve(AvroSchema schema)
+    {
+        // An optional column arrives as a union; its non-null branch carries the type.
+        AvroSchema carrier = schema is AvroUnion union ? union.NonNull : schema;
+        return carrier switch
+        {
+            AvroPrimitive primitive => ResolvePrimitive(primitive),
+            AvroFixed fixedSchema => ResolveFixed(fixedSchema),
+            _ => throw new NotSupportedException($"partition columns cannot have Avro schema kind {carrier.GetType().Name}"),
+        };
+    }
+
+    /// <summary>
+    /// Resolves a primitive carrier: a recognised logical type wins, otherwise the
+    /// underlying primitive kind decides.
+    /// </summary>
+    /// <remarks>
+    /// NOTE(review): <c>TimestampMicros</c> always yields <see cref="TimestampTzType"/> and
+    /// <c>TimestampMillis</c> always yields <see cref="TimestampType"/>; no UTC-adjustment
+    /// flag is consulted here — confirm that this split is intended.
+    /// </remarks>
+    private static IcebergType ResolvePrimitive(AvroPrimitive p) => (p.LogicalType, p.Kind) switch
+    {
+        (AvroLogicalType.Date, _) => DateType.Instance,
+        (AvroLogicalType.TimeMicros or AvroLogicalType.TimeMillis, _) => TimeType.Instance,
+        (AvroLogicalType.TimestampMicros, _) => TimestampTzType.Instance,
+        (AvroLogicalType.TimestampMillis, _) => TimestampType.Instance,
+        (AvroLogicalType.Uuid, _) => UuidType.Instance,
+        (AvroLogicalType.Decimal, _) => new DecimalType(p.DecimalPrecision, p.DecimalScale),
+        (_, AvroPrimitiveKind.Boolean) => BooleanType.Instance,
+        (_, AvroPrimitiveKind.Int) => IntType.Instance,
+        (_, AvroPrimitiveKind.Long) => LongType.Instance,
+        (_, AvroPrimitiveKind.Float) => FloatType.Instance,
+        (_, AvroPrimitiveKind.Double) => DoubleType.Instance,
+        (_, AvroPrimitiveKind.Bytes) => BinaryType.Instance,
+        (_, AvroPrimitiveKind.String) => StringType.Instance,
+        _ => throw new NotSupportedException($"unsupported Avro primitive {p.Kind} for partition column"),
+    };
+
+    /// <summary>
+    /// Resolves a fixed carrier: decimal first, then UUID, otherwise a plain
+    /// <see cref="FixedType"/> of the declared size.
+    /// </summary>
+    /// <remarks>NOTE(review): a fixed of size 16 without any annotation also resolves to UUID — confirm this is intended.</remarks>
+    private static IcebergType ResolveFixed(AvroFixed f) => f.LogicalType switch
+    {
+        AvroLogicalType.Decimal => new DecimalType(f.DecimalPrecision, f.DecimalScale),
+        AvroLogicalType.Uuid => UuidType.Instance,
+        // No decimal/uuid annotation: the size alone decides between UUID and plain fixed.
+        _ when f.Size == 16 => UuidType.Instance,
+        _ => new FixedType(f.Size),
+    };
+}
diff --git a/src/IcebergSharp.Avro/Internal/Decode/BinaryDecoder.cs b/src/IcebergSharp.Avro/Internal/Decode/BinaryDecoder.cs
new file mode 100644
index 0000000..66a3175
--- /dev/null
+++ b/src/IcebergSharp.Avro/Internal/Decode/BinaryDecoder.cs
@@ -0,0 +1,185 @@
+using System.Buffers.Binary;
+using System.Text;
+using IcebergSharp.Avro.Internal.Errors;
+
+namespace IcebergSharp.Avro.Internal.Decode;
+
+/// <summary>
+/// Forward-only cursor over one Avro binary block held in memory. Every
+/// <c>Read*</c> call consumes bytes and moves <see cref="Position"/>; values are
+/// decoded straight from the underlying span, so nothing is allocated unless the
+/// caller asks for a materialised string.
+/// </summary>
+internal ref struct BinaryDecoder
+{
+    private readonly ReadOnlySpan<byte> _buffer;
+    private int _position;
+
+    public BinaryDecoder(ReadOnlySpan<byte> buffer)
+    {
+        _buffer = buffer;
+        _position = 0;
+    }
+
+    public readonly int Position => _position;
+    public readonly int Length => _buffer.Length;
+    public readonly bool EndOfBuffer => _position >= _buffer.Length;
+
+    /// <summary>Reads a single byte that must be 0 (false) or 1 (true).</summary>
+    public bool ReadBoolean()
+    {
+        EnsureBytes(1);
+        return _buffer[_position++] switch
+        {
+            0 => false,
+            1 => true,
+            var other => throw new AvroFormatException($"boolean must be 0 or 1, got 0x{other:X2}"),
+        };
+    }
+
+    /// <summary>Reads a zig-zag varint and rejects values that do not fit in an <see cref="int"/>.</summary>
+    public int ReadInt()
+    {
+        var wide = ReadLong();
+        return wide is >= int.MinValue and <= int.MaxValue
+            ? (int)wide
+            : throw new AvroFormatException($"int value {wide} is outside Int32 range");
+    }
+
+    /// <summary>
+    /// Reads a zig-zag encoded varint: little-endian groups of 7 bits, where the high
+    /// bit of each byte flags a continuation. A long takes at most 10 bytes.
+    /// </summary>
+    /// <exception cref="AvroFormatException">The buffer ends mid-value, or the tenth byte still flags a continuation.</exception>
+    public long ReadLong()
+    {
+        ulong raw = 0;
+
+        // shift visits 0, 7, ..., 63: one iteration per byte a long may occupy.
+        for (var shift = 0; shift <= 63; shift += 7)
+        {
+            if (_position >= _buffer.Length)
+            {
+                throw new AvroFormatException("truncated varint");
+            }
+
+            var current = _buffer[_position++];
+            raw |= (ulong)(current & 0x7Fu) << shift;
+            if ((current & 0x80) == 0)
+            {
+                // Zig-zag decode: bit 0 is the sign, the remaining bits the magnitude.
+                return (long)(raw >> 1) ^ -(long)(raw & 1);
+            }
+        }
+
+        throw new AvroFormatException("varint too long for long");
+    }
+
+    /// <summary>Reads four bytes as a little-endian single-precision value.</summary>
+    public float ReadFloat()
+    {
+        // ReadFixed performs the bounds check and advances the cursor.
+        ReadOnlySpan<byte> raw = ReadFixed(4);
+        return BinaryPrimitives.ReadSingleLittleEndian(raw);
+    }
+
+    /// <summary>Reads eight bytes as a little-endian double-precision value.</summary>
+    public double ReadDouble()
+    {
+        // ReadFixed performs the bounds check and advances the cursor.
+        ReadOnlySpan<byte> raw = ReadFixed(8);
+        return BinaryPrimitives.ReadDoubleLittleEndian(raw);
+    }
+
+    /// <summary>
+    /// Reads a length-prefixed byte sequence and returns a view into the underlying
+    /// buffer (no copy).
+    /// </summary>
+    /// <exception cref="AvroFormatException">The length is negative, above <see cref="int.MaxValue"/>, or runs past the buffer.</exception>
+    public ReadOnlySpan<byte> ReadBytesSpan()
+    {
+        // The prefix is a 64-bit value, so validate it before narrowing to int.
+        var declared = ReadLong();
+        return declared switch
+        {
+            < 0 => throw new AvroFormatException($"negative bytes length {declared}"),
+            > int.MaxValue => throw new AvroFormatException($"bytes length {declared} exceeds supported maximum {int.MaxValue}"),
+            0 => ReadOnlySpan<byte>.Empty,
+            // ReadFixed bounds-checks the payload and advances past it.
+            _ => ReadFixed((int)declared),
+        };
+    }
+
+    /// <summary>Reads a length-prefixed UTF-8 string; a zero length yields <see cref="string.Empty"/>.</summary>
+    public string ReadString()
+    {
+        ReadOnlySpan<byte> utf8 = ReadBytesSpan();
+        if (utf8.IsEmpty)
+        {
+            return string.Empty;
+        }
+
+        return Encoding.UTF8.GetString(utf8);
+    }
+
+    /// <summary>Returns the next <paramref name="size"/> bytes as a view into the buffer and advances past them.</summary>
+    public ReadOnlySpan<byte> ReadFixed(int size)
+    {
+        if (size < 0)
+        {
+            throw new AvroFormatException($"fixed size must be non-negative, got {size}");
+        }
+
+        EnsureBytes(size);
+        var start = _position;
+        _position = start + size;
+        return _buffer.Slice(start, size);
+    }
+
+    /// <summary>
+    /// Reads the header of the next array or map block and returns its item count;
+    /// 0 ends the container. A negative count on the wire means the block also
+    /// carries a byte-size prefix, which is consumed here before the count is
+    /// returned as a positive number.
+    /// </summary>
+    public long ReadBlockCount()
+    {
+        var count = ReadLong();
+        if (count >= 0)
+        {
+            return count;
+        }
+
+        if (count == long.MinValue)
+        {
+            throw new AvroFormatException("array/map block count is too small to negate");
+        }
+
+        // Items are decoded one at a time, so the byte size is only sanity-checked.
+        var byteSize = ReadLong();
+        if (byteSize < 0)
+        {
+            throw new AvroFormatException($"negative array/map block byte size {byteSize}");
+        }
+
+        return -count;
+    }
+
+    /// <summary>Reads a union branch index (a zig-zag varint that must fit in Int32).</summary>
+    public int ReadUnionBranch() => ReadInt();
+
+    /// <summary>Throws unless at least <paramref name="count"/> unread bytes remain.</summary>
+    private readonly void EnsureBytes(int count)
+    {
+        if (count < 0)
+        {
+            throw new AvroFormatException($"byte count must be non-negative, got {count}");
+        }
+
+        var available = _buffer.Length - _position;
+        if (available < count)
+        {
+            throw new AvroFormatException($"truncated buffer (need {count} bytes, have {available})");
+        }
+    }
+}
diff --git a/src/IcebergSharp.Avro/Internal/Decode/IcebergFieldIds.cs b/src/IcebergSharp.Avro/Internal/Decode/IcebergFieldIds.cs
new file mode 100644
index 0000000..23405c0
--- /dev/null
+++ b/src/IcebergSharp.Avro/Internal/Decode/IcebergFieldIds.cs
@@ -0,0 +1,62 @@
+namespace IcebergSharp.Avro.Internal.Decode;
+
+/// <summary>
+/// Named constants for the field-ids that the Iceberg spec assigns to manifest-list
+/// and manifest schemas, so the sink code reads close to the spec text.
+/// </summary>
+/// <remarks>
+/// Taken from the Apache Iceberg specification, sections "Manifest Lists" and
+/// "Manifests". The id, not the name, is the contract: ids stay stable across
+/// spec versions even where v1 and v2 name a field differently.
+/// </remarks>
+internal static class IcebergFieldIds
+{
+    // manifest_file: the record type stored in a manifest list (ascending id)
+    public const int ManifestPath = 500;
+    public const int ManifestLength = 501;
+    public const int PartitionSpecId = 502;
+    public const int AddedSnapshotId = 503;
+    public const int AddedFilesCount = 504; // v1 int; v2 calls this added_data_files_count
+    public const int ExistingFilesCount = 505;
+    public const int DeletedFilesCount = 506;
+    public const int Partitions = 507;
+    public const int AddedRowsCount = 512;
+    public const int ExistingRowsCount = 513;
+    public const int DeletedRowsCount = 514;
+    public const int SequenceNumber = 515;
+    public const int MinSequenceNumber = 516;
+    public const int Content = 517; // manifest_file content (v2)
+    public const int KeyMetadataManifest = 519;
+
+    // field_summary: element type of the manifest_file.partitions array (ascending id)
+    public const int FsContainsNull = 509;
+    public const int FsLowerBound = 510;
+    public const int FsUpperBound = 511;
+    public const int FsContainsNaN = 518;
+
+    // manifest_entry: the record type stored in a manifest (ascending id)
+    public const int Status = 0;
+    public const int EntrySnapshotId = 1;
+    public const int DataFile = 2;
+    public const int EntrySequenceNumber = 3; // v2
+    public const int EntryFileSequenceNumber = 4; // v2
+
+    // data_file: the struct nested inside manifest_entry (ascending id)
+    public const int DfFilePath = 100;
+    public const int DfFileFormat = 101;
+    public const int DfPartition = 102;
+    public const int DfRecordCount = 103;
+    public const int DfFileSizeInBytes = 104;
+    public const int DfBlockSizeInBytes = 105; // v1 only
+    public const int DfColumnSizes = 108;
+    public const int DfValueCounts = 109;
+    public const int DfNullValueCounts = 110;
+    public const int DfLowerBounds = 125;
+    public const int DfUpperBounds = 128;
+    public const int DfKeyMetadata = 131;
+    public const int DfSplitOffsets = 132;
+    public const int DfContent = 134; // v2
+    public const int DfEqualityIds = 135;
+    public const int DfNanValueCounts = 137;
+    public const int DfSortOrderId = 140;
+}
diff --git a/src/IcebergSharp.Avro/Internal/Decode/ManifestEntrySink.cs b/src/IcebergSharp.Avro/Internal/Decode/ManifestEntrySink.cs
new file mode 100644
index 0000000..6110752
--- /dev/null
+++ b/src/IcebergSharp.Avro/Internal/Decode/ManifestEntrySink.cs
@@ -0,0 +1,419 @@
+using IcebergSharp.Avro.Internal.Errors;
+using IcebergSharp.Avro.Internal.Schema;
+using IcebergSharp.Types;
+
+namespace IcebergSharp.Avro.Internal.Decode;
+
+/// <summary>
+/// Decodes one <c>manifest_entry</c> Avro record into a <see cref="ManifestEntry"/>.
+/// Reuses a pre-resolved partition-record schema across rows so we don't walk
+/// the Avro tree per data file.
+/// </summary>
+internal sealed class ManifestEntrySink
+{
+    private readonly AvroRecord _entryRecord;
+    private readonly AvroRecord _dataFileRecord;
+    private readonly AvroRecord? _partitionRecord;
+    private readonly string[] _partitionNames;
+    private readonly IcebergType[] _partitionTypes;
+
+    public ManifestEntrySink(AvroRecord entryRecord)
+    {
+        _entryRecord = entryRecord;
+        _dataFileRecord = ResolveDataFileRecord(entryRecord);
+        _partitionRecord = ResolvePartitionRecord(_dataFileRecord);
+        if (_partitionRecord is null)
+        {
+            _partitionNames = [];
+            _partitionTypes = [];
+            return;
+        }
+
+        // Resolve the partition column names and types once, not per decoded row.
+        (_partitionNames, _partitionTypes) = PartitionRecordSink.ResolveSchema(_partitionRecord);
+    }
+
+    /// <summary>Decodes the next <c>manifest_entry</c> record, reading fields in the order the entry record schema lists them.</summary>
+    /// <exception cref="AvroFormatException">The entry record schema has no <c>data_file</c> field (field-id 2).</exception>
+    public ManifestEntry Decode(ref BinaryDecoder decoder)
+    {
+        var entryStatus = ManifestEntryStatus.Existing;
+        long? addedBySnapshot = null;
+        long? dataSequence = null;
+        long? fileSequence = null;
+        DataFile? file = null;
+
+        foreach (AvroRecordField field in _entryRecord.Fields)
+        {
+            switch (field.FieldId)
+            {
+                case IcebergFieldIds.Status:
+                    entryStatus = (ManifestEntryStatus)NullableReader.ReadIntRequiredOrZero(ref decoder, field.Schema);
+                    break;
+                case IcebergFieldIds.EntrySnapshotId:
+                    addedBySnapshot = NullableReader.ReadLongOrNull(ref decoder, field.Schema);
+                    break;
+                case IcebergFieldIds.EntrySequenceNumber:
+                    dataSequence = NullableReader.ReadLongOrNull(ref decoder, field.Schema);
+                    break;
+                case IcebergFieldIds.EntryFileSequenceNumber:
+                    fileSequence = NullableReader.ReadLongOrNull(ref decoder, field.Schema);
+                    break;
+                case IcebergFieldIds.DataFile:
+                    file = DecodeDataFile(ref decoder, field.Schema);
+                    break;
+                default:
+                    // Unrecognised field-id: consume its bytes so the cursor stays aligned.
+                    ShapeDecoder.SkipValue(ref decoder, field.Schema);
+                    break;
+            }
+        }
+
+        return file is null
+            ? throw new AvroFormatException("manifest_entry is missing data_file (field-id 2)")
+            : new ManifestEntry(entryStatus, addedBySnapshot, dataSequence, fileSequence, file);
+    }
+
+    private DataFile DecodeDataFile(ref BinaryDecoder decoder, AvroSchema dfSchema)
+    {
+        if (NullableReader.PeelNullable(ref decoder, ref dfSchema))
+        {
+            throw new AvroFormatException("data_file is null");
+        }
+
+        if (dfSchema is not AvroRecord rec)
+        {
+            throw new AvroFormatException("data_file must be a record");
+        }
+        // Defaults for fields the record schema may omit; file_path and file_format stay null so their absence is detected below.
+        DataFileContent content = DataFileContent.Data;
+        string? filePath = null;
+        string? fileFormat = null;
+        PartitionValues partition = PartitionValues.Empty;
+        long recordCount = 0;
+        long fileSize = 0;
+        Dictionary<int, long>? columnSizes = null;
+        Dictionary<int, long>? valueCounts = null;
+        Dictionary<int, long>? nullValueCounts = null;
+        Dictionary<int, long>? nanValueCounts = null;
+        Dictionary<int, ReadOnlyMemory<byte>>? lowerBounds = null;
+        Dictionary<int, ReadOnlyMemory<byte>>? upperBounds = null;
+        byte[]? keyMetadata = null;
+        List<long>? splitOffsets = null;
+        List<int>? equalityIds = null;
+        int? sortOrderId = null;
+        // Every field is read or skipped in schema order: each call advances the shared decoder.
+        foreach (AvroRecordField field in rec.Fields)
+        {
+            switch (field.FieldId)
+            {
+                case IcebergFieldIds.DfContent:
+                    content = (DataFileContent)NullableReader.ReadIntRequiredOrZero(ref decoder, field.Schema);
+                    break;
+                case IcebergFieldIds.DfFilePath:
+                    filePath = NullableReader.ReadStringRequired(ref decoder, field.Schema, "file_path");
+                    break;
+                case IcebergFieldIds.DfFileFormat:
+                    fileFormat = NullableReader.ReadStringRequired(ref decoder, field.Schema, "file_format");
+                    break;
+                case IcebergFieldIds.DfPartition:
+                    partition = DecodePartition(ref decoder, field.Schema);
+                    break;
+                case IcebergFieldIds.DfRecordCount:
+                    recordCount = NullableReader.ReadLongRequiredOrZero(ref decoder, field.Schema);
+                    break;
+                case IcebergFieldIds.DfFileSizeInBytes:
+                    fileSize = NullableReader.ReadLongRequiredOrZero(ref decoder, field.Schema);
+                    break;
+                case IcebergFieldIds.DfBlockSizeInBytes:
+                    // v1 only; the value is read to advance the decoder, then discarded (not in the domain model).
+                    _ = NullableReader.ReadLongOrNull(ref decoder, field.Schema);
+                    break;
+                case IcebergFieldIds.DfColumnSizes:
+                    columnSizes = DecodeIntLongMap(ref decoder, field.Schema);
+                    break;
+                case IcebergFieldIds.DfValueCounts:
+                    valueCounts = DecodeIntLongMap(ref decoder, field.Schema);
+                    break;
+                case IcebergFieldIds.DfNullValueCounts:
+                    nullValueCounts = DecodeIntLongMap(ref decoder, field.Schema);
+                    break;
+                case IcebergFieldIds.DfNanValueCounts:
+                    nanValueCounts = DecodeIntLongMap(ref decoder, field.Schema);
+                    break;
+                case IcebergFieldIds.DfLowerBounds:
+                    lowerBounds = DecodeIntBytesMap(ref decoder, field.Schema);
+                    break;
+                case IcebergFieldIds.DfUpperBounds:
+                    upperBounds = DecodeIntBytesMap(ref decoder, field.Schema);
+                    break;
+                case IcebergFieldIds.DfKeyMetadata:
+                    keyMetadata = NullableReader.ReadBytesOrNull(ref decoder, field.Schema);
+                    break;
+                case IcebergFieldIds.DfSplitOffsets:
+                    splitOffsets = DecodeLongArray(ref decoder, field.Schema);
+                    break;
+                case IcebergFieldIds.DfEqualityIds:
+                    equalityIds = DecodeIntArray(ref decoder, field.Schema);
+                    break;
+                case IcebergFieldIds.DfSortOrderId:
+                    sortOrderId = NullableReader.ReadIntOrNull(ref decoder, field.Schema);
+                    break;
+                default:
+                    ShapeDecoder.SkipValue(ref decoder, field.Schema);
+                    break;
+            }
+        }
+
+        if (filePath is null || fileFormat is null)
+        {
+            throw new AvroFormatException("data_file record is missing file_path or file_format");
+        }
+
+        return new DataFile(
+            content,
+            filePath,
+            fileFormat,
+            partition,
+            recordCount,
+            fileSize,
+            columnSizes,
+            valueCounts,
+            nullValueCounts,
+            nanValueCounts,
+            lowerBounds,
+            upperBounds,
+            keyMetadata ?? [],
+            splitOffsets,
+            equalityIds,
+            sortOrderId);
+    }
+
+    /// <summary>Decodes the partition record of a data file; a null union branch yields <see cref="PartitionValues.Empty"/>.</summary>
+    private PartitionValues DecodePartition(ref BinaryDecoder decoder, AvroSchema schema)
+    {
+        var isNull = NullableReader.PeelNullable(ref decoder, ref schema);
+        if (isNull)
+        {
+            return PartitionValues.Empty;
+        }
+
+        var partitionSchema = schema as AvroRecord
+            ?? throw new AvroFormatException($"partition field must be a record, got {schema.GetType().Name}");
+
+        if (_partitionRecord is not null)
+        {
+            return PartitionRecordSink.Decode(ref decoder, partitionSchema, _partitionNames, _partitionTypes);
+        }
+
+        // The constructor resolves the partition record, so this is a defensive fallback only.
+        ShapeDecoder.SkipValue(ref decoder, schema);
+        return PartitionValues.Empty;
+    }
+
+    /// <summary>
+    /// Decodes an optional int-keyed map of longs. Iceberg stores such maps as an Avro
+    /// array of <c>{key, value}</c> records because native Avro maps only allow string keys.
+    /// </summary>
+    /// <returns>The decoded map, or <c>null</c> when the nullable union holds null.</returns>
+    private static Dictionary<int, long>? DecodeIntLongMap(ref BinaryDecoder decoder, AvroSchema schema)
+    {
+        if (NullableReader.PeelNullable(ref decoder, ref schema))
+        {
+            return null;
+        }
+
+        if (schema is not AvroArray { Items: AvroRecord pair })
+        {
+            throw new AvroFormatException($"expected int->long map (array<kv-record>), got {schema.GetType().Name}");
+        }
+
+        var map = new Dictionary<int, long>();
+        // Array items arrive in blocks; a block count of 0 terminates the array.
+        for (var blockSize = decoder.ReadBlockCount(); blockSize != 0; blockSize = decoder.ReadBlockCount())
+        {
+            for (long item = 0; item < blockSize; item++)
+            {
+                int? key = null;
+                long? value = null;
+                foreach (AvroRecordField member in pair.Fields)
+                {
+                    switch (member.Name)
+                    {
+                        case "key":
+                            key = NullableReader.ReadIntRequiredOrZero(ref decoder, member.Schema);
+                            break;
+                        case "value":
+                            value = NullableReader.ReadLongRequiredOrZero(ref decoder, member.Schema);
+                            break;
+                        default:
+                            ShapeDecoder.SkipValue(ref decoder, member.Schema);
+                            break;
+                    }
+                }
+
+                if (key is null || value is null)
+                {
+                    throw new AvroFormatException("kv-record missing key or value");
+                }
+
+                map[key.Value] = value.Value;
+            }
+        }
+
+        return map;
+    }
+
+    /// <summary>
+    /// Reads an optional int-to-bytes map stored as an array of kv-records. Returns <c>null</c> for
+    /// the null union branch; a null or absent value inside a record becomes an empty buffer.
+    /// </summary>
+    private static Dictionary<int, ReadOnlyMemory<byte>>? DecodeIntBytesMap(ref BinaryDecoder decoder, AvroSchema schema)
+    {
+        if (NullableReader.PeelNullable(ref decoder, ref schema))
+        {
+            return null;
+        }
+
+        if (schema is not AvroArray { Items: AvroRecord pairRecord })
+        {
+            throw new AvroFormatException($"expected int->bytes map (array<kv-record>), got {schema.GetType().Name}");
+        }
+
+        var map = new Dictionary<int, ReadOnlyMemory<byte>>();
+        for (var remaining = decoder.ReadBlockCount(); remaining != 0; remaining = decoder.ReadBlockCount())
+        {
+            for (long n = 0; n < remaining; n++)
+            {
+                int? key = null;
+                byte[]? payload = null;
+                foreach (AvroRecordField field in pairRecord.Fields)
+                {
+                    switch (field.Name)
+                    {
+                        case "key":
+                            key = NullableReader.ReadIntRequiredOrZero(ref decoder, field.Schema);
+                            break;
+                        case "value":
+                            payload = NullableReader.ReadBytesOrNull(ref decoder, field.Schema);
+                            break;
+                        default:
+                            ShapeDecoder.SkipValue(ref decoder, field.Schema);
+                            break;
+                    }
+                }
+
+                if (key is null)
+                {
+                    throw new AvroFormatException("kv-record missing key");
+                }
+
+                map[key.Value] = payload is null ? ReadOnlyMemory<byte>.Empty : payload;
+            }
+        }
+
+        return map;
+    }
+
+    /// <summary>
+    /// Reads an optional array of longs block by block until the zero-count terminator.
+    /// Returns <c>null</c> for the null union branch; a null element is stored as zero
+    /// (see <see cref="NullableReader.ReadLongRequiredOrZero"/>).
+    /// </summary>
+    private static List<long>? DecodeLongArray(ref BinaryDecoder decoder, AvroSchema schema)
+    {
+        if (NullableReader.PeelNullable(ref decoder, ref schema))
+        {
+            return null;
+        }
+
+        if (schema is not AvroArray array)
+        {
+            throw new AvroFormatException($"expected array<long>, got {schema.GetType().Name}");
+        }
+
+        var values = new List<long>();
+        for (var remaining = decoder.ReadBlockCount(); remaining != 0; remaining = decoder.ReadBlockCount())
+        {
+            for (long n = 0; n < remaining; n++)
+            {
+                values.Add(NullableReader.ReadLongRequiredOrZero(ref decoder, array.Items));
+            }
+        }
+
+        return values;
+    }
+
+    /// <summary>
+    /// Reads an optional array of ints block by block until the zero-count terminator.
+    /// Returns <c>null</c> for the null union branch; a null element is stored as zero
+    /// (see <see cref="NullableReader.ReadIntRequiredOrZero"/>).
+    /// </summary>
+    private static List<int>? DecodeIntArray(ref BinaryDecoder decoder, AvroSchema schema)
+    {
+        if (NullableReader.PeelNullable(ref decoder, ref schema))
+        {
+            return null;
+        }
+
+        if (schema is not AvroArray array)
+        {
+            throw new AvroFormatException($"expected array<int>, got {schema.GetType().Name}");
+        }
+
+        var values = new List<int>();
+        for (var remaining = decoder.ReadBlockCount(); remaining != 0; remaining = decoder.ReadBlockCount())
+        {
+            for (long n = 0; n < remaining; n++)
+            {
+                values.Add(NullableReader.ReadIntRequiredOrZero(ref decoder, array.Items));
+            }
+        }
+
+        return values;
+    }
+
+    /// <summary>
+    /// Finds the data_file record schema of a manifest entry by field-id, looking through a union wrapper; throws if none exists.
+    /// </summary>
+    private static AvroRecord ResolveDataFileRecord(AvroRecord entryRecord)
+    {
+        foreach (AvroRecordField field in entryRecord.Fields)
+        {
+            if (field.FieldId != IcebergFieldIds.DataFile)
+            {
+                continue;
+            }
+
+            AvroSchema candidate = field.Schema is AvroUnion wrapper ? wrapper.NonNull : field.Schema;
+            if (candidate is AvroRecord resolved)
+            {
+                return resolved;
+            }
+        }
+
+        throw new AvroFormatException("manifest_entry has no data_file record (field-id 2)");
+    }
+
+    /// <summary>
+    /// Finds the partition record schema of a data_file by field-id, looking through a union wrapper; <c>null</c> if none exists.
+    /// </summary>
+    private static AvroRecord? ResolvePartitionRecord(AvroRecord dataFileRecord)
+    {
+        foreach (AvroRecordField field in dataFileRecord.Fields)
+        {
+            if (field.FieldId != IcebergFieldIds.DfPartition)
+            {
+                continue;
+            }
+
+            AvroSchema candidate = field.Schema is AvroUnion wrapper ? wrapper.NonNull : field.Schema;
+            if (candidate is AvroRecord resolved)
+            {
+                return resolved;
+            }
+        }
+
+        return null;
+    }
+}
diff --git a/src/IcebergSharp.Avro/Internal/Decode/ManifestFileSink.cs b/src/IcebergSharp.Avro/Internal/Decode/ManifestFileSink.cs
new file mode 100644
index 0000000..efc3429
--- /dev/null
+++ b/src/IcebergSharp.Avro/Internal/Decode/ManifestFileSink.cs
@@ -0,0 +1,189 @@
+using IcebergSharp.Avro.Internal.Errors;
+using IcebergSharp.Avro.Internal.Schema;
+
+namespace IcebergSharp.Avro.Internal.Decode;
+
+/// <summary>
+/// Turns a single Avro <c>manifest_file</c> record into a <see cref="ManifestFile"/>.
+/// Fields are matched by their Iceberg <c>field-id</c>, so one decoder covers v1
+/// (which lacks the rows-count fields) as well as v2 (which requires them).
+/// </summary>
+internal static class ManifestFileSink
+{
+    /// <summary>
+    /// Walks the fields of <paramref name="record"/> in schema order: recognised field-ids are
+    /// decoded into locals, every other field is skipped, then the <see cref="ManifestFile"/> is built.
+    /// </summary>
+    /// <exception cref="AvroFormatException"><c>manifest_path</c> is missing or null.</exception>
+    public static ManifestFile Decode(ref BinaryDecoder decoder, AvroRecord record, int formatVersion)
+    {
+        string? path = null;
+        long length = 0;
+        var specId = 0;
+        ManifestContent content = ManifestContent.Data;
+        long seqNumber = 0;
+        long minSeqNumber = 0;
+        long snapshotId = 0;
+        var addedFiles = 0;
+        var existingFiles = 0;
+        var deletedFiles = 0;
+        long addedRows = 0;
+        long existingRows = 0;
+        long deletedRows = 0;
+        List<FieldSummary>? summaries = null;
+        byte[]? keyMetadata = null;
+
+        foreach (AvroRecordField f in record.Fields)
+        {
+            switch (f.FieldId)
+            {
+                case IcebergFieldIds.ManifestPath:
+                    path = NullableReader.ReadStringRequired(ref decoder, f.Schema, "manifest_path");
+                    break;
+                case IcebergFieldIds.ManifestLength:
+                    length = NullableReader.ReadLongRequiredOrZero(ref decoder, f.Schema);
+                    break;
+                case IcebergFieldIds.PartitionSpecId:
+                    specId = NullableReader.ReadIntRequiredOrZero(ref decoder, f.Schema);
+                    break;
+                case IcebergFieldIds.Content:
+                    content = (ManifestContent)NullableReader.ReadIntRequiredOrZero(ref decoder, f.Schema);
+                    break;
+                case IcebergFieldIds.SequenceNumber:
+                    seqNumber = NullableReader.ReadLongRequiredOrZero(ref decoder, f.Schema);
+                    break;
+                case IcebergFieldIds.MinSequenceNumber:
+                    minSeqNumber = NullableReader.ReadLongRequiredOrZero(ref decoder, f.Schema);
+                    break;
+                case IcebergFieldIds.AddedSnapshotId:
+                    snapshotId = NullableReader.ReadLongRequiredOrZero(ref decoder, f.Schema);
+                    break;
+                case IcebergFieldIds.AddedFilesCount:
+                    addedFiles = ReadIntCount(ref decoder, f.Schema, "added_data_files_count");
+                    break;
+                case IcebergFieldIds.ExistingFilesCount:
+                    existingFiles = ReadIntCount(ref decoder, f.Schema, "existing_data_files_count");
+                    break;
+                case IcebergFieldIds.DeletedFilesCount:
+                    deletedFiles = ReadIntCount(ref decoder, f.Schema, "deleted_data_files_count");
+                    break;
+                case IcebergFieldIds.AddedRowsCount:
+                    addedRows = NullableReader.ReadLongRequiredOrZero(ref decoder, f.Schema);
+                    break;
+                case IcebergFieldIds.ExistingRowsCount:
+                    existingRows = NullableReader.ReadLongRequiredOrZero(ref decoder, f.Schema);
+                    break;
+                case IcebergFieldIds.DeletedRowsCount:
+                    deletedRows = NullableReader.ReadLongRequiredOrZero(ref decoder, f.Schema);
+                    break;
+                case IcebergFieldIds.Partitions:
+                    summaries = DecodePartitions(ref decoder, f.Schema);
+                    break;
+                case IcebergFieldIds.KeyMetadataManifest:
+                    keyMetadata = NullableReader.ReadBytesOrNull(ref decoder, f.Schema);
+                    break;
+                default:
+                    ShapeDecoder.SkipValue(ref decoder, f.Schema);
+                    break;
+            }
+        }
+
+        return new ManifestFile(
+            path ?? throw new AvroFormatException("manifest_file record is missing manifest_path (field-id 500)"),
+            length,
+            specId,
+            content,
+            seqNumber,
+            minSeqNumber,
+            snapshotId,
+            addedFiles,
+            existingFiles,
+            deletedFiles,
+            addedRows,
+            existingRows,
+            deletedRows,
+            summaries,
+            keyMetadata ?? [],
+            formatVersion);
+    }
+
+    /// <summary>
+    /// Decodes the optional <c>partitions</c> array; the null union branch yields an empty list.
+    /// </summary>
+    private static List<FieldSummary> DecodePartitions(ref BinaryDecoder decoder, AvroSchema schema)
+    {
+        if (NullableReader.PeelNullable(ref decoder, ref schema))
+        {
+            return [];
+        }
+
+        if (schema is not AvroArray array)
+        {
+            throw new AvroFormatException("partitions field must be array<field_summary>");
+        }
+
+        // Some writers wrap the field_summary record in [null, record] inside the array's items.
+        if (array.Items is not (AvroRecord or AvroUnion { NonNull: AvroRecord }))
+        {
+            throw new AvroFormatException("partitions array element must be a field_summary record");
+        }
+
+        var summaries = new List<FieldSummary>();
+        for (var remaining = decoder.ReadBlockCount(); remaining != 0; remaining = decoder.ReadBlockCount())
+        {
+            for (long n = 0; n < remaining; n++)
+            {
+                AvroSchema elementSchema = array.Items;
+                if (NullableReader.PeelNullable(ref decoder, ref elementSchema))
+                {
+                    throw new AvroFormatException("null field_summary in partitions array");
+                }
+
+                summaries.Add(DecodeFieldSummary(ref decoder, (AvroRecord)elementSchema));
+            }
+        }
+
+        return summaries;
+    }
+
+    /// <summary>
+    /// Reads a file-count field through the long reader, then range-checks it down to <see cref="int"/>.
+    /// </summary>
+    private static int ReadIntCount(ref BinaryDecoder decoder, AvroSchema schema, string fieldName)
+        => NullableReader.ToInt32(NullableReader.ReadLongRequiredOrZero(ref decoder, schema), fieldName);
+
+    /// <summary>
+    /// Decodes one <c>field_summary</c> record; absent or null bounds become empty arrays.
+    /// </summary>
+    private static FieldSummary DecodeFieldSummary(ref BinaryDecoder decoder, AvroRecord rec)
+    {
+        var hasNull = false;
+        bool? hasNaN = null;
+        byte[] lowerBound = [];
+        byte[] upperBound = [];
+
+        foreach (AvroRecordField f in rec.Fields)
+        {
+            switch (f.FieldId)
+            {
+                case IcebergFieldIds.FsContainsNull:
+                    hasNull = NullableReader.ReadBoolOrNull(ref decoder, f.Schema) ?? false;
+                    break;
+                case IcebergFieldIds.FsContainsNaN:
+                    hasNaN = NullableReader.ReadBoolOrNull(ref decoder, f.Schema);
+                    break;
+                case IcebergFieldIds.FsLowerBound:
+                    lowerBound = NullableReader.ReadBytesOrNull(ref decoder, f.Schema) ?? [];
+                    break;
+                case IcebergFieldIds.FsUpperBound:
+                    upperBound = NullableReader.ReadBytesOrNull(ref decoder, f.Schema) ?? [];
+                    break;
+                default:
+                    ShapeDecoder.SkipValue(ref decoder, f.Schema);
+                    break;
+            }
+        }
+
+        return new FieldSummary(hasNull, hasNaN, lowerBound, upperBound);
+    }
+}
diff --git a/src/IcebergSharp.Avro/Internal/Decode/NullableReader.cs b/src/IcebergSharp.Avro/Internal/Decode/NullableReader.cs
new file mode 100644
index 0000000..4ace650
--- /dev/null
+++ b/src/IcebergSharp.Avro/Internal/Decode/NullableReader.cs
@@ -0,0 +1,130 @@
+using IcebergSharp.Avro.Internal.Errors;
+using IcebergSharp.Avro.Internal.Schema;
+
+namespace IcebergSharp.Avro.Internal.Decode;
+
+/// <summary>
+/// Readers for Avro values that may be wrapped in a <c>[null, T]</c> union. Each one first
+/// consumes the union branch (when the schema is a union) and then reads the carried type.
+/// The <c>...OrNull</c> readers report the null branch as <c>null</c>; the <c>...RequiredOrZero</c>
+/// readers collapse it to zero so callers don't carry per-field null flags.
+/// </summary>
+internal static class NullableReader
+{
+    /// <summary>Consumes the branch index when <paramref name="schema"/> is a union. Returns <c>true</c> for the null branch;
+    /// otherwise swaps <paramref name="schema"/> for the non-null branch (non-unions stay untouched) and returns <c>false</c>.</summary>
+    public static bool PeelNullable(ref BinaryDecoder decoder, ref AvroSchema schema)
+    {
+        if (schema is AvroUnion nullable)
+        {
+            var selected = decoder.ReadUnionBranch();
+            if (selected == nullable.NullBranchIndex)
+            {
+                return true;
+            }
+
+            schema = selected == nullable.NonNullBranchIndex
+                ? nullable.NonNull
+                : throw new AvroFormatException($"unexpected union branch {selected}");
+        }
+
+        return false;
+    }
+
+    /// <summary>Reads a string, or <c>null</c> for the null branch; any non-string schema is rejected.</summary>
+    public static string? ReadStringOrNull(ref BinaryDecoder decoder, AvroSchema schema)
+    {
+        if (PeelNullable(ref decoder, ref schema))
+        {
+            return null;
+        }
+
+        return schema switch
+        {
+            AvroPrimitive { Kind: AvroPrimitiveKind.String } => decoder.ReadString(),
+            _ => throw new AvroFormatException($"expected string schema, got {schema.GetType().Name}"),
+        };
+    }
+
+    /// <summary>Reads a string and throws an <see cref="AvroFormatException"/> naming the field when it is null.</summary>
+    public static string ReadStringRequired(ref BinaryDecoder decoder, AvroSchema schema, string fieldName)
+        => ReadStringOrNull(ref decoder, schema)
+        ?? throw new AvroFormatException($"required string field '{fieldName}' is null");
+
+    /// <summary>Reads a long (an int schema is widened), or <c>null</c> for the null branch.</summary>
+    public static long? ReadLongOrNull(ref BinaryDecoder decoder, AvroSchema schema)
+    {
+        if (PeelNullable(ref decoder, ref schema))
+        {
+            return null;
+        }
+
+        return schema switch
+        {
+            AvroPrimitive { Kind: AvroPrimitiveKind.Int } => decoder.ReadInt(),
+            AvroPrimitive { Kind: AvroPrimitiveKind.Long } => decoder.ReadLong(),
+            _ => throw new AvroFormatException($"expected long/int schema, got {schema.GetType().Name}"),
+        };
+    }
+
+    /// <summary>Same as <see cref="ReadLongOrNull"/>, with the null branch mapped to zero.</summary>
+    public static long ReadLongRequiredOrZero(ref BinaryDecoder decoder, AvroSchema schema)
+        => ReadLongOrNull(ref decoder, schema) ?? 0L;
+
+    /// <summary>Reads an int (a long schema is range-checked and narrowed), or <c>null</c> for the null branch.</summary>
+    public static int? ReadIntOrNull(ref BinaryDecoder decoder, AvroSchema schema)
+    {
+        if (PeelNullable(ref decoder, ref schema))
+        {
+            return null;
+        }
+
+        return schema switch
+        {
+            AvroPrimitive { Kind: AvroPrimitiveKind.Long } => ToInt32(decoder.ReadLong(), "int-compatible long"),
+            AvroPrimitive { Kind: AvroPrimitiveKind.Int } => decoder.ReadInt(),
+            _ => throw new AvroFormatException($"expected int schema, got {schema.GetType().Name}"),
+        };
+    }
+
+    /// <summary>Same as <see cref="ReadIntOrNull"/>, with the null branch mapped to zero.</summary>
+    public static int ReadIntRequiredOrZero(ref BinaryDecoder decoder, AvroSchema schema)
+        => ReadIntOrNull(ref decoder, schema) ?? 0;
+
+    /// <summary>Narrows <paramref name="value"/> to <see cref="int"/>, throwing when it lies outside the Int32 range.</summary>
+    public static int ToInt32(long value, string fieldName)
+        => value is >= int.MinValue and <= int.MaxValue
+            ? (int)value
+            : throw new AvroFormatException($"{fieldName} value {value} is outside Int32 range");
+
+    /// <summary>Reads a boolean, or <c>null</c> for the null branch; any non-boolean schema is rejected.</summary>
+    public static bool? ReadBoolOrNull(ref BinaryDecoder decoder, AvroSchema schema)
+    {
+        if (PeelNullable(ref decoder, ref schema))
+        {
+            return null;
+        }
+
+        return schema switch
+        {
+            AvroPrimitive { Kind: AvroPrimitiveKind.Boolean } => decoder.ReadBoolean(),
+            _ => throw new AvroFormatException($"expected boolean schema, got {schema.GetType().Name}"),
+        };
+    }
+
+    /// <summary>Reads a bytes or fixed value into a new array, or returns <c>null</c> for the null branch.</summary>
+    public static byte[]? ReadBytesOrNull(ref BinaryDecoder decoder, AvroSchema schema)
+    {
+        if (PeelNullable(ref decoder, ref schema))
+        {
+            return null;
+        }
+
+        return schema switch
+        {
+            AvroFixed f => decoder.ReadFixed(f.Size).ToArray(),
+            AvroPrimitive { Kind: AvroPrimitiveKind.Bytes } => decoder.ReadBytesSpan().ToArray(),
+            _ => throw new AvroFormatException($"expected bytes/fixed schema, got {schema.GetType().Name}"),
+        };
+    }
+}
diff --git a/src/IcebergSharp.Avro/Internal/Decode/PartitionRecordSink.cs b/src/IcebergSharp.Avro/Internal/Decode/PartitionRecordSink.cs
new file mode 100644
index 0000000..5dc1269
--- /dev/null
+++ b/src/IcebergSharp.Avro/Internal/Decode/PartitionRecordSink.cs
@@ -0,0 +1,39 @@
+using IcebergSharp.Avro.Internal.Schema;
+using IcebergSharp.Types;
+
+namespace IcebergSharp.Avro.Internal.Decode;
+
+/// <summary>
+/// Decodes the <c>data_file.partition</c> record of a manifest into <see cref="PartitionValues"/>, driven by
+/// the Avro record's own schema (whose field-ids the writer stamps to match the <c>partition-spec</c> metadata key).
+/// </summary>
+internal static class PartitionRecordSink
+{
+    /// <summary>Derives the name and Iceberg type of every partition column, in field order, from the partition-record schema.</summary>
+    public static (string[] Names, IcebergType[] Types) ResolveSchema(AvroRecord partitionRecord)
+    {
+        var fieldCount = partitionRecord.Fields.Count;
+        var names = new string[fieldCount];
+        var types = new IcebergType[fieldCount];
+        for (var i = 0; i < fieldCount; i++)
+        {
+            names[i] = partitionRecord.Fields[i].Name;
+            types[i] = AvroToIcebergType.Resolve(partitionRecord.Fields[i].Schema);
+        }
+
+        return (names, types);
+    }
+
+    /// <summary>Decodes one value per record field, in field order, and bundles them with the supplied names and types.</summary>
+    public static PartitionValues Decode(ref BinaryDecoder decoder, AvroRecord partitionRecord, string[] names, IcebergType[] types)
+    {
+        var values = new object?[partitionRecord.Fields.Count];
+        var next = 0;
+        foreach (AvroRecordField field in partitionRecord.Fields)
+        {
+            values[next++] = ShapeDecoder.DecodeValue(ref decoder, field.Schema);
+        }
+
+        return new PartitionValues(names, types, values);
+    }
+}
diff --git a/src/IcebergSharp.Avro/Internal/Decode/ShapeDecoder.cs b/src/IcebergSharp.Avro/Internal/Decode/ShapeDecoder.cs
new file mode 100644
index 0000000..c80e2a9
--- /dev/null
+++ b/src/IcebergSharp.Avro/Internal/Decode/ShapeDecoder.cs
@@ -0,0 +1,272 @@
+using System.Globalization;
+using IcebergSharp.Avro.Internal.Errors;
+using IcebergSharp.Avro.Internal.Schema;
+
+namespace IcebergSharp.Avro.Internal.Decode;
+
+/// <summary>
+/// Schema-aware traversal helpers over a <see cref="BinaryDecoder"/>. The
+/// manifest/manifest-list record decoders use these to skip values they do not
+/// care about and to materialise typed values for the partition record (whose
+/// shape is dynamic).
+/// </summary>
+internal static class ShapeDecoder
+{
+    /// <summary>
+    /// Consumes the next value of the given schema from the decoder, discarding
+    /// it. Used when a record field's field-id is not one the caller wires up.
+    /// </summary>
+    public static void SkipValue(ref BinaryDecoder decoder, AvroSchema schema)
+    {
+        switch (schema)
+        {
+            case AvroPrimitive p:
+                SkipPrimitive(ref decoder, p);
+                break;
+
+            case AvroFixed f:
+                _ = decoder.ReadFixed(f.Size);
+                break;
+
+            case AvroEnum:
+                _ = decoder.ReadInt();
+                break;
+
+            case AvroUnion u:
+                {
+                    var branch = decoder.ReadUnionBranch();
+                    if (branch == u.NullBranchIndex)
+                    {
+                        return;
+                    }
+
+                    if (branch != u.NonNullBranchIndex)
+                    {
+                        throw new AvroFormatException($"unexpected union branch {branch}");
+                    }
+
+                    SkipValue(ref decoder, u.NonNull);
+                    break;
+                }
+
+            case AvroArray a:
+                {
+                    while (true)
+                    {
+                        var count = decoder.ReadBlockCount();
+                        if (count == 0)
+                        {
+                            break;
+                        }
+
+                        for (long i = 0; i < count; i++)
+                        {
+                            SkipValue(ref decoder, a.Items);
+                        }
+                    }
+
+                    break;
+                }
+
+            case AvroMap m:
+                {
+                    while (true)
+                    {
+                        var count = decoder.ReadBlockCount();
+                        if (count == 0)
+                        {
+                            break;
+                        }
+
+                        for (long i = 0; i < count; i++)
+                        {
+                            _ = decoder.ReadBytesSpan(); // string key: skip the raw bytes (as SkipPrimitive does) instead of decoding
+                            SkipValue(ref decoder, m.Values);
+                        }
+                    }
+
+                    break;
+                }
+
+            case AvroRecord r:
+                {
+                    foreach (AvroRecordField f in r.Fields)
+                    {
+                        SkipValue(ref decoder, f.Schema);
+                    }
+
+                    break;
+                }
+
+            default:
+                throw new AvroFormatException($"cannot skip unsupported schema kind {schema.GetType().Name}");
+        }
+    }
+
+    private static void SkipPrimitive(ref BinaryDecoder decoder, AvroPrimitive p)
+    {
+        switch (p.Kind)
+        {
+            case AvroPrimitiveKind.Null: break;
+            case AvroPrimitiveKind.Boolean: _ = decoder.ReadBoolean(); break;
+            case AvroPrimitiveKind.Int: _ = decoder.ReadInt(); break;
+            case AvroPrimitiveKind.Long: _ = decoder.ReadLong(); break;
+            case AvroPrimitiveKind.Float: _ = decoder.ReadFloat(); break;
+            case AvroPrimitiveKind.Double: _ = decoder.ReadDouble(); break;
+            case AvroPrimitiveKind.Bytes: _ = decoder.ReadBytesSpan(); break;
+            case AvroPrimitiveKind.String: _ = decoder.ReadBytesSpan(); break;
+            default: throw new AvroFormatException($"cannot skip primitive {p.Kind}");
+        }
+    }
+
+    /// <summary>
+    /// Decodes a single value of the given schema as a CLR <see cref="object"/>.
+    /// Used for partition column values; honours the logical type to produce
+    /// <see cref="DateOnly"/>, <see cref="TimeSpan"/>, <see cref="DateTime"/>,
+    /// <see cref="Guid"/>, and <see cref="decimal"/> where appropriate.
+    /// </summary>
+    public static object? DecodeValue(ref BinaryDecoder decoder, AvroSchema schema)
+    {
+        if (schema is AvroUnion u)
+        {
+            var branch = decoder.ReadUnionBranch();
+            if (branch == u.NullBranchIndex)
+            {
+                return null;
+            }
+
+            if (branch != u.NonNullBranchIndex)
+            {
+                throw new AvroFormatException($"unexpected union branch {branch}");
+            }
+
+            schema = u.NonNull;
+        }
+
+        return schema switch
+        {
+            AvroPrimitive p => DecodePrimitive(ref decoder, p),
+            AvroFixed f => DecodeFixed(ref decoder, f),
+            _ => throw new NotSupportedException($"unexpected partition-value schema kind {schema.GetType().Name}"),
+        };
+    }
+
+    private static object DecodePrimitive(ref BinaryDecoder decoder, AvroPrimitive p)
+    {
+        switch (p.LogicalType)
+        {
+            case AvroLogicalType.Date:
+                return DateOnly.FromDayNumber(_epochDayNumber + decoder.ReadInt());
+
+            case AvroLogicalType.TimeMicros:
+                {
+                    // One microsecond is 10 ticks; checked so a corrupt value cannot wrap silently.
+                    return TimeSpan.FromTicks(checked(decoder.ReadLong() * 10));
+                }
+
+            case AvroLogicalType.TimeMillis:
+                {
+                    var millis = decoder.ReadInt();
+                    return TimeSpan.FromMilliseconds(millis);
+                }
+
+            case AvroLogicalType.TimestampMicros:
+                {
+                    // One microsecond is 10 ticks; checked so a corrupt value cannot wrap silently.
+                    return DateTime.UnixEpoch.AddTicks(checked(decoder.ReadLong() * 10));
+                }
+
+            case AvroLogicalType.TimestampMillis:
+                {
+                    var millis = decoder.ReadLong();
+                    return DateTime.UnixEpoch.AddMilliseconds(millis);
+                }
+
+            case AvroLogicalType.Uuid:
+                {
+                    var str = decoder.ReadString();
+                    return Guid.Parse(str, CultureInfo.InvariantCulture);
+                }
+
+            case AvroLogicalType.Decimal:
+                {
+                    // Iceberg encodes decimals as variable-length big-endian two's complement bytes.
+                    ReadOnlySpan<byte> bytes = decoder.ReadBytesSpan();
+                    return DecodeDecimal(bytes, p.DecimalScale);
+                }
+        }
+
+        return p.Kind switch
+        {
+            AvroPrimitiveKind.Boolean => decoder.ReadBoolean(),
+            AvroPrimitiveKind.Int => decoder.ReadInt(),
+            AvroPrimitiveKind.Long => decoder.ReadLong(),
+            AvroPrimitiveKind.Float => decoder.ReadFloat(),
+            AvroPrimitiveKind.Double => decoder.ReadDouble(),
+            AvroPrimitiveKind.Bytes => decoder.ReadBytesSpan().ToArray(),
+            AvroPrimitiveKind.String => decoder.ReadString(),
+            _ => throw new AvroFormatException($"cannot decode primitive {p.Kind}"),
+        };
+    }
+
+    private static object DecodeFixed(ref BinaryDecoder decoder, AvroFixed f)
+    {
+        ReadOnlySpan<byte> bytes = decoder.ReadFixed(f.Size);
+
+        return f.LogicalType switch
+        {
+            AvroLogicalType.Decimal => DecodeDecimal(bytes, f.DecimalScale),
+            AvroLogicalType.Uuid => DecodeUuidBytes(bytes),
+            _ => bytes.ToArray(),
+        };
+    }
+
+    /// <summary>
+    /// Converts a big-endian two's-complement unscaled integer into a
+    /// <see cref="decimal"/> by applying <paramref name="scale"/>; empty input decodes as zero.
+    /// </summary>
+    /// <exception cref="OverflowException">A part of the value does not fit in <see cref="decimal"/>.</exception>
+    private static decimal DecodeDecimal(ReadOnlySpan<byte> bytes, int scale)
+    {
+        if (bytes.IsEmpty)
+        {
+            return decimal.Zero;
+        }
+
+        // BigInteger parses big-endian input directly, so no reversed scratch copy is needed.
+        // The length comes from the file, so it must never size a stackalloc buffer.
+        var unscaled = new System.Numerics.BigInteger(bytes, isUnsigned: false, isBigEndian: true);
+        var pow = System.Numerics.BigInteger.Pow(10, scale);
+        var quotient = System.Numerics.BigInteger.DivRem(unscaled, pow, out System.Numerics.BigInteger remainder);
+        // Reconstruct the decimal value: quotient + remainder/10^scale. The casts below
+        // throw OverflowException when a part is outside the decimal range.
+        var whole = (decimal)quotient;
+        if (remainder.IsZero)
+        {
+            return whole;
+        }
+
+        var frac = (decimal)remainder / (decimal)pow;
+        return whole + frac;
+    }
+
+    /// <summary>
+    /// Builds a <see cref="Guid"/> from a 16-byte fixed laid out in RFC 4122 big-endian order.
+    /// </summary>
+    /// <exception cref="AvroFormatException">The fixed is not exactly 16 bytes long.</exception>
+    private static Guid DecodeUuidBytes(ReadOnlySpan<byte> bytes)
+    {
+        if (bytes.Length != 16)
+        {
+            throw new AvroFormatException($"UUID fixed must be 16 bytes, got {bytes.Length}");
+        }
+
+        // Iceberg uses RFC-4122 big-endian byte layout (same as Java UUID.toString()),
+        // while System.Guid keeps its first three fields little-endian. The bigEndian
+        // constructor (available since .NET 8) performs that field swap itself, so the
+        // manual byte shuffle and its scratch buffer are no longer needed.
+        return new Guid(bytes, bigEndian: true);
+    }
+
+    private static readonly int _epochDayNumber = new DateOnly(1970, 1, 1).DayNumber;
+}
diff --git a/src/IcebergSharp.Avro/Internal/Errors/AvroFormatException.cs b/src/IcebergSharp.Avro/Internal/Errors/AvroFormatException.cs
new file mode 100644
index 0000000..cc45303
--- /dev/null
+++ b/src/IcebergSharp.Avro/Internal/Errors/AvroFormatException.cs
@@ -0,0 +1,45 @@
+using System.Globalization;
+
+namespace IcebergSharp.Avro.Internal.Errors;
+
+/// <summary>
+/// Signals that a stream violates the slice of the Avro OCF spec that IcebergSharp.Avro
+/// implements (manifests + manifest lists). It can carry a file offset and a contextual
+/// location so failures stay locatable in manifests that are hundreds of records long.
+/// </summary>
+/// <remarks>
+/// A sibling of <see cref="InvalidDataException"/> (which is sealed, so it cannot be subclassed). Catch it to handle only Avro-format errors.
+/// </remarks>
+internal sealed class AvroFormatException : Exception
+{
+    /// <summary>Offset supplied by the thrower, when one was given.</summary>
+    public long? FileOffset { get; }
+    /// <summary>Free-form location hint supplied by the thrower, when one was given.</summary>
+    public string? Location { get; }
+
+    public AvroFormatException(string message)
+        : base(message)
+    {
+    }
+
+    public AvroFormatException(string message, long fileOffset, string? location = null)
+        : base(BuildMessage(message, fileOffset, location))
+    {
+        Location = location;
+        FileOffset = fileOffset;
+    }
+
+    public AvroFormatException(string message, Exception inner)
+        : base(message, inner)
+    {
+    }
+
+    // Appends the offset (formatted with the invariant culture) and, when present, the location to the message.
+    private static string BuildMessage(string message, long fileOffset, string? location)
+    {
+        var offsetText = fileOffset.ToString(CultureInfo.InvariantCulture);
+        return location is not null
+            ? $"{message} (offset {offsetText}, {location})"
+            : $"{message} (offset {offsetText})";
+    }
+}
diff --git a/src/IcebergSharp.Avro/Internal/Ocf/OcfHeader.cs b/src/IcebergSharp.Avro/Internal/Ocf/OcfHeader.cs
new file mode 100644
index 0000000..9ece3e8
--- /dev/null
+++ b/src/IcebergSharp.Avro/Internal/Ocf/OcfHeader.cs
@@ -0,0 +1,19 @@
+namespace IcebergSharp.Avro.Internal.Ocf;
+
+/// <summary>
+/// Immutable view of a parsed Avro Object Container File header: the schema
+/// JSON, the codec name, the sync bytes, and every metadata key the writer
+/// attached (Iceberg uses these for <c>partition-spec</c>, <c>schema</c>,
+/// <c>format-version</c>).
+/// </summary>
+internal sealed class OcfHeader
+{
+    /// <summary>Number of bytes in a sync marker.</summary>
+    public const int SyncMarkerSize = 16;
+
+    /// <summary>Stores the supplied header parts as-is; no copies are made.</summary>
+    public OcfHeader(string schemaJson, string codec, byte[] sync, IReadOnlyDictionary<string, byte[]> metadata)
+    {
+        SchemaJson = schemaJson;
+        Codec = codec;
+        Sync = sync;
+        Metadata = metadata;
+    }
+
+    /// <summary>Avro OCF magic: <c>Obj\x01</c>.</summary>
+    public static ReadOnlySpan<byte> Magic => "Obj\x01"u8;
+
+    /// <summary>Schema JSON text supplied at construction.</summary>
+    public string SchemaJson { get; }
+
+    /// <summary>Codec name supplied at construction.</summary>
+    public string Codec { get; }
+
+    /// <summary>Sync bytes supplied at construction.</summary>
+    public byte[] Sync { get; }
+
+    /// <summary>Header metadata entries supplied at construction.</summary>
+    public IReadOnlyDictionary<string, byte[]> Metadata { get; }
+}
diff --git a/src/IcebergSharp.Avro/Internal/Ocf/OcfReader.cs b/src/IcebergSharp.Avro/Internal/Ocf/OcfReader.cs
new file mode 100644
index 0000000..8a44405
--- /dev/null
+++ b/src/IcebergSharp.Avro/Internal/Ocf/OcfReader.cs
@@ -0,0 +1,366 @@
+using System.Buffers;
+using System.Text;
+using IcebergSharp.Avro.Internal.Codec;
+using IcebergSharp.Avro.Internal.Decode;
+using IcebergSharp.Avro.Internal.Errors;
+
+namespace IcebergSharp.Avro.Internal.Ocf;
+
+/// <summary>
+/// Async block iterator over an Avro Object Container File. Reads the header on
+/// <see cref="InitializeAsync"/>, then yields one decompressed block at a time
+/// via <see cref="ReadNextBlockAsync"/>. Buffers are pooled and returned on
+/// dispose; callers must consume <see cref="CurrentBlock"/> before requesting
+/// the next block.
+/// </summary>
+internal sealed class OcfReader : IAsyncDisposable
+{
+    // Upper bound accepted for the byte-size prefix of a header metadata map block.
+    private const int _maxHeaderBlockSize = 16 * 1024 * 1024;
+    // Upper bound on the number of entries a header metadata map block may declare.
+    private const int _maxHeaderEntryCount = 1024;
+    // Upper bound on the encoded byte length of a header metadata key.
+    private const int _maxHeaderKeyLength = 4096;
+    // Upper bound on the byte length of a header metadata value.
+    private const int _maxHeaderValueLength = 16 * 1024 * 1024;
+
+    // Source stream; disposed together with the reader unless _leaveOpen is set.
+    private readonly Stream _stream;
+    private readonly bool _leaveOpen;
+    // Limits applied to each data block: encoded/decoded byte size and record count.
+    private readonly int _maxBlockSize;
+    private readonly int _maxBlockRecordCount;
+    // Scratch buffer for reading varints one byte at a time.
+    private readonly byte[] _singleByte = new byte[1];
+
+    // Buffers rented from ArrayPool<byte>.Shared; an empty array means "nothing rented".
+    private byte[] _compressedBuffer = [];
+    private byte[] _decompressedBuffer = [];
+    // Length and record count of the block currently held in _decompressedBuffer.
+    private int _currentBlockLength;
+    private int _currentRecordCount;
+    // Number of bytes consumed from _stream so far; used for error reporting.
+    private long _streamOffset;
+    // Populated by InitializeAsync.
+    private OcfHeader? _header;
+    private IBlockCodec? _codec;
+    private bool _initialized;
+
+    /// <summary>Creates a reader over <paramref name="stream"/>; nothing is read until <see cref="InitializeAsync"/> is called.</summary>
+    /// <param name="stream">Stream positioned at the start of the container file.</param>
+    /// <param name="leaveOpen">When <see langword="true"/>, the stream is not disposed with the reader.</param>
+    /// <param name="maxBlockSize">Largest accepted block size in bytes; must be positive.</param>
+    /// <param name="maxBlockRecordCount">Largest accepted record count per block; must be positive.</param>
+    public OcfReader(Stream stream, bool leaveOpen, int maxBlockSize, int maxBlockRecordCount = 1_000_000)
+    {
+        ArgumentNullException.ThrowIfNull(stream);
+        ArgumentOutOfRangeException.ThrowIfNegativeOrZero(maxBlockSize);
+        ArgumentOutOfRangeException.ThrowIfNegativeOrZero(maxBlockRecordCount);
+
+        (_stream, _leaveOpen) = (stream, leaveOpen);
+        (_maxBlockSize, _maxBlockRecordCount) = (maxBlockSize, maxBlockRecordCount);
+    }
+
+    /// <summary>Header parsed by <see cref="InitializeAsync"/>.</summary>
+    /// <exception cref="InvalidOperationException">The header has not been read yet.</exception>
+    public OcfHeader Header
+    {
+        get
+        {
+            if (_header is null)
+            {
+                throw new InvalidOperationException("call InitializeAsync first");
+            }
+
+            return _header;
+        }
+    }
+
+    /// <summary>The first <c>_currentBlockLength</c> bytes of the decompression buffer.</summary>
+    public ReadOnlySpan<byte> CurrentBlock
+    {
+        get { return new ReadOnlySpan<byte>(_decompressedBuffer, 0, _currentBlockLength); }
+    }
+
+    /// <summary>Record count of the most recently read block.</summary>
+    public int CurrentRecordCount
+    {
+        get { return _currentRecordCount; }
+    }
+
+    /// <summary>
+    /// Reads the container header: the magic bytes, the metadata map, then the sync
+    /// marker. Selects the block codec from <c>avro.codec</c> (treated as
+    /// <c>null</c> when the key is absent) and publishes <see cref="Header"/>.
+    /// Calling again after a successful initialization does nothing.
+    /// </summary>
+    /// <exception cref="AvroFormatException">
+    /// <c>avro.schema</c> is missing or the codec is neither <c>null</c> nor <c>deflate</c>.
+    /// </exception>
+    public async Task InitializeAsync(CancellationToken cancellationToken)
+    {
+        if (_initialized)
+        {
+            return;
+        }
+
+        await ReadMagicAsync(cancellationToken).ConfigureAwait(false);
+        var headerMetadata = await ReadHeaderMetadataAsync(cancellationToken).ConfigureAwait(false);
+        var syncMarker = await ReadExactAsync(OcfHeader.SyncMarkerSize, cancellationToken).ConfigureAwait(false);
+
+        if (!headerMetadata.TryGetValue("avro.schema", out var rawSchema))
+        {
+            throw new AvroFormatException("OCF header is missing 'avro.schema'", _streamOffset);
+        }
+
+        var codecName = headerMetadata.TryGetValue("avro.codec", out var rawCodec)
+            ? Encoding.UTF8.GetString(rawCodec)
+            : "null";
+
+        switch (codecName)
+        {
+            case "null":
+                _codec = NullCodec.Instance;
+                break;
+            case "deflate":
+                _codec = DeflateCodec.Instance;
+                break;
+            default:
+                throw new AvroFormatException($"unsupported codec '{codecName}'", _streamOffset);
+        }
+
+        _header = new OcfHeader(Encoding.UTF8.GetString(rawSchema), codecName, syncMarker, headerMetadata);
+        _initialized = true;
+    }
+
+    /// <summary>
+    /// Reads the next data block: the record-count and byte-size varints, the
+    /// encoded payload, and the trailing sync marker. The payload is decoded into
+    /// the pooled decompression buffer and exposed through
+    /// <see cref="CurrentBlock"/> and <see cref="CurrentRecordCount"/>.
+    /// </summary>
+    /// <returns>
+    /// <see langword="true"/> when a block was read and verified;
+    /// <see langword="false"/> when the stream ended before a new block header.
+    /// </returns>
+    /// <exception cref="InvalidOperationException"><see cref="InitializeAsync"/> has not completed.</exception>
+    /// <exception cref="AvroFormatException">
+    /// The record count or byte size is non-positive or over its limit, the decoded
+    /// block is over the size limit, the stream is truncated, or the sync marker
+    /// does not match the header.
+    /// </exception>
+    public async ValueTask<bool> ReadNextBlockAsync(CancellationToken cancellationToken)
+    {
+        if (!_initialized)
+        {
+            throw new InvalidOperationException("call InitializeAsync first");
+        }
+
+        // Block header: long(record-count) long(byte-size). Read varints byte-by-byte
+        // since we don't know the encoded length up front.
+        var blockStartOffset = _streamOffset;
+        var recordCountResult = await TryReadVarLongAsync(cancellationToken).ConfigureAwait(false);
+        if (recordCountResult is null)
+        {
+            return false; // clean EOF before block header
+        }
+
+        // A new block has started, so the decompression buffer is about to be reused.
+        // Stop exposing the previous block now: if anything below throws, CurrentBlock
+        // is empty instead of pairing new bytes with the old length or record count.
+        _currentBlockLength = 0;
+        _currentRecordCount = 0;
+
+        var recordCount = recordCountResult.Value;
+        var byteSize = await ReadVarLongAsync(cancellationToken).ConfigureAwait(false);
+
+        if (recordCount <= 0)
+        {
+            throw new AvroFormatException($"invalid block record count {recordCount}", blockStartOffset);
+        }
+
+        if (recordCount > _maxBlockRecordCount)
+        {
+            throw new AvroFormatException($"block record count {recordCount} exceeds limit {_maxBlockRecordCount}", blockStartOffset);
+        }
+
+        if (byteSize <= 0 || byteSize > _maxBlockSize)
+        {
+            throw new AvroFormatException($"invalid block byte size {byteSize} (max {_maxBlockSize})", blockStartOffset);
+        }
+
+        // Safe narrowing: byteSize was just bounded by the int-typed _maxBlockSize.
+        var encodedSize = (int)byteSize;
+        await EnsureCompressedCapacityAsync(encodedSize, cancellationToken).ConfigureAwait(false);
+        await ReadExactIntoAsync(_compressedBuffer.AsMemory(0, encodedSize), cancellationToken).ConfigureAwait(false);
+
+        // Decompress into the decompressed buffer (resized inside the codec if necessary).
+        if (_decompressedBuffer.Length == 0)
+        {
+            _decompressedBuffer = ArrayPool<byte>.Shared.Rent(Math.Max(4096, encodedSize));
+        }
+
+        var decodedLength = _codec!.Decode(_compressedBuffer.AsSpan(0, encodedSize), ref _decompressedBuffer);
+        if (decodedLength > _maxBlockSize)
+        {
+            throw new AvroFormatException($"decompressed block size {decodedLength} exceeds limit {_maxBlockSize}", blockStartOffset);
+        }
+
+        // Verify the trailing sync marker.
+        var sync = await ReadExactAsync(OcfHeader.SyncMarkerSize, cancellationToken).ConfigureAwait(false);
+        if (!sync.AsSpan().SequenceEqual(_header!.Sync))
+        {
+            throw new AvroFormatException("sync marker mismatch", _streamOffset);
+        }
+
+        // Publish only after every check has passed. The cast is safe because
+        // recordCount was bounded by the int-typed _maxBlockRecordCount above.
+        _currentBlockLength = decodedLength;
+        _currentRecordCount = (int)recordCount;
+        return true;
+    }
+
+    /// <summary>
+    /// Returns any rented buffers to the shared pool, clears the current-block
+    /// state, and disposes the underlying stream unless the reader was created
+    /// with <c>leaveOpen</c>.
+    /// </summary>
+    public async ValueTask DisposeAsync()
+    {
+        // Clear the block view first: once the buffer is back in the pool its bytes
+        // no longer belong to this reader, and a stale length would make
+        // CurrentBlock throw ArgumentOutOfRangeException against the empty array.
+        _currentBlockLength = 0;
+        _currentRecordCount = 0;
+
+        if (_compressedBuffer.Length > 0)
+        {
+            ArrayPool<byte>.Shared.Return(_compressedBuffer);
+            _compressedBuffer = [];
+        }
+
+        if (_decompressedBuffer.Length > 0)
+        {
+            ArrayPool<byte>.Shared.Return(_decompressedBuffer);
+            _decompressedBuffer = [];
+        }
+
+        if (!_leaveOpen)
+        {
+            await _stream.DisposeAsync().ConfigureAwait(false);
+        }
+    }
+
+    /// <summary>Reads the leading magic bytes and rejects the stream when they differ from <see cref="OcfHeader.Magic"/>.</summary>
+    private async ValueTask ReadMagicAsync(CancellationToken cancellationToken)
+    {
+        var leadingBytes = await ReadExactAsync(OcfHeader.Magic.Length, cancellationToken).ConfigureAwait(false);
+        if (leadingBytes.AsSpan().SequenceEqual(OcfHeader.Magic))
+        {
+            return;
+        }
+
+        // The magic sits at the very start of the file, hence the fixed offset 0.
+        var found = Convert.ToHexString(leadingBytes);
+        throw new AvroFormatException($"invalid Avro OCF magic: 0x{found}; expected Obj 01", 0);
+    }
+
+    /// <summary>
+    /// Reads the header metadata map: a sequence of map blocks terminated by a
+    /// zero count. A negative count means <c>-count</c> entries preceded by a
+    /// byte-size prefix. Later entries overwrite earlier ones with the same key.
+    /// </summary>
+    /// <returns>The metadata entries keyed by ordinal string comparison.</returns>
+    /// <exception cref="AvroFormatException">
+    /// A count, byte size, key length or value length is out of range, or the map
+    /// declares more than <c>_maxHeaderEntryCount</c> entries in total.
+    /// </exception>
+    private async ValueTask<IReadOnlyDictionary<string, byte[]>> ReadHeaderMetadataAsync(CancellationToken cancellationToken)
+    {
+        // The whole map is held in memory; it is tiny in practice, and the limits
+        // below keep a hostile file from making it large.
+        var dict = new Dictionary<string, byte[]>(StringComparer.Ordinal);
+
+        // Entries declared by all blocks so far. The cap must be cumulative: a
+        // per-block check alone lets a stream with many blocks grow the map forever.
+        long totalEntries = 0;
+
+        while (true)
+        {
+            var count = await ReadVarLongAsync(cancellationToken).ConfigureAwait(false);
+            if (count == 0)
+            {
+                return dict;
+            }
+
+            long entries;
+            if (count < 0)
+            {
+                if (count == long.MinValue)
+                {
+                    throw new AvroFormatException("OCF metadata block count is too small to negate", _streamOffset);
+                }
+
+                // Negative count: -count entries, followed by a non-negative byte-size header.
+                // The size is range-checked only; it is not compared with the bytes actually read.
+                entries = -count;
+                var byteSize = await ReadVarLongAsync(cancellationToken).ConfigureAwait(false);
+                if (byteSize < 0 || byteSize > _maxHeaderBlockSize)
+                {
+                    throw new AvroFormatException($"invalid OCF metadata block byte size {byteSize}", _streamOffset);
+                }
+            }
+            else
+            {
+                entries = count;
+            }
+
+            if (entries > _maxHeaderEntryCount)
+            {
+                throw new AvroFormatException($"OCF metadata entry count {entries} exceeds limit {_maxHeaderEntryCount}", _streamOffset);
+            }
+
+            // Both operands are at most _maxHeaderEntryCount here, so neither the
+            // subtraction nor the addition can overflow.
+            if (entries > _maxHeaderEntryCount - totalEntries)
+            {
+                throw new AvroFormatException($"OCF metadata total entry count {totalEntries + entries} exceeds limit {_maxHeaderEntryCount}", _streamOffset);
+            }
+
+            totalEntries += entries;
+
+            for (long i = 0; i < entries; i++)
+            {
+                var key = await ReadVarStringAsync(_maxHeaderKeyLength, cancellationToken).ConfigureAwait(false);
+                var value = await ReadVarBytesAsync(_maxHeaderValueLength, cancellationToken).ConfigureAwait(false);
+                dict[key] = value;
+            }
+        }
+    }
+
+    /// <summary>
+    /// Makes sure the compressed-block buffer holds at least <paramref name="size"/>
+    /// bytes, swapping it for a larger rented array when it is too small. The
+    /// previous contents are not preserved.
+    /// </summary>
+    /// <remarks>
+    /// Completes synchronously; the task-returning shape is kept so existing call
+    /// sites that await it are unaffected.
+    /// </remarks>
+    private ValueTask EnsureCompressedCapacityAsync(int size, CancellationToken cancellationToken)
+    {
+        _ = cancellationToken; // cancellation is checked on the actual stream reads
+
+        if (_compressedBuffer.Length < size)
+        {
+            // Detach the old array before returning it. If Rent throws, the field
+            // must not keep pointing at an array the pool already owns, otherwise
+            // DisposeAsync would return it a second time.
+            var previous = _compressedBuffer;
+            _compressedBuffer = [];
+            if (previous.Length > 0)
+            {
+                ArrayPool<byte>.Shared.Return(previous);
+            }
+
+            _compressedBuffer = ArrayPool<byte>.Shared.Rent(size);
+        }
+
+        return ValueTask.CompletedTask;
+    }
+
+    /// <summary>Allocates a new array of <paramref name="count"/> bytes and fills it completely from the stream.</summary>
+    private async ValueTask<byte[]> ReadExactAsync(int count, CancellationToken cancellationToken)
+    {
+        byte[] filled = new byte[count];
+        await ReadExactIntoAsync(filled.AsMemory(), cancellationToken).ConfigureAwait(false);
+        return filled;
+    }
+
+    /// <summary>
+    /// Fills <paramref name="destination"/> completely, issuing as many stream
+    /// reads as needed and advancing the tracked stream offset by every byte read.
+    /// </summary>
+    /// <exception cref="AvroFormatException">The stream ended before the destination was full.</exception>
+    private async ValueTask ReadExactIntoAsync(Memory<byte> destination, CancellationToken cancellationToken)
+    {
+        var remaining = destination;
+        while (!remaining.IsEmpty)
+        {
+            var read = await _stream.ReadAsync(remaining, cancellationToken).ConfigureAwait(false);
+            if (read == 0)
+            {
+                throw new AvroFormatException($"unexpected end of stream after {_streamOffset} bytes (need {remaining.Length} more)", _streamOffset);
+            }
+
+            remaining = remaining[read..];
+            _streamOffset += read;
+        }
+    }
+
+    /// <summary>
+    /// Reads one zigzag-encoded variable-length long. Returns
+    /// <see langword="null"/> when the stream is already at its end, i.e. before
+    /// any byte of the value has been read.
+    /// </summary>
+    private async ValueTask<long?> TryReadVarLongAsync(CancellationToken cancellationToken)
+    {
+        var bytesRead = await _stream.ReadAsync(_singleByte.AsMemory(0, 1), cancellationToken).ConfigureAwait(false);
+        if (bytesRead == 0)
+        {
+            return null;
+        }
+
+        _streamOffset += 1;
+
+        // Low 7 bits are payload; the high bit says whether more bytes follow.
+        var leadByte = _singleByte[0];
+        long raw = leadByte & 0x7F;
+        if ((leadByte & 0x80) != 0)
+        {
+            var upperBits = await ReadRemainingVarLongAsync(7, cancellationToken).ConfigureAwait(false);
+            raw |= upperBits;
+        }
+
+        // Zigzag decode: bit 0 carries the sign, the remaining bits the magnitude.
+        var magnitude = (long)((ulong)raw >> 1);
+        var signMask = -(raw & 1L);
+        return magnitude ^ signMask;
+    }
+
+    /// <summary>Reads one variable-length long, treating end of stream as a format error.</summary>
+    private async ValueTask<long> ReadVarLongAsync(CancellationToken cancellationToken)
+    {
+        var decoded = await TryReadVarLongAsync(cancellationToken).ConfigureAwait(false);
+        if (decoded is null)
+        {
+            throw new AvroFormatException("unexpected EOF while reading varint", _streamOffset);
+        }
+
+        return decoded.Value;
+    }
+
+    /// <summary>
+    /// Reads the continuation bytes of a varint whose first byte has already been
+    /// consumed. Each byte contributes its low 7 bits at the current bit position,
+    /// starting at <paramref name="initialShift"/>; a clear high bit ends the value.
+    /// </summary>
+    /// <returns>The accumulated bits, still zigzag-encoded and without the first byte's payload.</returns>
+    /// <exception cref="AvroFormatException">
+    /// The stream ended mid-value, or a continuation bit would push the bit position past 63.
+    /// </exception>
+    private async ValueTask<long> ReadRemainingVarLongAsync(int initialShift, CancellationToken cancellationToken)
+    {
+        long accumulated = 0;
+        var bitPosition = initialShift;
+        do
+        {
+            var bytesRead = await _stream.ReadAsync(_singleByte.AsMemory(0, 1), cancellationToken).ConfigureAwait(false);
+            if (bytesRead == 0)
+            {
+                throw new AvroFormatException("truncated varint", _streamOffset);
+            }
+
+            _streamOffset += 1;
+            var current = _singleByte[0];
+            accumulated |= (long)(current & 0x7F) << bitPosition;
+            if ((current & 0x80) == 0)
+            {
+                return accumulated;
+            }
+
+            bitPosition += 7;
+        }
+        while (bitPosition <= 63);
+
+        throw new AvroFormatException("varint too long", _streamOffset);
+    }
+
+    /// <summary>Reads a length-prefixed UTF-8 string whose byte length may not exceed <paramref name="maxLength"/>.</summary>
+    /// <exception cref="AvroFormatException">The length prefix is negative or larger than <paramref name="maxLength"/>.</exception>
+    private async ValueTask<string> ReadVarStringAsync(int maxLength, CancellationToken cancellationToken)
+    {
+        var byteLength = await ReadVarLongAsync(cancellationToken).ConfigureAwait(false);
+        if (byteLength < 0)
+        {
+            throw new AvroFormatException($"negative string length {byteLength}", _streamOffset);
+        }
+
+        if (byteLength > maxLength)
+        {
+            throw new AvroFormatException($"string length {byteLength} exceeds supported maximum {maxLength}", _streamOffset);
+        }
+
+        if (byteLength != 0)
+        {
+            // Safe narrowing: byteLength is bounded by the int-typed maxLength.
+            var utf8 = await ReadExactAsync((int)byteLength, cancellationToken).ConfigureAwait(false);
+            return Encoding.UTF8.GetString(utf8);
+        }
+
+        return string.Empty;
+    }
+
+    /// <summary>Reads a length-prefixed byte sequence whose length may not exceed <paramref name="maxLength"/>.</summary>
+    /// <exception cref="AvroFormatException">The length prefix is negative or larger than <paramref name="maxLength"/>.</exception>
+    private async ValueTask<byte[]> ReadVarBytesAsync(int maxLength, CancellationToken cancellationToken)
+    {
+        var byteLength = await ReadVarLongAsync(cancellationToken).ConfigureAwait(false);
+        if (byteLength < 0)
+        {
+            throw new AvroFormatException($"negative bytes length {byteLength}", _streamOffset);
+        }
+
+        if (byteLength > maxLength)
+        {
+            throw new AvroFormatException($"bytes length {byteLength} exceeds supported maximum {maxLength}", _streamOffset);
+        }
+
+        if (byteLength == 0)
+        {
+            return [];
+        }
+
+        // Safe narrowing: byteLength is bounded by the int-typed maxLength.
+        return await ReadExactAsync((int)byteLength, cancellationToken).ConfigureAwait(false);
+    }
+
+    /// <summary>Creates a <see cref="BinaryDecoder"/> over <see cref="CurrentBlock"/> for sinks to use.</summary>
+    public BinaryDecoder OpenBlockDecoder()
+    {
+        return new BinaryDecoder(CurrentBlock);
+    }
+}
diff --git a/src/IcebergSharp.Avro/Internal/Schema/AvroSchema.cs b/src/IcebergSharp.Avro/Internal/Schema/AvroSchema.cs
new file mode 100644
index 0000000..f1e960e
--- /dev/null
+++ b/src/IcebergSharp.Avro/Internal/Schema/AvroSchema.cs
@@ -0,0 +1,107 @@
+using System.Collections.ObjectModel;
+
+namespace IcebergSharp.Avro.Internal.Schema;
+
+/// <summary>
+/// Avro primitive types Iceberg manifests actually use. <c>Null</c> only appears
+/// as a branch of a <c>[null, T]</c> union — not on its own.
+/// </summary>
+internal enum AvroPrimitiveKind
+{
+    /// <summary>Avro type name <c>null</c>.</summary>
+    Null,
+    /// <summary>Avro type name <c>boolean</c>.</summary>
+    Boolean,
+    /// <summary>Avro type name <c>int</c>.</summary>
+    Int,
+    /// <summary>Avro type name <c>long</c>.</summary>
+    Long,
+    /// <summary>Avro type name <c>float</c>.</summary>
+    Float,
+    /// <summary>Avro type name <c>double</c>.</summary>
+    Double,
+    /// <summary>Avro type name <c>bytes</c>.</summary>
+    Bytes,
+    /// <summary>Avro type name <c>string</c>.</summary>
+    String,
+}
+
+/// <summary>
+/// Avro "logical types" that overlay a physical primitive with semantic meaning.
+/// Only the ones Iceberg manifest schemas can carry on a partition column are
+/// modelled — everything else is ignored at the schema-parser layer.
+/// </summary>
+internal enum AvroLogicalType
+{
+    /// <summary>No logical type; also the result for names the schema parser does not recognise.</summary>
+    None,
+    /// <summary><c>decimal</c>; the schema parser accepts it on <c>bytes</c> and fixed schemas.</summary>
+    Decimal,
+    /// <summary><c>date</c>; the schema parser accepts it on <c>int</c>.</summary>
+    Date,
+    /// <summary><c>time-millis</c>; the schema parser accepts it on <c>int</c>.</summary>
+    TimeMillis,
+    /// <summary><c>time-micros</c>; the schema parser accepts it on <c>long</c>.</summary>
+    TimeMicros,
+    /// <summary><c>timestamp-millis</c>; the schema parser accepts it on <c>long</c>.</summary>
+    TimestampMillis,
+    /// <summary><c>timestamp-micros</c>; the schema parser accepts it on <c>long</c>.</summary>
+    TimestampMicros,
+    /// <summary><c>uuid</c>; the schema parser accepts it on <c>string</c> and on 16-byte fixed schemas.</summary>
+    Uuid,
+}
+
+/// <summary>
+/// Common base of every node in the internal Avro schema model. Carries the
+/// optional logical-type annotation and, for decimals, precision and scale.
+/// </summary>
+internal abstract class AvroSchema
+{
+    /// <summary>Logical type attached to this schema; <see cref="AvroLogicalType.None"/> unless set at construction.</summary>
+    public AvroLogicalType LogicalType { get; init; } = AvroLogicalType.None;
+
+    /// <summary>Decimal precision (when <see cref="LogicalType"/> is <c>Decimal</c>).</summary>
+    public int DecimalPrecision { get; init; }
+
+    /// <summary>Decimal scale (when <see cref="LogicalType"/> is <c>Decimal</c>).</summary>
+    public int DecimalScale { get; init; }
+}
+
+/// <summary>Schema node for one of the primitive types in <see cref="AvroPrimitiveKind"/>.</summary>
+internal sealed class AvroPrimitive : AvroSchema
+{
+    public AvroPrimitive(AvroPrimitiveKind kind)
+    {
+        Kind = kind;
+    }
+
+    /// <summary>The primitive type this node represents.</summary>
+    public AvroPrimitiveKind Kind { get; }
+}
+
+/// <summary>Schema node for an Avro <c>fixed</c> type: a named type with a declared size.</summary>
+internal sealed class AvroFixed : AvroSchema
+{
+    public AvroFixed(string name, int size)
+    {
+        Name = name;
+        Size = size;
+    }
+
+    /// <summary>Declared type name.</summary>
+    public string Name { get; }
+
+    /// <summary>Declared size.</summary>
+    public int Size { get; }
+}
+
+/// <summary>Schema node for an Avro <c>enum</c>: a named type with a list of symbols.</summary>
+internal sealed class AvroEnum : AvroSchema
+{
+    public AvroEnum(string name, IReadOnlyList<string> symbols)
+    {
+        Name = name;
+
+        // Copy the symbols so later changes to the caller's list are not visible here.
+        Symbols = new ReadOnlyCollection<string>([.. symbols]);
+    }
+
+    /// <summary>Declared type name.</summary>
+    public string Name { get; }
+
+    /// <summary>Read-only copy of the symbols, in the order supplied.</summary>
+    public IReadOnlyList<string> Symbols { get; }
+}
+
+/// <summary>Schema node for an Avro <c>array</c>.</summary>
+internal sealed class AvroArray : AvroSchema
+{
+    public AvroArray(AvroSchema items)
+    {
+        Items = items;
+    }
+
+    /// <summary>Schema of each array element.</summary>
+    public AvroSchema Items { get; }
+
+    /// <summary>Iceberg field-id of the array element, when present.</summary>
+    public int? ElementId { get; init; }
+}
+
+/// <summary>Schema node for an Avro <c>map</c>.</summary>
+internal sealed class AvroMap : AvroSchema
+{
+    public AvroMap(AvroSchema values)
+    {
+        Values = values;
+    }
+
+    /// <summary>Schema of each map value.</summary>
+    public AvroSchema Values { get; }
+
+    /// <summary>Value of the <c>key-id</c> schema property, when present.</summary>
+    public int? KeyId { get; init; }
+
+    /// <summary>Value of the <c>value-id</c> schema property, when present.</summary>
+    public int? ValueId { get; init; }
+}
+
+/// <summary>
+/// Avro union restricted to the only shape IcebergSharp.Avro supports: two
+/// branches, exactly one of which is <c>null</c> — <c>[null, T]</c> or
+/// <c>[T, null]</c>. The parser rejects every other union.
+/// </summary>
+internal sealed class AvroUnion : AvroSchema
+{
+    public AvroUnion(AvroSchema nonNull, int nullBranchIndex)
+    {
+        NonNull = nonNull;
+        NullBranchIndex = nullBranchIndex;
+    }
+
+    /// <summary>Schema of the branch that is not <c>null</c>.</summary>
+    public AvroSchema NonNull { get; }
+
+    /// <summary>Zero-based index of the null branch in the encoded union.</summary>
+    public int NullBranchIndex { get; }
+
+    /// <summary>Zero-based index of the non-null branch in the encoded union.</summary>
+    public int NonNullBranchIndex
+    {
+        get
+        {
+            if (NullBranchIndex == 0)
+            {
+                return 1;
+            }
+
+            return 0;
+        }
+    }
+}
+
+/// <summary>Schema node for an Avro <c>record</c>: a named type with an ordered list of fields.</summary>
+internal sealed class AvroRecord : AvroSchema
+{
+    public AvroRecord(string name, IReadOnlyList<AvroRecordField> fields)
+    {
+        Name = name;
+
+        // Copy the fields so later changes to the caller's list are not visible here.
+        Fields = new ReadOnlyCollection<AvroRecordField>([.. fields]);
+    }
+
+    /// <summary>Declared record name.</summary>
+    public string Name { get; }
+
+    /// <summary>Read-only copy of the fields, in the order supplied.</summary>
+    public IReadOnlyList<AvroRecordField> Fields { get; }
+}
+
+/// <summary>One field of an <see cref="AvroRecord"/>.</summary>
+internal sealed class AvroRecordField
+{
+    public AvroRecordField(string name, AvroSchema schema, int? fieldId)
+    {
+        Name = name;
+        Schema = schema;
+        FieldId = fieldId;
+    }
+
+    /// <summary>Field name.</summary>
+    public string Name { get; }
+
+    /// <summary>Schema of the field's value.</summary>
+    public AvroSchema Schema { get; }
+
+    /// <summary>Iceberg <c>field-id</c> JSON property — the stable key the decoder routes on.</summary>
+    public int? FieldId { get; }
+}
diff --git a/src/IcebergSharp.Avro/Internal/Schema/AvroSchemaParser.cs b/src/IcebergSharp.Avro/Internal/Schema/AvroSchemaParser.cs
new file mode 100644
index 0000000..32dc8a9
--- /dev/null
+++ b/src/IcebergSharp.Avro/Internal/Schema/AvroSchemaParser.cs
@@ -0,0 +1,488 @@
+using System.Text;
+using System.Text.Json;
+using IcebergSharp.Avro.Internal.Errors;
+
+namespace IcebergSharp.Avro.Internal.Schema;
+
+/// <summary>
+/// Parses the JSON Avro schema embedded in an OCF header's <c>avro.schema</c>
+/// metadata key into the minimal internal model. Hand-rolled
+/// <see cref="Utf8JsonReader"/> walk — AOT-safe, no DTOs, no reflection.
+/// </summary>
+/// <remarks>
+/// Only the constructs Iceberg manifests use are supported. Named-type
+/// references across records, multi-branch unions other than <c>[null, T]</c>,
+/// defaults beyond <c>null</c>, and named-type registries are intentionally
+/// rejected. Aliases and unknown metadata are ignored — IcebergSharp.Avro is
+/// not a general-purpose Avro library.
+/// </remarks>
+internal static class AvroSchemaParser
+{
+    /// <summary>Parses an Avro schema from JSON text by encoding it as UTF-8 and delegating to the span overload.</summary>
+    /// <exception cref="ArgumentNullException"><paramref name="json"/> is <see langword="null"/>.</exception>
+    public static AvroSchema Parse(string json)
+    {
+        ArgumentNullException.ThrowIfNull(json);
+
+        byte[] utf8 = Encoding.UTF8.GetBytes(json);
+        return Parse(utf8);
+    }
+
+    /// <summary>
+    /// Parses a UTF-8 encoded Avro schema document. The document must hold exactly
+    /// one schema value; any token after it is rejected.
+    /// </summary>
+    /// <exception cref="AvroFormatException">The document is empty or has a trailing token.</exception>
+    public static AvroSchema Parse(ReadOnlySpan<byte> utf8Json)
+    {
+        var json = new Utf8JsonReader(utf8Json);
+        if (!json.Read())
+        {
+            throw new AvroFormatException("empty Avro schema document");
+        }
+
+        AvroSchema root = ReadSchema(ref json);
+        if (!json.Read())
+        {
+            return root;
+        }
+
+        throw new AvroFormatException($"unexpected trailing token {json.TokenType} after Avro schema");
+    }
+
+    /// <summary>
+    /// Dispatches on the reader's current token: a string is a primitive type
+    /// name, an object is a type definition, an array is a union.
+    /// </summary>
+    private static AvroSchema ReadSchema(ref Utf8JsonReader reader)
+    {
+        switch (reader.TokenType)
+        {
+            case JsonTokenType.String:
+                return ReadStringSchema(ref reader);
+            case JsonTokenType.StartObject:
+                return ReadObjectSchema(ref reader);
+            case JsonTokenType.StartArray:
+                return ReadUnionSchema(ref reader);
+            default:
+                throw new AvroFormatException($"unexpected token {reader.TokenType} for Avro schema");
+        }
+    }
+
+    /// <summary>Reads a schema written as a bare type-name string.</summary>
+    private static AvroPrimitive ReadStringSchema(ref Utf8JsonReader reader)
+    {
+        var typeName = reader.GetString();
+        if (typeName is null)
+        {
+            throw new AvroFormatException("null Avro type name");
+        }
+
+        return ParsePrimitiveName(typeName);
+    }
+
+    /// <summary>Maps an Avro primitive type name to a new <see cref="AvroPrimitive"/>.</summary>
+    /// <exception cref="AvroFormatException">The name is not one of the eight supported primitive names.</exception>
+    private static AvroPrimitive ParsePrimitiveName(string name)
+    {
+        AvroPrimitiveKind kind = name switch
+        {
+            "null" => AvroPrimitiveKind.Null,
+            "boolean" => AvroPrimitiveKind.Boolean,
+            "int" => AvroPrimitiveKind.Int,
+            "long" => AvroPrimitiveKind.Long,
+            "float" => AvroPrimitiveKind.Float,
+            "double" => AvroPrimitiveKind.Double,
+            "bytes" => AvroPrimitiveKind.Bytes,
+            "string" => AvroPrimitiveKind.String,
+            _ => throw new AvroFormatException($"unsupported Avro type name '{name}' (named-type references are not supported)"),
+        };
+
+        return new AvroPrimitive(kind);
+    }
+
+    /// <summary>
+    /// Reads a union written as a JSON array. Only two-branch unions with exactly
+    /// one <c>null</c> branch are accepted; the null branch may come first or second.
+    /// </summary>
+    /// <exception cref="AvroFormatException">The array is not terminated or has any other shape.</exception>
+    private static AvroUnion ReadUnionSchema(ref Utf8JsonReader reader)
+    {
+        var branches = new List<AvroSchema>(2);
+        var nullBranchCount = 0;
+        var closed = false;
+
+        while (reader.Read())
+        {
+            if (reader.TokenType == JsonTokenType.EndArray)
+            {
+                closed = true;
+                break;
+            }
+
+            AvroSchema branch = ReadSchema(ref reader);
+            if (IsNullBranch(branch))
+            {
+                nullBranchCount++;
+            }
+
+            branches.Add(branch);
+        }
+
+        if (!closed)
+        {
+            throw new AvroFormatException("unexpected end of stream while reading Avro union");
+        }
+
+        if (branches.Count != 2 || nullBranchCount != 1)
+        {
+            throw new AvroFormatException($"only [null, T] unions are supported (got {branches.Count} branches)");
+        }
+
+        // Exactly one of the two branches is null, so the other index is the payload.
+        var nullIndex = IsNullBranch(branches[0]) ? 0 : 1;
+        return new AvroUnion(branches[1 - nullIndex], nullIndex);
+
+        static bool IsNullBranch(AvroSchema candidate) =>
+            candidate is AvroPrimitive { Kind: AvroPrimitiveKind.Null };
+    }
+
+    /// <summary>
+    /// Reads a schema written as a JSON object. Collects the properties the model
+    /// understands, skips everything else (including <c>aliases</c>), and builds
+    /// the node from the <c>type</c> tag once the object is closed.
+    /// </summary>
+    /// <remarks>
+    /// When <c>type</c> is itself an object or array, the nested schema is returned
+    /// as-is and the remaining properties of the outer object are skipped.
+    /// </remarks>
+    /// <exception cref="AvroFormatException">
+    /// The object is truncated, has no <c>type</c>, or a known property has a value
+    /// of the wrong JSON type.
+    /// </exception>
+    private static AvroSchema ReadObjectSchema(ref Utf8JsonReader reader)
+    {
+        string? typeTag = null;
+        string? name = null;
+        int? size = null;
+        List<string>? symbols = null;
+        AvroSchema? items = null;
+        AvroSchema? values = null;
+        List<AvroRecordField>? fields = null;
+        string? logicalType = null;
+        int? precision = null;
+        int? scale = null;
+        int? elementId = null;
+        int? keyId = null;
+        int? valueId = null;
+        var sawEndObject = false;
+
+        while (reader.Read())
+        {
+            if (reader.TokenType == JsonTokenType.EndObject)
+            {
+                sawEndObject = true;
+                break;
+            }
+
+            if (reader.TokenType != JsonTokenType.PropertyName)
+            {
+                throw new AvroFormatException($"unexpected token {reader.TokenType} while reading Avro type object");
+            }
+
+            var prop = reader.GetString();
+            if (!reader.Read())
+            {
+                throw new AvroFormatException("unexpected end of stream while reading Avro type object property");
+            }
+
+            switch (prop)
+            {
+                case "type":
+                    if (reader.TokenType == JsonTokenType.String)
+                    {
+                        typeTag = reader.GetString();
+                    }
+                    else if (reader.TokenType is JsonTokenType.StartObject or JsonTokenType.StartArray)
+                    {
+                        // {"type": {"type": "..."}} or {"type": [null, ...]} — a wrapped schema. Unwrap and return.
+                        AvroSchema inner = ReadSchema(ref reader);
+                        // Skip remaining properties of the outer object.
+                        SkipRemainingProperties(ref reader);
+                        return inner;
+                    }
+                    else
+                    {
+                        throw new AvroFormatException($"unexpected token {reader.TokenType} for 'type' property");
+                    }
+
+                    break;
+
+                case "name": name = RequireStringValue(ref reader, "name"); break;
+                case "size": size = RequireInt32Value(ref reader, "size"); break;
+                case "symbols":
+                    symbols = ReadStringArray(ref reader);
+                    break;
+                case "items":
+                    items = ReadSchema(ref reader);
+                    break;
+                case "values":
+                    values = ReadSchema(ref reader);
+                    break;
+                case "fields":
+                    fields = ReadRecordFields(ref reader);
+                    break;
+                case "logicalType": logicalType = RequireStringValue(ref reader, "logicalType"); break;
+                case "precision": precision = RequireInt32Value(ref reader, "precision"); break;
+                case "scale": scale = RequireInt32Value(ref reader, "scale"); break;
+                case "element-id": elementId = RequireInt32Value(ref reader, "element-id"); break;
+                case "key-id": keyId = RequireInt32Value(ref reader, "key-id"); break;
+                case "value-id": valueId = RequireInt32Value(ref reader, "value-id"); break;
+                default:
+                    // Aliases and unknown metadata are tolerated by skipping their values.
+                    reader.Skip();
+                    break;
+            }
+        }
+
+        if (!sawEndObject)
+        {
+            throw new AvroFormatException("unexpected end of stream while reading Avro type object");
+        }
+
+        if (typeTag is null)
+        {
+            throw new AvroFormatException("Avro type object is missing 'type'");
+        }
+
+        return BuildFromTag(typeTag, name, size, symbols, items, values, fields, logicalType, precision, scale, elementId, keyId, valueId);
+    }
+
+    /// <summary>
+    /// Returns the current token as a string. A JSON <c>null</c> yields
+    /// <see langword="null"/>, the same as leaving the property out; any other
+    /// token type is reported as a schema error instead of a reader usage error.
+    /// </summary>
+    private static string? RequireStringValue(ref Utf8JsonReader reader, string property)
+    {
+        if (reader.TokenType is JsonTokenType.String or JsonTokenType.Null)
+        {
+            return reader.GetString();
+        }
+
+        throw new AvroFormatException($"expected string for '{property}', got {reader.TokenType}");
+    }
+
+    /// <summary>
+    /// Returns the current token as a 32-bit integer, reporting a non-number token
+    /// or a number that is not a 32-bit integer as a schema error.
+    /// </summary>
+    private static int RequireInt32Value(ref Utf8JsonReader reader, string property)
+    {
+        if (reader.TokenType != JsonTokenType.Number)
+        {
+            throw new AvroFormatException($"expected number for '{property}', got {reader.TokenType}");
+        }
+
+        if (!reader.TryGetInt32(out var value))
+        {
+            throw new AvroFormatException($"'{property}' is not a 32-bit integer");
+        }
+
+        return value;
+    }
+
+    /// <summary>
+    /// Advances the reader past the rest of the current object, discarding every
+    /// remaining property, and stops on the object's closing token.
+    /// </summary>
+    /// <exception cref="AvroFormatException">The document ends before the object is closed.</exception>
+    private static void SkipRemainingProperties(ref Utf8JsonReader reader)
+    {
+        while (reader.Read())
+        {
+            switch (reader.TokenType)
+            {
+                case JsonTokenType.EndObject:
+                    return;
+
+                case JsonTokenType.PropertyName:
+                    // Move onto the property's value, then skip it.
+                    if (!reader.Read())
+                    {
+                        throw new AvroFormatException("unexpected end of stream while skipping Avro type object property");
+                    }
+
+                    reader.Skip();
+                    break;
+            }
+        }
+
+        throw new AvroFormatException("unexpected end of stream while skipping Avro type object");
+    }
+
+    /// <summary>
+    /// Builds the schema node named by <paramref name="typeTag"/> from the
+    /// properties collected off a type object. Complex types require their
+    /// mandatory properties; any other tag is treated as a primitive type name.
+    /// Logical-type information is applied to fixed and primitive schemas only.
+    /// </summary>
+    /// <exception cref="AvroFormatException">
+    /// A required property is missing, a fixed size is not positive, or the tag is
+    /// not a supported type name.
+    /// </exception>
+    private static AvroSchema BuildFromTag(
+        string typeTag,
+        string? name,
+        int? size,
+        List<string>? symbols,
+        AvroSchema? items,
+        AvroSchema? values,
+        List<AvroRecordField>? fields,
+        string? logicalType,
+        int? precision,
+        int? scale,
+        int? elementId,
+        int? keyId,
+        int? valueId)
+    {
+        if (typeTag == "record")
+        {
+            return name is not null && fields is not null
+                ? new AvroRecord(name, fields)
+                : throw new AvroFormatException("record schema requires 'name' and 'fields'");
+        }
+
+        if (typeTag == "array")
+        {
+            return items is not null
+                ? new AvroArray(items) { ElementId = elementId }
+                : throw new AvroFormatException("array schema requires 'items'");
+        }
+
+        if (typeTag == "map")
+        {
+            return values is not null
+                ? new AvroMap(values) { KeyId = keyId, ValueId = valueId }
+                : throw new AvroFormatException("map schema requires 'values'");
+        }
+
+        if (typeTag == "fixed")
+        {
+            if (name is null || size is null)
+            {
+                throw new AvroFormatException("fixed schema requires 'name' and 'size'");
+            }
+
+            if (size <= 0)
+            {
+                throw new AvroFormatException($"fixed schema size must be positive, got {size}");
+            }
+
+            var fixedSchema = new AvroFixed(name, size.Value);
+            return ApplyLogicalType(fixedSchema, logicalType, precision, scale);
+        }
+
+        if (typeTag == "enum")
+        {
+            return name is not null && symbols is not null
+                ? new AvroEnum(name, symbols)
+                : throw new AvroFormatException("enum schema requires 'name' and 'symbols'");
+        }
+
+        // Primitive type encoded as object (e.g. {"type": "long", "logicalType": "timestamp-micros"}).
+        AvroSchema primitive = ParsePrimitiveName(typeTag);
+        return ApplyLogicalType(primitive, logicalType, precision, scale);
+    }
+
+    /// <summary>
+    /// Returns a copy of <paramref name="schema"/> annotated with the named logical
+    /// type. The schema is returned unchanged when no logical type is given, when
+    /// the name is not recognised, or when the logical type does not fit the
+    /// underlying schema.
+    /// </summary>
+    /// <exception cref="AvroFormatException">
+    /// A decimal has no positive precision, or its scale is negative or greater than the precision.
+    /// </exception>
+    private static AvroSchema ApplyLogicalType(AvroSchema schema, string? logicalType, int? precision, int? scale)
+    {
+        AvroLogicalType kind;
+        switch (logicalType)
+        {
+            case "decimal": kind = AvroLogicalType.Decimal; break;
+            case "date": kind = AvroLogicalType.Date; break;
+            case "time-millis": kind = AvroLogicalType.TimeMillis; break;
+            case "time-micros": kind = AvroLogicalType.TimeMicros; break;
+            case "timestamp-millis": kind = AvroLogicalType.TimestampMillis; break;
+            case "timestamp-micros": kind = AvroLogicalType.TimestampMicros; break;
+            case "uuid": kind = AvroLogicalType.Uuid; break;
+            default:
+                // Absent or unknown logical types degrade to the underlying schema.
+                return schema;
+        }
+
+        if (!IsLogicalTypeCompatible(schema, kind))
+        {
+            return schema;
+        }
+
+        if (kind == AvroLogicalType.Decimal)
+        {
+            // A missing precision fails this test too: a lifted comparison with null is false.
+            if (!(precision > 0))
+            {
+                throw new AvroFormatException("decimal logical type requires positive 'precision'");
+            }
+
+            // A missing scale passes both comparisons and is stored as 0 below.
+            if (scale < 0 || scale > precision)
+            {
+                throw new AvroFormatException($"decimal logical type scale {scale} must be between 0 and precision {precision}");
+            }
+        }
+
+        var storedPrecision = precision ?? 0;
+        var storedScale = scale ?? 0;
+
+        if (schema is AvroPrimitive primitive)
+        {
+            return new AvroPrimitive(primitive.Kind)
+            {
+                LogicalType = kind,
+                DecimalPrecision = storedPrecision,
+                DecimalScale = storedScale,
+            };
+        }
+
+        if (schema is AvroFixed fixedSchema)
+        {
+            return new AvroFixed(fixedSchema.Name, fixedSchema.Size)
+            {
+                LogicalType = kind,
+                DecimalPrecision = storedPrecision,
+                DecimalScale = storedScale,
+            };
+        }
+
+        return schema;
+    }
+
+    /// <summary>
+    /// Tells whether <paramref name="logicalType"/> may annotate
+    /// <paramref name="schema"/>: decimal on bytes or fixed; date and time-millis
+    /// on int; time-micros and both timestamps on long; uuid on string or a
+    /// 16-byte fixed. Anything else is incompatible.
+    /// </summary>
+    private static bool IsLogicalTypeCompatible(AvroSchema schema, AvroLogicalType logicalType)
+    {
+        switch (logicalType)
+        {
+            case AvroLogicalType.Decimal:
+                return schema is AvroPrimitive { Kind: AvroPrimitiveKind.Bytes } or AvroFixed;
+
+            case AvroLogicalType.Date:
+            case AvroLogicalType.TimeMillis:
+                return schema is AvroPrimitive { Kind: AvroPrimitiveKind.Int };
+
+            case AvroLogicalType.TimeMicros:
+            case AvroLogicalType.TimestampMillis:
+            case AvroLogicalType.TimestampMicros:
+                return schema is AvroPrimitive { Kind: AvroPrimitiveKind.Long };
+
+            case AvroLogicalType.Uuid:
+                return schema is AvroPrimitive { Kind: AvroPrimitiveKind.String } or AvroFixed { Size: 16 };
+
+            default:
+                return false;
+        }
+    }
+
+    // Reads a JSON array of strings; the reader must be positioned on its StartArray token.
+    private static List<string> ReadStringArray(ref Utf8JsonReader reader)
+    {
+        if (reader.TokenType != JsonTokenType.StartArray)
+        {
+            throw new AvroFormatException($"expected array, got {reader.TokenType}");
+        }
+
+        var items = new List<string>();
+        while (reader.Read())
+        {
+            switch (reader.TokenType)
+            {
+                case JsonTokenType.EndArray:
+                    return items;
+                case JsonTokenType.String:
+                    items.Add(reader.GetString()!);
+                    break;
+                default:
+                    throw new AvroFormatException($"expected string in array, got {reader.TokenType}");
+            }
+        }
+
+        throw new AvroFormatException("unexpected end of stream while reading string array");
+    }
+
+    // Reads the JSON array of a record's 'fields'; the reader must be positioned on its StartArray token.
+    private static List<AvroRecordField> ReadRecordFields(ref Utf8JsonReader reader)
+    {
+        if (reader.TokenType != JsonTokenType.StartArray)
+        {
+            throw new AvroFormatException($"expected array for 'fields', got {reader.TokenType}");
+        }
+
+        var fields = new List<AvroRecordField>();
+        while (reader.Read())
+        {
+            switch (reader.TokenType)
+            {
+                case JsonTokenType.EndArray:
+                    return fields;
+                case JsonTokenType.StartObject:
+                    fields.Add(ReadRecordField(ref reader));
+                    break;
+                default:
+                    throw new AvroFormatException($"expected field object, got {reader.TokenType}");
+            }
+        }
+
+        throw new AvroFormatException("unexpected end of stream while reading record fields");
+    }
+
+    // Reads one record-field object; the caller has already consumed its StartObject token.
+    // Returns when the matching EndObject is reached. 'name' and 'type' are required,
+    // 'field-id' is optional, and every other property is skipped without inspection.
+    private static AvroRecordField ReadRecordField(ref Utf8JsonReader reader)
+    {
+        string? name = null;
+        AvroSchema? schema = null;
+        int? fieldId = null;
+
+        while (reader.Read())
+        {
+            if (reader.TokenType == JsonTokenType.EndObject)
+            {
+                if (name is null || schema is null)
+                {
+                    throw new AvroFormatException("record field requires 'name' and 'type'");
+                }
+
+                return new AvroRecordField(name, schema, fieldId);
+            }
+
+            if (reader.TokenType != JsonTokenType.PropertyName)
+            {
+                throw new AvroFormatException($"unexpected token {reader.TokenType} while reading field");
+            }
+
+            var prop = reader.GetString();
+            if (!reader.Read())
+            {
+                throw new AvroFormatException("unexpected end of stream while reading record field property");
+            }
+
+            switch (prop)
+            {
+                case "name": name = reader.GetString(); break;
+                case "type": schema = ReadSchema(ref reader); break;
+                case "field-id": fieldId = reader.GetInt32(); break;
+                case "doc":
+                case "default":
+                case "order":
+                case "aliases":
+                case "adjust-to-utc":
+                    reader.Skip();
+                    break;
+                default:
+                    // Tolerate unknown keys on fields: writers attach extra metadata,
+                    // including other "*-id" properties. The value is discarded, so
+                    // skip it whatever its shape. Skip() leaves a scalar token as-is
+                    // and consumes a whole object or array. GetInt32() must not be
+                    // used to discard a number: it throws FormatException for
+                    // fractional or out-of-Int32-range values, which would reject a
+                    // schema over a property this parser deliberately ignores.
+                    reader.Skip();
+                    break;
+            }
+        }
+
+        throw new AvroFormatException("unexpected end of stream while reading record field");
+    }
+}
diff --git a/src/IcebergSharp.Avro/ManifestListReadOptions.cs b/src/IcebergSharp.Avro/ManifestListReadOptions.cs
new file mode 100644
index 0000000..929e37a
--- /dev/null
+++ b/src/IcebergSharp.Avro/ManifestListReadOptions.cs
@@ -0,0 +1,13 @@
+namespace IcebergSharp.Avro;
+
+public sealed class ManifestListReadOptions
+{
+    /// <summary>If true, the caller's stream is not disposed when the iterator completes. Defaults to false.</summary>
+    public bool LeaveOpen { get; init; }
+
+    /// <summary>Hard cap on the size of a single Avro data block, in bytes (default 64 MiB). Guards against malformed files.</summary>
+    public int MaxBlockSize { get; init; } = 64 * 1024 * 1024;
+
+    /// <summary>Hard cap on records declared by a single Avro data block (default 1,000,000). Guards against hostile block headers.</summary>
+    public int MaxBlockRecordCount { get; init; } = 1_000_000;
+}
diff --git a/src/IcebergSharp.Avro/ManifestListReader.cs b/src/IcebergSharp.Avro/ManifestListReader.cs
new file mode 100644
index 0000000..b1fbac0
--- /dev/null
+++ b/src/IcebergSharp.Avro/ManifestListReader.cs
@@ -0,0 +1,95 @@
+using System.Runtime.CompilerServices;
+using System.Text;
+using IcebergSharp.Avro.Internal.Decode;
+using IcebergSharp.Avro.Internal.Errors;
+using IcebergSharp.Avro.Internal.Ocf;
+using IcebergSharp.Avro.Internal.Schema;
+
+namespace IcebergSharp.Avro;
+
+/// <summary>
+/// Reads an Iceberg manifest-list file (an Avro OCF whose records describe
+/// <see cref="ManifestFile"/>s) into a streaming sequence.
+/// </summary>
+/// <remarks>
+/// The reader is async at the I/O layer but decodes each block synchronously;
+/// every yielded <see cref="ManifestFile"/> comes from an already-buffered
+/// decompressed block, so the inner loop has no suspension points.
+/// </remarks>
+public static class ManifestListReader
+{
+    public static IAsyncEnumerable<ManifestFile> ReadAsync(Stream stream, CancellationToken cancellationToken = default)
+        => ReadAsync(stream, options: null, cancellationToken);
+
+    // Deliberately not an iterator: a null stream is rejected at the call site
+    // instead of on the first MoveNextAsync of the returned sequence.
+    public static IAsyncEnumerable<ManifestFile> ReadAsync(Stream stream, ManifestListReadOptions? options, CancellationToken cancellationToken = default)
+    {
+        ArgumentNullException.ThrowIfNull(stream);
+        return ReadCoreAsync(stream, options ?? new ManifestListReadOptions(), cancellationToken);
+    }
+
+    private static async IAsyncEnumerable<ManifestFile> ReadCoreAsync(Stream stream, ManifestListReadOptions options, [EnumeratorCancellation] CancellationToken cancellationToken)
+    {
+        await using var reader = new OcfReader(stream, options.LeaveOpen, options.MaxBlockSize, options.MaxBlockRecordCount);
+        await reader.InitializeAsync(cancellationToken).ConfigureAwait(false);
+
+        AvroSchema parsedSchema = AvroSchemaParser.Parse(reader.Header.SchemaJson);
+        if (parsedSchema is not AvroRecord record)
+        {
+            throw new AvroFormatException($"manifest list root schema must be a record, got {parsedSchema.GetType().Name}");
+        }
+
+        var formatVersion = DetectFormatVersion(reader.Header.Metadata, record);
+
+        while (await reader.ReadNextBlockAsync(cancellationToken).ConfigureAwait(false))
+        {
+            // Materialise the block sync; BinaryDecoder is a ref struct and can't
+            // cross a yield boundary.
+            List<ManifestFile> entries = DecodeBlock(reader, record, formatVersion);
+            foreach (ManifestFile m in entries)
+            {
+                yield return m;
+            }
+        }
+    }
+
+    private static List<ManifestFile> DecodeBlock(OcfReader reader, AvroRecord record, int formatVersion)
+    {
+        var result = new List<ManifestFile>(reader.CurrentRecordCount);
+        BinaryDecoder decoder = reader.OpenBlockDecoder();
+        for (var i = 0; i < reader.CurrentRecordCount; i++)
+        {
+            result.Add(ManifestFileSink.Decode(ref decoder, record, formatVersion));
+        }
+
+        if (!decoder.EndOfBuffer)
+        {
+            throw new AvroFormatException($"block has {decoder.Length - decoder.Position} unread bytes after {reader.CurrentRecordCount} records");
+        }
+
+        return result;
+    }
+
+    private static int DetectFormatVersion(IReadOnlyDictionary<string, byte[]> metadata, AvroRecord record)
+    {
+        if (metadata.TryGetValue("format-version", out var bytes)
+            && int.TryParse(Encoding.UTF8.GetString(bytes), out var v)
+            && v is >= 1 and <= 2)
+        {
+            return v;
+        }
+
+        // v2 manifest-list records carry sequence_number (515) and content (517);
+        // v1 records do not. Use that as the structural signal when metadata is silent.
+        foreach (AvroRecordField f in record.Fields)
+        {
+            if (f.FieldId == Internal.Decode.IcebergFieldIds.SequenceNumber)
+            {
+                return 2;
+            }
+        }
+
+        return 1;
+    }
+}
diff --git a/src/IcebergSharp.Avro/ManifestReadOptions.cs b/src/IcebergSharp.Avro/ManifestReadOptions.cs
new file mode 100644
index 0000000..4f441b9
--- /dev/null
+++ b/src/IcebergSharp.Avro/ManifestReadOptions.cs
@@ -0,0 +1,13 @@
+namespace IcebergSharp.Avro;
+
+public sealed class ManifestReadOptions
+{
+    /// <summary>If true, the caller's stream is not disposed when the iterator completes. Defaults to false.</summary>
+    public bool LeaveOpen { get; init; }
+
+    /// <summary>Hard cap on the size of a single Avro data block, in bytes (default 64 MiB). Guards against malformed files.</summary>
+    public int MaxBlockSize { get; init; } = 64 * 1024 * 1024;
+
+    /// <summary>Hard cap on records declared by a single Avro data block (default 1,000,000). Guards against hostile block headers.</summary>
+    public int MaxBlockRecordCount { get; init; } = 1_000_000;
+}
diff --git a/src/IcebergSharp.Avro/ManifestReader.cs b/src/IcebergSharp.Avro/ManifestReader.cs
new file mode 100644
index 0000000..34347fd
--- /dev/null
+++ b/src/IcebergSharp.Avro/ManifestReader.cs
@@ -0,0 +1,65 @@
+using System.Runtime.CompilerServices;
+using IcebergSharp.Avro.Internal.Decode;
+using IcebergSharp.Avro.Internal.Errors;
+using IcebergSharp.Avro.Internal.Ocf;
+using IcebergSharp.Avro.Internal.Schema;
+
+namespace IcebergSharp.Avro;
+
+/// <summary>
+/// Reads an Iceberg manifest file (an Avro OCF whose records describe
+/// <see cref="ManifestEntry"/>s) into a streaming sequence. Delete-content
+/// entries are emitted unfiltered — the caller inspects <see cref="DataFile.Content"/>
+/// and skips with a warning per the v1 read-only scope.
+/// </summary>
+public static class ManifestReader
+{
+    public static IAsyncEnumerable<ManifestEntry> ReadAsync(Stream stream, CancellationToken cancellationToken = default)
+        => ReadAsync(stream, options: null, cancellationToken);
+
+    public static IAsyncEnumerable<ManifestEntry> ReadAsync(Stream stream, ManifestReadOptions? options, CancellationToken cancellationToken = default)
+    {
+        ArgumentNullException.ThrowIfNull(stream); // runs at the call site: this wrapper is deliberately not an iterator
+        return ReadCoreAsync(stream, options ?? new ManifestReadOptions(), cancellationToken);
+    }
+
+    private static async IAsyncEnumerable<ManifestEntry> ReadCoreAsync(Stream stream, ManifestReadOptions options, [EnumeratorCancellation] CancellationToken cancellationToken)
+    {
+        await using var reader = new OcfReader(stream, options.LeaveOpen, options.MaxBlockSize, options.MaxBlockRecordCount);
+        await reader.InitializeAsync(cancellationToken).ConfigureAwait(false);
+
+        AvroSchema parsedSchema = AvroSchemaParser.Parse(reader.Header.SchemaJson);
+        if (parsedSchema is not AvroRecord record)
+        {
+            throw new AvroFormatException($"manifest root schema must be a record, got {parsedSchema.GetType().Name}");
+        }
+
+        var sink = new ManifestEntrySink(record);
+
+        while (await reader.ReadNextBlockAsync(cancellationToken).ConfigureAwait(false))
+        {
+            List<ManifestEntry> entries = DecodeBlock(reader, sink); // decoded synchronously, before any yield
+            foreach (ManifestEntry m in entries)
+            {
+                yield return m;
+            }
+        }
+    }
+
+    private static List<ManifestEntry> DecodeBlock(OcfReader reader, ManifestEntrySink sink)
+    {
+        var result = new List<ManifestEntry>(reader.CurrentRecordCount);
+        BinaryDecoder decoder = reader.OpenBlockDecoder();
+        for (var i = 0; i < reader.CurrentRecordCount; i++)
+        {
+            result.Add(sink.Decode(ref decoder));
+        }
+
+        if (!decoder.EndOfBuffer)
+        {
+            throw new AvroFormatException($"block has {decoder.Length - decoder.Position} unread bytes after {reader.CurrentRecordCount} records");
+        }
+
+        return result;
+    }
+}
diff --git a/src/IcebergSharp.Avro/Properties/AssemblyInfo.cs b/src/IcebergSharp.Avro/Properties/AssemblyInfo.cs
new file mode 100644
index 0000000..d350171
--- /dev/null
+++ b/src/IcebergSharp.Avro/Properties/AssemblyInfo.cs
@@ -0,0 +1,3 @@
+using System.Runtime.CompilerServices;
+
+[assembly: InternalsVisibleTo("IcebergSharp.Tests")]
diff --git a/src/IcebergSharp.Core/ManifestEntry.cs b/src/IcebergSharp.Core/ManifestEntry.cs
new file mode 100644
index 0000000..8b4d923
--- /dev/null
+++ b/src/IcebergSharp.Core/ManifestEntry.cs
@@ -0,0 +1,180 @@
+using System.Collections.ObjectModel;
+
+namespace IcebergSharp;
+
+/// <summary>
+/// Status of a <see cref="ManifestEntry"/> relative to the snapshot that wrote
+/// the manifest. Matches Iceberg spec field 0 (<c>status</c>).
+/// </summary>
+public enum ManifestEntryStatus
+{
+    Existing = 0, // also default(ManifestEntryStatus)
+    Added = 1,
+    Deleted = 2,
+}
+
+/// <summary>
+/// Distinguishes regular data files from delete files. v1 data files are
+/// always <see cref="Data"/>; v2 entries carry the flag explicitly per spec
+/// field 134 (<c>content</c>). Phase 1 (read-only, COW-only) treats delete
+/// content as a signal to skip — see README.
+/// </summary>
+public enum DataFileContent
+{
+    Data = 0, // also default(DataFileContent)
+    PositionDeletes = 1,
+    EqualityDeletes = 2,
+}
+
+/// <summary>
+/// Data file storage format. The raw spec string is kept on
+/// <see cref="DataFile.FileFormatRaw"/> so unknown formats (e.g. future
+/// additions to the Iceberg spec) survive a round-trip without forcing this
+/// enum to grow.
+/// </summary>
+public enum DataFileFormat
+{
+    Unknown = 0, // default value; what DataFile reports for an unrecognised format string
+    Parquet, // implicit value 1
+    Orc, // implicit value 2
+    Avro, // implicit value 3
+}
+
+/// <summary>
+/// One data file recorded in a manifest. Carries the file's location, format,
+/// partition tuple, row count, byte size, and per-column statistics that the
+/// planner uses for stats pruning.
+/// </summary>
+public sealed class DataFile
+{
+    public DataFileContent Content { get; }
+    public string FilePath { get; }
+    public DataFileFormat FileFormat { get; } // parsed from FileFormatRaw; Unknown when the string is not recognised
+    public string FileFormatRaw { get; } // format string exactly as passed to the constructor
+    public PartitionValues Partition { get; }
+    public long RecordCount { get; }
+    public long FileSizeInBytes { get; }
+    public IReadOnlyDictionary<int, long> ColumnSizes { get; } // the maps below are never null; an absent map is exposed as empty
+    public IReadOnlyDictionary<int, long> ValueCounts { get; }
+    public IReadOnlyDictionary<int, long> NullValueCounts { get; }
+    public IReadOnlyDictionary<int, long> NanValueCounts { get; }
+    public IReadOnlyDictionary<int, ReadOnlyMemory<byte>> LowerBounds { get; } // bound bytes are stored as supplied, not decoded here
+    public IReadOnlyDictionary<int, ReadOnlyMemory<byte>> UpperBounds { get; }
+    public ReadOnlyMemory<byte> KeyMetadata { get; }
+    public IReadOnlyList<long> SplitOffsets { get; }
+    public IReadOnlyList<int> EqualityIds { get; }
+    public int? SortOrderId { get; }
+
+    public DataFile(
+        DataFileContent content,
+        string filePath,
+        string fileFormatRaw,
+        PartitionValues partition,
+        long recordCount,
+        long fileSizeInBytes,
+        IReadOnlyDictionary<int, long>? columnSizes,
+        IReadOnlyDictionary<int, long>? valueCounts,
+        IReadOnlyDictionary<int, long>? nullValueCounts,
+        IReadOnlyDictionary<int, long>? nanValueCounts,
+        IReadOnlyDictionary<int, ReadOnlyMemory<byte>>? lowerBounds,
+        IReadOnlyDictionary<int, ReadOnlyMemory<byte>>? upperBounds,
+        ReadOnlySpan<byte> keyMetadata,
+        IReadOnlyList<long>? splitOffsets,
+        IReadOnlyList<int>? equalityIds,
+        int? sortOrderId)
+    {
+        ArgumentException.ThrowIfNullOrEmpty(filePath);
+        ArgumentException.ThrowIfNullOrEmpty(fileFormatRaw);
+        ArgumentNullException.ThrowIfNull(partition);
+
+        Content = content;
+        FilePath = filePath;
+        FileFormatRaw = fileFormatRaw;
+        FileFormat = ParseFormat(fileFormatRaw);
+        Partition = partition;
+        RecordCount = recordCount; // stored as given; no range check is applied to the counts or sizes
+        FileSizeInBytes = fileSizeInBytes;
+        ColumnSizes = CopyDict(columnSizes); // each map is copied so later changes to the caller's dictionary are not observed
+        ValueCounts = CopyDict(valueCounts);
+        NullValueCounts = CopyDict(nullValueCounts);
+        NanValueCounts = CopyDict(nanValueCounts);
+        LowerBounds = CopyDict(lowerBounds); // copies the map only; the ReadOnlyMemory values still reference the caller's buffers
+        UpperBounds = CopyDict(upperBounds);
+        KeyMetadata = keyMetadata.IsEmpty ? ReadOnlyMemory<byte>.Empty : keyMetadata.ToArray(); // ToArray copies the span's bytes
+        SplitOffsets = splitOffsets is null ? [] : new ReadOnlyCollection<long>([.. splitOffsets]); // snapshot wrapped read-only
+        EqualityIds = equalityIds is null ? [] : new ReadOnlyCollection<int>([.. equalityIds]);
+        SortOrderId = sortOrderId;
+    }
+
+    private static DataFileFormat ParseFormat(string raw)
+    {
+        // Iceberg writes the format as an upper-case enum symbol ("PARQUET"),
+        // but we accept any casing to be forgiving of catalog-side rewrites.
+        if (raw.Equals("PARQUET", StringComparison.OrdinalIgnoreCase))
+        {
+            return DataFileFormat.Parquet;
+        }
+
+        if (raw.Equals("ORC", StringComparison.OrdinalIgnoreCase))
+        {
+            return DataFileFormat.Orc;
+        }
+
+        if (raw.Equals("AVRO", StringComparison.OrdinalIgnoreCase))
+        {
+            return DataFileFormat.Avro;
+        }
+
+        return DataFileFormat.Unknown; // anything else is kept only as FileFormatRaw
+    }
+
+    private static IReadOnlyDictionary<int, TValue> CopyDict<TValue>(IReadOnlyDictionary<int, TValue>? source)
+    {
+        if (source is null || source.Count == 0)
+        {
+            return EmptyReadOnlyDict<TValue>.Instance; // shared instance, so null and empty inputs allocate nothing
+        }
+
+        var copy = new Dictionary<int, TValue>(source.Count);
+        foreach (KeyValuePair<int, TValue> kv in source)
+        {
+            copy[kv.Key] = kv.Value; // shallow: values are assigned, not cloned
+        }
+
+        return new ReadOnlyDictionary<int, TValue>(copy);
+    }
+
+    private static class EmptyReadOnlyDict<TValue>
+    {
+        public static readonly IReadOnlyDictionary<int, TValue> Instance = new ReadOnlyDictionary<int, TValue>(new Dictionary<int, TValue>(0)); // one cached empty map per TValue
+    }
+}
+
+/// <summary>
+/// One row of an Iceberg manifest: a <see cref="DataFile"/> plus the
+/// status/sequence/snapshot tagging that lets the planner decide whether the
+/// file is part of the snapshot being scanned.
+/// </summary>
+public sealed class ManifestEntry
+{
+    public ManifestEntryStatus Status { get; }
+    public long? SnapshotId { get; } // nullable: stored exactly as passed to the constructor
+    public long? SequenceNumber { get; }
+    public long? FileSequenceNumber { get; }
+    public DataFile DataFile { get; } // never null; enforced by the constructor
+
+    public ManifestEntry(
+        ManifestEntryStatus status,
+        long? snapshotId,
+        long? sequenceNumber,
+        long? fileSequenceNumber,
+        DataFile dataFile)
+    {
+        ArgumentNullException.ThrowIfNull(dataFile); // the only validated argument; the others are stored as given
+        Status = status;
+        SnapshotId = snapshotId;
+        SequenceNumber = sequenceNumber;
+        FileSequenceNumber = fileSequenceNumber;
+        DataFile = dataFile;
+    }
+}
diff --git a/src/IcebergSharp.Core/ManifestFile.cs b/src/IcebergSharp.Core/ManifestFile.cs
new file mode 100644
index 0000000..885500a
--- /dev/null
+++ b/src/IcebergSharp.Core/ManifestFile.cs
@@ -0,0 +1,124 @@
+using System.Collections.ObjectModel;
+
+namespace IcebergSharp;
+
+/// <summary>
+/// Distinguishes a manifest that lists data files (the default) from one that
+/// lists delete files. v1 manifests are always <see cref="Data"/>; v2 manifests
+/// carry the flag explicitly per spec field 517 (<c>content</c>).
+/// </summary>
+public enum ManifestContent
+{
+    Data = 0, // also default(ManifestContent)
+    Deletes = 1,
+}
+
+/// <summary>
+/// Per-partition-column summary embedded in a manifest-list entry. The reader
+/// passes <see cref="LowerBound"/> / <see cref="UpperBound"/> through as raw
+/// bytes — the encoding is the Iceberg single-value byte format keyed by the
+/// partition column's type, which Phase 4 decodes against the table schema.
+/// </summary>
+public sealed class FieldSummary : IEquatable<FieldSummary>
+{
+    public bool ContainsNull { get; }
+    public bool? ContainsNaN { get; }
+    public ReadOnlyMemory<byte> LowerBound { get; } // empty when the constructor was given an empty span
+    public ReadOnlyMemory<byte> UpperBound { get; }
+
+    public FieldSummary(bool containsNull, bool? containsNaN, ReadOnlySpan<byte> lowerBound, ReadOnlySpan<byte> upperBound)
+    {
+        ContainsNull = containsNull;
+        ContainsNaN = containsNaN;
+        LowerBound = lowerBound.IsEmpty ? ReadOnlyMemory<byte>.Empty : lowerBound.ToArray(); // ToArray copies the span's bytes
+        UpperBound = upperBound.IsEmpty ? ReadOnlyMemory<byte>.Empty : upperBound.ToArray();
+    }
+
+    public bool Equals(FieldSummary? other) // value equality: bound bytes are compared by content, not by reference
+        => other is not null
+        && ContainsNull == other.ContainsNull
+        && ContainsNaN == other.ContainsNaN
+        && LowerBound.Span.SequenceEqual(other.LowerBound.Span)
+        && UpperBound.Span.SequenceEqual(other.UpperBound.Span);
+
+    public override bool Equals(object? obj) => Equals(obj as FieldSummary);
+
+    public override int GetHashCode() // hashes the same four members that Equals compares
+    {
+        var hc = new HashCode();
+        hc.Add(ContainsNull);
+        hc.Add(ContainsNaN);
+        hc.AddBytes(LowerBound.Span);
+        hc.AddBytes(UpperBound.Span);
+        return hc.ToHashCode();
+    }
+}
+
+/// <summary>
+/// One entry of a snapshot's manifest-list file. Points at an Iceberg manifest
+/// (an Avro file listing data or delete files) and carries the per-partition
+/// bounds the planner needs to prune at the manifest level before opening it.
+/// </summary>
+public sealed class ManifestFile
+{
+    public string ManifestPath { get; } // manifest_path, field-id 500 (ids here follow the manifest_file schema; confirm against ManifestFileSink)
+    public long ManifestLength { get; } // manifest_length, field-id 501
+    public int PartitionSpecId { get; } // partition_spec_id, field-id 502
+    public ManifestContent Content { get; } // content, field-id 517
+    public long SequenceNumber { get; } // sequence_number, field-id 515
+    public long MinSequenceNumber { get; } // min_sequence_number, field-id 516
+    public long AddedSnapshotId { get; } // added_snapshot_id, field-id 503
+    public int AddedFilesCount { get; } // field-id 504
+    public int ExistingFilesCount { get; } // field-id 505
+    public int DeletedFilesCount { get; } // field-id 506
+    public long AddedRowsCount { get; } // added_rows_count, field-id 512
+    public long ExistingRowsCount { get; } // existing_rows_count, field-id 513
+    public long DeletedRowsCount { get; } // deleted_rows_count, field-id 514
+    public IReadOnlyList<FieldSummary> Partitions { get; } // never null; empty when none were supplied
+    public ReadOnlyMemory<byte> KeyMetadata { get; }
+    public int FormatVersion { get; } // 1 or 2; enforced by the constructor
+
+    public ManifestFile(
+        string manifestPath,
+        long manifestLength,
+        int partitionSpecId,
+        ManifestContent content,
+        long sequenceNumber,
+        long minSequenceNumber,
+        long addedSnapshotId,
+        int addedFilesCount,
+        int existingFilesCount,
+        int deletedFilesCount,
+        long addedRowsCount,
+        long existingRowsCount,
+        long deletedRowsCount,
+        IReadOnlyList<FieldSummary>? partitions,
+        ReadOnlySpan<byte> keyMetadata,
+        int formatVersion)
+    {
+        ArgumentException.ThrowIfNullOrEmpty(manifestPath);
+        if (formatVersion is < 1 or > 2)
+        {
+            throw new ArgumentOutOfRangeException(nameof(formatVersion), formatVersion, "supported manifest format versions are 1 and 2");
+        }
+
+        ManifestPath = manifestPath;
+        ManifestLength = manifestLength; // lengths, ids and counts are stored as given; no range check is applied
+        PartitionSpecId = partitionSpecId;
+        Content = content;
+        SequenceNumber = sequenceNumber;
+        MinSequenceNumber = minSequenceNumber;
+        AddedSnapshotId = addedSnapshotId;
+        AddedFilesCount = addedFilesCount;
+        ExistingFilesCount = existingFilesCount;
+        DeletedFilesCount = deletedFilesCount;
+        AddedRowsCount = addedRowsCount;
+        ExistingRowsCount = existingRowsCount;
+        DeletedRowsCount = deletedRowsCount;
+        Partitions = partitions is null
+            ? []
+            : new ReadOnlyCollection<FieldSummary>([.. partitions]); // snapshot of the caller's list, wrapped read-only
+        KeyMetadata = keyMetadata.IsEmpty ? ReadOnlyMemory<byte>.Empty : keyMetadata.ToArray(); // ToArray copies the span's bytes
+        FormatVersion = formatVersion;
+    }
+}
diff --git a/src/IcebergSharp.Core/PartitionValues.cs b/src/IcebergSharp.Core/PartitionValues.cs
new file mode 100644
index 0000000..da787ba
--- /dev/null
+++ b/src/IcebergSharp.Core/PartitionValues.cs
@@ -0,0 +1,72 @@
+using System.Collections.ObjectModel;
+using IcebergSharp.Types;
+
+namespace IcebergSharp;
+
+/// <summary>
+/// Decoded partition tuple for a single data file. The shape of the tuple is
+/// determined at write time by the manifest's partition-spec metadata — this
+/// type carries the resolved names and types alongside the boxed values so the
+/// planner can reason about them without re-reading the spec.
+/// </summary>
+/// <remarks>
+/// Values are <c>object?</c> because the partition spec is dynamic per
+/// manifest; Phase 4 compares them against boxed literals from the expression
+/// DSL. <c>null</c> is a legal partition value (the partition column is
+/// nullable for that file).
+/// </remarks>
+public sealed class PartitionValues
+{
+    private readonly object?[] _values; // private copy of the constructor's values, in column order
+    private readonly Dictionary<string, int> _indexByName; // column name -> position in _values
+
+    public IReadOnlyList<string> Names { get; }
+    public IReadOnlyList<IcebergType> Types { get; }
+
+    public PartitionValues(IReadOnlyList<string> names, IReadOnlyList<IcebergType> types, IReadOnlyList<object?> values)
+    {
+        ArgumentNullException.ThrowIfNull(names);
+        ArgumentNullException.ThrowIfNull(types);
+        ArgumentNullException.ThrowIfNull(values);
+
+        if (names.Count != types.Count || names.Count != values.Count)
+        {
+            throw new ArgumentException($"names ({names.Count}), types ({types.Count}), and values ({values.Count}) must have the same length");
+        }
+
+        Names = new ReadOnlyCollection<string>([.. names]); // all three lists are copied, so later caller-side changes are not observed
+        Types = new ReadOnlyCollection<IcebergType>([.. types]);
+        _values = [.. values];
+        _indexByName = new Dictionary<string, int>(names.Count, StringComparer.Ordinal); // ordinal: lookups are case-sensitive
+        for (var i = 0; i < names.Count; i++)
+        {
+            if (!_indexByName.TryAdd(names[i], i)) // TryAdd returns false when the name was already indexed
+            {
+                throw new ArgumentException($"duplicate partition column name '{names[i]}'", nameof(names));
+            }
+        }
+    }
+
+    public static PartitionValues Empty { get; } = new([], [], []); // single shared zero-column tuple
+
+    public int Count => _values.Length;
+
+    public object? this[int index] => _values[index]; // plain array access: an out-of-range index throws IndexOutOfRangeException
+
+    public object? this[string name] // throws for an unknown column; a null result means the column's value is null
+        => _indexByName.TryGetValue(name, out var i)
+            ? _values[i]
+            : throw new KeyNotFoundException($"partition column '{name}' not present");
+
+    public bool TryGetValue(string name, out object? value)
+    {
+        if (_indexByName.TryGetValue(name, out var i))
+        {
+            value = _values[i]; // may be null even though the lookup succeeded
+            return true;
+        }
+
+        value = null;
+        return false;
+    }
+}
diff --git a/src/IcebergSharp.Core/Properties/AssemblyInfo.cs b/src/IcebergSharp.Core/Properties/AssemblyInfo.cs
new file mode 100644
index 0000000..d2d3489
--- /dev/null
+++ b/src/IcebergSharp.Core/Properties/AssemblyInfo.cs
@@ -0,0 +1,4 @@
+using System.Runtime.CompilerServices;
+
+[assembly: InternalsVisibleTo("IcebergSharp.Avro")]
+[assembly: InternalsVisibleTo("IcebergSharp.Tests")]
diff --git a/tests/IcebergSharp.Tests/Avro/AvroSchemaParserTests.cs b/tests/IcebergSharp.Tests/Avro/AvroSchemaParserTests.cs
new file mode 100644
index 0000000..dc74faf
--- /dev/null
+++ b/tests/IcebergSharp.Tests/Avro/AvroSchemaParserTests.cs
@@ -0,0 +1,189 @@
+using IcebergSharp.Avro.Internal.Schema;
+using Shouldly;
+using Xunit;
+
+namespace IcebergSharp.Tests.Avro;
+
+public sealed class AvroSchemaParserTests
+{
+    [Theory]
+    [InlineData("\"int\"", (int)AvroPrimitiveKind.Int)]
+    [InlineData("\"long\"", (int)AvroPrimitiveKind.Long)]
+    [InlineData("\"string\"", (int)AvroPrimitiveKind.String)]
+    [InlineData("\"boolean\"", (int)AvroPrimitiveKind.Boolean)]
+    [InlineData("\"bytes\"", (int)AvroPrimitiveKind.Bytes)]
+    [InlineData("\"float\"", (int)AvroPrimitiveKind.Float)]
+    [InlineData("\"double\"", (int)AvroPrimitiveKind.Double)]
+    public void ParsePrimitiveString(string json, int expectedKind) // NOTE(review): presumably int because AvroPrimitiveKind is internal and cannot appear in a public signature
+    {
+        var schema = (AvroPrimitive)AvroSchemaParser.Parse(json);
+        ((int)schema.Kind).ShouldBe(expectedKind);
+    }
+
+    [Fact]
+    public void ParseNullTUnionCarriesNonNullBranch()
+    {
+        var schema = (AvroUnion)AvroSchemaParser.Parse("""[ "null", "long" ]""");
+        schema.NullBranchIndex.ShouldBe(0);
+        schema.NonNullBranchIndex.ShouldBe(1);
+        ((AvroPrimitive)schema.NonNull).Kind.ShouldBe(AvroPrimitiveKind.Long);
+    }
+
+    [Fact]
+    public void ParseTNullUnionRecordsBranchIndex()
+    {
+        var schema = (AvroUnion)AvroSchemaParser.Parse("""[ "long", "null" ]"""); // same union with the branch order reversed
+        schema.NullBranchIndex.ShouldBe(1);
+        schema.NonNullBranchIndex.ShouldBe(0);
+    }
+
+    [Fact]
+    public void ParseRejectsThreeBranchUnion()
+    {
+        Should.Throw<Exception>(() => AvroSchemaParser.Parse("""[ "null", "long", "string" ]""")); // more than two branches
+    }
+
+    [Fact]
+    public void ParseRejectsUnionWithoutNull()
+    {
+        Should.Throw<Exception>(() => AvroSchemaParser.Parse("""[ "long", "string" ]""")); // neither branch is "null"
+    }
+
+    [Fact]
+    public void ParseRejectsTruncatedUnion()
+    {
+        Should.Throw<Exception>(() => AvroSchemaParser.Parse("""[ "null", "long" """)); // closing ']' is missing
+    }
+
+    [Fact]
+    public void ParseRejectsTruncatedObject()
+    {
+        Should.Throw<Exception>(() => AvroSchemaParser.Parse("""{ "type": "long" """)); // closing '}' is missing
+    }
+
+    [Fact]
+    public void ParseRecordWithFieldIds()
+    {
+        const string Json = """
+        {
+          "type": "record",
+          "name": "manifest_file",
+          "fields": [
+            { "name": "manifest_path", "type": "string", "field-id": 500 },
+            { "name": "manifest_length", "type": "long", "field-id": 501 }
+          ]
+        }
+        """;
+
+        var schema = (AvroRecord)AvroSchemaParser.Parse(Json);
+        schema.Name.ShouldBe("manifest_file");
+        schema.Fields.Count.ShouldBe(2);
+        schema.Fields[0].Name.ShouldBe("manifest_path");
+        schema.Fields[0].FieldId.ShouldBe(500);
+        schema.Fields[1].FieldId.ShouldBe(501);
+    }
+
+    [Fact]
+    public void ParseArrayCarriesElementId()
+    {
+        const string Json = """
+        { "type": "array", "items": "long", "element-id": 132 }
+        """;
+
+        var schema = (AvroArray)AvroSchemaParser.Parse(Json);
+        schema.ElementId.ShouldBe(132);
+        ((AvroPrimitive)schema.Items).Kind.ShouldBe(AvroPrimitiveKind.Long);
+    }
+
+    [Fact]
+    public void ParseFixedWithDecimalLogicalType()
+    {
+        const string Json = """
+        { "type": "fixed", "name": "decimal_5_2", "size": 8, "logicalType": "decimal", "precision": 5, "scale": 2 }
+        """;
+
+        var schema = (AvroFixed)AvroSchemaParser.Parse(Json);
+        schema.Size.ShouldBe(8);
+        schema.LogicalType.ShouldBe(AvroLogicalType.Decimal);
+        schema.DecimalPrecision.ShouldBe(5);
+        schema.DecimalScale.ShouldBe(2);
+    }
+
+    [Fact]
+    public void ParseRejectsDecimalLogicalTypeWithoutPrecision()
+    {
+        const string Json = """
+        { "type": "bytes", "logicalType": "decimal", "scale": 2 }
+        """;
+
+        Should.Throw<Exception>(() => AvroSchemaParser.Parse(Json)); // "precision" is absent
+    }
+
+    [Fact]
+    public void ParseRejectsNonPositiveFixedSize()
+    {
+        const string Json = """
+        { "type": "fixed", "name": "empty", "size": 0 }
+        """;
+
+        Should.Throw<Exception>(() => AvroSchemaParser.Parse(Json)); // "size" is 0
+    }
+
+    [Fact]
+    public void ParseTimestampMicrosLogicalType()
+    {
+        const string Json = """
+        { "type": "long", "logicalType": "timestamp-micros" }
+        """;
+
+        var schema = (AvroPrimitive)AvroSchemaParser.Parse(Json);
+        schema.Kind.ShouldBe(AvroPrimitiveKind.Long);
+        schema.LogicalType.ShouldBe(AvroLogicalType.TimestampMicros);
+    }
+
+    [Fact]
+    public void ParseIgnoresLogicalTypeOnWrongPhysicalType()
+    {
+        const string Json = """
+        { "type": "long", "logicalType": "uuid" }
+        """;
+
+        var schema = (AvroPrimitive)AvroSchemaParser.Parse(Json);
+        schema.Kind.ShouldBe(AvroPrimitiveKind.Long);
+        schema.LogicalType.ShouldBe(AvroLogicalType.None); // the uuid annotation on a long is dropped, not rejected
+    }
+
+    [Fact]
+    public void ParseRealManifestListV2Schema()
+    {
+        // A trimmed-down but spec-shape-faithful v2 manifest_list schema.
+        const string Json = """
+        {
+          "type": "record",
+          "name": "manifest_file",
+          "fields": [
+            { "name": "manifest_path", "type": "string", "field-id": 500 },
+            { "name": "manifest_length", "type": "long", "field-id": 501 },
+            { "name": "partition_spec_id", "type": "int", "field-id": 502 },
+            { "name": "content", "type": "int", "field-id": 517 },
+            { "name": "sequence_number", "type": "long", "field-id": 515 },
+            { "name": "min_sequence_number", "type": "long", "field-id": 516 },
+            { "name": "added_snapshot_id", "type": "long", "field-id": 503 },
+            { "name": "added_data_files_count", "type": "int", "field-id": 504 },
+            { "name": "existing_data_files_count", "type": "int", "field-id": 505 },
+            { "name": "deleted_data_files_count", "type": "int", "field-id": 506 },
+            { "name": "added_rows_count", "type": "long", "field-id": 512 },
+            { "name": "existing_rows_count", "type": "long", "field-id": 513 },
+            { "name": "deleted_rows_count", "type": "long", "field-id": 514 }
+          ]
+        }
+        """;
+
+        var schema = (AvroRecord)AvroSchemaParser.Parse(Json);
+        schema.Fields.Count.ShouldBe(13);
+        // Spot-check a few field ids, including two that are out of numeric order in the schema.
+        schema.Fields[0].FieldId.ShouldBe(500);
+        schema.Fields[3].FieldId.ShouldBe(517); // content
+        schema.Fields[4].FieldId.ShouldBe(515); // sequence_number
+    }
+}
diff --git a/tests/IcebergSharp.Tests/Avro/BinaryDecoderTests.cs b/tests/IcebergSharp.Tests/Avro/BinaryDecoderTests.cs
new file mode 100644
index 0000000..ee4e1dc
--- /dev/null
+++ b/tests/IcebergSharp.Tests/Avro/BinaryDecoderTests.cs
@@ -0,0 +1,238 @@
+using IcebergSharp.Avro.Internal.Decode;
+using IcebergSharp.Avro.Internal.Errors;
+using IcebergSharp.Avro.Internal.Schema;
+using Shouldly;
+using Xunit;
+
+namespace IcebergSharp.Tests.Avro;
+
+/// <summary>
+/// Byte-level tests for <see cref="BinaryDecoder"/>: zig-zag varints, little-endian
+/// floats, length-prefixed strings/bytes, block counts, and the
+/// <see cref="AvroFormatException"/> expected for malformed or truncated input.
+/// </summary>
+public sealed class BinaryDecoderTests
+{
+    // Expected bytes are the zig-zag value (n << 1) ^ (n >> 63) written as a varint, low 7 bits first.
+    [Theory]
+    [InlineData(0L, new byte[] { 0x00 })]
+    [InlineData(-1L, new byte[] { 0x01 })]
+    [InlineData(1L, new byte[] { 0x02 })]
+    [InlineData(-2L, new byte[] { 0x03 })]
+    [InlineData(2L, new byte[] { 0x04 })]
+    [InlineData(63L, new byte[] { 0x7E })]
+    [InlineData(-64L, new byte[] { 0x7F })]
+    [InlineData(64L, new byte[] { 0x80, 0x01 })]
+    [InlineData(8192L, new byte[] { 0x80, 0x80, 0x01 })]
+    public void ReadLongZigzagVarint(long expected, byte[] bytes)
+    {
+        var decoder = new BinaryDecoder(bytes);
+        decoder.ReadLong().ShouldBe(expected);
+    }
+
+    [Fact]
+    public void ReadLongMinValueRoundtrips()
+    {
+        // long.MinValue zig-zags to ulong.MaxValue: nine 0xFF continuation bytes, then a final 0x01.
+        byte[] encoded = [0xFF, 0xFF, 0xFF, 0xFF, 0xFF, 0xFF, 0xFF, 0xFF, 0xFF, 0x01];
+        var decoder = new BinaryDecoder(encoded);
+        decoder.ReadLong().ShouldBe(long.MinValue);
+    }
+
+    [Fact]
+    public void ReadLongMaxValueRoundtrips()
+    {
+        // long.MaxValue zig-zags to ulong.MaxValue - 1, so only the first byte differs (0xFE).
+        byte[] encoded = [0xFE, 0xFF, 0xFF, 0xFF, 0xFF, 0xFF, 0xFF, 0xFF, 0xFF, 0x01];
+        var decoder = new BinaryDecoder(encoded);
+        decoder.ReadLong().ShouldBe(long.MaxValue);
+    }
+
+    [Fact]
+    public void ReadIntRejectsOutOfRangeValue()
+    {
+        var bytes = EncodeLong((long)int.MaxValue + 1);
+        ShouldThrowFromDecoder(bytes, static (ref d) => d.ReadInt());
+    }
+
+    [Fact]
+    public void NullableReaderReadIntOrNullWrapsLongOverflowAsAvroFormatException()
+    {
+        var bytes = EncodeLong((long)int.MaxValue + 1);
+        ShouldThrowFromDecoder(bytes, static (ref d) =>
+            NullableReader.ReadIntOrNull(ref d, new AvroPrimitive(AvroPrimitiveKind.Long)));
+    }
+
+    [Fact]
+    public void ReadBooleanAcceptsZeroAndOne()
+    {
+        byte[] bytes = [0x00, 0x01];
+        var decoder = new BinaryDecoder(bytes);
+        decoder.ReadBoolean().ShouldBeFalse();
+        decoder.ReadBoolean().ShouldBeTrue();
+    }
+
+    [Fact]
+    public void ReadBooleanRejectsOtherValues()
+    {
+        byte[] bytes = [0x02];
+        ShouldThrowFromDecoder(bytes, static (ref d) => d.ReadBoolean());
+    }
+
+    [Fact]
+    public void ReadFloatLittleEndian()
+    {
+        // 1.5f is 0x3FC00000 in IEEE 754; the bytes are listed least-significant first.
+        byte[] bytes = [0x00, 0x00, 0xC0, 0x3F];
+        var decoder = new BinaryDecoder(bytes);
+        decoder.ReadFloat().ShouldBe(1.5f);
+    }
+
+    [Fact]
+    public void ReadDoubleLittleEndian()
+    {
+        // 1.5 is 0x3FF8000000000000 in IEEE 754; the bytes are listed least-significant first.
+        byte[] bytes = [0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0xF8, 0x3F];
+        var decoder = new BinaryDecoder(bytes);
+        decoder.ReadDouble().ShouldBe(1.5);
+    }
+
+    [Fact]
+    public void ReadStringUtf8MultiByte()
+    {
+        // The length prefix counts UTF-8 bytes, not chars. Build it with EncodeLong so the
+        // fixture stays valid if the sample text ever outgrows a one-byte varint.
+        var payload = System.Text.Encoding.UTF8.GetBytes("café 🦀");
+        byte[] bytes = [.. EncodeLong(payload.Length), .. payload];
+
+        var decoder = new BinaryDecoder(bytes);
+        decoder.ReadString().ShouldBe("café 🦀");
+    }
+
+    [Fact]
+    public void ReadStringEmpty()
+    {
+        byte[] bytes = [0x00];
+        var decoder = new BinaryDecoder(bytes);
+        decoder.ReadString().ShouldBe(string.Empty);
+    }
+
+    [Fact]
+    public void ReadBytesRoundTrip()
+    {
+        byte[] payload = [0xDE, 0xAD, 0xBE, 0xEF];
+        byte[] bytes = [.. EncodeLong(payload.Length), .. payload];
+
+        var decoder = new BinaryDecoder(bytes);
+        var result = decoder.ReadBytesSpan().ToArray();
+        result.ShouldBe(payload);
+    }
+
+    [Fact]
+    public void ReadBytesRejectsLengthBeyondInt32()
+    {
+        var bytes = EncodeLong((long)int.MaxValue + 1);
+        ShouldThrowFromDecoder(bytes, static (ref d) => d.ReadBytesSpan().ToArray());
+    }
+
+    [Fact]
+    public void ReadBlockCountPositiveCount()
+    {
+        byte[] bytes = [0x06];
+        var decoder = new BinaryDecoder(bytes);
+        decoder.ReadBlockCount().ShouldBe(3);
+    }
+
+    [Fact]
+    public void ReadBlockCountNegativeConsumesByteSizeHeader()
+    {
+        // 0x05 decodes to -3 (the count) and 0x54 to 42 (the block byte size). The decoder
+        // must report 3 and consume the size, leaving nothing in the buffer.
+        byte[] bytes = [0x05, 0x54];
+        var decoder = new BinaryDecoder(bytes);
+        decoder.ReadBlockCount().ShouldBe(3);
+        decoder.EndOfBuffer.ShouldBeTrue();
+    }
+
+    [Fact]
+    public void ReadBlockCountRejectsNegativeByteSizeHeader()
+    {
+        // Count -1 followed by a byte size that also decodes to -1.
+        byte[] bytes = [0x01, 0x01];
+        ShouldThrowFromDecoder(bytes, static (ref d) => d.ReadBlockCount());
+    }
+
+    [Fact]
+    public void ReadBlockCountZeroTerminates()
+    {
+        byte[] bytes = [0x00];
+        var decoder = new BinaryDecoder(bytes);
+        decoder.ReadBlockCount().ShouldBe(0);
+    }
+
+    [Fact]
+    public void ReadFixedReturnsExactSize()
+    {
+        byte[] bytes = [0x01, 0x02, 0x03, 0x04, 0x05];
+        var decoder = new BinaryDecoder(bytes);
+        ReadOnlySpan<byte> span = decoder.ReadFixed(3);
+        span.ToArray().ShouldBe([0x01, 0x02, 0x03]);
+        decoder.Position.ShouldBe(3);
+    }
+
+    [Fact]
+    public void ReadLongTruncatedVarintThrows()
+    {
+        // The only byte has its continuation bit set, so the varint never terminates.
+        byte[] bytes = [0x80];
+        ShouldThrowFromDecoder(bytes, static (ref d) => d.ReadLong());
+    }
+
+    [Fact]
+    public void ReadFixedTruncatedThrows()
+    {
+        byte[] bytes = [0x01, 0x02];
+        ShouldThrowFromDecoder(bytes, static (ref d) => d.ReadFixed(5).ToArray());
+    }
+
+    [Fact]
+    public void ReadFixedRejectsNegativeSize()
+    {
+        byte[] bytes = [0x01, 0x02];
+        ShouldThrowFromDecoder(bytes, static (ref d) => d.ReadFixed(-1).ToArray());
+    }
+
+    /// <summary>Callback that receives the decoder under test by reference.</summary>
+    private delegate void DecoderAction(ref BinaryDecoder d);
+
+    /// <summary>
+    /// Creates a fresh decoder over <paramref name="bytes"/>, runs <paramref name="action"/>
+    /// against it and asserts that an <see cref="AvroFormatException"/> is thrown.
+    /// </summary>
+    private static void ShouldThrowFromDecoder(byte[] bytes, DecoderAction action)
+    {
+        Should.Throw<AvroFormatException>(() =>
+        {
+            var decoder = new BinaryDecoder(bytes);
+            action(ref decoder);
+        });
+    }
+
+    /// <summary>
+    /// Reference encoder for fixtures: zig-zag encodes <paramref name="value"/> and emits
+    /// it as a varint, seven bits per byte, low-order group first.
+    /// </summary>
+    private static byte[] EncodeLong(long value)
+    {
+        var bytes = new List<byte>();
+        var zz = (ulong)((value << 1) ^ (value >> 63));
+        while ((zz & ~0x7FUL) != 0)
+        {
+            bytes.Add((byte)((zz & 0x7F) | 0x80));
+            zz >>= 7;
+        }
+
+        bytes.Add((byte)zz);
+        return [.. bytes];
+    }
+}
diff --git a/tests/IcebergSharp.Tests/Avro/Helpers/ManifestEncoder.cs b/tests/IcebergSharp.Tests/Avro/Helpers/ManifestEncoder.cs
new file mode 100644
index 0000000..b65ca8b
--- /dev/null
+++ b/tests/IcebergSharp.Tests/Avro/Helpers/ManifestEncoder.cs
@@ -0,0 +1,222 @@
+namespace IcebergSharp.Tests.Avro.Helpers;
+
+/// <summary>
+/// Encodes a minimal v1 / v2 Iceberg manifest OCF. The partition record is
+/// always an empty struct (unpartitioned table) — partition-tuple decoding is
+/// covered separately by tests that use a custom <see cref="MiniAvroEncoder"/>.
+/// </summary>
+internal static class ManifestEncoder
+{
+    /// <summary>Values written for one v1 <c>manifest_entry</c> row.</summary>
+    public sealed class V1Entry
+    {
+        public int Status { get; init; }
+        public long? SnapshotId { get; init; }
+        public string FilePath { get; init; } = "";
+        public string FileFormat { get; init; } = "PARQUET";
+        public long RecordCount { get; init; }
+        public long FileSizeInBytes { get; init; }
+    }
+
+    /// <summary>Values written for one v2 <c>manifest_entry</c> row; a null map is written as the union's null branch.</summary>
+    public sealed class V2Entry
+    {
+        public int Status { get; init; }
+        public long? SnapshotId { get; init; }
+        public long? SequenceNumber { get; init; }
+        public long? FileSequenceNumber { get; init; }
+        public int Content { get; init; }
+        public string FilePath { get; init; } = "";
+        public string FileFormat { get; init; } = "PARQUET";
+        public long RecordCount { get; init; }
+        public long FileSizeInBytes { get; init; }
+        public Dictionary<int, long>? ColumnSizes { get; init; }
+        public Dictionary<int, byte[]>? LowerBounds { get; init; }
+        public Dictionary<int, byte[]>? UpperBounds { get; init; }
+    }
+
+    /// <summary>Writer schema embedded in v1 fixtures; <see cref="EncodeV1"/> writes fields in this order.</summary>
+    public const string V1Schema = """
+    {
+      "type": "record",
+      "name": "manifest_entry",
+      "fields": [
+        { "name": "status", "type": "int", "field-id": 0 },
+        { "name": "snapshot_id", "type": ["null","long"], "default": null, "field-id": 1 },
+        { "name": "data_file", "field-id": 2, "type": {
+            "type": "record",
+            "name": "r102",
+            "fields": [
+              { "name": "file_path", "type": "string", "field-id": 100 },
+              { "name": "file_format", "type": "string", "field-id": 101 },
+              { "name": "partition", "type": { "type": "record", "name": "partition", "fields": [] }, "field-id": 102 },
+              { "name": "record_count", "type": "long", "field-id": 103 },
+              { "name": "file_size_in_bytes", "type": "long", "field-id": 104 },
+              { "name": "block_size_in_bytes", "type": "long", "field-id": 105 }
+            ]
+        } }
+      ]
+    }
+    """;
+
+    /// <summary>Writer schema embedded in v2 fixtures; <see cref="EncodeV2"/> writes fields in this order.</summary>
+    public const string V2Schema = """
+    {
+      "type": "record",
+      "name": "manifest_entry",
+      "fields": [
+        { "name": "status", "type": "int", "field-id": 0 },
+        { "name": "snapshot_id", "type": ["null","long"], "default": null, "field-id": 1 },
+        { "name": "sequence_number", "type": ["null","long"], "default": null, "field-id": 3 },
+        { "name": "file_sequence_number", "type": ["null","long"], "default": null, "field-id": 4 },
+        { "name": "data_file", "field-id": 2, "type": {
+            "type": "record",
+            "name": "r102",
+            "fields": [
+              { "name": "content", "type": "int", "field-id": 134 },
+              { "name": "file_path", "type": "string", "field-id": 100 },
+              { "name": "file_format", "type": "string", "field-id": 101 },
+              { "name": "partition", "type": { "type": "record", "name": "partition", "fields": [] }, "field-id": 102 },
+              { "name": "record_count", "type": "long", "field-id": 103 },
+              { "name": "file_size_in_bytes", "type": "long", "field-id": 104 },
+              { "name": "column_sizes", "type": ["null", {
+                  "type":"array", "items": {
+                    "type":"record", "name":"k117_v118", "fields":[
+                      { "name":"key", "type":"int", "field-id": 117 },
+                      { "name":"value", "type":"long", "field-id": 118 }
+                    ]
+                  }, "element-id": 119
+              }], "default": null, "field-id": 108 },
+              { "name": "lower_bounds", "type": ["null", {
+                  "type":"array", "items": {
+                    "type":"record", "name":"k126_v127", "fields":[
+                      { "name":"key", "type":"int", "field-id": 126 },
+                      { "name":"value", "type":"bytes", "field-id": 127 }
+                    ]
+                  }, "element-id": 138
+              }], "default": null, "field-id": 125 },
+              { "name": "upper_bounds", "type": ["null", {
+                  "type":"array", "items": {
+                    "type":"record", "name":"k129_v130", "fields":[
+                      { "name":"key", "type":"int", "field-id": 129 },
+                      { "name":"value", "type":"bytes", "field-id": 130 }
+                    ]
+                  }, "element-id": 139
+              }], "default": null, "field-id": 128 }
+            ]
+        } }
+      ]
+    }
+    """;
+
+    /// <summary>
+    /// Builds a v1 manifest OCF for <paramref name="entries"/> using <see cref="V1Schema"/>;
+    /// the file header carries <c>format-version</c> = "1".
+    /// </summary>
+    public static byte[] EncodeV1(IEnumerable<V1Entry> entries, string codec = "null")
+    {
+        using var enc = new MiniAvroEncoder(V1Schema, codec, new Dictionary<string, byte[]>
+        {
+            ["format-version"] = "1"u8.ToArray(),
+        });
+        foreach (V1Entry e in entries)
+        {
+            enc.StartRecord();
+            enc.WriteInt(e.Status);
+            WriteNullableLong(enc, e.SnapshotId);
+            // data_file
+            enc.WriteString(e.FilePath);
+            enc.WriteString(e.FileFormat);
+            // partition: empty struct (no fields written)
+            enc.WriteLong(e.RecordCount);
+            enc.WriteLong(e.FileSizeInBytes);
+            enc.WriteLong(0); // block_size_in_bytes (v1)
+        }
+
+        return enc.ToArray();
+    }
+
+    /// <summary>
+    /// Builds a v2 manifest OCF for <paramref name="entries"/> using <see cref="V2Schema"/>;
+    /// the file header carries <c>format-version</c> = "2".
+    /// </summary>
+    public static byte[] EncodeV2(IEnumerable<V2Entry> entries, string codec = "null")
+    {
+        using var enc = new MiniAvroEncoder(V2Schema, codec, new Dictionary<string, byte[]>
+        {
+            ["format-version"] = "2"u8.ToArray(),
+        });
+        foreach (V2Entry e in entries)
+        {
+            enc.StartRecord();
+            enc.WriteInt(e.Status);
+            WriteNullableLong(enc, e.SnapshotId);
+            WriteNullableLong(enc, e.SequenceNumber);
+            WriteNullableLong(enc, e.FileSequenceNumber);
+            // data_file
+            enc.WriteInt(e.Content);
+            enc.WriteString(e.FilePath);
+            enc.WriteString(e.FileFormat);
+            // partition: empty struct
+            enc.WriteLong(e.RecordCount);
+            enc.WriteLong(e.FileSizeInBytes);
+            WriteNullableIntLongMap(enc, e.ColumnSizes);
+            WriteNullableIntBytesMap(enc, e.LowerBounds);
+            WriteNullableIntBytesMap(enc, e.UpperBounds);
+        }
+
+        return enc.ToArray();
+    }
+
+    /// <summary>Writes a <c>["null","long"]</c> union value; the null branch is index 0.</summary>
+    private static void WriteNullableLong(MiniAvroEncoder enc, long? value)
+    {
+        if (value is null)
+        {
+            enc.WriteUnionNull(0);
+        }
+        else
+        {
+            enc.WriteUnionNonNull(0);
+            enc.WriteLong(value.Value);
+        }
+    }
+
+    /// <summary>Writes an optional int-to-long map as an array of key/value records.</summary>
+    private static void WriteNullableIntLongMap(MiniAvroEncoder enc, Dictionary<int, long>? map) =>
+        WriteNullableIntKeyedMap(enc, map, static (e, v) => e.WriteLong(v));
+
+    /// <summary>Writes an optional int-to-bytes map as an array of key/value records.</summary>
+    private static void WriteNullableIntBytesMap(MiniAvroEncoder enc, Dictionary<int, byte[]>? map) =>
+        WriteNullableIntKeyedMap(enc, map, static (e, v) => e.WriteBytes(v));
+
+    /// <summary>
+    /// Shared body of the map writers: the null branch when <paramref name="map"/> is null,
+    /// otherwise a single array block holding every pair (skipped when the map is empty)
+    /// followed by the zero-count terminator.
+    /// </summary>
+    private static void WriteNullableIntKeyedMap<TValue>(
+        MiniAvroEncoder enc,
+        Dictionary<int, TValue>? map,
+        Action<MiniAvroEncoder, TValue> writeValue)
+    {
+        if (map is null)
+        {
+            enc.WriteUnionNull(0);
+            return;
+        }
+
+        enc.WriteUnionNonNull(0);
+        if (map.Count > 0)
+        {
+            enc.StartArrayBlock(map.Count);
+            foreach ((int key, TValue value) in map)
+            {
+                enc.WriteInt(key);
+                writeValue(enc, value);
+            }
+        }
+
+        enc.EndArrayOrMap();
+    }
+}
diff --git a/tests/IcebergSharp.Tests/Avro/Helpers/ManifestListEncoder.cs b/tests/IcebergSharp.Tests/Avro/Helpers/ManifestListEncoder.cs
new file mode 100644
index 0000000..6ad8390
--- /dev/null
+++ b/tests/IcebergSharp.Tests/Avro/Helpers/ManifestListEncoder.cs
@@ -0,0 +1,150 @@
+namespace IcebergSharp.Tests.Avro.Helpers;
+
+/// <summary>
+/// Test helper that produces a small v1 or v2 Iceberg manifest_list OCF via
+/// <see cref="MiniAvroEncoder"/>. The embedded schemas are meant to track the
+/// Iceberg spec; add another helper here when a test needs a field that these
+/// entries do not carry.
+/// </summary>
+internal static class ManifestListEncoder
+{
+    /// <summary>Writer schema for v1 fixtures; snapshot id and file counts are <c>["null", T]</c> unions.</summary>
+    public const string V1Schema = """
+    {
+      "type": "record",
+      "name": "manifest_file",
+      "fields": [
+        { "name": "manifest_path", "type": "string", "field-id": 500 },
+        { "name": "manifest_length", "type": "long", "field-id": 501 },
+        { "name": "partition_spec_id", "type": "int", "field-id": 502 },
+        { "name": "added_snapshot_id", "type": ["null", "long"], "default": null, "field-id": 503 },
+        { "name": "added_data_files_count", "type": ["null", "int"], "default": null, "field-id": 504 },
+        { "name": "existing_data_files_count", "type": ["null", "int"], "default": null, "field-id": 505 },
+        { "name": "deleted_data_files_count", "type": ["null", "int"], "default": null, "field-id": 506 }
+      ]
+    }
+    """;
+
+    /// <summary>Writer schema for v2 fixtures; every field is a plain (non-union) type.</summary>
+    public const string V2Schema = """
+    {
+      "type": "record",
+      "name": "manifest_file",
+      "fields": [
+        { "name": "manifest_path", "type": "string", "field-id": 500 },
+        { "name": "manifest_length", "type": "long", "field-id": 501 },
+        { "name": "partition_spec_id", "type": "int", "field-id": 502 },
+        { "name": "content", "type": "int", "field-id": 517 },
+        { "name": "sequence_number", "type": "long", "field-id": 515 },
+        { "name": "min_sequence_number", "type": "long", "field-id": 516 },
+        { "name": "added_snapshot_id", "type": "long", "field-id": 503 },
+        { "name": "added_data_files_count", "type": "int", "field-id": 504 },
+        { "name": "existing_data_files_count", "type": "int", "field-id": 505 },
+        { "name": "deleted_data_files_count", "type": "int", "field-id": 506 },
+        { "name": "added_rows_count", "type": "long", "field-id": 512 },
+        { "name": "existing_rows_count", "type": "long", "field-id": 513 },
+        { "name": "deleted_rows_count", "type": "long", "field-id": 514 }
+      ]
+    }
+    """;
+
+    /// <summary>One row of a v1 manifest list; nullable members map to the schema's union fields.</summary>
+    public sealed class V1Entry
+    {
+        public string ManifestPath { get; init; } = "";
+        public long ManifestLength { get; init; }
+        public int PartitionSpecId { get; init; }
+        public long? AddedSnapshotId { get; init; }
+        public int? AddedFilesCount { get; init; }
+        public int? ExistingFilesCount { get; init; }
+        public int? DeletedFilesCount { get; init; }
+    }
+
+    /// <summary>One row of a v2 manifest list.</summary>
+    public sealed class V2Entry
+    {
+        public string ManifestPath { get; init; } = "";
+        public long ManifestLength { get; init; }
+        public int PartitionSpecId { get; init; }
+        public int Content { get; init; }
+        public long SequenceNumber { get; init; }
+        public long MinSequenceNumber { get; init; }
+        public long AddedSnapshotId { get; init; }
+        public int AddedFilesCount { get; init; }
+        public int ExistingFilesCount { get; init; }
+        public int DeletedFilesCount { get; init; }
+        public long AddedRowsCount { get; init; }
+        public long ExistingRowsCount { get; init; }
+        public long DeletedRowsCount { get; init; }
+    }
+
+    /// <summary>Encodes <paramref name="entries"/> against <see cref="V1Schema"/> and returns the OCF bytes.</summary>
+    public static byte[] EncodeV1(IEnumerable<V1Entry> entries, string codec = "null")
+    {
+        using var writer = new MiniAvroEncoder(V1Schema, codec);
+        foreach (V1Entry row in entries)
+        {
+            writer.StartRecord();
+            writer.WriteString(row.ManifestPath);
+            writer.WriteLong(row.ManifestLength);
+            writer.WriteInt(row.PartitionSpecId);
+            WriteNullableLong(writer, row.AddedSnapshotId);
+            WriteNullableInt(writer, row.AddedFilesCount);
+            WriteNullableInt(writer, row.ExistingFilesCount);
+            WriteNullableInt(writer, row.DeletedFilesCount);
+        }
+
+        return writer.ToArray();
+    }
+
+    /// <summary>Encodes <paramref name="entries"/> against <see cref="V2Schema"/> and returns the OCF bytes.</summary>
+    public static byte[] EncodeV2(IEnumerable<V2Entry> entries, string codec = "null")
+    {
+        using var writer = new MiniAvroEncoder(V2Schema, codec);
+        foreach (V2Entry row in entries)
+        {
+            writer.StartRecord();
+            writer.WriteString(row.ManifestPath);
+            writer.WriteLong(row.ManifestLength);
+            writer.WriteInt(row.PartitionSpecId);
+            writer.WriteInt(row.Content);
+            writer.WriteLong(row.SequenceNumber);
+            writer.WriteLong(row.MinSequenceNumber);
+            writer.WriteLong(row.AddedSnapshotId);
+            writer.WriteInt(row.AddedFilesCount);
+            writer.WriteInt(row.ExistingFilesCount);
+            writer.WriteInt(row.DeletedFilesCount);
+            writer.WriteLong(row.AddedRowsCount);
+            writer.WriteLong(row.ExistingRowsCount);
+            writer.WriteLong(row.DeletedRowsCount);
+        }
+
+        return writer.ToArray();
+    }
+
+    /// <summary>Emits a nullable long: the branch tag first, then the value when present (null is branch 0).</summary>
+    private static void WriteNullableLong(MiniAvroEncoder enc, long? value)
+    {
+        if (value is long present)
+        {
+            enc.WriteUnionNonNull(0);
+            enc.WriteLong(present);
+            return;
+        }
+
+        enc.WriteUnionNull(0);
+    }
+
+    /// <summary>Emits a nullable int: the branch tag first, then the value when present (null is branch 0).</summary>
+    private static void WriteNullableInt(MiniAvroEncoder enc, int? value)
+    {
+        if (value is int present)
+        {
+            enc.WriteUnionNonNull(0);
+            enc.WriteInt(present);
+            return;
+        }
+
+        enc.WriteUnionNull(0);
+    }
+}
diff --git a/tests/IcebergSharp.Tests/Avro/Helpers/MiniAvroEncoder.cs b/tests/IcebergSharp.Tests/Avro/Helpers/MiniAvroEncoder.cs
new file mode 100644
index 0000000..b34f9f8
--- /dev/null
+++ b/tests/IcebergSharp.Tests/Avro/Helpers/MiniAvroEncoder.cs
@@ -0,0 +1,207 @@
+using System.Buffers.Binary;
+using System.IO.Compression;
+using System.Text;
+
+namespace IcebergSharp.Tests.Avro.Helpers;
+
+/// <summary>
+/// Bare-bones Avro OCF writer used by Phase 2 tests to build fixtures in
+/// memory. Derived directly from the Avro 1.11 spec sections "Binary Encoding"
+/// and "Object Container Files" — intentionally independent of the
+/// IcebergSharp.Avro reader's internal model so a bug in the reader cannot
+/// silently masquerade as correctness here.
+/// </summary>
+/// <remarks>
+/// Supports: null + deflate codec, primitive types (boolean, int, long, float,
+/// double, bytes, string), fixed, records, arrays, maps (as Iceberg-style
+/// array&lt;kv-record&gt;), union[null, T]. Not a general encoder.
+/// </remarks>
+internal sealed class MiniAvroEncoder : IDisposable
+{
+    // Container-file magic: 'O', 'b', 'j', then the byte 0x01.
+    private static readonly byte[] _magic = "Obj\x01"u8.ToArray();
+
+    // Fixed 16-byte sync marker written after the header and after every block.
+    private static readonly byte[] _sync =
+    [
+        0x10, 0x11, 0x12, 0x13, 0x14, 0x15, 0x16, 0x17,
+        0x18, 0x19, 0x1A, 0x1B, 0x1C, 0x1D, 0x1E, 0x1F,
+    ];
+
+    // Finished file bytes: the header followed by every flushed block.
+    private readonly MemoryStream _output = new();
+
+    // Uncompressed datum bytes of the block currently being assembled.
+    private readonly MemoryStream _blockBody = new();
+    private readonly string _codec;
+
+    // StartRecord calls since the last flush; written as the block's object count.
+    private int _recordCount;
+
+    /// <summary>
+    /// Starts a new container file by writing its header.
+    /// </summary>
+    /// <param name="schemaJson">Writer schema stored under the <c>avro.schema</c> metadata key.</param>
+    /// <param name="codec">Block codec, either <c>"null"</c> or <c>"deflate"</c>.</param>
+    /// <param name="extraMetadata">Extra header entries, appended after the two <c>avro.*</c> keys.</param>
+    /// <exception cref="ArgumentException"><paramref name="codec"/> is not a supported codec.</exception>
+    public MiniAvroEncoder(string schemaJson, string codec = "null", IDictionary<string, byte[]>? extraMetadata = null)
+    {
+        if (codec is not ("null" or "deflate"))
+        {
+            throw new ArgumentException($"unsupported codec '{codec}'", nameof(codec));
+        }
+
+        _codec = codec;
+        WriteHeader(schemaJson, codec, extraMetadata);
+    }
+
+    /// <summary>Flushes any pending records as a final block and returns the whole file.</summary>
+    public byte[] ToArray()
+    {
+        FlushBlock(); // no-op when nothing is pending
+        return _output.ToArray();
+    }
+
+    /// <summary>Counts one more datum in the current block; the caller then writes its fields in schema order.</summary>
+    public void StartRecord() => _recordCount++;
+
+    public void WriteBoolean(bool value) => _blockBody.WriteByte((byte)(value ? 1 : 0));
+
+    /// <summary>Writes an int using the same zig-zag varint encoding as <see cref="WriteLong"/>.</summary>
+    public void WriteInt(int value) => WriteLong(value);
+
+    public void WriteLong(long value) => WriteVarLong(_blockBody, value);
+
+    public void WriteFloat(float value)
+    {
+        Span<byte> b = stackalloc byte[4];
+        BinaryPrimitives.WriteSingleLittleEndian(b, value);
+        _blockBody.Write(b);
+    }
+
+    public void WriteDouble(double value)
+    {
+        Span<byte> b = stackalloc byte[8];
+        BinaryPrimitives.WriteDoubleLittleEndian(b, value);
+        _blockBody.Write(b);
+    }
+
+    /// <summary>Writes the UTF-8 byte length followed by the UTF-8 bytes.</summary>
+    public void WriteString(string value)
+    {
+        var bytes = Encoding.UTF8.GetBytes(value);
+        WriteLong(bytes.Length);
+        _blockBody.Write(bytes);
+    }
+
+    /// <summary>Writes a length prefix followed by the raw bytes.</summary>
+    public void WriteBytes(ReadOnlySpan<byte> value)
+    {
+        WriteLong(value.Length);
+        _blockBody.Write(value);
+    }
+
+    /// <summary>Writes the bytes as-is, with no length prefix.</summary>
+    public void WriteFixed(ReadOnlySpan<byte> value) => _blockBody.Write(value);
+
+    /// <summary>Writes the null branch of a [null, T] union.</summary>
+    public void WriteUnionNull(int nullBranchIndex) => WriteLong(nullBranchIndex);
+
+    /// <summary>Writes the non-null branch tag of a [null, T] union; the caller writes the value next.</summary>
+    public void WriteUnionNonNull(int nullBranchIndex) => WriteLong(nullBranchIndex == 0 ? 1 : 0);
+
+    /// <summary>Writes a single-block array prefix; caller writes <paramref name="count"/> items and then calls <see cref="EndArrayOrMap"/>.</summary>
+    public void StartArrayBlock(long count) => WriteLong(count);
+
+    /// <summary>Writes the zero block count that ends an array or map.</summary>
+    public void EndArrayOrMap() => WriteLong(0);
+
+    /// <summary>
+    /// Emits the pending records as one data block (object count, payload byte length,
+    /// payload, sync marker) and resets the block buffer. Does nothing when no record
+    /// has been started since the previous flush.
+    /// </summary>
+    public void FlushBlock()
+    {
+        if (_recordCount == 0)
+        {
+            return;
+        }
+
+        var body = _blockBody.ToArray();
+        var payload = _codec == "deflate" ? Deflate(body) : body;
+
+        WriteVarLong(_output, _recordCount);
+        WriteVarLong(_output, payload.Length);
+        _output.Write(payload);
+        _output.Write(_sync);
+
+        _blockBody.SetLength(0);
+        _recordCount = 0;
+    }
+
+    public void Dispose()
+    {
+        _output.Dispose();
+        _blockBody.Dispose();
+    }
+
+    /// <summary>Writes the magic bytes, the metadata map and the sync marker; called once, from the constructor.</summary>
+    private void WriteHeader(string schemaJson, string codec, IDictionary<string, byte[]>? extraMetadata)
+    {
+        _output.Write(_magic);
+
+        // Metadata map: encoded as one positive-count block followed by the zero-count terminator.
+        var keys = new List<KeyValuePair<string, byte[]>>
+        {
+            new("avro.schema", Encoding.UTF8.GetBytes(schemaJson)),
+            new("avro.codec", Encoding.UTF8.GetBytes(codec)),
+        };
+        if (extraMetadata is not null)
+        {
+            keys.AddRange(extraMetadata);
+        }
+
+        WriteVarLong(_output, keys.Count);
+        foreach (KeyValuePair<string, byte[]> kv in keys)
+        {
+            var keyBytes = Encoding.UTF8.GetBytes(kv.Key);
+            WriteVarLong(_output, keyBytes.Length);
+            _output.Write(keyBytes);
+            WriteVarLong(_output, kv.Value.Length);
+            _output.Write(kv.Value);
+        }
+
+        WriteVarLong(_output, 0);
+
+        _output.Write(_sync);
+    }
+
+    /// <summary>Zig-zag encodes <paramref name="value"/> and writes it to <paramref name="s"/> as a varint.</summary>
+    private static void WriteVarLong(Stream s, long value)
+    {
+        // Zig-zag folds the sign into bit 0 so small magnitudes of either sign stay short.
+        var zz = (ulong)((value << 1) ^ (value >> 63));
+        while ((zz & ~0x7FUL) != 0)
+        {
+            s.WriteByte((byte)((zz & 0x7F) | 0x80));
+            zz >>= 7;
+        }
+
+        s.WriteByte((byte)zz);
+    }
+
+    /// <summary>Compresses <paramref name="body"/> with <see cref="DeflateStream"/> and returns the compressed bytes.</summary>
+    private static byte[] Deflate(byte[] body)
+    {
+        using var ms = new MemoryStream();
+        // The DeflateStream is disposed before ms is read so the final compressed bytes are flushed.
+        using (var ds = new DeflateStream(ms, CompressionLevel.Fastest, leaveOpen: true))
+        {
+            ds.Write(body);
+        }
+
+        return ms.ToArray();
+    }
+}
diff --git a/tests/IcebergSharp.Tests/Avro/ManifestListReaderTests.cs b/tests/IcebergSharp.Tests/Avro/ManifestListReaderTests.cs
new file mode 100644
index 0000000..3b75cbb
--- /dev/null
+++ b/tests/IcebergSharp.Tests/Avro/ManifestListReaderTests.cs
@@ -0,0 +1,204 @@
+using IcebergSharp.Avro;
+using IcebergSharp.Tests.Avro.Helpers;
+using Shouldly;
+using Xunit;
+
+namespace IcebergSharp.Tests.Avro;
+
+/// <summary>
+/// Feeds manifest lists produced by <see cref="ManifestListEncoder"/> through
+/// <see cref="ManifestListReader"/> and checks the decoded <see cref="ManifestFile"/> rows.
+/// </summary>
+public sealed class ManifestListReaderTests
+{
+    // Content kinds, in file order, expected by ReadsV2ManifestListWithMixedContent.
+    private static readonly ManifestContent[] _expectedMixedContent =
+    [
+        ManifestContent.Data, ManifestContent.Data, ManifestContent.Deletes,
+    ];
+
+    [Fact]
+    public async Task ReadsV1ManifestListNullCodec()
+    {
+        ManifestListEncoder.V1Entry[] entries =
+        [
+            new()
+            {
+                ManifestPath = "s3://lake/m1.avro",
+                ManifestLength = 1234,
+                PartitionSpecId = 0,
+                AddedSnapshotId = 100,
+                AddedFilesCount = 2,
+                ExistingFilesCount = 0,
+                DeletedFilesCount = 0,
+            },
+            new()
+            {
+                ManifestPath = "s3://lake/m2.avro",
+                ManifestLength = 4321,
+                PartitionSpecId = 0,
+                AddedSnapshotId = 101,
+                AddedFilesCount = 0,
+                ExistingFilesCount = 3,
+                DeletedFilesCount = 1,
+            },
+        ];
+
+        var ocf = ManifestListEncoder.EncodeV1(entries);
+        using var input = new MemoryStream(ocf);
+        List<ManifestFile> manifests = await ToListAsync(ManifestListReader.ReadAsync(input));
+
+        manifests.Count.ShouldBe(2);
+
+        ManifestFile first = manifests[0];
+        first.ManifestPath.ShouldBe("s3://lake/m1.avro");
+        first.ManifestLength.ShouldBe(1234);
+        first.AddedSnapshotId.ShouldBe(100);
+        first.AddedFilesCount.ShouldBe(2);
+        first.FormatVersion.ShouldBe(1);
+        first.Content.ShouldBe(ManifestContent.Data);
+
+        ManifestFile second = manifests[1];
+        second.ManifestPath.ShouldBe("s3://lake/m2.avro");
+        second.DeletedFilesCount.ShouldBe(1);
+    }
+
+    [Fact]
+    public async Task ReadsV1ManifestListWithDeflateCodec()
+    {
+        ManifestListEncoder.V1Entry[] entries =
+        [
+            new()
+            {
+                ManifestPath = "s3://lake/compressed.avro",
+                ManifestLength = 999,
+                PartitionSpecId = 0,
+                AddedSnapshotId = 200,
+                AddedFilesCount = 5,
+                ExistingFilesCount = 5,
+                DeletedFilesCount = 0,
+            },
+        ];
+
+        var ocf = ManifestListEncoder.EncodeV1(entries, codec: "deflate");
+        using var input = new MemoryStream(ocf);
+        List<ManifestFile> manifests = await ToListAsync(ManifestListReader.ReadAsync(input));
+
+        manifests.Count.ShouldBe(1);
+        ManifestFile only = manifests[0];
+        only.ManifestPath.ShouldBe("s3://lake/compressed.avro");
+        only.AddedFilesCount.ShouldBe(5);
+        only.ExistingFilesCount.ShouldBe(5);
+    }
+
+    [Fact]
+    public async Task ReadsV2ManifestListWithMixedContent()
+    {
+        ManifestListEncoder.V2Entry[] entries =
+        [
+            new()
+            {
+                ManifestPath = "s3://lake/data-1.avro",
+                ManifestLength = 1000,
+                PartitionSpecId = 0,
+                Content = 0,
+                SequenceNumber = 1,
+                MinSequenceNumber = 1,
+                AddedSnapshotId = 100,
+                AddedFilesCount = 1,
+                ExistingFilesCount = 0,
+                DeletedFilesCount = 0,
+                AddedRowsCount = 100,
+                ExistingRowsCount = 0,
+                DeletedRowsCount = 0,
+            },
+            new()
+            {
+                ManifestPath = "s3://lake/data-2.avro",
+                ManifestLength = 1200,
+                PartitionSpecId = 0,
+                Content = 0,
+                SequenceNumber = 2,
+                MinSequenceNumber = 2,
+                AddedSnapshotId = 101,
+                AddedFilesCount = 0,
+                ExistingFilesCount = 1,
+                DeletedFilesCount = 0,
+                AddedRowsCount = 0,
+                ExistingRowsCount = 50,
+                DeletedRowsCount = 0,
+            },
+            new()
+            {
+                ManifestPath = "s3://lake/deletes-1.avro",
+                ManifestLength = 500,
+                PartitionSpecId = 0,
+                Content = 1, // delete
+                SequenceNumber = 2,
+                MinSequenceNumber = 2,
+                AddedSnapshotId = 101,
+                AddedFilesCount = 1,
+                ExistingFilesCount = 0,
+                DeletedFilesCount = 0,
+                AddedRowsCount = 10,
+                ExistingRowsCount = 0,
+                DeletedRowsCount = 0,
+            },
+        ];
+
+        var ocf = ManifestListEncoder.EncodeV2(entries, codec: "deflate");
+        using var input = new MemoryStream(ocf);
+        List<ManifestFile> manifests = await ToListAsync(ManifestListReader.ReadAsync(input));
+
+        manifests.Count.ShouldBe(3);
+        manifests.Select(m => m.Content).ShouldBe(_expectedMixedContent);
+        manifests.Select(m => m.FormatVersion).ShouldAllBe(v => v == 2);
+
+        ManifestFile deletes = manifests[2];
+        deletes.ManifestPath.ShouldBe("s3://lake/deletes-1.avro");
+        deletes.AddedRowsCount.ShouldBe(10);
+    }
+
+    [Fact]
+    public async Task StreamCanBeReplayedAfterPositionReset()
+    {
+        ManifestListEncoder.V1Entry[] entries =
+        [
+            new()
+            {
+                ManifestPath = "s3://lake/m.avro",
+                ManifestLength = 100,
+                PartitionSpecId = 0,
+                AddedSnapshotId = 1,
+                AddedFilesCount = 1,
+                ExistingFilesCount = 0,
+                DeletedFilesCount = 0,
+            },
+        ];
+
+        var ocf = ManifestListEncoder.EncodeV1(entries);
+        using var input = new MemoryStream(ocf);
+
+        // The first pass asks the reader to leave the stream open so it can be rewound and read again.
+        var keepOpen = new ManifestListReadOptions { LeaveOpen = true };
+        List<ManifestFile> firstPass = await ToListAsync(ManifestListReader.ReadAsync(input, keepOpen));
+        input.Position = 0;
+        List<ManifestFile> secondPass = await ToListAsync(ManifestListReader.ReadAsync(input));
+
+        firstPass.Count.ShouldBe(1);
+        secondPass.Count.ShouldBe(1);
+        firstPass[0].ManifestPath.ShouldBe(secondPass[0].ManifestPath);
+    }
+
+    /// <summary>Drains <paramref name="source"/> into a list, preserving enumeration order.</summary>
+    private static async Task<List<T>> ToListAsync<T>(IAsyncEnumerable<T> source)
+    {
+        List<T> items = [];
+        await foreach (T item in source)
+        {
+            items.Add(item);
+        }
+
+        return items;
+    }
+}
diff --git a/tests/IcebergSharp.Tests/Avro/ManifestReaderTests.cs b/tests/IcebergSharp.Tests/Avro/ManifestReaderTests.cs
new file mode 100644
index 0000000..da85555
--- /dev/null
+++ b/tests/IcebergSharp.Tests/Avro/ManifestReaderTests.cs
@@ -0,0 +1,164 @@
+using IcebergSharp.Avro;
+using IcebergSharp.Tests.Avro.Helpers;
+using Shouldly;
+using Xunit;
+
+namespace IcebergSharp.Tests.Avro;
+
+public sealed class ManifestReaderTests
+{
+    [Fact]
+    public async Task ReadsV1ManifestWithMixedStatus()
+    {
+        ManifestEncoder.V1Entry[] entries =
+        [
+            new ManifestEncoder.V1Entry
+            {
+                Status = 1, // Added
+                SnapshotId = 100,
+                FilePath = "s3://lake/data/file-a.parquet",
+                RecordCount = 1000,
+                FileSizeInBytes = 5_000_000,
+            },
+            new ManifestEncoder.V1Entry
+            {
+                Status = 0, // Existing
+                SnapshotId = 99,
+                FilePath = "s3://lake/data/file-b.parquet",
+                RecordCount = 500,
+                FileSizeInBytes = 2_500_000,
+            },
+            new ManifestEncoder.V1Entry
+            {
+                Status = 0, // Existing
+                SnapshotId = 99,
+                FilePath = "s3://lake/data/file-c.parquet",
+                RecordCount = 200,
+                FileSizeInBytes = 1_000_000,
+            },
+            new ManifestEncoder.V1Entry
+            {
+                Status = 2, // Deleted
+                SnapshotId = 100,
+                FilePath = "s3://lake/data/file-d.parquet",
+                RecordCount = 50,
+                FileSizeInBytes = 250_000,
+            },
+        ];
+        // Encode the four entries as a v1 manifest and read every entry back from an in-memory stream.
+        var bytes = ManifestEncoder.EncodeV1(entries);
+        using var stream = new MemoryStream(bytes);
+        List<ManifestEntry> result = await ToListAsync(ManifestReader.ReadAsync(stream));
+
+        result.Count.ShouldBe(4);
+        result[0].Status.ShouldBe(ManifestEntryStatus.Added); // statuses are expected back in input order
+        result[1].Status.ShouldBe(ManifestEntryStatus.Existing);
+        result[2].Status.ShouldBe(ManifestEntryStatus.Existing);
+        result[3].Status.ShouldBe(ManifestEntryStatus.Deleted);
+        // Only the first entry's data file is checked field by field.
+        result[0].DataFile.FilePath.ShouldBe("s3://lake/data/file-a.parquet");
+        result[0].DataFile.FileFormat.ShouldBe(DataFileFormat.Parquet); // not set on the V1Entry above; presumably supplied by the test encoder (confirm)
+        result[0].DataFile.RecordCount.ShouldBe(1000);
+        result[0].DataFile.Partition.Count.ShouldBe(0); // no partition values were supplied above
+        result[0].DataFile.Content.ShouldBe(DataFileContent.Data); // v1 default
+    }
+
+    [Fact]
+    public async Task ReadsV2ManifestWithStatsAndBounds()
+    {
+        var entry = new ManifestEncoder.V2Entry
+        {
+            Status = 1, // Added (asserted below)
+            SnapshotId = 100,
+            SequenceNumber = 1,
+            FileSequenceNumber = 1,
+            Content = 0,
+            FilePath = "s3://lake/data/file.parquet",
+            RecordCount = 1000,
+            FileSizeInBytes = 5_000_000,
+            ColumnSizes = new() { { 1, 100 }, { 2, 200 } }, // keys 1 and 2 are looked up again in the assertions
+            LowerBounds = new() { { 1, [0x00, 0x00, 0x00, 0x01] } }, // raw bytes; only round-tripping is checked
+            UpperBounds = new() { { 1, [0x00, 0x00, 0x03, 0xE8] } },
+        };
+        // Encode a single-entry v2 manifest and read it back from an in-memory stream.
+        var bytes = ManifestEncoder.EncodeV2([entry]);
+        using var stream = new MemoryStream(bytes);
+        List<ManifestEntry> result = await ToListAsync(ManifestReader.ReadAsync(stream));
+
+        result.Count.ShouldBe(1);
+        ManifestEntry e = result[0];
+        e.Status.ShouldBe(ManifestEntryStatus.Added);
+        e.SnapshotId.ShouldBe(100);
+        e.SequenceNumber.ShouldBe(1);
+        e.FileSequenceNumber.ShouldBe(1);
+        e.DataFile.RecordCount.ShouldBe(1000);
+        e.DataFile.ColumnSizes.Count.ShouldBe(2);
+        e.DataFile.ColumnSizes[1].ShouldBe(100);
+        e.DataFile.ColumnSizes[2].ShouldBe(200);
+        e.DataFile.LowerBounds[1].Span.ToArray().ShouldBe([0x00, 0x00, 0x00, 0x01]); // bounds must come back byte-for-byte
+        e.DataFile.UpperBounds[1].Span.ToArray().ShouldBe([0x00, 0x00, 0x03, 0xE8]);
+    }
+
+    [Fact]
+    public async Task ReadsV2DeleteContentEntriesUnfiltered()
+    {
+        ManifestEncoder.V2Entry[] entries =
+        [
+            new ManifestEncoder.V2Entry
+            {
+                Status = 1, SnapshotId = 100, SequenceNumber = 1, FileSequenceNumber = 1,
+                Content = 1, // PositionDeletes
+                FilePath = "s3://lake/deletes/d.parquet",
+                RecordCount = 10, FileSizeInBytes = 5000,
+            },
+            new ManifestEncoder.V2Entry
+            {
+                Status = 1, SnapshotId = 100, SequenceNumber = 1, FileSequenceNumber = 1,
+                Content = 2, // EqualityDeletes
+                FilePath = "s3://lake/deletes/e.parquet",
+                RecordCount = 5, FileSizeInBytes = 2000,
+            },
+        ];
+        // Encode with the "deflate" codec and read back through the default ReadAsync overload.
+        var bytes = ManifestEncoder.EncodeV2(entries, codec: "deflate");
+        using var stream = new MemoryStream(bytes);
+        List<ManifestEntry> result = await ToListAsync(ManifestReader.ReadAsync(stream));
+
+        result.Count.ShouldBe(2); // both delete-content entries must be returned, none dropped
+        result[0].DataFile.Content.ShouldBe(DataFileContent.PositionDeletes);
+        result[1].DataFile.Content.ShouldBe(DataFileContent.EqualityDeletes);
+    }
+
+    [Fact]
+    public async Task StreamReplayAfterPositionReset()
+    {
+        var entry = new ManifestEncoder.V1Entry
+        {
+            Status = 1,
+            SnapshotId = 1,
+            FilePath = "s3://lake/x.parquet",
+            RecordCount = 1,
+            FileSizeInBytes = 1,
+        };
+        using var stream = new MemoryStream(ManifestEncoder.EncodeV1([entry]));
+        List<ManifestEntry> first = await ToListAsync(ManifestReader.ReadAsync(stream, new ManifestReadOptions { LeaveOpen = true })); // LeaveOpen so the stream can be reused
+        stream.Position = 0; // rewind to the start of the encoded bytes
+        List<ManifestEntry> second = await ToListAsync(ManifestReader.ReadAsync(stream));
+
+        first.Count.ShouldBe(1);
+        second.Count.ShouldBe(1);
+        first[0].DataFile.FilePath.ShouldBe("s3://lake/x.parquet"); // pinned to the encoded value, not just to the other pass
+        second[0].DataFile.FilePath.ShouldBe("s3://lake/x.parquet");
+    }
+
+    private static async Task<List<T>> ToListAsync<T>(IAsyncEnumerable<T> source)
+    {
+        var collected = new List<T>(); // filled in enumeration order so tests can index into it
+        await foreach (T element in source)
+        {
+            collected.Add(element);
+        }
+
+        return collected;
+    }
+}
diff --git a/tests/IcebergSharp.Tests/Avro/OcfHeaderTests.cs b/tests/IcebergSharp.Tests/Avro/OcfHeaderTests.cs
new file mode 100644
index 0000000..b6f17d2
--- /dev/null
+++ b/tests/IcebergSharp.Tests/Avro/OcfHeaderTests.cs
@@ -0,0 +1,132 @@
+using System.Text;
+using IcebergSharp.Avro.Internal.Errors;
+using IcebergSharp.Avro.Internal.Ocf;
+using IcebergSharp.Tests.Avro.Helpers;
+using Shouldly;
+using Xunit;
+
+namespace IcebergSharp.Tests.Avro;
+
+public sealed class OcfHeaderTests
+{
+    [Fact]
+    public async Task InitializeReadsSchemaAndCodecFromMetadata()
+    {
+        const string Schema = """{"type":"record","name":"r","fields":[{"name":"x","type":"long","field-id":1}]}""";
+        using var encoder = new MiniAvroEncoder(Schema, "null");
+        encoder.StartRecord();
+        encoder.WriteLong(42);
+        // Only the header is inspected here; the record written above is never decoded by this test.
+        using var input = new MemoryStream(encoder.ToArray());
+        await using var ocf = new OcfReader(input, leaveOpen: true, maxBlockSize: 1024);
+        await ocf.InitializeAsync(default);
+
+        ocf.Header.SchemaJson.ShouldBe(Schema); // schema JSON must come back verbatim
+        ocf.Header.Codec.ShouldBe("null");
+        ocf.Header.Sync.Length.ShouldBe(16); // sync marker length
+    }
+
+    [Fact]
+    public async Task InitializeSupportsDeflateCodec()
+    {
+        const string Schema = """{"type":"record","name":"r","fields":[{"name":"x","type":"long","field-id":1}]}""";
+        using var encoder = new MiniAvroEncoder(Schema, "deflate");
+        encoder.StartRecord();
+        encoder.WriteLong(7);
+
+        using var input = new MemoryStream(encoder.ToArray());
+        await using var ocf = new OcfReader(input, leaveOpen: true, maxBlockSize: 1024);
+        await ocf.InitializeAsync(default);
+        ocf.Header.Codec.ShouldBe("deflate"); // initialization succeeded and reports the codec the encoder was given
+    }
+
+    [Fact]
+    public async Task InitializeRejectsNegativeMetadataBlockByteSize()
+    {
+        var bytes = new List<byte>();
+        bytes.AddRange("Obj\x01"u8); // container magic
+        WriteLong(bytes, -1); // negative count: one metadata entry, with a block byte size to follow
+        WriteLong(bytes, -1); // invalid negative block byte size
+        // Nothing else is written: the hand-built header ends right after the bad size.
+        using var stream = new MemoryStream([.. bytes]);
+        await using var reader = new OcfReader(stream, leaveOpen: true, maxBlockSize: 1024);
+        await Should.ThrowAsync<AvroFormatException>(async () => await reader.InitializeAsync(default));
+    }
+
+    [Fact]
+    public async Task InitializeRejectsOversizedMetadataValueBeforeAllocating()
+    {
+        var bytes = new List<byte>();
+        bytes.AddRange("Obj\x01"u8); // container magic
+        WriteLong(bytes, 1); // one metadata entry
+        WriteString(bytes, "avro.schema"); // metadata key
+        WriteLong(bytes, 16 * 1024 * 1024 + 1L); // declared value length of 16 MiB + 1; presumably one past the reader's cap (confirm)
+        // No value bytes follow the declared length, so the reader has to fail on the length itself.
+        using var stream = new MemoryStream([.. bytes]);
+        await using var reader = new OcfReader(stream, leaveOpen: true, maxBlockSize: 1024);
+        await Should.ThrowAsync<AvroFormatException>(async () => await reader.InitializeAsync(default));
+    }
+
+    [Fact]
+    public async Task ReadNextBlockRejectsRecordCountAboveConfiguredLimit()
+    {
+        const string Schema = """{"type":"record","name":"r","fields":[{"name":"x","type":"long","field-id":1}]}""";
+        using var encoder = new MiniAvroEncoder(Schema, "null");
+        encoder.StartRecord(); // first record
+        encoder.WriteLong(1);
+        encoder.StartRecord(); // second record: one more than the limit configured below
+        encoder.WriteLong(2);
+
+        using var input = new MemoryStream(encoder.ToArray());
+        await using var ocf = new OcfReader(input, leaveOpen: true, maxBlockSize: 1024, maxBlockRecordCount: 1);
+        await ocf.InitializeAsync(default); // the header itself is valid, so this must succeed
+
+        await Should.ThrowAsync<AvroFormatException>(async () => await ocf.ReadNextBlockAsync(default));
+    }
+
+    [Fact]
+    public async Task InitializeRejectsBadMagic()
+    {
+        byte[] bytes = [(byte)'O', (byte)'b', (byte)'j', 0x02 /* wrong */]; // the other tests in this class start with "Obj\x01"
+        using var stream = new MemoryStream(bytes);
+        await using var reader = new OcfReader(stream, leaveOpen: true, maxBlockSize: 1024);
+        await Should.ThrowAsync<Exception>(async () => await reader.InitializeAsync(default)); // NOTE(review): any exception type passes; narrow once the thrown type is confirmed
+    }
+
+    [Fact]
+    public async Task InitializeRejectsUnknownCodec()
+    {
+        const string Schema = """{"type":"record","name":"r","fields":[{"name":"x","type":"long","field-id":1}]}""";
+        // Rather than hand-assembling a header, construct the encoder with codec "null" and pass it an
+        // extra metadata entry that sets avro.codec to "snappy".
+        using var enc = new MiniAvroEncoder(Schema, "null", new Dictionary<string, byte[]>
+        {
+            // The encoder writes avro.codec first; we add another avro.codec entry which overrides it.
+            ["avro.codec"] = Encoding.UTF8.GetBytes("snappy"),
+        });
+
+        // No records — header-only file.
+        using var stream = new MemoryStream(enc.ToArray());
+        await using var reader = new OcfReader(stream, leaveOpen: true, maxBlockSize: 1024);
+        await Should.ThrowAsync<Exception>(async () => await reader.InitializeAsync(default)); // NOTE(review): any exception type passes; narrow once confirmed
+    }
+
+    private static void WriteString(List<byte> output, string value)
+    {
+        var utf8 = Encoding.UTF8.GetBytes(value);
+        WriteLong(output, utf8.Length); // length prefix counts encoded bytes, not chars
+        output.AddRange(utf8);
+    }
+
+    private static void WriteLong(List<byte> output, long value)
+    {
+        var zigzag = (ulong)((value << 1) ^ (value >> 63)); // zig-zag: sign moves into bit 0
+        while (zigzag >= 0x80)
+        {
+            output.Add((byte)(0x80 | (zigzag & 0x7F))); // low 7 bits plus the continuation flag
+            zigzag >>= 7;
+        }
+
+        output.Add((byte)zigzag); // final group, continuation flag clear
+    }
+}
diff --git a/tests/IcebergSharp.Tests/Avro/Phase2SmokeTests.cs b/tests/IcebergSharp.Tests/Avro/Phase2SmokeTests.cs
new file mode 100644
index 0000000..43df533
--- /dev/null
+++ b/tests/IcebergSharp.Tests/Avro/Phase2SmokeTests.cs
@@ -0,0 +1,149 @@
+using IcebergSharp.Avro;
+using IcebergSharp.Json;
+using IcebergSharp.Tests.Avro.Helpers;
+using Shouldly;
+using Xunit;
+
+namespace IcebergSharp.Tests.Avro;
+
+/// <summary>
+/// End-to-end smoke test that wires Phase 1 (TableMetadata JSON parsing) to
+/// Phase 2 (Avro manifest reading). Demonstrates the integration Phase 3 will
+/// own via FileIO: given a snapshot, follow manifest_list → manifest →
+/// data-file paths and collect every file the snapshot references.
+/// </summary>
+public sealed class Phase2SmokeTests
+{
+    private static readonly string[] _expectedDataFilePaths =
+    [
+        "s3://lake/d/a1.parquet",
+        "s3://lake/d/a2.parquet",
+        "s3://lake/d/b1.parquet",
+        "s3://lake/d/b2.parquet",
+    ];
+
+    [Fact]
+    public async Task SnapshotToDataFilePathsRoundTrip()
+    {
+        // Lay out a synthetic table on a temp directory:
+        //   table/metadata.json
+        //   table/snap-1.avro (manifest list)
+        //   table/manifest-a.avro
+        //   table/manifest-b.avro
+        DirectoryInfo dir = Directory.CreateTempSubdirectory("icebergsharp-phase2-smoke-"); // removed again in the finally block
+        try
+        {
+            var manifestAPath = Path.Combine(dir.FullName, "manifest-a.avro");
+            var manifestBPath = Path.Combine(dir.FullName, "manifest-b.avro");
+            var snapPath = Path.Combine(dir.FullName, "snap-1.avro");
+            var metaPath = Path.Combine(dir.FullName, "metadata.json");
+
+            // ---- write two manifests (each has two data file entries) ----
+            var manifestA = ManifestEncoder.EncodeV2(
+            [
+                new ManifestEncoder.V2Entry
+                {
+                    Status = 1, SnapshotId = 1, SequenceNumber = 1, FileSequenceNumber = 1,
+                    Content = 0, FilePath = "s3://lake/d/a1.parquet", RecordCount = 100, FileSizeInBytes = 1000,
+                },
+                new ManifestEncoder.V2Entry
+                {
+                    Status = 1, SnapshotId = 1, SequenceNumber = 1, FileSequenceNumber = 1,
+                    Content = 0, FilePath = "s3://lake/d/a2.parquet", RecordCount = 200, FileSizeInBytes = 2000,
+                },
+            ]);
+            await File.WriteAllBytesAsync(manifestAPath, manifestA);
+
+            var manifestB = ManifestEncoder.EncodeV2(
+            [
+                new ManifestEncoder.V2Entry
+                {
+                    Status = 1, SnapshotId = 1, SequenceNumber = 1, FileSequenceNumber = 1,
+                    Content = 0, FilePath = "s3://lake/d/b1.parquet", RecordCount = 50, FileSizeInBytes = 500,
+                },
+                new ManifestEncoder.V2Entry
+                {
+                    Status = 1, SnapshotId = 1, SequenceNumber = 1, FileSequenceNumber = 1,
+                    Content = 0, FilePath = "s3://lake/d/b2.parquet", RecordCount = 75, FileSizeInBytes = 750,
+                },
+            ]);
+            await File.WriteAllBytesAsync(manifestBPath, manifestB);
+
+            // ---- write the manifest list pointing at both manifests ----
+            var snap = ManifestListEncoder.EncodeV2(
+            [
+                new ManifestListEncoder.V2Entry
+                {
+                    ManifestPath = manifestAPath, ManifestLength = manifestA.Length, // local path: opened with File.OpenRead in the read loop
+                    PartitionSpecId = 0, Content = 0,
+                    SequenceNumber = 1, MinSequenceNumber = 1, AddedSnapshotId = 1,
+                    AddedFilesCount = 2, ExistingFilesCount = 0, DeletedFilesCount = 0,
+                    AddedRowsCount = 300, ExistingRowsCount = 0, DeletedRowsCount = 0, // 100 + 200 records in manifest A
+                },
+                new ManifestListEncoder.V2Entry
+                {
+                    ManifestPath = manifestBPath, ManifestLength = manifestB.Length,
+                    PartitionSpecId = 0, Content = 0,
+                    SequenceNumber = 1, MinSequenceNumber = 1, AddedSnapshotId = 1,
+                    AddedFilesCount = 2, ExistingFilesCount = 0, DeletedFilesCount = 0,
+                    AddedRowsCount = 125, ExistingRowsCount = 0, DeletedRowsCount = 0, // 50 + 75 records in manifest B
+                },
+            ]);
+            await File.WriteAllBytesAsync(snapPath, snap);
+
+            // ---- write a TableMetadata pointing at the snapshot file (backslashes in paths are replaced with '/', presumably so they need no JSON escaping) ----
+            var metaJson = $$"""
+            {
+              "format-version": 2,
+              "table-uuid": "11111111-2222-3333-4444-555555555555",
+              "location": "{{dir.FullName.Replace("\\", "/")}}",
+              "last-sequence-number": 1,
+              "last-updated-ms": 1700000000000,
+              "last-column-id": 1,
+              "current-schema-id": 0,
+              "schemas": [{ "type": "struct", "schema-id": 0, "fields": [{ "id": 1, "name": "x", "required": false, "type": "long" }] }],
+              "default-spec-id": 0,
+              "partition-specs": [{ "spec-id": 0, "fields": [] }],
+              "last-partition-id": 999,
+              "default-sort-order-id": 0,
+              "sort-orders": [{ "order-id": 0, "fields": [] }],
+              "properties": {},
+              "current-snapshot-id": 1,
+              "snapshots": [{
+                "snapshot-id": 1,
+                "sequence-number": 1,
+                "timestamp-ms": 1700000000000,
+                "manifest-list": "{{snapPath.Replace("\\", "/")}}",
+                "summary": { "operation": "append" },
+                "schema-id": 0
+              }]
+            }
+            """;
+            await File.WriteAllTextAsync(metaPath, metaJson);
+
+            // ---- now do what Phase 3 would do: load metadata, walk the tree ----
+            TableMetadata md = TableMetadataJson.Parse(await File.ReadAllTextAsync(metaPath));
+            Snapshot current = md.CurrentSnapshot.ShouldNotBeNull();
+
+            var dataFilePaths = new List<string>();
+            await using (FileStream manifestListStream = File.OpenRead(current.ManifestList))
+            {
+                await foreach (ManifestFile mf in ManifestListReader.ReadAsync(manifestListStream))
+                {
+                    await using FileStream manifestStream = File.OpenRead(mf.ManifestPath); // one manifest file per manifest-list entry
+                    await foreach (ManifestEntry entry in ManifestReader.ReadAsync(manifestStream))
+                    {
+                        dataFilePaths.Add(entry.DataFile.FilePath);
+                    }
+                }
+            }
+
+            dataFilePaths.Count.ShouldBe(4); // quick cardinality check before the ordered comparison
+            dataFilePaths.ShouldBe(_expectedDataFilePaths, ignoreOrder: false); // manifest-list order, then entry order within each manifest
+        }
+        finally
+        {
+            dir.Delete(recursive: true); // runs whether the assertions pass or throw
+        }
+    }
+}