// src/storage/blobfs/blob_loader.cc - fuchsia - Git at Google

 // Copyright 2020 The Fuchsia Authors. All rights reserved.
 // Use of this source code is governed by a BSD-style license that can be
 // found in the LICENSE file.

 #include "src/storage/blobfs/blob_loader.h"

 #include <lib/fit/defer.h>
 #include <lib/fzl/owned-vmo-mapper.h>
 #include <lib/syslog/cpp/macros.h>
 #include <lib/zx/status.h>
 #include <zircon/assert.h>
 #include <zircon/errors.h>
 #include <zircon/status.h>
 #include <zircon/syscalls.h>

 #include <algorithm>
 #include <memory>
 #include <vector>

 #include <fbl/string_buffer.h>
 #include <storage/buffer/owned_vmoid.h>

 #include "src/lib/digest/digest.h"
 #include "src/lib/storage/vfs/cpp/trace.h"
 #include "src/lib/storage/vfs/cpp/transaction/buffered_operations_builder.h"
 #include "src/storage/blobfs/blob_layout.h"
 #include "src/storage/blobfs/blob_verifier.h"
 #include "src/storage/blobfs/common.h"
 #include "src/storage/blobfs/compression/chunked.h"
 #include "src/storage/blobfs/compression/decompressor.h"
 #include "src/storage/blobfs/compression/seekable_decompressor.h"
 #include "src/storage/blobfs/compression_settings.h"
 #include "src/storage/blobfs/format.h"
 #include "src/storage/blobfs/iterator/block_iterator.h"
 #include "storage/operation/operation.h"

 namespace blobfs {

 namespace {

 // Byte budget used by BlobLoader::InitForDecompression when reading the start of a compressed
 // blob's data to find the chunked-compression seek table: four blobfs blocks. The read is capped
 // at the blob's actual data block count, so fewer bytes may be read for small blobs.
 // TODO(jfsulliv): Rationalize this with the size limits for chunk-compression headers.
 constexpr size_t kChunkedHeaderSize = 4 * kBlobfsBlockSize;

 }  // namespace

 BlobLoader::BlobLoader(TransactionManager* txn_manager, BlockIteratorProvider* block_iter_provider,
                        NodeFinder* node_finder, std::shared_ptr<BlobfsMetrics> metrics,
                        fzl::OwnedVmoMapper read_mapper, zx::vmo sandbox_vmo,
                        std::unique_ptr<ExternalDecompressorClient> decompressor_client)
     : txn_manager_(txn_manager),
       block_iter_provider_(block_iter_provider),
       node_finder_(node_finder),
       metrics_(std::move(metrics)),
       read_mapper_(std::move(read_mapper)),
       sandbox_vmo_(std::move(sandbox_vmo)),
       decompressor_client_(std::move(decompressor_client)) {}

 // Builds a BlobLoader.
 //
 // Always creates and maps the "blobfs-loader" transfer buffer. When |sandbox_decompression| is
 // set, additionally creates the "blobfs-sandbox" VMO and an ExternalDecompressorClient that is
 // handed both VMOs. Returns the first failing status, or the constructed loader.
 zx::status<BlobLoader> BlobLoader::Create(TransactionManager* txn_manager,
                                           BlockIteratorProvider* block_iter_provider,
                                           NodeFinder* node_finder,
                                           std::shared_ptr<BlobfsMetrics> metrics,
                                           bool sandbox_decompression) {
   fzl::OwnedVmoMapper transfer_mapper;
   if (zx_status_t map_status =
           transfer_mapper.CreateAndMap(pager::kTransferBufferSize, "blobfs-loader");
       map_status != ZX_OK) {
     FX_LOGS(ERROR) << "blobfs: Failed to map read vmo: " << zx_status_get_string(map_status);
     return zx::error(map_status);
   }

   // Both of these stay in their default (invalid / null) state unless sandboxing is requested.
   zx::vmo sandbox;
   std::unique_ptr<ExternalDecompressorClient> client;

   if (sandbox_decompression) {
     if (zx_status_t create_status =
             zx::vmo::create(pager::kDecompressionBufferSize, 0, &sandbox);
         create_status != ZX_OK) {
       return zx::error(create_status);
     }

     // Naming the VMO is best-effort; the result of set_property is not checked.
     const char* vmo_name = "blobfs-sandbox";
     sandbox.set_property(ZX_PROP_NAME, vmo_name, strlen(vmo_name));

     zx::status<std::unique_ptr<ExternalDecompressorClient>> client_or =
         ExternalDecompressorClient::Create(sandbox, transfer_mapper.vmo());
     if (client_or.is_error()) {
       return client_or.take_error();
     }
     client = std::move(client_or.value());
   }

   return zx::ok(BlobLoader(txn_manager, block_iter_provider, node_finder, std::move(metrics),
                            std::move(transfer_mapper), std::move(sandbox), std::move(client)));
 }

 // Gathers everything needed to page in the blob at |node_index|: its layout, the pager info
 // (identifier, data start and length), a Merkle verifier and, unless the blob is uncompressed, a
 // seekable decompressor.
 //
 // |corruption_notifier| is forwarded to the verifier. Returns the populated LoadResult or the
 // first error from node lookup, layout creation, verifier setup or decompressor setup. Aborts if
 // the node is not an allocated inode or if its blob size is zero.
 zx::status<BlobLoader::LoadResult> BlobLoader::LoadBlob(
     uint32_t node_index, const BlobCorruptionNotifier* corruption_notifier) {
   ZX_DEBUG_ASSERT(read_mapper_.vmo().is_valid());

   auto inode = node_finder_->GetNode(node_index);
   if (inode.is_error()) {
     return inode.take_error();
   }

   // Callers must only ask for nonempty, allocated inodes. A violation means either a programming
   // mistake (expected only during development) or on-disk inode corruption (in which case more
   // corruption may exist and the filesystem should go down before further damage is done), so an
   // assertion is preferred over an error return.
   ZX_ASSERT_MSG(inode->header.IsInode() && inode->header.IsAllocated(),
                 "LoadBlob failed as inode->header.IsInode():%u inode->header.IsAllocated():%u",
                 inode->header.IsInode(), inode->header.IsAllocated());
   ZX_ASSERT_MSG(inode->blob_size > 0, "Inode blob size should be greater than zero: %lu",
                 inode->blob_size);
   TRACE_DURATION("blobfs", "BlobLoader::LoadBlob", "blob_size", inode->blob_size);

   const Inode& raw_inode = *inode.value();
   const uint32_t block_size = GetBlockSize();

   // Work out where the data and Merkle tree live for this blob.
   auto layout_or = BlobLayout::CreateFromInode(GetBlobLayoutFormat(txn_manager_->Info()),
                                                raw_inode, block_size);
   if (layout_or.is_error()) {
     FX_LOGS(ERROR) << "Failed to create blob layout: "
                    << zx_status_get_string(layout_or.error_value());
     return layout_or.take_error();
   }

   LoadResult result;
   result.layout = std::move(layout_or.value());
   result.pager_info.identifier = node_index;
   result.pager_info.data_start_bytes =
       static_cast<uint64_t>(result.layout->DataBlockOffset()) * block_size;
   result.pager_info.data_length_bytes = inode->blob_size;

   zx_status_t status =
       InitMerkleVerifier(node_index, raw_inode, *result.layout, corruption_notifier,
                          &result.merkle, &result.pager_info.verifier);
   if (status != ZX_OK) {
     return zx::error(status);
   }

   status = InitForDecompression(node_index, raw_inode, *result.layout,
                                 *result.pager_info.verifier, &result.pager_info.decompressor);
   if (status != ZX_OK) {
     return zx::error(status);
   }

   return zx::ok(std::move(result));
 }

 // Creates the BlobVerifier for |inode|.
 //
 // If the layout reports an empty Merkle tree, the verifier is created without a tree and
 // |vmo_out| is left untouched. Otherwise a VMO sized for the block-aligned tree is created and
 // mapped, the tree is read from disk into it, and on success the mapping is handed back through
 // |vmo_out| and the verifier through |verifier_out|. On failure in the tree path neither output
 // is modified by this function.
 zx_status_t BlobLoader::InitMerkleVerifier(uint32_t node_index, const Inode& inode,
                                            const BlobLayout& blob_layout,
                                            const BlobCorruptionNotifier* notifier,
                                            fzl::OwnedVmoMapper* vmo_out,
                                            std::unique_ptr<BlobVerifier>* verifier_out) {
   if (blob_layout.MerkleTreeSize() == 0) {
     return BlobVerifier::CreateWithoutTree(digest::Digest(inode.merkle_root_hash), metrics_,
                                            inode.blob_size, notifier, verifier_out);
   }

   // The VMO is named after the blob's Merkle root.
   fbl::StringBuffer<ZX_MAX_NAME_LEN> vmo_name;
   FormatBlobMerkleVmoName(digest::Digest(inode.merkle_root_hash), &vmo_name);

   fzl::OwnedVmoMapper tree_mapper;
   if (zx_status_t status =
           tree_mapper.CreateAndMap(blob_layout.MerkleTreeBlockAlignedSize(), vmo_name.c_str());
       status != ZX_OK) {
     FX_LOGS(ERROR) << "Failed to initialize merkle vmo; error: " << zx_status_get_string(status);
     return status;
   }

   if (zx_status_t status = LoadMerkle(node_index, blob_layout, tree_mapper); status != ZX_OK) {
     return status;
   }

   // In the kCompactMerkleTreeAtEnd format the tree may begin part-way into the first block of
   // the mapping, so skip the leading in-block offset.
   uint8_t* const mapping_base = static_cast<uint8_t*>(tree_mapper.start());
   void* const tree_start = mapping_base + blob_layout.MerkleTreeOffsetWithinBlockOffset();

   std::unique_ptr<BlobVerifier> new_verifier;
   if (zx_status_t status = BlobVerifier::Create(
           digest::Digest(inode.merkle_root_hash), metrics_, tree_start,
           blob_layout.MerkleTreeSize(), blob_layout.Format(), inode.blob_size, notifier,
           &new_verifier);
       status != ZX_OK) {
     return status;
   }

   *vmo_out = std::move(tree_mapper);
   *verifier_out = std::move(new_verifier);
   return ZX_OK;
 }

 // Creates a seekable decompressor for |inode| when the blob is compressed.
 //
 // Returns ZX_OK without touching |decompressor_out| for uncompressed blobs. For compressed blobs
 // the leading data blocks (at most kChunkedHeaderSize bytes) are read into the shared read
 // buffer so the seek table can be parsed; the buffer range is decommitted again when this
 // function returns. |verifier| is currently unused.
 zx_status_t BlobLoader::InitForDecompression(
     uint32_t node_index, const Inode& inode, const BlobLayout& blob_layout,
     const BlobVerifier& verifier, std::unique_ptr<SeekableDecompressor>* decompressor_out) {
   zx::status<CompressionAlgorithm> algorithm_or = AlgorithmForInode(inode);
   if (algorithm_or.is_error()) {
     FX_LOGS(ERROR) << "Cannot decode blob due to invalid compression flags.";
     return algorithm_or.status_value();
   }
   if (algorithm_or.value() == CompressionAlgorithm::kUncompressed) {
     return ZX_OK;
   }

   TRACE_DURATION("blobfs", "BlobLoader::InitDecompressor");

   // The seek table sits in the first few data blocks. Its exact length is unknown up front, so
   // read up to kChunkedHeaderSize bytes (the header should never be larger than that), capped at
   // the number of data blocks the blob actually has.
   ZX_DEBUG_ASSERT(kChunkedHeaderSize % GetBlockSize() == 0);
   const uint32_t block_size = GetBlockSize();
   const uint32_t total_data_blocks = blob_layout.DataBlockCount();
   const uint32_t max_header_blocks = static_cast<uint32_t>(kChunkedHeaderSize) / block_size;
   const uint32_t blocks_to_read = std::min(max_header_blocks, total_data_blocks);
   if (blocks_to_read == 0) {
     FX_LOGS(ERROR) << "No data blocks; corrupted inode?";
     return ZX_ERR_BAD_STATE;
   }

   // Release the pages of the read buffer used below on every exit path from here on.
   const uint32_t header_bytes = blocks_to_read * block_size;
   auto decommit_header = fit::defer([this, header_bytes]() {
     read_mapper_.vmo().op_range(ZX_VMO_OP_DECOMMIT, 0, header_bytes, nullptr, 0);
   });

   auto load_result =
       LoadBlocks(node_index, blob_layout.DataBlockOffset(), blocks_to_read, read_mapper_.vmo());
   if (load_result.is_error()) {
     FX_LOGS(ERROR) << "Failed to load compression header: " << load_result.status_string();
     return load_result.error_value();
   }

   // Having read every data block, the tail of the buffer may hold the start of the Merkle tree;
   // blank it out.
   if (blocks_to_read == total_data_blocks) {
     ZeroMerkleTreeWithinDataVmo(read_mapper_.start(), read_mapper_.size(), blob_layout);
   }

   const auto compressed_size_bound = blob_layout.DataSizeUpperBound();
   const auto seek_table_bound =
       std::min(uint64_t{blocks_to_read} * block_size, compressed_size_bound);
   const zx_status_t status = SeekableChunkedDecompressor::CreateDecompressor(
       read_mapper_.start(), /*max_seek_table_size=*/seek_table_bound,
       /*max_compressed_size=*/compressed_size_bound, decompressor_out);
   if (status != ZX_OK) {
     FX_LOGS(ERROR) << "Failed to init decompressor: " << zx_status_get_string(status);
     return status;
   }

   return ZX_OK;
 }

 // Reads the blocks holding the Merkle tree of node |node_index| into |mapper|'s VMO and records
 // the number of bytes read and the elapsed ticks in the metrics. Returns the LoadBlocks error
 // on failure.
 zx_status_t BlobLoader::LoadMerkle(uint32_t node_index, const BlobLayout& blob_layout,
                                    const fzl::OwnedVmoMapper& mapper) const {
   fs::Ticker ticker(metrics_->Collecting());

   zx::status<uint64_t> load_result =
       LoadBlocks(node_index, blob_layout.MerkleTreeBlockOffset(),
                  blob_layout.MerkleTreeBlockCount(), mapper.vmo());
   if (load_result.is_ok()) {
     metrics_->IncrementMerkleDiskRead(load_result.value(), ticker.End());
     return ZX_OK;
   }

   FX_LOGS(ERROR) << "Failed to load Merkle tree: " << load_result.status_string();
   return load_result.error_value();
 }

 // Reads |block_count| blocks of node |node_index|, starting at the node-relative block
 // |block_offset|, from the block device into |vmo|.
 //
 // Returns the number of bytes requested (|block_count| times the block size) on success, or the
 // first error encountered while attaching the VMO, seeking, building or running the reads.
 zx::status<uint64_t> BlobLoader::LoadBlocks(uint32_t node_index, uint32_t block_offset,
                                             uint32_t block_count, const zx::vmo& vmo) const {
   TRACE_DURATION("blobfs", "BlobLoader::LoadBlocks", "block_count", block_count);

   // Register |vmo| with the block device so it can be the target of the reads below.
   storage::OwnedVmoid vmoid(txn_manager_);
   if (zx_status_t status = vmoid.AttachVmo(vmo); status != ZX_OK) {
     FX_LOGS(ERROR) << "Failed to attach VMO to block device; error: "
                    << zx_status_get_string(status);
     return zx::error(status);
   }

   const uint64_t data_start_block = DataStartBlock(txn_manager_->Info());

   auto iter_or = block_iter_provider_->BlockIteratorByNodeIndex(node_index);
   if (iter_or.is_error()) {
     return iter_or.take_error();
   }
   auto& iter = iter_or.value();
   if (zx_status_t status = IterateToBlock(&iter, block_offset); status != ZX_OK) {
     FX_LOGS(ERROR) << "Failed to seek to starting block: " << zx_status_get_string(status);
     return zx::error(status);
   }

   // Turn every contiguous run reported by StreamBlocks into one read request. The reported VMO
   // offset is rebased by |block_offset| (presumably so the first requested block lands at the
   // start of |vmo|), and the device offset is made absolute by adding the data start block.
   std::vector<storage::BufferedOperation> read_ops;
   auto queue_read = [&](uint64_t vmo_offset, uint64_t dev_offset, uint32_t length) {
     read_ops.push_back({.vmoid = vmoid.get(),
                         .op = {
                             .type = storage::OperationType::kRead,
                             .vmo_offset = vmo_offset - block_offset,
                             .dev_offset = data_start_block + dev_offset,
                             .length = length,
                         }});
     return ZX_OK;
   };
   if (zx_status_t status = StreamBlocks(&iter, block_count, queue_read); status != ZX_OK) {
     FX_LOGS(ERROR) << "Failed to stream blocks: " << zx_status_get_string(status);
     return zx::error(status);
   }

   if (zx_status_t status = txn_manager_->RunRequests(read_ops); status != ZX_OK) {
     FX_LOGS(ERROR) << "Failed to flush read transaction: " << zx_status_get_string(status);
     return zx::error(status);
   }

   return zx::ok(uint64_t{block_count} * GetBlockSize());
 }

 // When the layout says the Merkle tree and the data share a block, zeroes the part of that
 // block (the tail of the block-aligned data region in |mapped_data|) that lies at or after the
 // tree's in-block offset. Does nothing when no block is shared.
 void BlobLoader::ZeroMerkleTreeWithinDataVmo(void* mapped_data, size_t mapped_data_size,
                                              const BlobLayout& blob_layout) const {
   if (blob_layout.HasMerkleTreeAndDataSharedBlock()) {
     const uint64_t data_block_aligned_size = blob_layout.DataBlockAlignedSize();
     ZX_DEBUG_ASSERT(mapped_data_size >= data_block_aligned_size);

     const uint64_t tree_bytes =
         uint64_t{GetBlockSize()} - blob_layout.MerkleTreeOffsetWithinBlockOffset();
     // A shared block implies the aligned data size is at least one block, so this cannot wrap.
     const uint64_t zero_begin = data_block_aligned_size - tree_bytes;

     uint8_t* const bytes = static_cast<uint8_t*>(mapped_data);
     memset(bytes + zero_begin, 0, tree_bytes);
   }
 }

 // Returns the block size recorded in the transaction manager's filesystem info.
 uint32_t BlobLoader::GetBlockSize() const {
   const auto& info = txn_manager_->Info();
   return info.block_size;
 }

 }  // namespace blobfs
	// Copyright 2020 The Fuchsia Authors. All rights reserved.
	// Use of this source code is governed by a BSD-style license that can be
	// found in the LICENSE file.

	#include "src/storage/blobfs/blob_loader.h"

	#include <lib/fit/defer.h>
	#include <lib/fzl/owned-vmo-mapper.h>
	#include <lib/syslog/cpp/macros.h>
	#include <lib/zx/status.h>
	#include <zircon/assert.h>
	#include <zircon/errors.h>
	#include <zircon/status.h>
	#include <zircon/syscalls.h>

	#include <algorithm>
	#include <memory>
	#include <vector>

	#include <fbl/string_buffer.h>
	#include <storage/buffer/owned_vmoid.h>

	#include "src/lib/digest/digest.h"
	#include "src/lib/storage/vfs/cpp/trace.h"
	#include "src/lib/storage/vfs/cpp/transaction/buffered_operations_builder.h"
	#include "src/storage/blobfs/blob_layout.h"
	#include "src/storage/blobfs/blob_verifier.h"
	#include "src/storage/blobfs/common.h"
	#include "src/storage/blobfs/compression/chunked.h"
	#include "src/storage/blobfs/compression/decompressor.h"
	#include "src/storage/blobfs/compression/seekable_decompressor.h"
	#include "src/storage/blobfs/compression_settings.h"
	#include "src/storage/blobfs/format.h"
	#include "src/storage/blobfs/iterator/block_iterator.h"
	#include "storage/operation/operation.h"

	namespace blobfs {

	namespace {

	// Byte budget used by BlobLoader::InitForDecompression when reading the start of a compressed
	// blob's data to find the chunked-compression seek table: four blobfs blocks. The read is capped
	// at the blob's actual data block count, so fewer bytes may be read for small blobs.
	// TODO(jfsulliv): Rationalize this with the size limits for chunk-compression headers.
	constexpr size_t kChunkedHeaderSize = 4 * kBlobfsBlockSize;

	} // namespace

	BlobLoader::BlobLoader(TransactionManager* txn_manager, BlockIteratorProvider* block_iter_provider,
	NodeFinder* node_finder, std::shared_ptr<BlobfsMetrics> metrics,
	fzl::OwnedVmoMapper read_mapper, zx::vmo sandbox_vmo,
	std::unique_ptr<ExternalDecompressorClient> decompressor_client)
	: txn_manager_(txn_manager),
	block_iter_provider_(block_iter_provider),
	node_finder_(node_finder),
	metrics_(std::move(metrics)),
	read_mapper_(std::move(read_mapper)),
	sandbox_vmo_(std::move(sandbox_vmo)),
	decompressor_client_(std::move(decompressor_client)) {}

	// Builds a BlobLoader.
	//
	// Always creates and maps the "blobfs-loader" transfer buffer. When |sandbox_decompression| is
	// set, additionally creates the "blobfs-sandbox" VMO and an ExternalDecompressorClient that is
	// handed both VMOs. Returns the first failing status, or the constructed loader.
	zx::status<BlobLoader> BlobLoader::Create(TransactionManager* txn_manager,
	                                          BlockIteratorProvider* block_iter_provider,
	                                          NodeFinder* node_finder,
	                                          std::shared_ptr<BlobfsMetrics> metrics,
	                                          bool sandbox_decompression) {
	  fzl::OwnedVmoMapper transfer_mapper;
	  if (zx_status_t map_status =
	          transfer_mapper.CreateAndMap(pager::kTransferBufferSize, "blobfs-loader");
	      map_status != ZX_OK) {
	    FX_LOGS(ERROR) << "blobfs: Failed to map read vmo: " << zx_status_get_string(map_status);
	    return zx::error(map_status);
	  }

	  // Both of these stay in their default (invalid / null) state unless sandboxing is requested.
	  zx::vmo sandbox;
	  std::unique_ptr<ExternalDecompressorClient> client;

	  if (sandbox_decompression) {
	    if (zx_status_t create_status =
	            zx::vmo::create(pager::kDecompressionBufferSize, 0, &sandbox);
	        create_status != ZX_OK) {
	      return zx::error(create_status);
	    }

	    // Naming the VMO is best-effort; the result of set_property is not checked.
	    const char* vmo_name = "blobfs-sandbox";
	    sandbox.set_property(ZX_PROP_NAME, vmo_name, strlen(vmo_name));

	    zx::status<std::unique_ptr<ExternalDecompressorClient>> client_or =
	        ExternalDecompressorClient::Create(sandbox, transfer_mapper.vmo());
	    if (client_or.is_error()) {
	      return client_or.take_error();
	    }
	    client = std::move(client_or.value());
	  }

	  return zx::ok(BlobLoader(txn_manager, block_iter_provider, node_finder, std::move(metrics),
	                           std::move(transfer_mapper), std::move(sandbox), std::move(client)));
	}

	// Gathers everything needed to page in the blob at |node_index|: its layout, the pager info
	// (identifier, data start and length), a Merkle verifier and, unless the blob is uncompressed, a
	// seekable decompressor.
	//
	// |corruption_notifier| is forwarded to the verifier. Returns the populated LoadResult or the
	// first error from node lookup, layout creation, verifier setup or decompressor setup. Aborts if
	// the node is not an allocated inode or if its blob size is zero.
	zx::status<BlobLoader::LoadResult> BlobLoader::LoadBlob(
	    uint32_t node_index, const BlobCorruptionNotifier* corruption_notifier) {
	  LoadResult result;

	  ZX_DEBUG_ASSERT(read_mapper_.vmo().is_valid());
	  auto inode = node_finder_->GetNode(node_index);
	  if (inode.is_error()) {
	    return inode.take_error();
	  }

	  // LoadBlob should only be called for nonempty Inodes. If this doesn't hold, one of two things
	  // happened:
	  //   - Programmer error
	  //   - Corruption of a blob's Inode
	  // In either case it is preferable to ASSERT than to return an error here, since the first case
	  // should happen only during development and in the second case there may be more corruption and
	  // we want to unmount the filesystem before any more damage is done.
	  ZX_ASSERT_MSG(inode->header.IsInode() && inode->header.IsAllocated(),
	                "LoadBlob failed as inode->header.IsInode():%u inode->header.IsAllocated():%u",
	                inode->header.IsInode(), inode->header.IsAllocated());
	  ZX_ASSERT_MSG(inode->blob_size > 0, "Inode blob size should be greater than zero: %lu",
	                inode->blob_size);
	  TRACE_DURATION("blobfs", "BlobLoader::LoadBlob", "blob_size", inode->blob_size);

	  // Create and save the layout.
	  auto blob_layout_or = BlobLayout::CreateFromInode(GetBlobLayoutFormat(txn_manager_->Info()),
	                                                    *inode.value(), GetBlockSize());
	  if (blob_layout_or.is_error()) {
	    FX_LOGS(ERROR) << "Failed to create blob layout: "
	                   << zx_status_get_string(blob_layout_or.error_value());
	    return blob_layout_or.take_error();
	  }
	  result.layout = std::move(blob_layout_or.value());
	  result.pager_info.identifier = node_index;
	  result.pager_info.data_start_bytes =
	      static_cast<uint64_t>(result.layout->DataBlockOffset()) * GetBlockSize();
	  result.pager_info.data_length_bytes = inode->blob_size;

	  // Both helpers take the inode and the layout by const reference, so the pointer-like holders
	  // must be dereferenced at the call sites.
	  if (zx_status_t status =
	          InitMerkleVerifier(node_index, *inode.value(), *result.layout, corruption_notifier,
	                             &result.merkle, &result.pager_info.verifier);
	      status != ZX_OK) {
	    return zx::error(status);
	  }

	  if (zx_status_t status =
	          InitForDecompression(node_index, *inode.value(), *result.layout,
	                               *result.pager_info.verifier, &result.pager_info.decompressor);
	      status != ZX_OK) {
	    return zx::error(status);
	  }

	  return zx::ok(std::move(result));
	}

	// Creates the BlobVerifier for |inode|.
	//
	// If the layout reports an empty Merkle tree, the verifier is created without a tree and
	// |vmo_out| is left untouched. Otherwise a VMO sized for the block-aligned tree is created and
	// mapped, the tree is read from disk into it, and on success the mapping is handed back through
	// |vmo_out| and the verifier through |verifier_out|. On failure in the tree path neither output
	// is modified by this function.
	zx_status_t BlobLoader::InitMerkleVerifier(uint32_t node_index, const Inode& inode,
	                                           const BlobLayout& blob_layout,
	                                           const BlobCorruptionNotifier* notifier,
	                                           fzl::OwnedVmoMapper* vmo_out,
	                                           std::unique_ptr<BlobVerifier>* verifier_out) {
	  if (blob_layout.MerkleTreeSize() == 0) {
	    return BlobVerifier::CreateWithoutTree(digest::Digest(inode.merkle_root_hash), metrics_,
	                                           inode.blob_size, notifier, verifier_out);
	  }

	  // The VMO is named after the blob's Merkle root.
	  fbl::StringBuffer<ZX_MAX_NAME_LEN> vmo_name;
	  FormatBlobMerkleVmoName(digest::Digest(inode.merkle_root_hash), &vmo_name);

	  fzl::OwnedVmoMapper tree_mapper;
	  if (zx_status_t status =
	          tree_mapper.CreateAndMap(blob_layout.MerkleTreeBlockAlignedSize(), vmo_name.c_str());
	      status != ZX_OK) {
	    FX_LOGS(ERROR) << "Failed to initialize merkle vmo; error: " << zx_status_get_string(status);
	    return status;
	  }

	  if (zx_status_t status = LoadMerkle(node_index, blob_layout, tree_mapper); status != ZX_OK) {
	    return status;
	  }

	  // In the kCompactMerkleTreeAtEnd format the tree may begin part-way into the first block of
	  // the mapping, so skip the leading in-block offset.
	  uint8_t* const mapping_base = static_cast<uint8_t*>(tree_mapper.start());
	  void* const tree_start = mapping_base + blob_layout.MerkleTreeOffsetWithinBlockOffset();

	  std::unique_ptr<BlobVerifier> new_verifier;
	  if (zx_status_t status = BlobVerifier::Create(
	          digest::Digest(inode.merkle_root_hash), metrics_, tree_start,
	          blob_layout.MerkleTreeSize(), blob_layout.Format(), inode.blob_size, notifier,
	          &new_verifier);
	      status != ZX_OK) {
	    return status;
	  }

	  *vmo_out = std::move(tree_mapper);
	  *verifier_out = std::move(new_verifier);
	  return ZX_OK;
	}

	// Creates a seekable decompressor for |inode| when the blob is compressed.
	//
	// Returns ZX_OK without touching |decompressor_out| for uncompressed blobs. For compressed blobs
	// the leading data blocks (at most kChunkedHeaderSize bytes) are read into the shared read
	// buffer so the seek table can be parsed; the buffer range is decommitted again when this
	// function returns. |verifier| is currently unused.
	zx_status_t BlobLoader::InitForDecompression(
	    uint32_t node_index, const Inode& inode, const BlobLayout& blob_layout,
	    const BlobVerifier& verifier, std::unique_ptr<SeekableDecompressor>* decompressor_out) {
	  zx::status<CompressionAlgorithm> algorithm_status = AlgorithmForInode(inode);
	  if (algorithm_status.is_error()) {
	    FX_LOGS(ERROR) << "Cannot decode blob due to invalid compression flags.";
	    return algorithm_status.status_value();
	  }

	  if (algorithm_status.value() == CompressionAlgorithm::kUncompressed) {
	    return ZX_OK;
	  }

	  TRACE_DURATION("blobfs", "BlobLoader::InitDecompressor");

	  // The first few blocks of data contain the seek table, which we need to read to initialize the
	  // decompressor. Read these from disk.

	  uint32_t data_block_count = blob_layout.DataBlockCount();
	  // We don't know exactly how long the header is, so we generally overshoot.
	  // (The header should never be bigger than the size of the kChunkedHeaderSize.)
	  ZX_DEBUG_ASSERT(kChunkedHeaderSize % GetBlockSize() == 0);
	  uint32_t header_block_count = static_cast<uint32_t>(kChunkedHeaderSize) / GetBlockSize();
	  uint32_t blocks_to_read = std::min(header_block_count, data_block_count);
	  if (blocks_to_read == 0) {
	    FX_LOGS(ERROR) << "No data blocks; corrupted inode?";
	    return ZX_ERR_BAD_STATE;
	  }

	  // Release the pages of the read buffer used below on every exit path from here on.
	  auto decommit_used = fit::defer([this, length = blocks_to_read * GetBlockSize()]() {
	    read_mapper_.vmo().op_range(ZX_VMO_OP_DECOMMIT, 0, length, nullptr, 0);
	  });
	  auto bytes_read =
	      LoadBlocks(node_index, blob_layout.DataBlockOffset(), blocks_to_read, read_mapper_.vmo());
	  if (bytes_read.is_error()) {
	    FX_LOGS(ERROR) << "Failed to load compression header: " << bytes_read.status_string();
	    return bytes_read.error_value();
	  }

	  // If we read all of the blob's data into the read VMO then the read VMO may contain part of
	  // the Merkle tree that should be removed.
	  if (blocks_to_read == data_block_count) {
	    ZeroMerkleTreeWithinDataVmo(read_mapper_.start(), read_mapper_.size(), blob_layout);
	  }

	  const zx_status_t status = SeekableChunkedDecompressor::CreateDecompressor(
	      read_mapper_.start(), /*max_seek_table_size=*/
	      std::min(uint64_t{blocks_to_read} * GetBlockSize(), blob_layout.DataSizeUpperBound()),
	      /*max_compressed_size=*/blob_layout.DataSizeUpperBound(), decompressor_out);
	  if (status != ZX_OK) {
	    FX_LOGS(ERROR) << "Failed to init decompressor: " << zx_status_get_string(status);
	    return status;
	  }

	  return ZX_OK;
	}

	// Reads the blocks holding the Merkle tree of node |node_index| into |mapper|'s VMO and records
	// the number of bytes read and the elapsed ticks in the metrics. Returns the LoadBlocks error
	// on failure.
	zx_status_t BlobLoader::LoadMerkle(uint32_t node_index, const BlobLayout& blob_layout,
	                                   const fzl::OwnedVmoMapper& mapper) const {
	  fs::Ticker ticker(metrics_->Collecting());

	  zx::status<uint64_t> load_result =
	      LoadBlocks(node_index, blob_layout.MerkleTreeBlockOffset(),
	                 blob_layout.MerkleTreeBlockCount(), mapper.vmo());
	  if (load_result.is_ok()) {
	    metrics_->IncrementMerkleDiskRead(load_result.value(), ticker.End());
	    return ZX_OK;
	  }

	  FX_LOGS(ERROR) << "Failed to load Merkle tree: " << load_result.status_string();
	  return load_result.error_value();
	}

	// Reads |block_count| blocks of node |node_index|, starting at the node-relative block
	// |block_offset|, from the block device into |vmo|.
	//
	// Returns the number of bytes requested (|block_count| times the block size) on success, or the
	// first error encountered while attaching the VMO, seeking, building or running the reads.
	zx::status<uint64_t> BlobLoader::LoadBlocks(uint32_t node_index, uint32_t block_offset,
	                                            uint32_t block_count, const zx::vmo& vmo) const {
	  TRACE_DURATION("blobfs", "BlobLoader::LoadBlocks", "block_count", block_count);

	  // Register |vmo| with the block device so it can be the target of the reads below.
	  storage::OwnedVmoid vmoid(txn_manager_);
	  if (zx_status_t status = vmoid.AttachVmo(vmo); status != ZX_OK) {
	    FX_LOGS(ERROR) << "Failed to attach VMO to block device; error: "
	                   << zx_status_get_string(status);
	    return zx::error(status);
	  }

	  const uint64_t data_start_block = DataStartBlock(txn_manager_->Info());

	  auto iter_or = block_iter_provider_->BlockIteratorByNodeIndex(node_index);
	  if (iter_or.is_error()) {
	    return iter_or.take_error();
	  }
	  auto& iter = iter_or.value();
	  if (zx_status_t status = IterateToBlock(&iter, block_offset); status != ZX_OK) {
	    FX_LOGS(ERROR) << "Failed to seek to starting block: " << zx_status_get_string(status);
	    return zx::error(status);
	  }

	  // Turn every contiguous run reported by StreamBlocks into one read request. The reported VMO
	  // offset is rebased by |block_offset| (presumably so the first requested block lands at the
	  // start of |vmo|), and the device offset is made absolute by adding the data start block.
	  std::vector<storage::BufferedOperation> read_ops;
	  auto queue_read = [&](uint64_t vmo_offset, uint64_t dev_offset, uint32_t length) {
	    read_ops.push_back({.vmoid = vmoid.get(),
	                        .op = {
	                            .type = storage::OperationType::kRead,
	                            .vmo_offset = vmo_offset - block_offset,
	                            .dev_offset = data_start_block + dev_offset,
	                            .length = length,
	                        }});
	    return ZX_OK;
	  };
	  if (zx_status_t status = StreamBlocks(&iter, block_count, queue_read); status != ZX_OK) {
	    FX_LOGS(ERROR) << "Failed to stream blocks: " << zx_status_get_string(status);
	    return zx::error(status);
	  }

	  if (zx_status_t status = txn_manager_->RunRequests(read_ops); status != ZX_OK) {
	    FX_LOGS(ERROR) << "Failed to flush read transaction: " << zx_status_get_string(status);
	    return zx::error(status);
	  }

	  return zx::ok(uint64_t{block_count} * GetBlockSize());
	}

	// When the layout says the Merkle tree and the data share a block, zeroes the part of that
	// block (the tail of the block-aligned data region in |mapped_data|) that lies at or after the
	// tree's in-block offset. Does nothing when no block is shared.
	void BlobLoader::ZeroMerkleTreeWithinDataVmo(void* mapped_data, size_t mapped_data_size,
	                                             const BlobLayout& blob_layout) const {
	  if (blob_layout.HasMerkleTreeAndDataSharedBlock()) {
	    const uint64_t data_block_aligned_size = blob_layout.DataBlockAlignedSize();
	    ZX_DEBUG_ASSERT(mapped_data_size >= data_block_aligned_size);

	    const uint64_t tree_bytes =
	        uint64_t{GetBlockSize()} - blob_layout.MerkleTreeOffsetWithinBlockOffset();
	    // A shared block implies the aligned data size is at least one block, so this cannot wrap.
	    const uint64_t zero_begin = data_block_aligned_size - tree_bytes;

	    uint8_t* const bytes = static_cast<uint8_t*>(mapped_data);
	    memset(bytes + zero_begin, 0, tree_bytes);
	  }
	}

	// Returns the block size recorded in the transaction manager's filesystem info.
	uint32_t BlobLoader::GetBlockSize() const {
	  const auto& info = txn_manager_->Info();
	  return info.block_size;
	}

	} // namespace blobfs