blob: 4dbee034376304090dfef97ef6e133a783c0dbe3 [file] [log] [blame]
// Copyright 2016 The Fuchsia Authors. All rights reserved.
// Use of this source code is governed by a BSD-style license that can be
// found in the LICENSE file.
#include <lib/fdio/watcher.h>
#include <stdlib.h>
#include <string.h>
#include <sys/stat.h>
#include <unistd.h>
#include <memory>
#include <utility>
#include <fbl/auto_call.h>
#include <fs/debug.h>
#include <fs/trace.h>
#include <fs/vfs.h>
#include <fs/vnode.h>
#ifdef __Fuchsia__
#include <lib/zx/event.h>
#include <lib/zx/process.h>
#include <threads.h>
#include <zircon/assert.h>
#include <fbl/auto_lock.h>
#include <fbl/ref_ptr.h>
#include <fs/internal/connection.h>
#include <fs/internal/directory_connection.h>
#include <fs/internal/file_connection.h>
#include <fs/internal/node_connection.h>
#include <fs/remote.h>
namespace fs {
namespace {
// Trims a name before it is handed to internal filesystem functions.
// Trailing '/' characters imply that the name must refer to a directory.
//
// |name|     - candidate name, possibly ending in one or more '/' characters.
// |name_out| - set to the trimmed name on the success path.
// |dir_out|  - set to true when a trailing '/' was observed, false otherwise.
//
// Returns ZX_OK on the success path below.
// NOTE(review): in this copy of the file the loop body, the bodies of the three
// rejection branches, and the pointer arguments to memchr()/set() appear to be
// incomplete -- confirm against the canonical source before relying on them.
zx_status_t TrimName(fbl::StringPiece name, fbl::StringPiece* name_out, bool* dir_out) {
size_t len = name.length();
bool is_dir = false;
// Inspect the tail of the name; a trailing '/' marks it as a directory.
while ((len > 0) && name[len - 1] == '/') {
is_dir = true;
if (len == 0) {
// 'name' should not contain paths consisting of exclusively '/' characters.
} else if (len > NAME_MAX) {
// Name must not exceed NAME_MAX characters.
} else if (memchr(, '/', len) != nullptr) {
// Name must not contain '/' characters after being trimmed.
name_out->set(, len);
*dir_out = is_dir;
return ZX_OK;
// Resolves a single path component |name| relative to |vn|.
//
// "." resolves to |vn| itself; ".." is special-cased before any lookup is
// attempted; every other name is forwarded to Vnode::Lookup(). The resolved
// node is stored in |out|.
// NOTE(review): the body of the ".." branch is not visible in this copy.
zx_status_t LookupNode(fbl::RefPtr<Vnode> vn, fbl::StringPiece name, fbl::RefPtr<Vnode>* out) {
if (name == "..") {
} else if (name == ".") {
// "." refers to the directory itself, so no lookup is needed.
*out = std::move(vn);
return ZX_OK;
return vn->Lookup(out, name);
// Validate open flags as much as they can be validated
// independently of the target node.
//
// Two combinations are singled out below:
//   - |truncate| requested while the write right is absent;
//   - no rights requested at all while |node_reference| is not set.
// Returns ZX_OK when execution reaches the end of the checks.
// NOTE(review): the outcome of each flagged combination is not visible in this
// copy -- presumably an error status; confirm against the canonical source.
zx_status_t PrevalidateOptions(VnodeConnectionOptions options) {
if (!options.rights.write) {
if (options.flags.truncate) {
} else if (!options.rights.any()) {
if (!options.flags.node_reference) {
return ZX_OK;
} // namespace
#ifdef __Fuchsia__
// Reports whether a valid remote channel is currently held.
bool RemoteContainer::IsRemote() const { return remote_.is_valid(); }
// Moves the held channel out to the caller.
zx::channel RemoteContainer::DetachRemote() { return std::move(remote_); }
// Returns the raw handle value of the held channel; the channel itself stays in |remote_|.
zx_handle_t RemoteContainer::GetRemote() const { return remote_.get(); }
// Takes ownership of |remote| and stores it as the held channel.
void RemoteContainer::SetRemote(zx::channel remote) {
remote_ = std::move(remote);
// Default construction and destruction; no custom logic is needed.
Vfs::Vfs() = default;
Vfs::~Vfs() = default;
#ifdef __Fuchsia__
// Fuchsia-only constructor that records the async dispatcher in |dispatcher_|.
Vfs::Vfs(async_dispatcher_t* dispatcher) : dispatcher_(dispatcher) {}
// Opens |path| relative to |vndir|.
//
// On Fuchsia builds |vfs_lock_| is acquired first; the work itself is delegated
// to OpenLocked() with all arguments forwarded unchanged.
Vfs::OpenResult Vfs::Open(fbl::RefPtr<Vnode> vndir, fbl::StringPiece path,
VnodeConnectionOptions options, Rights parent_rights, uint32_t mode) {
#ifdef __Fuchsia__
fbl::AutoLock lock(&vfs_lock_);
return OpenLocked(std::move(vndir), path, options, parent_rights, mode);
// Core of Open(). Open() acquires |vfs_lock_| (on Fuchsia builds) before calling this.
//
// Steps visible below:
//   1. Pre-validate |options| independently of any node.
//   2. Walk() towards the directory containing the final path component.
//   3. On Fuchsia, if the walk stopped at a remote node, return
//      OpenResult::Remote carrying that node and the unconsumed path.
//   4. Trim the final component, then either create it (|options.flags.create|)
//      or look it up.
//   5. On Fuchsia, return OpenResult::RemoteRoot when the target is remote and
//      |no_remote| is not set.
//   6. For directories opened with the |posix| flag, inherit write/execute
//      from |parent_rights|.
//   7. Validate the options against the node, open it unless this is a node
//      reference or the node was just created, and truncate if requested.
//
// Returns an OpenResult: an error status, Remote, RemoteRoot, or Ok carrying
// the vnode together with its validated options.
// NOTE(review): several statements in this copy are visibly incomplete (for
// example the "must_be_dir" and read-only branches) -- confirm against the
// canonical source.
Vfs::OpenResult Vfs::OpenLocked(fbl::RefPtr<Vnode> vndir, fbl::StringPiece path,
VnodeConnectionOptions options, Rights parent_rights,
uint32_t mode) {
FS_PRETTY_TRACE_DEBUG("VfsOpen: path='", Path(, path.size()), "' options=", options);
zx_status_t r;
if ((r = PrevalidateOptions(options)) != ZX_OK) {
return r;
// Walk() rewrites both |vndir| and |path| in place to describe where it stopped.
if ((r = Vfs::Walk(vndir, &vndir, path, &path)) < 0) {
return r;
#ifdef __Fuchsia__
if (vndir->IsRemote()) {
// remote filesystem, return handle and path to caller
return OpenResult::Remote{.vnode = std::move(vndir), .path = path};
bool must_be_dir = false;
if ((r = TrimName(path, &path, &must_be_dir)) != ZX_OK) {
return r;
} else if (path == "..") {
if (must_be_dir) { = true;
fbl::RefPtr<Vnode> vn;
// Tracks whether EnsureExists() created the node, in which case it is not opened again below.
bool just_created = false;
if (options.flags.create) {
if ((r = EnsureExists(std::move(vndir), path, &vn, options, mode, &just_created)) != ZX_OK) {
return r;
} else {
if ((r = LookupNode(std::move(vndir), path, &vn)) != ZX_OK) {
return r;
#ifdef __Fuchsia__
if (!options.flags.no_remote && vn->IsRemote()) {
// Opening a mount point: Traverse across remote.
return OpenResult::RemoteRoot{.vnode = std::move(vn)};
if (ReadonlyLocked() && options.rights.write) {
if (vn->Supports(fs::VnodeProtocol::kDirectory) && options.flags.posix) {
// Save this before modifying |options| below.
bool admin = options.rights.admin;
// This is such that POSIX open() can open a directory with O_RDONLY, and
// still get the write/execute right if the parent directory connection has the
// write/execute right respectively. With the execute right in particular, the resulting
// connection may be passed to fdio_get_vmo_exec() which requires the execute right.
// This transfers write and execute from the parent, if present.
auto inheritable_rights = Rights::WriteExec();
options.rights |= parent_rights & inheritable_rights;
// The ADMIN right is not inherited. It must be explicitly specified.
options.rights.admin = admin;
auto validated_options = vn->ValidateOptions(options);
if (validated_options.is_error()) {
return validated_options.error();
// |node_reference| requests that we don't actually open the underlying Vnode,
// but use the connection as a reference to the Vnode.
if (!options.flags.node_reference && !just_created) {
if ((r = OpenVnode(validated_options.value(), &vn)) != ZX_OK) {
return r;
#ifdef __Fuchsia__
if (!options.flags.no_remote && vn->IsRemote()) {
// |OpenVnode| redirected us to a remote vnode; traverse across mount point.
return OpenResult::RemoteRoot{.vnode = std::move(vn)};
// Truncate to zero length when requested; a negative status aborts the open.
if (options.flags.truncate && ((r = vn->Truncate(0)) < 0)) {
return r;
FS_TRACE_DEBUG("VfsOpen: vn=%p\n", vn.get());
return OpenResult::Ok{.vnode = std::move(vn), .validated_options = validated_options.value()};
// Creates |path| inside |vndir|, or falls back to looking it up when creation
// is not possible but an existing node is acceptable.
//
// |out_vn|     - receives the created or looked-up node.
// |options|    - consulted for |not_directory| and |fail_if_exists|.
// |mode|       - passed to Vnode::Create(); also checked with S_ISDIR().
// |did_create| - set to true only when Vnode::Create() succeeded; set to
//                false when Create() reported a failure.
//
// Returns ZX_OK after a successful create, the result of LookupNode() on the
// fallback paths, or the status from Vnode::Create() otherwise.
// NOTE(review): the bodies of the leading guard branches (and part of the
// first condition) are not visible in this copy.
zx_status_t Vfs::EnsureExists(fbl::RefPtr<Vnode> vndir, fbl::StringPiece path,
fbl::RefPtr<Vnode>* out_vn, fs::VnodeConnectionOptions options,
uint32_t mode, bool* did_create) {
zx_status_t status;
if ( && !S_ISDIR(mode)) {
} else if (options.flags.not_directory && S_ISDIR(mode)) {
} else if (path == ".") {
} else if (ReadonlyLocked()) {
if ((status = vndir->Create(out_vn, path, mode)) != ZX_OK) {
*did_create = false;
// An existing node is fine unless the caller insisted on exclusive creation.
if ((status == ZX_ERR_ALREADY_EXISTS) && !options.flags.fail_if_exists) {
return LookupNode(std::move(vndir), path, out_vn);
if (status == ZX_ERR_NOT_SUPPORTED) {
// filesystem may not support create (like devfs)
// in which case we should still try to open() the file
return LookupNode(std::move(vndir), path, out_vn);
return status;
#ifdef __Fuchsia__
// Inform directory watchers that a new entry appeared.
vndir->Notify(path, fuchsia_io_WATCH_EVENT_ADDED);
*did_create = true;
return ZX_OK;
// Removes the entry |path| from |vndir|.
//
// The name is trimmed first (a trailing '/' means the target must be a
// directory), "." and ".." are special-cased, and the removal itself is
// delegated to Vnode::Unlink(). On Fuchsia the operation runs under
// |vfs_lock_| and, on success, watchers are notified of the removal.
//
// Returns ZX_OK on success, or the status from TrimName()/Vnode::Unlink().
// NOTE(review): the bodies of the ".", ".." and read-only branches are not
// visible in this copy.
zx_status_t Vfs::Unlink(fbl::RefPtr<Vnode> vndir, fbl::StringPiece path) {
bool must_be_dir;
zx_status_t r;
if ((r = TrimName(path, &path, &must_be_dir)) != ZX_OK) {
return r;
} else if (path == ".") {
} else if (path == "..") {
#ifdef __Fuchsia__
fbl::AutoLock lock(&vfs_lock_);
if (ReadonlyLocked()) {
} else {
r = vndir->Unlink(path, must_be_dir);
if (r != ZX_OK) {
return r;
#ifdef __Fuchsia__
vndir->Notify(path, fuchsia_io_WATCH_EVENT_REMOVED);
return ZX_OK;
#ifdef __Fuchsia__
namespace {
// Returns the koid of |token| as reported by ZX_INFO_HANDLE_BASIC.
//
// The status of get_info() is not checked; |info| is zero-initialized, so the
// returned koid is whatever get_info() leaves in it (presumably still 0 if the
// query fails -- TODO confirm).
zx_koid_t GetTokenKoid(const zx::event& token) {
zx_info_handle_basic_t info = {};
token.get_info(ZX_INFO_HANDLE_BASIC, &info, sizeof(info), nullptr, nullptr);
return info.koid;
} // namespace
// Forgets the vnode association registered for |ios_token|, if the token is
// valid. Runs under |vfs_lock_|.
void Vfs::TokenDiscard(zx::event ios_token) {
fbl::AutoLock lock(&vfs_lock_);
if (ios_token) {
// The token is cleared here to prevent the following race condition:
// 1) Open
// 2) GetToken
// 3) Close + Release Vnode
// 4) Use token handle to access defunct vnode (or a different vnode,
// if the memory for it is reallocated).
// By clearing the token cookie, any remaining handles to the event will
// be ignored by the filesystem server.
auto rename_request = vnode_tokens_.erase(GetTokenKoid(ios_token));
// Produces a token handle that identifies |vn| to this filesystem server.
//
// |vn|        - the vnode the token should refer to.
// |ios_token| - the connection's token slot. If it already holds a valid
//               event, that event is reused; otherwise a new event is created,
//               registered in |vnode_tokens_| under its koid, and stored here.
// |out|       - receives a duplicate (with TOKEN_RIGHTS) of the connection's
//               token.
//
// Returns ZX_OK on success, or the status reported by zx::event::create() /
// duplicate() on failure. Holds |vfs_lock_| for the duration of the call.
zx_status_t Vfs::VnodeToToken(fbl::RefPtr<Vnode> vn, zx::event* ios_token, zx::event* out) {
  fbl::AutoLock lock(&vfs_lock_);
  if (ios_token->is_valid()) {
    // Token has already been set for this iostate; hand out another duplicate.
    // The status is returned directly so that callers see the real error code
    // rather than the boolean result of a comparison.
    return ios_token->duplicate(TOKEN_RIGHTS, out);
  }

  zx::event new_ios_token;
  if (zx_status_t r = zx::event::create(0, &new_ios_token); r != ZX_OK) {
    return r;
  }
  zx::event new_token;
  if (zx_status_t r = new_ios_token.duplicate(TOKEN_RIGHTS, &new_token); r != ZX_OK) {
    return r;
  }

  // Register the association before publishing either handle, so a token is
  // never visible to a caller without a matching |vnode_tokens_| entry.
  auto koid = GetTokenKoid(new_ios_token);
  vnode_tokens_.insert(std::make_unique<VnodeToken>(koid, std::move(vn)));
  *ios_token = std::move(new_ios_token);
  *out = std::move(new_token);
  return ZX_OK;
}
// Maps |token| back to the vnode registered for it in |vnode_tokens_|.
//
// The lookup key is the token's koid. On a hit, |out| receives the associated
// vnode and ZX_OK is returned.
// This function takes no lock itself; the callers visible in this file
// (Rename, Link) hold |vfs_lock_| around the call.
// NOTE(review): the body of the "not found" branch is not visible in this copy.
zx_status_t Vfs::TokenToVnode(zx::event token, fbl::RefPtr<Vnode>* out) {
const auto& vnode_token = vnode_tokens_.find(GetTokenKoid(token));
if (vnode_token == vnode_tokens_.end()) {
// TODO(smklein): Return a more specific error code for "token not from this server"
*out = vnode_token->get_vnode();
return ZX_OK;
// Renames |oldStr| in |oldparent| to |newStr| in the directory identified by
// |token|.
//
// Both names are trimmed first (a trailing '/' marks "must be a directory"),
// and "." / ".." are special-cased for either name. Under |vfs_lock_| the
// token is resolved to the destination directory and the rename is delegated
// to Vnode::Rename(). On success watchers of the old parent are told the old
// name was removed and watchers of the new parent that the new name was added.
//
// Returns ZX_OK on success, or the first failing status from TrimName(),
// TokenToVnode() or Vnode::Rename().
// NOTE(review): the bodies of the "."/".." and read-only branches are not
// visible in this copy.
zx_status_t Vfs::Rename(zx::event token, fbl::RefPtr<Vnode> oldparent, fbl::StringPiece oldStr,
fbl::StringPiece newStr) {
// Local filesystem
bool old_must_be_dir;
bool new_must_be_dir;
zx_status_t r;
if ((r = TrimName(oldStr, &oldStr, &old_must_be_dir)) != ZX_OK) {
return r;
} else if (oldStr == ".") {
} else if (oldStr == "..") {
if ((r = TrimName(newStr, &newStr, &new_must_be_dir)) != ZX_OK) {
return r;
} else if (newStr == "." || newStr == "..") {
fbl::RefPtr<fs::Vnode> newparent;
fbl::AutoLock lock(&vfs_lock_);
if (ReadonlyLocked()) {
if ((r = TokenToVnode(std::move(token), &newparent)) != ZX_OK) {
return r;
r = oldparent->Rename(newparent, oldStr, newStr, old_must_be_dir, new_must_be_dir);
if (r != ZX_OK) {
return r;
oldparent->Notify(oldStr, fuchsia_io_WATCH_EVENT_REMOVED);
newparent->Notify(newStr, fuchsia_io_WATCH_EVENT_ADDED);
return ZX_OK;
// Reads directory entries from |vn| while holding |vfs_lock_|.
//
// All arguments are forwarded unchanged to Vnode::Readdir(), and its status is
// returned as-is.
zx_status_t Vfs::Readdir(Vnode* vn, vdircookie_t* cookie, void* dirents, size_t len,
size_t* out_actual) {
fbl::AutoLock lock(&vfs_lock_);
return vn->Readdir(cookie, dirents, len, out_actual);
// Creates a link named |newStr|, in the directory identified by |token|, to
// the node currently named |oldStr| in |oldparent|.
//
// Runs entirely under |vfs_lock_|. The token is resolved to the destination
// directory first. Both names are trimmed; a name that must be a directory is
// rejected with ZX_ERR_NOT_DIR, and "." / ".." are special-cased. The source
// node is then looked up and handed to Vnode::Link(); on success watchers of
// the destination directory are told the new name was added.
//
// Returns ZX_OK on success, or the first failing status encountered.
// NOTE(review): the bodies of the read-only and "."/".." branches are not
// visible in this copy.
zx_status_t Vfs::Link(zx::event token, fbl::RefPtr<Vnode> oldparent, fbl::StringPiece oldStr,
fbl::StringPiece newStr) {
fbl::AutoLock lock(&vfs_lock_);
fbl::RefPtr<fs::Vnode> newparent;
zx_status_t r;
if ((r = TokenToVnode(std::move(token), &newparent)) != ZX_OK) {
return r;
// Local filesystem
bool old_must_be_dir;
bool new_must_be_dir;
if (ReadonlyLocked()) {
} else if ((r = TrimName(oldStr, &oldStr, &old_must_be_dir)) != ZX_OK) {
return r;
} else if (old_must_be_dir) {
return ZX_ERR_NOT_DIR;
} else if (oldStr == ".") {
} else if (oldStr == "..") {
if ((r = TrimName(newStr, &newStr, &new_must_be_dir)) != ZX_OK) {
return r;
} else if (new_must_be_dir) {
return ZX_ERR_NOT_DIR;
} else if (newStr == "." || newStr == "..") {
// Look up the target vnode
fbl::RefPtr<Vnode> target;
if ((r = oldparent->Lookup(&target, oldStr)) < 0) {
return r;
r = newparent->Link(newStr, target);
if (r != ZX_OK) {
return r;
newparent->Notify(newStr, fuchsia_io_WATCH_EVENT_ADDED);
return ZX_OK;
// Serves |vnode| over |channel| using not-yet-validated |options|.
//
// The options are validated against the vnode first; a validation error is
// returned directly, otherwise the call is forwarded to the overload that
// takes validated options.
zx_status_t Vfs::Serve(fbl::RefPtr<Vnode> vnode, zx::channel channel,
VnodeConnectionOptions options) {
auto result = vnode->ValidateOptions(options);
if (result.is_error()) {
return result.error();
return Serve(std::move(vnode), std::move(channel), result.value());
// Serves |vnode| over |channel| using options that have already been validated.
//
// Picks the protocol to speak (asking the vnode to negotiate when more than one
// candidate remains), optionally sends an OnOpen event, and then either hands
// the channel to the vnode's ConnectService() or builds a connection object
// matching the protocol and starts dispatching on it.
//
// Returns ZX_OK once dispatching has started, the status from ConnectService()
// for connector nodes, or the failure status from StartDispatching().
// NOTE(review): the tail of the connection-building lambda (and one constructor
// argument list) is not visible in this copy.
zx_status_t Vfs::Serve(fbl::RefPtr<Vnode> vnode, zx::channel channel,
Vnode::ValidatedOptions options) {
// |ValidateOptions| was called, hence at least one protocol must be supported.
auto candidate_protocols = options->protocols() & vnode->GetProtocols();
// which() yields a value only when the choice is already unambiguous.
auto maybe_protocol = candidate_protocols.which();
VnodeProtocol protocol;
if (maybe_protocol.has_value()) {
protocol = maybe_protocol.value();
} else {
protocol = vnode->Negotiate(candidate_protocols);
// Send an OnOpen event (an |OnOpenMsg|) if requested.
if (options->flags.describe) {
OnOpenMsg response;
memset(&response, 0, sizeof(response));
response.primary.s = ZX_OK;
zx_handle_t extra = ZX_HANDLE_INVALID;
internal::Describe(vnode, protocol, *options, &response, &extra);
// Attach the extra handle to the message only if Describe() produced one.
uint32_t hcount = (extra != ZX_HANDLE_INVALID) ? 1 : 0;
channel.write(0, &response, sizeof(OnOpenMsg), &extra, hcount);
// If |node_reference| is specified, serve a node connection even for
// |VnodeProtocol::kConnector| nodes.
if (!options->flags.node_reference && protocol == VnodeProtocol::kConnector) {
return vnode->ConnectService(std::move(channel));
auto connection = ([&, this] () -> std::unique_ptr<internal::Connection> {
switch (protocol) {
case VnodeProtocol::kFile:
case VnodeProtocol::kDevice:
case VnodeProtocol::kTty:
// In memfs and bootfs, memory objects (vmo-files) appear to support file-style
// access (NOTE(review): the protocol name originally cited here is missing).
// Therefore choosing a file connection here is the closest approximation.
case VnodeProtocol::kMemory:
return std::make_unique<internal::FileConnection>(this, std::move(vnode),
std::move(channel), protocol, *options);
case VnodeProtocol::kDirectory:
return std::make_unique<internal::DirectoryConnection>(this, std::move(vnode),
std::move(channel), protocol,
case VnodeProtocol::kConnector:
case VnodeProtocol::kPipe:
return std::make_unique<internal::NodeConnection>(this, std::move(vnode),
std::move(channel), protocol, *options);
case VnodeProtocol::kSocket:
// The posix socket protocol is used by netstack and served through the
// src/lib/component/go library.
ZX_PANIC("fuchsia.posix.socket/Control is not implemented");
#ifdef __GNUC__
// GCC does not infer that the above switch statement will always return by
// handling all defined enum members.
zx_status_t status = connection->StartDispatching();
if (status != ZX_OK) {
return status;
return ZX_OK;
// Judging by its name, called for a |connection| that was closed by its remote end.
// NOTE(review): the body of this function is not visible in this copy.
void Vfs::OnConnectionClosedRemotely(internal::Connection* connection) {
// Opens |vn| with the given |rights| and serves it over |channel|.
//
// The options are validated against the vnode and the vnode is opened. The
// peer is then signalled with ZX_USER_SIGNAL_0 to announce that the directory
// is mounted, and serving is delegated to Serve() with the validated options.
//
// Returns the first failing status from validation, OpenVnode() or
// signal_peer() (ZX_ERR_PEER_CLOSED is tolerated), otherwise the result of
// Serve().
// NOTE(review): part of the options set-up on the first body line is not
// visible in this copy.
zx_status_t Vfs::ServeDirectory(fbl::RefPtr<fs::Vnode> vn, zx::channel channel, Rights rights) {
VnodeConnectionOptions options; = true;
options.rights = rights;
auto validated_options = vn->ValidateOptions(options);
if (validated_options.is_error()) {
return validated_options.error();
} else if (zx_status_t r = OpenVnode(validated_options.value(), &vn); r != ZX_OK) {
return r;
// Tell the calling process that we've mounted the directory.
zx_status_t r = channel.signal_peer(0, ZX_USER_SIGNAL_0);
// ZX_ERR_PEER_CLOSED is ok because the channel may still be readable.
if (r != ZX_OK && r != ZX_ERR_PEER_CLOSED) {
return r;
return Serve(std::move(vn), std::move(channel), validated_options.value());
#endif // ifdef __Fuchsia__
// Sets the filesystem's read-only flag to |value|.
// On Fuchsia builds the update is made while holding |vfs_lock_|.
void Vfs::SetReadonly(bool value) {
#ifdef __Fuchsia__
fbl::AutoLock lock(&vfs_lock_);
readonly_ = value;
// Walks |path| from |vn| one '/'-separated component at a time.
//
// When ZX_OK is returned, |out_vn| holds the node at which the walk stopped
// and |out_path| holds the part of the path that was not consumed: either the
// final component ("." if nothing was left) or, on Fuchsia, the remainder that
// a remote filesystem must resolve. A failing lookup of an intermediate
// component is returned as-is.
// NOTE(review): a few expressions (the pointer arguments to set()/memchr() and
// the over-long component branch) are incomplete in this copy.
zx_status_t Vfs::Walk(fbl::RefPtr<Vnode> vn, fbl::RefPtr<Vnode>* out_vn, fbl::StringPiece path,
fbl::StringPiece* out_path) {
zx_status_t r;
while (!path.empty() && path[path.length() - 1] == '/') {
// Discard extra trailing '/' characters.
path.set(, path.length() - 1);
// Each iteration consumes one leading path component.
for (;;) {
while (!path.empty() && path[0] == '/') {
// Discard extra leading '/' characters.
path.set(&path[1], path.length() - 1);
if (path.empty()) {
// Convert empty initial path of final path segment to ".".
path.set(".", 1);
#ifdef __Fuchsia__
if (vn->IsRemote()) {
// Remote filesystem mount, caller must resolve.
*out_vn = std::move(vn);
*out_path = std::move(path);
return ZX_OK;
// Look for the next '/' separated path component.
const char* next_path = reinterpret_cast<const char*>(memchr(, '/', path.length()));
if (next_path == nullptr) {
// Final path segment.
*out_vn = vn;
*out_path = std::move(path);
return ZX_OK;
// Path has at least one additional segment.
fbl::StringPiece component(, next_path -;
if (component.length() > NAME_MAX) {
if ((r = LookupNode(std::move(vn), component, &vn)) != ZX_OK) {
return r;
// Traverse to the next segment.
// Skip the component just resolved plus the '/' that followed it.
path.set(next_path + 1, path.length() - (component.length() + 1));
} // namespace fs