executor/executor_runner.h - third_party/syzkaller - Git at Google

 // Copyright 2024 syzkaller project authors. All rights reserved.
 // Use of this source code is governed by Apache 2 LICENSE that can be found in the LICENSE file.

 #include <fcntl.h>
 #include <signal.h>
 #include <sys/mman.h>
 #include <sys/resource.h>
 #include <unistd.h>

 #include <algorithm>
 #include <deque>
 #include <iomanip>
 #include <memory>
 #include <optional>
 #include <sstream>
 #include <string>
 #include <utility>
 #include <vector>

 inline std::ostream& operator<<(std::ostream& ss, const rpc::ExecRequestRawT& req)
 {
 	return ss << "id=" << req.id
 		  << " flags=0x" << std::hex << static_cast<uint64>(req.flags)
 		  << " env_flags=0x" << std::hex << static_cast<uint64>(req.exec_opts->env_flags())
 		  << " exec_flags=0x" << std::hex << static_cast<uint64>(req.exec_opts->exec_flags())
 		  << " data_size=" << std::dec << req.data.size()
 		  << "\n";
 }

 // ProcIDPool allows to reuse a set of unique proc IDs across a set of subprocesses.
 //
 // When a subprocess hangs, it's a bit unclear what to do (we don't have means to kill
 // the whole tree of its children, and waiting for all them will presumably hang as well).
 // Later there may appear a "task hung" report from the kernel, so we don't want to terminate
 // the VM immidiatly. But the "task hung" report may also not appear at all, so we can't
 // just wait for a hanged subprocesses forever.
 //
 // So in that case we kill/wait just the top subprocesses, and give it a new proc ID
 // (since some resources associated with the old proc ID may still be used by the old
 // unterminated test processes). However, we don't have infinite number of proc IDs,
 // so we recycle them in FIFO order. This is not ideal, but it looks like the best
 // practical solution.
 class ProcIDPool
 {
 public:
 	ProcIDPool(int num_procs)
 	{
 		// Theoretically we have 32 procs (prog.MaxPids), but there are some limitations in descriptions
 		// that make them work well only for up to 10 procs. For example, we form /dev/loopN
 		// device name using proc['0', 1, int8]. When these limitations are fixed,
 		// we can use all 32 here (prog.MaxPids)
 		constexpr int kNumGoodProcs = 10;
 		for (int i = 0; i < std::max(num_procs, kNumGoodProcs); i++)
 			ids_.push_back(i);
 		mask_ = 0;
 	}

 	int Alloc(int old = -1)
 	{
 		if (old >= 0) {
 			mask_ &= ~(1UL << old);
 			ids_.push_back(old);
 		}
 		if (ids_.empty())
 			fail("out of proc ids");
 		int id = ids_.front();
 		ids_.pop_front();
 		mask_ |= 1UL << id;
 		return id;
 	}

 	uint64 Mask()
 	{
 		return mask_;
 	}

 private:
 	std::deque<int> ids_;
 	uint64 mask_;

 	ProcIDPool(const ProcIDPool&) = delete;
 	ProcIDPool& operator=(const ProcIDPool&) = delete;
 };

 class ProcOpts
 {
 public:
 	bool use_cover_edges = false;
 	bool is_kernel_64_bit = false;
 	uint32 slowdown = 0;
 	uint32 syscall_timeout_ms = 0;
 	uint32 program_timeout_ms = 0;

 private:
 	friend std::ostream& operator<<(std::ostream& ss, const ProcOpts& opts)
 	{
 		ss << "use_cover_edges=" << opts.use_cover_edges
 		   << " is_kernel_64_bit=" << opts.is_kernel_64_bit
 		   << " slowdown=" << opts.slowdown
 		   << " syscall_timeout_ms=" << opts.syscall_timeout_ms
 		   << " program_timeout_ms=" << opts.program_timeout_ms;
 		return ss;
 	}
 };

 // Proc represents one subprocess that runs tests (re-execed syz-executor with 'exec' argument).
 // The object is persistent and re-starts subprocess when it crashes.
 class Proc
 {
 public:
 	Proc(Connection& conn, const char* bin, ProcIDPool& proc_id_pool, int& restarting, const bool& corpus_triaged, int max_signal_fd,
 	     int cover_filter_fd, ProcOpts opts)
 	    : conn_(conn),
 	      bin_(bin),
 	      proc_id_pool_(proc_id_pool),
 	      id_(proc_id_pool.Alloc()),
 	      restarting_(restarting),
 	      corpus_triaged_(corpus_triaged),
 	      max_signal_fd_(max_signal_fd),
 	      cover_filter_fd_(cover_filter_fd),
 	      opts_(opts),
 	      req_shmem_(kMaxInput),
 	      resp_shmem_(kMaxOutput),
 	      resp_mem_(static_cast<OutputData*>(resp_shmem_.Mem()))
 	{
 		Start();
 	}

 	bool Execute(rpc::ExecRequestRawT& msg)
 	{
 		if (state_ != State::Started && state_ != State::Idle)
 			return false;
 		if (((~msg.avoid) & proc_id_pool_.Mask()) == 0)
 			msg.avoid = 0;
 		if (msg.avoid & (1ull << id_))
 			return false;
 		if (msg_)
 			fail("already have pending msg");
 		if (wait_start_)
 			wait_end_ = current_time_ms();
 		// Restart every once in a while to not let too much state accumulate.
 		// Also request if request type differs as it affects program timeout.
 		constexpr uint64 kRestartEvery = 600;
 		if (state_ == State::Idle && ((corpus_triaged_ && restarting_ == 0 && freshness_ >= kRestartEvery) ||
 					      req_type_ != msg.type ||
 					      exec_env_ != msg.exec_opts->env_flags() || sandbox_arg_ != msg.exec_opts->sandbox_arg()))
 			Restart();
 		attempts_ = 0;
 		msg_ = std::move(msg);
 		if (state_ == State::Started)
 			Handshake();
 		else
 			Execute();
 		return true;
 	}

 	void Arm(Select& select)
 	{
 		select.Arm(resp_pipe_);
 		select.Arm(stdout_pipe_);
 	}

 	void Ready(Select& select, uint64 now, bool out_of_requests)
 	{
 		if (state_ == State::Handshaking || state_ == State::Executing) {
 			// Check if the subprocess has hung.
 #if SYZ_EXECUTOR_USES_FORK_SERVER
 			// Child process has an internal timeout and protects against most hangs when
 			// fork server is enabled, so we use quite large timeout. Child process can be slow
 			// due to global locks in namespaces and other things, so let's better wait than
 			// report false misleading crashes.
 			uint64 timeout = 3 * ProgramTimeoutMs();
 #else
 			uint64 timeout = ProgramTimeoutMs();
 #endif
 			// Sandbox setup can take significant time.
 			if (state_ == State::Handshaking)
 				timeout = 60 * 1000 * opts_.slowdown;
 			if (now > exec_start_ + timeout) {
 				Restart();
 				return;
 			}
 		}

 		if (select.Ready(stdout_pipe_) && !ReadOutput()) {
 #if SYZ_EXECUTOR_USES_FORK_SERVER
 			// In non-forking mode the subprocess exits after test execution
 			// and the pipe read fails with EOF, so we rely on the resp_pipe_ instead.
 			Restart();
 			return;
 #endif
 		}
 		if (select.Ready(resp_pipe_) && !ReadResponse(out_of_requests)) {
 			Restart();
 			return;
 		}
 		return;
 	}

 private:
 	enum State : uint8 {
 		// The process has just started.
 		Started,
 		// We sent the process env flags and waiting for handshake reply.
 		Handshaking,
 		// Handshaked and ready to execute programs.
 		Idle,
 		// Currently executing a test program.
 		Executing,
 	};

 	Connection& conn_;
 	const char* const bin_;
 	ProcIDPool& proc_id_pool_;
 	int id_;
 	int& restarting_;
 	const bool& corpus_triaged_;
 	const int max_signal_fd_;
 	const int cover_filter_fd_;
 	const ProcOpts opts_;
 	State state_ = State::Started;
 	std::optional<Subprocess> process_;
 	ShmemFile req_shmem_;
 	ShmemFile resp_shmem_;
 	OutputData* resp_mem_;
 	int req_pipe_ = -1;
 	int resp_pipe_ = -1;
 	int stdout_pipe_ = -1;
 	rpc::RequestType req_type_ = rpc::RequestType::Program;
 	rpc::ExecEnv exec_env_ = rpc::ExecEnv::NONE;
 	int64_t sandbox_arg_ = 0;
 	std::optional<rpc::ExecRequestRawT> msg_;
 	std::vector<uint8_t> output_;
 	size_t debug_output_pos_ = 0;
 	uint64 attempts_ = 0;
 	uint64 freshness_ = 0;
 	uint64 exec_start_ = 0;
 	uint64 wait_start_ = 0;
 	uint64 wait_end_ = 0;

 	friend std::ostream& operator<<(std::ostream& ss, const Proc& proc)
 	{
 		ss << "id=" << proc.id_
 		   << " state=" << static_cast<int>(proc.state_)
 		   << " freshness=" << proc.freshness_
 		   << " attempts=" << proc.attempts_
 		   << " exec_start=" << current_time_ms() - proc.exec_start_
 		   << "\n";
 		if (proc.msg_)
 			ss << "\tcurrent request: " << *proc.msg_;
 		return ss;
 	}

 	void ChangeState(State state)
 	{
 		if (state_ == State::Handshaking)
 			restarting_--;
 		if (state == State::Handshaking)
 			restarting_++;
 		state_ = state;
 	}

 	void Restart()
 	{
 		debug("proc %d: restarting subprocess, current state %u attempts %llu\n", id_, state_, attempts_);
 		int status = process_->KillAndWait();
 		process_.reset();
 		debug("proc %d: subprocess exit status %d\n", id_, status);
 		if (++attempts_ > 20) {
 			while (ReadOutput())
 				;
 			// Write the subprocess output first. If it contains own SYFAIL,
 			// we want it to be before our SYZFAIL.
 			ssize_t wrote = write(STDERR_FILENO, output_.data(), output_.size());
 			if (wrote != static_cast<ssize_t>(output_.size()))
 				fprintf(stderr, "output truncated: %zd/%zd (errno=%d)\n",
 					wrote, output_.size(), errno);
 			uint64 req_id = msg_ ? msg_->id : -1;
 			failmsg("repeatedly failed to execute the program", "proc=%d req=%lld state=%d status=%d",
 				id_, req_id, state_, status);
 		}
 		// Ignore all other errors.
 		// Without fork server executor can legitimately exit (program contains exit_group),
 		// with fork server the top process can exit with kFailStatus if it wants special handling.
 		if (status != kFailStatus)
 			status = 0;
 		if (FailCurrentRequest(status == kFailStatus)) {
 			// Read out all pening output until EOF.
 			if (IsSet(msg_->flags, rpc::RequestFlag::ReturnOutput)) {
 				while (ReadOutput())
 					;
 			}
 			bool hanged = SYZ_EXECUTOR_USES_FORK_SERVER && state_ == State::Executing;
 			HandleCompletion(status, hanged);
 			if (hanged) {
 				// If the process has hanged, it may still be using per-proc resources,
 				// so allocate a fresh proc id.
 				int new_id = proc_id_pool_.Alloc(id_);
 				debug("proc %d: changing proc id to %d\n", id_, new_id);
 				id_ = new_id;
 			}
 		} else if (attempts_ > 3)
 			sleep_ms(100 * attempts_);
 		Start();
 	}

 	bool FailCurrentRequest(bool failed)
 	{
 		if (state_ == State::Handshaking)
 			return IsSet(msg_->flags, rpc::RequestFlag::ReturnError);
 		if (state_ == State::Executing)
 			return !failed || IsSet(msg_->flags, rpc::RequestFlag::ReturnError);
 		return false;
 	}

 	void Start()
 	{
 		ChangeState(State::Started);
 		freshness_ = 0;
 		int req_pipe[2];
 		if (pipe(req_pipe))
 			fail("pipe failed");
 		int resp_pipe[2];
 		if (pipe(resp_pipe))
 			fail("pipe failed");
 		int stdout_pipe[2];
 		if (pipe(stdout_pipe))
 			fail("pipe failed");

 		std::vector<std::pair<int, int>> fds = {
 		    {req_pipe[0], STDIN_FILENO},
 		    {resp_pipe[1], STDOUT_FILENO},
 		    {stdout_pipe[1], STDERR_FILENO},
 		    {req_shmem_.FD(), kInFd},
 		    {resp_shmem_.FD(), kOutFd},
 		    {max_signal_fd_, kMaxSignalFd},
 		    {cover_filter_fd_, kCoverFilterFd},
 		};
 		const char* argv[] = {bin_, "exec", nullptr};
 		process_.emplace(argv, fds);

 		Select::Prepare(resp_pipe[0]);
 		Select::Prepare(stdout_pipe[0]);

 		close(req_pipe[0]);
 		close(resp_pipe[1]);
 		close(stdout_pipe[1]);

 		close(req_pipe_);
 		close(resp_pipe_);
 		close(stdout_pipe_);

 		req_pipe_ = req_pipe[1];
 		resp_pipe_ = resp_pipe[0];
 		stdout_pipe_ = stdout_pipe[0];

 		if (msg_)
 			Handshake();
 	}

 	void Handshake()
 	{
 		if (state_ != State::Started || !msg_)
 			fail("wrong handshake state");
 		debug("proc %d: handshaking to execute request %llu\n", id_, static_cast<uint64>(msg_->id));
 		ChangeState(State::Handshaking);
 		exec_start_ = current_time_ms();
 		req_type_ = msg_->type;
 		exec_env_ = msg_->exec_opts->env_flags() & ~rpc::ExecEnv::ResetState;
 		sandbox_arg_ = msg_->exec_opts->sandbox_arg();
 		handshake_req req = {
 		    .magic = kInMagic,
 		    .use_cover_edges = opts_.use_cover_edges,
 		    .is_kernel_64_bit = opts_.is_kernel_64_bit,
 		    .flags = exec_env_,
 		    .pid = static_cast<uint64>(id_),
 		    .sandbox_arg = static_cast<uint64>(sandbox_arg_),
 		    .syscall_timeout_ms = opts_.syscall_timeout_ms,
 		    .program_timeout_ms = ProgramTimeoutMs(),
 		    .slowdown_scale = opts_.slowdown,
 		};
 		if (write(req_pipe_, &req, sizeof(req)) != sizeof(req)) {
 			debug("request pipe write failed (errno=%d)\n", errno);
 			Restart();
 		}
 	}

 	void Execute()
 	{
 		if (state_ != State::Idle || !msg_)
 			fail("wrong state for execute");

 		debug("proc %d: start executing request %llu\n", id_, static_cast<uint64>(msg_->id));

 		rpc::ExecutingMessageRawT exec;
 		exec.id = msg_->id;
 		exec.proc_id = id_;
 		exec.try_ = attempts_;

 		if (wait_start_) {
 			exec.wait_duration = (wait_end_ - wait_start_) * 1000 * 1000;
 			wait_end_ = wait_start_ = 0;
 		}

 		rpc::ExecutorMessageRawT raw;
 		raw.msg.Set(std::move(exec));
 		conn_.Send(raw);

 		uint64 all_call_signal = 0;
 		bool all_extra_signal = false;
 		for (int32_t call : msg_->all_signal) {
 			// This code assumes that call indices can be represented as bits in uint64 all_call_signal.
 			static_assert(kMaxCalls == 64);
 			if (call < -1 || call >= static_cast<int32_t>(kMaxCalls))
 				failmsg("bad all_signal call", "call=%d", call);
 			if (call < 0)
 				all_extra_signal = true;
 			else
 				all_call_signal |= 1ull << call;
 		}
 		memcpy(req_shmem_.Mem(), msg_->data.data(), std::min(msg_->data.size(), kMaxInput));
 		execute_req req{
 		    .magic = kInMagic,
 		    .id = static_cast<uint64>(msg_->id),
 		    .type = msg_->type,
 		    .exec_flags = static_cast<uint64>(msg_->exec_opts->exec_flags()),
 		    .all_call_signal = all_call_signal,
 		    .all_extra_signal = all_extra_signal,
 		};
 		exec_start_ = current_time_ms();
 		ChangeState(State::Executing);
 		if (write(req_pipe_, &req, sizeof(req)) != sizeof(req)) {
 			debug("request pipe write failed (errno=%d)\n", errno);
 			Restart();
 		}
 	}

 	void HandleCompletion(uint32 status, bool hanged = false)
 	{
 		if (!msg_)
 			fail("don't have executed msg");

 		// Note: if the child process crashed during handshake and the request has ReturnError flag,
 		// we have not started executing the request yet.
 		uint64 elapsed = (current_time_ms() - exec_start_) * 1000 * 1000;
 		uint8* prog_data = msg_->data.data();
 		input_data = prog_data;
 		std::vector<uint8_t>* output = nullptr;
 		if (IsSet(msg_->flags, rpc::RequestFlag::ReturnOutput)) {
 			output = &output_;
 			if (status) {
 				char tmp[128];
 				snprintf(tmp, sizeof(tmp), "\nprocess exited with status %d\n", status);
 				output_.insert(output_.end(), tmp, tmp + strlen(tmp));
 			}
 		}
 		uint32 num_calls = 0;
 		if (msg_->type == rpc::RequestType::Program)
 			num_calls = read_input(&prog_data);
 		auto data = finish_output(resp_mem_, id_, msg_->id, num_calls, elapsed, freshness_++, status, hanged, output);
 		conn_.Send(data.data(), data.size());

 		resp_mem_->Reset();
 		msg_.reset();
 		output_.clear();
 		debug_output_pos_ = 0;
 		ChangeState(State::Idle);
 #if !SYZ_EXECUTOR_USES_FORK_SERVER
 		if (process_)
 			Restart();
 #endif
 	}

 	bool ReadResponse(bool out_of_requests)
 	{
 		uint32 status;
 		ssize_t n;
 		while ((n = read(resp_pipe_, &status, sizeof(status))) == -1) {
 			if (errno != EINTR && errno != EAGAIN)
 				break;
 		}
 		if (n == 0) {
 			debug("proc %d: response pipe EOF\n", id_);
 			return false;
 		}
 		if (n != sizeof(status))
 			failmsg("proc resp pipe read failed", "n=%zd", n);
 		if (state_ == State::Handshaking) {
 			debug("proc %d: got handshake reply\n", id_);
 			ChangeState(State::Idle);
 			Execute();
 		} else if (state_ == State::Executing) {
 			debug("proc %d: got execute reply\n", id_);
 			HandleCompletion(status);
 			if (out_of_requests)
 				wait_start_ = current_time_ms();
 		} else {
 			debug("got data on response pipe in wrong state %d\n", state_);
 			return false;
 		}
 		return true;
 	}

 	bool ReadOutput()
 	{
 		const size_t kChunk = 1024;
 		output_.resize(output_.size() + kChunk);
 		ssize_t n = read(stdout_pipe_, output_.data() + output_.size() - kChunk, kChunk);
 		output_.resize(output_.size() - kChunk + std::max<ssize_t>(n, 0));
 		if (n < 0) {
 			if (errno == EINTR || errno == EAGAIN)
 				return true;
 			fail("proc stdout read failed");
 		}
 		if (n == 0) {
 			debug("proc %d: output pipe EOF\n", id_);
 			return false;
 		}
 		if (flag_debug) {
 			const bool has_nl = output_.back() == '\n';
 			output_.resize(output_.size() + 1);
 			char* output = reinterpret_cast<char*>(output_.data()) + debug_output_pos_;
 			// During machine check we can execute some requests that legitimately fail.
 			// These requests have ReturnError flag, so that the failure is returned
 			// to the caller for analysis. Don't print SYZFAIL in these requests,
 			// otherwise it will be detected as a bug.
 			if (msg_ && IsSet(msg_->flags, rpc::RequestFlag::ReturnError)) {
 				char* syzfail = strstr(output, "SYZFAIL");
 				if (syzfail)
 					memcpy(syzfail, "NOTFAIL", strlen("NOTFAIL"));
 			}
 			debug("proc %d: got output: %s%s", id_, output, has_nl ? "" : "\n");
 			output_.resize(output_.size() - 1);
 			debug_output_pos_ = output_.size();
 		}
 		return true;
 	}

 	uint32 ProgramTimeoutMs() const
 	{
 		// Glob requests can expand to >10K files and can take a while to run.
 		return opts_.program_timeout_ms * (req_type_ == rpc::RequestType::Program ? 1 : 10);
 	}
 };

 // Runner manages a set of test subprocesses (Proc's), receives new test requests from the manager,
 // and dispatches them to subprocesses.
 class Runner
 {
 public:
 	Runner(Connection& conn, int vm_index, const char* bin)
 	    : conn_(conn),
 	      vm_index_(vm_index)
 	{
 		int num_procs = Handshake();
 		proc_id_pool_.emplace(num_procs);
 		int max_signal_fd = max_signal_ ? max_signal_->FD() : -1;
 		int cover_filter_fd = cover_filter_ ? cover_filter_->FD() : -1;
 		for (int i = 0; i < num_procs; i++)
 			procs_.emplace_back(new Proc(conn, bin, *proc_id_pool_, restarting_, corpus_triaged_,
 						     max_signal_fd, cover_filter_fd, proc_opts_));

 		for (;;)
 			Loop();
 	}

 private:
 	Connection& conn_;
 	const int vm_index_;
 	std::optional<CoverFilter> max_signal_;
 	std::optional<CoverFilter> cover_filter_;
 	std::optional<ProcIDPool> proc_id_pool_;
 	std::vector<std::unique_ptr<Proc>> procs_;
 	std::deque<rpc::ExecRequestRawT> requests_;
 	std::vector<std::string> leak_frames_;
 	int restarting_ = 0;
 	bool corpus_triaged_ = false;
 	ProcOpts proc_opts_{};

 	friend std::ostream& operator<<(std::ostream& ss, const Runner& runner)
 	{
 		ss << "vm_index=" << runner.vm_index_
 		   << " max_signal=" << !!runner.max_signal_
 		   << " cover_filter=" << !!runner.cover_filter_
 		   << " restarting=" << runner.restarting_
 		   << " corpus_triaged=" << runner.corpus_triaged_
 		   << " " << runner.proc_opts_
 		   << "\n";
 		ss << "procs:\n";
 		for (const auto& proc : runner.procs_)
 			ss << *proc;
 		ss << "\nqueued requests (" << runner.requests_.size() << "):\n";
 		for (const auto& req : runner.requests_)
 			ss << req;
 		return ss;
 	}

 	void Loop()
 	{
 		Select select;
 		select.Arm(conn_.FD());
 		for (auto& proc : procs_)
 			proc->Arm(select);
 		// Wait for ready host connection and subprocess pipes.
 		// Timeout is for terminating hanged subprocesses.
 		select.Wait(1000);
 		uint64 now = current_time_ms();

 		if (select.Ready(conn_.FD())) {
 			rpc::HostMessageRawT raw;
 			conn_.Recv(raw);
 			if (auto* msg = raw.msg.AsExecRequest())
 				Handle(*msg);
 			else if (auto* msg = raw.msg.AsSignalUpdate())
 				Handle(*msg);
 			else if (auto* msg = raw.msg.AsCorpusTriaged())
 				Handle(*msg);
 			else if (auto* msg = raw.msg.AsStateRequest())
 				Handle(*msg);
 			else
 				failmsg("unknown host message type", "type=%d", static_cast<int>(raw.msg.type));
 		}

 		for (auto& proc : procs_) {
 			proc->Ready(select, now, requests_.empty());
 			if (!requests_.empty()) {
 				if (proc->Execute(requests_.front()))
 					requests_.pop_front();
 			}
 		}

 		if (restarting_ < 0 || restarting_ > static_cast<int>(procs_.size()))
 			failmsg("bad restarting", "restarting=%d", restarting_);
 	}

 	// Implementation must match that in pkg/rpcserver/rpcserver.go.
 	uint64 HashAuthCookie(uint64 cookie)
 	{
 		const uint64_t prime1 = 73856093;
 		const uint64_t prime2 = 83492791;

 		return (cookie * prime1) ^ prime2;
 	}

 	int Handshake()
 	{
 		// Handshake stage 0: get a cookie from the manager.
 		rpc::ConnectHelloRawT conn_hello;
 		conn_.Recv(conn_hello);

 		// Handshake stage 1: share basic information about the client.
 		rpc::ConnectRequestRawT conn_req;
 		conn_req.cookie = HashAuthCookie(conn_hello.cookie);
 		conn_req.id = vm_index_;
 		conn_req.arch = GOARCH;
 		conn_req.git_revision = GIT_REVISION;
 		conn_req.syz_revision = SYZ_REVISION;
 		conn_.Send(conn_req);

 		rpc::ConnectReplyRawT conn_reply;
 		conn_.Recv(conn_reply);
 		if (conn_reply.debug)
 			flag_debug = true;
 		debug("connected to manager: procs=%d cover_edges=%d kernel_64_bit=%d slowdown=%d syscall_timeout=%u"
 		      " program_timeout=%u features=0x%llx\n",
 		      conn_reply.procs, conn_reply.cover_edges, conn_reply.kernel_64_bit,
 		      conn_reply.slowdown, conn_reply.syscall_timeout_ms,
 		      conn_reply.program_timeout_ms, static_cast<uint64>(conn_reply.features));
 		leak_frames_ = conn_reply.leak_frames;

 		proc_opts_.use_cover_edges = conn_reply.cover_edges;
 		proc_opts_.is_kernel_64_bit = is_kernel_64_bit = conn_reply.kernel_64_bit;
 		proc_opts_.slowdown = conn_reply.slowdown;
 		proc_opts_.syscall_timeout_ms = conn_reply.syscall_timeout_ms;
 		proc_opts_.program_timeout_ms = conn_reply.program_timeout_ms;
 		if (conn_reply.cover)
 			max_signal_.emplace();

 		// Handshake stage 2: share information requested by the manager.
 		rpc::InfoRequestRawT info_req;
 		info_req.files = ReadFiles(conn_reply.files);

 		// This does any one-time setup for the requested features on the machine.
 		// Note: this can be called multiple times and must be idempotent.
 #if SYZ_HAVE_FEATURES
 		setup_sysctl();
 		setup_cgroups();
 #endif
 #if SYZ_HAVE_SETUP_EXT
 		// This can be defined in common_ext.h.
 		setup_ext();
 #endif
 		for (const auto& feat : features) {
 			if (!(conn_reply.features & feat.id))
 				continue;
 			debug("setting up feature %s\n", rpc::EnumNameFeature(feat.id));
 			const char* reason = feat.setup();
 			conn_reply.features &= ~feat.id;
 			std::unique_ptr<rpc::FeatureInfoRawT> res(new rpc::FeatureInfoRawT);
 			res->id = feat.id;
 			res->need_setup = true;
 			if (reason) {
 				debug("failed: %s\n", reason);
 				res->reason = reason;
 			}
 			info_req.features.push_back(std::move(res));
 		}
 		for (auto id : rpc::EnumValuesFeature()) {
 			if (!(conn_reply.features & id))
 				continue;
 			std::unique_ptr<rpc::FeatureInfoRawT> res(new rpc::FeatureInfoRawT);
 			res->id = id;
 			res->need_setup = false;
 			info_req.features.push_back(std::move(res));
 		}

 #if SYZ_HAVE_KCSAN
 		setup_kcsan_filter(conn_reply.race_frames);
 #endif

 		conn_.Send(info_req);

 		rpc::InfoReplyRawT info_reply;
 		conn_.Recv(info_reply);
 		debug("received info reply: covfilter=%zu\n", info_reply.cover_filter.size());
 		if (!info_reply.cover_filter.empty()) {
 			cover_filter_.emplace();
 			for (auto pc : info_reply.cover_filter)
 				cover_filter_->Insert(pc);
 		}

 		Select::Prepare(conn_.FD());
 		return conn_reply.procs;
 	}

 	void Handle(rpc::ExecRequestRawT& msg)
 	{
 		debug("recv exec request %llu: type=%llu flags=0x%llx env=0x%llx exec=0x%llx size=%zu\n",
 		      static_cast<uint64>(msg.id),
 		      static_cast<uint64>(msg.type),
 		      static_cast<uint64>(msg.flags),
 		      static_cast<uint64>(msg.exec_opts->env_flags()),
 		      static_cast<uint64>(msg.exec_opts->exec_flags()),
 		      msg.data.size());
 		if (msg.type == rpc::RequestType::Binary) {
 			ExecuteBinary(msg);
 			return;
 		}
 		for (auto& proc : procs_) {
 			if (proc->Execute(msg))
 				return;
 		}
 		requests_.push_back(std::move(msg));
 	}

 	void Handle(const rpc::SignalUpdateRawT& msg)
 	{
 		debug("recv signal update: new=%zu\n", msg.new_max.size());
 		if (!max_signal_)
 			fail("signal update when no signal filter installed");
 		for (auto pc : msg.new_max)
 			max_signal_->Insert(pc);
 	}

 	void Handle(const rpc::CorpusTriagedRawT& msg)
 	{
 		// TODO: repair leak checking (#4728).
 		debug("recv corpus triaged\n");
 		corpus_triaged_ = true;
 	}

 	void Handle(const rpc::StateRequestRawT& msg)
 	{
 		// Debug request about our internal state.
 		std::ostringstream ss;
 		ss << *this;
 		const std::string& str = ss.str();
 		rpc::StateResultRawT res;
 		res.data.insert(res.data.begin(), str.data(), str.data() + str.size());
 		rpc::ExecutorMessageRawT raw;
 		raw.msg.Set(std::move(res));
 		conn_.Send(raw);
 	}

 	void ExecuteBinary(rpc::ExecRequestRawT& msg)
 	{
 		rpc::ExecutingMessageRawT exec;
 		exec.id = msg.id;
 		rpc::ExecutorMessageRawT raw;
 		raw.msg.Set(std::move(exec));
 		conn_.Send(raw);

 		char dir_template[] = "syz-bin-dirXXXXXX";
 		char* dir = mkdtemp(dir_template);
 		if (dir == nullptr)
 			fail("mkdtemp failed");
 		if (chmod(dir, 0777))
 			fail("chmod failed");
 		auto [err, output] = ExecuteBinaryImpl(msg, dir);
 		if (!err.empty()) {
 			char tmp[64];
 			snprintf(tmp, sizeof(tmp), " (errno %d: %s)", errno, strerror(errno));
 			err += tmp;
 		}
 		remove_dir(dir);
 		rpc::ExecResultRawT res;
 		res.id = msg.id;
 		res.error = std::move(err);
 		res.output = std::move(output);
 		raw.msg.Set(std::move(res));
 		conn_.Send(raw);
 	}

 	std::tuple<std::string, std::vector<uint8_t>> ExecuteBinaryImpl(rpc::ExecRequestRawT& msg, const char* dir)
 	{
 		// For simplicity we just wait for binary tests to complete blocking everything else.
 		std::string file = std::string(dir) + "/syz-executor";
 		int fd = open(file.c_str(), O_WRONLY | O_CLOEXEC | O_CREAT, 0755);
 		if (fd == -1)
 			return {"binary file creation failed", {}};
 		ssize_t wrote = write(fd, msg.data.data(), msg.data.size());
 		close(fd);
 		if (wrote != static_cast<ssize_t>(msg.data.size()))
 			return {"binary file write failed", {}};

 		int stdin_pipe[2];
 		if (pipe(stdin_pipe))
 			fail("pipe failed");
 		int stdout_pipe[2];
 		if (pipe(stdout_pipe))
 			fail("pipe failed");

 		const char* argv[] = {file.c_str(), nullptr};
 		std::vector<std::pair<int, int>> fds = {
 		    {stdin_pipe[0], STDIN_FILENO},
 		    {stdout_pipe[1], STDOUT_FILENO},
 		    {stdout_pipe[1], STDERR_FILENO},
 		};
 		Subprocess process(argv, fds);

 		close(stdin_pipe[0]);
 		close(stdout_pipe[1]);

 		int status = process.WaitAndKill(5 * proc_opts_.program_timeout_ms);

 		std::vector<uint8_t> output;
 		for (;;) {
 			const size_t kChunk = 1024;
 			output.resize(output.size() + kChunk);
 			ssize_t n = read(stdout_pipe[0], output.data() + output.size() - kChunk, kChunk);
 			output.resize(output.size() - kChunk + std::max<ssize_t>(n, 0));
 			if (n <= 0)
 				break;
 		}
 		close(stdin_pipe[1]);
 		close(stdout_pipe[0]);

 		return {status == kFailStatus ? "process failed" : "", std::move(output)};
 	}
 };

 static void SigintHandler(int sig)
 {
 	// GCE VM preemption is signalled as SIGINT, notify syz-manager.
 	exitf("SYZ-EXECUTOR: PREEMPTED");
 }

 static void SigchldHandler(int sig)
 {
 	// We need just blocking syscall preemption.
 }

 static void FatalHandler(int sig, siginfo_t* info, void* ucontext)
 {
 	// Print minimal debugging info we can extract reasonably easy.
 	uintptr_t pc = 0xdeadbeef;
 #if GOOS_linux
 	auto& mctx = static_cast<ucontext_t*>(ucontext)->uc_mcontext;
 	(void)mctx;
 #if GOARCH_amd64
 	pc = mctx.gregs[REG_RIP];
 #elif GOARCH_arm64
 	pc = mctx.pc;
 #endif
 #endif
 	const char* name = "unknown signal";
 	switch (sig) {
 	case SIGSEGV:
 		name = "SIGSEGV";
 		break;
 	case SIGBUS:
 		name = "SIGBUS";
 		break;
 	case SIGILL:
 		name = "SIGILL";
 		break;
 	case SIGFPE:
 		name = "SIGFPE";
 		break;
 	}
 	// Print the current function PC so that it's possible to map the failing PC
 	// to a symbol in the binary offline (we usually compile as PIE).
 	failmsg(name, "pc-offset:0x%zx pc:%p addr:%p code=%d",
 		reinterpret_cast<uintptr_t>(reinterpret_cast<void*>(FatalHandler)) - pc,
 		reinterpret_cast<void*>(pc), info->si_addr, info->si_code);
 }

 static void runner(char** argv, int argc)
 {
 	if (argc != 5)
 		fail("usage: syz-executor runner <index> <manager-addr> <manager-port>");
 	char* endptr = nullptr;
 	int vm_index = strtol(argv[2], &endptr, 10);
 	if (vm_index < 0 || *endptr != 0)
 		failmsg("failed to parse VM index", "str='%s'", argv[2]);
 	const char* const manager_addr = argv[3];
 	const char* const manager_port = argv[4];

 	struct rlimit rlim;
 	rlim.rlim_cur = rlim.rlim_max = kFdLimit;
 	if (setrlimit(RLIMIT_NOFILE, &rlim))
 		fail("setrlimit(RLIMIT_NOFILE) failed");

 	// Ignore all signals we are not interested in.
 	// In particular we want to ignore SIGPIPE, but also everything else since
 	// test processes manage to send random signals using tracepoints with bpf programs.
 	// This is not a bullet-proof protection, but it won't harm either.
 	for (int sig = 0; sig <= 64; sig++)
 		signal(sig, SIG_IGN);
 	if (signal(SIGINT, SigintHandler) == SIG_ERR)
 		fail("signal(SIGINT) failed");
 	if (signal(SIGTERM, SigintHandler) == SIG_ERR)
 		fail("signal(SIGTERM) failed");
 	if (signal(SIGCHLD, SigchldHandler) == SIG_ERR)
 		fail("signal(SIGCHLD) failed");
 	struct sigaction act = {};
 	act.sa_flags = SA_SIGINFO;
 	act.sa_sigaction = FatalHandler;
 	for (auto sig : {SIGSEGV, SIGBUS, SIGILL, SIGFPE}) {
 		if (sigaction(sig, &act, nullptr))
 			failmsg("sigaction failed", "sig=%d", sig);
 	}

 	Connection conn(manager_addr, manager_port);

 	// This is required to make Subprocess fd remapping logic work.
 	// kCoverFilterFd is the largest fd we set in the child processes.
 	for (int fd = conn.FD(); fd < kCoverFilterFd;)
 		fd = dup(fd);

 	Runner(conn, vm_index, argv[0]);
 }