| //go:build linux || freebsd |
| |
| package daemon |
| |
| import ( |
| "context" |
| "fmt" |
| "os" |
| "path" |
| "path/filepath" |
| "strconv" |
| "syscall" |
| |
| "github.com/containerd/log" |
| "github.com/moby/moby/v2/daemon/config" |
| "github.com/moby/moby/v2/daemon/container" |
| "github.com/moby/moby/v2/daemon/internal/netipstringer" |
| "github.com/moby/moby/v2/daemon/internal/stringid" |
| "github.com/moby/moby/v2/daemon/libnetwork" |
| "github.com/moby/moby/v2/daemon/libnetwork/drivers/bridge" |
| "github.com/moby/moby/v2/daemon/links" |
| "github.com/moby/moby/v2/daemon/network" |
| "github.com/moby/moby/v2/errdefs" |
| "github.com/moby/moby/v2/pkg/process" |
| "github.com/moby/sys/mount" |
| "github.com/moby/sys/user" |
| "github.com/opencontainers/selinux/go-selinux/label" |
| "github.com/pkg/errors" |
| "go.opentelemetry.io/otel" |
| "golang.org/x/sys/unix" |
| ) |
| |
| func (daemon *Daemon) setupLinkedContainers(ctr *container.Container) ([]string, error) { |
| bridgeSettings := ctr.NetworkSettings.Networks[network.DefaultNetwork] |
| if bridgeSettings == nil || bridgeSettings.EndpointSettings == nil { |
| return nil, nil |
| } |
| |
| var env []string |
| for linkAlias, child := range daemon.linkIndex.children(ctr) { |
| if !child.State.IsRunning() { |
| return nil, fmt.Errorf("Cannot link to a non running container: %s AS %s", child.Name, linkAlias) |
| } |
| |
| childBridgeSettings := child.NetworkSettings.Networks[network.DefaultNetwork] |
| if childBridgeSettings == nil || childBridgeSettings.EndpointSettings == nil { |
| return nil, fmt.Errorf("container %s not attached to default bridge network", child.ID) |
| } |
| |
| // Environment variables defined when using legacy links are deprecated and will be removed in a future release. |
| // Allow users to restore the old behavior through this escape hatch. |
| if os.Getenv("DOCKER_KEEP_DEPRECATED_LEGACY_LINKS_ENV_VARS") == "1" { |
| linkEnvVars := links.EnvVars( |
| netipstringer.Addr(bridgeSettings.IPAddress.Unmap()), |
| netipstringer.Addr(childBridgeSettings.IPAddress.Unmap()), |
| linkAlias, |
| child.Config.Env, |
| child.Config.ExposedPorts, |
| ) |
| env = append(env, linkEnvVars...) |
| } |
| } |
| |
| return env, nil |
| } |
| |
| func (daemon *Daemon) addLegacyLinks( |
| ctx context.Context, |
| cfg *config.Config, |
| ctr *container.Container, |
| epConfig *network.EndpointSettings, |
| sb *libnetwork.Sandbox, |
| ) error { |
| ctx, span := otel.Tracer("").Start(ctx, "daemon.addLegacyLinks") |
| defer span.End() |
| |
| if epConfig.EndpointID == "" { |
| return nil |
| } |
| |
| children := daemon.linkIndex.children(ctr) |
| var parents map[string]*container.Container |
| if !cfg.DisableBridge && ctr.HostConfig.NetworkMode.IsPrivate() { |
| parents = daemon.linkIndex.parents(ctr) |
| } |
| if len(children) == 0 && len(parents) == 0 { |
| return nil |
| } |
| for _, child := range children { |
| if _, ok := child.NetworkSettings.Networks[network.DefaultNetwork]; !ok { |
| return fmt.Errorf("Cannot link to %s, as it does not belong to the default network", child.Name) |
| } |
| } |
| |
| var ( |
| childEndpoints []string |
| cEndpointID string |
| ) |
| for linkAlias, child := range children { |
| _, alias := path.Split(linkAlias) |
| // allow access to the linked container via the alias, real name, and container hostname |
| aliasList := alias + " " + child.Config.Hostname |
| // only add the name if alias isn't equal to the name |
| if alias != child.Name[1:] { |
| aliasList = aliasList + " " + child.Name[1:] |
| } |
| defaultNW := child.NetworkSettings.Networks[network.DefaultNetwork] |
| if defaultNW.IPAddress.IsValid() { |
| if err := sb.AddHostsEntry(ctx, aliasList, defaultNW.IPAddress.Unmap()); err != nil { |
| return errors.Wrapf(err, "failed to add address to /etc/hosts for link to %s", child.Name) |
| } |
| } |
| if defaultNW.GlobalIPv6Address.IsValid() { |
| if err := sb.AddHostsEntry(ctx, aliasList, defaultNW.GlobalIPv6Address); err != nil { |
| return errors.Wrapf(err, "failed to add IPv6 address to /etc/hosts for link to %s", child.Name) |
| } |
| } |
| cEndpointID = defaultNW.EndpointID |
| if cEndpointID != "" { |
| childEndpoints = append(childEndpoints, cEndpointID) |
| } |
| } |
| |
| var parentEndpoints []string |
| for alias, parent := range parents { |
| _, alias = path.Split(alias) |
| // Update ctr's IP address in /etc/hosts files in containers with legacy-links to ctr. |
| log.G(context.TODO()).Debugf("Update /etc/hosts of %s for alias %s with ip %s", parent.ID, alias, epConfig.IPAddress) |
| if psb, _ := daemon.netController.GetSandbox(parent.ID); psb != nil { |
| if err := psb.UpdateHostsEntry(alias, epConfig.IPAddress); err != nil { |
| return errors.Wrapf(err, "failed to update /etc/hosts of %s for alias %s with IP %s", |
| parent.ID, alias, epConfig.IPAddress) |
| } |
| if epConfig.GlobalIPv6Address.IsValid() { |
| if err := psb.UpdateHostsEntry(alias, epConfig.GlobalIPv6Address); err != nil { |
| return errors.Wrapf(err, "failed to update /etc/hosts of %s for alias %s with IP %s", |
| parent.ID, alias, epConfig.GlobalIPv6Address) |
| } |
| } |
| } |
| if cEndpointID != "" { |
| parentEndpoints = append(parentEndpoints, cEndpointID) |
| } |
| } |
| |
| sb.UpdateLabels(bridge.LegacyContainerLinkOptions(parentEndpoints, childEndpoints)) |
| |
| return nil |
| } |
| |
| func (daemon *Daemon) getIPCContainer(id string) (*container.Container, error) { |
| // Check if the container exists, is running, and not restarting |
| ctr, err := daemon.GetContainer(id) |
| if err != nil { |
| return nil, errdefs.InvalidParameter(err) |
| } |
| if !ctr.State.IsRunning() { |
| return nil, errNotRunning(id) |
| } |
| if ctr.State.IsRestarting() { |
| return nil, errContainerIsRestarting(id) |
| } |
| |
| // Check the container ipc is shareable |
| if st, err := os.Stat(ctr.ShmPath); err != nil || !st.IsDir() { |
| if err == nil || os.IsNotExist(err) { |
| return nil, errdefs.InvalidParameter(errors.New("container " + id + ": non-shareable IPC (hint: use IpcMode:shareable for the donor container)")) |
| } |
| // stat() failed? |
| return nil, errdefs.System(errors.Wrap(err, "container "+id)) |
| } |
| |
| return ctr, nil |
| } |
| |
| func (daemon *Daemon) getPIDContainer(id string) (*container.Container, error) { |
| ctr, err := daemon.GetContainer(id) |
| if err != nil { |
| return nil, errdefs.InvalidParameter(err) |
| } |
| if !ctr.State.IsRunning() { |
| return nil, errNotRunning(id) |
| } |
| if ctr.State.IsRestarting() { |
| return nil, errContainerIsRestarting(id) |
| } |
| |
| return ctr, nil |
| } |
| |
| // setupContainerDirs sets up base container directories (root, ipc, tmpfs and secrets). |
| func (daemon *Daemon) setupContainerDirs(ctr *container.Container) (_ []container.Mount, err error) { |
| if err := daemon.setupContainerMountsRoot(ctr); err != nil { |
| return nil, err |
| } |
| |
| if err := daemon.setupIPCDirs(ctr); err != nil { |
| return nil, err |
| } |
| |
| if err := daemon.setupSecretDir(ctr); err != nil { |
| return nil, err |
| } |
| defer func() { |
| if err != nil { |
| daemon.cleanupSecretDir(ctr) |
| } |
| }() |
| |
| var ms []container.Mount |
| if !ctr.HostConfig.IpcMode.IsPrivate() && !ctr.HostConfig.IpcMode.IsEmpty() { |
| ms = append(ms, ctr.IpcMounts()...) |
| } |
| |
| tmpfsMounts, err := ctr.TmpfsMounts() |
| if err != nil { |
| return nil, err |
| } |
| ms = append(ms, tmpfsMounts...) |
| |
| secretMounts, err := ctr.SecretMounts() |
| if err != nil { |
| return nil, err |
| } |
| ms = append(ms, secretMounts...) |
| |
| return ms, nil |
| } |
| |
| func (daemon *Daemon) setupIPCDirs(ctr *container.Container) error { |
| ipcMode := ctr.HostConfig.IpcMode |
| |
| switch { |
| case ipcMode.IsContainer(): |
| ic, err := daemon.getIPCContainer(ipcMode.Container()) |
| if err != nil { |
| return errors.Wrapf(err, "failed to join IPC namespace") |
| } |
| ctr.ShmPath = ic.ShmPath |
| |
| case ipcMode.IsHost(): |
| if _, err := os.Stat("/dev/shm"); err != nil { |
| return errors.New("/dev/shm is not mounted, but must be for --ipc=host") |
| } |
| ctr.ShmPath = "/dev/shm" |
| |
| case ipcMode.IsPrivate(), ipcMode.IsNone(): |
| // c.ShmPath will/should not be used, so make it empty. |
| // Container's /dev/shm mount comes from OCI spec. |
| ctr.ShmPath = "" |
| |
| case ipcMode.IsEmpty(): |
| // A container was created by an older version of the daemon. |
| // The default behavior used to be what is now called "shareable". |
| fallthrough |
| |
| case ipcMode.IsShareable(): |
| uid, gid := daemon.idMapping.RootPair() |
| if !ctr.HasMountFor("/dev/shm") { |
| shmPath, err := ctr.ShmResourcePath() |
| if err != nil { |
| return err |
| } |
| |
| if err := user.MkdirAllAndChown(shmPath, 0o700, uid, gid); err != nil { |
| return err |
| } |
| |
| shmproperty := "mode=1777,size=" + strconv.FormatInt(ctr.HostConfig.ShmSize, 10) |
| if err := unix.Mount("shm", shmPath, "tmpfs", uintptr(unix.MS_NOEXEC|unix.MS_NOSUID|unix.MS_NODEV), label.FormatMountLabel(shmproperty, ctr.GetMountLabel())); err != nil { |
| return fmt.Errorf("mounting shm tmpfs: %s", err) |
| } |
| if err := os.Chown(shmPath, uid, gid); err != nil { |
| return err |
| } |
| ctr.ShmPath = shmPath |
| } |
| |
| default: |
| return fmt.Errorf("invalid IPC mode: %v", ipcMode) |
| } |
| |
| return nil |
| } |
| |
| func (daemon *Daemon) setupSecretDir(ctr *container.Container) (setupErr error) { |
| if len(ctr.SecretReferences) == 0 && len(ctr.ConfigReferences) == 0 { |
| return nil |
| } |
| |
| if err := daemon.createSecretsDir(ctr); err != nil { |
| return err |
| } |
| defer func() { |
| if setupErr != nil { |
| daemon.cleanupSecretDir(ctr) |
| } |
| }() |
| |
| if ctr.DependencyStore == nil { |
| return errors.New("secret store is not initialized") |
| } |
| |
| // retrieve possible remapped range start for root UID, GID |
| ruid, rgid := daemon.idMapping.RootPair() |
| |
| for _, s := range ctr.SecretReferences { |
| // TODO (ehazlett): use type switch when more are supported |
| if s.File == nil { |
| log.G(context.TODO()).Error("secret target type is not a file target") |
| continue |
| } |
| |
| // secrets are created in the SecretMountPath on the host, at a |
| // single level |
| fPath, err := ctr.SecretFilePath(*s) |
| if err != nil { |
| return errors.Wrap(err, "error getting secret file path") |
| } |
| if err := user.MkdirAllAndChown(filepath.Dir(fPath), 0o700, ruid, rgid); err != nil { |
| return errors.Wrap(err, "error creating secret mount path") |
| } |
| |
| log.G(context.TODO()).WithFields(log.Fields{ |
| "name": s.File.Name, |
| "path": fPath, |
| }).Debug("injecting secret") |
| secret, err := ctr.DependencyStore.Secrets().Get(s.SecretID) |
| if err != nil { |
| return errors.Wrap(err, "unable to get secret from secret store") |
| } |
| if err := os.WriteFile(fPath, secret.Spec.Data, s.File.Mode); err != nil { |
| return errors.Wrap(err, "error injecting secret") |
| } |
| |
| uid, err := strconv.Atoi(s.File.UID) |
| if err != nil { |
| return err |
| } |
| gid, err := strconv.Atoi(s.File.GID) |
| if err != nil { |
| return err |
| } |
| |
| if err := os.Chown(fPath, ruid+uid, rgid+gid); err != nil { |
| return errors.Wrap(err, "error setting ownership for secret") |
| } |
| if err := os.Chmod(fPath, s.File.Mode); err != nil { |
| return errors.Wrap(err, "error setting file mode for secret") |
| } |
| } |
| |
| for _, configRef := range ctr.ConfigReferences { |
| // TODO (ehazlett): use type switch when more are supported |
| if configRef.File == nil { |
| // Runtime configs are not mounted into the container, but they're |
| // a valid type of config so we should not error when we encounter |
| // one. |
| if configRef.Runtime == nil { |
| log.G(context.TODO()).Error("config target type is not a file or runtime target") |
| } |
| // However, in any case, this isn't a file config, so we have no |
| // further work to do |
| continue |
| } |
| |
| fPath, err := ctr.ConfigFilePath(*configRef) |
| if err != nil { |
| return errors.Wrap(err, "error getting config file path for container") |
| } |
| if err := user.MkdirAllAndChown(filepath.Dir(fPath), 0o700, ruid, rgid); err != nil { |
| return errors.Wrap(err, "error creating config mount path") |
| } |
| |
| log.G(context.TODO()).WithFields(log.Fields{ |
| "name": configRef.File.Name, |
| "path": fPath, |
| }).Debug("injecting config") |
| config, err := ctr.DependencyStore.Configs().Get(configRef.ConfigID) |
| if err != nil { |
| return errors.Wrap(err, "unable to get config from config store") |
| } |
| if err := os.WriteFile(fPath, config.Spec.Data, configRef.File.Mode); err != nil { |
| return errors.Wrap(err, "error injecting config") |
| } |
| |
| uid, err := strconv.Atoi(configRef.File.UID) |
| if err != nil { |
| return err |
| } |
| gid, err := strconv.Atoi(configRef.File.GID) |
| if err != nil { |
| return err |
| } |
| |
| if err := os.Chown(fPath, ruid+uid, rgid+gid); err != nil { |
| return errors.Wrap(err, "error setting ownership for config") |
| } |
| if err := os.Chmod(fPath, configRef.File.Mode); err != nil { |
| return errors.Wrap(err, "error setting file mode for config") |
| } |
| } |
| |
| return daemon.remountSecretDir(ctr) |
| } |
| |
| // createSecretsDir is used to create a dir suitable for storing container secrets. |
| // In practice this is using a tmpfs mount and is used for both "configs" and "secrets" |
| func (daemon *Daemon) createSecretsDir(ctr *container.Container) error { |
| // retrieve possible remapped range start for root UID, GID |
| uid, gid := daemon.idMapping.RootPair() |
| dir, err := ctr.SecretMountPath() |
| if err != nil { |
| return errors.Wrap(err, "error getting container secrets dir") |
| } |
| |
| // create tmpfs |
| if err := user.MkdirAllAndChown(dir, 0o700, uid, gid); err != nil { |
| return errors.Wrap(err, "error creating secret local mount path") |
| } |
| |
| tmpfsOwnership := fmt.Sprintf("uid=%d,gid=%d", uid, gid) |
| if err := mount.Mount("tmpfs", dir, "tmpfs", "nodev,nosuid,noexec,"+tmpfsOwnership); err != nil { |
| return errors.Wrap(err, "unable to setup secret mount") |
| } |
| return nil |
| } |
| |
| func (daemon *Daemon) remountSecretDir(ctr *container.Container) error { |
| dir, err := ctr.SecretMountPath() |
| if err != nil { |
| return errors.Wrap(err, "error getting container secrets path") |
| } |
| if err := label.Relabel(dir, ctr.MountLabel, false); err != nil { |
| log.G(context.TODO()).WithError(err).WithField("dir", dir).Warn("Error while attempting to set selinux label") |
| } |
| uid, gid := daemon.idMapping.RootPair() |
| tmpfsOwnership := fmt.Sprintf("uid=%d,gid=%d", uid, gid) |
| |
| // remount secrets ro |
| if err := mount.Mount("tmpfs", dir, "tmpfs", "remount,ro,"+tmpfsOwnership); err != nil { |
| return errors.Wrap(err, "unable to remount dir as readonly") |
| } |
| |
| return nil |
| } |
| |
| func (daemon *Daemon) cleanupSecretDir(ctr *container.Container) { |
| dir, err := ctr.SecretMountPath() |
| if err != nil { |
| log.G(context.TODO()).WithError(err).WithField("container", ctr.ID).Warn("error getting secrets mount path for container") |
| } |
| if err := mount.RecursiveUnmount(dir); err != nil { |
| log.G(context.TODO()).WithField("dir", dir).WithError(err).Warn("Error while attempting to unmount dir, this may prevent removal of container.") |
| } |
| if err := os.RemoveAll(dir); err != nil { |
| log.G(context.TODO()).WithField("dir", dir).WithError(err).Error("Error removing dir.") |
| } |
| } |
| |
| func killProcessDirectly(ctr *container.Container) error { |
| pid := ctr.State.GetPID() |
| if pid == 0 { |
| // Ensure that we don't kill ourselves |
| return nil |
| } |
| |
| if err := unix.Kill(pid, syscall.SIGKILL); err != nil { |
| if !errors.Is(err, unix.ESRCH) { |
| return errdefs.System(err) |
| } |
| err = errNoSuchProcess{pid, syscall.SIGKILL} |
| log.G(context.TODO()).WithFields(log.Fields{ |
| "error": err, |
| "container": ctr.ID, |
| "pid": pid, |
| }).Debug("no such process") |
| return err |
| } |
| |
| // In case there were some exceptions(e.g., state of zombie and D) |
| if process.Alive(pid) { |
| // Since we can not kill a zombie pid, add zombie check here |
| isZombie, err := process.Zombie(pid) |
| if err != nil { |
| log.G(context.TODO()).WithFields(log.Fields{ |
| "error": err, |
| "container": ctr.ID, |
| "pid": pid, |
| }).Warn("Container state is invalid") |
| return err |
| } |
| if isZombie { |
| return errdefs.System(errors.Errorf("container %s PID %d is zombie and can not be killed. Use the --init option when creating containers to run an init inside the container that forwards signals and reaps processes", stringid.TruncateID(ctr.ID), pid)) |
| } |
| } |
| return nil |
| } |
| |
// enableIPOnPredefinedNetwork always reports false in this
// (linux || freebsd) build of the daemon.
//
// TODO(aker): remove when we make the default bridge network behave like any other network
func enableIPOnPredefinedNetwork() bool {
	const enabled = false
	return enabled
}
| |
// serviceDiscoveryOnDefaultNetwork reports whether service discovery is
// supported on the default network; in this (linux || freebsd) build it is
// always false.
//
// TODO(aker): remove when we make the default bridge network behave like any other network
func serviceDiscoveryOnDefaultNetwork() bool {
	const supported = false
	return supported
}
| |
| func buildSandboxPlatformOptions(ctr *container.Container, cfg *config.Config) ([]libnetwork.SandboxOption, error) { |
| var ( |
| sboxOptions []libnetwork.SandboxOption |
| originResolvConfPath string |
| ) |
| |
| // Set the correct paths for /etc/hosts and /etc/resolv.conf, based on the |
| // networking-mode of the container. Note that containers with "container" |
| // networking are already handled in "initializeNetworking()" before we reach |
| // this function, so do not have to be accounted for here. |
| switch { |
| case ctr.HostConfig.NetworkMode.IsHost(): |
| // In host-mode networking, the container does not have its own networking |
| // namespace, so both `/etc/hosts` and `/etc/resolv.conf` should be the same |
| // as on the host itself. The container gets a copy of these files. |
| sboxOptions = append(sboxOptions, libnetwork.OptionOriginHostsPath("/etc/hosts")) |
| originResolvConfPath = "/etc/resolv.conf" |
| case ctr.HostConfig.NetworkMode.IsUserDefined(): |
| // The container uses a user-defined network. We use the embedded DNS |
| // server for container name resolution and to act as a DNS forwarder |
| // for external DNS resolution. |
| // We parse the DNS server(s) that are defined in /etc/resolv.conf on |
| // the host, which may be a local DNS server (for example, if DNSMasq or |
| // systemd-resolvd are in use). The embedded DNS server forwards DNS |
| // resolution to the DNS server configured on the host, which in itself |
| // may act as a forwarder for external DNS servers. |
| // If systemd-resolvd is used, the "upstream" DNS servers can be found in |
| // /run/systemd/resolve/resolv.conf. We do not query those DNS servers |
| // directly, as they can be dynamically reconfigured. |
| originResolvConfPath = "/etc/resolv.conf" |
| default: |
| // For other situations, such as the default bridge network, container |
| // discovery / name resolution is handled through /etc/hosts, and no |
| // embedded DNS server is available. Without the embedded DNS, we |
| // cannot use local DNS servers on the host (for example, if DNSMasq or |
| // systemd-resolvd is used). If systemd-resolvd is used, we try to |
| // determine the external DNS servers that are used on the host. |
| // This situation is not ideal, because DNS servers configured in the |
| // container are not updated after the container is created, but the |
| // DNS servers on the host can be dynamically updated. |
| // |
| // Copy the host's resolv.conf for the container (/run/systemd/resolve/resolv.conf or /etc/resolv.conf) |
| originResolvConfPath = cfg.GetResolvConf() |
| } |
| |
| // Allow tests to point at their own resolv.conf file. Note that |
| // this only overrides the resolvConf path, not "/etc/hosts", which |
| // for containers using the "host" network namespace is set above. |
| if envPath := os.Getenv("DOCKER_TEST_RESOLV_CONF_PATH"); envPath != "" { |
| log.G(context.TODO()).Infof("Using OriginResolvConfPath from env: %s", envPath) |
| originResolvConfPath = envPath |
| } |
| sboxOptions = append(sboxOptions, libnetwork.OptionOriginResolvConfPath(originResolvConfPath)) |
| |
| hostsPath, err := ctr.GetRootResourcePath("hosts") |
| if err != nil { |
| return nil, err |
| } |
| resolvConfPath, err := ctr.GetRootResourcePath("resolv.conf") |
| if err != nil { |
| return nil, err |
| } |
| |
| ctr.HostsPath, ctr.ResolvConfPath = hostsPath, resolvConfPath |
| sboxOptions = append(sboxOptions, |
| libnetwork.OptionHostsPath(hostsPath), |
| libnetwork.OptionResolvConfPath(resolvConfPath), |
| ) |
| |
| return sboxOptions, nil |
| } |
| |
| func (daemon *Daemon) initializeNetworkingPaths(ctr *container.Container, nc *container.Container) error { |
| ctr.HostnamePath = nc.HostnamePath |
| ctr.HostsPath = nc.HostsPath |
| ctr.ResolvConfPath = nc.ResolvConfPath |
| return nil |
| } |
| |
| func (daemon *Daemon) setupContainerMountsRoot(ctr *container.Container) error { |
| // get the root mount path so we can make it unbindable |
| p, err := ctr.MountsResourcePath("") |
| if err != nil { |
| return err |
| } |
| _, gid := daemon.IdentityMapping().RootPair() |
| return user.MkdirAllAndChown(p, 0o710, os.Getuid(), gid) |
| } |