You cannot select more than 25 topics Topics must start with a letter or number, can include dashes ('-') and can be up to 35 characters long.
ansible/test/lib/ansible_test/_internal/host_profiles.py

1422 lines
63 KiB
Python

"""Profiles to represent individual test hosts or a user-provided inventory file."""
from __future__ import annotations
import abc
import dataclasses
import os
import shlex
import tempfile
import time
import typing as t
from .io import (
read_text_file,
write_text_file,
)
from .config import (
CommonConfig,
EnvironmentConfig,
IntegrationConfig,
TerminateMode,
)
from .host_configs import (
ControllerConfig,
ControllerHostConfig,
DockerConfig,
HostConfig,
NetworkInventoryConfig,
NetworkRemoteConfig,
OriginConfig,
PosixConfig,
PosixRemoteConfig,
PosixSshConfig,
PythonConfig,
RemoteConfig,
VirtualPythonConfig,
WindowsInventoryConfig,
WindowsRemoteConfig,
)
from .core_ci import (
AnsibleCoreCI,
SshKey,
VmResource,
)
from .util import (
ApplicationError,
SubprocessError,
cache,
display,
get_type_map,
sanitize_host_name,
sorted_versions,
InternalError,
HostConnectionError,
ANSIBLE_TEST_TARGET_ROOT,
)
from .util_common import (
get_docs_url,
intercept_python,
)
from .docker_util import (
docker_exec,
docker_image_inspect,
docker_logs,
docker_pull,
docker_rm,
get_docker_hostname,
require_docker,
get_docker_info,
detect_host_properties,
run_utility_container,
SystemdControlGroupV1Status,
LOGINUID_NOT_SET,
UTILITY_IMAGE,
)
from .bootstrap import (
BootstrapDocker,
BootstrapRemote,
)
from .venv import (
get_virtual_python,
)
from .ssh import (
SshConnectionDetail,
)
from .ansible_util import (
ansible_environment,
get_hosts,
parse_inventory,
)
from .containers import (
CleanupMode,
HostType,
get_container_database,
run_support_container,
)
from .connections import (
Connection,
DockerConnection,
LocalConnection,
SshConnection,
)
from .become import (
Become,
SUPPORTED_BECOME_METHODS,
Sudo,
)
from .completion import (
AuditMode,
CGroupVersion,
)
from .dev.container_probe import (
CGroupMount,
CGroupPath,
CGroupState,
MountType,
check_container_cgroup_status,
)
TControllerHostConfig = t.TypeVar('TControllerHostConfig', bound=ControllerHostConfig)
THostConfig = t.TypeVar('THostConfig', bound=HostConfig)
TPosixConfig = t.TypeVar('TPosixConfig', bound=PosixConfig)
TRemoteConfig = t.TypeVar('TRemoteConfig', bound=RemoteConfig)
class ControlGroupError(ApplicationError):
"""Raised when the container host does not have the necessary cgroup support to run a container."""
def __init__(self, args: CommonConfig, reason: str) -> None:
engine = require_docker().command
dd_wsl2 = get_docker_info(args).docker_desktop_wsl2
message = f'''
{reason}
Run the following commands as root on the container host to resolve this issue:
mkdir /sys/fs/cgroup/systemd
mount cgroup -t cgroup /sys/fs/cgroup/systemd -o none,name=systemd,xattr
chown -R {{user}}:{{group}} /sys/fs/cgroup/systemd # only when rootless
NOTE: These changes must be applied each time the container host is rebooted.
'''.strip()
podman_message = '''
If rootless Podman is already running [1], you may need to stop it before
containers are able to use the new mount point.
[1] Check for 'podman' and 'catatonit' processes.
'''
dd_wsl_message = f'''
When using Docker Desktop with WSL2, additional configuration [1] is required.
[1] {get_docs_url("https://docs.ansible.com/ansible-core/devel/dev_guide/testing_running_locally.html#docker-desktop-with-wsl2")}
'''
if engine == 'podman':
message += podman_message
elif dd_wsl2:
message += dd_wsl_message
message = message.strip()
super().__init__(message)
@dataclasses.dataclass(frozen=True)
class Inventory:
"""Simple representation of an Ansible inventory."""
host_groups: dict[str, dict[str, dict[str, t.Union[str, int]]]]
extra_groups: t.Optional[dict[str, list[str]]] = None
@staticmethod
def create_single_host(name: str, variables: dict[str, t.Union[str, int]]) -> Inventory:
"""Return an inventory instance created from the given hostname and variables."""
return Inventory(host_groups=dict(all={name: variables}))
def write(self, args: CommonConfig, path: str) -> None:
"""Write the given inventory to the specified path on disk."""
# NOTE: Switching the inventory generation to write JSON would be nice, but is currently not possible due to the use of hard-coded inventory filenames.
# The name `inventory` works for the POSIX integration tests, but `inventory.winrm` and `inventory.networking` will only parse in INI format.
# If tests are updated to use the `INVENTORY_PATH` environment variable, then this could be changed.
# Also, some tests detect the test type by inspecting the suffix on the inventory filename, which would break if it were changed.
inventory_text = ''
for group, hosts in self.host_groups.items():
inventory_text += f'[{group}]\n'
for host, variables in hosts.items():
kvp = ' '.join(f'{key}="{value}"' for key, value in variables.items())
inventory_text += f'{host} {kvp}\n'
inventory_text += '\n'
for group, children in (self.extra_groups or {}).items():
inventory_text += f'[{group}]\n'
for child in children:
inventory_text += f'{child}\n'
inventory_text += '\n'
inventory_text = inventory_text.strip()
if not args.explain:
write_text_file(path, inventory_text + '\n')
display.info(f'>>> Inventory\n{inventory_text}', verbosity=3)
class HostProfile(t.Generic[THostConfig], metaclass=abc.ABCMeta):
"""Base class for host profiles."""
def __init__(self,
*,
args: EnvironmentConfig,
config: THostConfig,
targets: t.Optional[list[HostConfig]],
) -> None:
self.args = args
self.config = config
self.controller = bool(targets)
self.targets = targets or []
self.state: dict[str, t.Any] = {}
"""State that must be persisted across delegation."""
self.cache: dict[str, t.Any] = {}
"""Cache that must not be persisted across delegation."""
def provision(self) -> None:
"""Provision the host before delegation."""
def setup(self) -> None:
"""Perform out-of-band setup before delegation."""
def on_target_failure(self) -> None:
"""Executed during failure handling if this profile is a target."""
def deprovision(self) -> None:
"""Deprovision the host after delegation has completed."""
def wait(self) -> None:
"""Wait for the instance to be ready. Executed before delegation for the controller and after delegation for targets."""
def configure(self) -> None:
"""Perform in-band configuration. Executed before delegation for the controller and after delegation for targets."""
def __getstate__(self):
return {key: value for key, value in self.__dict__.items() if key not in ('args', 'cache')}
def __setstate__(self, state):
self.__dict__.update(state)
# args will be populated after the instances are restored
self.cache = {}
class PosixProfile(HostProfile[TPosixConfig], metaclass=abc.ABCMeta):
"""Base class for POSIX host profiles."""
@property
def python(self) -> PythonConfig:
"""
The Python to use for this profile.
If it is a virtual python, it will be created the first time it is requested.
"""
python = self.state.get('python')
if not python:
python = self.config.python
if isinstance(python, VirtualPythonConfig):
python = get_virtual_python(self.args, python)
self.state['python'] = python
return python
class ControllerHostProfile(PosixProfile[TControllerHostConfig], metaclass=abc.ABCMeta):
"""Base class for profiles usable as a controller."""
@abc.abstractmethod
def get_origin_controller_connection(self) -> Connection:
"""Return a connection for accessing the host as a controller from the origin."""
@abc.abstractmethod
def get_working_directory(self) -> str:
"""Return the working directory for the host."""
class SshTargetHostProfile(HostProfile[THostConfig], metaclass=abc.ABCMeta):
"""Base class for profiles offering SSH connectivity."""
@abc.abstractmethod
def get_controller_target_connections(self) -> list[SshConnection]:
"""Return SSH connection(s) for accessing the host as a target from the controller."""
class RemoteProfile(SshTargetHostProfile[TRemoteConfig], metaclass=abc.ABCMeta):
"""Base class for remote instance profiles."""
@property
def core_ci_state(self) -> t.Optional[dict[str, str]]:
"""The saved Ansible Core CI state."""
return self.state.get('core_ci')
@core_ci_state.setter
def core_ci_state(self, value: dict[str, str]) -> None:
"""The saved Ansible Core CI state."""
self.state['core_ci'] = value
def provision(self) -> None:
"""Provision the host before delegation."""
self.core_ci = self.create_core_ci(load=True)
self.core_ci.start()
self.core_ci_state = self.core_ci.save()
def deprovision(self) -> None:
"""Deprovision the host after delegation has completed."""
if self.args.remote_terminate == TerminateMode.ALWAYS or (self.args.remote_terminate == TerminateMode.SUCCESS and self.args.success):
self.delete_instance()
@property
def core_ci(self) -> t.Optional[AnsibleCoreCI]:
"""Return the cached AnsibleCoreCI instance, if any, otherwise None."""
return self.cache.get('core_ci')
@core_ci.setter
def core_ci(self, value: AnsibleCoreCI) -> None:
"""Cache the given AnsibleCoreCI instance."""
self.cache['core_ci'] = value
def get_instance(self) -> t.Optional[AnsibleCoreCI]:
"""Return the current AnsibleCoreCI instance, loading it if not already loaded."""
if not self.core_ci and self.core_ci_state:
self.core_ci = self.create_core_ci(load=False)
self.core_ci.load(self.core_ci_state)
return self.core_ci
def delete_instance(self) -> None:
"""Delete the AnsibleCoreCI VM instance."""
core_ci = self.get_instance()
if not core_ci:
return # instance has not been provisioned
core_ci.stop()
def wait_for_instance(self) -> AnsibleCoreCI:
"""Wait for an AnsibleCoreCI VM instance to become ready."""
core_ci = self.get_instance()
core_ci.wait()
return core_ci
def create_core_ci(self, load: bool) -> AnsibleCoreCI:
"""Create and return an AnsibleCoreCI instance."""
if not self.config.arch:
raise InternalError(f'No arch specified for config: {self.config}')
return AnsibleCoreCI(
args=self.args,
resource=VmResource(
platform=self.config.platform,
version=self.config.version,
architecture=self.config.arch,
provider=self.config.provider,
tag='controller' if self.controller else 'target',
),
load=load,
)
class ControllerProfile(SshTargetHostProfile[ControllerConfig], PosixProfile[ControllerConfig]):
"""Host profile for the controller as a target."""
def get_controller_target_connections(self) -> list[SshConnection]:
"""Return SSH connection(s) for accessing the host as a target from the controller."""
settings = SshConnectionDetail(
name='localhost',
host='localhost',
port=None,
user='root',
identity_file=SshKey(self.args).key,
python_interpreter=self.args.controller_python.path,
)
return [SshConnection(self.args, settings)]
class DockerProfile(ControllerHostProfile[DockerConfig], SshTargetHostProfile[DockerConfig]):
"""Host profile for a docker instance."""
MARKER = 'ansible-test-marker'
@dataclasses.dataclass(frozen=True)
class InitConfig:
"""Configuration details required to run the container init."""
options: list[str]
command: str
command_privileged: bool
expected_mounts: tuple[CGroupMount, ...]
@property
def container_name(self) -> t.Optional[str]:
"""Return the stored container name, if any, otherwise None."""
return self.state.get('container_name')
@container_name.setter
def container_name(self, value: str) -> None:
"""Store the given container name."""
self.state['container_name'] = value
@property
def cgroup_path(self) -> t.Optional[str]:
"""Return the path to the cgroup v1 systemd hierarchy, if any, otherwise None."""
return self.state.get('cgroup_path')
@cgroup_path.setter
def cgroup_path(self, value: str) -> None:
"""Store the path to the cgroup v1 systemd hierarchy."""
self.state['cgroup_path'] = value
@property
def label(self) -> str:
"""Label to apply to resources related to this profile."""
return f'{"controller" if self.controller else "target"}-{self.args.session_name}'
def provision(self) -> None:
"""Provision the host before delegation."""
init_probe = self.args.dev_probe_cgroups is not None
init_config = self.get_init_config()
container = run_support_container(
args=self.args,
context='__test_hosts__',
image=self.config.image,
name=f'ansible-test-{self.label}',
ports=[22],
publish_ports=not self.controller, # connections to the controller over SSH are not required
options=init_config.options,
cleanup=CleanupMode.NO,
cmd=self.build_init_command(init_config, init_probe),
)
if not container:
if self.args.prime_containers:
if init_config.command_privileged or init_probe:
docker_pull(self.args, UTILITY_IMAGE)
return
self.container_name = container.name
try:
options = ['--pid', 'host', '--privileged']
if init_config.command and init_config.command_privileged:
init_command = init_config.command
if not init_probe:
init_command += f' && {shlex.join(self.wake_command)}'
cmd = ['nsenter', '-t', str(container.details.container.pid), '-m', '-p', 'sh', '-c', init_command]
run_utility_container(self.args, f'ansible-test-init-{self.label}', cmd, options)
if init_probe:
check_container_cgroup_status(self.args, self.config, self.container_name, init_config.expected_mounts)
cmd = ['nsenter', '-t', str(container.details.container.pid), '-m', '-p'] + self.wake_command
run_utility_container(self.args, f'ansible-test-wake-{self.label}', cmd, options)
except SubprocessError:
display.info(f'Checking container "{self.container_name}" logs...')
docker_logs(self.args, self.container_name)
raise
def get_init_config(self) -> InitConfig:
"""Return init config for running under the current container engine."""
self.check_cgroup_requirements()
engine = require_docker().command
init_config = getattr(self, f'get_{engine}_init_config')()
return init_config
def get_podman_init_config(self) -> InitConfig:
"""Return init config for running under Podman."""
options = self.get_common_run_options()
command: t.Optional[str] = None
command_privileged = False
expected_mounts: tuple[CGroupMount, ...]
cgroup_version = get_docker_info(self.args).cgroup_version
# Without AUDIT_WRITE the following errors may appear in the system logs of a container after attempting to log in using SSH:
#
# fatal: linux_audit_write_entry failed: Operation not permitted
#
# This occurs when running containers as root when the container host provides audit support, but the user lacks the AUDIT_WRITE capability.
# The AUDIT_WRITE capability is provided by docker by default, but not podman.
# See: https://github.com/moby/moby/pull/7179
#
# OpenSSH Portable requires AUDIT_WRITE when logging in with a TTY if the Linux audit feature was compiled in.
# Containers with the feature enabled will require the AUDIT_WRITE capability when EPERM is returned while accessing the audit system.
# See: https://github.com/openssh/openssh-portable/blob/2dc328023f60212cd29504fc05d849133ae47355/audit-linux.c#L90
# See: https://github.com/openssh/openssh-portable/blob/715c892f0a5295b391ae92c26ef4d6a86ea96e8e/loginrec.c#L476-L478
#
# Some containers will be running a patched version of OpenSSH which blocks logins when EPERM is received while using the audit system.
# These containers will require the AUDIT_WRITE capability when EPERM is returned while accessing the audit system.
# See: https://src.fedoraproject.org/rpms/openssh/blob/f36/f/openssh-7.6p1-audit.patch
#
# Since only some containers carry the patch or enable the Linux audit feature in OpenSSH, this capability is enabled on a per-container basis.
# No warning is provided when adding this capability, since there's not really anything the user can do about it.
if self.config.audit == AuditMode.REQUIRED and detect_host_properties(self.args).audit_code == 'EPERM':
options.extend(('--cap-add', 'AUDIT_WRITE'))
# Without AUDIT_CONTROL the following errors may appear in the system logs of a container after attempting to log in using SSH:
#
# pam_loginuid(sshd:session): Error writing /proc/self/loginuid: Operation not permitted
# pam_loginuid(sshd:session): set_loginuid failed
#
# Containers configured to use the pam_loginuid module will encounter this error. If the module is required, logins will fail.
# Since most containers will have this configuration, the code to handle this issue is applied to all containers.
#
# This occurs when the loginuid is set on the container host and doesn't match the user on the container host which is running the container.
# Container hosts which do not use systemd are likely to leave the loginuid unset and thus be unaffected.
# The most common source of a mismatch is the use of sudo to run ansible-test, which changes the uid but cannot change the loginuid.
# This condition typically occurs only under podman, since the loginuid is inherited from the current user.
# See: https://github.com/containers/podman/issues/13012#issuecomment-1034049725
#
# This condition is detected by querying the loginuid of a container running on the container host.
# When it occurs, a warning is displayed and the AUDIT_CONTROL capability is added to containers to work around the issue.
# The warning serves as notice to the user that their usage of ansible-test is responsible for the additional capability requirement.
if (loginuid := detect_host_properties(self.args).loginuid) not in (0, LOGINUID_NOT_SET, None):
display.warning(f'Running containers with capability AUDIT_CONTROL since the container loginuid ({loginuid}) is incorrect. '
'This is most likely due to use of sudo to run ansible-test when loginuid is already set.', unique=True)
options.extend(('--cap-add', 'AUDIT_CONTROL'))
if self.config.cgroup == CGroupVersion.NONE:
# Containers which do not require cgroup do not use systemd.
options.extend((
# Disabling systemd support in Podman will allow these containers to work on hosts without systemd.
# Without this, running a container on a host without systemd results in errors such as (from crun):
# Error: crun: error stat'ing file `/sys/fs/cgroup/systemd`: No such file or directory:
# A similar error occurs when using runc:
# OCI runtime attempted to invoke a command that was not found
'--systemd', 'false',
# A private cgroup namespace limits what is visible in /proc/*/cgroup.
'--cgroupns', 'private',
# Mounting a tmpfs overrides the cgroup mount(s) that would otherwise be provided by Podman.
# This helps provide a consistent container environment across various container host configurations.
'--tmpfs', '/sys/fs/cgroup',
))
expected_mounts = (
CGroupMount(path=CGroupPath.ROOT, type=MountType.TMPFS, writable=True, state=None),
)
elif self.config.cgroup in (CGroupVersion.V1_V2, CGroupVersion.V1_ONLY) and cgroup_version == 1:
# Podman hosts providing cgroup v1 will automatically bind mount the systemd hierarchy read-write in the container.
# They will also create a dedicated cgroup v1 systemd hierarchy for the container.
# On hosts with systemd this path is: /sys/fs/cgroup/systemd/libpod_parent/libpod-{container_id}/
# On hosts without systemd this path is: /sys/fs/cgroup/systemd/{container_id}/
options.extend((
# Force Podman to enable systemd support since a command may be used later (to support pre-init diagnostics).
'--systemd', 'always',
# The host namespace must be used to permit the container to access the cgroup v1 systemd hierarchy created by Podman.
'--cgroupns', 'host',
# Mask the host cgroup tmpfs mount to avoid exposing the host cgroup v1 hierarchies (or cgroup v2 hybrid) to the container.
# Podman will provide a cgroup v1 systemd hiearchy on top of this.
'--tmpfs', '/sys/fs/cgroup',
))
self.check_systemd_cgroup_v1(options) # podman
expected_mounts = (
CGroupMount(path=CGroupPath.ROOT, type=MountType.TMPFS, writable=True, state=None),
# The mount point can be writable or not.
# The reason for the variation is not known.
CGroupMount(path=CGroupPath.SYSTEMD, type=MountType.CGROUP_V1, writable=None, state=CGroupState.HOST),
# The filesystem type can be tmpfs or devtmpfs.
# The reason for the variation is not known.
CGroupMount(path=CGroupPath.SYSTEMD_RELEASE_AGENT, type=None, writable=False, state=None),
)
elif self.config.cgroup in (CGroupVersion.V1_V2, CGroupVersion.V2_ONLY) and cgroup_version == 2:
# Podman hosts providing cgroup v2 will give each container a read-write cgroup mount.
options.extend((
# Force Podman to enable systemd support since a command may be used later (to support pre-init diagnostics).
'--systemd', 'always',
# A private cgroup namespace is used to avoid exposing the host cgroup to the container.
'--cgroupns', 'private',
))
expected_mounts = (
CGroupMount(path=CGroupPath.ROOT, type=MountType.CGROUP_V2, writable=True, state=CGroupState.PRIVATE),
)
elif self.config.cgroup == CGroupVersion.V1_ONLY and cgroup_version == 2:
# Containers which require cgroup v1 need explicit volume mounts on container hosts not providing that version.
# We must put the container PID 1 into the cgroup v1 systemd hierarchy we create.
cgroup_path = self.create_systemd_cgroup_v1() # podman
command = f'echo 1 > {cgroup_path}/cgroup.procs'
options.extend((
# Force Podman to enable systemd support since a command is being provided.
'--systemd', 'always',
# A private cgroup namespace is required. Using the host cgroup namespace results in errors such as the following (from crun):
# Error: OCI runtime error: mount `/sys/fs/cgroup` to '/sys/fs/cgroup': Invalid argument
# A similar error occurs when using runc:
# Error: OCI runtime error: runc create failed: unable to start container process: error during container init:
# error mounting "/sys/fs/cgroup" to rootfs at "/sys/fs/cgroup": mount /sys/fs/cgroup:/sys/fs/cgroup (via /proc/self/fd/7), flags: 0x1000:
# invalid argument
'--cgroupns', 'private',
# Unlike Docker, Podman ignores a /sys/fs/cgroup tmpfs mount, instead exposing a cgroup v2 mount.
# The exposed volume will be read-write, but the container will have its own private namespace.
# Provide a read-only cgroup v1 systemd hierarchy under which the dedicated ansible-test cgroup will be mounted read-write.
# Without this systemd will fail while attempting to mount the cgroup v1 systemd hierarchy.
# Podman doesn't support using a tmpfs for this. Attempting to do so results in an error (from crun):
# Error: OCI runtime error: read: Invalid argument
# A similar error occurs when using runc:
# Error: OCI runtime error: runc create failed: unable to start container process: error during container init:
# error mounting "tmpfs" to rootfs at "/sys/fs/cgroup/systemd": tmpcopyup: failed to copy /sys/fs/cgroup/systemd to /proc/self/fd/7
# (/tmp/runctop3876247619/runctmpdir1460907418): read /proc/self/fd/7/cgroup.kill: invalid argument
'--volume', '/sys/fs/cgroup/systemd:/sys/fs/cgroup/systemd:ro',
# Provide the container access to the cgroup v1 systemd hierarchy created by ansible-test.
'--volume', f'{cgroup_path}:{cgroup_path}:rw',
))
expected_mounts = (
CGroupMount(path=CGroupPath.ROOT, type=MountType.CGROUP_V2, writable=True, state=CGroupState.PRIVATE),
CGroupMount(path=CGroupPath.SYSTEMD, type=MountType.CGROUP_V1, writable=False, state=CGroupState.SHADOWED),
CGroupMount(path=cgroup_path, type=MountType.CGROUP_V1, writable=True, state=CGroupState.HOST),
)
else:
raise InternalError(f'Unhandled cgroup configuration: {self.config.cgroup} on cgroup v{cgroup_version}.')
return self.InitConfig(
options=options,
command=command,
command_privileged=command_privileged,
expected_mounts=expected_mounts,
)
def get_docker_init_config(self) -> InitConfig:
"""Return init config for running under Docker."""
options = self.get_common_run_options()
command: t.Optional[str] = None
command_privileged = False
expected_mounts: tuple[CGroupMount, ...]
cgroup_version = get_docker_info(self.args).cgroup_version
if self.config.cgroup == CGroupVersion.NONE:
# Containers which do not require cgroup do not use systemd.
if get_docker_info(self.args).cgroupns_option_supported:
# Use the `--cgroupns` option if it is supported.
# Older servers which do not support the option use the host group namespace.
# Older clients which do not support the option cause newer servers to use the host cgroup namespace (cgroup v1 only).
# See: https://github.com/moby/moby/blob/master/api/server/router/container/container_routes.go#L512-L517
# If the host cgroup namespace is used, cgroup information will be visible, but the cgroup mounts will be unavailable due to the tmpfs below.
options.extend((
# A private cgroup namespace limits what is visible in /proc/*/cgroup.
'--cgroupns', 'private',
))
options.extend((
# Mounting a tmpfs overrides the cgroup mount(s) that would otherwise be provided by Docker.
# This helps provide a consistent container environment across various container host configurations.
'--tmpfs', '/sys/fs/cgroup',
))
expected_mounts = (
CGroupMount(path=CGroupPath.ROOT, type=MountType.TMPFS, writable=True, state=None),
)
elif self.config.cgroup in (CGroupVersion.V1_V2, CGroupVersion.V1_ONLY) and cgroup_version == 1:
# Docker hosts providing cgroup v1 will automatically bind mount the systemd hierarchy read-only in the container.
# They will also create a dedicated cgroup v1 systemd hierarchy for the container.
# The cgroup v1 system hierarchy path is: /sys/fs/cgroup/systemd/{container_id}/
if get_docker_info(self.args).cgroupns_option_supported:
# Use the `--cgroupns` option if it is supported.
# Older servers which do not support the option use the host group namespace.
# Older clients which do not support the option cause newer servers to use the host cgroup namespace (cgroup v1 only).
# See: https://github.com/moby/moby/blob/master/api/server/router/container/container_routes.go#L512-L517
options.extend((
# The host cgroup namespace must be used.
# Otherwise, /proc/1/cgroup will report "/" for the cgroup path, which is incorrect.
# See: https://github.com/systemd/systemd/issues/19245#issuecomment-815954506
# It is set here to avoid relying on the current Docker configuration.
'--cgroupns', 'host',
))
options.extend((
# Mask the host cgroup tmpfs mount to avoid exposing the host cgroup v1 hierarchies (or cgroup v2 hybrid) to the container.
'--tmpfs', '/sys/fs/cgroup',
# A cgroup v1 systemd hierarchy needs to be mounted read-write over the read-only one provided by Docker.
# Alternatives were tested, but were unusable due to various issues:
# - Attempting to remount the existing mount point read-write will result in a "mount point is busy" error.
# - Adding the entire "/sys/fs/cgroup" mount will expose hierarchies other than systemd.
# If the host is a cgroup v2 hybrid host it would also expose the /sys/fs/cgroup/unified/ hierarchy read-write.
# On older systems, such as an Ubuntu 18.04 host, a dedicated v2 cgroup would not be used, exposing the host cgroups to the container.
'--volume', '/sys/fs/cgroup/systemd:/sys/fs/cgroup/systemd:rw',
))
self.check_systemd_cgroup_v1(options) # docker
expected_mounts = (
CGroupMount(path=CGroupPath.ROOT, type=MountType.TMPFS, writable=True, state=None),
CGroupMount(path=CGroupPath.SYSTEMD, type=MountType.CGROUP_V1, writable=True, state=CGroupState.HOST),
)
elif self.config.cgroup in (CGroupVersion.V1_V2, CGroupVersion.V2_ONLY) and cgroup_version == 2:
# Docker hosts providing cgroup v2 will give each container a read-only cgroup mount.
# It must be remounted read-write before systemd starts.
# This must be done in a privileged container, otherwise a "permission denied" error can occur.
command = 'mount -o remount,rw /sys/fs/cgroup/'
command_privileged = True
options.extend((
# A private cgroup namespace is used to avoid exposing the host cgroup to the container.
# This matches the behavior in Podman 1.7.0 and later, which select cgroupns 'host' mode for cgroup v1 and 'private' mode for cgroup v2.
# See: https://github.com/containers/podman/pull/4374
# See: https://github.com/containers/podman/blob/main/RELEASE_NOTES.md#170
'--cgroupns', 'private',
))
expected_mounts = (
CGroupMount(path=CGroupPath.ROOT, type=MountType.CGROUP_V2, writable=True, state=CGroupState.PRIVATE),
)
elif self.config.cgroup == CGroupVersion.V1_ONLY and cgroup_version == 2:
# Containers which require cgroup v1 need explicit volume mounts on container hosts not providing that version.
# We must put the container PID 1 into the cgroup v1 systemd hierarchy we create.
cgroup_path = self.create_systemd_cgroup_v1() # docker
command = f'echo 1 > {cgroup_path}/cgroup.procs'
options.extend((
# A private cgroup namespace is used since no access to the host cgroup namespace is required.
# This matches the configuration used for running cgroup v1 containers under Podman.
'--cgroupns', 'private',
# Provide a read-write tmpfs filesystem to support additional cgroup mount points.
# Without this Docker will provide a read-only cgroup2 mount instead.
'--tmpfs', '/sys/fs/cgroup',
# Provide a read-write tmpfs filesystem to simulate a systemd cgroup v1 hierarchy.
# Without this systemd will fail while attempting to mount the cgroup v1 systemd hierarchy.
'--tmpfs', '/sys/fs/cgroup/systemd',
# Provide the container access to the cgroup v1 systemd hierarchy created by ansible-test.
'--volume', f'{cgroup_path}:{cgroup_path}:rw',
))
expected_mounts = (
CGroupMount(path=CGroupPath.ROOT, type=MountType.TMPFS, writable=True, state=None),
CGroupMount(path=CGroupPath.SYSTEMD, type=MountType.TMPFS, writable=True, state=None),
CGroupMount(path=cgroup_path, type=MountType.CGROUP_V1, writable=True, state=CGroupState.HOST),
)
else:
raise InternalError(f'Unhandled cgroup configuration: {self.config.cgroup} on cgroup v{cgroup_version}.')
return self.InitConfig(
options=options,
command=command,
command_privileged=command_privileged,
expected_mounts=expected_mounts,
)
def build_init_command(self, init_config: InitConfig, sleep: bool) -> t.Optional[list[str]]:
"""
Build and return the command to start in the container.
Returns None if the default command for the container should be used.
The sleep duration below was selected to:
- Allow enough time to perform necessary operations in the container before waking it.
- Make the delay obvious if the wake command doesn't run or succeed.
- Avoid hanging indefinitely or for an unreasonably long time.
NOTE: The container must have a POSIX-compliant default shell "sh" with a non-builtin "sleep" command.
"""
command = ''
if init_config.command and not init_config.command_privileged:
command += f'{init_config.command} && '
if sleep or init_config.command_privileged:
command += 'sleep 60 ; '
if not command:
return None
docker_pull(self.args, self.config.image)
inspect = docker_image_inspect(self.args, self.config.image)
command += f'exec {shlex.join(inspect.cmd)}'
return ['sh', '-c', command]
@property
def wake_command(self) -> list[str]:
"""
The command used to wake the container from sleep.
This will be run inside our utility container, so the command used does not need to be present in the container being woken up.
"""
return ['pkill', 'sleep']
def check_systemd_cgroup_v1(self, options: list[str]) -> None:
"""Check the cgroup v1 systemd hierarchy to verify it is writeable for our container."""
probe_script = (read_text_file(os.path.join(ANSIBLE_TEST_TARGET_ROOT, 'setup', 'check_systemd_cgroup_v1.sh'))
.replace('@MARKER@', self.MARKER)
.replace('@LABEL@', self.label))
cmd = ['sh']
try:
run_utility_container(self.args, f'ansible-test-cgroup-check-{self.label}', cmd, options, data=probe_script)
except SubprocessError as ex:
if error := self.extract_error(ex.stderr):
raise ControlGroupError(self.args, 'Unable to create a v1 cgroup within the systemd hierarchy.\n'
f'Reason: {error}') from ex # cgroup probe failed
raise
def create_systemd_cgroup_v1(self) -> str:
"""Create a unique ansible-test cgroup in the v1 systemd hierarchy and return its path."""
self.cgroup_path = f'/sys/fs/cgroup/systemd/ansible-test-{self.label}'
# Privileged mode is required to create the cgroup directories on some hosts, such as Fedora 36 and RHEL 9.0.
# The mkdir command will fail with "Permission denied" otherwise.
options = ['--volume', '/sys/fs/cgroup/systemd:/sys/fs/cgroup/systemd:rw', '--privileged']
cmd = ['sh', '-c', f'>&2 echo {shlex.quote(self.MARKER)} && mkdir {shlex.quote(self.cgroup_path)}']
try:
run_utility_container(self.args, f'ansible-test-cgroup-create-{self.label}', cmd, options)
except SubprocessError as ex:
if error := self.extract_error(ex.stderr):
raise ControlGroupError(self.args, f'Unable to create a v1 cgroup within the systemd hierarchy.\n'
f'Reason: {error}') from ex # cgroup create permission denied
raise
return self.cgroup_path
@property
def delete_systemd_cgroup_v1_command(self) -> list[str]:
"""The command used to remove the previously created ansible-test cgroup in the v1 systemd hierarchy."""
return ['find', self.cgroup_path, '-type', 'd', '-delete']
def delete_systemd_cgroup_v1(self) -> None:
"""Delete a previously created ansible-test cgroup in the v1 systemd hierarchy."""
# Privileged mode is required to remove the cgroup directories on some hosts, such as Fedora 36 and RHEL 9.0.
# The BusyBox find utility will report "Permission denied" otherwise, although it still exits with a status code of 0.
options = ['--volume', '/sys/fs/cgroup/systemd:/sys/fs/cgroup/systemd:rw', '--privileged']
cmd = ['sh', '-c', f'>&2 echo {shlex.quote(self.MARKER)} && {shlex.join(self.delete_systemd_cgroup_v1_command)}']
try:
run_utility_container(self.args, f'ansible-test-cgroup-delete-{self.label}', cmd, options)
except SubprocessError as ex:
if error := self.extract_error(ex.stderr):
if error.endswith(': No such file or directory'):
return
display.error(str(ex))
def extract_error(self, value: str) -> t.Optional[str]:
"""
Extract the ansible-test portion of the error message from the given value and return it.
Returns None if no ansible-test marker was found.
"""
lines = value.strip().splitlines()
try:
idx = lines.index(self.MARKER)
except ValueError:
return None
lines = lines[idx + 1:]
message = '\n'.join(lines)
return message
def check_cgroup_requirements(self) -> None:
"""Check cgroup requirements for the container."""
cgroup_version = get_docker_info(self.args).cgroup_version
if cgroup_version not in (1, 2):
raise ApplicationError(f'The container host provides cgroup v{cgroup_version}, but only version v1 and v2 are supported.')
# Stop early for containers which require cgroup v2 when the container host does not provide it.
# None of the containers included with ansible-test currently use this configuration.
# Support for v2-only was added in preparation for the eventual removal of cgroup v1 support from systemd after EOY 2023.
# See: https://github.com/systemd/systemd/pull/24086
if self.config.cgroup == CGroupVersion.V2_ONLY and cgroup_version != 2:
raise ApplicationError(f'Container {self.config.name} requires cgroup v2 but the container host provides cgroup v{cgroup_version}.')
# Containers which use old versions of systemd (earlier than version 226) require cgroup v1 support.
# If the host is a cgroup v2 (unified) host, changes must be made to how the container is run.
#
# See: https://github.com/systemd/systemd/blob/main/NEWS
# Under the "CHANGES WITH 226" section:
# > systemd now optionally supports the new Linux kernel "unified" control group hierarchy.
#
# NOTE: The container host must have the cgroup v1 mount already present.
# If the container is run rootless, the user it runs under must have permissions to the mount.
#
# The following commands can be used to make the mount available:
#
# mkdir /sys/fs/cgroup/systemd
# mount cgroup -t cgroup /sys/fs/cgroup/systemd -o none,name=systemd,xattr
# chown -R {user}:{group} /sys/fs/cgroup/systemd # only when rootless
#
# See: https://github.com/containers/crun/blob/main/crun.1.md#runocisystemdforce_cgroup_v1path
if self.config.cgroup == CGroupVersion.V1_ONLY or (self.config.cgroup != CGroupVersion.NONE and get_docker_info(self.args).cgroup_version == 1):
if (cgroup_v1 := detect_host_properties(self.args).cgroup_v1) != SystemdControlGroupV1Status.VALID:
if self.config.cgroup == CGroupVersion.V1_ONLY:
if get_docker_info(self.args).cgroup_version == 2:
reason = f'Container {self.config.name} requires cgroup v1, but the container host only provides cgroup v2.'
else:
reason = f'Container {self.config.name} requires cgroup v1, but the container host does not appear to be running systemd.'
else:
reason = 'The container host provides cgroup v1, but does not appear to be running systemd.'
reason += f'\n{cgroup_v1.value}'
raise ControlGroupError(self.args, reason) # cgroup probe reported invalid state
def setup(self) -> None:
"""Perform out-of-band setup before delegation."""
bootstrapper = BootstrapDocker(
controller=self.controller,
python_versions=[self.python.version],
ssh_key=SshKey(self.args),
)
setup_sh = bootstrapper.get_script()
shell = setup_sh.splitlines()[0][2:]
try:
docker_exec(self.args, self.container_name, [shell], data=setup_sh, capture=False)
except SubprocessError:
display.info(f'Checking container "{self.container_name}" logs...')
docker_logs(self.args, self.container_name)
raise
def deprovision(self) -> None:
"""Deprovision the host after delegation has completed."""
container_exists = False
if self.container_name:
if self.args.docker_terminate == TerminateMode.ALWAYS or (self.args.docker_terminate == TerminateMode.SUCCESS and self.args.success):
docker_rm(self.args, self.container_name)
else:
container_exists = True
if self.cgroup_path:
if container_exists:
display.notice(f'Remember to run `{require_docker().command} rm -f {self.container_name}` when finished testing. '
f'Then run `{shlex.join(self.delete_systemd_cgroup_v1_command)}` on the container host.')
else:
self.delete_systemd_cgroup_v1()
elif container_exists:
display.notice(f'Remember to run `{require_docker().command} rm -f {self.container_name}` when finished testing.')
def wait(self) -> None:
"""Wait for the instance to be ready. Executed before delegation for the controller and after delegation for targets."""
if not self.controller:
con = self.get_controller_target_connections()[0]
last_error = ''
for dummy in range(1, 10):
try:
con.run(['id'], capture=True)
except SubprocessError as ex:
if 'Permission denied' in ex.message:
raise
last_error = str(ex)
time.sleep(1)
else:
return
display.info('Checking SSH debug output...')
display.info(last_error)
if not self.args.delegate and not self.args.host_path:
def callback() -> None:
"""Callback to run during error display."""
self.on_target_failure() # when the controller is not delegated, report failures immediately
else:
callback = None
raise HostConnectionError(f'Timeout waiting for {self.config.name} container {self.container_name}.', callback)
def get_controller_target_connections(self) -> list[SshConnection]:
"""Return SSH connection(s) for accessing the host as a target from the controller."""
containers = get_container_database(self.args)
access = containers.data[HostType.control]['__test_hosts__'][self.container_name]
host = access.host_ip
port = dict(access.port_map())[22]
settings = SshConnectionDetail(
name=self.config.name,
user='root',
host=host,
port=port,
identity_file=SshKey(self.args).key,
python_interpreter=self.python.path,
# CentOS 6 uses OpenSSH 5.3, making it incompatible with the default configuration of OpenSSH 8.8 and later clients.
# Since only CentOS 6 is affected, and it is only supported by ansible-core 2.12, support for RSA SHA-1 is simply hard-coded here.
# A substring is used to allow custom containers to work, not just the one provided with ansible-test.
enable_rsa_sha1='centos6' in self.config.image,
)
return [SshConnection(self.args, settings)]
def get_origin_controller_connection(self) -> DockerConnection:
"""Return a connection for accessing the host as a controller from the origin."""
return DockerConnection(self.args, self.container_name)
def get_working_directory(self) -> str:
"""Return the working directory for the host."""
return '/root'
def on_target_failure(self) -> None:
"""Executed during failure handling if this profile is a target."""
display.info(f'Checking container "{self.container_name}" logs...')
try:
docker_logs(self.args, self.container_name)
except SubprocessError as ex:
display.error(str(ex))
if self.config.cgroup != CGroupVersion.NONE:
# Containers with cgroup support are assumed to be running systemd.
display.info(f'Checking container "{self.container_name}" systemd logs...')
try:
docker_exec(self.args, self.container_name, ['journalctl'], capture=False)
except SubprocessError as ex:
display.error(str(ex))
display.error(f'Connection to container "{self.container_name}" failed. See logs and original error above.')
def get_common_run_options(self) -> list[str]:
"""Return a list of options needed to run the container."""
options = [
# These temporary mount points need to be created at run time when using Docker.
# They are automatically provided by Podman, but will be overridden by VOLUME instructions for the container, if they exist.
# If supporting containers with VOLUME instructions is not desired, these options could be limited to use with Docker.
# See: https://github.com/containers/podman/pull/1318
# Previously they were handled by the VOLUME instruction during container image creation.
# However, that approach creates anonymous volumes when running the container, which are then left behind after the container is deleted.
# These options eliminate the need for the VOLUME instruction, and override it if they are present.
# The mount options used are those typically found on Linux systems.
# Of special note is the "exec" option for "/tmp", which is required by ansible-test for path injection of executables using temporary directories.
'--tmpfs', '/tmp:exec',
'--tmpfs', '/run:exec',
'--tmpfs', '/run/lock', # some systemd containers require a separate tmpfs here, such as Ubuntu 20.04 and Ubuntu 22.04
]
if self.config.privileged:
options.append('--privileged')
if self.config.memory:
options.extend([
f'--memory={self.config.memory}',
f'--memory-swap={self.config.memory}',
])
if self.config.seccomp != 'default':
options.extend(['--security-opt', f'seccomp={self.config.seccomp}'])
docker_socket = '/var/run/docker.sock'
if get_docker_hostname() != 'localhost' or os.path.exists(docker_socket):
options.extend(['--volume', f'{docker_socket}:{docker_socket}'])
return options
class NetworkInventoryProfile(HostProfile[NetworkInventoryConfig]):
"""Host profile for a network inventory."""
class NetworkRemoteProfile(RemoteProfile[NetworkRemoteConfig]):
"""Host profile for a network remote instance."""
def wait(self) -> None:
"""Wait for the instance to be ready. Executed before delegation for the controller and after delegation for targets."""
self.wait_until_ready()
def get_inventory_variables(self) -> dict[str, t.Optional[t.Union[str, int]]]:
"""Return inventory variables for accessing this host."""
core_ci = self.wait_for_instance()
connection = core_ci.connection
variables: dict[str, t.Optional[t.Union[str, int]]] = dict(
ansible_connection=self.config.connection,
ansible_pipelining='yes',
ansible_host=connection.hostname,
ansible_port=connection.port,
ansible_user=connection.username,
ansible_ssh_private_key_file=core_ci.ssh_key.key,
# VyOS 1.1.8 uses OpenSSH 5.5, making it incompatible with RSA SHA-256/512 used by Paramiko 2.9 and later.
# IOS CSR 1000V uses an ancient SSH server, making it incompatible with RSA SHA-256/512 used by Paramiko 2.9 and later.
# That means all network platforms currently offered by ansible-core-ci require support for RSA SHA-1, so it is simply hard-coded here.
# NOTE: This option only exists in ansible-core 2.14 and later. For older ansible-core versions, use of Paramiko 2.8.x or earlier is required.
# See: https://github.com/ansible/ansible/pull/78789
# See: https://github.com/ansible/ansible/pull/78842
ansible_paramiko_use_rsa_sha2_algorithms='no',
ansible_network_os=f'{self.config.collection}.{self.config.platform}' if self.config.collection else self.config.platform,
)
return variables
def wait_until_ready(self) -> None:
"""Wait for the host to respond to an Ansible module request."""
core_ci = self.wait_for_instance()
if not isinstance(self.args, IntegrationConfig):
return # skip extended checks unless we're running integration tests
inventory = Inventory.create_single_host(sanitize_host_name(self.config.name), self.get_inventory_variables())
env = ansible_environment(self.args)
module_name = f'{self.config.collection + "." if self.config.collection else ""}{self.config.platform}_command'
with tempfile.NamedTemporaryFile() as inventory_file:
inventory.write(self.args, inventory_file.name)
cmd = ['ansible', '-m', module_name, '-a', 'commands=?', '-i', inventory_file.name, 'all']
for dummy in range(1, 90):
try:
intercept_python(self.args, self.args.controller_python, cmd, env, capture=True)
except SubprocessError as ex:
display.warning(str(ex))
time.sleep(10)
else:
return
raise HostConnectionError(f'Timeout waiting for {self.config.name} instance {core_ci.instance_id}.')
def get_controller_target_connections(self) -> list[SshConnection]:
"""Return SSH connection(s) for accessing the host as a target from the controller."""
core_ci = self.wait_for_instance()
settings = SshConnectionDetail(
name=core_ci.name,
host=core_ci.connection.hostname,
port=core_ci.connection.port,
user=core_ci.connection.username,
identity_file=core_ci.ssh_key.key,
# VyOS 1.1.8 uses OpenSSH 5.5, making it incompatible with the default configuration of OpenSSH 8.8 and later clients.
# IOS CSR 1000V uses an ancient SSH server, making it incompatible with the default configuration of OpenSSH 8.8 and later clients.
# That means all network platforms currently offered by ansible-core-ci require support for RSA SHA-1, so it is simply hard-coded here.
enable_rsa_sha1=True,
)
return [SshConnection(self.args, settings)]
class OriginProfile(ControllerHostProfile[OriginConfig]):
"""Host profile for origin."""
def get_origin_controller_connection(self) -> LocalConnection:
"""Return a connection for accessing the host as a controller from the origin."""
return LocalConnection(self.args)
def get_working_directory(self) -> str:
"""Return the working directory for the host."""
return os.getcwd()
class PosixRemoteProfile(ControllerHostProfile[PosixRemoteConfig], RemoteProfile[PosixRemoteConfig]):
"""Host profile for a POSIX remote instance."""
def wait(self) -> None:
"""Wait for the instance to be ready. Executed before delegation for the controller and after delegation for targets."""
self.wait_until_ready()
def configure(self) -> None:
"""Perform in-band configuration. Executed before delegation for the controller and after delegation for targets."""
# a target uses a single python version, but a controller may include additional versions for targets running on the controller
python_versions = [self.python.version] + [target.python.version for target in self.targets if isinstance(target, ControllerConfig)]
python_versions = sorted_versions(list(set(python_versions)))
core_ci = self.wait_for_instance()
pwd = self.wait_until_ready()
display.info(f'Remote working directory: {pwd}', verbosity=1)
bootstrapper = BootstrapRemote(
controller=self.controller,
platform=self.config.platform,
platform_version=self.config.version,
python_versions=python_versions,
ssh_key=core_ci.ssh_key,
)
setup_sh = bootstrapper.get_script()
shell = setup_sh.splitlines()[0][2:]
ssh = self.get_origin_controller_connection()
ssh.run([shell], data=setup_sh, capture=False)
def get_ssh_connection(self) -> SshConnection:
"""Return an SSH connection for accessing the host."""
core_ci = self.wait_for_instance()
settings = SshConnectionDetail(
name=core_ci.name,
user=core_ci.connection.username,
host=core_ci.connection.hostname,
port=core_ci.connection.port,
identity_file=core_ci.ssh_key.key,
python_interpreter=self.python.path,
)
if settings.user == 'root':
become: t.Optional[Become] = None
elif self.config.become:
become = SUPPORTED_BECOME_METHODS[self.config.become]()
else:
display.warning(f'Defaulting to "sudo" for platform "{self.config.platform}" become support.', unique=True)
become = Sudo()
return SshConnection(self.args, settings, become)
def wait_until_ready(self) -> str:
"""Wait for instance to respond to SSH, returning the current working directory once connected."""
core_ci = self.wait_for_instance()
for dummy in range(1, 90):
try:
return self.get_working_directory()
except SubprocessError as ex:
# No "Permission denied" check is performed here.
# Unlike containers, with remote instances, user configuration isn't guaranteed to have been completed before SSH connections are attempted.
display.warning(str(ex))
time.sleep(10)
raise HostConnectionError(f'Timeout waiting for {self.config.name} instance {core_ci.instance_id}.')
def get_controller_target_connections(self) -> list[SshConnection]:
"""Return SSH connection(s) for accessing the host as a target from the controller."""
return [self.get_ssh_connection()]
def get_origin_controller_connection(self) -> SshConnection:
"""Return a connection for accessing the host as a controller from the origin."""
return self.get_ssh_connection()
def get_working_directory(self) -> str:
"""Return the working directory for the host."""
if not self.pwd:
ssh = self.get_origin_controller_connection()
stdout = ssh.run(['pwd'], capture=True)[0]
if self.args.explain:
return '/pwd'
pwd = stdout.strip().splitlines()[-1]
if not pwd.startswith('/'):
raise Exception(f'Unexpected current working directory "{pwd}" from "pwd" command output:\n{stdout.strip()}')
self.pwd = pwd
return self.pwd
@property
def pwd(self) -> t.Optional[str]:
"""Return the cached pwd, if any, otherwise None."""
return self.cache.get('pwd')
@pwd.setter
def pwd(self, value: str) -> None:
"""Cache the given pwd."""
self.cache['pwd'] = value
class PosixSshProfile(SshTargetHostProfile[PosixSshConfig], PosixProfile[PosixSshConfig]):
"""Host profile for a POSIX SSH instance."""
def get_controller_target_connections(self) -> list[SshConnection]:
"""Return SSH connection(s) for accessing the host as a target from the controller."""
settings = SshConnectionDetail(
name='target',
user=self.config.user,
host=self.config.host,
port=self.config.port,
identity_file=SshKey(self.args).key,
python_interpreter=self.python.path,
)
return [SshConnection(self.args, settings)]
class WindowsInventoryProfile(SshTargetHostProfile[WindowsInventoryConfig]):
"""Host profile for a Windows inventory."""
def get_controller_target_connections(self) -> list[SshConnection]:
"""Return SSH connection(s) for accessing the host as a target from the controller."""
inventory = parse_inventory(self.args, self.config.path)
hosts = get_hosts(inventory, 'windows')
identity_file = SshKey(self.args).key
settings = [SshConnectionDetail(
name=name,
host=config['ansible_host'],
port=22,
user=config['ansible_user'],
identity_file=identity_file,
shell_type='powershell',
) for name, config in hosts.items()]
if settings:
details = '\n'.join(f'{ssh.name} {ssh.user}@{ssh.host}:{ssh.port}' for ssh in settings)
display.info(f'Generated SSH connection details from inventory:\n{details}', verbosity=1)
return [SshConnection(self.args, setting) for setting in settings]
class WindowsRemoteProfile(RemoteProfile[WindowsRemoteConfig]):
"""Host profile for a Windows remote instance."""
def wait(self) -> None:
"""Wait for the instance to be ready. Executed before delegation for the controller and after delegation for targets."""
self.wait_until_ready()
def get_inventory_variables(self) -> dict[str, t.Optional[t.Union[str, int]]]:
"""Return inventory variables for accessing this host."""
core_ci = self.wait_for_instance()
connection = core_ci.connection
variables: dict[str, t.Optional[t.Union[str, int]]] = dict(
ansible_connection='winrm',
ansible_pipelining='yes',
ansible_winrm_server_cert_validation='ignore',
ansible_host=connection.hostname,
ansible_port=connection.port,
ansible_user=connection.username,
ansible_password=connection.password,
ansible_ssh_private_key_file=core_ci.ssh_key.key,
)
# HACK: force 2016 to use NTLM + HTTP message encryption
if self.config.version == '2016':
variables.update(
ansible_winrm_transport='ntlm',
ansible_winrm_scheme='http',
ansible_port='5985',
)
return variables
def wait_until_ready(self) -> None:
"""Wait for the host to respond to an Ansible module request."""
core_ci = self.wait_for_instance()
if not isinstance(self.args, IntegrationConfig):
return # skip extended checks unless we're running integration tests
inventory = Inventory.create_single_host(sanitize_host_name(self.config.name), self.get_inventory_variables())
env = ansible_environment(self.args)
module_name = 'ansible.windows.win_ping'
with tempfile.NamedTemporaryFile() as inventory_file:
inventory.write(self.args, inventory_file.name)
cmd = ['ansible', '-m', module_name, '-i', inventory_file.name, 'all']
for dummy in range(1, 120):
try:
intercept_python(self.args, self.args.controller_python, cmd, env, capture=True)
except SubprocessError as ex:
display.warning(str(ex))
time.sleep(10)
else:
return
raise HostConnectionError(f'Timeout waiting for {self.config.name} instance {core_ci.instance_id}.')
def get_controller_target_connections(self) -> list[SshConnection]:
"""Return SSH connection(s) for accessing the host as a target from the controller."""
core_ci = self.wait_for_instance()
settings = SshConnectionDetail(
name=core_ci.name,
host=core_ci.connection.hostname,
port=22,
user=core_ci.connection.username,
identity_file=core_ci.ssh_key.key,
shell_type='powershell',
)
return [SshConnection(self.args, settings)]
@cache
def get_config_profile_type_map() -> dict[t.Type[HostConfig], t.Type[HostProfile]]:
"""Create and return a mapping of HostConfig types to HostProfile types."""
return get_type_map(HostProfile, HostConfig)
def create_host_profile(
args: EnvironmentConfig,
config: HostConfig,
controller: bool,
) -> HostProfile:
"""Create and return a host profile from the given host configuration."""
profile_type = get_config_profile_type_map()[type(config)]
profile = profile_type(args=args, config=config, targets=args.targets if controller else None)
return profile