Skip to content

Commit

Permalink
Fixing problem with multiple VM reboots
Browse files Browse the repository at this point in the history
Try to differentiate power_state vm power_action
Surprise - vm_params can send RESET to stopped VM, it does not fail
(no 500 error), but VM does not get booted (it was not running before).

Signed-off-by: Justin Cinkelj <[email protected]>
  • Loading branch information
justinc1 committed Feb 23, 2024
1 parent f0daa50 commit 1777a75
Show file tree
Hide file tree
Showing 6 changed files with 566 additions and 259 deletions.
123 changes: 86 additions & 37 deletions plugins/module_utils/vm.py
Original file line number Diff line number Diff line change
Expand Up @@ -52,9 +52,18 @@
stop="STOP",
reboot="REBOOT",
reset="RESET",
started="START",
started="START", # TODO remove?
)

FROM_ANSIBLE_POWER_ACTION_TO_ANSIBLE_POWER_STATE = dict(
start="started",
# both "stop" and "shutdown" result in "stopped" state
shutdown="stopped",
stop="stopped",
reboot="started",
reset="started",
started="started", # TODO remove?
)

VM_PAYLOAD_KEYS = [
"blockDevs",
Expand Down Expand Up @@ -83,7 +92,9 @@
"NVRAM",
]


# List VM params that require VM reboot,
# either because VM then can be changed only if VM is shutdown,
# or because change is applied only after shutdown.
REBOOT_LOOKUP = dict(
vm_name=False,
description=False,
Expand Down Expand Up @@ -208,6 +219,7 @@ def __init__(
tags=None, # tags are stored internally as list of strings
description=None,
power_state=None,
power_action=None,
nics=None, # nics represents a list of type Nic
disks=None, # disks represents a list of type Nic
# boot_devices are stored as list of nics and/or disks internally.
Expand All @@ -228,7 +240,6 @@ def __init__(
self.tags = tags
self.description = description
self.mem = memory
self.power_state = power_state
self.numVCPU = vcpu
self.nics = nics or []
self.disks = disks or []
Expand All @@ -240,8 +251,28 @@ def __init__(
self.machine_type = machine_type
self.replication_source_vm_uuid = replication_source_vm_uuid

if power_state not in FROM_HYPERCORE_TO_ANSIBLE_POWER_STATE.values():
if power_state not in list(FROM_HYPERCORE_TO_ANSIBLE_POWER_STATE.values()) + [None]:
raise AssertionError(f"Unknown VM power_state={power_state}")
if power_action not in list(FROM_ANSIBLE_TO_HYPERCORE_POWER_ACTION.keys()) + [None]:
raise AssertionError(f"Unknown VM power_action={power_action}")
# VM.from_hypercore() will get only power_state
# VM.from_ansible() will get only power_action
if power_state and power_action:
# is bug, or is this useful?
raise AssertionError(f"Both power_state={power_state} and power_action={power_action} are set")
if power_state is None and power_action is None:
# is bug, or is this useful?
raise AssertionError(f"Neither power_state={power_state} nor power_action={power_action} is set")
self._power_state = power_state
self._power_action = power_action
if power_state and power_action is None:
# computer required action (if current state is known)
pass
if power_state is None and power_action:
# compute final power_state after action is applied
pass
#self._power_state = FROM_ANSIBLE_POWER_ACTION_TO_ANSIBLE_POWER_STATE[power_action]

self._initially_running = power_state == "started"
# .was_nice_shutdown_tried is True if nice ACPI shutdown was tried
self._was_nice_shutdown_tried = False
Expand All @@ -268,9 +299,8 @@ def from_ansible(cls, ansible_data):
vm_dict = ansible_data

# Unfortunately we were using in playbooks "start" instead of "started", etc.
power_state_value = vm_dict.get("power_state", None)
if power_state_value == "start":
power_state_value = "started"
# Ansible module param with name "power_state" is actually power_action.
power_action = vm_dict.get("power_state", None)

return cls(
uuid=vm_dict.get("uuid", None), # No uuid when creating object from ansible
Expand All @@ -286,7 +316,7 @@ def from_ansible(cls, ansible_data):
boot_devices=vm_dict.get("boot_devices", []),
attach_guest_tools_iso=vm_dict["attach_guest_tools_iso"] or False,
operating_system=vm_dict.get("operating_system"),
power_state=power_state_value,
power_action=power_action,
machine_type=vm_dict.get("machine_type", None),
)

Expand Down Expand Up @@ -536,9 +566,9 @@ def to_hypercore(self, hcversion: HyperCoreVersion):
if self.operating_system:
vm_dict["operatingSystem"] = self.operating_system
# state attribute is used by HC3 only during VM create.
if self.power_state:
if self._power_action:
vm_dict["state"] = FROM_ANSIBLE_TO_HYPERCORE_POWER_ACTION.get(
self.power_state, "unknown-power-state-sorry"
self._power_action, "unknown-power-state-sorry"
)

if self.machine_type and hcversion.verify("<9.3.0"):
Expand All @@ -554,7 +584,7 @@ def to_ansible(self):
vm_name=self.name,
description=self.description,
operating_system=self.operating_system,
power_state=self.power_state,
power_state=self._power_state,
memory=self.mem,
vcpu=self.numVCPU,
disks=[disk.to_ansible() for disk in self.disk_list],
Expand Down Expand Up @@ -713,7 +743,7 @@ def clone_vm(self, rest_client, ansible_dict):
timeout=None,
)

def __eq__(self, other):
def __eq__(self, other: "VM"):
"""One VM is equal to another if it has ALL attributes exactly the same"""
return all(
(
Expand All @@ -724,7 +754,8 @@ def __eq__(self, other):
self.tags == other.tags,
self.description == other.description,
self.mem == other.mem,
self.power_state == other.power_state,
self._power_state == other._power_state,
self._power_action == other._power_action,
self.numVCPU == other.numVCPU,
self.nics == other.nics,
self.disks == other.disks,
Expand Down Expand Up @@ -812,22 +843,22 @@ def get_vm_and_boot_devices(cls, ansible_dict, rest_client):
]
return vm, boot_devices_uuid, boot_devices_ansible

def update_vm_power_state(self, module, rest_client, desired_power_state):
def update_vm_power_state(self, module, rest_client, desired_power_action):
"""Sets the power state to what is stored in self.power_state"""
# desired_power_state must be present in FROM_ANSIBLE_TO_HYPERCORE_ACTION_STATE's keys
if not self.power_state:
if not self._power_state:
raise errors.ScaleComputingError("No information about VM's power state.")

# keep a record what was done
if desired_power_state == "start":
if desired_power_action == "start":
if self._was_start_tried:
raise AssertionError("VM _was_start_tried already set")
self._was_start_tried = True
if desired_power_state == "shutdown":
if desired_power_action == "shutdown":
if self._was_nice_shutdown_tried:
raise AssertionError("VM _was_nice_shutdown_tried already set")
self._was_nice_shutdown_tried = True
if desired_power_state == "stop":
if desired_power_action == "stop":
if self._was_force_shutdown_tried:
raise AssertionError("VM _was_force_shutdown_tried already set")
self._was_force_shutdown_tried = True
Expand All @@ -839,7 +870,7 @@ def update_vm_power_state(self, module, rest_client, desired_power_state):
dict(
virDomainUUID=self.uuid,
actionType=FROM_ANSIBLE_TO_HYPERCORE_POWER_ACTION[
desired_power_state
desired_power_action
],
cause="INTERNAL",
)
Expand Down Expand Up @@ -936,10 +967,21 @@ def wait_shutdown(self, module, rest_client):
return False

def vm_power_up(self, module, rest_client):
# Powers up a VM in case it was shutdown during module action.
# Do not power up VM that was initially stopped.
# Powers up a VM in case:
# - VM was shutdown during module execution or
# - started/running state was explicitly requested (by module param power_state).
# But: VM is not started if
# - VM was initially stopped and
# - module param power_state is omitted or contains "stop".
if self.was_vm_shutdown() and self._initially_running:
self.update_vm_power_state(module, rest_client, "start")
return
# Also start VM if module power_state requires a power on.
# Field _power_action is set only if VM instance was created with from_ansible();
# it is None if VM instance was created with from_hypercore().
requested_power_action = module.params.get("power_state")
if requested_power_action == "start":
self.update_vm_power_state(module, rest_client, "start")

def was_vm_shutdown(self) -> bool:
"""
Expand Down Expand Up @@ -1064,9 +1106,22 @@ def _to_be_changed(vm, module, param_subset: List[str]):
# is in FROM_ANSIBLE_TO_HYPERCORE_POWER_ACTION.keys(), whereas vm.power_state
# is in FROM_HYPERCORE_TO_ANSIBLE_POWER_STATE.values().
# state in playbook is different than read from HC3 (start/started)
# E.g. "start" in "started", "stop" in "stopped".
# TODO double check if text above is still true
is_substring = module.params["power_state"] not in vm.power_state
changed_params["power_state"] = is_substring
# is_substring = module.params["power_state"] not in vm._power_action
# changed_params["power_state"] = is_substring
# q(module.params["power_state"], vm._power_state, vm._power_action, changed_params["power_state"])

# vm._power_state describes actual state from HC3.
# module.params["power_state"] is ansible power_action, describing desired state.
requested_power_action = module.params["power_state"]
if requested_power_action in ["reset", "reboot"]:
# "reset" and "reboot" needs to be applied always.
changed_params["power_state"] = True
else:
desired_power_state = FROM_ANSIBLE_POWER_ACTION_TO_ANSIBLE_POWER_STATE[requested_power_action]
changed_params["power_state"] = desired_power_state != vm._power_state

if module.params.get("machine_type") is not None:
changed_params["machine_type"] = (
vm.machine_type != module.params["machine_type"]
Expand Down Expand Up @@ -1132,7 +1187,7 @@ def _build_after_diff(module, rest_client):
if module.params["vcpu"] is not None:
after["vcpu"] = vm.numVCPU
if module.params["power_state"]:
after["power_state"] = vm.power_state
after["power_state"] = vm._power_state
if module.params["snapshot_schedule"] is not None:
after["snapshot_schedule"] = vm.snapshot_schedule
return after
Expand All @@ -1153,7 +1208,7 @@ def _build_before_diff(vm, module):
if module.params["vcpu"]:
before["vcpu"] = vm.numVCPU
if module.params["power_state"]:
before["power_state"] = vm.power_state
before["power_state"] = vm._power_state
if module.params["snapshot_schedule"] is not None:
before["snapshot_schedule"] = vm.snapshot_schedule
return before
Expand All @@ -1172,17 +1227,8 @@ def set_vm_params(cls, module, rest_client, vm, param_subset: List[str]):
TaskTag.wait_task(rest_client, task_tag)
if ManageVMParams._needs_reboot(
module, changed_parameters
) and vm.power_state not in ["stop", "stopped", "shutdown"]:
) and vm._power_action not in ["stop", "stopped", "shutdown"]:
vm.do_shutdown_steps(module, rest_client)
else:
# boot/reboot/reset VM if requested
# power_state needs different endpoint
# Wait_task in update_vm_power_state doesn't handle check_mode
# TODO likely this is to early for VM module
if module.params["power_state"] and not module.check_mode:
vm.update_vm_power_state(
module, rest_client, module.params["power_state"]
)
return (
True,
dict(
Expand Down Expand Up @@ -1218,11 +1264,14 @@ def _check_if_required_disks_are_present(
f"machine_type={module.params['machine_type']} not included in set_vm_params."
)
# At end of module execution we will have VM with final_disks.
final_disks = vm.disks
if module.params["disks"]:
if "disks" in module.params:
# vm module, "disks" param was passed
final_disks = [
Disk.from_ansible(disk) for disk in module.params["disks"]
]
else:
# vm_params has no disks, we need to check the actual VM disks
final_disks = vm.disks
nvram_disks = [disk for disk in final_disks if disk.type == "nvram"]
vtpm_disks = [disk for disk in final_disks if disk.type == "vtpm"]
fail_message_requirements = []
Expand Down
3 changes: 2 additions & 1 deletion plugins/modules/vm.py
Original file line number Diff line number Diff line change
Expand Up @@ -523,7 +523,8 @@ def ensure_absent(module, rest_client):
reboot = False
vm = VM.get_by_name(module.params, rest_client)
if vm:
if vm.power_state != "shutdown": # First, shut it off and then delete
if vm._power_state != "shutdown": # First, shut it off and then delete
# TODO ==shutdown or ==stopped ??
vm.update_vm_power_state(module, rest_client, "stop")
task_tag = rest_client.delete_record(
"{0}/{1}".format("/rest/v1/VirDomain", vm.uuid), module.check_mode
Expand Down
Loading

0 comments on commit 1777a75

Please sign in to comment.