1# Copyright 2016 The Chromium OS Authors. All rights reserved. 2# Use of this source code is governed by a BSD-style license that can be 3# found in the LICENSE file. 4 5""" 6Repair actions and verifiers relating to CrOS firmware. 7 8This contains the repair actions and verifiers need to find problems 9with the firmware installed on Chrome OS DUTs, and when necessary, to 10fix problems by updating or re-installing the firmware. 11 12The operations in the module support two distinct use cases: 13 * DUTs used for FAFT tests can in some cases have problems with 14 corrupted firmware. The module supplies `FirmwareStatusVerifier` 15 to check for corruption, and supplies `FirmwareRepair` to re-install 16 firmware via servo when needed. 17 * DUTs used for general testing normally should be running a 18 designated "stable" firmware version. This module supplies 19 `FirmwareVersionVerifier` to detect and automatically update 20 firmware that is out-of-date from the designated version. 21 22For purposes of the operations in the module, we distinguish three kinds 23of DUT, based on pool assignments: 24 * DUTs used for general testing. These DUTs automatically check for 25 and install the stable firmware using `FirmwareVersionVerifier`. 26 * DUTs in pools used for FAFT testing. These check for bad firmware 27 builds with `FirmwareStatusVerifier`, and will fix problems using 28 `FirmwareRepair`. These DUTs don't check for or install the 29 stable firmware. 30 * DUTs not in general pools, and not used for FAFT. These DUTs 31 are expected to be managed by separate processes and are excluded 32 from all of the verification and repair code in this module. 33""" 34 35# pylint: disable=missing-docstring 36 37import logging 38import re 39 40import common 41from autotest_lib.client.common_lib import global_config 42from autotest_lib.client.common_lib import hosts 43from autotest_lib.server import afe_utils 44from autotest_lib.server.hosts import repair_utils 45 46 47# _FIRMWARE_REPAIR_POOLS - The set of pools that should be 48# managed by `FirmwareStatusVerifier` and `FirmwareRepair`. 49# 50_FIRMWARE_REPAIR_POOLS = set( 51 global_config.global_config.get_config_value( 52 'CROS', 53 'pools_support_firmware_repair', 54 type=str).split(',')) 55 56 57def _is_firmware_repair_supported(host): 58 """ 59 Check if a host supports firmware repair. 60 61 When this function returns true, the DUT should be managed by 62 `FirmwareStatusVerifier` and `FirmwareRepair`, but not 63 `FirmwareVersionVerifier`. In general, this applies to DUTs 64 used for firmware testing. 65 66 @return A true value if the host should use `FirmwareStatusVerifier` 67 and `FirmwareRepair`; a false value otherwise. 68 """ 69 info = host.host_info_store.get() 70 return bool(info.pools & _FIRMWARE_REPAIR_POOLS) 71 72 73def _is_firmware_update_supported(host): 74 """ 75 Return whether a DUT should be running the standard firmware. 76 77 In the test lab, DUTs used for general testing, (e.g. the `bvt` 78 pool) need their firmware kept up-to-date with 79 `FirmwareVersionVerifier`. However, some pools have alternative 80 policies for firmware management. This returns whether a given DUT 81 should be updated via the standard stable version update, or 82 managed by some other procedure. 83 84 @param host The host to be checked for update policy. 85 @return A true value if the host should use 86 `FirmwareVersionVerifier`; a false value otherwise. 87 """ 88 return not _is_firmware_repair_supported(host) 89 90 91def _get_firmware_version(output): 92 """Parse the output and get the firmware version. 93 94 @param output The standard output of chromeos-firmwareupdate script. 95 @return Firmware version if found, else, None. 96 """ 97 # At one point, the chromeos-firmwareupdate script was updated to 98 # add "RW" version fields. The old string, "BIOS version:" still 99 # appears in the new output, however it now refers to the RO 100 # firmware version. Therefore, we try searching for the new string 101 # first, "BIOS (RW) version". If that string isn't found, we then 102 # fallback to searching for old string. 103 version = re.search(r'BIOS \(RW\) version:\s*(?P<version>.*)', output) 104 105 if not version: 106 version = re.search(r'BIOS version:\s*(?P<version>.*)', output) 107 108 if version is not None: 109 return version.group('version') 110 111 return None 112 113 114def _get_available_firmware(host, model): 115 """Get the available firmware version given the model. 116 117 @param host The host to get available firmware for. 118 @param model The model name to get corresponding firmware version. 119 @return The available firmware version if found, else, None. 120 """ 121 result = host.run('chromeos-firmwareupdate -V', ignore_status=True) 122 123 if result.exit_status == 0: 124 unibuild = False 125 paragraphs = result.stdout.split('\n\n') 126 for p in paragraphs: 127 match = re.search(r'Model:\s*(?P<model>.*)', p) 128 if match: 129 unibuild = True 130 if model == match.group('model'): 131 return _get_firmware_version(p) 132 133 if not unibuild: 134 return _get_firmware_version(result.stdout) 135 136 return None 137 138 139class FirmwareStatusVerifier(hosts.Verifier): 140 """ 141 Verify that a host's firmware is in a good state. 142 143 For DUTs that run firmware tests, it's possible that the firmware 144 on the DUT can get corrupted. This verifier checks whether it 145 appears that firmware should be re-flashed using servo. 146 """ 147 148 def verify(self, host): 149 if not _is_firmware_repair_supported(host): 150 return 151 try: 152 # Read the AP firmware and dump the sections that we're 153 # interested in. 154 cmd = ('mkdir /tmp/verify_firmware; ' 155 'cd /tmp/verify_firmware; ' 156 'for section in VBLOCK_A VBLOCK_B FW_MAIN_A FW_MAIN_B; ' 157 'do flashrom -p host -r -i $section:$section; ' 158 'done') 159 host.run(cmd) 160 161 # Verify the firmware blocks A and B. 162 cmd = ('vbutil_firmware --verify /tmp/verify_firmware/VBLOCK_%c' 163 ' --signpubkey /usr/share/vboot/devkeys/root_key.vbpubk' 164 ' --fv /tmp/verify_firmware/FW_MAIN_%c') 165 for c in ('A', 'B'): 166 rv = host.run(cmd % (c, c), ignore_status=True) 167 if rv.exit_status: 168 raise hosts.AutoservVerifyError( 169 'Firmware %c is in a bad state.' % c) 170 finally: 171 # Remove the temporary files. 172 host.run('rm -rf /tmp/verify_firmware') 173 174 @property 175 def description(self): 176 return 'Firmware on this DUT is clean' 177 178 179class FirmwareRepair(hosts.RepairAction): 180 """ 181 Reinstall the firmware image using servo. 182 183 This repair function attempts to use servo to install the DUT's 184 designated "stable firmware version". 185 186 This repair method only applies to DUTs used for FAFT. 187 """ 188 189 def repair(self, host): 190 if not _is_firmware_repair_supported(host): 191 raise hosts.AutoservRepairError( 192 'Firmware repair is not applicable to host %s.' % 193 host.hostname, 'not_applicable') 194 repair_utils.require_servo(host) 195 host.firmware_install() 196 197 @property 198 def description(self): 199 return 'Re-install the stable firmware via servo' 200 201 202class FirmwareVersionVerifier(hosts.Verifier): 203 """ 204 Check for a firmware update, and apply it if appropriate. 205 206 This verifier checks to ensure that either the firmware on the DUT 207 is up-to-date, or that the target firmware can be installed from the 208 currently running build. 209 210 Failure occurs when all of the following apply: 211 1. The DUT is not excluded from updates. For example, DUTs used 212 for FAFT testing use `FirmwareRepair` instead. 213 2. The DUT's board has an assigned stable firmware version. 214 3. The DUT is not running the assigned stable firmware. 215 4. The firmware supplied in the running OS build is not the 216 assigned stable firmware. 217 218 If the DUT needs an upgrade and the currently running OS build 219 supplies the necessary firmware, the verifier installs the new 220 firmware using `chromeos-firmwareupdate`. Failure to install will 221 cause the verifier to fail. 222 223 This verifier nominally breaks the rule that "verifiers must succeed 224 quickly", since it can invoke `reboot()` during the success code 225 path. We're doing it anyway for two reasons: 226 * The time between updates will typically be measured in months, 227 so the amortized cost is low. 228 * The reason we distinguish repair from verify is to allow 229 rescheduling work immediately while the expensive repair happens 230 out-of-band. But a firmware update will likely hit all DUTs at 231 once, so it's pointless to pass the buck to repair. 232 233 N.B. This verifier is a trigger for all repair actions that install 234 the stable repair image. If the firmware is out-of-date, but the 235 stable repair image does *not* contain the proper firmware version, 236 _the target DUT will fail repair, and will be unable to fix itself_. 237 """ 238 239 @staticmethod 240 def _get_rw_firmware(host): 241 result = host.run('crossystem fwid', ignore_status=True) 242 if result.exit_status == 0: 243 return result.stdout 244 else: 245 return None 246 247 @staticmethod 248 def _check_hardware_match(version_a, version_b): 249 """ 250 Check that two firmware versions identify the same hardware. 251 252 Firmware version strings look like this: 253 Google_Gnawty.5216.239.34 254 The part before the numbers identifies the hardware for which 255 the firmware was built. This function checks that the hardware 256 identified by `version_a` and `version_b` is the same. 257 258 This is a sanity check to protect us from installing the wrong 259 firmware on a DUT when a board label has somehow gone astray. 260 261 @param version_a First firmware version for the comparison. 262 @param version_b Second firmware version for the comparison. 263 """ 264 hardware_a = version_a.split('.')[0] 265 hardware_b = version_b.split('.')[0] 266 if hardware_a != hardware_b: 267 message = 'Hardware/Firmware mismatch updating %s to %s' 268 raise hosts.AutoservVerifyError( 269 message % (version_a, version_b)) 270 271 def verify(self, host): 272 # Test 1 - The DUT is not excluded from updates. 273 if not _is_firmware_update_supported(host): 274 return 275 # Test 2 - The DUT has an assigned stable firmware version. 276 info = host.host_info_store.get() 277 if info.model is None: 278 raise hosts.AutoservVerifyError( 279 'Can not verify firmware version. ' 280 'No model label value found') 281 282 stable_firmware = afe_utils.get_stable_firmware_version(info.model) 283 if stable_firmware is None: 284 # This DUT doesn't have a firmware update target 285 return 286 287 # For tests 3 and 4: If the output from `crossystem` or 288 # `chromeos-firmwareupdate` isn't what we expect, we log an 289 # error, but don't fail: We don't want DUTs unable to test a 290 # build merely because of a bug or change in either of those 291 # commands. 292 293 # Test 3 - The DUT is not running the target stable firmware. 294 current_firmware = self._get_rw_firmware(host) 295 if current_firmware is None: 296 logging.error('DUT firmware version can\'t be determined.') 297 return 298 if current_firmware == stable_firmware: 299 return 300 # Test 4 - The firmware supplied in the running OS build is not 301 # the assigned stable firmware. 302 available_firmware = _get_available_firmware(host, info.model) 303 if available_firmware is None: 304 logging.error('Supplied firmware version in OS can\'t be ' 305 'determined.') 306 return 307 if available_firmware != stable_firmware: 308 raise hosts.AutoservVerifyError( 309 'DUT firmware requires update from %s to %s' % 310 (current_firmware, stable_firmware)) 311 # Time to update the firmware. 312 logging.info('Updating firmware from %s to %s', 313 current_firmware, stable_firmware) 314 self._check_hardware_match(current_firmware, stable_firmware) 315 try: 316 host.run('chromeos-firmwareupdate --mode=autoupdate') 317 host.reboot() 318 except Exception as e: 319 message = ('chromeos-firmwareupdate failed: from ' 320 '%s to %s') 321 logging.exception(message, current_firmware, stable_firmware) 322 raise hosts.AutoservVerifyError( 323 message % (current_firmware, stable_firmware)) 324 final_firmware = self._get_rw_firmware(host) 325 if final_firmware != stable_firmware: 326 message = ('chromeos-firmwareupdate failed: tried upgrade ' 327 'to %s, now running %s instead') 328 raise hosts.AutoservVerifyError( 329 message % (stable_firmware, final_firmware)) 330 331 @property 332 def description(self): 333 return 'The firmware on this DUT is up-to-date' 334