| # -*- coding: utf-8 -*- |
| # |
| # Copyright 2019 The Chromium OS Authors. All rights reserved. |
| # Use of this source code is governed by a BSD-style license that can be |
| # found in the LICENSE file. |
| |
| """Utils for setting devices |
| |
| This script provides utils to set device specs. |
| """ |
| |
| from __future__ import division |
| from __future__ import print_function |
| |
| __author__ = '[email protected] (Zhizhou Yang)' |
| |
| import re |
| import time |
| |
| from contextlib import contextmanager |
| |
| from cros_utils import command_executer |
| |
| |
class DutWrapper(object):
  """Configure a device under test (DUT) by running shell commands on it.

  All operations go through `ce.CrosRunCommandWOutput()` and report to
  `logger`.

  Attributes:
    chromeos_root: Value passed as `chromeos_root=` to the command executer.
    remote: DUT the commands run on (passed as `machine=`).
    log_level: Logging verbosity. Several setup helpers print a progress
      message only when it equals 'average'.
    logger: Object providing LogOutput(), LogError() and LogFatal().
      NOTE(review): defaults to None, but most methods call it
      unconditionally - callers are expected to supply one.
    ce: Command executer providing CrosRunCommandWOutput().
    dut_config: Dict of device settings. Keys read by this class:
      'cpu_usage', 'cpu_freq_pct', 'cooldown_time', 'cooldown_temp',
      'intel_pstate', 'enable_aslr' and 'governor'.
  """

  def __init__(self,
               chromeos_root,
               remote,
               log_level='verbose',
               logger=None,
               ce=None,
               dut_config=None):
    """Store the DUT parameters; create a command executer if none given."""
    self.chromeos_root = chromeos_root
    self.remote = remote
    self.log_level = log_level
    self.logger = logger
    self.ce = ce or command_executer.GetCommandExecuter(log_level=log_level)
    self.dut_config = dut_config

  @staticmethod
  def _CpuSysfsPaths(cores, leaf):
    """Return a list of /sys/devices/system/cpu/cpu<core>/<leaf> paths.

    Paths are spelled out one by one instead of relying on shell brace
    expansion: Bash leaves a single-element brace such as `cpu{3}` untouched,
    which produces a non-existing path when only one core is involved.
    """
    return ['/sys/devices/system/cpu/cpu%s/%s' % (core, leaf) for core in cores]

  def RunCommandOnDut(self, command, ignore_status=False):
    """Run a shell command on the DUT and report a failure to the logger.

    Args:
      command: Shell command line executed on self.remote.
      ignore_status: If True a non-zero status is reported via LogError()
        (non-fatal); otherwise it is reported via LogFatal().

    Returns:
      Tuple (ret, msg, err_msg) from ce.CrosRunCommandWOutput() - presumably
      exit status, stdout and stderr. When ret is non-zero, err_msg is
      replaced by a formatted failure description embedding the original
      error text.
    """
    ret, msg, err_msg = self.ce.CrosRunCommandWOutput(
        command, machine=self.remote, chromeos_root=self.chromeos_root)

    if ret:
      err_msg = ('Command execution on DUT %s failed.\n'
                 'Failing command: %s\n'
                 'returned %d\n'
                 'Error message: %s' % (self.remote, command, ret, err_msg))
      if ignore_status:
        self.logger.LogError(err_msg +
                             '\n(Failure is considered non-fatal. Continue.)')
      else:
        self.logger.LogFatal(err_msg)

    return ret, msg, err_msg

  def DisableASLR(self):
    """Disable ASLR on DUT by writing 0 to randomize_va_space if it exists."""
    disable_aslr = ('set -e; '
                    'if [[ -e /proc/sys/kernel/randomize_va_space ]]; then '
                    ' echo 0 > /proc/sys/kernel/randomize_va_space; '
                    'fi')
    if self.log_level == 'average':
      self.logger.LogOutput('Disable ASLR.')
    self.RunCommandOnDut(disable_aslr)

  def SetCpuGovernor(self, governor, ignore_status=False):
    """Write `governor` to scaling_governor of every online CPU on DUT.

    Args:
      governor: Name of the cpufreq governor to write.
      ignore_status: Passed to RunCommandOnDut(); True makes a failure
        non-fatal.

    Returns:
      Status of the command run on the DUT (0 on success).
    """
    set_gov_cmd = (
        'for f in `ls -d /sys/devices/system/cpu/cpu*/cpufreq 2>/dev/null`; do '
        # Skip writing scaling_governor if cpu is offline.
        ' [[ -e ${f/cpufreq/online} ]] && grep -q 0 ${f/cpufreq/online} '
        ' && continue; '
        ' cd $f; '
        ' if [[ -e scaling_governor ]]; then '
        ' echo %s > scaling_governor; fi; '
        'done; ')
    if self.log_level == 'average':
      self.logger.LogOutput('Setup CPU Governor: %s.' % governor)
    ret, _, _ = self.RunCommandOnDut(
        set_gov_cmd % governor, ignore_status=ignore_status)
    return ret

  def DisableTurbo(self):
    """Disable Turbo on DUT via intel_pstate/no_turbo when it is present."""
    dis_turbo_cmd = (
        'if [[ -e /sys/devices/system/cpu/intel_pstate/no_turbo ]]; then '
        ' if grep -q 0 /sys/devices/system/cpu/intel_pstate/no_turbo; then '
        ' echo -n 1 > /sys/devices/system/cpu/intel_pstate/no_turbo; '
        ' fi; '
        'fi; ')
    if self.log_level == 'average':
      self.logger.LogOutput('Disable Turbo.')
    self.RunCommandOnDut(dis_turbo_cmd)

  def SetupCpuUsage(self):
    """Setup CPU usage.

    Based on self.dut_config['cpu_usage'] configure CPU cores utilization.
    Only 'big_only' and 'little_only' have an effect, and only when
    `uname -m` on the DUT reports an arm/aarch64 architecture.
    """
    if self.dut_config['cpu_usage'] in ('big_only', 'little_only'):
      _, arch, _ = self.RunCommandOnDut('uname -m')

      if arch.lower().startswith(('arm', 'aarch64')):
        self.SetupArmCores()

  def SetupArmCores(self):
    """Setup ARM big/little cores.

    Reads /proc/cpuinfo on the DUT, classifies every core as big or LITTLE
    by its CPU implementer/part number and, depending on
    self.dut_config['cpu_usage'], brings the selected cluster online and all
    remaining cores offline. If no core of the requested kind exists, or
    cpu_usage is neither 'big_only' nor 'little_only', an error is logged
    and nothing is changed.

    Raises:
      AssertionError: if the number of processor, implementer and part
        entries in cpuinfo differ.
    """

    # CPU implementers/part numbers of big/LITTLE CPU.
    # Format: dict(CPU implementer: set(CPU part numbers))
    LITTLE_CORES = {
        '0x41': {
            '0xd01',  # Cortex A32
            '0xd03',  # Cortex A53
            '0xd04',  # Cortex A35
            '0xd05',  # Cortex A55
        },
    }
    BIG_CORES = {
        '0x41': {
            '0xd07',  # Cortex A57
            '0xd08',  # Cortex A72
            '0xd09',  # Cortex A73
            '0xd0a',  # Cortex A75
            '0xd0b',  # Cortex A76
        },
    }

    # Values of CPU Implementer and CPU part number are exposed by cpuinfo.
    # Format:
    # =================
    # processor : 0
    # model name : ARMv8 Processor rev 4 (v8l)
    # BogoMIPS : 48.00
    # Features : half thumb fastmult vfp edsp neon vfpv3 tls vfpv4
    # CPU implementer : 0x41
    # CPU architecture: 8
    # CPU variant : 0x0
    # CPU part : 0xd03
    # CPU revision : 4

    _, cpuinfo, _ = self.RunCommandOnDut('cat /proc/cpuinfo')

    # List of all CPU cores: 0, 1, ..
    proc_matches = re.findall(r'^processor\s*: (\d+)$', cpuinfo, re.MULTILINE)
    # List of all corresponding CPU implementers
    impl_matches = re.findall(r'^CPU implementer\s*: (0x[\da-f]+)$', cpuinfo,
                              re.MULTILINE)
    # List of all corresponding CPU part numbers
    part_matches = re.findall(r'^CPU part\s*: (0x[\da-f]+)$', cpuinfo,
                              re.MULTILINE)
    assert len(proc_matches) == len(impl_matches)
    assert len(part_matches) == len(impl_matches)

    core_ids = list(zip(proc_matches, impl_matches, part_matches))

    def cores_listed_in(table):
      """Return the set of core numbers whose (impl, part) is in `table`."""
      return {
          core for core, impl, part in core_ids
          if impl in table and part in table[impl]
      }

    all_cores = set(proc_matches)
    dut_big_cores = cores_listed_in(BIG_CORES)
    dut_lit_cores = cores_listed_in(LITTLE_CORES)

    cpu_usage = self.dut_config['cpu_usage']
    if cpu_usage == 'big_only':
      cores_to_enable = dut_big_cores
    elif cpu_usage == 'little_only':
      cores_to_enable = dut_lit_cores
    else:
      self.logger.LogError(
          'cpu_usage=%s is not supported on ARM.\n'
          'Ignore ARM CPU setup and continue.' % cpu_usage)
      return

    if not cores_to_enable:
      # If there are no cores enabled by dut_config then configuration
      # is invalid for current platform and should be ignored.
      self.logger.LogError(
          '"cpu_usage" is invalid for targeted platform.\n'
          'dut_config[cpu_usage]=%s\n'
          'dut big cores: %s\n'
          'dut little cores: %s\n'
          'Ignore ARM CPU setup and continue.' % (cpu_usage, dut_big_cores,
                                                  dut_lit_cores))
      return

    cores_to_disable = all_cores - cores_to_enable

    # Core numbers are digit strings; sort them numerically so that the
    # generated command is deterministic and human readable.
    commands = [
        'echo 1 | tee ' + ' '.join(
            self._CpuSysfsPaths(sorted(cores_to_enable, key=int), 'online'))
    ]
    if cores_to_disable:
      commands.append('echo 0 | tee ' + ' '.join(
          self._CpuSysfsPaths(sorted(cores_to_disable, key=int), 'online')))

    self.RunCommandOnDut('; '.join(commands))

  def GetCpuOnline(self):
    """Get online status of CPU cores.

    Only cores which expose /sys/devices/system/cpu/cpu<N>/online are
    reported.

    Returns:
      Dict of {int(cpu_num): <0|1>}.

    Raises:
      AssertionError: if no core status could be parsed from the output.
    """
    get_cpu_online_cmd = ('paste -d" "'
                          ' <(ls /sys/devices/system/cpu/cpu*/online)'
                          ' <(cat /sys/devices/system/cpu/cpu*/online)')
    _, online_output_str, _ = self.RunCommandOnDut(get_cpu_online_cmd)

    # Here is the output we expect to see:
    # -----------------
    # /sys/devices/system/cpu/cpu0/online 0
    # /sys/devices/system/cpu/cpu1/online 1

    cpu_online = {}
    cpu_online_match = re.compile(r'^[/\S]+/cpu(\d+)/[/\S]+\s+(\d+)$')
    for line in online_output_str.splitlines():
      match = cpu_online_match.match(line)
      if match:
        cpu_online[int(match.group(1))] = int(match.group(2))
    # At least one CPU has to be online.
    assert cpu_online

    return cpu_online

  def SetupCpuFreq(self, online_cores):
    """Setup CPU frequency.

    Based on self.dut_config['cpu_freq_pct'] setup frequency of online CPU cores
    to a supported value which is less or equal to (freq_pct * max_freq / 100)
    limited by min_freq. The chosen value is written to both scaling_max_freq
    and scaling_min_freq of every core.

    NOTE: scaling_available_frequencies support is required.
    Otherwise the function has no effect.

    Args:
      online_cores: Iterable of core numbers to configure.

    Returns:
      A status value when the setup is skipped (non-zero if listing the
      frequency files failed or no cores were given); None after the
      frequencies have been written.
    """
    freq_percent = self.dut_config['cpu_freq_pct']
    avail_freq_paths = self._CpuSysfsPaths(
        online_cores, 'cpufreq/scaling_available_frequencies')
    if not avail_freq_paths:
      # A bare `ls` would list the working directory instead of failing.
      self.logger.LogError('No online CPU cores to setup frequency for.\n'
                           '(Failure is considered non-fatal. Continue.)')
      return 1

    # Ignore error to support general usage of frequency setup.
    # Not all platforms support scaling_available_frequencies.
    ret, all_avail_freq_str, _ = self.RunCommandOnDut(
        'ls ' + ' '.join(avail_freq_paths), ignore_status=True)
    if ret or not all_avail_freq_str:
      # No scalable frequencies available for the core.
      return ret

    for avail_freq_path in all_avail_freq_str.split():
      # Get available freq from every scaling_available_frequency path.
      # Error is considered fatal in self.RunCommandOnDut().
      _, avail_freq_str, _ = self.RunCommandOnDut('cat ' + avail_freq_path)
      assert avail_freq_str

      all_avail_freq = sorted(
          int(freq_str) for freq_str in avail_freq_str.split())
      min_freq = all_avail_freq[0]
      max_freq = all_avail_freq[-1]
      # Calculate the frequency we are targeting.
      target_freq = round(max_freq * freq_percent / 100)
      # More likely it's not in the list of supported frequencies
      # and our goal is to find the largest one which is not greater than
      # the target. Fall back to the minimum if there is none.
      not_greater = [freq for freq in all_avail_freq if freq <= target_freq]
      avail_ngt_target = not_greater[-1] if not_greater else min_freq

      max_freq_path = avail_freq_path.replace('scaling_available_frequencies',
                                              'scaling_max_freq')
      min_freq_path = avail_freq_path.replace('scaling_available_frequencies',
                                              'scaling_min_freq')
      # With default ignore_status=False we expect 0 status or Fatal error.
      self.RunCommandOnDut('echo %s | tee %s %s' %
                           (avail_ngt_target, max_freq_path, min_freq_path))

  def WaitCooldown(self):
    """Wait for DUT to cool down to certain temperature.

    Polls the thermal zones every 30 seconds until every reported value is
    not above dut_config['cooldown_temp'] (Celsius), no data is reported, or
    dut_config['cooldown_time'] (minutes) has elapsed.

    Returns:
      Time spent waiting, in seconds.
    """
    waittime = 0
    timeout_in_sec = int(self.dut_config['cooldown_time']) * 60
    # Temperature from sensors come in uCelsius units.
    temp_in_ucels = int(self.dut_config['cooldown_temp']) * 1000
    sleep_interval = 30

    # Wait until any of two events occurs:
    # 1. CPU cools down to a specified temperature.
    # 2. Timeout cooldown_time expires.
    # For the case when targeted temperature is not reached within specified
    # timeout the benchmark is going to start with higher initial CPU temp.
    # In the worst case it may affect test results but at the same time we
    # guarantee the upper bound of waiting time.
    # TODO(denik): Report (or highlight) "high" CPU temperature in test results.
    # "high" should be calculated based on empirical data per platform.
    # Based on such reports we can adjust CPU configuration or
    # cooldown limits accordingly.
    while waittime < timeout_in_sec:
      _, temp_output, _ = self.RunCommandOnDut(
          'cat /sys/class/thermal/thermal_zone*/temp', ignore_status=True)
      if any(int(temp) > temp_in_ucels for temp in temp_output.split()):
        time.sleep(sleep_interval)
        waittime += sleep_interval
      else:
        # Exit the loop when:
        # 1. Reported temp numbers from all thermal sensors do not exceed
        # 'cooldown_temp' or
        # 2. No data from the sensors.
        break

    self.logger.LogOutput('Cooldown wait time: %.1f min' % (waittime / 60))
    return waittime

  def DecreaseWaitTime(self):
    """Change the ten seconds wait time for pagecycler to two seconds."""
    FILE = '/usr/local/telemetry/src/tools/perf/page_sets/page_cycler_story.py'
    # RunCommandOnDut() returns a (ret, msg, err_msg) tuple. Only the status
    # tells whether the file exists; the tuple itself is always truthy.
    ret, _, _ = self.RunCommandOnDut('ls ' + FILE)

    if not ret:
      sed_command = 'sed -i "s/_TTI_WAIT_TIME = 10/_TTI_WAIT_TIME = 2/g" '
      self.RunCommandOnDut(sed_command + FILE)

  def StopUI(self):
    """Stop UI on DUT."""
    # Added "ignore_status" for the case when crosperf stops ui service which
    # was already stopped. Command is going to fail with 1.
    self.RunCommandOnDut('stop ui', ignore_status=True)

  def StartUI(self):
    """Start UI on DUT."""
    # Similar to StopUI, `start ui` fails if the service is already started.
    self.RunCommandOnDut('start ui', ignore_status=True)

  def KerncmdUpdateNeeded(self, intel_pstate):
    """Check whether kernel cmdline update is needed.

    Args:
      intel_pstate: kernel command line argument (active, passive, no_hwp)

    Returns:
      True if update is needed.
    """

    good = 0

    # Check that dut platform supports hwp
    cmd = "grep -q '^flags.*hwp' /proc/cpuinfo"
    ret_code, _, _ = self.RunCommandOnDut(cmd, ignore_status=True)
    if ret_code != good:
      # Intel hwp is not supported, update is not needed.
      return False

    kern_cmdline_cmd = 'grep -q "intel_pstate=%s" /proc/cmdline' % intel_pstate
    ret_code, _, _ = self.RunCommandOnDut(kern_cmdline_cmd, ignore_status=True)
    self.logger.LogOutput('grep /proc/cmdline returned %d' % ret_code)

    # No need to update cmdline if:
    # 1. We are setting intel_pstate and we found it is already set.
    # 2. Not using intel_pstate and it is not in cmdline.
    # In other words an update is needed only when "requested" and "present"
    # disagree.
    found_in_cmdline = ret_code == good
    return bool(intel_pstate) != found_in_cmdline

  def UpdateKerncmdIntelPstate(self, intel_pstate):
    """Update kernel command line.

    Removes rootfs verification on partitions 2 and 4, reboots, rewrites the
    intel_pstate argument in the kernel config of both partitions, reboots
    again and finally checks /proc/cmdline. Every failure is reported with
    logger.LogFatal(). Each reboot is followed by a fixed 30 second sleep.

    Args:
      intel_pstate: kernel command line argument (active, passive, no_hwp)
    """

    good = 0

    # First phase is to remove rootfs verification to allow cmdline change.
    remove_verif_cmd = ' '.join([
        '/usr/share/vboot/bin/make_dev_ssd.sh',
        '--remove_rootfs_verification',
        '--partition %d',
    ])
    # Command for partition 2.
    verif_part2_failed, _, _ = self.RunCommandOnDut(
        remove_verif_cmd % 2, ignore_status=True)
    # Command for partition 4
    # Some machines in the lab use partition 4 to boot from,
    # so cmdline should be updated for both partitions.
    verif_part4_failed, _, _ = self.RunCommandOnDut(
        remove_verif_cmd % 4, ignore_status=True)
    if verif_part2_failed or verif_part4_failed:
      self.logger.LogFatal(
          'ERROR. Failed to update kernel cmdline on partition %d.\n'
          'Remove verification failed with status %d' %
          (2 if verif_part2_failed else 4, verif_part2_failed or
           verif_part4_failed))

    self.RunCommandOnDut('reboot && exit')
    # Give enough time for dut to complete reboot
    # TODO(denik): Replace with the function checking machine availability.
    time.sleep(30)

    # Second phase to update intel_pstate in kernel cmdline.
    kern_cmdline = '\n'.join([
        'tmpfile=$(mktemp)',
        'partnumb=%d',
        'pstate=%s',
        # Store kernel cmdline in a temp file.
        '/usr/share/vboot/bin/make_dev_ssd.sh --partition ${partnumb}'
        ' --save_config ${tmpfile}',
        # Remove intel_pstate argument if present.
        "sed -i -r 's/ intel_pstate=[A-Za-z_]+//g' ${tmpfile}.${partnumb}",
        # Insert intel_pstate with a new value if it is set.
        '[[ -n ${pstate} ]] &&'
        ' sed -i -e "s/ *$/ intel_pstate=${pstate}/" ${tmpfile}.${partnumb}',
        # Save the change in kernel cmdline.
        # After completion we have to reboot.
        '/usr/share/vboot/bin/make_dev_ssd.sh --partition ${partnumb}'
        ' --set_config ${tmpfile}'
    ])
    kern_part2_cmdline_cmd = kern_cmdline % (2, intel_pstate)
    self.logger.LogOutput(
        'Command to change kernel command line: %s' % kern_part2_cmdline_cmd)
    upd_part2_failed, _, _ = self.RunCommandOnDut(
        kern_part2_cmdline_cmd, ignore_status=True)
    # Again here we are updating cmdline for partition 4
    # in addition to partition 2. Without this some machines
    # in the lab might fail.
    kern_part4_cmdline_cmd = kern_cmdline % (4, intel_pstate)
    self.logger.LogOutput(
        'Command to change kernel command line: %s' % kern_part4_cmdline_cmd)
    upd_part4_failed, _, _ = self.RunCommandOnDut(
        kern_part4_cmdline_cmd, ignore_status=True)
    if upd_part2_failed or upd_part4_failed:
      self.logger.LogFatal(
          'ERROR. Failed to update kernel cmdline on partition %d.\n'
          'intel_pstate update failed with status %d' %
          (2 if upd_part2_failed else 4, upd_part2_failed or upd_part4_failed))

    self.RunCommandOnDut('reboot && exit')
    # Wait 30s after reboot.
    time.sleep(30)

    # Verification phase.
    # Check that cmdline was updated and report a fatal error if not.
    kern_cmdline_cmd = 'grep -q "intel_pstate=%s" /proc/cmdline' % intel_pstate
    ret_code, _, _ = self.RunCommandOnDut(kern_cmdline_cmd, ignore_status=True)
    found_in_cmdline = ret_code == good
    if bool(intel_pstate) != found_in_cmdline:
      # Kernel cmdline doesn't match input intel_pstate.
      self.logger.LogFatal(
          'ERROR. Failed to update kernel cmdline. '
          'Final verification failed with status %d' % ret_code)

    self.logger.LogOutput('Kernel cmdline updated successfully.')

  @contextmanager
  def PauseUI(self):
    """Stop UI before and Start UI after the context block.

    Context manager will make sure UI is always resumed at the end.
    """
    self.StopUI()
    try:
      yield

    finally:
      self.StartUI()

  def SetupDevice(self):
    """Setup device to get it ready for testing.

    Updates the kernel cmdline if needed and then, with the UI paused,
    configures ASLR, CPU cores, cooldown, governor, turbo and CPU frequency
    according to self.dut_config.

    Returns:
      Wait time of cool down for this benchmark run.
    """
    self.logger.LogOutput('Update kernel cmdline if necessary and reboot')
    intel_pstate = self.dut_config['intel_pstate']
    if intel_pstate and self.KerncmdUpdateNeeded(intel_pstate):
      self.UpdateKerncmdIntelPstate(intel_pstate)

    wait_time = 0
    # Pause UI while configuring the DUT.
    # This will accelerate setup (waiting for cooldown has x10 drop)
    # and help to reset a Chrome state left after the previous test.
    with self.PauseUI():
      # Unless the user turns on ASLR in the flag, we first disable ASLR
      # before running the benchmarks
      if not self.dut_config['enable_aslr']:
        self.DisableASLR()

      # CPU usage setup comes first where we enable/disable cores.
      self.SetupCpuUsage()
      cpu_online_status = self.GetCpuOnline()
      # List of online cores of type int (core number).
      online_cores = [
          core for core, status in cpu_online_status.items() if status
      ]
      if self.dut_config['cooldown_time']:
        # Setup power conservative mode for effective cool down.
        # Set ignore status since powersave may not be available
        # on all platforms and we are going to handle it.
        ret = self.SetCpuGovernor('powersave', ignore_status=True)
        if ret:
          # "powersave" is not available, use "ondemand".
          # Still not a fatal error if it fails.
          self.SetCpuGovernor('ondemand', ignore_status=True)
        # TODO(denik): Run comparison test for 'powersave' and 'ondemand'
        # on scarlet and kevin64.
        # We might have to consider reducing freq manually to the min
        # if it helps to reduce waiting time.
        wait_time = self.WaitCooldown()

      # Setup CPU governor for the benchmark run.
      # It overwrites the previous governor settings.
      governor = self.dut_config['governor']
      # FIXME(denik): Pass online cores to governor setup.
      self.SetCpuGovernor(governor)

      # Disable Turbo and Setup CPU freq should ALWAYS follow governor setup
      # since governor may change:
      # - frequency;
      # - turbo/boost.
      self.DisableTurbo()
      self.SetupCpuFreq(online_cores)

      self.DecreaseWaitTime()
      # FIXME(denik): Currently we are not recovering the previous cpufreq
      # settings since we do reboot/setup every time anyway.
      # But it may change in the future and then we have to recover the
      # settings.
    return wait_time