blob: 765d39a92f818064edb2af9d91b6b64231e1c0e1 [file] [log] [blame] [edit]
# Copyright 2020 The Chromium Authors. All rights reserved.
# Use of this source code is governed by a BSD-style license that can be
# found in the LICENSE file.
import os
from contextlib import contextmanager
from recipe_engine import recipe_api
from PB.go.chromium.org.luci.buildbucket.proto import common as common_pb2
TIMEOUT_PROPERTY = 'ios_debug_symbol_doctor_timeout_seconds'
class OsUtilsApi(recipe_api.RecipeApi):
"""Operating system utilities."""
def initialize(self):
self._mock_is_symlink = None
if self._test_data.enabled:
self._mock_is_symlink = self._test_data.get('is_symlink', True)
def _kill_win(self, name, exe_name):
"""Kills all the windows processes with a given name.
Args:
name(str): The name of the step.
exe_name(str): The name of the windows executable.
"""
self.m.step(
name,
['taskkill', '/f', '/im', exe_name, '/t'],
ok_ret='any',
)
def print_pub_certs(self):
"""Prints pub.dev certificates."""
cmd = (
'gci -Recurse cert: |Where-Object {$_.Subject -like "*GTS CA 1D4*"'
' -or $_.FriendlyName -like "GlobalSign Root CA - R1" -or $_.Subject'
' -like "*GTS Root R1*"}'
)
if self.m.platform.is_win:
self.m.step(
'Print pub.dev certs',
['powershell.exe', cmd],
infra_step=True,
)
def is_symlink(self, path):
"""Returns if a path points to a symlink or not."""
is_symlink = os.path.islink(self.m.path.abspath(path))
return is_symlink if self._mock_is_symlink is None else self._mock_is_symlink
def symlink(self, source, dest):
"""Creates a symbolic link.
Creates a symbolic link in mac platforms.
"""
if self.m.platform.is_mac:
self.m.step(
'Link %s to %s' % (dest, source),
['ln', '-s', source, dest],
infra_step=True,
)
def clean_derived_data(self):
"""Cleans the derived data folder in mac builders.
Derived data caches fail very frequently when different version of mac/ios
sdks are used in the same bot. To prevent those failures we will start
deleting the folder before every task.
"""
derived_data_path = self.m.path['home'].join(
'Library', 'Developer', 'Xcode', 'DerivedData'
)
if self.m.platform.is_mac:
self.m.step(
'Delete mac deriveddata',
['rm', '-rf', derived_data_path],
infra_step=True,
)
def collect_os_info(self):
"""Collects meminfo, cpu, processes for mac"""
if self.m.platform.is_mac:
self.m.step(
'OS info',
cmd=['top', '-l', '3', '-o', 'mem'],
infra_step=True,
)
# These are temporary steps to collect xattr info for triage purpose.
# See issue: https://github.com/flutter/flutter/issues/68322#issuecomment-740264251
self.m.step(
'python xattr info',
cmd=['xattr', '/opt/s/w/ir/cipd_bin_packages/python'],
ok_ret='any',
infra_step=True,
)
self.m.step(
'git xattr info',
cmd=['xattr', '/opt/s/w/ir/cipd_bin_packages/git'],
ok_ret='any',
infra_step=True,
)
elif self.m.platform.is_linux:
self.m.step(
'OS info',
cmd=['top', '-b', '-n', '3', '-o', '%MEM'],
infra_step=True,
)
def kill_simulators(self):
"""Kills any open simulators.
This is to ensure builds use xcode from a clean state.
"""
if self.m.platform.is_mac:
self.m.step(
'kill dart', ['killall', '-9', 'com.apple.CoreSimulator.CoreSimulatorDevice'],
ok_ret='any',
infra_step=True
)
def kill_processes(self):
"""Kills processes.
Windows uses exclusive file locking. On LUCI, if these processes remain
they will cause the build to fail because the builder won't be able to
clean up.
Linux and Mac have leaking processes after task executions, potentially
causing the build to fail if without clean up.
This might fail if there's not actually a process running, which is
fine.
If it actually fails to kill the task, the job will just fail anyway.
"""
with self.m.step.nest('Killing Processes') as presentation:
if self.m.platform.is_win:
self._kill_win('stop gradle daemon', 'java.exe')
self._kill_win('stop dart', 'dart.exe')
self._kill_win('stop adb', 'adb.exe')
self._kill_win('stop flutter_tester', 'flutter_tester.exe')
elif self.m.platform.is_mac:
self.m.step(
'kill dart', ['killall', '-9', 'dart'],
ok_ret='any',
infra_step=True
)
self.m.step(
'kill flutter', ['killall', '-9', 'flutter'],
ok_ret='any',
infra_step=True
)
self.m.step(
'kill Chrome', ['killall', '-9', 'Chrome'],
ok_ret='any',
infra_step=True
)
self.m.step(
'kill Safari', ['killall', '-9', 'Safari'],
ok_ret='any',
infra_step=True
)
self.m.step(
'kill Safari', ['killall', '-9', 'java'],
ok_ret='any',
infra_step=True
)
self.m.step(
'kill Safari', ['killall', '-9', 'adb'],
ok_ret='any',
infra_step=True
)
else:
self.m.step(
'kill chrome', ['pkill', 'chrome'], ok_ret='any', infra_step=True
)
self.m.step(
'kill dart', ['pkill', 'dart'], ok_ret='any', infra_step=True
)
self.m.step(
'kill flutter', ['pkill', 'flutter'], ok_ret='any', infra_step=True
)
self.m.step(
'kill java', ['pkill', 'java'], ok_ret='any', infra_step=True
)
self.m.step('kill adb', ['pkill', 'adb'], ok_ret='any', infra_step=True)
# Ensure we always pass this step as killing non existing processes
# may create errors.
presentation.status = 'SUCCESS'
@contextmanager
def make_temp_directory(self, label):
"""Makes a temporary directory that is automatically deleted.
Args:
label:
(str) Part of the step name that removes the directory after is used.
"""
temp_dir = self.m.path.mkdtemp('tmp')
try:
yield temp_dir
finally:
self.m.file.rmtree('temp dir for %s' % label, temp_dir)
def shutdown_simulators(self):
"""It stops simulators if task is running on a devicelab bot."""
if (str(self.m.swarming.bot_id).startswith('flutter-devicelab')
and self.m.platform.is_mac):
with self.m.step.nest('Shutdown simulators'):
self.m.step(
'Shutdown simulators',
['sudo', 'xcrun', 'simctl', 'shutdown', 'all']
)
self.m.step(
'Erase simulators', ['sudo', 'xcrun', 'simctl', 'erase', 'all']
)
def enable_long_paths(self):
"""Enables long path support in Windows."""
if not self.m.platform.is_win:
# noop for non windows platforms.
return
with self.m.step.nest('Enable long path support'):
resource_name = self.resource('long_paths.ps1')
self.m.step(
'Run long path support script',
['powershell.exe', resource_name],
)
def ios_debug_symbol_doctor(self):
"""Call the ios_debug_symbol_doctor entrypoint of the Device Doctor."""
if str(self.m.swarming.bot_id
).startswith('flutter-devicelab') and self.m.platform.is_mac:
with self.m.step.nest('ios_debug_symbol_doctor'):
cocoon_path = self._checkout_cocoon()
entrypoint = cocoon_path.join(
'device_doctor',
'bin',
'ios_debug_symbol_doctor.dart',
)
# This is not set by the builder config, but can be provided via LED
timeout = self.m.properties.get(
TIMEOUT_PROPERTY,
120, # 2 minutes
)
# Since we double the timeout on each retry, the last retry will have a
# timeout of 16 minutes
retry_count = 4
with self.m.context(cwd=cocoon_path.join('device_doctor'),
infra_steps=True):
self.m.step(
'pub get device_doctor',
['dart', 'pub', 'get'],
)
for _ in range(retry_count):
result = self._diagnose_and_recover_debug_symbols(entrypoint, timeout, cocoon_path)
# No errors in attached phones
if result:
return
# Try for twice as long next time
timeout *= 2
message = '''
The ios_debug_symbol_doctor is detecting phones attached with errors and failed
to recover this bot with a timeout of %s seconds.
See https://github.com/flutter/flutter/issues/103511 for more context.
''' % timeout
# raise purple
self.m.step.empty(
'Recovery failed after %s attempts' % retry_count,
status=self.m.step.INFRA_FAILURE,
step_text=message,
)
def dismiss_dialogs(self):
"""Dismisses iOS dialogs to avoid problems.
Args:
flutter_path(Path): A path to the checkout of the flutter sdk repository.
"""
if str(self.m.swarming.bot_id
).startswith('flutter-devicelab') and self.m.platform.is_mac:
with self.m.step.nest('Dismiss dialogs'):
cocoon_path = self._checkout_cocoon()
resource_name = self.resource('dismiss_dialogs.sh')
self.m.step(
'Set execute permission',
['chmod', '755', resource_name],
infra_step=True,
)
with self.m.context(
cwd=cocoon_path.join('device_doctor', 'tool', 'infra-dialog'),
infra_steps=True,
):
device_id = self.m.step(
'Find device id', ['idevice_id', '-l'],
stdout=self.m.raw_io.output_text()
).stdout.rstrip()
cmd = [resource_name, device_id]
self.m.step('Run app to dismiss dialogs', cmd)
def _checkout_cocoon(self):
"""Checkout cocoon at HEAD to the cache and return the path."""
cocoon_path = self.m.path['cache'].join('cocoon')
self.m.repo_util.checkout(
'cocoon', cocoon_path, ref='refs/heads/main'
)
return cocoon_path
def _diagnose_and_recover_debug_symbols(self, entrypoint, timeout, cocoon_path):
"""Diagnose if attached phones have errors with debug symbols.
If there are errors, a recovery will be attempted. This function is intended
to be called in a retry loop until it returns True, or until a max retry
count is reached.
Returns a boolean for whether or not the initial diagnose succeeded.
"""
try:
self.m.step(
'diagnose',
['dart', entrypoint, 'diagnose'],
)
return True
except self.m.step.StepFailure as e:
self.m.step(
'recover with %s second timeout' % timeout,
[
'dart',
entrypoint,
'recover',
'--cocoon-root',
cocoon_path,
'--timeout',
timeout,
],
)
return False