blob: 8464ae4341c8b7a3014920f57fe26afe72632502 [file] [log] [blame] [edit]
# Copyright 2024 The Chromium Authors
# Use of this source code is governed by a BSD-style license that can be
# found in the LICENSE file.
"""Adapter for printing legacy recipe output
TODO(https://crbug.com/326904531): This file is intended to be a temporary
workaround and should be replaced once this bug is resolved."""
import json
import logging
import os
import re
import sys
# Recipe output formatting cannot be controlled from here, so it is written
# through a dedicated logger that avoids rich formatting: records go straight
# to stdout and are not propagated to any ancestor logger's handlers.
basic_logger = logging.getLogger('basic_logger')
basic_logger.propagate = False
basic_logger.addHandler(logging.StreamHandler(sys.stdout))
class PassthroughAdapter:
  """Adapter that applies no filtering: every recipe line is logged as-is."""

  def ProcessLine(self, line):
    """Logs `line` unchanged at DEBUG level through the plain logger."""
    basic_logger.debug(line)
class LegacyOutputAdapter:
"""Interprets the legacy recipe run mode output to logging
This will filter, route and in some cases reformat the output to trace levels
of logging. This will cause specific output (e.g. unfiltered step names) to
always print to std out or when -v is passed, the stdout will additionally
be passed to the logging stdout. Note -vv will cause PassthroughAdapter to
interpret results"""
SEED_STEP_TEXT = '@@@SEED_STEP@'
STEP_CLOSED_TEXT = '@@@STEP_CLOSED@@@'
ANNOTATOR_PREFIX_SUFIX = '@@@'
TRIGGER_STEP_PREFIX = 'test_pre_run.[trigger] '
TRIGGER_LINK_TEXT = '@@@STEP_LINK@task UI:'
# Special sub-log names added by the UTR recipe to surface to users.
UTR_LOG_NAME = 'utr_log'
def __init__(self):
self._trigger_link_re = re.compile(r'.+@(https://.+)@@@$')
self._ninja_status_re = re.compile(r'\[(\d+)\/(\d+)\]')
self._collect_wait_re = re.compile(
r'.+prpc call (.+) swarming.v2.Tasks.ListTaskStates, stdin: '
r'(\{"task_id": .+\})$'
)
self._result_links_re = re.compile(
r'@@@STEP_LINK@shard (#\d+) test results@(https://[^@]+)@@@')
self._current_proccess_fn = self._StepNameProcessLine
# The first match is used. This allows us to filter parent steps while still
# printing child steps by adding the child step name first. By default
# _StepNameProcessLine will be used which prints the step name and it's
# stdout
self._step_to_processors = {
'compile': self._ProcessCompileLine,
'reclient compile': self._ProcessCompileLine,
'test_pre_run.[trigger] ': self._ProcessTriggerLine,
'collect tasks.wait for tasks': self._ProcessCollectLine,
'download compilation outputs': self._PrintOnlyStepName,
}
# The first match is used. This allows us to filter parent steps while still
# printing child steps by adding the child step name first. By default INFO
# will be used which prints in non-verbose mode (i.e. no -v flag)
self._step_to_log_level = {
'lookup_builder_gn_args': logging.DEBUG,
'git rev-parse': logging.DEBUG,
'git diff to instrument': logging.DEBUG,
'save paths of affected files': logging.DEBUG,
'preprocess for reclient.start reproxy via bootstrap': logging.INFO,
'preprocess for reclient': logging.DEBUG,
'process clang crashes': logging.DEBUG,
'compile confirm no-op': logging.DEBUG,
'postprocess for reclient': logging.DEBUG,
'setup_build': logging.DEBUG,
'get compile targets for scripts': logging.DEBUG,
'lookup GN args': logging.DEBUG,
'install infra/tools/luci/isolate': logging.DEBUG,
'find command lines': logging.DEBUG,
'test_pre_run.install infra/tools/luci/swarming': logging.DEBUG,
'isolate tests': logging.DEBUG,
'read GN args': logging.DEBUG,
'test_pre_run.[trigger] ': logging.INFO,
'test_pre_run.': logging.DEBUG,
'collect tasks.wait for tasks': logging.INFO,
'collect tasks': logging.DEBUG,
'$debug - all results': logging.DEBUG,
'Test statistics': logging.DEBUG,
'read gclient': logging.DEBUG,
'write output_properties_file': logging.DEBUG,
'prepare skylab tests.': logging.DEBUG,
'update invocation instructions': logging.DEBUG,
}
# Setup logger for printing to the same line
logger = logging.getLogger('single_line_logger')
handler = logging.StreamHandler(sys.stdout)
handler.terminator = ''
logger.addHandler(handler)
logger.propagate = False
self._last_line = ''
self._last_line_teriminal_lines = 0
self._current_log_level = logging.DEBUG
self._single_line_logger = logger
self._terminal_columns, _ = os.get_terminal_size()
self._current_step_name = ''
self._dot_count = 0
def _PrintCurrentStepName(self, log_level):
logging.log(log_level, '\n[cyan]Running: %s[/]', self._current_step_name)
def _StdoutProcessLine(self, line):
# Pass through any non-engine or utr-log text.
if line.startswith(f'@@@STEP_LOG_LINE@{self.UTR_LOG_NAME}@'):
# '-3' corresponds to the trailing @@@ on every sub-log line.
line = line[len(f'@@@STEP_LOG_LINE@{self.UTR_LOG_NAME}@'):-3]
if line.startswith(self.ANNOTATOR_PREFIX_SUFIX):
return
is_urlish = re.match(r'^http[s]?://\S+$', line)
if is_urlish:
logging.log(self._current_log_level, line)
else:
basic_logger.log(self._current_log_level, line)
def _StepNameProcessLine(self, line):
if line.startswith(self.SEED_STEP_TEXT):
# Always print the step name to info
self._PrintCurrentStepName(self._current_log_level)
return
self._StdoutProcessLine(line)
def _PrintOnlyStepName(self, line):
if line.startswith(self.SEED_STEP_TEXT):
self._PrintCurrentStepName(logging.INFO)
def _ProcessTriggerLine(self, line):
if line.startswith(self.SEED_STEP_TEXT + self.TRIGGER_STEP_PREFIX):
# The step names for tests don't have any identifying keywords so the
# result step parsers need to be installed at trigger time
test_name = line[len(self.SEED_STEP_TEXT +
self.TRIGGER_STEP_PREFIX):line.index(' (') if ' (' in
line else -len(self.ANNOTATOR_PREFIX_SUFIX)]
self._step_to_processors[test_name] = self._ProcessResult
self._step_to_log_level[test_name] = logging.DEBUG
elif line.startswith(self.TRIGGER_LINK_TEXT):
matches = self._trigger_link_re.match(line)
if matches:
task_name = self._current_step_name[len(self.TRIGGER_STEP_PREFIX):]
basic_logger.log(self._current_log_level,
f'Triggered {task_name}: ' + matches[1])
else:
self._StdoutProcessLine(line)
def _ProcessCompileLine(self, line):
if line.startswith(self.SEED_STEP_TEXT):
self._PrintCurrentStepName(logging.INFO)
return
matches = self._ninja_status_re.match(line)
if matches:
# Remove the last line which might be multiple on the terminal
self._single_line_logger.log(self._current_log_level, '\33[2K')
if self._last_line_teriminal_lines > 1:
for _ in range(self._last_line_teriminal_lines - 1):
self._single_line_logger.log(self._current_log_level, '\33[A\33[2K')
self._single_line_logger.log(self._current_log_level, '\r' + line)
self._single_line_logger.handlers[0].flush()
return
if self._last_line.startswith('['):
basic_logger.log(self._current_log_level, '')
self._StdoutProcessLine(line)
def _ProcessCollectLine(self, line):
if line.startswith(self.SEED_STEP_TEXT):
self._PrintCurrentStepName(logging.INFO)
matches = self._collect_wait_re.match(line)
if matches:
task_ids = json.loads(matches[2])['task_id']
self._dot_count = (self._dot_count % 5) + 1
self._single_line_logger.log(
self._current_log_level,
f'\33[2K\rStill waiting on: {len(task_ids)} shard(s)' +
'.' * self._dot_count)
return
if line == self.STEP_CLOSED_TEXT:
self._single_line_logger.log(self._current_log_level,
'\33[2K\rStill waiting on: 0 shard(s)...')
basic_logger.log(self._current_log_level, '')
def _ProcessResult(self, line):
matches = self._result_links_re.match(line)
if matches:
basic_logger.log(self._current_log_level,
'Test results for %s shard %s: %s',
self._current_step_name, matches[1], matches[2])
def ProcessLine(self, line):
# If we're in a new step see if it needs to be parsed differently
if line.startswith(self.SEED_STEP_TEXT):
self._current_step_name = line[len(self.SEED_STEP_TEXT
):-len(self.ANNOTATOR_PREFIX_SUFIX)]
self._current_proccess_fn = self._get_processor(self._current_step_name)
self._current_log_level = self._get_log_level(self._current_step_name)
self._current_proccess_fn(line)
self._last_line = line
self._last_line_teriminal_lines = int(
(len(line) - 1) / self._terminal_columns) + 1
if line.startswith(self.STEP_CLOSED_TEXT):
# Text outside of steps will use the last processor otherwise
self._current_log_level = logging.DEBUG
_current_proccess_fn = self._StepNameProcessLine
def _get_processor(self, step_name):
if step_name in self._step_to_processors:
return self._step_to_processors[step_name]
for match_name in self._step_to_processors:
if step_name.startswith(match_name):
return self._step_to_processors[match_name]
return self._StepNameProcessLine
def _get_log_level(self, step_name):
if step_name in self._step_to_log_level:
return self._step_to_log_level[step_name]
for match_name in self._step_to_log_level:
if step_name.startswith(match_name):
return self._step_to_log_level[match_name]
return logging.INFO