Mirror of https://github.com/ARM-software/workload-automation.git
Adding classifiers to metrics and updating csv and telemetry to take advantage of them
- Adding "classifiers" field to Metric objects. This is a dict mapping classifier names (arbitrary strings) to corresponding values for that specific metrics. This is to allow extensions to add extension-specific annotations to metric that could be handled in a generic way (e.g. by result processors). - Updating telemetry workload to add classifiers for the url and internal iteration (or "time") for a particular result. - Updating csv result processor with the option to use classifiers to add columns to results.csv (either using all classifiers found, or only for the specific ones listed).
This commit is contained in:
parent 782d4501cd
commit 512bacc1be
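In effect, a classifier is just extra metadata attached to a metric that result processors can handle generically, for example by turning it into extra columns. A minimal sketch of the intended flow (the metric name, job id, and classifier values below are invented for illustration; only the classifiers field and the csv column behaviour come from this commit):

    # A metric annotated with classifiers...
    metric = {
        'name': 'frame_time', 'value': 16.7, 'units': 'ms',
        'classifiers': {'url': 'http://www.example.com', 'time': 3},
    }
    # ...and the results.csv row the csv result processor could emit for it
    # when the classifier names are used as extra columns.
    header = ['id', 'workload', 'iteration', 'metric', 'url', 'time', 'value', 'units']
    row = ['1_telemetry_1', 'telemetry', 1, metric['name'],
           metric['classifiers']['url'], metric['classifiers']['time'],
           str(metric['value']), metric['units']]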
@@ -192,6 +192,9 @@ class ExecutionContext(object):
         self.current_job = None
         self.output_directory = self.run_output_directory
 
+    def add_metric(self, *args, **kwargs):
+        self.result.add_metric(*args, **kwargs)
+
     def add_artifact(self, name, path, kind, *args, **kwargs):
         if self.current_job is None:
             self.add_run_artifact(name, path, kind, *args, **kwargs)
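The new ExecutionContext.add_metric above is a thin passthrough to the current iteration's result, so a workload can attach classifiers in one call. A hypothetical workload fragment (the workload, metric name, and urls are made up; only the add_metric call itself comes from the diffs in this commit):

    from wlauto import Workload

    class PageTimesWorkload(Workload):  # hypothetical example workload

        name = 'page_times_example'

        def update_result(self, context):
            # context.add_metric(...) forwards to context.result.add_metric(...)
            for url, seconds in [('http://a.example', 1.2), ('http://b.example', 0.9)]:
                context.add_metric('page_load_time', seconds, units='seconds',
                                   lower_is_better=True,
                                   classifiers={'url': url})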
@@ -261,8 +261,8 @@ class IterationResult(object):
         self.metrics = []
         self.artifacts = []
 
-    def add_metric(self, name, value, units=None, lower_is_better=False):
-        self.metrics.append(Metric(name, value, units, lower_is_better))
+    def add_metric(self, name, value, units=None, lower_is_better=False, classifiers=None):
+        self.metrics.append(Metric(name, value, units, lower_is_better, classifiers))
 
     def has_metric(self, name):
         for metric in self.metrics:
@@ -300,14 +300,18 @@ class Metric(object):
                   has no units (e.g. it's a count or a standardised score).
    :param lower_is_better: Boolean flag indicating where lower values are
                            better than higher ones. Defaults to False.
+   :param classifiers: A set of key-value pairs to further classify this metric
+                       beyond current iteration (e.g. this can be used to identify
+                       sub-tests).
 
     """
 
-    def __init__(self, name, value, units=None, lower_is_better=False):
+    def __init__(self, name, value, units=None, lower_is_better=False, classifiers=None):
         self.name = name
         self.value = numeric(value)
         self.units = units
         self.lower_is_better = lower_is_better
+        self.classifiers = classifiers or {}
 
     def to_dict(self):
         return self.__dict__
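For reference, the extended Metric stays a plain value object, and classifiers default to an empty dict when not given. A small sketch (the import path is assumed from where this class appears to live, and the classifier keys are invented):

    from wlauto.core.result import Metric  # assumed module path for the class above

    m = Metric('score', '42.0', units=None, lower_is_better=False,
               classifiers={'sub_test': 'page_cycler', 'time': 1})
    # value is coerced by numeric(); to_dict() now carries the classifiers too,
    # roughly: {'name': 'score', 'value': 42.0, 'units': None,
    #           'lower_is_better': False,
    #           'classifiers': {'sub_test': 'page_cycler', 'time': 1}}
    print(m.to_dict())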
@@ -24,7 +24,9 @@ import os
 import csv
 import json
 
-from wlauto import ResultProcessor, settings
+from wlauto import ResultProcessor, Parameter
+from wlauto.exceptions import ConfigError
+from wlauto.utils.types import list_of_strings
 
 
 class StandardProcessor(ResultProcessor):
@@ -63,15 +65,50 @@ class CsvReportProcessor(ResultProcessor):
 
     name = 'csv'
 
+    parameters = [
+        Parameter('use_all_classifiers', kind=bool, default=False,
+                  description="""
+                  If set to ``True``, this will add a column for every classifier
+                  that features in at least one collected metric.
+
+                  .. note:: This cannot be ``True`` if ``extra_columns`` is set.
+
+                  """),
+        Parameter('extra_columns', kind=list_of_strings,
+                  description="""
+                  List of classifiers to use as columns.
+
+                  .. note:: This cannot be set if ``use_all_classifiers`` is ``True``.
+
+                  """),
+    ]
+
+    def validate(self):
+        if self.use_all_classifiers and self.extra_columns:
+            raise ConfigError('extra_columns cannot be specified when use_all_classifiers is True')
+
     def process_run_result(self, result, context):
-        outfile = os.path.join(settings.output_directory, 'results.csv')
+        if self.use_all_classifiers:
+            classifiers = set([])
+            for ir in result.iteration_results:
+                for metric in ir.metrics:
+                    classifiers.update(metric.classifiers.keys())
+            extra_columns = list(classifiers)
+        elif self.extra_columns:
+            extra_columns = self.extra_columns
+        else:
+            extra_columns = []
+
+        outfile = os.path.join(context.run_output_directory, 'results.csv')
         with open(outfile, 'wb') as wfh:
             writer = csv.writer(wfh)
-            writer.writerow(['id', 'workload', 'iteration', 'metric', 'value', 'units'])
-            for result in result.iteration_results:
-                for metric in result.metrics:
-                    row = [result.id, result.spec.label, result.iteration,
-                           metric.name, str(metric.value), metric.units or '']
+            writer.writerow(['id', 'workload', 'iteration', 'metric', ] +
+                            extra_columns + ['value', 'units'])
+            for ir in result.iteration_results:
+                for metric in ir.metrics:
+                    row = ([ir.id, ir.spec.label, ir.iteration, metric.name] +
+                           [str(metric.classifiers.get(c) or '') for c in extra_columns] +
+                           [str(metric.value), metric.units or ''])
                     writer.writerow(row)
         context.add_artifact('run_result_csv', 'results.csv', 'export')
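The column selection above boils down to: with use_all_classifiers, take the union of classifier keys seen in any metric; with extra_columns, use exactly the listed names; otherwise add nothing. A standalone sketch of that logic with made-up metrics (independent of the WA classes, so it can be run directly):

    # Invented metrics standing in for ir.metrics across all iteration results.
    metrics = [
        {'name': 'page_load', 'classifiers': {'url': 'http://a.example'}},
        {'name': 'fps',       'classifiers': {'url': 'http://a.example', 'time': 2}},
    ]

    use_all_classifiers, extra_columns_param = True, None

    if use_all_classifiers:
        # Union of every classifier key seen in any metric; order is unspecified,
        # just as with the set-based version in the diff.
        extra_columns = list({key for m in metrics for key in m['classifiers']})
    elif extra_columns_param:
        extra_columns = extra_columns_param
    else:
        extra_columns = []

    header = ['id', 'workload', 'iteration', 'metric'] + extra_columns + ['value', 'units']
    # e.g. ['id', 'workload', 'iteration', 'metric', 'url', 'time', 'value', 'units'];
    # a metric missing a classifier simply gets an empty cell in that column.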
@@ -86,7 +123,7 @@ class JsonReportProcessor(ResultProcessor):
     name = 'json'
 
     def process_run_result(self, result, context):
-        outfile = os.path.join(settings.output_directory, 'results.json')
+        outfile = os.path.join(context.run_output_directory, 'results.json')
         with open(outfile, 'wb') as wfh:
             output = []
             for result in result.iteration_results:
@@ -111,7 +148,7 @@ class SummaryCsvProcessor(ResultProcessor):
     name = 'summary_csv'
 
     def process_run_result(self, result, context):
-        outfile = os.path.join(settings.output_directory, 'summary.csv')
+        outfile = os.path.join(context.run_output_directory, 'summary.csv')
         with open(outfile, 'wb') as wfh:
             writer = csv.writer(wfh)
             writer.writerow(['id', 'workload', 'iteration', 'metric', 'value', 'units'])
@@ -125,7 +125,7 @@ class Telemetry(Workload):
             raise WorkloadError('Unexected error from run_benchmark: {}'.format(ret))
         if self.extract_fps and 'trace' not in self.run_benchmark_params:
             raise ConfigError('"trace" profiler must be enabled in order to extract FPS for Telemetry')
-        self._resovlve_run_benchmark_path()
+        self._resolve_run_benchmark_path()
 
     def setup(self, context):
         self.raw_output = None
@@ -133,7 +133,7 @@ class Telemetry(Workload):
 
     def run(self, context):
         self.logger.debug(self.command)
-        self.raw_output, _ = check_output(self.command, shell=True, timeout=self.run_timeout, ignore=1)
+        self.raw_output, _ = check_output(self.command, shell=True, timeout=self.run_timeout, ignore=range(256))
 
     def update_result(self, context):  # pylint: disable=too-many-locals
         if not self.raw_output:
@@ -158,10 +158,12 @@ class Telemetry(Workload):
                 context.result.add_metric(name_template.format('sd'), result.std,
                                           result.units, lower_is_better=True)
                 writer.writerows(result.rows)
-        context.add_artifact('telemetry', csv_outfile, kind='data')
 
-        for kind, values in averages.iteritems():
-            context.result.add_metric(kind, special_average(values), lower_is_better=True)
+                for i, value in enumerate(result.values, 1):
+                    context.add_metric(result.kind, value, units=result.units,
+                                       classifiers={'url': result.url, 'time': i})
+
+        context.add_artifact('telemetry', csv_outfile, kind='data')
 
         for idx, artifact in enumerate(artifacts):
             if is_zipfile(artifact):
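With this hunk, each individual value reported by run_benchmark becomes its own metric, tagged with the page url and its internal iteration ("time"), instead of being folded into a single special_average summary. A rough sketch of what one telemetry result row now yields (the benchmark kind, url, and values are invented):

    kind, url, units = 'warm_times', 'http://www.example.com', 'ms'
    values = [98.2, 95.7, 96.4]

    metrics = []
    for i, value in enumerate(values, 1):
        # Mirrors the loop added above: one metric per value, classified by
        # the page it came from and the in-page iteration.
        metrics.append({'name': kind, 'value': value, 'units': units,
                        'classifiers': {'url': url, 'time': i}})
    # -> three 'warm_times' metrics, distinguishable only by their classifiers.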
@@ -199,10 +201,10 @@ class Telemetry(Workload):
                                           device_opts,
                                           self.run_benchmark_params)
 
-    def _resovlve_run_benchmark_path(self):
+    def _resolve_run_benchmark_path(self):
         # pylint: disable=access-member-before-definition
         if self.run_benchmark_path:
-            if not os.path.exists(self.run_bencmark_path):
+            if not os.path.exists(self.run_benchmark_path):
                 raise ConfigError('run_benchmark path "{}" does not exist'.format(self.run_benchmark_path))
         else:
             self.run_benchmark_path = os.path.join(self.dependencies_directory, 'telemetry', 'run_benchmark')
@@ -291,21 +293,6 @@ def parse_telemetry_results(filepath):
     return results, artifacts
 
 
-def special_average(values):
-    """Overall score calculation. Tries to accound for large differences
-    between different pages."""
-    negs = [v < 0 for v in values]
-    abs_logs = [(av and math.log(av, 10) or av)
-                for av in map(abs, values)]
-    signed_logs = []
-    for lv, n in zip(abs_logs, negs):
-        if n:
-            signed_logs.append(-lv)
-        else:
-            signed_logs.append(lv)
-    return get_meansd(signed_logs)[0]
-
-
 if __name__ == '__main__':
     import sys
     from pprint import pprint