perfkitbenchmarker/edw_benchmark_results_aggregator.py (572 lines of code) (raw):

"""Aggregates the performance results from a edw benchmark.

An edw benchmark, runs multiple iterations of a suite of queries. Independent
raw query performance is aggregated during the benchmark, and used for
generating:
a. Raw query performance samples
b. Aggregated query performance samples
c. Raw wall time for each stream in each iteration
d. Raw wall time for each iteration
e. Aggregated (average) iteration wall time
f. Raw geo mean performance for each iteration
g. Aggregated geo mean performance using the aggregated query performances
"""

import abc
import copy
import enum
import functools
import json
import logging
from typing import Any, Iterable

from absl import flags
import numpy as np

from perfkitbenchmarker import sample

flags.DEFINE_bool(
    'edw_generate_aggregated_metrics',
    True,
    'Whether the benchmark generates aggregated_metrics such as '
    'geomean. Query performance metrics are still generated.',
)

FLAGS = flags.FLAGS


class EdwPerformanceAggregationError(Exception):
  """Error encountered during aggregation of performance results."""


def geometric_mean(iterable: list[float]) -> float:
  """Function to compute the geo mean for a list of numeric values.

  Args:
    iterable: A list of Float performance values

  Returns:
    A float value equal to the geometric mean of the input performance values.

  Raises:
    EdwPerformanceAggregationError: If an invalid performance value was included
      for aggregation.
  """
  # Non-positive values (notably the -1.0 "query failed" sentinel used
  # throughout this module) would make a geometric mean meaningless, so they
  # are rejected up front rather than silently skewing the result.
  if not iterable or any(perf <= 0.0 for perf in iterable):
    raise EdwPerformanceAggregationError('Invalid values cannot be aggregated.')
  a = np.array(iterable)
  # Geometric mean: nth root of the product of the n values.
  return a.prod() ** (1.0 / len(a))


class EdwQueryExecutionStatus(enum.Enum):
  """Enum class for potential status of query execution.

  Potential values:
  FAILED: Indicates that the query execution failed.
  SUCCESSFUL: Indicates that the query execution succeeded.
  """

  FAILED = 'query_execution_failed'
  SUCCESSFUL = 'query_execution_successful'


class EdwQueryPerformance:
  """Class that represents the performance of an executed edw query.

  Attributes:
    name: A string name of the query that was executed
    performance: A Float variable set to the query's completion time in secs.
      -1.0 is used as a sentinel value implying the query failed. For a
      successful query the value is expected to be positive.
    execution_status: An EdwQueryExecutionStatus enum indicating success/failure
    metadata: A dictionary of query execution attributes (job_id, etc.)
  """

  def __init__(
      self, query_name: str, performance: float, metadata: dict[str, Any]
  ):
    # TODO(user): add query start and query end as attributes.
    self.name = query_name
    self.performance = performance
    # Status is derived solely from the -1.0 failure sentinel; any other value
    # is treated as a successful run.
    self.execution_status = (
        EdwQueryExecutionStatus.FAILED
        if performance == -1.0
        else EdwQueryExecutionStatus.SUCCESSFUL
    )
    self.metadata = metadata

  @classmethod
  def from_json(cls, serialized_performance: str):
    """Process the serialized query performance from client jar.

    Expected Performance format:
      {"query_wall_time_in_secs":1.998,"query_end":1601695222108,"query":"1",
      "query_start":1601695220110,
      "details":{"job_id":"b66b5a8e-633f-4ee4-8632-4e3d0856172f"}}

    Args:
      serialized_performance: Stringified json performance.

    Returns:
      An instance of EdwQueryPerformance
    """
    results = json.loads(serialized_performance)
    # 'details' is optional and carries driver-specific attributes (job_id,
    # etc.); absence simply yields empty metadata.
    if 'details' in results:
      metadata = results['details']
    else:
      metadata = {}
    if results['query_wall_time_in_secs'] == -1:
      logging.warning('Query %s failed.', results['query'])
    return cls(
        query_name=results['query'],
        performance=results['query_wall_time_in_secs'],
        metadata=metadata,
    )

  def get_performance_sample(self, metadata: dict[str, Any]) -> sample.Sample:
    """Method to generate a sample for the query performance.

    Args:
      metadata: A dictionary of execution attributes to be merged with the query
        execution attributes, for eg. tpc suite, scale of dataset, etc.

    Returns:
      A sample for the edw query performance.
    """
    # Shallow-copy so the caller's metadata dict is not mutated; per-query
    # attributes then overlay the benchmark-level ones.
    query_metadata = copy.copy(metadata)
    query_metadata['query'] = self.name
    query_metadata['execution_status'] = self.execution_status
    query_metadata.update(self.metadata)
    return sample.Sample(
        'edw_raw_query_time', self.performance, 'seconds', query_metadata
    )

  def get_performance_value(self) -> float:
    """Method to get the query's completion time in secs.

    Returns:
      A float value set to the query's completion time in secs.
    """
    return self.performance

  def get_performance_metadata(self) -> dict[str, Any]:
    """Method to get the query's execution attributes (job_id, etc.).

    Returns:
      A dictionary set to query's execution attributes (job_id, etc.)
    """
    return self.metadata

  def is_successful(self) -> bool:
    """Validates if the query was successful."""
    return self.execution_status == EdwQueryExecutionStatus.SUCCESSFUL


class EdwBaseIterationPerformance(abc.ABC):
  """Class that represents the performance of an iteration of edw queries."""

  # Unique identifier for the iteration; concrete subclasses set this in their
  # constructors.
  id: str

  @abc.abstractmethod
  def has_query_performance(self, query_name: str) -> bool:
    """Returns whether the query was run at least once in the iteration."""

  @abc.abstractmethod
  def is_successful(self, expected_queries: list[str]) -> bool:
    """Check if all the expected queries ran and all succeeded."""

  @abc.abstractmethod
  def is_query_successful(self, query_name: str) -> bool:
    """Returns whether the query was successful in the iteration."""

  @abc.abstractmethod
  def get_query_performance(self, query_name: str) -> float:
    """Gets a query's execution performance generated during iteration execution."""

  @abc.abstractmethod
  def get_query_metadata(self, query_name: str) -> dict[str, Any]:
    """Gets the metadata of a query as executed in the current iteration."""

  @abc.abstractmethod
  def get_all_query_performance_samples(
      self, metadata: dict[str, Any]
  ) -> list[sample.Sample]:
    """Gets a list of samples for all queries in the iteration."""

  @abc.abstractmethod
  def get_queries_geomean_performance_sample(
      self,
expected_queries: list[str], metadata: dict[str, Any] ) -> sample.Sample: """Gets a sample for geomean of all queries in the iteration.""" @abc.abstractmethod def get_queries_geomean(self) -> float: """Gets the geometric mean of all queries in the iteration.""" @abc.abstractmethod def get_wall_time(self) -> float: """Gets the total wall time, in seconds, for the iteration.""" @abc.abstractmethod def get_wall_time_performance_sample( self, metadata: dict[str, Any] ) -> sample.Sample: """Gets a sample for wall time performance of the iteration.""" class EdwPowerIterationPerformance(EdwBaseIterationPerformance): """Class that represents the performance of a power iteration of edw queries. Attributes: id: A unique string id for the iteration. start_time: The start time of the iteration in milliseconds since epoch. end_time: The end time of the iteration in milliseconds since epoch. wall_time: The wall time in seconds as a double value. performance: A dictionary of query name to its execution performance which is a EdwQueryPerformance instance. successful_count: An integer count of the successful queries in the iteration. total_count: An integer count of the total number of queries in the iteration. """ def __init__(self, iteration_id: str, total_queries: int): self.id = iteration_id self.performance: dict[str, EdwQueryPerformance] = {} self.total_count = total_queries self.successful_count: int = 0 self.start_time = 0 self.end_time = -1 self.wall_time: float = 0.0 def add_query_performance( self, query_name: str, performance: float, metadata: dict[str, Any] ): """Creates and populates a query performance from the input results. Updates the iteration's performance map with the query performance. The method also increaments the success and failure query counts for the iteration. Also updates the wall time of the iteration based on the query time. 
Args: query_name: A string name of the query that was executed performance: A Float variable set to the query's completion time in secs. -1.0 is used as a sentinel value implying the query failed. For a successful query the value is expected to be positive. metadata: Extra metadata to add to each performance. Raises: EdwPerformanceAggregationError: If the query has already been added. """ query_metadata = copy.copy(metadata) self._log_and_strip_query_results(query_metadata) query_performance = EdwQueryPerformance( query_name=query_name, performance=performance, metadata=query_metadata ) if query_performance.name in self.performance: raise EdwPerformanceAggregationError( 'Attempting to aggregate a duplicate query: %s.' % query_performance.name ) self.performance[query_performance.name] = query_performance if query_performance.is_successful(): self.successful_count += 1 self.wall_time = self.wall_time + performance def _log_and_strip_query_results( self, metadata: dict[str, str | dict[Any, Any]] ) -> None: """Logs first 100 characters of query output, then removes from metadata. Args: metadata: A metadata dict with query detail fields resulting of a query run via an EDW driver. If a key named 'output' exists in the dict, then the first 100 characters of the associated value are printed, and the key is deleted from the dict. """ # Although normally only one of either 'output' or 'query_results' should be # set, we want to err on the safe-side and remove both keys if they ever # existed together and then log whichever. output = metadata.pop('output', None) query_results = metadata.pop('query_results', None) stripped = output or query_results if stripped: logging.info('query results (first 100 chars): %s', str(stripped)[:100]) def has_query_performance(self, query_name: str) -> bool: """Returns whether the query was run at least once in the iteration. Args: query_name: A String name of the query to check. 
Returns: A boolean value indicating if the query was executed in the iteration. """ return query_name in self.performance def is_query_successful(self, query_name: str) -> bool: """Returns whether the query was successful in the iteration. Args: query_name: A String name of the query to check. Returns: A boolean value indicating if the query was successful in the iteration. """ return self.performance[query_name].is_successful() def get_query_performance(self, query_name: str) -> float: """Gets a query's execution performance generated during iteration execution. Args: query_name: A String name of the query to retrieve details for Returns: A float value set to the query's completion time in secs. """ return self.performance[query_name].get_performance_value() def get_query_metadata(self, query_name: str) -> dict[str, Any]: """Gets the metadata of a query as executed in the current iteration. Args: query_name: Name of the query whose performance is requested. Returns: A dictionary set to the query's metadata. Raises: EdwPerformanceAggregationError: If the query failed. """ if not self.is_query_successful(query_name): raise EdwPerformanceAggregationError( 'Cannot aggregate invalid / failed query' + query_name ) return self.performance[query_name].metadata def get_all_queries_in_iteration(self) -> Iterable[str]: """Gets a list of names of all queries in the iteration. Returns: A list of all queries in the iteration. """ return self.performance.keys() def get_all_query_performance_samples( self, metadata: dict[str, Any] ) -> list[sample.Sample]: """Gets a list of samples for all queries in the iteration. Args: metadata: A dictionary of execution attributes to be merged with the query execution attributes, for eg. tpc suite, scale of dataset, etc. 
Returns: A list of samples of each query's performance """ return [ query_performance.get_performance_sample(metadata) for query_performance in self.performance.values() ] def add_start_time(self, start_time: int): """Sets the start time of the iteration. Args: start_time: The UNIX timestamp, in milliseconds, at which the iteration was started """ self.start_time = start_time def add_end_time(self, end_time: int): """Sets the end time of the iteration. Args: end_time: The UNIX timestamp, in milliseconds, at which the iteration completed """ self.end_time = end_time def get_wall_time(self) -> float: """Gets the total wall time, in seconds, for the iteration. The wall time is the sum of the wall time of all individual queries. Returns: The wall time in seconds. """ return self.wall_time def get_wall_time_performance_sample( self, metadata: dict[str, Any] ) -> sample.Sample: """Gets a sample for wall time performance of the iteration. Args: metadata: A dictionary of execution attributes to be merged with the query execution attributes, for eg. tpc suite, scale of dataset, etc. Returns: A sample of iteration wall time performance """ wall_time_metadata = copy.copy(metadata) wall_time_metadata['iteration_start_time'] = self.start_time wall_time_metadata['iteration_end_time'] = self.end_time return sample.Sample( 'edw_iteration_wall_time', self.wall_time, 'seconds', wall_time_metadata ) def is_successful(self, expected_queries: list[str]) -> bool: """Check if all the expected queries ran and all succeeded.""" all_queries_ran = set(self.get_all_queries_in_iteration()) == set( expected_queries ) all_queries_were_successful = self.total_count == self.successful_count return all_queries_ran and all_queries_were_successful def get_queries_geomean(self) -> float: """Gets the geometric mean of all queries in the iteration. Returns: The (float) geometric mean of all the queries ran in the iteration. 
Raises: EdwPerformanceAggregationError: If the iteration contains unsuccessful query executions. """ return geometric_mean([ query_performance.performance for query_performance in self.performance.values() ]) def get_queries_geomean_performance_sample( self, expected_queries: list[str], metadata: dict[str, Any] ) -> sample.Sample: """Gets a sample for geomean of all queries in the iteration. Args: expected_queries: A list of query names expected to have been executed in an iteration. metadata: A dictionary of execution attributes to be merged with the query execution attributes, for eg. tpc suite, scale of dataset, etc. Returns: A sample of iteration geomean performance. Raises: EdwPerformanceAggregationError: If the iteration contains unsuccessful query executions. """ if not self.is_successful(expected_queries): raise EdwPerformanceAggregationError('Failed executions in iteration.') raw_geo_mean = self.get_queries_geomean() geo_mean_metadata = copy.copy(metadata) return sample.Sample( 'edw_iteration_geomean_time', raw_geo_mean, 'seconds', geo_mean_metadata ) class EdwSimultaneousIterationPerformance(EdwBaseIterationPerformance): """Class that represents the performance of a simultaneous iteration. Attributes: id: A unique string id for the iteration. start_time: The start time of the iteration in milliseconds since epoch. end_time: The end time of the iteration in milliseconds since epoch. wall_time: The wall time in seconds as a double value. performance: A dictionary of query name to its execution performance which is an EdwQueryPerformance instance. all_queries_succeeded: Whether all queries in the iteration were successful. 
""" def __init__( self, iteration_id: str, iteration_start_time: int, iteration_end_time: int, iteration_wall_time: float, iteration_performance: dict[str, EdwQueryPerformance], all_queries_succeeded: bool, ): self.id = iteration_id self.start_time = iteration_start_time self.end_time = iteration_end_time self.wall_time = iteration_wall_time self.performance = iteration_performance self.all_queries_succeeded = all_queries_succeeded @classmethod def from_json(cls, iteration_id: str, serialized_performance: str): """Process the serialized simultaneous iteration performance from client jar. Expected Performance format: {"simultaneous_end":1601145943197,"simultaneous_start":1601145940113, "all_queries_performance_array":[{"query_wall_time_in_secs":2.079, "query_end":1601145942208,"job_id":"914682d9-4f64-4323-bad2-554267cbbd8d", "query":"1","query_start":1601145940129},{"query_wall_time_in_secs":2.572, "query_end":1601145943192,"job_id":"efbf93a1-614c-4645-a268-e3801ae994f1", "query":"2","query_start":1601145940620}], "simultaneous_wall_time_in_secs":3.084} Args: iteration_id: String identifier of the simultaneous iteration. serialized_performance: Stringified json performance. Returns: An instance of EdwSimultaneousIterationPerformance """ results = json.loads(serialized_performance) query_performance_map = {} all_queries_succeeded = 'failure_reason' not in results if all_queries_succeeded: for query_perf_json in results['all_queries_performance_array']: query_perf = EdwQueryPerformance.from_json( serialized_performance=(json.dumps(query_perf_json)) ) query_performance_map[query_perf.name] = query_perf else: logging.warning('Failure reported. 
Reason: %s', results['failure_reason']) return cls( iteration_id=iteration_id, iteration_start_time=( results['simultaneous_start'] if all_queries_succeeded else -1 ), iteration_end_time=( results['simultaneous_end'] if all_queries_succeeded else -1 ), iteration_wall_time=results['simultaneous_wall_time_in_secs'], iteration_performance=query_performance_map, all_queries_succeeded=all_queries_succeeded, ) def get_wall_time(self) -> float: """Gets the total wall time, in seconds, for the iteration. The wall time is the time from the start of the first query to the end time of the last query to finish. Returns: The wall time in seconds. """ return self.wall_time def get_wall_time_performance_sample( self, metadata: dict[str, Any] ) -> sample.Sample: """Gets a sample for wall time performance of the iteration. Args: metadata: A dictionary of execution attributes to be merged with the query execution attributes, for eg. tpc suite, scale of dataset, etc. Returns: A sample of iteration wall time performance """ wall_time = self.wall_time wall_time_metadata = copy.copy(metadata) wall_time_metadata['iteration_start_time'] = self.start_time wall_time_metadata['iteration_end_time'] = self.end_time return sample.Sample( 'edw_iteration_wall_time', wall_time, 'seconds', wall_time_metadata ) def get_all_query_performance_samples( self, metadata: dict[str, Any] ) -> list[sample.Sample]: """Gets a list of samples for all queries in the iteration. Args: metadata: A dictionary of execution attributes to be merged with the query execution attributes, for eg. tpc suite, scale of dataset, etc. 
Returns: A list of samples of each query's performance """ return [ query_performance.get_performance_sample(metadata) for query_performance in self.performance.values() ] def is_successful(self, expected_queries: list[str]) -> bool: """Check if all the expected queries ran and all succeeded.""" all_queries_ran = self.performance.keys() == set(expected_queries) return all_queries_ran and self.all_queries_succeeded def has_query_performance(self, query_name: str) -> bool: """Returns whether the query was run at least once in the iteration. Args: query_name: A String name of the query to check. Returns: A boolean value indicating if the query was executed in the iteration. """ return query_name in self.performance def is_query_successful(self, query_name: str) -> bool: """Returns whether the query was successful in the iteration. Args: query_name: A String name of the query to check. Returns: A boolean value indicating if the query was successful in the iteration. """ if self.has_query_performance(query_name): return self.performance[query_name].is_successful() return False def get_query_performance(self, query_name: str) -> float: """Gets a query's execution performance in the current iteration. Args: query_name: A String name of the query to retrieve details for Returns: A float value set to the query's completion time in secs. """ return self.performance[query_name].get_performance_value() def get_query_metadata(self, query_name: str) -> dict[str, Any]: """Gets the metadata of a query in the current iteration. Args: query_name: Name of the query whose aggregated performance is requested Returns: A dictionary set to the query's aggregated metadata, accumulated from the raw query run in the current iteration. Raises: EdwPerformanceAggregationError: If the query failed in the iteration. 
""" if not self.is_query_successful(query_name): raise EdwPerformanceAggregationError( 'Cannot aggregate invalid / failed query' + query_name ) return self.performance[query_name].metadata def get_queries_geomean(self) -> float: """Gets the geometric mean of all queries in the iteration. Returns: The (float) geometric mean of all the queries ran in the iteration. Raises: EdwPerformanceAggregationError: If the iteration contains unsuccessful query executions. """ return geometric_mean([ query_performance.performance for query_performance in self.performance.values() ]) def get_queries_geomean_performance_sample( self, expected_queries: list[str], metadata: dict[str, Any] ) -> sample.Sample: """Gets a sample for geomean of all queries in the iteration. Args: expected_queries: A list of query names expected to have been executed in an iteration. metadata: A dictionary of execution attributes to be merged with the query execution attributes, for eg. tpc suite, scale of dataset, etc. Returns: A sample of iteration geomean performance. Raises: EdwPerformanceAggregationError: If the iteration contains unsuccessful query executions. """ if not self.is_successful(expected_queries): raise EdwPerformanceAggregationError('Failed executions in iteration.') raw_geo_mean = self.get_queries_geomean() geo_mean_metadata = copy.copy(metadata) return sample.Sample( 'edw_iteration_geomean_time', raw_geo_mean, 'seconds', geo_mean_metadata ) class EdwThroughputIterationPerformance(EdwBaseIterationPerformance): """Class that represents the performance of an iteration of edw queries. Attributes: id: A unique string id for the iteration. start_time: The start time of the iteration execution. end_time: The end time of the iteration execution. wall_time: The wall time of the stream execution. performance: A dict of stream_id to stream performances, each of which is a dictionary mapping query names to their execution performances, which are EdwQueryPerformance instances. 
  """

  def __init__(
      self,
      iteration_id: str,
      iteration_start_time: int,
      iteration_end_time: int,
      iteration_wall_time: float,
      iteration_performance: dict[str, dict[str, EdwQueryPerformance]],
  ):
    self.id = iteration_id
    self.start_time = iteration_start_time
    self.end_time = iteration_end_time
    self.wall_time = iteration_wall_time
    self.performance = iteration_performance

  @classmethod
  def from_json(cls, iteration_id: str, serialized_performance: str):
    """Process the serialized throughput iteration performance from client jar.

    Expected Performance format:
      {"throughput_start":1601666911596,"throughput_end":1601666916139,
      "throughput_wall_time_in_secs":4.543,
      "all_streams_performance_array":[
        {"stream_start":1601666911597,"stream_end":1601666916139,
        "stream_wall_time_in_secs":4.542,
        "stream_performance_array":[
          {"query_wall_time_in_secs":2.238,"query_end":1601666913849,
          "query":"1","query_start":1601666911611,
          "details":{"job_id":"438170b0-b0cb-4185-b733-94dd05b46b05"}},
          {"query_wall_time_in_secs":2.285,"query_end":1601666916139,
          "query":"2","query_start":1601666913854,
          "details":{"job_id":"371902c7-5964-46f6-9f90-1dd00137d0c8"}}
        ]},
        {"stream_start":1601666911597,"stream_end":1601666916018,
        "stream_wall_time_in_secs":4.421,
        "stream_performance_array":[
          {"query_wall_time_in_secs":2.552,"query_end":1601666914163,
          "query":"2","query_start":1601666911611,
          "details":{"job_id":"5dcba418-d1a2-4a73-be70-acc20c1f03e6"}},
          {"query_wall_time_in_secs":1.855,"query_end":1601666916018,
          "query":"1","query_start":1601666914163,
          "details":{"job_id":"568c4526-ae26-4e9d-842c-03459c3a216d"}}
        ]}
      ]}

    Args:
      iteration_id: String identifier of the throughput iteration.
      serialized_performance: Stringified json performance.

    Returns:
      An instance of EdwThroughputIterationPerformance
    """
    results = json.loads(serialized_performance)
    stream_performances = {}
    # Overall 'failure_reason' key signals that the iteration failed; per-stream
    # parsing is skipped in that case.
    all_queries_succeeded = 'failure_reason' not in results
    if all_queries_succeeded:
      # Streams have no ids in the payload; their array position (stringified)
      # becomes the stream id.
      for stream_id, stream_perf_json in enumerate(
          results['all_streams_performance_array']
      ):
        stream_id = str(stream_id)
        stream_performance_map = {}
        for query_perf_json in stream_perf_json['stream_performance_array']:
          query_perf = EdwQueryPerformance.from_json(
              serialized_performance=(json.dumps(query_perf_json))
          )
          # NOTE(review): building a dict keyed by query name silently drops
          # duplicate runs of a query within a stream — confirm intended.
          stream_performance_map[query_perf.name] = query_perf
        stream_performances.update({stream_id: stream_performance_map})
    else:
      logging.warning('Failure reported. Reason: %s', results['failure_reason'])
    return cls(
        iteration_id=iteration_id,
        iteration_start_time=(
            results['throughput_start'] if all_queries_succeeded else -1
        ),
        iteration_end_time=(
            results['throughput_end'] if all_queries_succeeded else -1
        ),
        iteration_wall_time=results['throughput_wall_time_in_secs'],
        iteration_performance=stream_performances,
    )

  def has_query_performance(self, query_name: str) -> bool:
    """Returns whether the query was run at least once in the iteration.

    Args:
      query_name: A String name of the query to check.

    Returns:
      A boolean value indicating if the query was executed in the iteration.
    """
    for stream in self.performance.values():
      if query_name in stream:
        return True
    return False

  def is_query_successful(self, query_name: str) -> bool:
    """Returns whether the query was successful in the iteration.

    Args:
      query_name: A String name of the query to check.

    Returns:
      A boolean value indicating if the query was successful in the iteration.
    """
    # NOTE(review): vacuously returns True when the query never ran in any
    # stream (no stream contains it) — callers are expected to pair this with
    # has_query_performance, as EdwBenchmarkPerformance does.
    for stream in self.performance.values():
      if query_name in stream:
        if not stream[query_name].is_successful():
          return False
    return True

  def get_query_performance(self, query_name: str) -> float:
    """Gets a query's execution performance aggregated across all streams in the current iteration.

    Args:
      query_name: A String name of the query to retrieve details for

    Returns:
      A float value set to the query's average completion time in secs.
      -1.0 if the query did not run in any stream.
    """
    all_performances = []
    for stream in self.performance.values():
      if query_name in stream:
        all_performances.append(stream[query_name].get_performance_value())
    if not all_performances:
      return -1.0
    # Arithmetic mean over the streams that ran the query.
    return sum(all_performances) / len(all_performances)

  def get_query_metadata(self, query_name: str) -> dict[str, Any]:
    """Gets the metadata of a query aggregated across all streams in the current iteration.

    Args:
      query_name: Name of the query whose aggregated performance is requested

    Returns:
      A dictionary set to the query's aggregated metadata, accumulated from the
      raw query runs in all streams of the current iteration. Keys are prefixed
      with the stream id so entries from different streams do not collide.
      Streams that did not run the query are skipped; unlike the other
      iteration classes, this method performs no success check and never
      raises.
    """
    result = {}
    for stream_id, stream_performance in self.performance.items():
      if query_name in stream_performance:
        q_performance = stream_performance[query_name]
        result[stream_id + '_runtime'] = q_performance.get_performance_value()
        result.update({
            stream_id + '_' + k: v
            for (k, v) in q_performance.get_performance_metadata().items()
        })
    return result

  def get_all_query_performance_samples(
      self, metadata: dict[str, Any]
  ) -> list[sample.Sample]:
    """Gets a list of samples for all queries in all streams of the iteration.

    Args:
      metadata: A dictionary of execution attributes to be merged with the query
        execution attributes, for eg. tpc suite, scale of dataset, etc.

    Returns:
      A list of samples of each query's performance
    """
    all_query_performances = []
    for stream_id, stream_performance in self.performance.items():
      # Each stream's samples are tagged with their stream id.
      stream_metadata = copy.copy(metadata)
      stream_metadata['stream'] = stream_id
      all_query_performances.extend([
          query_perf.get_performance_sample(stream_metadata)
          for query_perf in stream_performance.values()
      ])
    return all_query_performances

  def all_streams_ran_all_expected_queries(
      self, expected_queries: list[str]
  ) -> bool:
    """Checks that the same set of expected queries ran in all streams."""
    for stream in self.performance.values():
      if set(stream.keys()) != set(expected_queries):
        return False
    return True

  def no_duplicate_queries(self) -> bool:
    """Checks that no streams contain any duplicate queries."""
    # NOTE(review): each stream is a dict, so its keys are unique by
    # construction and this check can never fail here; duplicates are already
    # collapsed in from_json when the map is built — confirm whether the check
    # should instead happen at parse time.
    for stream in self.performance.values():
      if len(stream.keys()) != len(set(stream.keys())):
        return False
    return True

  def all_queries_succeeded(self) -> bool:
    """Checks if every query in every stream was successful."""
    for stream_performance in self.performance.values():
      for query_perf in stream_performance.values():
        # -1 is the failure sentinel recorded by EdwQueryPerformance.
        if query_perf.performance == -1:
          return False
    return True

  def is_successful(self, expected_queries: list[str]) -> bool:
    """Check if the throughput run was successful.

    A successful run meets the following conditions:
      - There were more than 0 streams.
      - Each stream ran the same set of expected queries (regardless of order)
      - Each stream ran each query only once
      - Every query in every stream succeeded

    Args:
      expected_queries: A list of query names expected to have been executed in
        an iteration.

    Returns:
      True if all success conditions were met, false otherwise.
    """
    non_zero_streams = len(self.performance) >= 1
    all_streams_ran_all_queries = self.all_streams_ran_all_expected_queries(
        expected_queries
    )
    no_duplicate_queries = self.no_duplicate_queries()
    all_queries_succeeded = self.all_queries_succeeded()
    return (
        non_zero_streams
        and all_streams_ran_all_queries
        and no_duplicate_queries
        and all_queries_succeeded
    )

  def get_queries_geomean(self) -> float:
    """Gets the geometric mean of all queries in all streams of the iteration.

    Returns:
      The (float) geometric mean of all the individual queries ran in all
      streams of the iteration.

    Raises:
      EdwPerformanceAggregationError: If the suite contains unsuccessful query
        executions.
    """
    query_performances = []
    for stream in self.performance.values():
      for query in stream.values():
        query_performances.append(query.get_performance_value())
    return geometric_mean(query_performances)

  def get_queries_geomean_performance_sample(
      self, expected_queries: list[str], metadata: dict[str, Any]
  ) -> sample.Sample:
    """Gets a sample for geomean of all queries in all streams of the iteration.

    Args:
      expected_queries: A list of query names expected to have been executed in
        an iteration.
      metadata: A dictionary of execution attributes to be merged with the query
        execution attributes, for eg. tpc suite, scale of dataset, etc.

    Returns:
      A sample of iteration geomean performance.

    Raises:
      EdwPerformanceAggregationError: If the iteration contains unsuccessful
        query executions.
    """
    if not self.is_successful(expected_queries):
      raise EdwPerformanceAggregationError('Failed executions in iteration.')
    raw_geo_mean = self.get_queries_geomean()
    geo_mean_metadata = copy.copy(metadata)
    return sample.Sample(
        'edw_iteration_geomean_time', raw_geo_mean, 'seconds', geo_mean_metadata
    )

  def get_wall_time(self) -> float:
    """Gets the total wall time, in seconds, for the iteration.

    The wall time is the time from the start of the first stream to the end
    time of the last stream to finish.

    Returns:
      The wall time in seconds.
""" return self.wall_time def get_wall_time_performance_sample( self, metadata: dict[str, Any] ) -> sample.Sample: """Gets a sample for total wall time performance of the iteration. Args: metadata: A dictionary of execution attributes to be merged with the query execution attributes, for eg. tpc suite, scale of dataset, etc. Returns: A sample of iteration wall time performance """ wall_time_metadata = copy.copy(metadata) wall_time_metadata['iteration_start_time'] = self.start_time wall_time_metadata['iteration_end_time'] = self.end_time return sample.Sample( 'edw_iteration_wall_time', self.wall_time, 'seconds', wall_time_metadata ) class EdwBenchmarkPerformance: """Class that represents the performance of an edw benchmark. Attributes: total_iterations: An integer variable set to total of number of iterations. expected_queries: A list of query names that are executed in an iteration of the benchmark iteration_performances: A dictionary of iteration id (String value) to its execution performance (an instance of EdwBaseIterationPerformance) """ def __init__(self, total_iterations: int, expected_queries: Iterable[str]): self.total_iterations = total_iterations self.expected_queries = list(expected_queries) self.iteration_performances: dict[str, EdwBaseIterationPerformance] = {} def add_iteration_performance(self, performance: EdwBaseIterationPerformance): """Add an iteration's performance to the benchmark results. Args: performance: An instance of EdwBaseIterationPerformance encapsulating the iteration performance details. Raises: EdwPerformanceAggregationError: If the iteration has already been added. """ iteration_id = performance.id if iteration_id in self.iteration_performances: raise EdwPerformanceAggregationError( 'Attempting to aggregate a duplicate iteration: %s.' 
% iteration_id ) self.iteration_performances[iteration_id] = performance def is_successful(self) -> bool: """Check a benchmark's success, only if all the iterations succeed.""" return functools.reduce( (lambda x, y: x and y), [ iteration_performance.is_successful(self.expected_queries) for iteration_performance in self.iteration_performances.values() ], ) def aggregated_query_status(self, query_name: str) -> bool: """Gets the status of query aggregated across all iterations. A query is considered successful only if a. Query was executed in every iteration b. Query was successful in every iteration Args: query_name: Name of the query whose aggregated success is requested Returns: A boolean value indicating if the query was successful in the benchmark. """ for performance in self.iteration_performances.values(): if not performance.has_query_performance(query_name): return False if not performance.is_query_successful(query_name): return False return True def aggregated_query_execution_time(self, query_name: str) -> float: """Gets the execution time of query aggregated across all iterations. Args: query_name: Name of the query whose aggregated performance is requested Returns: A float value set to the query's aggregated execution time Raises: EdwPerformanceAggregationError: If the query failed in one or more iterations """ if not self.aggregated_query_status(query_name): raise EdwPerformanceAggregationError( 'Cannot aggregate invalid / failed query ' + query_name ) query_performances = [ iteration_performance.get_query_performance(query_name) for iteration_performance in self.iteration_performances.values() ] return sum(query_performances) / self.total_iterations def aggregated_query_metadata(self, query_name: str) -> dict[str, Any]: """Gets the metadata of a query aggregated across all iterations. 
Args: query_name: Name of the query whose aggregated performance is requested Returns: A dictionary set to the query's aggregated metadata, accumulated from the raw query runs. Raises: EdwPerformanceAggregationError: If the query failed in one or more iterations """ if not self.aggregated_query_status(query_name): raise EdwPerformanceAggregationError( 'Cannot aggregate invalid / failed query ' + query_name ) result = {} for ( iteration_id, iteration_performance, ) in self.iteration_performances.items(): result.update({ iteration_id + '_' + k: v for (k, v) in iteration_performance.get_query_metadata( query_name ).items() }) return result def get_aggregated_query_performance_sample( self, query_name: str, metadata: dict[str, Any] ) -> sample.Sample: """Gets the performance of query aggregated across all iterations. Args: query_name: Name of the query whose aggregated performance is requested metadata: A dictionary of execution attributes to be merged with the query execution attributes, for eg. tpc suite, scale of dataset, etc. Returns: A sample of the query's aggregated execution time """ query_metadata = copy.copy(metadata) query_metadata['query'] = query_name query_metadata['aggregation_method'] = 'mean' perf, exec_status, agg_md = -1.0, EdwQueryExecutionStatus.FAILED, {} if self.aggregated_query_status(query_name): perf = self.aggregated_query_execution_time(query_name=query_name) exec_status = EdwQueryExecutionStatus.SUCCESSFUL agg_md = self.aggregated_query_metadata(query_name=query_name) query_metadata['execution_status'] = exec_status query_metadata.update(agg_md) return sample.Sample( 'edw_aggregated_query_time', perf, 'seconds', query_metadata ) def get_all_query_performance_samples( self, metadata: dict[str, Any] ) -> list[sample.Sample]: """Generates samples for all query performances. 
Benchmark relies on iteration runs to generate the raw query performance samples Benchmark appends the aggregated query performance sample Args: metadata: A dictionary of execution attributes to be merged with the query execution attributes, for eg. tpc suite, scale of dataset, etc. Returns: A list of samples (raw and aggregated) """ results = [] # Raw query performance samples for iteration, performance in self.iteration_performances.items(): iteration_metadata = copy.copy(metadata) iteration_metadata['iteration'] = iteration results.extend( performance.get_all_query_performance_samples(iteration_metadata) ) # Aggregated query performance samples for query in self.expected_queries: results.append( self.get_aggregated_query_performance_sample( query_name=query, metadata=metadata ) ) return results def get_aggregated_wall_time_performance_sample( self, metadata: dict[str, Any] ) -> sample.Sample: """Gets the wall time performance aggregated across all iterations. Args: metadata: A dictionary of execution attributes to be merged with the query execution attributes, for eg. tpc suite, scale of dataset, etc. Returns: A sample of aggregated (averaged) wall time. """ wall_times = [ iteration.get_wall_time() for iteration in self.iteration_performances.values() ] aggregated_wall_time = sum(wall_times) / self.total_iterations wall_time_metadata = copy.copy(metadata) wall_time_metadata['aggregation_method'] = 'mean' return sample.Sample( 'edw_aggregated_wall_time', aggregated_wall_time, 'seconds', wall_time_metadata, ) def get_wall_time_performance_samples(self, metadata: dict[str, Any]): """Generates samples for all wall time performances. Benchmark relies on iterations to generate the raw wall time performance samples. Benchmark appends the aggregated wall time performance sample Args: metadata: A dictionary of execution attributes to be merged with the query execution attributes, for eg. tpc suite, scale of dataset, etc. 
Returns: A list of samples (raw and aggregated) """ results = [] for iteration, performance in self.iteration_performances.items(): iteration_metadata = copy.copy(metadata) iteration_metadata['iteration'] = iteration results.append( performance.get_wall_time_performance_sample(iteration_metadata) ) results.append( self.get_aggregated_wall_time_performance_sample(metadata=metadata) ) return results def get_aggregated_geomean_performance_sample( self, metadata: dict[str, Any] ) -> sample.Sample: """Gets the geomean performance aggregated across all iterations. Args: metadata: A dictionary of execution attributes to be merged with the query execution attributes, for eg. tpc suite, scale of dataset, etc. Returns: A sample of aggregated geomean Raises: EdwPerformanceAggregationError: If the benchmark conatins a failed query execution. """ if not self.is_successful(): raise EdwPerformanceAggregationError('Benchmark contains a failed query.') aggregated_geo_mean = geometric_mean([ self.aggregated_query_execution_time(query_name=query) for query in self.expected_queries ]) geomean_metadata = copy.copy(metadata) geomean_metadata['intra_query_aggregation_method'] = 'mean' geomean_metadata['inter_query_aggregation_method'] = 'geomean' return sample.Sample( 'edw_aggregated_geomean', aggregated_geo_mean, 'seconds', geomean_metadata, ) def get_queries_geomean_performance_samples( self, metadata: dict[str, Any] ) -> list[sample.Sample]: """Generates samples for all geomean performances. Benchmark relies on iteration runs to generate the raw geomean performance samples Benchmark appends the aggregated geomean performance sample Args: metadata: A dictionary of execution attributes to be merged with the query execution attributes, for eg. tpc suite, scale of dataset, etc. 
Returns: A list of samples (raw and aggregated) Raises: EdwPerformanceAggregationError: If the benchmark conatins a failed query execution """ if not self.is_successful(): raise EdwPerformanceAggregationError('Benchmark contains a failed query.') results = [] for iteration, performance in self.iteration_performances.items(): iteration_metadata = copy.copy(metadata) iteration_metadata['iteration'] = iteration results.append( performance.get_queries_geomean_performance_sample( self.expected_queries, iteration_metadata ) ) results.append( self.get_aggregated_geomean_performance_sample(metadata=metadata) ) return results