|  | #!/usr/bin/env python3 | 
|  | # Copyright 2021 The IREE Authors | 
|  | # | 
|  | # Licensed under the Apache License v2.0 with LLVM Exceptions. | 
|  | # See https://llvm.org/LICENSE.txt for license information. | 
|  | # SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception | 
|  | """Upload benchmark results to IREE Benchmark Dashboards. | 
|  |  | 
|  | This script is meant to be used by Buildkite for automation. | 
|  |  | 
|  | Example usage: | 
|  | # Export necessary environment variables: | 
|  | export IREE_DASHBOARD_URL=... | 
|  | export IREE_DASHBOARD_API_TOKEN=... | 
|  | # Then run the script: | 
|  | python3 upload_benchmarks.py /path/to/benchmark/json/file | 
|  | """ | 
|  |  | 
|  | import argparse | 
|  | import json | 
|  | import os | 
|  | import re | 
|  | import requests | 
|  | import subprocess | 
|  | import time | 
|  |  | 
|  | from typing import Any, Dict, Optional | 
|  | from common.benchmark_presentation import COMPILATION_METRICS_TO_TABLE_MAPPERS, collect_all_compilation_metrics | 
|  | from common.benchmark_definition import (BenchmarkInfo, BenchmarkResults, | 
|  | execute_cmd_and_get_output) | 
|  | from common.benchmark_thresholds import BENCHMARK_THRESHOLDS | 
|  |  | 
# Base URL for linking an uploaded build back to its commit on GitHub.
IREE_GITHUB_COMMIT_URL_PREFIX = 'https://github.com/iree-org/iree/commit'
# Project identifier sent in every dashboard API payload.
IREE_PROJECT_ID = 'IREE'
# Directory containing this script; used as the cwd for git commands so they
# run inside the IREE checkout.
THIS_DIRECTORY = os.path.dirname(os.path.realpath(__file__))

# HTML footer appended to every series description on the dashboard.
# NOTE(review): "DESCRIIPTION" is misspelled ("DESCRIPTION"); the name is kept
# as-is because other code in this file references it.
COMMON_DESCRIIPTION = """
<br>
For the graph, the x axis is the Git commit index, and the y axis is the
measured latency in milliseconds.
<br>
See <a href="https://github.com/iree-org/iree/tree/main/benchmarks/dashboard.md">
https://github.com/iree-org/iree/tree/main/benchmarks/dashboard.md
</a> for benchmark philosophy, specification, and definitions.
"""

# A non-exhaustive list of models and their source URLs.
# For models listed here we can provide a nicer description for them on
# webpage.
IREE_TF_MODEL_SOURCE_URL = {
    'MobileBertSquad':
        'https://github.com/google-research/google-research/tree/master/mobilebert',
    'MobileNetV2':
        'https://www.tensorflow.org/api_docs/python/tf/keras/applications/MobileNetV2',
    'MobileNetV3Small':
        'https://www.tensorflow.org/api_docs/python/tf/keras/applications/MobileNetV3Small',
}

# Same as above, for models imported from TFLite rather than TensorFlow.
IREE_TFLITE_MODEL_SOURCE_URL = {
    'DeepLabV3':
        'https://tfhub.dev/tensorflow/lite-model/deeplabv3/1/default/1',
    'MobileSSD':
        'https://www.tensorflow.org/lite/performance/gpu#demo_app_tutorials',
    'PoseNet':
        'https://tfhub.dev/tensorflow/lite-model/posenet/mobilenet/float/075/1/default/1',
}
|  |  | 
|  |  | 
def get_model_description(model_name: str, model_source: str) -> Optional[str]:
    """Returns an HTML description linking the model to its source URL.

    Returns None when the model is not in the known source-URL tables.
    """
    # Pick the URL table matching the model's import source.
    url_tables = {
        "TensorFlow": IREE_TF_MODEL_SOURCE_URL,
        "TFLite": IREE_TFLITE_MODEL_SOURCE_URL,
    }
    url = url_tables.get(model_source, {}).get(model_name)
    if url is None:
        return None
    return f'{model_name} from <a href="{url}">{url}</a>.'
|  |  | 
|  |  | 
def get_git_commit_hash(commit: str, verbose: bool = False) -> str:
    """Resolves the given commit-ish to its full commit hash."""
    cmd = ['git', 'rev-parse', commit]
    return execute_cmd_and_get_output(cmd, cwd=THIS_DIRECTORY, verbose=verbose)
|  |  | 
|  |  | 
def get_git_total_commit_count(commit: str, verbose: bool = False) -> int:
    """Counts all commits in the history ending with the given commit.

    Used as a monotonically-increasing build id for the dashboard.
    """
    cmd = ['git', 'rev-list', '--count', commit]
    output = execute_cmd_and_get_output(cmd, cwd=THIS_DIRECTORY, verbose=verbose)
    return int(output)
|  |  | 
|  |  | 
def get_git_commit_info(commit: str, verbose: bool = False) -> Dict[str, str]:
    """Gets a commit information dictionary for the given commit.

    Returns a dict with keys 'hash', 'abbrevHash', 'authorName',
    'authorEmail', and 'subject'.
    """
    cmd = [
        'git', 'show', '--format=%H:::%h:::%an:::%ae:::%s', '--no-patch', commit
    ]
    info = execute_cmd_and_get_output(cmd, cwd=THIS_DIRECTORY, verbose=verbose)
    # Split at most 4 times: the subject is the last field and may itself
    # contain ':::', which an unbounded split would break apart.
    segments = info.split(':::', maxsplit=4)
    return {
        'hash': segments[0],
        'abbrevHash': segments[1],
        'authorName': segments[2],
        'authorEmail': segments[3],
        'subject': segments[4],
    }
|  |  | 
|  |  | 
def compose_series_payload(project_id: str,
                           series_id: str,
                           series_description: Optional[str] = None,
                           average_range: str = '5%',
                           average_min_count: int = 3,
                           better_criterion: str = 'smaller',
                           override: bool = False) -> Dict[str, Any]:
    """Composes the payload dictionary for a series.

    Args:
      project_id: the dashboard project the series belongs to.
      series_id: unique name identifying the series.
      series_description: optional HTML description shown on the dashboard.
        (Fixed: was mistyped as `bool`; it is an optional string.)
      average_range: threshold range used by the regression analysis.
      average_min_count: minimum samples required for the analysis.
      better_criterion: whether 'smaller' or larger values are better.
      override: whether an existing series may be overwritten.
    """
    payload = {
        'projectId': project_id,
        'serieId': series_id,
        'analyse': {
            'benchmark': {
                'range': average_range,
                'required': average_min_count,
                'trend': better_criterion,
            }
        },
        'override': override,
    }
    # 'description' is only attached when one was provided.
    if series_description is not None:
        payload['description'] = series_description
    return payload
|  |  | 
|  |  | 
def compose_build_payload(project_id: str,
                          project_github_comit_url: str,
                          build_id: int,
                          commit: str,
                          override: bool = False) -> Dict[str, Any]:
    """Composes the payload dictionary for a build.

    NOTE(review): the parameter name "comit" is misspelled; it is kept for
    backward compatibility with any keyword-argument callers.
    """
    # Attach the GitHub URL for this commit to the commit metadata.
    infos = get_git_commit_info(commit)
    infos['url'] = f'{project_github_comit_url}/{infos["hash"]}'
    return {
        'projectId': project_id,
        'build': {
            'buildId': build_id,
            'infos': infos,
        },
        'override': override,
    }
|  |  | 
|  |  | 
def compose_sample_payload(project_id: str,
                           series_id: str,
                           build_id: int,
                           sample_value: int,
                           override: bool = False) -> Dict[str, Any]:
    """Composes the payload dictionary for a sample."""
    sample = {'buildId': build_id, 'value': sample_value}
    return {
        'projectId': project_id,
        'serieId': series_id,
        'sample': sample,
        'override': override,
    }
|  |  | 
|  |  | 
def get_required_env_var(var: str) -> str:
    """Returns the value of the required environment variable *var*.

    Raises:
      RuntimeError: if the variable is not set.
    """
    try:
        return os.environ[var]
    except KeyError:
        raise RuntimeError(f'Missing environment variable "{var}"') from None
|  |  | 
|  |  | 
def post_to_dashboard(url: str,
                      payload: Dict[str, Any],
                      dry_run: bool = False,
                      verbose: bool = False):
    """Serializes *payload* as JSON and POSTs it to the dashboard *url*.

    In dry-run mode the request body is printed and nothing is sent.
    Raises requests.RequestException on any non-200 response.
    """
    data = json.dumps(payload)
    if dry_run or verbose:
        print(f'API request payload: {data}')
    if dry_run:
        return

    # The API token is only required when actually talking to the server.
    api_token = get_required_env_var('IREE_DASHBOARD_API_TOKEN')
    headers = {
        'Content-type': 'application/json',
        'Authorization': f'Bearer {api_token}',
    }
    response = requests.post(url, data=data, headers=headers)
    if response.status_code != 200:
        raise requests.RequestException(
            f'Failed to post to dashboard server with status code {response.status_code}')
|  |  | 
|  |  | 
def add_new_iree_series(series_id: str,
                        series_description: Optional[str] = None,
                        override: bool = False,
                        dry_run: bool = False,
                        verbose: bool = False):
    """Posts a new series to the dashboard."""
    url = get_required_env_var('IREE_DASHBOARD_URL')

    # Use the first threshold whose regex matches this series to configure
    # the dashboard's regression-detection range.
    threshold = next(
        (t for t in BENCHMARK_THRESHOLDS if t.regex.match(series_id)), None)
    if threshold is None:
        raise ValueError(f"no matched threshold setting for benchmark: {series_id}")

    payload = compose_series_payload(IREE_PROJECT_ID,
                                     series_id,
                                     series_description,
                                     average_range=threshold.get_threshold_str(),
                                     override=override)
    post_to_dashboard(f'{url}/apis/addSerie',
                      payload,
                      dry_run=dry_run,
                      verbose=verbose)
|  |  | 
|  |  | 
def add_new_iree_build(build_id: int,
                       commit: str,
                       override: bool = False,
                       dry_run: bool = False,
                       verbose: bool = False):
    """Posts a new build to the dashboard."""
    dashboard_url = get_required_env_var('IREE_DASHBOARD_URL')
    build_payload = compose_build_payload(IREE_PROJECT_ID,
                                          IREE_GITHUB_COMMIT_URL_PREFIX,
                                          build_id, commit, override)
    post_to_dashboard(f'{dashboard_url}/apis/addBuild',
                      build_payload,
                      dry_run=dry_run,
                      verbose=verbose)
|  |  | 
|  |  | 
def add_new_sample(series_id: str,
                   build_id: int,
                   sample_value: int,
                   override: bool = False,
                   dry_run: bool = False,
                   verbose: bool = False):
    """Posts a new sample to the dashboard."""
    dashboard_url = get_required_env_var('IREE_DASHBOARD_URL')
    sample_payload = compose_sample_payload(IREE_PROJECT_ID, series_id,
                                            build_id, sample_value, override)
    post_to_dashboard(f'{dashboard_url}/apis/addSample',
                      sample_payload,
                      dry_run=dry_run,
                      verbose=verbose)
|  |  | 
|  |  | 
def parse_arguments():
    """Parses command-line options."""

    def _existing_file(path):
        # argparse treats ValueError from a type callback as a bad argument.
        if not os.path.isfile(path):
            raise ValueError(path)
        return path

    parser = argparse.ArgumentParser()
    parser.add_argument(
        '--benchmark_files',
        metavar='<benchmark-json-files>',
        type=_existing_file,
        required=True,
        nargs='+',
        help='Paths to the JSON files containing benchmark results')
    parser.add_argument(
        '--compile_stats_files',
        metavar='<compile-stats-json-files>',
        type=_existing_file,
        default=[],
        nargs='+',
        help='Paths to the JSON files containing compilation statistics')
    parser.add_argument(
        '--dry-run',
        action='store_true',
        help='Print the comment instead of posting to dashboard')
    parser.add_argument(
        '--verbose',
        action='store_true',
        help='Print internal information during execution')
    return parser.parse_args()
|  |  | 
|  |  | 
def _build_series_description(model_name: str, model_source: str) -> str:
    """Builds a series description: the model link (if known) plus the
    common dashboard footer."""
    description = get_model_description(model_name, model_source)
    if description is None:
        description = ""
    return description + COMMON_DESCRIIPTION


def main(args):
    """Uploads benchmark results and compilation metrics to the dashboard."""
    # Collect benchmark results from all files and merge them into the first.
    all_results = []
    for benchmark_file in args.benchmark_files:
        with open(benchmark_file) as f:
            all_results.append(BenchmarkResults.from_json_str(f.read()))
    for other_results in all_results[1:]:
        all_results[0].merge(other_results)
    all_results = all_results[0]

    # Register a new build for the current commit. The total commit count is
    # used as the monotonically-increasing build id.
    commit_hash = get_git_commit_hash(all_results.commit, verbose=args.verbose)
    commit_count = get_git_total_commit_count(commit_hash, verbose=args.verbose)

    # Allow override to support uploading data for the same build in
    # different batches.
    add_new_iree_build(commit_count,
                       commit_hash,
                       override=True,
                       dry_run=args.dry_run,
                       verbose=args.verbose)

    # Get the mean time for all benchmarks, keyed by their unique names.
    aggregate_results = {}
    for benchmark_index, benchmark_case in enumerate(all_results.benchmarks):
        benchmark_info = benchmark_case.benchmark_info

        # Make sure each benchmark has a unique name.
        name = str(benchmark_info)
        if name in aggregate_results:
            raise ValueError(f"Duplicated benchmarks: {name}")

        mean_time = all_results.get_aggregate_time(benchmark_index, "mean")
        aggregate_results[name] = (mean_time, benchmark_info)

    # Upload benchmark results to the dashboard.
    for series_id, (sample_value, benchmark_info) in aggregate_results.items():
        description = _build_series_description(benchmark_info.model_name,
                                                benchmark_info.model_source)
        # Override by default to allow updates to the series.
        add_new_iree_series(series_id,
                            description,
                            override=True,
                            dry_run=args.dry_run,
                            verbose=args.verbose)
        add_new_sample(series_id,
                       commit_count,
                       sample_value,
                       dry_run=args.dry_run,
                       verbose=args.verbose)

    # Upload compilation statistics for this commit, one series per metric.
    all_compilation_metrics = collect_all_compilation_metrics(
        compile_stats_files=args.compile_stats_files,
        expected_pr_commit=commit_hash)
    for name, compile_metrics in all_compilation_metrics.items():
        description = _build_series_description(
            compile_metrics.compilation_info.model_name,
            compile_metrics.compilation_info.model_source)

        for mapper in COMPILATION_METRICS_TO_TABLE_MAPPERS:
            sample_value, _ = mapper.get_current_and_base_value(compile_metrics)
            series_id = mapper.get_series_name(name)
            # Override by default to allow updates to the series.
            add_new_iree_series(series_id,
                                description,
                                override=True,
                                dry_run=args.dry_run,
                                verbose=args.verbose)
            add_new_sample(series_id,
                           commit_count,
                           sample_value,
                           dry_run=args.dry_run,
                           verbose=args.verbose)
|  |  | 
|  |  | 
|  | if __name__ == "__main__": | 
|  | main(parse_arguments()) |