| #!/usr/bin/env vpython3 |
| # Copyright 2021 The Chromium Authors |
| # Use of this source code is governed by a BSD-style license that can be |
| # found in the LICENSE file. |
| """Script for finding and suppressing flaky GPU tests. |
| |
This relies on ResultDB BigQuery data under the hood, so it requires the `bq`
tool, which is available as part of the Google Cloud SDK:
https://cloud.google.com/sdk/docs/quickstarts.
| |
Example usage, which finds all failures in the past 5 days. Any test that
failed more than twice on a configuration is marked as flaky, and any that
failed more than 5 times is marked as failing:
| |
| suppress_flakes.py \ |
| --project chrome-unexpected-pass-data \ |
| --sample-period 5 |
| """ |
| import os |
| import sys |
| |
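# Resolve the Chromium src/ root and make //testing importable so that the
# flake_suppressor modules below can be found.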
CHROMIUM_SRC_DIR = os.path.abspath(
    os.path.join(os.path.dirname(__file__), '..', '..', '..'))
| sys.path.append(os.path.join(CHROMIUM_SRC_DIR, 'testing')) |
| |
| # pylint: disable=wrong-import-position |
| from flake_suppressor_common import argument_parsing |
| from flake_suppressor_common import result_output |
| from flake_suppressor_common import tag_utils as common_tag_utils |
| from flake_suppressor import gpu_expectations |
| from flake_suppressor import gpu_queries |
from flake_suppressor import gpu_results as results_module
from flake_suppressor import gpu_tag_utils as tag_utils
| # pylint: enable=wrong-import-position |
| |
| |
| def main(): |
| args = argument_parsing.ParseArgs() |
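  # Route the shared suppression machinery through the GPU-specific tag
  # implementation.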
| common_tag_utils.SetTagUtilsImplementation(tag_utils.GpuTagUtils) |
| expectations_processor = gpu_expectations.GpuExpectationProcessor() |
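  # Suppressions are written into the checkout's expectation files, so refuse
  # to run on a stale checkout unless the check is explicitly bypassed.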
| if not args.bypass_up_to_date_check: |
| expectations_processor.AssertCheckoutIsUpToDate() |
| |
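  # The querier pulls results for the requested sample period from the given
  # BigQuery project and hands the rows to the GPU result processor.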
| results_processor = results_module.GpuResultProcessor(expectations_processor) |
| querier_instance = gpu_queries.GpuBigQueryQuerier(args.sample_period, |
| args.project, |
| results_processor) |
| |
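  # Gather flaky/failing results from both CI and try builders, then aggregate
  # them for reporting and suppression.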
| results = querier_instance.GetFlakyOrFailingCiTests() |
| results.extend(querier_instance.GetFlakyOrFailingTryTests()) |
| aggregated_results = results_processor.AggregateResults(results) |
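  # Emit an HTML summary of the aggregated results, written to the requested
  # output file if one was provided.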
| if args.result_output_file: |
| with open(args.result_output_file, 'w', encoding='utf-8') as outfile: |
| result_output.GenerateHtmlOutputFile(aggregated_results, outfile) |
| else: |
| result_output.GenerateHtmlOutputFile(aggregated_results) |
  print('If there are many instances of failed tests, that may indicate an '
        'issue that should be handled in some other way, e.g. reverting a '
        'bad CL.')
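  # With prompting enabled, the user decides how each result is handled;
  # otherwise, suppressions are generated automatically based on the ignore
  # and flaky thresholds and the per-configuration result counts.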
| if args.prompt_for_user_input: |
    input('\nBeginning of user input section - press Enter to continue')
| expectations_processor.IterateThroughResultsForUser(aggregated_results, |
| args.group_by_tags, |
| args.include_all_tags) |
| else: |
| result_counts = querier_instance.GetResultCounts() |
| expectations_processor.IterateThroughResultsWithThresholds( |
| aggregated_results, args.group_by_tags, result_counts, |
| args.ignore_threshold, args.flaky_threshold, args.include_all_tags) |
| print('\nGenerated expectations will need to have bugs manually added.') |
| print('\nGenerated expectations likely contain conflicting tags that need to ' |
| 'be removed.') |
| |
| |
| if __name__ == '__main__': |
| main() |