# Licensed under the Apache License v2.0 with LLVM Exceptions.
# See https://llvm.org/LICENSE.txt for license information.
# SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
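# Runs the JAX test suite under the OpenXLA PJRT plugin, launching one pytest
# process per test with a per-test timeout. A typical invocation (the paths
# here are illustrative, not required by the script) might look like:
#
#   python test_jax.py tests/*_test.py -j 8 -t 120 \
#       -p passing.txt -f failing.txt -e expected.txt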
import argparse
import multiprocessing
import os
import random
import re
import subprocess
import sys
import time
from collections import namedtuple
from enum import Enum
parser = argparse.ArgumentParser(
    prog="test_jax.py", description="Run jax testsuite hermetically"
)
parser.add_argument("testfiles", nargs="*")
parser.add_argument("-t", "--timeout", type=float, default=60)
parser.add_argument("-l", "--logdir", default="/tmp/jaxtest")
parser.add_argument("-p", "--passing", default=None)
parser.add_argument("-f", "--failing", default=None)
parser.add_argument("-e", "--expected", default=None)
# Default to one worker per core; a bare None here would crash int(jobs) below.
parser.add_argument("-j", "--jobs", type=int, default=os.cpu_count())
args = parser.parse_args()
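
# Base pytest invocation: load the openxla_pjrt_artifacts plugin and write
# per-test artifacts under the chosen log directory.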
PYTEST_CMD = [
    "pytest",
    "-p",
    "openxla_pjrt_artifacts",
    f"--openxla-pjrt-artifact-dir={args.logdir}",
]
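
# Collect the individual test ids in one test file: "pytest --setup-only"
# reports each "file::Class::test" id without executing the test bodies.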
def get_test(test):
    print("Fetching from:", test)
    result = subprocess.run(PYTEST_CMD + ["--setup-only", test], capture_output=True)
    # Match on the decoded output rather than the CompletedProcess repr, and
    # stop ids at any whitespace so trailing newlines are not captured.
    lst = re.findall(r"::\S+::\S+", result.stdout.decode())
    return [test + func for func in lst]
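
# Collect ids from every test file in parallel, one worker per core, then
# flatten the per-file lists into a single sorted list.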
def get_tests(tests):
    fulltestlist = []
    with multiprocessing.Pool(os.cpu_count()) as p:
        fulltestlist = p.map(get_test, tests)
    fulltestlist = sorted([i for lst in fulltestlist for i in lst])
    return fulltestlist
def generate_test_commands(tests):
    cmds = []
    for test in tests:
        test_cmd = PYTEST_CMD + [test]
        cmds.append(test_cmd)
    return cmds
TestCase = namedtuple("TestCase", ["test", "timeout"])
TestResult = Enum("TestResult", ["SUCCESS", "FAILURE", "TIMEOUT"])
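
# Run one test command, emitting a single progress character per test:
# "." for a pass, "t" for a timeout, "f" for any other failure.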
def exec_test(testcase):
    command, timeout = testcase
    if float(timeout) > 0:
        # Wrap the test in GNU timeout so a hung test cannot stall the run.
        command = ["timeout", f"{timeout}"] + command
    start = time.perf_counter()
    result = subprocess.run(command, capture_output=True)
    end = time.perf_counter()
    elapsed = end - start
    timedout = (float(timeout) > 0) and (elapsed > float(timeout))
    if result.returncode == 0:
        sys.stdout.write(".")
        sys.stdout.flush()
        return TestResult.SUCCESS
    if timedout:
        sys.stdout.write("t")
        sys.stdout.flush()
        return TestResult.TIMEOUT
    sys.stdout.write("f")
    sys.stdout.flush()
    return TestResult.FAILURE
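
# Run the whole suite across a pool of `jobs` workers and bucket the commands
# by outcome. The command list is shuffled first, which spreads long-running
# tests across workers rather than clustering them on one.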
def exec_testsuite(commands, jobs, timeout):
    random.shuffle(commands)
    with_timeout = [TestCase(cmd, timeout) for cmd in commands]
    results = []
    with multiprocessing.Pool(int(jobs)) as p:
        results = p.map(exec_test, with_timeout)
    passing, timed_out, failing = [], [], []
    for result, cmd in zip(results, commands):
        if result == TestResult.SUCCESS:
            passing.append(cmd)
        elif result == TestResult.TIMEOUT:
            timed_out.append(cmd)
        elif result == TestResult.FAILURE:
            failing.append(cmd)
    print("")
    return passing, timed_out, failing
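
# Map each pytest command back to its bare "file::Class::test" id so results
# can be written to, and compared against, plain text lists.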
def get_testnames(cmd):
    names = []
    for c in cmd:
        testname = " ".join(c)
        testname = re.search("[^ /]*::[^ ]*::[^ ]*", testname)[0]
        names.append(testname)
    return names
def write_results(filename, results):
    if filename is not None:
        with open(filename, "w") as f:
            for line in results:
                f.write(line + "\n")
def load_results(filename):
    if not filename or not os.path.isfile(filename):
        return []
    expected = []
    with open(filename, "r") as f:
        for line in f:
            expected.append(line.strip())
    return expected
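
# Diff the current passing set against the expected baseline: baseline tests
# that no longer pass are regressions, and the converse are new passes.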
def compare_results(expected, passing):
    passing = set(passing)
    expected = set(expected)
    new_failures = expected - passing
    new_passing = passing - expected
    return new_passing, new_failures
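
# Main driver: collect the tests, run them, then write and summarize results.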
print("Querying All Tests")
tests = get_tests(args.testfiles)
print("Generating test suite")
commands = generate_test_commands(tests)
print(
    f"Executing {len(commands)} tests across {args.jobs} threads with timeout = {args.timeout}"
)
passing, timeout, failing = exec_testsuite(
    commands, jobs=args.jobs, timeout=args.timeout
)
expected = load_results(args.expected)
# Timed-out tests count as failures for reporting purposes.
failing = failing + timeout
# Get the testnames
passing = get_testnames(passing)
failing = get_testnames(failing)
write_results(args.passing, passing)
write_results(args.failing, failing)
print("Total:", len(commands))
print("Passing:", len(passing))
print("Failing:", len(failing))
print("Failing (timed out):", len(timeout))
if expected:
    new_passing, new_failures = compare_results(expected, passing)
    if new_passing:
        print("Newly Passing Tests:")
        for test in new_passing:
            print(" ", test)
    if new_failures:
        print("Newly Failing Tests:")
        for test in new_failures:
            print(" ", test)
    # Fail the run when fewer tests pass than the expected baseline.
    if len(expected) > len(passing):
        sys.exit(1)