benchmarks/fastrnns/test_bench.py - platform/external/pytorch - Git at Google

 import pytest

 import torch

 from .fuser import set_fuser
 from .runner import get_nn_runners


 @pytest.fixture(scope="class")
 def modeldef(request, net_name, executor, fuser):
     set_fuser(fuser, executor)

     # Given a 'net_name' provided by generate_tests, build the thing
     name, rnn_creator, context = get_nn_runners(net_name)[0]
     creator_args = creator_args = {
         "seqLength": 100,
         "numLayers": 1,
         "inputSize": 512,
         "hiddenSize": 512,
         "miniBatch": 64,
         "device": "cuda",
         "seed": None,
     }
     return rnn_creator(**creator_args)


 def cuda_sync(func, *args, **kwargs):
     out = func(*args, **kwargs)
     torch.cuda.synchronize()
     return out


 @pytest.mark.benchmark(
     warmup=True,
     warmup_iterations=3,
     disable_gc=True,
     max_time=0.1,
     group="fastrnns",
 )
 class TestBenchNetwork:
     # See 'modeldef' fixture, which provides the things to benchmark
     def test_forward(self, modeldef, benchmark):
         forward_output = benchmark(cuda_sync, modeldef.forward, *modeldef.inputs)

     def test_backward(self, modeldef, benchmark):
         backward_input = modeldef.forward(*modeldef.inputs)
         if modeldef.backward_setup is not None:
             backward_input = modeldef.backward_setup(backward_input)

         if modeldef.backward is not None:
             benchmark(cuda_sync, modeldef.backward, *backward_input, retain_graph=True)

             with torch.no_grad():
                 for param in modeldef.params:
                     assert param.grad is not None
                     param.grad.zero_()
	import pytest

	import torch

	from .fuser import set_fuser
	from .runner import get_nn_runners


	@pytest.fixture(scope="class")
	def modeldef(request, net_name, executor, fuser):
	set_fuser(fuser, executor)

	# Given a 'net_name' provided by generate_tests, build the thing
	name, rnn_creator, context = get_nn_runners(net_name)[0]
	creator_args = creator_args = {
	"seqLength": 100,
	"numLayers": 1,
	"inputSize": 512,
	"hiddenSize": 512,
	"miniBatch": 64,
	"device": "cuda",
	"seed": None,
	}
	return rnn_creator(**creator_args)


	def cuda_sync(func, args, *kwargs):
	out = func(args, *kwargs)
	torch.cuda.synchronize()
	return out


	@pytest.mark.benchmark(
	warmup=True,
	warmup_iterations=3,
	disable_gc=True,
	max_time=0.1,
	group="fastrnns",
	)
	class TestBenchNetwork:
	# See 'modeldef' fixture, which provides the things to benchmark
	def test_forward(self, modeldef, benchmark):
	forward_output = benchmark(cuda_sync, modeldef.forward, *modeldef.inputs)

	def test_backward(self, modeldef, benchmark):
	backward_input = modeldef.forward(*modeldef.inputs)
	if modeldef.backward_setup is not None:
	backward_input = modeldef.backward_setup(backward_input)

	if modeldef.backward is not None:
	benchmark(cuda_sync, modeldef.backward, *backward_input, retain_graph=True)

	with torch.no_grad():
	for param in modeldef.params:
	assert param.grad is not None
	param.grad.zero_()