Created
November 5, 2022 01:02
-
-
Save Birch-san/cba16789ec27bb20996a4b4831b13ce0 to your computer and use it in GitHub Desktop.
benchmark: batched matmul
This file contains hidden or bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
import torch | |
from torch import einsum, matmul, bmm | |
import time | |
repeats = 10 | |
batch_duration = 0 | |
for ix in range(repeats): | |
attn = torch.rand(16, 4096, 4096, dtype=torch.float, device="mps") | |
v = torch.rand(16, 4096, 40, dtype=torch.float, device="mps") | |
start = time.perf_counter() | |
einsum('b i j, b j d -> b i d', attn, v).max().item() | |
duration = time.perf_counter()-start | |
print('einsum 1 iteration %d took %.4f seconds' % (ix, duration)) | |
batch_duration += duration | |
print('%d iterations of einsum 1 took %.4f seconds; avg %.4f secs' % (repeats, batch_duration, batch_duration/repeats)) | |
batch_duration = 0 | |
for ix in range(repeats): | |
attn = torch.rand(16, 4096, 4096, dtype=torch.float, device="mps") | |
v = torch.rand(16, 4096, 40, dtype=torch.float, device="mps") | |
start = time.perf_counter() | |
matmul(attn, v).max().item() | |
duration = time.perf_counter()-start | |
print('matmul iteration %d took %.4f seconds' % (ix, duration)) | |
batch_duration += duration | |
print('%d iterations of matmul took %.4f seconds; avg %.4f secs' % (repeats, batch_duration, batch_duration/repeats)) | |
batch_duration = 0 | |
for ix in range(repeats): | |
attn = torch.rand(16, 4096, 4096, dtype=torch.float, device="mps") | |
v = torch.rand(16, 4096, 40, dtype=torch.float, device="mps") | |
start = time.perf_counter() | |
bmm(attn, v).max().item() | |
duration = time.perf_counter()-start | |
print('bmm iteration %d took %.4f seconds' % (ix, duration)) | |
batch_duration += duration | |
print('%d iterations of bmm took %.4f seconds; avg %.4f secs' % (repeats, batch_duration, batch_duration/repeats)) |
8 Heun steps, building on top of the baddbmm optimization from:
https://gist.github.com/Birch-san/8f3eb99deffdc3541595e46a01605dea
1.12.1
einsum + einsum:
9.688710416987306
1.14.0.dev20221103
einsum + einsum:
10.383701542014023
====
1.12.1
baddbmm + einsum:
9.598911916022189
1.14.0.dev20221103
baddbmm + einsum:
9.281007582991151
=====
1.12.1
baddbmm + bmm:
9.153142041992396
1.14.0.dev20221103:
baddbmm + bmm:
8.686828749952838
Sign up for free
to join this conversation on GitHub.
Already have an account?
Sign in to comment
PyTorch 1.12.1, MPS
comparing best times of einsum 1 vs bmm; .0393 vs .0404
bmm is ~2.8% slower