Skip to content

Instantly share code, notes, and snippets.

@sandeepkumar-skb
Created December 21, 2020 22:30
Show Gist options
  • Save sandeepkumar-skb/794600adc584c3aabc53475486c2ae96 to your computer and use it in GitHub Desktop.
Save sandeepkumar-skb/794600adc584c3aabc53475486c2ae96 to your computer and use it in GitHub Desktop.
import torch
# Benchmark: time `num_iter` square matrix multiplications on the GPU using
# CUDA events.
n = 1024
x = torch.randn(n, n, device='cuda')
y = torch.randn(n, n, device='cuda')
num_iter = 100

# Warmup: run the same workload untimed, then wait for all queued GPU work to
# finish so none of it overlaps with the timed region below.
for _ in range(num_iter):
    z = torch.matmul(x, y)
torch.cuda.synchronize()

# CUDA events are recorded on the GPU stream, so the measured interval covers
# the device-side execution between the two record() calls.
start = torch.cuda.Event(enable_timing=True)
end = torch.cuda.Event(enable_timing=True)

start.record()
for _ in range(num_iter):
    z = torch.matmul(x, y)
end.record()

# Block until the `end` event has completed; elapsed_time() requires both
# events to have been recorded and completed.
end.synchronize()

# Total time for all `num_iter` multiplications (not per iteration), in
# milliseconds.
duration = start.elapsed_time(end)
print("Duration: {:.4f} ms".format(duration))
Sign up for free to join this conversation on GitHub. Already have an account? Sign in to comment