We read every piece of feedback, and take your input very seriously.
To see all available qualifiers, see our documentation.
1 parent e99c858 commit 009c4dcCopy full SHA for 009c4dc
diag/conv1d.py
@@ -10,16 +10,16 @@
10
11
# Parameters
12
13
-channel_in = 3
14
-channel_out = channel_in
+batch_size=16384
15
length = 512
+k = 3
16
+channel_in = 1
17
+channel_out = channel_in
18
-n0 = 16384
19
+n0 = batch_size
20
n1 = length*channel_out
21
n2 = 1
-k = 2
22
-batch_size=n0*n2
23
# i0, i1, i2 = torch.meshgrid(
24
# torch.arange(batch_size, device=device, dtype=real_t),
25
# torch.arange(channel_in, device=device, dtype=real_t),
@@ -61,6 +61,7 @@ def sum_and_normalize(data):
61
output = conv1d_scripted(data) # Use pre-compiled model
62
torch.cuda.synchronize()
63
end.record()
64
+torch.cuda.synchronize()
65
elapsed_time = start.elapsed_time(end)/1000
66
67
# Compute final sum and normalization
0 commit comments