Skip to content

Commit 7b3288c

Browse files
committed
Make matmul intensity consistent through all benchs
1 parent d8c4e11 commit 7b3288c

File tree

2 files changed

+51
-50
lines changed

2 files changed

+51
-50
lines changed

bench/ndarray/roofline-analysis.py

Lines changed: 3 additions & 2 deletions
Original file line numberDiff line numberDiff line change
@@ -153,8 +153,9 @@ def setup_arrays(mem_mode: bool):
153153
shape = (15_000, 15_000)
154154
large_shape = (2,) + shape
155155
else:
156-
shape = (30_000, 30_000)
157-
large_shape = (15,) + shape
156+
# shape = (30_000, 30_000)
157+
shape = (15_000, 15_000)
158+
large_shape = (60,) + shape
158159

159160
nelem = math.prod(shape)
160161
large_nelem = math.prod(large_shape)

bench/ndarray/roofline-plot.py

Lines changed: 48 additions & 48 deletions
Original file line numberDiff line numberDiff line change
@@ -31,15 +31,15 @@
3131
{'blosc2': {'low': {'GFLOPS': 2.570591026389536,
3232
'Intensity': 5.5,
3333
'Time': 28.884407997131348},
34-
'matmul0': {'GFLOPS': 140.5119122729633,
35-
'Intensity': 2000,
36-
'Time': 0.12810301780700684},
37-
'matmul1': {'GFLOPS': 451.58033046881854,
34+
'matmul0': {'GFLOPS': 46.26183975097429,
35+
'Intensity': 1000,
36+
'Time': 0.04863619804382324},
37+
'matmul1': {'GFLOPS': 438.1365321396617,
38+
'Intensity': 5000,
39+
'Time': 0.641923189163208},
40+
'matmul2': {'GFLOPS': 448.8428100084526,
3841
'Intensity': 10000,
39-
'Time': 4.982502222061157},
40-
'matmul2': {'GFLOPS': 31.289500989233293,
41-
'Intensity': 20000,
42-
'Time': 575.2728369235992},
42+
'Time': 5.012890815734863},
4343
'medium': {'GFLOPS': 14.146962346220464,
4444
'Intensity': 36.75,
4545
'Time': 35.06936597824097},
@@ -49,15 +49,15 @@
4949
'blosc2-nocomp': {'low': {'GFLOPS': 0.03860960944488331,
5050
'Intensity': 5.5,
5151
'Time': 1923.0963759422302},
52-
'matmul0': {'GFLOPS': 45.80092854633905,
53-
'Intensity': 2000,
54-
'Time': 0.3930051326751709},
55-
'matmul1': {'GFLOPS': 397.06715432984515,
52+
'matmul0': {'GFLOPS': 32.9184188862999,
53+
'Intensity': 1000,
54+
'Time': 0.06835079193115234},
55+
'matmul1': {'GFLOPS': 375.8405170559847,
56+
'Intensity': 5000,
57+
'Time': 0.7483227252960205},
58+
'matmul2': {'GFLOPS': 399.46900484462606,
5659
'Intensity': 10000,
57-
'Time': 5.666547775268555},
58-
'matmul2': {'GFLOPS': 17.419778699450802,
59-
'Intensity': 20000,
60-
'Time': 1033.3081901073456},
60+
'Time': 5.632477045059204},
6161
'medium': {'GFLOPS': 0.46027450974226586,
6262
'Intensity': 36.75,
6363
'Time': 1077.8893671035767},
@@ -67,15 +67,15 @@
6767
'numpy/numexpr': {'low': {'GFLOPS': 0.03342497696428004,
6868
'Intensity': 5.5,
6969
'Time': 2221.3927052021027},
70-
'matmul0': {'GFLOPS': 2.5741052434472507,
71-
'Intensity': 2000,
72-
'Time': 6.992721080780029},
73-
'matmul1': {'GFLOPS': 285.998135244872,
70+
'matmul0': {'GFLOPS': 3.6124326198946726,
71+
'Intensity': 1000,
72+
'Time': 0.6228489875793457},
73+
'matmul1': {'GFLOPS': 93.36108303946814,
74+
'Intensity': 5000,
75+
'Time': 3.0124971866607666},
76+
'matmul2': {'GFLOPS': 277.86243889802796,
7477
'Intensity': 10000,
75-
'Time': 7.867184162139893},
76-
'matmul2': {'GFLOPS': 452.12915677286617,
77-
'Intensity': 20000,
78-
'Time': 39.81163287162781},
78+
'Time': 8.097532033920288},
7979
'medium': {'GFLOPS': 0.09460263438020816,
8080
'Intensity': 36.75,
8181
'Time': 5244.3042759895325},
@@ -145,15 +145,15 @@
145145
{'blosc2': {'low': {'GFLOPS': 2.6569613592385535,
146146
'Intensity': 5.5,
147147
'Time': 27.945457220077515},
148-
'matmul0': {'GFLOPS': 110.16077007145368,
149-
'Intensity': 2000,
150-
'Time': 0.16339755058288574},
151-
'matmul1': {'GFLOPS': 278.1667526617581,
148+
'matmul0': {'GFLOPS': 12.553085867977686,
149+
'Intensity': 1000,
150+
'Time': 0.17923879623413086},
151+
'matmul1': {'GFLOPS': 240.360991381506,
152+
'Intensity': 5000,
153+
'Time': 1.1701149940490723},
154+
'matmul2': {'GFLOPS': 268.0288488506098,
152155
'Intensity': 10000,
153-
'Time': 8.08867335319519},
154-
'matmul2': {'GFLOPS': 254.47585605595123,
155-
'Intensity': 20000,
156-
'Time': 70.73362588882446},
156+
'Time': 8.39461874961853},
157157
'medium': {'GFLOPS': 15.532085276343903,
158158
'Intensity': 36.75,
159159
'Time': 31.941944122314453},
@@ -163,15 +163,15 @@
163163
'blosc2-nocomp': {'low': {'GFLOPS': 1.0313162899034,
164164
'Intensity': 5.5,
165165
'Time': 71.99537205696106},
166-
'matmul0': {'GFLOPS': 5.026447790269603,
167-
'Intensity': 2000,
168-
'Time': 3.5810577869415283},
169-
'matmul1': {'GFLOPS': 240.53695304016009,
166+
'matmul0': {'GFLOPS': 14.36429529261525,
167+
'Intensity': 1000,
168+
'Time': 0.15663838386535645},
169+
'matmul1': {'GFLOPS': 215.303286764059,
170+
'Intensity': 5000,
171+
'Time': 1.3062968254089355},
172+
'matmul2': {'GFLOPS': 273.333776088537,
170173
'Intensity': 10000,
171-
'Time': 9.354072093963623},
172-
'matmul2': {'GFLOPS': 244.4603185993202,
173-
'Intensity': 20000,
174-
'Time': 73.63158202171326},
174+
'Time': 8.231693983078003},
175175
'medium': {'GFLOPS': 6.643671590137467,
176176
'Intensity': 36.75,
177177
'Time': 74.67632818222046},
@@ -181,15 +181,15 @@
181181
'numpy/numexpr': {'low': {'GFLOPS': 1.357592296775474,
182182
'Intensity': 5.5,
183183
'Time': 54.69241404533386},
184-
'matmul0': {'GFLOPS': 2.7506948651842946,
185-
'Intensity': 2000,
186-
'Time': 6.5438010692596436},
187-
'matmul1': {'GFLOPS': 275.4348725971461,
184+
'matmul0': {'GFLOPS': 14.61036282906348,
185+
'Intensity': 1000,
186+
'Time': 0.15400028228759766},
187+
'matmul1': {'GFLOPS': 219.1569896084874,
188+
'Intensity': 5000,
189+
'Time': 1.2833266258239746},
190+
'matmul2': {'GFLOPS': 309.16178854453585,
188191
'Intensity': 10000,
189-
'Time': 8.16890025138855},
190-
'matmul2': {'GFLOPS': 342.9817247403082,
191-
'Intensity': 20000,
192-
'Time': 52.48093032836914},
192+
'Time': 7.277742862701416},
193193
'medium': {'GFLOPS': 7.66225952699885,
194194
'Intensity': 36.75,
195195
'Time': 64.74917721748352},

0 commit comments

Comments
 (0)