@@ -6,7 +6,6 @@ function prefetchisagoodidea(ls::LoopSet, op::Operation, td::UnrollArgs)
6
6
isvectorized (op) || return 0
7
7
((u₁ > 1 ) & (u₂max > 1 )) || return 0
8
8
u₂loopsym === Symbol (" ##undefined##" ) && return 0
9
- # @show cache_lnsze(ls) reg_size(ls) pointer_from_objref(ls.register_size)
10
9
dontskip = (cache_lnsze (ls) ÷ reg_size (ls)) - 1
11
10
# u₂loopsym is vectorized
12
11
# u₁vectorized = vectorized === u₁loopsym
@@ -209,7 +208,6 @@ function lower_load_for_optranslation!(
209
208
step₂ = gethint (step (u₂loop))
210
209
# abs of steps are equal
211
210
equal_steps = (step₁ == step₂) ⊻ (posindicator ≠ 0x03 )
212
- # @show step₁, step₂, posindicator, equal_steps
213
211
_td = UnrollArgs (u₁loop, u₂loop, vloop, u₁, u₂max, Core. ifelse (equal_steps, 0 , u₂max - 1 ))
214
212
gespinds = mem_offset (op, _td, inds_by_ptroff, false , ls)
215
213
ptr = vptr (op)
@@ -230,7 +228,6 @@ function lower_load_for_optranslation!(
230
228
indices = copy (getindices (ref))
231
229
# old_translation_index = indices[translationind]
232
230
# indices[translationind] = u₁loop.itersymbol
233
- # @show indices, translationind, vloop
234
231
# getindicesonly returns a view of `getindices`
235
232
dummyref = ArrayReference (ref. array, indices, zero (getoffsets (ref)), getstrides (ref))
236
233
# loopedindex[translationind] = true
@@ -249,10 +246,8 @@ function lower_load_for_optranslation!(
249
246
end
250
247
end
251
248
end
252
- # @show indices
253
249
_td = UnrollArgs (u₁loop, u₂loop, vloop, total_unroll, u₂max, - 1 )
254
250
op. ref = dummymref
255
- # @show isu₁unrolled(op), isu₂unrolled(op)
256
251
_lower_load! (q, ls, op, _td, mask)
257
252
# set old values
258
253
op. ref = mref
@@ -329,7 +324,6 @@ function _lower_load!(
329
324
omop = offsetloadcollection (ls)
330
325
@unpack opids, opidcollectionmap, batchedcollections, batchedcollectionmap = omop
331
326
batchid, opind = batchedcollectionmap[identifier (op)]
332
- @show batchid, opind
333
327
for (bid, oid) ∈ batchedcollectionmap # this relies on `for op ∈ ops` in codegen/operation_evaluation_order.jl
334
328
if bid == batchid
335
329
if oid == opind
@@ -362,7 +356,6 @@ function rejectcurly(ls::LoopSet, op::Operation, u₁loopsym::Symbol, vloopsym::
362
356
li = op. ref. loopedindex
363
357
AV = AU = false
364
358
for (n,ind) ∈ enumerate (indices)
365
- # @show AU, op, n, ind, vloopsym, u₁loopsym
366
359
if li[n]
367
360
if ind === vloopsym
368
361
AV && return true
@@ -374,7 +367,6 @@ function rejectcurly(ls::LoopSet, op::Operation, u₁loopsym::Symbol, vloopsym::
374
367
end
375
368
else
376
369
opp = findop (parents (op), ind)
377
- # @show opp
378
370
if isvectorized (opp)
379
371
AV && return true
380
372
AV = true
0 commit comments