|
74 | 74 | type *in1p = (type *) (in1); \
|
75 | 75 | type *op1p = (type *) (op1); \
|
76 | 76 | while (_n_ > _chunk_size) { \
|
77 |
| - vml_func((MKL_INT) _chunk_size, in1p, op1p); \ |
78 |
| - _n_ -= _chunk_size; \ |
79 |
| - in1p += _chunk_size; \ |
80 |
| - op1p += _chunk_size; \ |
| 77 | + npy_intp _current_chunk = (_n_ > _chunk_size) ? _chunk_size : _n_; \ |
| 78 | + vml_func((MKL_INT) _current_chunk, in1p, op1p); \ |
| 79 | + _n_ -= _current_chunk; \ |
| 80 | + in1p += _current_chunk; \ |
| 81 | + op1p += _current_chunk; \ |
81 | 82 | } \
|
82 | 83 | if (_n_) { \
|
83 | 84 | vml_func((MKL_INT) _n_, in1p, op1p); \
|
|
92 | 93 | type *in2p = (type *) (in2); \
|
93 | 94 | type *op1p = (type *) (op1); \
|
94 | 95 | while (_n_ > _chunk_size) { \
|
95 |
| - vml_func((MKL_INT) _chunk_size, in1p, in2p, op1p); \ |
96 |
| - _n_ -= _chunk_size; \ |
97 |
| - in1p += _chunk_size; \ |
98 |
| - in2p += _chunk_size; \ |
99 |
| - op1p += _chunk_size; \ |
| 96 | + npy_intp _current_chunk = (_n_ > _chunk_size) ? _chunk_size : _n_; \ |
| 97 | + vml_func((MKL_INT) _current_chunk, in1p, in2p, op1p); \ |
| 98 | + _n_ -= _current_chunk; \ |
| 99 | + in1p += _current_chunk; \ |
| 100 | + in2p += _current_chunk; \ |
| 101 | + op1p += _current_chunk; \ |
100 | 102 | } \
|
101 | 103 | if (_n_) { \
|
102 | 104 | vml_func((MKL_INT)_n_, in1p, in2p, op1p); \
|
|
115 | 117 | const type _scaleB = (scaleB); \
|
116 | 118 | const type _shiftB = (shiftB); \
|
117 | 119 | while (_n_ > _chunk_size) { \
|
118 |
| - vml_func(_chunk_size, in1p, in1p, _scaleA, _shiftA, _scaleB, _shiftB, op1p); \ |
119 |
| - _n_ -= _chunk_size; \ |
120 |
| - in1p += _chunk_size; \ |
121 |
| - op1p += _chunk_size; \ |
| 120 | + npy_intp _current_chunk = (_n_ > _chunk_size) ? _chunk_size : _n_; \ |
| 121 | + vml_func(_current_chunk, in1p, in1p, _scaleA, _shiftA, _scaleB, _shiftB, op1p); \ |
| 122 | + _n_ -= _current_chunk; \ |
| 123 | + in1p += _current_chunk; \ |
| 124 | + op1p += _current_chunk; \ |
122 | 125 | } \
|
123 | 126 | if (_n_) { \
|
124 | 127 | vml_func((MKL_INT)_n_, in1p, in1p, _scaleA, _shiftA, _scaleB, _shiftB, op1p); \
|
|
0 commit comments