File tree Expand file tree Collapse file tree 1 file changed +10
-1
lines changed
Expand file tree Collapse file tree 1 file changed +10
-1
lines changed Original file line number Diff line number Diff line change @@ -111,7 +111,7 @@ struct MatrixSplit {
111111 }
112112
113113 /* Split the matrix using round-to-nearest. This is an implementation of
114- * Algorithm 8 in
114+ * Algorithm 8 in:
115115 *
116116 * Uchino Y., Ozaki K., Imamura T. Performance enhancement of the Ozaki
117117 * scheme on integer matrix multiplication unit. arXiv:2409.13313 [cs.DC]. 2024.
@@ -139,6 +139,15 @@ struct MatrixSplit {
139139 }
140140 }
141141
142+ /* Split the matrix using bit masking, which is equivalent to truncation.
143+ * This is an implementation of Algorithm 4 in:
144+ *
145+ * Ootomo H., Ozaki K., Yokota R. DGEMM on integer matrix multiplication
146+ * unit. Int. J. High Performance Comput. App. 2024;38(4):297-313.
147+ * DOI: 10.1177/10943420241239588
148+ *
149+ * Integer products are accumulated in floating-point arithmetic one by one.
150+ */
142151 void computeSplitsWithBitMasking () {
143152 this ->splitType = splittingStrategy::bitMasking;
144153 // Compute splits one row/column at a time.
You can’t perform that action at this time.
0 commit comments