Skip to content

Commit 18bd89f

Browse files
committed
Revert "change gemm function"
This reverts commit ab61eb4.
1 parent 626e867 commit 18bd89f

File tree

14 files changed

+548
-548
lines changed

14 files changed

+548
-548
lines changed

source/module_hamilt_lcao/module_gint/kernels/cuda/code_gen.cuh

Lines changed: 233 additions & 233 deletions
Large diffs are not rendered by default.
Lines changed: 23 additions & 23 deletions
Original file line number | Diff line number | Diff line change
@@ -1,48 +1,48 @@
11
#include "vbatch_matrix_mul.cuh"
22

3-
template void gemm_time_measure<double, 2, 16, 16, 32, 2, 2, 16, 2, 16>(int,int,const int*,const int*,const int*,const double* const*,const int*,const double* const*,const int*,double**,const int*,int,cudaStream_t,float&,matrix_multiple_func_type&,double*,double*,double*);
3+
template void gemm_time_measure<double, 2, 16, 16, 32, 2, 2, 16, 2, 16>(int, int, int*, int*, int*, double**, int*, double**, int*, double**, int*, int, cudaStream_t, float&, matrix_multiple_func_type&, double*, double*, double*);
44

5-
template void gemm_time_measure<double, 2, 16, 16, 32, 4, 2, 16, 2, 16>(int,int,const int*,const int*,const int*,const double* const*,const int*,const double* const*,const int*,double**,const int*,int,cudaStream_t,float&,matrix_multiple_func_type&,double*,double*,double*);
5+
template void gemm_time_measure<double, 2, 16, 16, 32, 4, 2, 16, 2, 16>(int,int,int*,int*,int*,double**,int*,double**,int*,double**,int*,int,cudaStream_t,float&,matrix_multiple_func_type&,double*,double*,double*);
66

7-
template void gemm_time_measure<double, 2, 16, 16, 32, 6, 2, 16, 2, 16>(int,int,const int*,const int*,const int*,const double* const*,const int*,const double* const*,const int*,double**,const int*,int,cudaStream_t,float&,matrix_multiple_func_type&,double*,double*,double*);
7+
template void gemm_time_measure<double, 2, 16, 16, 32, 6, 2, 16, 2, 16>(int,int,int*,int*,int*,double**,int*,double**,int*,double**,int*,int,cudaStream_t,float&,matrix_multiple_func_type&,double*,double*,double*);
88

9-
template void gemm_time_measure<double, 2, 16, 16, 32, 8, 2, 16, 2, 16>(int,int,const int*,const int*,const int*,const double* const*,const int*,const double* const*,const int*,double**,const int*,int,cudaStream_t,float&,matrix_multiple_func_type&,double*,double*,double*);
9+
template void gemm_time_measure<double, 2, 16, 16, 32, 8, 2, 16, 2, 16>(int,int,int*,int*,int*,double**,int*,double**,int*,double**,int*,int,cudaStream_t,float&,matrix_multiple_func_type&,double*,double*,double*);
1010

11-
template void gemm_time_measure<double, 2, 16, 16, 48, 2, 2, 16, 2, 16>(int,int,const int*,const int*,const int*,const double* const*,const int*,const double* const*,const int*,double**,const int*,int,cudaStream_t,float&,matrix_multiple_func_type&,double*,double*,double*);
11+
template void gemm_time_measure<double, 2, 16, 16, 48, 2, 2, 16, 2, 16>(int,int,int*,int*,int*,double**,int*,double**,int*,double**,int*,int,cudaStream_t,float&,matrix_multiple_func_type&,double*,double*,double*);
1212

13-
template void gemm_time_measure<double, 2, 16, 16, 48, 4, 2, 16, 2, 16>(int,int,const int*,const int*,const int*,const double* const*,const int*,const double* const*,const int*,double**,const int*,int,cudaStream_t,float&,matrix_multiple_func_type&,double*,double*,double*);
13+
template void gemm_time_measure<double, 2, 16, 16, 48, 4, 2, 16, 2, 16>(int,int,int*,int*,int*,double**,int*,double**,int*,double**,int*,int,cudaStream_t,float&,matrix_multiple_func_type&,double*,double*,double*);
1414

15-
template void gemm_time_measure<double, 2, 16, 16, 48, 6, 2, 16, 2, 16>(int,int,const int*,const int*,const int*,const double* const*,const int*,const double* const*,const int*,double**,const int*,int,cudaStream_t,float&,matrix_multiple_func_type&,double*,double*,double*);
15+
template void gemm_time_measure<double, 2, 16, 16, 48, 6, 2, 16, 2, 16>(int,int,int*,int*,int*,double**,int*,double**,int*,double**,int*,int,cudaStream_t,float&,matrix_multiple_func_type&,double*,double*,double*);
1616

17-
template void gemm_time_measure<double, 4, 8, 8, 24, 4, 4, 8, 4, 8>(int,int,const int*,const int*,const int*,const double* const*,const int*,const double* const*,const int*,double**,const int*,int,cudaStream_t,float&,matrix_multiple_func_type&,double*,double*,double*);
17+
template void gemm_time_measure<double, 4, 8, 8, 24, 4, 4, 8, 4, 8>(int,int,int*,int*,int*,double**,int*,double**,int*,double**,int*,int,cudaStream_t,float&,matrix_multiple_func_type&,double*,double*,double*);
1818

19-
template void gemm_time_measure<double, 4, 8, 8, 24, 8, 4, 8, 4, 8>(int,int,const int*,const int*,const int*,const double* const*,const int*,const double* const*,const int*,double**,const int*,int,cudaStream_t,float&,matrix_multiple_func_type&,double*,double*,double*);
19+
template void gemm_time_measure<double, 4, 8, 8, 24, 8, 4, 8, 4, 8>(int,int,int*,int*,int*,double**,int*,double**,int*,double**,int*,int,cudaStream_t,float&,matrix_multiple_func_type&,double*,double*,double*);
2020

21-
template void gemm_time_measure<double, 4, 8, 8, 24, 12, 4, 8, 4, 8>(int,int,const int*,const int*,const int*,const double* const*,const int*,const double* const*,const int*,double**,const int*,int,cudaStream_t,float&,matrix_multiple_func_type&,double*,double*,double*);
21+
template void gemm_time_measure<double, 4, 8, 8, 24, 12, 4, 8, 4, 8>(int,int,int*,int*,int*,double**,int*,double**,int*,double**,int*,int,cudaStream_t,float&,matrix_multiple_func_type&,double*,double*,double*);
2222

23-
template void gemm_time_measure<double, 4, 8, 8, 32, 4, 4, 8, 4, 8>(int,int,const int*,const int*,const int*,const double* const*,const int*,const double* const*,const int*,double**,const int*,int,cudaStream_t,float&,matrix_multiple_func_type&,double*,double*,double*);
23+
template void gemm_time_measure<double, 4, 8, 8, 32, 4, 4, 8, 4, 8>(int,int,int*,int*,int*,double**,int*,double**,int*,double**,int*,int,cudaStream_t,float&,matrix_multiple_func_type&,double*,double*,double*);
2424

25-
template void gemm_time_measure<double, 4, 8, 8, 32, 8, 4, 8, 4, 8>(int,int,const int*,const int*,const int*,const double* const*,const int*,const double* const*,const int*,double**,const int*,int,cudaStream_t,float&,matrix_multiple_func_type&,double*,double*,double*);
25+
template void gemm_time_measure<double, 4, 8, 8, 32, 8, 4, 8, 4, 8>(int,int,int*,int*,int*,double**,int*,double**,int*,double**,int*,int,cudaStream_t,float&,matrix_multiple_func_type&,double*,double*,double*);
2626

27-
template void gemm_time_measure<double, 4, 8, 8, 40, 4, 4, 8, 4, 8>(int,int,const int*,const int*,const int*,const double* const*,const int*,const double* const*,const int*,double**,const int*,int,cudaStream_t,float&,matrix_multiple_func_type&,double*,double*,double*);
27+
template void gemm_time_measure<double, 4, 8, 8, 40, 4, 4, 8, 4, 8>(int,int,int*,int*,int*,double**,int*,double**,int*,double**,int*,int,cudaStream_t,float&,matrix_multiple_func_type&,double*,double*,double*);
2828

29-
template void gemm_time_measure<double, 4, 8, 8, 40, 8, 4, 8, 4, 8>(int,int,const int*,const int*,const int*,const double* const*,const int*,const double* const*,const int*,double**,const int*,int,cudaStream_t,float&,matrix_multiple_func_type&,double*,double*,double*);
29+
template void gemm_time_measure<double, 4, 8, 8, 40, 8, 4, 8, 4, 8>(int,int,int*,int*,int*,double**,int*,double**,int*,double**,int*,int,cudaStream_t,float&,matrix_multiple_func_type&,double*,double*,double*);
3030

31-
template void gemm_time_measure<double, 4, 8, 8, 48, 4, 4, 8, 4, 8>(int,int,const int*,const int*,const int*,const double* const*,const int*,const double* const*,const int*,double**,const int*,int,cudaStream_t,float&,matrix_multiple_func_type&,double*,double*,double*);
31+
template void gemm_time_measure<double, 4, 8, 8, 48, 4, 4, 8, 4, 8>(int,int,int*,int*,int*,double**,int*,double**,int*,double**,int*,int,cudaStream_t,float&,matrix_multiple_func_type&,double*,double*,double*);
3232

33-
template void gemm_time_measure<double, 4, 8, 8, 56, 4, 4, 8, 4, 8>(int,int,const int*,const int*,const int*,const double* const*,const int*,const double* const*,const int*,double**,const int*,int,cudaStream_t,float&,matrix_multiple_func_type&,double*,double*,double*);
33+
template void gemm_time_measure<double, 4, 8, 8, 56, 4, 4, 8, 4, 8>(int,int,int*,int*,int*,double**,int*,double**,int*,double**,int*,int,cudaStream_t,float&,matrix_multiple_func_type&,double*,double*,double*);
3434

35-
template void gemm_time_measure<double, 4, 8, 8, 64, 4, 4, 8, 4, 8>(int,int,const int*,const int*,const int*,const double* const*,const int*,const double* const*,const int*,double**,const int*,int,cudaStream_t,float&,matrix_multiple_func_type&,double*,double*,double*);
35+
template void gemm_time_measure<double, 4, 8, 8, 64, 4, 4, 8, 4, 8>(int,int,int*,int*,int*,double**,int*,double**,int*,double**,int*,int,cudaStream_t,float&,matrix_multiple_func_type&,double*,double*,double*);
3636

37-
template void gemm_time_measure<double, 4, 8, 16, 16, 4, 4, 8, 4, 8>(int,int,const int*,const int*,const int*,const double* const*,const int*,const double* const*,const int*,double**,const int*,int,cudaStream_t,float&,matrix_multiple_func_type&,double*,double*,double*);
37+
template void gemm_time_measure<double, 4, 8, 16, 16, 4, 4, 8, 4, 8>(int,int,int*,int*,int*,double**,int*,double**,int*,double**,int*,int,cudaStream_t,float&,matrix_multiple_func_type&,double*,double*,double*);
3838

39-
template void gemm_time_measure<double, 4, 8, 16, 16, 8, 4, 8, 4, 8>(int,int,const int*,const int*,const int*,const double* const*,const int*,const double* const*,const int*,double**,const int*,int,cudaStream_t,float&,matrix_multiple_func_type&,double*,double*,double*);
39+
template void gemm_time_measure<double, 4, 8, 16, 16, 8, 4, 8, 4, 8>(int,int,int*,int*,int*,double**,int*,double**,int*,double**,int*,int,cudaStream_t,float&,matrix_multiple_func_type&,double*,double*,double*);
4040

41-
template void gemm_time_measure<double, 4, 8, 16, 16, 12, 4, 8, 4, 8>(int,int,const int*,const int*,const int*,const double* const*,const int*,const double* const*,const int*,double**,const int*,int,cudaStream_t,float&,matrix_multiple_func_type&,double*,double*,double*);
41+
template void gemm_time_measure<double, 4, 8, 16, 16, 12, 4, 8, 4, 8>(int,int,int*,int*,int*,double**,int*,double**,int*,double**,int*,int,cudaStream_t,float&,matrix_multiple_func_type&,double*,double*,double*);
4242

43-
template void gemm_time_measure<double, 4, 8, 16, 24, 4, 4, 8, 4, 8>(int,int,const int*,const int*,const int*,const double* const*,const int*,const double* const*,const int*,double**,const int*,int,cudaStream_t,float&,matrix_multiple_func_type&,double*,double*,double*);
43+
template void gemm_time_measure<double, 4, 8, 16, 24, 4, 4, 8, 4, 8>(int,int,int*,int*,int*,double**,int*,double**,int*,double**,int*,int,cudaStream_t,float&,matrix_multiple_func_type&,double*,double*,double*);
4444

45-
template void gemm_time_measure<double, 4, 8, 16, 24, 8, 4, 8, 4, 8>(int,int,const int*,const int*,const int*,const double* const*,const int*,const double* const*,const int*,double**,const int*,int,cudaStream_t,float&,matrix_multiple_func_type&,double*,double*,double*);
45+
template void gemm_time_measure<double, 4, 8, 16, 24, 8, 4, 8, 4, 8>(int,int,int*,int*,int*,double**,int*,double**,int*,double**,int*,int,cudaStream_t,float&,matrix_multiple_func_type&,double*,double*,double*);
4646

47-
template void gemm_time_measure<double, 4, 8, 16, 32, 4, 4, 8, 4, 8>(int,int,const int*,const int*,const int*,const double* const*,const int*,const double* const*,const int*,double**,const int*,int,cudaStream_t,float&,matrix_multiple_func_type&,double*,double*,double*);
47+
template void gemm_time_measure<double, 4, 8, 16, 32, 4, 4, 8, 4, 8>(int,int,int*,int*,int*,double**,int*,double**,int*,double**,int*,int,cudaStream_t,float&,matrix_multiple_func_type&,double*,double*,double*);
4848

0 commit comments

Comments
 (0)