@@ -850,14 +850,96 @@ struct get_device_info_impl<
850850 matrix_type::sint32, matrix_type::sint32},
851851 {8 , 0 , 0 , 0 , 16 , 16 , matrix_type::fp16, matrix_type::fp16,
852852 matrix_type::fp32, matrix_type::fp32},
853+ {8 , 0 , 0 , 0 , 16 , 16 , matrix_type::fp16, matrix_type::fp16,
854+ matrix_type::fp16, matrix_type::fp32},
855+ {8 , 0 , 0 , 0 , 16 , 16 , matrix_type::fp16, matrix_type::fp16,
856+ matrix_type::fp32, matrix_type::fp16},
857+ {8 , 0 , 0 , 0 , 16 , 16 , matrix_type::fp16, matrix_type::fp16,
858+ matrix_type::fp16, matrix_type::fp16},
859+ {0 , 0 , 0 , 16 , 16 , 16 , matrix_type::fp16, matrix_type::fp16,
860+ matrix_type::fp32, matrix_type::fp16},
861+ {0 , 0 , 0 , 16 , 16 , 16 , matrix_type::fp16, matrix_type::fp16,
862+ matrix_type::fp16, matrix_type::fp16},
863+ {0 , 0 , 0 , 1 , 64 , 16 , matrix_type::fp16, matrix_type::fp16,
864+ matrix_type::fp32, matrix_type::fp32},
865+ {0 , 0 , 0 , 1 , 64 , 16 , matrix_type::fp16, matrix_type::fp16,
866+ matrix_type::fp16, matrix_type::fp32},
867+ {0 , 0 , 0 , 1 , 64 , 16 , matrix_type::fp16, matrix_type::fp16,
868+ matrix_type::fp32, matrix_type::fp16},
869+ {0 , 0 , 0 , 1 , 64 , 16 , matrix_type::fp16, matrix_type::fp16,
870+ matrix_type::fp16, matrix_type::fp16},
871+ {0 , 0 , 0 , 32 , 64 , 16 , matrix_type::fp16, matrix_type::fp16,
872+ matrix_type::fp32, matrix_type::fp32},
873+ {0 , 0 , 0 , 32 , 64 , 16 , matrix_type::fp16, matrix_type::fp16,
874+ matrix_type::fp16, matrix_type::fp32},
875+ {0 , 0 , 0 , 32 , 64 , 16 , matrix_type::fp16, matrix_type::fp16,
876+ matrix_type::fp32, matrix_type::fp16},
877+ {0 , 0 , 0 , 32 , 64 , 16 , matrix_type::fp16, matrix_type::fp16,
878+ matrix_type::fp16, matrix_type::fp16},
879+ {0 , 0 , 0 , 1 , 64 , 32 , matrix_type::fp16, matrix_type::fp16,
880+ matrix_type::fp32, matrix_type::fp32},
881+ {0 , 0 , 0 , 1 , 64 , 32 , matrix_type::fp16, matrix_type::fp16,
882+ matrix_type::fp16, matrix_type::fp32},
883+ {0 , 0 , 0 , 1 , 64 , 32 , matrix_type::fp16, matrix_type::fp16,
884+ matrix_type::fp32, matrix_type::fp16},
885+ {0 , 0 , 0 , 1 , 64 , 32 , matrix_type::fp16, matrix_type::fp16,
886+ matrix_type::fp16, matrix_type::fp16},
887+ {0 , 0 , 0 , 32 , 64 , 32 , matrix_type::fp16, matrix_type::fp16,
888+ matrix_type::fp32, matrix_type::fp32},
889+ {0 , 0 , 0 , 32 , 64 , 32 , matrix_type::fp16, matrix_type::fp16,
890+ matrix_type::fp16, matrix_type::fp32},
891+ {0 , 0 , 0 , 32 , 64 , 32 , matrix_type::fp16, matrix_type::fp16,
892+ matrix_type::fp32, matrix_type::fp16},
893+ {0 , 0 , 0 , 32 , 64 , 32 , matrix_type::fp16, matrix_type::fp16,
894+ matrix_type::fp16, matrix_type::fp16},
895+ {8 , 0 , 0 , 0 , 16 , 16 , matrix_type::bf16 , matrix_type::bf16 ,
896+ matrix_type::bf16 , matrix_type::bf16 },
897+ {8 , 0 , 0 , 0 , 16 , 16 , matrix_type::bf16 , matrix_type::bf16 ,
898+ matrix_type::fp32, matrix_type::bf16 },
899+ {8 , 0 , 0 , 0 , 16 , 16 , matrix_type::bf16 , matrix_type::bf16 ,
900+ matrix_type::bf16 , matrix_type::fp32},
853901 {8 , 0 , 0 , 0 , 16 , 16 , matrix_type::bf16 , matrix_type::bf16 ,
854902 matrix_type::fp32, matrix_type::fp32},
855903 {0 , 0 , 0 , 16 , 16 , 16 , matrix_type::bf16 , matrix_type::bf16 ,
856904 matrix_type::fp32, matrix_type::fp32},
905+ {0 , 0 , 0 , 16 , 16 , 16 , matrix_type::bf16 , matrix_type::bf16 ,
906+ matrix_type::bf16 , matrix_type::fp32},
907+ {0 , 0 , 0 , 16 , 16 , 16 , matrix_type::bf16 , matrix_type::bf16 ,
908+ matrix_type::fp32, matrix_type::bf16 },
909+ {0 , 0 , 0 , 16 , 16 , 16 , matrix_type::bf16 , matrix_type::bf16 ,
910+ matrix_type::bf16 , matrix_type::bf16 },
857911 {0 , 0 , 0 , 1 , 64 , 16 , matrix_type::bf16 , matrix_type::bf16 ,
858912 matrix_type::fp32, matrix_type::fp32},
913+ {0 , 0 , 0 , 1 , 64 , 16 , matrix_type::bf16 , matrix_type::bf16 ,
914+ matrix_type::bf16 , matrix_type::fp32},
915+ {0 , 0 , 0 , 1 , 64 , 16 , matrix_type::bf16 , matrix_type::bf16 ,
916+ matrix_type::fp32, matrix_type::bf16 },
917+ {0 , 0 , 0 , 1 , 64 , 16 , matrix_type::bf16 , matrix_type::bf16 ,
918+ matrix_type::bf16 , matrix_type::bf16 },
859919 {0 , 0 , 0 , 32 , 64 , 16 , matrix_type::bf16 , matrix_type::bf16 ,
860920 matrix_type::fp32, matrix_type::fp32},
921+ {0 , 0 , 0 , 32 , 64 , 16 , matrix_type::bf16 , matrix_type::bf16 ,
922+ matrix_type::bf16 , matrix_type::fp32},
923+ {0 , 0 , 0 , 32 , 64 , 16 , matrix_type::bf16 , matrix_type::bf16 ,
924+ matrix_type::fp32, matrix_type::bf16 },
925+ {0 , 0 , 0 , 32 , 64 , 16 , matrix_type::bf16 , matrix_type::bf16 ,
926+ matrix_type::bf16 , matrix_type::bf16 },
927+ {0 , 0 , 0 , 1 , 64 , 32 , matrix_type::bf16 , matrix_type::bf16 ,
928+ matrix_type::fp32, matrix_type::fp32},
929+ {0 , 0 , 0 , 1 , 64 , 32 , matrix_type::bf16 , matrix_type::bf16 ,
930+ matrix_type::bf16 , matrix_type::fp32},
931+ {0 , 0 , 0 , 1 , 64 , 32 , matrix_type::bf16 , matrix_type::bf16 ,
932+ matrix_type::fp32, matrix_type::bf16 },
933+ {0 , 0 , 0 , 1 , 64 , 32 , matrix_type::bf16 , matrix_type::bf16 ,
934+ matrix_type::bf16 , matrix_type::bf16 },
935+ {0 , 0 , 0 , 32 , 64 , 32 , matrix_type::bf16 , matrix_type::bf16 ,
936+ matrix_type::fp32, matrix_type::fp32},
937+ {0 , 0 , 0 , 32 , 64 , 32 , matrix_type::bf16 , matrix_type::bf16 ,
938+ matrix_type::bf16 , matrix_type::fp32},
939+ {0 , 0 , 0 , 32 , 64 , 32 , matrix_type::bf16 , matrix_type::bf16 ,
940+ matrix_type::fp32, matrix_type::bf16 },
941+ {0 , 0 , 0 , 32 , 64 , 32 , matrix_type::bf16 , matrix_type::bf16 ,
942+ matrix_type::bf16 , matrix_type::bf16 },
861943 {8 , 0 , 0 , 0 , 16 , 8 , matrix_type::tf32, matrix_type::tf32,
862944 matrix_type::fp32, matrix_type::fp32},
863945 };
0 commit comments