@@ -849,14 +849,96 @@ struct get_device_info_impl<
849849 matrix_type::sint32, matrix_type::sint32},
850850 {8 , 0 , 0 , 0 , 16 , 16 , matrix_type::fp16, matrix_type::fp16,
851851 matrix_type::fp32, matrix_type::fp32},
852+ {8 , 0 , 0 , 0 , 16 , 16 , matrix_type::fp16, matrix_type::fp16,
853+ matrix_type::fp16, matrix_type::fp32},
854+ {8 , 0 , 0 , 0 , 16 , 16 , matrix_type::fp16, matrix_type::fp16,
855+ matrix_type::fp32, matrix_type::fp16},
856+ {8 , 0 , 0 , 0 , 16 , 16 , matrix_type::fp16, matrix_type::fp16,
857+ matrix_type::fp16, matrix_type::fp16},
858+ {0 , 0 , 0 , 16 , 16 , 16 , matrix_type::fp16, matrix_type::fp16,
859+ matrix_type::fp32, matrix_type::fp16},
860+ {0 , 0 , 0 , 16 , 16 , 16 , matrix_type::fp16, matrix_type::fp16,
861+ matrix_type::fp16, matrix_type::fp16},
862+ {0 , 0 , 0 , 1 , 64 , 16 , matrix_type::fp16, matrix_type::fp16,
863+ matrix_type::fp32, matrix_type::fp32},
864+ {0 , 0 , 0 , 1 , 64 , 16 , matrix_type::fp16, matrix_type::fp16,
865+ matrix_type::fp16, matrix_type::fp32},
866+ {0 , 0 , 0 , 1 , 64 , 16 , matrix_type::fp16, matrix_type::fp16,
867+ matrix_type::fp32, matrix_type::fp16},
868+ {0 , 0 , 0 , 1 , 64 , 16 , matrix_type::fp16, matrix_type::fp16,
869+ matrix_type::fp16, matrix_type::fp16},
870+ {0 , 0 , 0 , 32 , 64 , 16 , matrix_type::fp16, matrix_type::fp16,
871+ matrix_type::fp32, matrix_type::fp32},
872+ {0 , 0 , 0 , 32 , 64 , 16 , matrix_type::fp16, matrix_type::fp16,
873+ matrix_type::fp16, matrix_type::fp32},
874+ {0 , 0 , 0 , 32 , 64 , 16 , matrix_type::fp16, matrix_type::fp16,
875+ matrix_type::fp32, matrix_type::fp16},
876+ {0 , 0 , 0 , 32 , 64 , 16 , matrix_type::fp16, matrix_type::fp16,
877+ matrix_type::fp16, matrix_type::fp16},
878+ {0 , 0 , 0 , 1 , 64 , 32 , matrix_type::fp16, matrix_type::fp16,
879+ matrix_type::fp32, matrix_type::fp32},
880+ {0 , 0 , 0 , 1 , 64 , 32 , matrix_type::fp16, matrix_type::fp16,
881+ matrix_type::fp16, matrix_type::fp32},
882+ {0 , 0 , 0 , 1 , 64 , 32 , matrix_type::fp16, matrix_type::fp16,
883+ matrix_type::fp32, matrix_type::fp16},
884+ {0 , 0 , 0 , 1 , 64 , 32 , matrix_type::fp16, matrix_type::fp16,
885+ matrix_type::fp16, matrix_type::fp16},
886+ {0 , 0 , 0 , 32 , 64 , 32 , matrix_type::fp16, matrix_type::fp16,
887+ matrix_type::fp32, matrix_type::fp32},
888+ {0 , 0 , 0 , 32 , 64 , 32 , matrix_type::fp16, matrix_type::fp16,
889+ matrix_type::fp16, matrix_type::fp32},
890+ {0 , 0 , 0 , 32 , 64 , 32 , matrix_type::fp16, matrix_type::fp16,
891+ matrix_type::fp32, matrix_type::fp16},
892+ {0 , 0 , 0 , 32 , 64 , 32 , matrix_type::fp16, matrix_type::fp16,
893+ matrix_type::fp16, matrix_type::fp16},
894+ {8 , 0 , 0 , 0 , 16 , 16 , matrix_type::bf16 , matrix_type::bf16 ,
895+ matrix_type::bf16 , matrix_type::bf16 },
896+ {8 , 0 , 0 , 0 , 16 , 16 , matrix_type::bf16 , matrix_type::bf16 ,
897+ matrix_type::fp32, matrix_type::bf16 },
898+ {8 , 0 , 0 , 0 , 16 , 16 , matrix_type::bf16 , matrix_type::bf16 ,
899+ matrix_type::bf16 , matrix_type::fp32},
852900 {8 , 0 , 0 , 0 , 16 , 16 , matrix_type::bf16 , matrix_type::bf16 ,
853901 matrix_type::fp32, matrix_type::fp32},
854902 {0 , 0 , 0 , 16 , 16 , 16 , matrix_type::bf16 , matrix_type::bf16 ,
855903 matrix_type::fp32, matrix_type::fp32},
904+ {0 , 0 , 0 , 16 , 16 , 16 , matrix_type::bf16 , matrix_type::bf16 ,
905+ matrix_type::bf16 , matrix_type::fp32},
906+ {0 , 0 , 0 , 16 , 16 , 16 , matrix_type::bf16 , matrix_type::bf16 ,
907+ matrix_type::fp32, matrix_type::bf16 },
908+ {0 , 0 , 0 , 16 , 16 , 16 , matrix_type::bf16 , matrix_type::bf16 ,
909+ matrix_type::bf16 , matrix_type::bf16 },
856910 {0 , 0 , 0 , 1 , 64 , 16 , matrix_type::bf16 , matrix_type::bf16 ,
857911 matrix_type::fp32, matrix_type::fp32},
912+ {0 , 0 , 0 , 1 , 64 , 16 , matrix_type::bf16 , matrix_type::bf16 ,
913+ matrix_type::bf16 , matrix_type::fp32},
914+ {0 , 0 , 0 , 1 , 64 , 16 , matrix_type::bf16 , matrix_type::bf16 ,
915+ matrix_type::fp32, matrix_type::bf16 },
916+ {0 , 0 , 0 , 1 , 64 , 16 , matrix_type::bf16 , matrix_type::bf16 ,
917+ matrix_type::bf16 , matrix_type::bf16 },
858918 {0 , 0 , 0 , 32 , 64 , 16 , matrix_type::bf16 , matrix_type::bf16 ,
859919 matrix_type::fp32, matrix_type::fp32},
920+ {0 , 0 , 0 , 32 , 64 , 16 , matrix_type::bf16 , matrix_type::bf16 ,
921+ matrix_type::bf16 , matrix_type::fp32},
922+ {0 , 0 , 0 , 32 , 64 , 16 , matrix_type::bf16 , matrix_type::bf16 ,
923+ matrix_type::fp32, matrix_type::bf16 },
924+ {0 , 0 , 0 , 32 , 64 , 16 , matrix_type::bf16 , matrix_type::bf16 ,
925+ matrix_type::bf16 , matrix_type::bf16 },
926+ {0 , 0 , 0 , 1 , 64 , 32 , matrix_type::bf16 , matrix_type::bf16 ,
927+ matrix_type::fp32, matrix_type::fp32},
928+ {0 , 0 , 0 , 1 , 64 , 32 , matrix_type::bf16 , matrix_type::bf16 ,
929+ matrix_type::bf16 , matrix_type::fp32},
930+ {0 , 0 , 0 , 1 , 64 , 32 , matrix_type::bf16 , matrix_type::bf16 ,
931+ matrix_type::fp32, matrix_type::bf16 },
932+ {0 , 0 , 0 , 1 , 64 , 32 , matrix_type::bf16 , matrix_type::bf16 ,
933+ matrix_type::bf16 , matrix_type::bf16 },
934+ {0 , 0 , 0 , 32 , 64 , 32 , matrix_type::bf16 , matrix_type::bf16 ,
935+ matrix_type::fp32, matrix_type::fp32},
936+ {0 , 0 , 0 , 32 , 64 , 32 , matrix_type::bf16 , matrix_type::bf16 ,
937+ matrix_type::bf16 , matrix_type::fp32},
938+ {0 , 0 , 0 , 32 , 64 , 32 , matrix_type::bf16 , matrix_type::bf16 ,
939+ matrix_type::fp32, matrix_type::bf16 },
940+ {0 , 0 , 0 , 32 , 64 , 32 , matrix_type::bf16 , matrix_type::bf16 ,
941+ matrix_type::bf16 , matrix_type::bf16 },
860942 {8 , 0 , 0 , 0 , 16 , 8 , matrix_type::tf32, matrix_type::tf32,
861943 matrix_type::fp32, matrix_type::fp32},
862944 };
0 commit comments