@@ -850,14 +850,96 @@ struct get_device_info_impl<
850
850
matrix_type::sint32, matrix_type::sint32},
851
851
{8 , 0 , 0 , 0 , 16 , 16 , matrix_type::fp16, matrix_type::fp16,
852
852
matrix_type::fp32, matrix_type::fp32},
853
+ {8 , 0 , 0 , 0 , 16 , 16 , matrix_type::fp16, matrix_type::fp16,
854
+ matrix_type::fp16, matrix_type::fp32},
855
+ {8 , 0 , 0 , 0 , 16 , 16 , matrix_type::fp16, matrix_type::fp16,
856
+ matrix_type::fp32, matrix_type::fp16},
857
+ {8 , 0 , 0 , 0 , 16 , 16 , matrix_type::fp16, matrix_type::fp16,
858
+ matrix_type::fp16, matrix_type::fp16},
859
+ {0 , 0 , 0 , 16 , 16 , 16 , matrix_type::fp16, matrix_type::fp16,
860
+ matrix_type::fp32, matrix_type::fp16},
861
+ {0 , 0 , 0 , 16 , 16 , 16 , matrix_type::fp16, matrix_type::fp16,
862
+ matrix_type::fp16, matrix_type::fp16},
863
+ {0 , 0 , 0 , 1 , 64 , 16 , matrix_type::fp16, matrix_type::fp16,
864
+ matrix_type::fp32, matrix_type::fp32},
865
+ {0 , 0 , 0 , 1 , 64 , 16 , matrix_type::fp16, matrix_type::fp16,
866
+ matrix_type::fp16, matrix_type::fp32},
867
+ {0 , 0 , 0 , 1 , 64 , 16 , matrix_type::fp16, matrix_type::fp16,
868
+ matrix_type::fp32, matrix_type::fp16},
869
+ {0 , 0 , 0 , 1 , 64 , 16 , matrix_type::fp16, matrix_type::fp16,
870
+ matrix_type::fp16, matrix_type::fp16},
871
+ {0 , 0 , 0 , 32 , 64 , 16 , matrix_type::fp16, matrix_type::fp16,
872
+ matrix_type::fp32, matrix_type::fp32},
873
+ {0 , 0 , 0 , 32 , 64 , 16 , matrix_type::fp16, matrix_type::fp16,
874
+ matrix_type::fp16, matrix_type::fp32},
875
+ {0 , 0 , 0 , 32 , 64 , 16 , matrix_type::fp16, matrix_type::fp16,
876
+ matrix_type::fp32, matrix_type::fp16},
877
+ {0 , 0 , 0 , 32 , 64 , 16 , matrix_type::fp16, matrix_type::fp16,
878
+ matrix_type::fp16, matrix_type::fp16},
879
+ {0 , 0 , 0 , 1 , 64 , 32 , matrix_type::fp16, matrix_type::fp16,
880
+ matrix_type::fp32, matrix_type::fp32},
881
+ {0 , 0 , 0 , 1 , 64 , 32 , matrix_type::fp16, matrix_type::fp16,
882
+ matrix_type::fp16, matrix_type::fp32},
883
+ {0 , 0 , 0 , 1 , 64 , 32 , matrix_type::fp16, matrix_type::fp16,
884
+ matrix_type::fp32, matrix_type::fp16},
885
+ {0 , 0 , 0 , 1 , 64 , 32 , matrix_type::fp16, matrix_type::fp16,
886
+ matrix_type::fp16, matrix_type::fp16},
887
+ {0 , 0 , 0 , 32 , 64 , 32 , matrix_type::fp16, matrix_type::fp16,
888
+ matrix_type::fp32, matrix_type::fp32},
889
+ {0 , 0 , 0 , 32 , 64 , 32 , matrix_type::fp16, matrix_type::fp16,
890
+ matrix_type::fp16, matrix_type::fp32},
891
+ {0 , 0 , 0 , 32 , 64 , 32 , matrix_type::fp16, matrix_type::fp16,
892
+ matrix_type::fp32, matrix_type::fp16},
893
+ {0 , 0 , 0 , 32 , 64 , 32 , matrix_type::fp16, matrix_type::fp16,
894
+ matrix_type::fp16, matrix_type::fp16},
895
+ {8 , 0 , 0 , 0 , 16 , 16 , matrix_type::bf16 , matrix_type::bf16 ,
896
+ matrix_type::bf16 , matrix_type::bf16 },
897
+ {8 , 0 , 0 , 0 , 16 , 16 , matrix_type::bf16 , matrix_type::bf16 ,
898
+ matrix_type::fp32, matrix_type::bf16 },
899
+ {8 , 0 , 0 , 0 , 16 , 16 , matrix_type::bf16 , matrix_type::bf16 ,
900
+ matrix_type::bf16 , matrix_type::fp32},
853
901
{8 , 0 , 0 , 0 , 16 , 16 , matrix_type::bf16 , matrix_type::bf16 ,
854
902
matrix_type::fp32, matrix_type::fp32},
855
903
{0 , 0 , 0 , 16 , 16 , 16 , matrix_type::bf16 , matrix_type::bf16 ,
856
904
matrix_type::fp32, matrix_type::fp32},
905
+ {0 , 0 , 0 , 16 , 16 , 16 , matrix_type::bf16 , matrix_type::bf16 ,
906
+ matrix_type::bf16 , matrix_type::fp32},
907
+ {0 , 0 , 0 , 16 , 16 , 16 , matrix_type::bf16 , matrix_type::bf16 ,
908
+ matrix_type::fp32, matrix_type::bf16 },
909
+ {0 , 0 , 0 , 16 , 16 , 16 , matrix_type::bf16 , matrix_type::bf16 ,
910
+ matrix_type::bf16 , matrix_type::bf16 },
857
911
{0 , 0 , 0 , 1 , 64 , 16 , matrix_type::bf16 , matrix_type::bf16 ,
858
912
matrix_type::fp32, matrix_type::fp32},
913
+ {0 , 0 , 0 , 1 , 64 , 16 , matrix_type::bf16 , matrix_type::bf16 ,
914
+ matrix_type::bf16 , matrix_type::fp32},
915
+ {0 , 0 , 0 , 1 , 64 , 16 , matrix_type::bf16 , matrix_type::bf16 ,
916
+ matrix_type::fp32, matrix_type::bf16 },
917
+ {0 , 0 , 0 , 1 , 64 , 16 , matrix_type::bf16 , matrix_type::bf16 ,
918
+ matrix_type::bf16 , matrix_type::bf16 },
859
919
{0 , 0 , 0 , 32 , 64 , 16 , matrix_type::bf16 , matrix_type::bf16 ,
860
920
matrix_type::fp32, matrix_type::fp32},
921
+ {0 , 0 , 0 , 32 , 64 , 16 , matrix_type::bf16 , matrix_type::bf16 ,
922
+ matrix_type::bf16 , matrix_type::fp32},
923
+ {0 , 0 , 0 , 32 , 64 , 16 , matrix_type::bf16 , matrix_type::bf16 ,
924
+ matrix_type::fp32, matrix_type::bf16 },
925
+ {0 , 0 , 0 , 32 , 64 , 16 , matrix_type::bf16 , matrix_type::bf16 ,
926
+ matrix_type::bf16 , matrix_type::bf16 },
927
+ {0 , 0 , 0 , 1 , 64 , 32 , matrix_type::bf16 , matrix_type::bf16 ,
928
+ matrix_type::fp32, matrix_type::fp32},
929
+ {0 , 0 , 0 , 1 , 64 , 32 , matrix_type::bf16 , matrix_type::bf16 ,
930
+ matrix_type::bf16 , matrix_type::fp32},
931
+ {0 , 0 , 0 , 1 , 64 , 32 , matrix_type::bf16 , matrix_type::bf16 ,
932
+ matrix_type::fp32, matrix_type::bf16 },
933
+ {0 , 0 , 0 , 1 , 64 , 32 , matrix_type::bf16 , matrix_type::bf16 ,
934
+ matrix_type::bf16 , matrix_type::bf16 },
935
+ {0 , 0 , 0 , 32 , 64 , 32 , matrix_type::bf16 , matrix_type::bf16 ,
936
+ matrix_type::fp32, matrix_type::fp32},
937
+ {0 , 0 , 0 , 32 , 64 , 32 , matrix_type::bf16 , matrix_type::bf16 ,
938
+ matrix_type::bf16 , matrix_type::fp32},
939
+ {0 , 0 , 0 , 32 , 64 , 32 , matrix_type::bf16 , matrix_type::bf16 ,
940
+ matrix_type::fp32, matrix_type::bf16 },
941
+ {0 , 0 , 0 , 32 , 64 , 32 , matrix_type::bf16 , matrix_type::bf16 ,
942
+ matrix_type::bf16 , matrix_type::bf16 },
861
943
{8 , 0 , 0 , 0 , 16 , 8 , matrix_type::tf32, matrix_type::tf32,
862
944
matrix_type::fp32, matrix_type::fp32},
863
945
};
0 commit comments