Skip to content

Commit ff69048

Browse files
authored
[SYCL][Matrix] Add matrix combinations 16x16x16 and 32x64x16 bfloat16 for PVC (intel#12026)
1 parent 8083f8a commit ff69048

File tree

3 files changed

+13
-3
lines changed

3 files changed

+13
-3
lines changed

sycl/doc/extensions/experimental/sycl_ext_matrix/sycl_ext_oneapi_matrix.asciidoc

+5 -3
Original file line numberDiff line numberDiff line change
@@ -915,9 +915,11 @@ architecture::intel_gpu_dg2_g11, architecture::intel_gpu_dg2_g12`
915 915
`matrix_type::fp32` .2+| +<=+ 8 | 16 .2+| 16 |
916 916
`architecture::intel_gpu_pvc`|8| `architecture::intel_gpu_dg2_g10,
917 917
architecture::intel_gpu_dg2_g11, architecture::intel_gpu_dg2_g12`
918-
.2+| `matrix_type::bf16` .2+| `matrix_type::bf16` .2+|
919-
`matrix_type::fp32` .2+| +<=+ 8 | 16 .2+| 16 |
920-
`architecture::intel_gpu_pvc` |8| `architecture::intel_gpu_dg2_g10,
918+
.4+| `matrix_type::bf16` .4+| `matrix_type::bf16` .4+|
919+
`matrix_type::fp32` | 16 | 16 | 16 .3+|`architecture::intel_gpu_pvc` |
920+
32 | 64 | 16
921+
.2+| +<=+ 8 | 16 .2+| 16
922+
|8 | `architecture::intel_gpu_dg2_g10,
921 923
architecture::intel_gpu_dg2_g11, architecture::intel_gpu_dg2_g12`
922 924
| `matrix_type::tf32` | `matrix_type::tf32` |
923 925
`matrix_type::fp32` | +<=+ 8 | 16 | 8 |

sycl/source/detail/device_info.hpp

+4
Original file line numberDiff line numberDiff line change
@@ -763,6 +763,10 @@ struct get_device_info_impl<
763 763
matrix_type::fp32, matrix_type::fp32},
764 764
{8, 0, 0, 0, 16, 16, matrix_type::bf16, matrix_type::bf16,
765 765
matrix_type::fp32, matrix_type::fp32},
766+
{0, 0, 0, 16, 16, 16, matrix_type::bf16, matrix_type::bf16,
767+
matrix_type::fp32, matrix_type::fp32},
768+
{0, 0, 0, 32, 64, 16, matrix_type::bf16, matrix_type::bf16,
769+
matrix_type::fp32, matrix_type::fp32},
766 770
{8, 0, 0, 0, 16, 8, matrix_type::tf32, matrix_type::tf32,
767 771
matrix_type::fp32, matrix_type::fp32},
768 772
};

sycl/test-e2e/Matrix/runtime_query_pvc.cpp

+4
Original file line numberDiff line numberDiff line change
@@ -28,6 +28,10 @@ int main() {
28 28
matrix_type::fp32, matrix_type::fp32},
29 29
{8, 0, 0, 0, 16, 16, matrix_type::bf16, matrix_type::bf16,
30 30
matrix_type::fp32, matrix_type::fp32},
31+
{0, 0, 0, 16, 16, 16, matrix_type::bf16, matrix_type::bf16,
32+
matrix_type::fp32, matrix_type::fp32},
33+
{0, 0, 0, 32, 64, 16, matrix_type::bf16, matrix_type::bf16,
34+
matrix_type::fp32, matrix_type::fp32},
31 35
{8, 0, 0, 0, 16, 8, matrix_type::tf32, matrix_type::tf32,
32 36
matrix_type::fp32, matrix_type::fp32},
33 37
};

0 commit comments

Comments
 (0)