@@ -42,7 +42,7 @@ void ggml_sycl_host_free(void* ptr);
4242
// Global integer flags declared `extern` here; their definitions are not part of this hunk.
// The hunk replaces the g_ggml_sycl_disable_mmvq declaration (`-` line) with
// g_ggml_sycl_prioritize_dmmv (`+` line).
// NOTE(review): what each flag's value means is not visible here; confirm at the definitions.
4343extern int g_ggml_sycl_debug;
4444extern int g_ggml_sycl_disable_optimize;
45- extern int g_ggml_sycl_disable_mmvq ;
45+ extern int g_ggml_sycl_prioritize_dmmv ;
4646
4747#define GGML_SYCL_DEBUG (...) \
4848 do { \
@@ -286,11 +286,25 @@ struct ggml_tensor_extra_gpu {
286286
// Declaration only: takes a ggml_tensor_extra_gpu pointer and a vector of queue_ptr that
// defaults to empty. The definition is not part of this hunk.
// NOTE(review): presumably releases resources held by `extra`; confirm at the definition.
287287void release_extra_gpu (ggml_tensor_extra_gpu * extra, std::vector<queue_ptr> streams={});
288288
// Builds and returns (by value) the optimize_feature record for the GPU architecture `arch`.
// This hunk replaces the unconditional `opt.reorder = true` (the `-` lines, where the
// parameter was unnamed) with an allow-list (the `+` lines): `reorder` becomes true only
// when `arch` equals one of the listed syclex::architecture::intel_gpu_* values, and false
// for any other architecture. `reorder` is the only member assigned in this function.
289- inline optimize_feature check_gpu_optimize_feature (syclex::architecture &/* arch*/ ) {
289+ inline optimize_feature check_gpu_optimize_feature (syclex::architecture &arch) {
290290 optimize_feature opt;
291291
292- // TODO: Romain change to Intel vendor?
293- opt.reorder = true ;
// New version: explicit equality test against each Intel GPU architecture enumerator.
292+ opt.reorder =
293+ (arch == syclex::architecture::intel_gpu_dg1 ||
294+ arch == syclex::architecture::intel_gpu_acm_g10 ||
295+ arch == syclex::architecture::intel_gpu_acm_g11 ||
296+ arch == syclex::architecture::intel_gpu_acm_g12 ||
297+ arch == syclex::architecture::intel_gpu_pvc ||
298+ arch == syclex::architecture::intel_gpu_pvc_vg ||
299+ arch == syclex::architecture::intel_gpu_mtl_u ||
300+ arch == syclex::architecture::intel_gpu_mtl_s ||
301+ arch == syclex::architecture::intel_gpu_mtl_h ||
302+ arch == syclex::architecture::intel_gpu_arl_u ||
303+ arch == syclex::architecture::intel_gpu_arl_s ||
304+ arch == syclex::architecture::intel_gpu_arl_h ||
305+ arch == syclex::architecture::intel_gpu_bmg_g21 ||
306+ arch == syclex::architecture::intel_gpu_lnl_m
307+ );
294308
295309 return opt;
296310}
0 commit comments