@@ -42,7 +42,7 @@ void ggml_sycl_host_free(void* ptr);
4242
4343extern  int  g_ggml_sycl_debug;
4444extern  int  g_ggml_sycl_disable_optimize;
45- extern  int  g_ggml_sycl_disable_mmvq ;
45+ extern  int  g_ggml_sycl_prioritize_dmmv ;
4646
4747#define  GGML_SYCL_DEBUG (...)        \
4848  do  {                              \
@@ -286,11 +286,25 @@ struct ggml_tensor_extra_gpu {
286286
287287void  release_extra_gpu (ggml_tensor_extra_gpu * extra, std::vector<queue_ptr> streams={});
288288
// check_gpu_optimize_feature: builds and returns (by value) an optimize_feature
// for the given device architecture. The only field assigned here is `reorder`.
// In this hunk the removed ('-') version ignored `arch` and always set
// opt.reorder = true; the added ('+') version sets opt.reorder to true only when
// `arch` equals one of the Intel GPU architectures enumerated below.
289- inline  optimize_feature check_gpu_optimize_feature (syclex::architecture &/* arch*/  ) {
289+ inline  optimize_feature check_gpu_optimize_feature (syclex::architecture &arch) {
290290    optimize_feature opt;
291291
292-     //  TODO: Romain change to Intel vendor?
293-     opt.reorder  = true ;
// Explicit allow-list: any architecture not named in this comparison chain
// yields opt.reorder == false.
292+     opt.reorder  =
293+         (arch == syclex::architecture::intel_gpu_dg1 ||
294+          arch == syclex::architecture::intel_gpu_acm_g10 ||
295+          arch == syclex::architecture::intel_gpu_acm_g11 ||
296+          arch == syclex::architecture::intel_gpu_acm_g12 ||
297+          arch == syclex::architecture::intel_gpu_pvc ||
298+          arch == syclex::architecture::intel_gpu_pvc_vg ||
299+          arch == syclex::architecture::intel_gpu_mtl_u ||
300+          arch == syclex::architecture::intel_gpu_mtl_s ||
301+          arch == syclex::architecture::intel_gpu_mtl_h ||
302+          arch == syclex::architecture::intel_gpu_arl_u ||
303+          arch == syclex::architecture::intel_gpu_arl_s ||
304+          arch == syclex::architecture::intel_gpu_arl_h ||
305+          arch == syclex::architecture::intel_gpu_bmg_g21 ||
306+          arch == syclex::architecture::intel_gpu_lnl_m
307+         );
294308
295309    return  opt;
296310}
0 commit comments