@@ -132,11 +132,10 @@ def __init__(self, target: tuple) -> None:
132132 raise TypeError ("target.arch is not a dict" )
133133 dirname = os .path .dirname (os .path .realpath (__file__ ))
134134 mod = compile_module_from_src (Path (os .path .join (dirname , "arch_parser.c" )).read_text (), "arch_utils" )
135- # breakpoint()
136- # self.device_arch = mod.parse_device_arch(target.arch.get('architecture', 0))
137- # self.properties = self.parse_target(target.arch)
138- self .device_arch = "dg2"
139- self .properties = {'name' : 'Intel(R) Arc(TM) A770 Graphics' , 'platform_name' : 'Intel(R) oneAPI Unified Runtime over Level-Zero' , 'vendor' : 'Intel(R) Corporation' , 'version' : '12.55.8' , 'gpu_eu_count' : 512 , 'gpu_subslice_count' : 32 , 'max_work_group_size' : 1024 , 'max_num_sub_groups' : 128 , 'sub_group_sizes' : [8 , 16 , 32 ], 'has_fp64' : False , 'has_subgroup_matrix_multiply_accumulate' : True , 'has_subgroup_matrix_multiply_accumulate_tensor_float32' : False , 'has_subgroup_2d_block_io' : False , 'has_bfloat16_conversions' : True }
135+ self .device_arch = mod .parse_device_arch (target .arch .get ('architecture' , 0 ))
136+ self .properties = self .parse_target (target .arch )
137+ # self.device_arch = "dg2"
138+ # self.properties = {'name': 'Intel(R) Arc(TM) A770 Graphics', 'platform_name': 'Intel(R) oneAPI Unified Runtime over Level-Zero', 'vendor': 'Intel(R) Corporation', 'version': '12.55.8', 'gpu_eu_count': 512, 'gpu_subslice_count': 32, 'max_work_group_size': 1024, 'max_num_sub_groups': 128, 'sub_group_sizes': [8, 16, 32], 'has_fp64': False, 'has_subgroup_matrix_multiply_accumulate': True, 'has_subgroup_matrix_multiply_accumulate_tensor_float32': False, 'has_subgroup_2d_block_io': False, 'has_bfloat16_conversions': True}
140139 print ("DEVICE PROPS:" )
141140 print (self .device_arch )
142141 print (self .properties )
@@ -331,7 +330,7 @@ def make_llir(src, metadata, options):
331330 if options .extern_libs :
332331 paths = [path for (name , path ) in options .extern_libs ]
333332 llvm .link_extern_libs (llvm_mod , paths )
334- intel .optimize_module (llvm_mod , llvm .OPTIMIZE_O3 )
333+ intel .optimize_module (llvm_mod , llvm .OPTIMIZE_O0 )
335334 intel .post_process_llir (llvm_mod )
336335
337336 # Get some metadata
0 commit comments