@@ -1158,8 +1158,6 @@ static int CreateAclTensorWeight(const void *hostData, const std::vector<int64_t
11581158 strides[i] = shape[i + 1 ] * strides[i + 1 ];
11591159 }
11601160
1161- // std::vector<int64_t> storageShape;
1162- // storageShape.push_back(size);
11631161 *tensor = aclCreateTensor (shape.data (), shape.size (), dataType, strides.data (), 0 , aclFormat::ACL_FORMAT_ND,
11641162 shape.data (), shape.size (), *deviceAddr);
11651163 return 0 ;
@@ -1169,13 +1167,9 @@ static void weight_format_to_nz(ggml_tensor *tensor, const void *data, size_t of
11691167 aclrtStream stream;
11701168 ACL_CHECK (aclrtCreateStream (&stream));
11711169
1172- std::vector<int64_t > weightShape = {tensor->ne [0 ], tensor->ne [1 ]};
11731170 std::vector<int64_t > weightTransposedShape = {tensor->ne [1 ], tensor->ne [0 ]};
1174- void *weightDeviceAddr = nullptr ;
11751171 void *weightTransposedDeviceAddr = nullptr ;
1176- aclTensor *weight = nullptr ;
11771172 aclTensor *weightTransposed = nullptr ;
1178- CreateAclTensorWeight (data, weightShape, &weightDeviceAddr, ggml_cann_type_mapping (tensor->type ), &weight);
11791173 CreateAclTensorWeight (data, weightTransposedShape, &weightTransposedDeviceAddr,
11801174 ggml_cann_type_mapping (tensor->type ), &weightTransposed);
11811175
@@ -1196,13 +1190,8 @@ static void weight_format_to_nz(ggml_tensor *tensor, const void *data, size_t of
11961190
11971191 aclrtMemcpy ((char *)tensor->data + offset, size,
11981192 weightTransposedDeviceAddr, size, ACL_MEMCPY_HOST_TO_DEVICE);
1199- ACL_CHECK (aclDestroyTensor (weight));
12001193 ACL_CHECK (aclDestroyTensor (weightTransposed));
1201- aclrtFree (weightDeviceAddr);
12021194 aclrtFree (weightTransposedDeviceAddr);
1203- if (workspaceSize > 0 ) {
1204- aclrtFree (workspaceAddr);
1205- }
12061195}
12071196
12081197// TODO: need handle tensor which has paddings.
@@ -1246,9 +1235,6 @@ static void ggml_backend_cann_buffer_set_tensor(
12461235 ACL_CHECK (aclrtMemcpy ((char *)tensor->data + offset, size,
12471236 transform_buffer, size,
12481237 ACL_MEMCPY_HOST_TO_DEVICE));
1249- if (weightToNZ && is_matmul_weight ((const ggml_tensor*)tensor)) {
1250- weight_format_to_nz (tensor, transform_buffer, offset);
1251- }
12521238 free (transform_buffer);
12531239 }
12541240}
0 commit comments