-
Notifications
You must be signed in to change notification settings - Fork 22
Expand file tree
/
Copy pathIP.h
More file actions
40 lines (29 loc) · 1.83 KB
/
IP.h
File metadata and controls
40 lines (29 loc) · 1.83 KB
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
/*
* Copyright (c) 2006-Present, Redis Ltd.
* All rights reserved.
*
* Licensed under your choice of (a) the Redis Source Available License 2.0
* (RSALv2); or (b) the Server Side Public License v1 (SSPLv1); or (c) the
* GNU Affero General Public License v3 (AGPLv3).
*/
#pragma once
#include <cstdlib>
// Inner-product function for a mixed pair of vectors.
// pVect1v: vector of type fp32.
// pVect2v: vector of type uint8.
// dimension: presumably the number of elements in each vector - TODO confirm in the definition.
// NOTE(review): this declaration does not show whether the returned float is the raw
// inner product or a distance derived from it; check the implementation.
float SQ8_InnerProduct(const void *pVect1v, const void *pVect2v, size_t dimension);
// Cosine function for a mixed pair of vectors.
// pVect1v: vector of type fp32.
// pVect2v: vector of type uint8.
// dimension: presumably the number of elements in each vector - TODO confirm in the definition.
// NOTE(review): whether the inputs must already be normalized, and whether the result is a
// similarity or a distance, is not visible from this declaration; check the implementation.
float SQ8_Cosine(const void *pVect1v, const void *pVect2v, size_t dimension);
// SQ8-to-SQ8 inner product: both vectors are uint8 quantized, each with a precomputed sum.
// Vector layout: [uint8_t values (dim)] [min_val (float)] [delta (float)] [sum (float)]
// Both pVect1v and pVect2v are expected to point at buffers in the layout above.
// dimension: presumably the `dim` of the layout, i.e. the count of uint8_t values and not
// the total buffer size - TODO confirm in the definition.
// NOTE(review): this declaration does not show whether the returned float is the raw
// inner product or a distance derived from it; check the implementation.
float SQ8_SQ8_InnerProduct(const void *pVect1v, const void *pVect2v, size_t dimension);
// SQ8-to-SQ8 cosine: both vectors are uint8 quantized and normalized, each with a
// precomputed sum.
// Vector layout: [uint8_t values (dim)] [min_val (float)] [delta (float)] [sum (float)]
// Both pVect1v and pVect2v are expected to point at buffers in the layout above.
// dimension: presumably the `dim` of the layout, i.e. the count of uint8_t values and not
// the total buffer size - TODO confirm in the definition.
// NOTE(review): whether the result is a similarity or a distance is not visible from this
// declaration; check the implementation.
float SQ8_SQ8_Cosine(const void *pVect1v, const void *pVect2v, size_t dimension);
// Inner-product function returning float. Going by the name, both vectors hold fp32
// elements; the parameters are untyped (const void *), so the caller must guarantee this.
// dimension: presumably the number of elements in each vector - TODO confirm in the definition.
// NOTE(review): raw inner product vs. derived distance is not visible here; check the definition.
float FP32_InnerProduct(const void *pVect1, const void *pVect2, size_t dimension);
// Inner-product function returning double (the only declaration in this group that does
// not return float). Going by the name, both vectors hold fp64 elements; the parameters are
// untyped (const void *), so the caller must guarantee this.
// dimension: presumably the number of elements in each vector - TODO confirm in the definition.
// NOTE(review): raw inner product vs. derived distance is not visible here; check the definition.
double FP64_InnerProduct(const void *pVect1, const void *pVect2, size_t dimension);
// Inner-product function returning float. Going by the name, both vectors hold fp16
// elements; the parameters are untyped (const void *), so the caller must guarantee this.
// dimension: presumably the number of elements in each vector - TODO confirm in the definition.
// NOTE(review): raw inner product vs. derived distance is not visible here; check the definition.
float FP16_InnerProduct(const void *pVect1, const void *pVect2, size_t dimension);
// Inner-product function returning float; little-endian variant for bf16 vectors (per the name).
// NOTE(review): presumably chosen when the bf16 data / host is little-endian - confirm how
// callers select between this and the BigEndian variant.
// dimension: presumably the number of elements in each vector - TODO confirm in the definition.
// NOTE(review): raw inner product vs. derived distance is not visible here; check the definition.
float BF16_InnerProduct_LittleEndian(const void *pVect1v, const void *pVect2v, size_t dimension);
// Inner-product function returning float; big-endian variant for bf16 vectors (per the name).
// NOTE(review): presumably chosen when the bf16 data / host is big-endian - confirm how
// callers select between this and the LittleEndian variant.
// dimension: presumably the number of elements in each vector - TODO confirm in the definition.
// NOTE(review): raw inner product vs. derived distance is not visible here; check the definition.
float BF16_InnerProduct_BigEndian(const void *pVect1v, const void *pVect2v, size_t dimension);
// Inner-product function returning float. Going by the name, both vectors hold int8
// elements; the parameters are untyped (const void *), so the caller must guarantee this.
// dimension: presumably the number of elements in each vector - TODO confirm in the definition.
// NOTE(review): raw inner product vs. derived distance is not visible here; check the definition.
float INT8_InnerProduct(const void *pVect1, const void *pVect2, size_t dimension);
// Cosine function returning float. Going by the name, both vectors hold int8 elements;
// the parameters are untyped (const void *), so the caller must guarantee this.
// dimension: presumably the number of elements in each vector - TODO confirm in the definition.
// NOTE(review): where the vector norms come from (computed here or stored alongside the
// data) and whether the result is a similarity or a distance is not visible from this
// declaration; check the definition.
float INT8_Cosine(const void *pVect1, const void *pVect2, size_t dimension);
// Inner-product function returning float. Going by the name, both vectors hold uint8
// elements; the parameters are untyped (const void *), so the caller must guarantee this.
// dimension: presumably the number of elements in each vector - TODO confirm in the definition.
// NOTE(review): raw inner product vs. derived distance is not visible here; check the definition.
float UINT8_InnerProduct(const void *pVect1, const void *pVect2, size_t dimension);
// Cosine function returning float. Going by the name, both vectors hold uint8 elements;
// the parameters are untyped (const void *), so the caller must guarantee this.
// dimension: presumably the number of elements in each vector - TODO confirm in the definition.
// NOTE(review): where the vector norms come from (computed here or stored alongside the
// data) and whether the result is a similarity or a distance is not visible from this
// declaration; check the definition.
float UINT8_Cosine(const void *pVect1, const void *pVect2, size_t dimension);