-
Notifications
You must be signed in to change notification settings - Fork 1
Expand file tree
/
Copy pathembedding.go
More file actions
67 lines (56 loc) · 1.17 KB
/
embedding.go
File metadata and controls
67 lines (56 loc) · 1.17 KB
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
package golsh
import (
"bytes"
"fmt"
"math/rand"
)
type random interface {
draw() float32
}
type gauss struct{}
func (g *gauss) draw() float32 {
return float32(rand.NormFloat64())
}
type embedding struct {
normals [][]float32
}
func newEmbedding(d int, size int, r random) embedding {
normals := make([][]float32, d, d)
for i := 0; i < d; i++ {
normals[i] = normal(size, r)
}
return embedding{normals}
}
func normal(size int, r random) []float32 {
result := make([]float32, size, size)
for i := 0; i < size; i++ {
result[i] = r.draw()
}
return result
}
// returns an embedding of size d
func (e *embedding) embed(id int, vector []float32) string {
result := make([]bool, len(e.normals), len(e.normals))
for i, normal := range e.normals {
result[i] = dimension(vector, normal)
}
return fmt.Sprintf("%d-%s", id, bitToString(result))
}
func dimension(vecA []float32, vecB []float32) bool {
dot := dot(vecA, vecB)
if dot > 0 {
return true
}
return false
}
func bitToString(bits []bool) string {
var buffer bytes.Buffer
for _, bit := range bits {
if bit {
buffer.WriteString("1")
} else {
buffer.WriteString("0")
}
}
return buffer.String()
}