Skip to content
Open
Show file tree
Hide file tree
Changes from all commits
Commits
File filter

Filter by extension

Filter by extension

Conversations
Failed to load comments.
Loading
Jump to
Jump to file
Failed to load files.
Loading
Diff view
Diff view
118 changes: 118 additions & 0 deletions pkg/dataobj/metastore/iter.go
Original file line number Diff line number Diff line change
Expand Up @@ -12,6 +12,7 @@ import (
"github.com/grafana/dskit/user"

"github.com/grafana/loki/v3/pkg/dataobj"
"github.com/grafana/loki/v3/pkg/dataobj/sections/indexpointers"
"github.com/grafana/loki/v3/pkg/dataobj/sections/pointers"
)

Expand Down Expand Up @@ -332,6 +333,123 @@ func forEachMatchedPointerSectionKey(
return nil
}

// forEachIndexPointer calls f once for every index pointer row read from the
// index-pointer sections of object that belong to the tenant found in ctx.
//
// Rows are filtered by the reader using the predicate built by
// indexpointers.WhereTimeRangeOverlapsWith from the section's min/max
// timestamp columns and the sStart/sEnd scalars.
//
// It returns an error when the tenant cannot be extracted from ctx, a section
// cannot be opened, a section lacks one of the path/min-timestamp/max-timestamp
// columns, reading fails with anything other than io.EOF, or a record column
// does not have the expected Arrow array type.
func forEachIndexPointer(
	ctx context.Context,
	object *dataobj.Object,
	sStart, sEnd *scalar.Timestamp,
	f func(pointer indexpointers.IndexPointer),
) error {
	targetTenant, err := user.ExtractOrgID(ctx)
	if err != nil {
		return fmt.Errorf("extracting org ID: %w", err)
	}
	var reader indexpointers.Reader
	defer reader.Close()

	const batchSize = 1024
	buf := make([]indexpointers.IndexPointer, batchSize)

	// Iterate over the sections and fill buf column by column. Once a batch has
	// been decoded, invoke f on every row that was read (numRows is not always
	// the same as len(buf)).
	for _, section := range object.Sections().Filter(indexpointers.CheckSection) {
		if section.Tenant != targetTenant {
			continue
		}

		sec, err := indexpointers.Open(ctx, section)
		if err != nil {
			return fmt.Errorf("opening section: %w", err)
		}

		// Fetch the column list once per section; it is used for the lookup
		// below, for the reader options and for decoding every batch.
		columns := sec.Columns()

		var colPath, colMinTimestamp, colMaxTimestamp *indexpointers.Column
		for _, c := range columns {
			switch c.Type {
			case indexpointers.ColumnTypePath:
				colPath = c
			case indexpointers.ColumnTypeMinTimestamp:
				colMinTimestamp = c
			case indexpointers.ColumnTypeMaxTimestamp:
				colMaxTimestamp = c
			}
			if colPath != nil && colMinTimestamp != nil && colMaxTimestamp != nil {
				break
			}
		}

		if colPath == nil || colMinTimestamp == nil || colMaxTimestamp == nil {
			return fmt.Errorf("one of the mandatory columns is missing: (path=%t, minTimestamp=%t, maxTimestamp=%t)", colPath == nil, colMinTimestamp == nil, colMaxTimestamp == nil)
		}

		reader.Reset(indexpointers.ReaderOptions{
			Columns: columns,
			Predicates: []indexpointers.Predicate{
				indexpointers.WhereTimeRangeOverlapsWith(colMinTimestamp, colMaxTimestamp, sStart, sEnd),
			},
		})

		for {
			rec, readErr := reader.Read(ctx, batchSize)
			if readErr != nil && !errors.Is(readErr, io.EOF) {
				return fmt.Errorf("reading recordBatch: %w", readErr)
			}
			numRows := int(rec.NumRows())
			if numRows == 0 && errors.Is(readErr, io.EOF) {
				break
			}

			numCols := int(rec.NumCols())
			if numCols > len(columns) {
				// Record columns are mapped to section columns by position, so
				// extra record columns cannot be interpreted.
				return fmt.Errorf("record has %d columns but section has only %d", numCols, len(columns))
			}

			// buf is shared across batches and sections. Null cells are skipped
			// while decoding, so without resetting the rows first a null cell
			// would expose the value left behind by an earlier batch.
			if numRows > len(buf) {
				buf = make([]indexpointers.IndexPointer, numRows)
			} else {
				clear(buf[:numRows])
			}

			for colIdx := range numCols {
				col := rec.Column(colIdx)

				switch columns[colIdx].Type {
				case indexpointers.ColumnTypePath:
					values, ok := col.(*array.String)
					if !ok {
						return fmt.Errorf("unexpected array type %T for path column", col)
					}
					for rIdx := range numRows {
						if values.IsNull(rIdx) {
							continue
						}
						buf[rIdx].Path = values.Value(rIdx)
					}
				case indexpointers.ColumnTypeMinTimestamp:
					values, ok := col.(*array.Timestamp)
					if !ok {
						return fmt.Errorf("unexpected array type %T for min timestamp column", col)
					}
					for rIdx := range numRows {
						if values.IsNull(rIdx) {
							continue
						}
						// The raw timestamp value is used as nanoseconds since
						// the Unix epoch.
						buf[rIdx].StartTs = time.Unix(0, int64(values.Value(rIdx)))
					}
				case indexpointers.ColumnTypeMaxTimestamp:
					values, ok := col.(*array.Timestamp)
					if !ok {
						return fmt.Errorf("unexpected array type %T for max timestamp column", col)
					}
					for rIdx := range numRows {
						if values.IsNull(rIdx) {
							continue
						}
						buf[rIdx].EndTs = time.Unix(0, int64(values.Value(rIdx)))
					}
				default:
					// Columns of other types carry nothing IndexPointer needs.
					continue
				}
			}

			for rowIdx := range numRows {
				f(buf[rowIdx])
			}

			// A final batch may arrive together with io.EOF; it has been
			// delivered above, so stop reading this section.
			if errors.Is(readErr, io.EOF) {
				break
			}
		}
	}

	return nil
}

func findPointersColumnsByTypes(allColumns []*pointers.Column, columnTypes ...pointers.ColumnType) ([]*pointers.Column, error) {
result := make([]*pointers.Column, 0, len(columnTypes))

Expand Down
58 changes: 6 additions & 52 deletions pkg/dataobj/metastore/object.go
Original file line number Diff line number Diff line change
Expand Up @@ -401,10 +401,13 @@ func (m *ObjectMetastore) listObjectsFromTables(ctx context.Context, tablePaths
objects := make([][]string, len(tablePaths))
g, ctx := errgroup.WithContext(ctx)

sStart := scalar.NewTimestampScalar(arrow.Timestamp(start.UnixNano()), arrow.FixedWidthTypes.Timestamp_ns)
sEnd := scalar.NewTimestampScalar(arrow.Timestamp(end.UnixNano()), arrow.FixedWidthTypes.Timestamp_ns)

for i, path := range tablePaths {
g.Go(func() error {
var err error
objects[i], err = m.listObjects(ctx, path, start, end)
objects[i], err = m.listObjects(ctx, path, sStart, sEnd)
// If the metastore object is not found, it means it's outside of any existing window
// and we can safely ignore it.
if err != nil && !m.bucket.IsObjNotFoundErr(err) {
Expand Down Expand Up @@ -627,7 +630,7 @@ func addLabels(mtx *sync.Mutex, streams map[uint64][]*labels.Labels, newLabels *
streams[key] = append(streams[key], newLabels)
}

func (m *ObjectMetastore) listObjects(ctx context.Context, path string, start, end time.Time) ([]string, error) {
func (m *ObjectMetastore) listObjects(ctx context.Context, path string, sStart, sEnd *scalar.Timestamp) ([]string, error) {
var buf bytes.Buffer
objectReader, err := m.bucket.Get(ctx, path)
if err != nil {
Expand All @@ -645,12 +648,7 @@ func (m *ObjectMetastore) listObjects(ctx context.Context, path string, start, e
}
var objectPaths []string

// Read all relevant entries from the table of contents
predicate := indexpointers.TimeRangeRowPredicate{
Start: start.UTC(),
End: end.UTC(),
}
err = forEachIndexPointer(ctx, object, predicate, func(indexPointer indexpointers.IndexPointer) {
err = forEachIndexPointer(ctx, object, sStart, sEnd, func(indexPointer indexpointers.IndexPointer) {
objectPaths = append(objectPaths, indexPointer.Path)
})
if err != nil {
Expand All @@ -660,50 +658,6 @@ func (m *ObjectMetastore) listObjects(ctx context.Context, path string, start, e
return objectPaths, nil
}

// forEachIndexPointer walks every index-pointer section of object that belongs
// to the tenant found in ctx and hands each row read from it to f.
//
// When predicate is non-nil it is installed on the row reader before reading.
// Errors from tenant extraction and section opening are wrapped; errors from
// setting the predicate or reading (other than io.EOF) are returned as-is.
func forEachIndexPointer(ctx context.Context, object *dataobj.Object, predicate indexpointers.RowPredicate, f func(indexpointers.IndexPointer)) error {
	tenantID, err := user.ExtractOrgID(ctx)
	if err != nil {
		return fmt.Errorf("extracting org ID: %w", err)
	}

	var rowReader indexpointers.RowReader
	defer rowReader.Close()

	// Scratch space reused for every Read call.
	batch := make([]indexpointers.IndexPointer, 1024)

	for _, candidate := range object.Sections().Filter(indexpointers.CheckSection) {
		if candidate.Tenant != tenantID {
			continue
		}

		opened, openErr := indexpointers.Open(ctx, candidate)
		if openErr != nil {
			return fmt.Errorf("opening section: %w", openErr)
		}

		rowReader.Reset(opened)
		if predicate != nil {
			if predErr := rowReader.SetPredicate(predicate); predErr != nil {
				return predErr
			}
		}

		// Keep reading until the reader reports io.EOF with no rows.
		for drained := false; !drained; {
			n, readErr := rowReader.Read(ctx, batch)
			atEOF := errors.Is(readErr, io.EOF)

			switch {
			case readErr != nil && !atEOF:
				return readErr
			case n == 0 && atEOF:
				drained = true
			default:
				for i := 0; i < n; i++ {
					f(batch[i])
				}
			}
		}
	}

	return nil
}

func forEachStream(ctx context.Context, object *dataobj.Object, predicate streams.RowPredicate, f func(streams.Stream)) error {
targetTenant, err := user.ExtractOrgID(ctx)
if err != nil {
Expand Down
11 changes: 6 additions & 5 deletions pkg/dataobj/sections/indexpointers/builder_test.go
Original file line number Diff line number Diff line change
@@ -1,4 +1,4 @@
package indexpointers
package indexpointers_test

import (
"context"
Expand All @@ -8,6 +8,7 @@ import (
"github.com/stretchr/testify/require"

"github.com/grafana/loki/v3/pkg/dataobj"
"github.com/grafana/loki/v3/pkg/dataobj/sections/indexpointers"
)

func TestBuilder(t *testing.T) {
Expand All @@ -22,7 +23,7 @@ func TestBuilder(t *testing.T) {
{path: "bar", start: unixTime(10), end: unixTime(20)},
}

ib := NewBuilder(nil, 1024, 0)
ib := indexpointers.NewBuilder(nil, 1024, 0)
for _, p := range pp {
ib.Append(p.path, p.start, p.end)
}
Expand All @@ -34,7 +35,7 @@ func TestBuilder(t *testing.T) {
require.NoError(t, err)
defer closer.Close()

expect := []IndexPointer{
expect := []indexpointers.IndexPointer{
{
Path: "foo",
StartTs: unixTime(10),
Expand All @@ -47,8 +48,8 @@ func TestBuilder(t *testing.T) {
},
}

var actual []IndexPointer
for result := range Iter(context.Background(), obj) {
var actual []indexpointers.IndexPointer
for result := range indexpointers.Iter(context.Background(), obj) {
pointer, err := result.Value()
require.NoError(t, err)
actual = append(actual, pointer)
Expand Down
Loading
Loading