Skip to content

Commit 1244ab6

Browse files
committed
Fix bug when do LFS GC
1 parent a16ca3c commit 1244ab6

File tree

4 files changed

+99
-22
lines changed

4 files changed

+99
-22
lines changed

models/git/lfs.go

Lines changed: 9 additions & 18 deletions
Original file line numberDiff line numberDiff line change
@@ -312,23 +312,20 @@ func IterateRepositoryIDsWithLFSMetaObjects(ctx context.Context, f func(ctx cont
312312

313313
// IterateLFSMetaObjectsForRepoOptions provides options for IterateLFSMetaObjectsForRepo
314314
type IterateLFSMetaObjectsForRepoOptions struct {
315-
OlderThan timeutil.TimeStamp
316-
UpdatedLessRecentlyThan timeutil.TimeStamp
317-
OrderByUpdated bool
318-
LoopFunctionAlwaysUpdates bool
315+
OlderThan timeutil.TimeStamp
316+
UpdatedLessRecentlyThan timeutil.TimeStamp
319317
}
320318

321319
// IterateLFSMetaObjectsForRepo provides a iterator for LFSMetaObjects per Repo
322320
func IterateLFSMetaObjectsForRepo(ctx context.Context, repoID int64, f func(context.Context, *LFSMetaObject, int64) error, opts *IterateLFSMetaObjectsForRepoOptions) error {
323-
var start int
324321
batchSize := setting.Database.IterateBufferSize
325322
engine := db.GetEngine(ctx)
326323
type CountLFSMetaObject struct {
327324
Count int64
328325
LFSMetaObject `xorm:"extends"`
329326
}
330327

331-
id := int64(0)
328+
lastID := int64(0)
332329

333330
for {
334331
beans := make([]*CountLFSMetaObject, 0, batchSize)
@@ -341,29 +338,23 @@ func IterateLFSMetaObjectsForRepo(ctx context.Context, repoID int64, f func(cont
341338
if !opts.UpdatedLessRecentlyThan.IsZero() {
342339
sess.And("`lfs_meta_object`.updated_unix < ?", opts.UpdatedLessRecentlyThan)
343340
}
344-
sess.GroupBy("`lfs_meta_object`.id")
345-
if opts.OrderByUpdated {
346-
sess.OrderBy("`lfs_meta_object`.updated_unix ASC")
347-
} else {
348-
sess.And("`lfs_meta_object`.id > ?", id)
349-
sess.OrderBy("`lfs_meta_object`.id ASC")
350-
}
351-
if err := sess.Limit(batchSize, start).Find(&beans); err != nil {
341+
sess.GroupBy("`lfs_meta_object`.id").
342+
And("`lfs_meta_object`.id > ?", lastID).
343+
OrderBy("`lfs_meta_object`.id ASC")
344+
345+
if err := sess.Limit(batchSize).Find(&beans); err != nil {
352346
return err
353347
}
354348
if len(beans) == 0 {
355349
return nil
356350
}
357-
if !opts.LoopFunctionAlwaysUpdates {
358-
start += len(beans)
359-
}
360351

361352
for _, bean := range beans {
362353
if err := f(ctx, &bean.LFSMetaObject, bean.Count); err != nil {
363354
return err
364355
}
365356
}
366-
id = beans[len(beans)-1].ID
357+
lastID = beans[len(beans)-1].ID
367358
}
368359
}
369360

models/git/lfs_test.go

Lines changed: 61 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,61 @@
1+
// Copyright 2024 The Gitea Authors. All rights reserved.
2+
// SPDX-License-Identifier: MIT
3+
4+
package git_test
5+
6+
import (
7+
"bytes"
8+
"context"
9+
"strconv"
10+
"testing"
11+
"time"
12+
13+
"code.gitea.io/gitea/models/db"
14+
git_model "code.gitea.io/gitea/models/git"
15+
repo_model "code.gitea.io/gitea/models/repo"
16+
"code.gitea.io/gitea/models/unittest"
17+
"code.gitea.io/gitea/modules/lfs"
18+
"code.gitea.io/gitea/modules/setting"
19+
"code.gitea.io/gitea/modules/test"
20+
"code.gitea.io/gitea/modules/timeutil"
21+
22+
"github.com/stretchr/testify/assert"
23+
)
24+
25+
func TestIterateLFSMetaObjectsForRepoUpdatesDoNotSkip(t *testing.T) {
26+
unittest.PrepareTestEnv(t)
27+
28+
ctx := t.Context()
29+
repo, err := repo_model.GetRepositoryByOwnerAndName(ctx, "user2", "repo1")
30+
assert.NoError(t, err)
31+
32+
test.MockVariableValue(&setting.Database.IterateBufferSize, 1)
33+
34+
created := make([]*git_model.LFSMetaObject, 0, 3)
35+
for i := 0; i < 3; i++ {
36+
content := []byte("gitea-lfs-" + strconv.Itoa(i))
37+
pointer, err := lfs.GeneratePointer(bytes.NewReader(content))
38+
assert.NoError(t, err)
39+
40+
meta, err := git_model.NewLFSMetaObject(ctx, repo.ID, pointer)
41+
assert.NoError(t, err)
42+
created = append(created, meta)
43+
}
44+
45+
iterated := make([]int64, 0, len(created))
46+
cutoff := time.Now().Add(24 * time.Hour)
47+
iterErr := git_model.IterateLFSMetaObjectsForRepo(ctx, repo.ID, func(ctx context.Context, meta *git_model.LFSMetaObject, count int64) error {
48+
iterated = append(iterated, meta.ID)
49+
_, err := db.GetEngine(ctx).ID(meta.ID).Cols("updated_unix").Update(&git_model.LFSMetaObject{
50+
UpdatedUnix: timeutil.TimeStamp(time.Now().Unix()),
51+
})
52+
return err
53+
}, &git_model.IterateLFSMetaObjectsForRepoOptions{
54+
OlderThan: timeutil.TimeStamp(cutoff.Unix()),
55+
UpdatedLessRecentlyThan: timeutil.TimeStamp(cutoff.Unix()),
56+
})
57+
assert.NoError(t, iterErr)
58+
59+
expected := []int64{created[0].ID, created[1].ID, created[2].ID}
60+
assert.Equal(t, expected, iterated)
61+
}

services/repository/lfs.go

Lines changed: 2 additions & 4 deletions
Original file line numberDiff line numberDiff line change
@@ -123,10 +123,8 @@ func GarbageCollectLFSMetaObjectsForRepo(ctx context.Context, repo *repo_model.R
123123
//
124124
// It is likely that a week is potentially excessive but it should definitely be enough that any
125125
// unassociated LFS object is genuinely unassociated.
126-
OlderThan: timeutil.TimeStamp(opts.OlderThan.Unix()),
127-
UpdatedLessRecentlyThan: timeutil.TimeStamp(opts.UpdatedLessRecentlyThan.Unix()),
128-
OrderByUpdated: true,
129-
LoopFunctionAlwaysUpdates: true,
126+
OlderThan: timeutil.TimeStamp(opts.OlderThan.Unix()),
127+
UpdatedLessRecentlyThan: timeutil.TimeStamp(opts.UpdatedLessRecentlyThan.Unix()),
130128
})
131129

132130
if err == errStop {

services/repository/lfs_test.go

Lines changed: 27 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -14,6 +14,7 @@ import (
1414
"code.gitea.io/gitea/modules/lfs"
1515
"code.gitea.io/gitea/modules/setting"
1616
"code.gitea.io/gitea/modules/storage"
17+
"code.gitea.io/gitea/modules/test"
1718
repo_service "code.gitea.io/gitea/services/repository"
1819

1920
"github.com/stretchr/testify/assert"
@@ -46,6 +47,32 @@ func TestGarbageCollectLFSMetaObjects(t *testing.T) {
4647
assert.ErrorIs(t, err, git_model.ErrLFSObjectNotExist)
4748
}
4849

50+
func TestGarbageCollectLFSMetaObjectsForRepoAutoFix(t *testing.T) {
51+
unittest.PrepareTestEnv(t)
52+
53+
test.MockVariableValue(&setting.LFS.StartServer, true)
54+
55+
err := storage.Init()
56+
assert.NoError(t, err)
57+
58+
repo := unittest.AssertExistsAndLoadBean(t, &repo_model.Repository{ID: 1})
59+
60+
// add lfs object
61+
lfsContent := []byte("gitea2")
62+
lfsOid := storeObjectInRepo(t, repo.ID, &lfsContent)
63+
64+
err = repo_service.GarbageCollectLFSMetaObjectsForRepo(t.Context(), repo, repo_service.GarbageCollectLFSMetaObjectsOptions{
65+
LogDetail: func(string, ...any) {},
66+
AutoFix: true,
67+
OlderThan: time.Now().Add(24 * time.Hour * 7),
68+
UpdatedLessRecentlyThan: time.Now().Add(24 * time.Hour * 3),
69+
})
70+
assert.NoError(t, err)
71+
72+
_, err = git_model.GetLFSMetaObjectByOid(t.Context(), repo.ID, lfsOid)
73+
assert.Equal(t, git_model.ErrLFSObjectNotExist, err)
74+
}
75+
4976
func storeObjectInRepo(t *testing.T, repositoryID int64, content *[]byte) string {
5077
pointer, err := lfs.GeneratePointer(bytes.NewReader(*content))
5178
assert.NoError(t, err)

0 commit comments

Comments
 (0)