Skip to content

Commit ae3d392

Browse files
committed
Protect DB against parallel reloads
Signed-off-by: ArthurSens <[email protected]>
1 parent 9e0351e commit ae3d392

File tree

2 files changed

+62
-4
lines changed

2 files changed

+62
-4
lines changed

tsdb/db.go

+11-3
Original file line numberDiff line numberDiff line change
@@ -979,6 +979,12 @@ func (db *DB) reloadBlocks() (err error) {
979979
db.metrics.reloads.Inc()
980980
}()
981981

982+
// Now that we reload TSDB every minute, there is high chance for race condition with a reload
983+
// triggered by CleanTombstones(). We need to lock the reload to avoid the situation where
984+
// a normal reload and CleanTombstones try to delete the same block.
985+
db.mtx.Lock()
986+
defer db.mtx.Unlock()
987+
982988
loadable, corrupted, err := openBlocks(db.logger, db.dir, db.blocks, db.chunkPool)
983989
if err != nil {
984990
return err
@@ -1044,10 +1050,8 @@ func (db *DB) reloadBlocks() (err error) {
10441050
}
10451051

10461052
// Swap new blocks first for subsequently created readers to be seen.
1047-
db.mtx.Lock()
10481053
oldBlocks := db.blocks
10491054
db.blocks = toLoad
1050-
db.mtx.Unlock()
10511055

10521056
blockMetas := make([]BlockMeta, 0, len(toLoad))
10531057
for _, b := range toLoad {
@@ -1554,7 +1558,11 @@ func (db *DB) CleanTombstones() (err error) {
15541558

15551559
// In case tombstones of the old block covers the whole block,
15561560
// then there would be no resultant block to tell the parent.
1561+
// The lock protects against race conditions when deleting blocks
1562+
// during an already running reload.
1563+
db.mtx.Lock()
15571564
pb.meta.Compaction.Deletable = safeToDelete
1565+
db.mtx.Unlock()
15581566
cleanUpCompleted = false
15591567
if err = db.reloadBlocks(); err == nil { // Will try to delete old block.
15601568
// Successful reload will change the existing blocks.
@@ -1563,7 +1571,7 @@ func (db *DB) CleanTombstones() (err error) {
15631571
}
15641572

15651573
// Delete new block if it was created.
1566-
if uid != nil {
1574+
if uid != nil && *uid != (ulid.ULID{}) {
15671575
dir := filepath.Join(db.Dir(), uid.String())
15681576
if err := os.RemoveAll(dir); err != nil {
15691577
level.Error(db.logger).Log("msg", "failed to delete block after failed `CleanTombstones`", "dir", dir, "err", err)

tsdb/db_test.go

+51-1
Original file line numberDiff line numberDiff line change
@@ -1185,14 +1185,64 @@ func TestTombstoneCleanFail(t *testing.T) {
11851185
// The compactor should trigger a failure here.
11861186
require.Error(t, db.CleanTombstones())
11871187

1188-
// Now check that the CleanTombstones replaced the old block even after a failure.
1188+
// Now check that the cleanTombstones replaced the old block even after a failure.
11891189
actualBlockDirs, err := blockDirs(db.dir)
11901190
require.NoError(t, err)
11911191
// Only one block should have been replaced by a new block.
11921192
require.Equal(t, len(oldBlockDirs), len(actualBlockDirs))
11931193
require.Equal(t, len(intersection(oldBlockDirs, actualBlockDirs)), len(actualBlockDirs)-1)
11941194
}
11951195

1196+
// TestTombstoneCleanRetentionLimitsRace tests that a CleanTombstones operation
1197+
// and retention limit policies, when triggered at the same time,
1198+
// won't race against each other.
1199+
func TestTombstoneCleanRetentionLimitsRace(t *testing.T) {
1200+
opts := DefaultOptions()
1201+
var wg sync.WaitGroup
1202+
1203+
// We want to make sure that a race doesn't happen when a normal reload and a CleanTombstones()
1204+
// reload try to delete the same block. Without the correct lock placement, it can happen if a
1205+
// block is marked for deletion due to retention limits and also has tombstones to be cleaned at
1206+
// the same time.
1207+
//
1208+
// That is something tricky to trigger, so let's try several times just to make sure.
1209+
for i := 0; i < 20; i++ {
1210+
db := openTestDB(t, opts, nil)
1211+
totalBlocks := 20
1212+
dbDir := db.Dir()
1213+
// Generate some blocks with old mint (near epoch).
1214+
for j := 0; j < totalBlocks; j++ {
1215+
blockDir := createBlock(t, dbDir, genSeries(10, 1, int64(j), int64(j)+1))
1216+
block, err := OpenBlock(nil, blockDir, nil)
1217+
require.NoError(t, err)
1218+
// Cover block with tombstones so it can be deleted with CleanTombstones() as well.
1219+
tomb := tombstones.NewMemTombstones()
1220+
tomb.AddInterval(0, tombstones.Interval{Mint: int64(j), Maxt: int64(j) + 1})
1221+
block.tombstones = tomb
1222+
1223+
db.blocks = append(db.blocks, block)
1224+
}
1225+
1226+
wg.Add(2)
1227+
// Run reload and cleanTombstones together, with a small time window randomization
1228+
go func() {
1229+
defer wg.Done()
1230+
time.Sleep(time.Duration(rand.Float64() * 100 * float64(time.Millisecond)))
1231+
require.NoError(t, db.reloadBlocks())
1232+
}()
1233+
go func() {
1234+
defer wg.Done()
1235+
time.Sleep(time.Duration(rand.Float64() * 100 * float64(time.Millisecond)))
1236+
require.NoError(t, db.CleanTombstones())
1237+
}()
1238+
1239+
wg.Wait()
1240+
1241+
require.NoError(t, db.Close())
1242+
}
1243+
1244+
}
1245+
11961246
func intersection(oldBlocks, actualBlocks []string) (intersection []string) {
11971247
hash := make(map[string]bool)
11981248
for _, e := range oldBlocks {

0 commit comments

Comments
 (0)