2017-05-17 03:06:56 +00:00
|
|
|
package tsdb
|
|
|
|
|
|
|
|
import (
|
|
|
|
"encoding/binary"
|
2017-05-23 11:57:45 +00:00
|
|
|
"fmt"
|
|
|
|
"hash/crc32"
|
2017-05-17 03:06:56 +00:00
|
|
|
"io/ioutil"
|
|
|
|
"os"
|
|
|
|
"path/filepath"
|
|
|
|
)
|
|
|
|
|
|
|
|
const (
	// tombstoneFilename is the name of the tombstone file inside a directory.
	tombstoneFilename = "tombstones"

	// MagicTombstone is 4 bytes at the head of a tombstone file.
	MagicTombstone = 0x130BA30

	// tombstoneFormatV1 is the format version byte written directly after
	// the magic number.
	tombstoneFormatV1 = 1
)
|
|
|
|
|
2017-05-24 05:54:24 +00:00
|
|
|
func writeTombstoneFile(dir string, tr tombstoneReader) error {
|
2017-05-17 03:06:56 +00:00
|
|
|
path := filepath.Join(dir, tombstoneFilename)
|
|
|
|
tmp := path + ".tmp"
|
2017-05-23 11:57:45 +00:00
|
|
|
hash := crc32.New(crc32.MakeTable(crc32.Castagnoli))
|
2017-05-17 03:06:56 +00:00
|
|
|
|
|
|
|
f, err := os.Create(tmp)
|
|
|
|
if err != nil {
|
|
|
|
return err
|
|
|
|
}
|
|
|
|
|
|
|
|
stoneOff := make(map[uint32]int64) // The map that holds the ref to offset vals.
|
|
|
|
refs := []uint32{} // Sorted refs.
|
|
|
|
|
|
|
|
pos := int64(0)
|
|
|
|
buf := encbuf{b: make([]byte, 2*binary.MaxVarintLen64)}
|
2017-05-23 11:57:45 +00:00
|
|
|
buf.reset()
|
|
|
|
// Write the meta.
|
|
|
|
buf.putBE32(MagicTombstone)
|
|
|
|
buf.putByte(tombstoneFormatV1)
|
|
|
|
n, err := f.Write(buf.get())
|
|
|
|
if err != nil {
|
|
|
|
return err
|
|
|
|
}
|
|
|
|
pos += int64(n)
|
|
|
|
|
2017-05-24 05:54:24 +00:00
|
|
|
for k, v := range tr {
|
|
|
|
refs = append(refs, k)
|
|
|
|
stoneOff[k] = pos
|
2017-05-17 03:06:56 +00:00
|
|
|
|
|
|
|
// Write the ranges.
|
|
|
|
buf.reset()
|
2017-05-24 05:54:24 +00:00
|
|
|
buf.putUvarint(len(v))
|
2017-05-17 03:06:56 +00:00
|
|
|
n, err := f.Write(buf.get())
|
|
|
|
if err != nil {
|
|
|
|
return err
|
|
|
|
}
|
|
|
|
pos += int64(n)
|
|
|
|
|
2017-05-23 11:57:45 +00:00
|
|
|
buf.reset()
|
2017-05-24 05:54:24 +00:00
|
|
|
for _, r := range v {
|
2017-05-17 03:06:56 +00:00
|
|
|
buf.putVarint64(r.mint)
|
|
|
|
buf.putVarint64(r.maxt)
|
|
|
|
}
|
2017-05-23 11:57:45 +00:00
|
|
|
buf.putHash(hash)
|
|
|
|
|
|
|
|
n, err = f.Write(buf.get())
|
|
|
|
if err != nil {
|
|
|
|
return err
|
|
|
|
}
|
|
|
|
pos += int64(n)
|
2017-05-17 03:06:56 +00:00
|
|
|
}
|
|
|
|
|
|
|
|
// Write the offset table.
|
2017-05-23 11:57:45 +00:00
|
|
|
// Pad first.
|
|
|
|
if p := 4 - (int(pos) % 4); p != 0 {
|
|
|
|
if _, err := f.Write(make([]byte, p)); err != nil {
|
|
|
|
return err
|
|
|
|
}
|
|
|
|
|
|
|
|
pos += int64(p)
|
|
|
|
}
|
|
|
|
|
2017-05-17 03:06:56 +00:00
|
|
|
buf.reset()
|
|
|
|
buf.putBE32int(len(refs))
|
|
|
|
if _, err := f.Write(buf.get()); err != nil {
|
|
|
|
return err
|
|
|
|
}
|
|
|
|
|
|
|
|
for _, ref := range refs {
|
|
|
|
buf.reset()
|
|
|
|
buf.putBE32(ref)
|
|
|
|
buf.putBE64int64(stoneOff[ref])
|
|
|
|
_, err = f.Write(buf.get())
|
|
|
|
if err != nil {
|
|
|
|
return err
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
// Write the offset to the offset table.
|
|
|
|
buf.reset()
|
|
|
|
buf.putBE64int64(pos)
|
|
|
|
_, err = f.Write(buf.get())
|
|
|
|
if err != nil {
|
|
|
|
return err
|
|
|
|
}
|
|
|
|
|
|
|
|
if err := f.Close(); err != nil {
|
|
|
|
return err
|
|
|
|
}
|
|
|
|
|
|
|
|
return renameFile(tmp, path)
|
|
|
|
}
|
|
|
|
|
|
|
|
// stone holds the information on the posting and time-range
|
|
|
|
// that is deleted.
|
|
|
|
type stone struct {
|
2017-05-22 11:12:36 +00:00
|
|
|
ref uint32
|
|
|
|
intervals intervals
|
2017-05-17 03:06:56 +00:00
|
|
|
}
|
|
|
|
|
|
|
|
// TombstoneReader is the iterator over tombstones.
|
|
|
|
type TombstoneReader interface {
|
2017-05-24 05:54:24 +00:00
|
|
|
At(ref uint32) intervals
|
2017-05-17 03:06:56 +00:00
|
|
|
}
|
|
|
|
|
2017-05-24 05:54:24 +00:00
|
|
|
func readTombstones(dir string) (tombstoneReader, error) {
|
2017-05-17 03:06:56 +00:00
|
|
|
b, err := ioutil.ReadFile(filepath.Join(dir, tombstoneFilename))
|
|
|
|
if err != nil {
|
|
|
|
return nil, err
|
|
|
|
}
|
|
|
|
|
2017-05-23 11:57:45 +00:00
|
|
|
d := &decbuf{b: b}
|
|
|
|
if mg := d.be32(); mg != MagicTombstone {
|
|
|
|
return nil, fmt.Errorf("invalid magic number %x", mg)
|
|
|
|
}
|
|
|
|
|
2017-05-17 03:06:56 +00:00
|
|
|
offsetBytes := b[len(b)-8:]
|
2017-05-23 11:57:45 +00:00
|
|
|
d = &decbuf{b: offsetBytes}
|
2017-05-17 03:06:56 +00:00
|
|
|
off := d.be64int64()
|
|
|
|
if err := d.err(); err != nil {
|
|
|
|
return nil, err
|
|
|
|
}
|
|
|
|
|
|
|
|
d = &decbuf{b: b[off:]}
|
|
|
|
numStones := d.be32int()
|
|
|
|
if err := d.err(); err != nil {
|
|
|
|
return nil, err
|
|
|
|
}
|
2017-05-21 17:50:05 +00:00
|
|
|
off += 4 // For the numStones which has been read.
|
2017-05-17 03:06:56 +00:00
|
|
|
|
2017-05-24 05:54:24 +00:00
|
|
|
stones := b[off : off+int64(numStones*12)]
|
|
|
|
stonesMap := make(map[uint32]intervals)
|
|
|
|
for len(stones) >= 12 {
|
|
|
|
d := &decbuf{b: stones[:12]}
|
|
|
|
ref := d.be32()
|
|
|
|
off := d.be64int64()
|
2017-05-17 03:06:56 +00:00
|
|
|
|
2017-05-24 05:54:24 +00:00
|
|
|
d = &decbuf{b: b[off:]}
|
|
|
|
numRanges := d.uvarint()
|
2017-05-17 03:06:56 +00:00
|
|
|
if err := d.err(); err != nil {
|
2017-05-24 05:54:24 +00:00
|
|
|
return nil, err
|
2017-05-17 03:06:56 +00:00
|
|
|
}
|
|
|
|
|
2017-05-24 05:54:24 +00:00
|
|
|
dranges := make(intervals, 0, numRanges)
|
|
|
|
for i := 0; i < int(numRanges); i++ {
|
|
|
|
mint := d.varint64()
|
|
|
|
maxt := d.varint64()
|
|
|
|
if err := d.err(); err != nil {
|
|
|
|
return nil, err
|
|
|
|
}
|
2017-05-17 03:06:56 +00:00
|
|
|
|
2017-05-24 05:54:24 +00:00
|
|
|
dranges = append(dranges, interval{mint, maxt})
|
2017-05-17 03:06:56 +00:00
|
|
|
}
|
2017-05-22 05:01:50 +00:00
|
|
|
|
2017-05-24 05:54:24 +00:00
|
|
|
// TODO(gouthamve): Verify checksum.
|
|
|
|
stones = stones[12:]
|
|
|
|
stonesMap[ref] = dranges
|
2017-05-17 03:06:56 +00:00
|
|
|
}
|
|
|
|
|
2017-05-24 05:54:24 +00:00
|
|
|
return newTombstoneReader(stonesMap), nil
|
2017-05-17 03:06:56 +00:00
|
|
|
}
|
|
|
|
|
2017-05-24 05:54:24 +00:00
|
|
|
type tombstoneReader map[uint32]intervals
|
2017-05-17 09:19:42 +00:00
|
|
|
|
2017-05-24 05:54:24 +00:00
|
|
|
func newTombstoneReader(ts map[uint32]intervals) tombstoneReader {
|
|
|
|
return tombstoneReader(ts)
|
|
|
|
}
|
2017-05-17 09:19:42 +00:00
|
|
|
|
2017-05-24 05:54:24 +00:00
|
|
|
func newEmptyTombstoneReader() tombstoneReader {
|
|
|
|
return tombstoneReader(make(map[uint32]intervals))
|
2017-05-17 09:19:42 +00:00
|
|
|
}
|
|
|
|
|
2017-05-24 05:54:24 +00:00
|
|
|
func (t tombstoneReader) At(ref uint32) intervals {
|
|
|
|
return t[ref]
|
2017-05-17 03:06:56 +00:00
|
|
|
}
|
2017-05-17 09:19:42 +00:00
|
|
|
|
2017-05-22 11:12:36 +00:00
|
|
|
// interval is a closed time range [mint, maxt].
type interval struct {
	mint, maxt int64
}

// inBounds reports whether t lies within the interval, both ends included.
func (tr interval) inBounds(t int64) bool {
	return tr.mint <= t && t <= tr.maxt
}

// isSubrange reports whether the interval is fully contained in a single
// element of dranges.
func (tr interval) isSubrange(dranges intervals) bool {
	for i := range dranges {
		if dranges[i].inBounds(tr.mint) && dranges[i].inBounds(tr.maxt) {
			return true
		}
	}

	return false
}

// intervals is a list of intervals.
type intervals []interval

// add merges the new time range n into the existing ones and returns the
// resulting list. The existing ones must be sorted and must not overlap.
//
// Every existing interval that overlaps n, or that is directly adjacent to
// it (the ranges are closed, so a distance of one leaves no gap), is folded
// into a single interval. When intervals are merged or n is appended at the
// end, the backing array of the receiver is reused; when n is inserted in
// front of an existing interval, a new slice is allocated.
func (itvs intervals) add(n interval) intervals {
	// Skip the intervals that end before n starts with a real gap in
	// between. The first comparison guarantees maxt+1 cannot overflow.
	lo := 0
	for lo < len(itvs) && itvs[lo].maxt < n.mint && itvs[lo].maxt+1 < n.mint {
		lo++
	}

	// Absorb every following interval that overlaps or touches n.
	hi := lo
	for hi < len(itvs) {
		r := itvs[hi]
		// r starts after n ends with a real gap in between. The first
		// comparison guarantees mint-1 cannot overflow.
		if r.mint > n.maxt && r.mint-1 > n.maxt {
			break
		}
		if r.mint < n.mint {
			n.mint = r.mint
		}
		if r.maxt > n.maxt {
			n.maxt = r.maxt
		}
		hi++
	}

	if lo == hi {
		// Nothing to merge with: n goes in at position lo.
		if lo == len(itvs) {
			return append(itvs, n)
		}
		merged := make(intervals, 0, len(itvs)+1)
		merged = append(merged, itvs[:lo]...)
		merged = append(merged, n)
		return append(merged, itvs[lo:]...)
	}

	// itvs[lo:hi] collapse into the widened n.
	itvs[lo] = n
	return append(itvs[:lo+1], itvs[hi:]...)
}
|