2018-12-04 01:29:28 +08:00
|
|
|
package pstoreds
|
|
|
|
|
|
|
|
import (
|
2019-02-06 01:53:50 +08:00
|
|
|
"context"
|
2018-12-04 01:29:28 +08:00
|
|
|
"fmt"
|
|
|
|
"strconv"
|
|
|
|
"time"
|
|
|
|
|
|
|
|
ds "github.com/ipfs/go-datastore"
|
|
|
|
query "github.com/ipfs/go-datastore/query"
|
|
|
|
|
|
|
|
peer "github.com/libp2p/go-libp2p-peer"
|
|
|
|
pb "github.com/libp2p/go-libp2p-peerstore/pb"
|
|
|
|
|
2019-03-01 02:33:47 +08:00
|
|
|
b32 "github.com/multiformats/go-base32"
|
2018-12-04 01:29:28 +08:00
|
|
|
)
|
|
|
|
|
|
|
|
var (
|
2019-02-06 22:35:39 +08:00
|
|
|
// GC lookahead entries are stored in key pattern:
|
2018-12-04 01:29:28 +08:00
|
|
|
// /peers/gc/addrs/<unix timestamp of next visit>/<peer ID b32> => nil
|
2019-02-06 22:35:39 +08:00
|
|
|
// in databases with lexicographical key order, this time-indexing allows us to visit
|
|
|
|
// only the timeslice we are interested in.
|
2018-12-04 01:29:28 +08:00
|
|
|
gcLookaheadBase = ds.NewKey("/peers/gc/addrs")
|
2019-02-06 01:53:50 +08:00
|
|
|
|
2018-12-04 01:29:28 +08:00
|
|
|
// queries
|
2019-02-06 17:35:10 +08:00
|
|
|
purgeLookaheadQuery = query.Query{
|
2019-02-05 23:07:30 +08:00
|
|
|
Prefix: gcLookaheadBase.String(),
|
|
|
|
Orders: []query.Order{query.OrderByKey{}},
|
|
|
|
KeysOnly: true,
|
|
|
|
}
|
2019-02-06 01:53:50 +08:00
|
|
|
|
2019-02-06 17:35:10 +08:00
|
|
|
purgeStoreQuery = query.Query{
|
|
|
|
Prefix: addrBookBase.String(),
|
|
|
|
Orders: []query.Order{query.OrderByKey{}},
|
|
|
|
KeysOnly: false,
|
|
|
|
}
|
|
|
|
|
2019-02-05 23:07:30 +08:00
|
|
|
populateLookaheadQuery = query.Query{
|
|
|
|
Prefix: addrBookBase.String(),
|
|
|
|
Orders: []query.Order{query.OrderByKey{}},
|
|
|
|
KeysOnly: true,
|
|
|
|
}
|
2018-12-04 01:29:28 +08:00
|
|
|
)
|
|
|
|
|
2019-02-19 00:35:48 +08:00
|
|
|
// dsAddrBookGc is responsible for garbage collection in a datastore-backed address book.
|
2019-02-06 01:53:50 +08:00
|
|
|
type dsAddrBookGc struct {
|
2019-02-06 17:35:10 +08:00
|
|
|
ctx context.Context
|
|
|
|
ab *dsAddrBook
|
|
|
|
running chan struct{}
|
|
|
|
lookaheadEnabled bool
|
|
|
|
purgeFunc func()
|
|
|
|
currWindowEnd int64
|
2018-12-04 01:29:28 +08:00
|
|
|
}
|
|
|
|
|
2019-02-06 17:35:10 +08:00
|
|
|
func newAddressBookGc(ctx context.Context, ab *dsAddrBook) (*dsAddrBookGc, error) {
|
|
|
|
if ab.opts.GCPurgeInterval < 0 {
|
|
|
|
return nil, fmt.Errorf("negative GC purge interval provided: %s", ab.opts.GCPurgeInterval)
|
2018-12-04 01:29:28 +08:00
|
|
|
}
|
2019-02-06 17:35:10 +08:00
|
|
|
if ab.opts.GCLookaheadInterval < 0 {
|
|
|
|
return nil, fmt.Errorf("negative GC lookahead interval provided: %s", ab.opts.GCLookaheadInterval)
|
|
|
|
}
|
|
|
|
if ab.opts.GCInitialDelay < 0 {
|
|
|
|
return nil, fmt.Errorf("negative GC initial delay provided: %s", ab.opts.GCInitialDelay)
|
|
|
|
}
|
2019-02-06 22:35:39 +08:00
|
|
|
if ab.opts.GCLookaheadInterval > 0 && ab.opts.GCLookaheadInterval < ab.opts.GCPurgeInterval {
|
|
|
|
return nil, fmt.Errorf("lookahead interval must be larger than purge interval, respectively: %s, %s",
|
|
|
|
ab.opts.GCLookaheadInterval, ab.opts.GCPurgeInterval)
|
|
|
|
}
|
2019-02-06 17:35:10 +08:00
|
|
|
|
|
|
|
lookaheadEnabled := ab.opts.GCLookaheadInterval > 0
|
|
|
|
gc := &dsAddrBookGc{
|
|
|
|
ctx: ctx,
|
|
|
|
ab: ab,
|
|
|
|
running: make(chan struct{}, 1),
|
|
|
|
lookaheadEnabled: lookaheadEnabled,
|
|
|
|
}
|
|
|
|
|
|
|
|
if lookaheadEnabled {
|
|
|
|
gc.purgeFunc = gc.purgeLookahead
|
|
|
|
} else {
|
|
|
|
gc.purgeFunc = gc.purgeStore
|
|
|
|
}
|
|
|
|
|
|
|
|
// do not start GC timers if purge is disabled; this GC can only be triggered manually.
|
|
|
|
if ab.opts.GCPurgeInterval > 0 {
|
2019-02-16 02:43:17 +08:00
|
|
|
gc.ab.childrenDone.Add(1)
|
2019-02-06 17:35:10 +08:00
|
|
|
go gc.background()
|
|
|
|
}
|
|
|
|
|
|
|
|
return gc, nil
|
2018-12-04 01:29:28 +08:00
|
|
|
}
|
|
|
|
|
2019-02-06 01:53:50 +08:00
|
|
|
// gc prunes expired addresses from the datastore at regular intervals. It should be spawned as a goroutine.
|
|
|
|
func (gc *dsAddrBookGc) background() {
|
2019-02-16 02:43:17 +08:00
|
|
|
defer gc.ab.childrenDone.Done()
|
2018-12-04 01:29:28 +08:00
|
|
|
|
2019-02-06 01:53:50 +08:00
|
|
|
select {
|
|
|
|
case <-time.After(gc.ab.opts.GCInitialDelay):
|
|
|
|
case <-gc.ab.ctx.Done():
|
|
|
|
// yield if we have been cancelled/closed before the delay elapses.
|
|
|
|
return
|
2018-12-04 01:29:28 +08:00
|
|
|
}
|
|
|
|
|
2019-02-06 01:53:50 +08:00
|
|
|
purgeTimer := time.NewTicker(gc.ab.opts.GCPurgeInterval)
|
|
|
|
defer purgeTimer.Stop()
|
2018-12-04 01:29:28 +08:00
|
|
|
|
2019-02-06 01:53:50 +08:00
|
|
|
var lookaheadCh <-chan time.Time
|
2019-02-06 17:35:10 +08:00
|
|
|
if gc.lookaheadEnabled {
|
2019-02-06 01:53:50 +08:00
|
|
|
lookaheadTimer := time.NewTicker(gc.ab.opts.GCLookaheadInterval)
|
|
|
|
lookaheadCh = lookaheadTimer.C
|
2019-02-07 00:00:54 +08:00
|
|
|
gc.populateLookahead() // do a lookahead now
|
2019-02-06 01:53:50 +08:00
|
|
|
defer lookaheadTimer.Stop()
|
2018-12-04 19:47:22 +08:00
|
|
|
}
|
2019-02-06 01:53:50 +08:00
|
|
|
|
|
|
|
for {
|
|
|
|
select {
|
|
|
|
case <-purgeTimer.C:
|
2019-02-06 17:35:10 +08:00
|
|
|
gc.purgeFunc()
|
2019-02-06 01:53:50 +08:00
|
|
|
|
|
|
|
case <-lookaheadCh:
|
|
|
|
// will never trigger if lookahead is disabled (nil Duration).
|
|
|
|
gc.populateLookahead()
|
|
|
|
|
|
|
|
case <-gc.ctx.Done():
|
|
|
|
return
|
|
|
|
}
|
2018-12-04 01:29:28 +08:00
|
|
|
}
|
|
|
|
}
|
|
|
|
|
2019-02-06 00:52:27 +08:00
|
|
|
// purgeCycle runs a single GC purge cycle. It operates within the lookahead window if lookahead is enabled; else it
|
|
|
|
// visits all entries in the datastore, deleting the addresses that have expired.
|
2019-02-06 17:35:10 +08:00
|
|
|
func (gc *dsAddrBookGc) purgeLookahead() {
|
2019-02-06 01:53:50 +08:00
|
|
|
select {
|
|
|
|
case gc.running <- struct{}{}:
|
|
|
|
defer func() { <-gc.running }()
|
|
|
|
default:
|
2018-12-04 01:29:28 +08:00
|
|
|
// yield if lookahead is running.
|
|
|
|
return
|
|
|
|
}
|
|
|
|
|
|
|
|
var id peer.ID
|
2019-02-06 00:52:27 +08:00
|
|
|
record := &addrsRecord{AddrBookRecord: &pb.AddrBookRecord{}} // empty record to reuse and avoid allocs.
|
2019-02-06 22:35:39 +08:00
|
|
|
batch, err := newCyclicBatch(gc.ab.ds, defaultOpsPerCyclicBatch)
|
2018-12-04 01:29:28 +08:00
|
|
|
if err != nil {
|
|
|
|
log.Warningf("failed while creating batch to purge GC entries: %v", err)
|
|
|
|
}
|
|
|
|
|
|
|
|
// This function drops an unparseable GC entry; this is for safety. It is an escape hatch in case
|
|
|
|
// we modify the format of keys going forward. If a user runs a new version against an old DB,
|
|
|
|
// if we don't clean up unparseable entries we'll end up accumulating garbage.
|
|
|
|
dropInError := func(key ds.Key, err error, msg string) {
|
|
|
|
if err != nil {
|
2019-02-19 00:35:48 +08:00
|
|
|
log.Warningf("failed while %s record with GC key: %v, err: %v; deleting", msg, key, err)
|
2018-12-04 01:29:28 +08:00
|
|
|
}
|
|
|
|
if err = batch.Delete(key); err != nil {
|
|
|
|
log.Warningf("failed to delete corrupt GC lookahead entry: %v, err: %v", key, err)
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
// This function drops a GC key if the entry is cleaned correctly. It may reschedule another visit
|
|
|
|
// if the next earliest expiry falls within the current window again.
|
|
|
|
dropOrReschedule := func(key ds.Key, ar *addrsRecord) {
|
|
|
|
if err := batch.Delete(key); err != nil {
|
|
|
|
log.Warningf("failed to delete lookahead entry: %v, err: %v", key, err)
|
|
|
|
}
|
|
|
|
|
|
|
|
// re-add the record if it needs to be visited again in this window.
|
2019-02-06 01:53:50 +08:00
|
|
|
if len(ar.Addrs) != 0 && ar.Addrs[0].Expiry <= gc.currWindowEnd {
|
2018-12-04 01:29:28 +08:00
|
|
|
gcKey := gcLookaheadBase.ChildString(fmt.Sprintf("%d/%s", ar.Addrs[0].Expiry, key.Name()))
|
|
|
|
if err := batch.Put(gcKey, []byte{}); err != nil {
|
|
|
|
log.Warningf("failed to add new GC key: %v, err: %v", gcKey, err)
|
|
|
|
}
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
2019-02-06 17:35:10 +08:00
|
|
|
results, err := gc.ab.ds.Query(purgeLookaheadQuery)
|
2018-12-04 01:29:28 +08:00
|
|
|
if err != nil {
|
|
|
|
log.Warningf("failed while fetching entries to purge: %v", err)
|
|
|
|
return
|
|
|
|
}
|
|
|
|
defer results.Close()
|
|
|
|
|
|
|
|
now := time.Now().Unix()
|
|
|
|
|
|
|
|
// keys: /peers/gc/addrs/<unix timestamp of next visit>/<peer ID b32>
|
|
|
|
// values: nil
|
|
|
|
for result := range results.Next() {
|
|
|
|
gcKey := ds.RawKey(result.Key)
|
|
|
|
ts, err := strconv.ParseInt(gcKey.Parent().Name(), 10, 64)
|
|
|
|
if err != nil {
|
|
|
|
dropInError(gcKey, err, "parsing timestamp")
|
|
|
|
log.Warningf("failed while parsing timestamp from key: %v, err: %v", result.Key, err)
|
|
|
|
continue
|
|
|
|
} else if ts > now {
|
|
|
|
// this is an ordered cursor; when we hit an entry with a timestamp beyond now, we can break.
|
|
|
|
break
|
|
|
|
}
|
|
|
|
|
|
|
|
idb32, err := b32.RawStdEncoding.DecodeString(gcKey.Name())
|
|
|
|
if err != nil {
|
|
|
|
dropInError(gcKey, err, "parsing peer ID")
|
|
|
|
log.Warningf("failed while parsing b32 peer ID from key: %v, err: %v", result.Key, err)
|
|
|
|
continue
|
|
|
|
}
|
|
|
|
|
|
|
|
id, err = peer.IDFromBytes(idb32)
|
|
|
|
if err != nil {
|
|
|
|
dropInError(gcKey, err, "decoding peer ID")
|
|
|
|
log.Warningf("failed while decoding peer ID from key: %v, err: %v", result.Key, err)
|
|
|
|
continue
|
|
|
|
}
|
|
|
|
|
|
|
|
// if the record is in cache, we clean it and flush it if necessary.
|
2019-02-06 01:53:50 +08:00
|
|
|
if e, ok := gc.ab.cache.Peek(id); ok {
|
2018-12-04 01:29:28 +08:00
|
|
|
cached := e.(*addrsRecord)
|
|
|
|
cached.Lock()
|
2019-02-06 22:40:51 +08:00
|
|
|
if cached.clean() {
|
2019-02-06 00:52:27 +08:00
|
|
|
if err = cached.flush(batch); err != nil {
|
2018-12-04 01:29:28 +08:00
|
|
|
log.Warningf("failed to flush entry modified by GC for peer: &v, err: %v", id.Pretty(), err)
|
|
|
|
}
|
|
|
|
}
|
|
|
|
dropOrReschedule(gcKey, cached)
|
|
|
|
cached.Unlock()
|
|
|
|
continue
|
|
|
|
}
|
|
|
|
|
|
|
|
record.Reset()
|
|
|
|
|
|
|
|
// otherwise, fetch it from the store, clean it and flush it.
|
|
|
|
entryKey := addrBookBase.ChildString(gcKey.Name())
|
2019-02-06 01:53:50 +08:00
|
|
|
val, err := gc.ab.ds.Get(entryKey)
|
2018-12-04 01:29:28 +08:00
|
|
|
if err != nil {
|
|
|
|
// captures all errors, including ErrNotFound.
|
|
|
|
dropInError(gcKey, err, "fetching entry")
|
|
|
|
continue
|
|
|
|
}
|
|
|
|
err = record.Unmarshal(val)
|
|
|
|
if err != nil {
|
|
|
|
dropInError(gcKey, err, "unmarshalling entry")
|
|
|
|
continue
|
|
|
|
}
|
2019-02-06 22:40:51 +08:00
|
|
|
if record.clean() {
|
2019-02-06 00:52:27 +08:00
|
|
|
err = record.flush(batch)
|
2018-12-04 01:29:28 +08:00
|
|
|
if err != nil {
|
|
|
|
log.Warningf("failed to flush entry modified by GC for peer: &v, err: %v", id.Pretty(), err)
|
|
|
|
}
|
|
|
|
}
|
|
|
|
dropOrReschedule(gcKey, record)
|
|
|
|
}
|
|
|
|
|
|
|
|
if err = batch.Commit(); err != nil {
|
|
|
|
log.Warningf("failed to commit GC purge batch: %v", err)
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
2019-02-06 17:35:10 +08:00
|
|
|
func (gc *dsAddrBookGc) purgeStore() {
|
|
|
|
select {
|
|
|
|
case gc.running <- struct{}{}:
|
|
|
|
defer func() { <-gc.running }()
|
|
|
|
default:
|
|
|
|
// yield if lookahead is running.
|
|
|
|
return
|
|
|
|
}
|
|
|
|
|
|
|
|
record := &addrsRecord{AddrBookRecord: &pb.AddrBookRecord{}} // empty record to reuse and avoid allocs.
|
2019-02-06 22:35:39 +08:00
|
|
|
batch, err := newCyclicBatch(gc.ab.ds, defaultOpsPerCyclicBatch)
|
2019-02-06 17:35:10 +08:00
|
|
|
if err != nil {
|
|
|
|
log.Warningf("failed while creating batch to purge GC entries: %v", err)
|
|
|
|
}
|
|
|
|
|
|
|
|
results, err := gc.ab.ds.Query(purgeStoreQuery)
|
|
|
|
if err != nil {
|
|
|
|
log.Warningf("failed while opening iterator: %v", err)
|
|
|
|
return
|
|
|
|
}
|
|
|
|
defer results.Close()
|
|
|
|
|
|
|
|
// keys: /peers/addrs/<peer ID b32>
|
|
|
|
for result := range results.Next() {
|
|
|
|
record.Reset()
|
|
|
|
if err = record.Unmarshal(result.Value); err != nil {
|
|
|
|
// TODO log
|
|
|
|
continue
|
|
|
|
}
|
|
|
|
|
|
|
|
id := record.Id.ID
|
2019-02-06 22:40:51 +08:00
|
|
|
if !record.clean() {
|
2019-02-06 17:35:10 +08:00
|
|
|
continue
|
|
|
|
}
|
|
|
|
|
|
|
|
if err := record.flush(batch); err != nil {
|
|
|
|
log.Warningf("failed to flush entry modified by GC for peer: &v, err: %v", id, err)
|
|
|
|
}
|
|
|
|
gc.ab.cache.Remove(id)
|
|
|
|
}
|
|
|
|
|
|
|
|
if err = batch.Commit(); err != nil {
|
|
|
|
log.Warningf("failed to commit GC purge batch: %v", err)
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
2018-12-04 01:29:28 +08:00
|
|
|
// populateLookahead populates the lookahead window by scanning the entire store and picking entries whose earliest
|
2019-02-06 01:53:50 +08:00
|
|
|
// expiration falls within the window period.
|
2018-12-04 01:29:28 +08:00
|
|
|
//
|
|
|
|
// Those entries are stored in the lookahead region in the store, indexed by the timestamp when they need to be
|
|
|
|
// visited, to facilitate temporal range scans.
|
2019-02-06 01:53:50 +08:00
|
|
|
func (gc *dsAddrBookGc) populateLookahead() {
|
2019-02-06 17:35:10 +08:00
|
|
|
if gc.ab.opts.GCLookaheadInterval == 0 {
|
|
|
|
return
|
|
|
|
}
|
|
|
|
|
2019-02-06 01:53:50 +08:00
|
|
|
select {
|
|
|
|
case gc.running <- struct{}{}:
|
|
|
|
defer func() { <-gc.running }()
|
|
|
|
default:
|
|
|
|
// yield if something's running.
|
2018-12-04 01:29:28 +08:00
|
|
|
return
|
|
|
|
}
|
|
|
|
|
2019-02-06 01:53:50 +08:00
|
|
|
until := time.Now().Add(gc.ab.opts.GCLookaheadInterval).Unix()
|
2018-12-04 01:29:28 +08:00
|
|
|
|
|
|
|
var id peer.ID
|
|
|
|
record := &addrsRecord{AddrBookRecord: &pb.AddrBookRecord{}}
|
2019-02-06 01:53:50 +08:00
|
|
|
results, err := gc.ab.ds.Query(populateLookaheadQuery)
|
2018-12-04 01:29:28 +08:00
|
|
|
if err != nil {
|
|
|
|
log.Warningf("failed while querying to populate lookahead GC window: %v", err)
|
|
|
|
return
|
|
|
|
}
|
|
|
|
defer results.Close()
|
|
|
|
|
2019-02-06 22:35:39 +08:00
|
|
|
batch, err := newCyclicBatch(gc.ab.ds, defaultOpsPerCyclicBatch)
|
2018-12-04 01:29:28 +08:00
|
|
|
if err != nil {
|
|
|
|
log.Warningf("failed while creating batch to populate lookahead GC window: %v", err)
|
|
|
|
return
|
|
|
|
}
|
|
|
|
|
|
|
|
for result := range results.Next() {
|
|
|
|
idb32 := ds.RawKey(result.Key).Name()
|
|
|
|
k, err := b32.RawStdEncoding.DecodeString(idb32)
|
|
|
|
if err != nil {
|
|
|
|
log.Warningf("failed while decoding peer ID from key: %v, err: %v", result.Key, err)
|
|
|
|
continue
|
|
|
|
}
|
|
|
|
if id, err = peer.IDFromBytes(k); err != nil {
|
|
|
|
log.Warningf("failed while decoding peer ID from key: %v, err: %v", result.Key, err)
|
|
|
|
}
|
|
|
|
|
|
|
|
// if the record is in cache, use the cached version.
|
2019-02-06 01:53:50 +08:00
|
|
|
if e, ok := gc.ab.cache.Peek(id); ok {
|
2018-12-04 01:29:28 +08:00
|
|
|
cached := e.(*addrsRecord)
|
|
|
|
cached.RLock()
|
|
|
|
if len(cached.Addrs) == 0 || cached.Addrs[0].Expiry > until {
|
|
|
|
cached.RUnlock()
|
|
|
|
continue
|
|
|
|
}
|
|
|
|
gcKey := gcLookaheadBase.ChildString(fmt.Sprintf("%d/%s", cached.Addrs[0].Expiry, idb32))
|
|
|
|
if err = batch.Put(gcKey, []byte{}); err != nil {
|
|
|
|
log.Warningf("failed while inserting GC entry for peer: %v, err: %v", id.Pretty(), err)
|
|
|
|
}
|
|
|
|
cached.RUnlock()
|
|
|
|
continue
|
|
|
|
}
|
|
|
|
|
|
|
|
record.Reset()
|
|
|
|
|
2019-02-06 01:53:50 +08:00
|
|
|
val, err := gc.ab.ds.Get(ds.RawKey(result.Key))
|
2018-12-04 01:29:28 +08:00
|
|
|
if err != nil {
|
|
|
|
log.Warningf("failed which getting record from store for peer: %v, err: %v", id.Pretty(), err)
|
|
|
|
continue
|
|
|
|
}
|
|
|
|
if err := record.Unmarshal(val); err != nil {
|
|
|
|
log.Warningf("failed while unmarshalling record from store for peer: %v, err: %v", id.Pretty(), err)
|
|
|
|
continue
|
|
|
|
}
|
|
|
|
if len(record.Addrs) > 0 && record.Addrs[0].Expiry <= until {
|
|
|
|
gcKey := gcLookaheadBase.ChildString(fmt.Sprintf("%d/%s", record.Addrs[0].Expiry, idb32))
|
|
|
|
if err = batch.Put(gcKey, []byte{}); err != nil {
|
|
|
|
log.Warningf("failed while inserting GC entry for peer: %v, err: %v", id.Pretty(), err)
|
|
|
|
}
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
if err = batch.Commit(); err != nil {
|
|
|
|
log.Warningf("failed to commit GC lookahead batch: %v", err)
|
|
|
|
}
|
|
|
|
|
2019-02-06 01:53:50 +08:00
|
|
|
gc.currWindowEnd = until
|
2018-12-04 01:29:28 +08:00
|
|
|
}
|