2020-04-30 15:07:27 +08:00
|
|
|
package raftstore
|
|
|
|
|
|
|
|
import (
|
|
|
|
"sync"
|
|
|
|
|
|
|
|
"github.com/Connor1996/badger"
|
|
|
|
"github.com/pingcap-incubator/tinykv/kv/config"
|
|
|
|
"github.com/pingcap-incubator/tinykv/kv/raftstore/message"
|
|
|
|
"github.com/pingcap-incubator/tinykv/kv/raftstore/meta"
|
|
|
|
"github.com/pingcap-incubator/tinykv/kv/raftstore/runner"
|
|
|
|
"github.com/pingcap-incubator/tinykv/kv/raftstore/snap"
|
|
|
|
"github.com/pingcap-incubator/tinykv/kv/raftstore/util"
|
|
|
|
"github.com/pingcap-incubator/tinykv/kv/util/engine_util"
|
|
|
|
"github.com/pingcap-incubator/tinykv/log"
|
|
|
|
"github.com/pingcap-incubator/tinykv/proto/pkg/metapb"
|
|
|
|
rspb "github.com/pingcap-incubator/tinykv/proto/pkg/raft_serverpb"
|
|
|
|
"github.com/pingcap-incubator/tinykv/proto/pkg/schedulerpb"
|
|
|
|
"github.com/pingcap/errors"
|
|
|
|
)
|
|
|
|
|
|
|
|
type StoreTick int
|
|
|
|
|
|
|
|
const (
|
|
|
|
StoreTickSchedulerStoreHeartbeat StoreTick = 1
|
|
|
|
StoreTickSnapGC StoreTick = 2
|
|
|
|
)
|
|
|
|
|
|
|
|
type storeState struct {
|
|
|
|
id uint64
|
|
|
|
receiver <-chan message.Msg
|
|
|
|
ticker *ticker
|
|
|
|
}
|
|
|
|
|
|
|
|
func newStoreState(cfg *config.Config) (chan<- message.Msg, *storeState) {
|
|
|
|
ch := make(chan message.Msg, 40960)
|
|
|
|
state := &storeState{
|
|
|
|
receiver: (<-chan message.Msg)(ch),
|
|
|
|
ticker: newStoreTicker(cfg),
|
|
|
|
}
|
|
|
|
return (chan<- message.Msg)(ch), state
|
|
|
|
}
|
|
|
|
|
|
|
|
// storeWorker runs store commands.
|
|
|
|
type storeWorker struct {
|
|
|
|
*storeState
|
|
|
|
ctx *GlobalContext
|
|
|
|
}
|
|
|
|
|
|
|
|
func newStoreWorker(ctx *GlobalContext, state *storeState) *storeWorker {
|
|
|
|
return &storeWorker{
|
|
|
|
storeState: state,
|
|
|
|
ctx: ctx,
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
func (sw *storeWorker) run(closeCh <-chan struct{}, wg *sync.WaitGroup) {
|
|
|
|
defer wg.Done()
|
|
|
|
for {
|
|
|
|
var msg message.Msg
|
|
|
|
select {
|
|
|
|
case <-closeCh:
|
|
|
|
return
|
|
|
|
case msg = <-sw.receiver:
|
|
|
|
}
|
|
|
|
sw.handleMsg(msg)
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
func (d *storeWorker) onTick(tick StoreTick) {
|
|
|
|
switch tick {
|
|
|
|
case StoreTickSchedulerStoreHeartbeat:
|
2021-02-23 20:20:22 +08:00
|
|
|
d.onSchedulerStoreHeartbeatTick()
|
2020-04-30 15:07:27 +08:00
|
|
|
case StoreTickSnapGC:
|
|
|
|
d.onSnapMgrGC()
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
func (d *storeWorker) handleMsg(msg message.Msg) {
|
|
|
|
switch msg.Type {
|
|
|
|
case message.MsgTypeStoreRaftMessage:
|
|
|
|
if err := d.onRaftMessage(msg.Data.(*rspb.RaftMessage)); err != nil {
|
|
|
|
log.Errorf("handle raft message failed storeID %d, %v", d.id, err)
|
|
|
|
}
|
|
|
|
case message.MsgTypeStoreTick:
|
|
|
|
d.onTick(msg.Data.(StoreTick))
|
|
|
|
case message.MsgTypeStoreStart:
|
|
|
|
d.start(msg.Data.(*metapb.Store))
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
func (d *storeWorker) start(store *metapb.Store) {
|
|
|
|
d.id = store.Id
|
|
|
|
d.ticker.scheduleStore(StoreTickSchedulerStoreHeartbeat)
|
|
|
|
d.ticker.scheduleStore(StoreTickSnapGC)
|
|
|
|
}
|
|
|
|
|
|
|
|
/// Checks if the message is targeting a stale peer.
|
|
|
|
///
|
|
|
|
/// Returns true means the message can be dropped silently.
|
|
|
|
func (d *storeWorker) checkMsg(msg *rspb.RaftMessage) (bool, error) {
|
|
|
|
regionID := msg.GetRegionId()
|
|
|
|
fromEpoch := msg.GetRegionEpoch()
|
|
|
|
msgType := msg.Message.MsgType
|
|
|
|
isVoteMsg := util.IsVoteMessage(msg.Message)
|
|
|
|
fromStoreID := msg.FromPeer.StoreId
|
|
|
|
|
|
|
|
// Check if the target is tombstone,
|
|
|
|
stateKey := meta.RegionStateKey(regionID)
|
|
|
|
localState := new(rspb.RegionLocalState)
|
|
|
|
err := engine_util.GetMeta(d.ctx.engine.Kv, stateKey, localState)
|
|
|
|
if err != nil {
|
|
|
|
if err == badger.ErrKeyNotFound {
|
|
|
|
return false, nil
|
|
|
|
}
|
|
|
|
return false, err
|
|
|
|
}
|
|
|
|
if localState.State != rspb.PeerState_Tombstone {
|
|
|
|
// Maybe split, but not registered yet.
|
|
|
|
if util.IsFirstVoteMessage(msg.Message) {
|
|
|
|
meta := d.ctx.storeMeta
|
2020-07-27 15:27:24 +08:00
|
|
|
meta.RLock()
|
|
|
|
defer meta.RUnlock()
|
2020-04-30 15:07:27 +08:00
|
|
|
// Last check on whether target peer is created, otherwise, the
|
|
|
|
// vote message will never be comsumed.
|
|
|
|
if _, ok := meta.regions[regionID]; ok {
|
|
|
|
return false, nil
|
|
|
|
}
|
|
|
|
meta.pendingVotes = append(meta.pendingVotes, msg)
|
|
|
|
log.Infof("region %d doesn't exist yet, wait for it to be split.", regionID)
|
|
|
|
return true, nil
|
|
|
|
}
|
|
|
|
return false, errors.Errorf("region %d not exists but not tombstone: %s", regionID, localState)
|
|
|
|
}
|
|
|
|
log.Debugf("region %d in tombstone state: %s", regionID, localState)
|
|
|
|
region := localState.Region
|
|
|
|
regionEpoch := region.RegionEpoch
|
|
|
|
// The region in this peer is already destroyed
|
|
|
|
if util.IsEpochStale(fromEpoch, regionEpoch) {
|
|
|
|
log.Infof("tombstone peer receives a stale message. region_id:%d, from_region_epoch:%s, current_region_epoch:%s, msg_type:%s",
|
|
|
|
regionID, fromEpoch, regionEpoch, msgType)
|
|
|
|
notExist := util.FindPeer(region, fromStoreID) == nil
|
|
|
|
handleStaleMsg(d.ctx.trans, msg, regionEpoch, isVoteMsg && notExist)
|
|
|
|
return true, nil
|
|
|
|
}
|
|
|
|
if fromEpoch.ConfVer == regionEpoch.ConfVer {
|
|
|
|
return false, errors.Errorf("tombstone peer [epoch: %s] received an invalid message %s, ignore it",
|
|
|
|
regionEpoch, msgType)
|
|
|
|
}
|
|
|
|
return false, nil
|
|
|
|
}
|
|
|
|
|
|
|
|
func (d *storeWorker) onRaftMessage(msg *rspb.RaftMessage) error {
|
|
|
|
regionID := msg.RegionId
|
|
|
|
if err := d.ctx.router.send(regionID, message.Msg{Type: message.MsgTypeRaftMessage, Data: msg}); err == nil {
|
|
|
|
return nil
|
|
|
|
}
|
|
|
|
log.Debugf("handle raft message. from_peer:%d, to_peer:%d, store:%d, region:%d, msg:%+v",
|
|
|
|
msg.FromPeer.Id, msg.ToPeer.Id, d.storeState.id, regionID, msg.Message)
|
|
|
|
if msg.ToPeer.StoreId != d.ctx.store.Id {
|
|
|
|
log.Warnf("store not match, ignore it. store_id:%d, to_store_id:%d, region_id:%d",
|
|
|
|
d.ctx.store.Id, msg.ToPeer.StoreId, regionID)
|
|
|
|
return nil
|
|
|
|
}
|
|
|
|
|
|
|
|
if msg.RegionEpoch == nil {
|
|
|
|
log.Errorf("missing region epoch in raft message, ignore it. region_id:%d", regionID)
|
|
|
|
return nil
|
|
|
|
}
|
|
|
|
if msg.IsTombstone {
|
|
|
|
// Target tombstone peer doesn't exist, so ignore it.
|
|
|
|
return nil
|
|
|
|
}
|
|
|
|
ok, err := d.checkMsg(msg)
|
|
|
|
if err != nil {
|
|
|
|
return err
|
|
|
|
}
|
|
|
|
if ok {
|
|
|
|
return nil
|
|
|
|
}
|
|
|
|
created, err := d.maybeCreatePeer(regionID, msg)
|
|
|
|
if err != nil {
|
|
|
|
return err
|
|
|
|
}
|
|
|
|
if !created {
|
|
|
|
return nil
|
|
|
|
}
|
|
|
|
_ = d.ctx.router.send(regionID, message.Msg{Type: message.MsgTypeRaftMessage, Data: msg})
|
|
|
|
return nil
|
|
|
|
}
|
|
|
|
|
|
|
|
/// If target peer doesn't exist, create it.
|
|
|
|
///
|
|
|
|
/// return false to indicate that target peer is in invalid state or
|
|
|
|
/// doesn't exist and can't be created.
|
|
|
|
func (d *storeWorker) maybeCreatePeer(regionID uint64, msg *rspb.RaftMessage) (bool, error) {
|
|
|
|
// we may encounter a message with larger peer id, which means
|
|
|
|
// current peer is stale, then we should remove current peer
|
|
|
|
meta := d.ctx.storeMeta
|
2020-07-27 15:27:24 +08:00
|
|
|
meta.Lock()
|
|
|
|
defer meta.Unlock()
|
2020-04-30 15:07:27 +08:00
|
|
|
if _, ok := meta.regions[regionID]; ok {
|
|
|
|
return true, nil
|
|
|
|
}
|
|
|
|
if !util.IsInitialMsg(msg.Message) {
|
|
|
|
log.Debugf("target peer %s doesn't exist", msg.ToPeer)
|
|
|
|
return false, nil
|
|
|
|
}
|
|
|
|
|
|
|
|
for _, region := range meta.getOverlapRegions(&metapb.Region{
|
|
|
|
StartKey: msg.StartKey,
|
|
|
|
EndKey: msg.EndKey,
|
|
|
|
}) {
|
|
|
|
log.Debugf("msg %s is overlapped with exist region %s", msg, region)
|
|
|
|
if util.IsFirstVoteMessage(msg.Message) {
|
|
|
|
meta.pendingVotes = append(meta.pendingVotes, msg)
|
|
|
|
}
|
|
|
|
return false, nil
|
|
|
|
}
|
|
|
|
|
|
|
|
peer, err := replicatePeer(
|
|
|
|
d.ctx.store.Id, d.ctx.cfg, d.ctx.regionTaskSender, d.ctx.engine, regionID, msg.ToPeer)
|
|
|
|
if err != nil {
|
|
|
|
return false, err
|
|
|
|
}
|
2020-04-23 17:48:15 +08:00
|
|
|
// following snapshot may overlap, should insert into regionRanges after
|
2020-04-30 15:07:27 +08:00
|
|
|
// snapshot is applied.
|
|
|
|
meta.regions[regionID] = peer.Region()
|
|
|
|
d.ctx.router.register(peer)
|
|
|
|
_ = d.ctx.router.send(regionID, message.Msg{Type: message.MsgTypeStart})
|
|
|
|
return true, nil
|
|
|
|
}
|
|
|
|
|
|
|
|
func (d *storeWorker) storeHeartbeatScheduler() {
|
|
|
|
stats := new(schedulerpb.StoreStats)
|
|
|
|
stats.StoreId = d.ctx.store.Id
|
2020-07-27 15:27:24 +08:00
|
|
|
meta := d.ctx.storeMeta
|
|
|
|
meta.RLock()
|
|
|
|
stats.RegionCount = uint32(len(meta.regions))
|
|
|
|
meta.RUnlock()
|
2020-04-30 15:07:27 +08:00
|
|
|
d.ctx.schedulerTaskSender <- &runner.SchedulerStoreHeartbeatTask{
|
|
|
|
Stats: stats,
|
|
|
|
Engine: d.ctx.engine.Kv,
|
|
|
|
Path: d.ctx.engine.KvPath,
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
2021-02-23 20:20:22 +08:00
|
|
|
func (d *storeWorker) onSchedulerStoreHeartbeatTick() {
|
2020-04-30 15:07:27 +08:00
|
|
|
d.storeHeartbeatScheduler()
|
|
|
|
d.ticker.scheduleStore(StoreTickSchedulerStoreHeartbeat)
|
|
|
|
}
|
|
|
|
|
|
|
|
func (d *storeWorker) handleSnapMgrGC() error {
|
|
|
|
mgr := d.ctx.snapMgr
|
|
|
|
snapKeys, err := mgr.ListIdleSnap()
|
|
|
|
if err != nil {
|
|
|
|
return err
|
|
|
|
}
|
|
|
|
if len(snapKeys) == 0 {
|
|
|
|
return nil
|
|
|
|
}
|
|
|
|
var lastRegionID uint64
|
|
|
|
var keys []snap.SnapKeyWithSending
|
|
|
|
for _, pair := range snapKeys {
|
|
|
|
key := pair.SnapKey
|
|
|
|
if lastRegionID == key.RegionID {
|
|
|
|
keys = append(keys, pair)
|
|
|
|
continue
|
|
|
|
}
|
|
|
|
if len(keys) > 0 {
|
|
|
|
err = d.scheduleGCSnap(lastRegionID, keys)
|
|
|
|
if err != nil {
|
|
|
|
return err
|
|
|
|
}
|
|
|
|
keys = nil
|
|
|
|
}
|
|
|
|
lastRegionID = key.RegionID
|
|
|
|
keys = append(keys, pair)
|
|
|
|
}
|
|
|
|
if len(keys) > 0 {
|
|
|
|
return d.scheduleGCSnap(lastRegionID, keys)
|
|
|
|
}
|
|
|
|
return nil
|
|
|
|
}
|
|
|
|
|
|
|
|
func (d *storeWorker) scheduleGCSnap(regionID uint64, keys []snap.SnapKeyWithSending) error {
|
|
|
|
gcSnap := message.Msg{Type: message.MsgTypeGcSnap, Data: &message.MsgGCSnap{Snaps: keys}}
|
|
|
|
if d.ctx.router.send(regionID, gcSnap) != nil {
|
|
|
|
// The snapshot exists because MsgAppend has been rejected. So the
|
|
|
|
// peer must have been exist. But now it's disconnected, so the peer
|
|
|
|
// has to be destroyed instead of being created.
|
|
|
|
log.Infof("region %d is disconnected, remove snaps %v", regionID, keys)
|
|
|
|
for _, pair := range keys {
|
|
|
|
key := pair.SnapKey
|
|
|
|
isSending := pair.IsSending
|
|
|
|
var snapshot snap.Snapshot
|
|
|
|
var err error
|
|
|
|
if isSending {
|
|
|
|
snapshot, err = d.ctx.snapMgr.GetSnapshotForSending(key)
|
|
|
|
} else {
|
|
|
|
snapshot, err = d.ctx.snapMgr.GetSnapshotForApplying(key)
|
|
|
|
}
|
|
|
|
if err != nil {
|
|
|
|
return err
|
|
|
|
}
|
|
|
|
d.ctx.snapMgr.DeleteSnapshot(key, snapshot, false)
|
|
|
|
}
|
|
|
|
}
|
|
|
|
return nil
|
|
|
|
}
|
|
|
|
|
|
|
|
func (d *storeWorker) onSnapMgrGC() {
|
|
|
|
if err := d.handleSnapMgrGC(); err != nil {
|
|
|
|
log.Errorf("handle snap GC failed store_id %d, err %s", d.storeState.id, err)
|
|
|
|
}
|
|
|
|
d.ticker.scheduleStore(StoreTickSnapGC)
|
|
|
|
}
|