package storage

import (
	"context"
	"time"

	"golang.org/x/xerrors"

	"github.com/filecoin-project/go-address"
	"github.com/filecoin-project/go-state-types/abi"
	"github.com/filecoin-project/go-state-types/dline"
	"github.com/filecoin-project/specs-storage/storage"

	"github.com/filecoin-project/lotus/api"
	"github.com/filecoin-project/lotus/build"
	"github.com/filecoin-project/lotus/chain/store"
	"github.com/filecoin-project/lotus/chain/types"
	sectorstorage "github.com/filecoin-project/lotus/extern/sector-storage"
	"github.com/filecoin-project/lotus/journal"
	"github.com/filecoin-project/lotus/node/config"

	"go.opencensus.io/trace"
)

// StartConfidence is the number of epochs past a deadline's Open epoch that
// the chain head must exceed before update starts a window PoSt for it.
const StartConfidence = 4 // TODO: config

// WindowPoStScheduler follows chain head changes (see Run) and, per proving
// deadline of the miner actor, starts window PoSt work via doPost or aborts
// the work currently in flight.
type WindowPoStScheduler struct {
	api              storageMinerApi
	feeCfg           config.MinerFeeConfig
	prover           storage.Prover
	faultTracker     sectorstorage.FaultTracker
	proofType        abi.RegisteredPoStProof
	partitionSectors uint64

	actor  address.Address
	worker address.Address

	// cur is the tipset recorded by the most recent revert; it is also the
	// source of Height/TipSet in journal events (see getEvtCommon).
	cur *types.TipSet

	// if a post is in progress, this indicates for which ElectionPeriodStart
	activeDeadline *dline.Info
	// abort, when non-nil, is invoked by abortActivePoSt to cancel the
	// in-progress PoSt.
	abort context.CancelFunc

	// evtTypes holds the journal event types registered in
	// NewWindowedPoStScheduler, indexed by the evtTypeWdPoSt* constants.
	evtTypes [4]journal.EventType

	// failed abi.ChainEpoch // eps
	// failLk sync.Mutex
}

// NewWindowedPoStScheduler builds a WindowPoStScheduler for the given miner
// actor and worker addresses.
//
// It looks up the actor's miner info through api.StateMinerInfo (with
// context.TODO and the empty tipset key), derives the window PoSt proof type
// from the miner's seal proof type, and registers the four "wdpost" journal
// event types. An error from either lookup is returned to the caller.
func NewWindowedPoStScheduler(api storageMinerApi, fc config.MinerFeeConfig, sb storage.Prover, ft sectorstorage.FaultTracker, actor address.Address, worker address.Address) (*WindowPoStScheduler, error) {
	mi, err := api.StateMinerInfo(context.TODO(), actor, types.EmptyTSK)
	if err != nil {
		return nil, xerrors.Errorf("getting sector size: %w", err)
	}

	rt, err := mi.SealProofType.RegisteredWindowPoStProof()
	if err != nil {
		return nil, err
	}

	return &WindowPoStScheduler{
		api:              api,
		feeCfg:           fc,
		prover:           sb,
		faultTracker:     ft,
		proofType:        rt,
		partitionSectors: mi.WindowPoStPartitionSectors,

		actor:  actor,
		worker: worker,
		evtTypes: [...]journal.EventType{
			evtTypeWdPoStScheduler:  journal.J.RegisterEventType("wdpost", "scheduler"),
			evtTypeWdPoStProofs:     journal.J.RegisterEventType("wdpost", "proofs_processed"),
			evtTypeWdPoStRecoveries: journal.J.RegisterEventType("wdpost", "recoveries_processed"),
			evtTypeWdPoStFaults:     journal.J.RegisterEventType("wdpost", "faults_processed"),
		},
	}, nil
}

// deadlineEquals reports whether a and b describe the same deadline, i.e.
// they agree on PeriodStart, Index and Challenge. Two nil values are equal;
// a nil and a non-nil value are not.
func deadlineEquals(a, b *dline.Info) bool {
	if a == nil || b == nil {
		return b == a
	}

	return a.PeriodStart == b.PeriodStart && a.Index == b.Index && a.Challenge == b.Challenge
}

// Run consumes head-change notifications from the chain API until ctx is
// done, feeding reverts and applies into revert and update. Any active PoSt
// is aborted when Run returns.
//
// If the notification channel is closed, Run re-subscribes. The first
// notification of every subscription must be a single HCCurrent change.
func (s *WindowPoStScheduler) Run(ctx context.Context) {
	defer s.abortActivePoSt()

	var notifs <-chan []*api.HeadChange
	var err error
	var gotCur bool

	// not fine to panic after this point
	for {
		if notifs == nil {
			notifs, err = s.api.ChainNotify(ctx)
			if err != nil {
				log.Errorf("ChainNotify error: %+v", err)

				// Stop retrying once ctx is cancelled; otherwise, while
				// ChainNotify keeps failing, this loop would never reach
				// the ctx.Done() case below.
				if ctx.Err() != nil {
					return
				}

				build.Clock.Sleep(10 * time.Second)
				continue
			}

			gotCur = false
		}

		select {
		case changes, ok := <-notifs:
			if !ok {
				log.Warn("WindowPoStScheduler notifs channel closed")
				notifs = nil
				continue
			}

			if !gotCur {
				if len(changes) != 1 {
					log.Errorf("expected first notif to have len = 1")
					continue
				}
				chg := changes[0]
				if chg.Type != store.HCCurrent {
					log.Errorf("expected first notif to tell current ts")
					continue
				}

				if err := s.update(ctx, chg.Val); err != nil {
					log.Errorf("%+v", err)
				}

				gotCur = true
				continue
			}

			spanCtx, span := trace.StartSpan(ctx, "WindowPoStScheduler.headChange")

			// The last revert and the last apply in the batch win.
			var lowest, highest *types.TipSet = s.cur, nil

			for _, change := range changes {
				if change.Val == nil {
					log.Errorf("change.Val was nil")
					// Skip it: a nil tipset would be dereferenced in revert.
					continue
				}
				switch change.Type {
				case store.HCRevert:
					lowest = change.Val
				case store.HCApply:
					highest = change.Val
				}
			}

			if err := s.revert(spanCtx, lowest); err != nil {
				log.Errorf("handling head reverts in windowPost sched: %+v", err)
			}
			if err := s.update(spanCtx, highest); err != nil {
				log.Errorf("handling head updates in windowPost sched: %+v", err)
			}

			span.End()
		case <-ctx.Done():
			return
		}
	}
}

// revert records newLowest as the current tipset and aborts the active PoSt
// if the proving deadline at newLowest differs from the active one. It is a
// no-op when newLowest is already the current tipset, and returns an error
// for a nil newLowest or a failed deadline lookup.
func (s *WindowPoStScheduler) revert(ctx context.Context, newLowest *types.TipSet) error {
	if s.cur == newLowest {
		return nil
	}
	if newLowest == nil {
		// Guard the newLowest.Key() call below against a nil dereference.
		return xerrors.Errorf("no lowest tipset in WindowPoStScheduler.revert")
	}
	s.cur = newLowest

	newDeadline, err := s.api.StateMinerProvingDeadline(ctx, s.actor, newLowest.Key())
	if err != nil {
		return err
	}

	if !deadlineEquals(s.activeDeadline, newDeadline) {
		s.abortActivePoSt()
	}

	return nil
}

// update looks up the proving deadline at the tipset new and, unless that
// deadline is already the active one or its proving period has not started,
// aborts any active PoSt and calls doPost once the head is more than
// StartConfidence epochs past the deadline's Open epoch.
//
// It returns an error when new is nil or the deadline lookup fails.
func (s *WindowPoStScheduler) update(ctx context.Context, new *types.TipSet) error {
	if new == nil {
		return xerrors.Errorf("no new tipset in WindowPoStScheduler.update")
	}

	di, err := s.api.StateMinerProvingDeadline(ctx, s.actor, new.Key())
	if err != nil {
		return err
	}

	if deadlineEquals(s.activeDeadline, di) {
		return nil // already working on this deadline
	}

	if !di.PeriodStarted() {
		return nil // not proving anything yet
	}

	s.abortActivePoSt()

	// TODO: wait for di.Challenge here, will give us ~10min more to compute windowpost
	//  (Need to get correct deadline above, which is tricky)

	if di.Open+StartConfidence >= new.Height() {
		log.Infof("not starting windowPost yet, waiting for startconfidence (open: %d, start: %d, height: %d)", di.Open, di.Open+StartConfidence, new.Height())
		return nil
	}

	/*s.failLk.Lock()
	if s.failed > 0 {
		s.failed = 0
		s.activeEPS = 0
	}
	s.failLk.Unlock()*/
	log.Infof("at %d, doPost for P %d, dd %d", new.Height(), di.PeriodStart, di.Index)

	s.doPost(ctx, di, new)

	return nil
}

// abortActivePoSt cancels the in-progress PoSt, if any: it invokes the stored
// cancel function, records a SchedulerStateAborted journal event, logs a
// warning, and clears the active deadline. It is a no-op when no deadline is
// active.
func (s *WindowPoStScheduler) abortActivePoSt() {
	if s.activeDeadline == nil {
		return // noop
	}

	if s.abort != nil {
		s.abort()

		journal.J.RecordEvent(s.evtTypes[evtTypeWdPoStScheduler], func() interface{} {
			return WdPoStSchedulerEvt{
				evtCommon: s.getEvtCommon(nil),
				State:     SchedulerStateAborted,
			}
		})

		log.Warnf("Aborting Window PoSt (Deadline: %+v)", s.activeDeadline)
	}

	s.activeDeadline = nil
	s.abort = nil
}

// getEvtCommon populates and returns common attributes from state, for a
// WdPoSt journal event. Deadline, Height and TipSet are filled in only when a
// current tipset has been recorded.
func (s *WindowPoStScheduler) getEvtCommon(err error) evtCommon {
	c := evtCommon{Error: err}
	if s.cur != nil {
		c.Deadline = s.activeDeadline
		c.Height = s.cur.Height()
		c.TipSet = s.cur.Cids()
	}
	return c
}