lotus/chain/index/msgindex.go

342 lines
7.2 KiB
Go
Raw Normal View History

2023-03-11 14:49:07 +00:00
package index
import (
"context"
"database/sql"
"errors"
"io/fs"
"os"
"path"
2023-03-11 17:11:08 +00:00
"sync"
2023-03-11 14:49:07 +00:00
"time"
logging "github.com/ipfs/go-log/v2"
_ "github.com/mattn/go-sqlite3"
"golang.org/x/xerrors"
2023-03-11 16:21:16 +00:00
"github.com/filecoin-project/go-state-types/abi"
2023-03-11 14:49:07 +00:00
"github.com/filecoin-project/lotus/chain/store"
"github.com/filecoin-project/lotus/chain/types"
2023-03-11 16:21:16 +00:00
"github.com/ipfs/go-cid"
2023-03-11 14:49:07 +00:00
)
2023-03-11 17:11:08 +00:00
// log is the package logger, registered under the "msgindex" subsystem name.
var log = logging.Logger("msgindex")

var (
	// dbName is the file name of the index database; NewMsgIndex joins it
	// onto the base path it is given.
	dbName = "msgindex.db"

	// The three coalesce* values are passed, in this order, to
	// store.WrapHeadChangeCoalescer when NewMsgIndex subscribes to head changes.
	coalesceMinDelay      = 100 * time.Millisecond
	coalesceMaxDelay      = time.Second
	coalesceMergeInterval = 100 * time.Millisecond
)
2023-03-11 15:55:48 +00:00
// chain store interface; we could use store.ChainStore directly,
// but this simplifies unit testing.
type ChainStore interface {
SubscribeHeadChanges(f store.ReorgNotifee)
2023-03-11 17:11:08 +00:00
MessagesForBlock(ctx context.Context, b *types.BlockHeader) ([]*types.Message, []*types.SignedMessage, error)
2023-03-11 15:55:48 +00:00
}
var _ ChainStore = (*store.ChainStore)(nil)
2023-03-11 14:49:07 +00:00
type msgIndex struct {
2023-03-11 15:55:48 +00:00
cs ChainStore
2023-03-11 14:49:07 +00:00
2023-03-11 16:21:16 +00:00
db *sql.DB
selectMsgStmt *sql.Stmt
2023-03-11 17:11:08 +00:00
insertMsgStmt *sql.Stmt
2023-03-11 16:21:16 +00:00
deleteTipSetStmt *sql.Stmt
2023-03-11 14:49:07 +00:00
2023-03-11 17:11:08 +00:00
sema chan struct{}
mx sync.Mutex
pend []headChange
2023-03-11 14:49:07 +00:00
2023-03-11 17:11:08 +00:00
cancel func()
}
2023-03-11 14:49:07 +00:00
2023-03-11 17:11:08 +00:00
var _ MsgIndex = (*msgIndex)(nil)
2023-03-11 14:49:07 +00:00
2023-03-11 17:11:08 +00:00
// headChange is one queued head change notification, exactly as received by
// onHeadChange. processHeadChanges handles rev before app.
type headChange struct {
	rev []*types.TipSet // tipsets to revert (their index rows are deleted)
	app []*types.TipSet // tipsets to apply (their messages are inserted)
}
2023-03-11 14:49:07 +00:00
2023-03-11 15:55:48 +00:00
func NewMsgIndex(basePath string, cs ChainStore) (MsgIndex, error) {
2023-03-11 14:49:07 +00:00
var (
mkdb bool
dbPath string
err error
)
if basePath == ":memory:" {
// for testing
mkdb = true
dbPath = basePath
goto opendb
}
err = os.MkdirAll(basePath, 0755)
if err != nil {
return nil, xerrors.Errorf("error creating msgindex base directory: %w", err)
}
dbPath = path.Join(basePath, dbName)
_, err = os.Stat(dbPath)
switch {
case errors.Is(err, fs.ErrNotExist):
mkdb = true
case err != nil:
return nil, xerrors.Errorf("error stating msgindex database: %w", err)
}
opendb:
db, err := sql.Open("sqlite3", dbPath)
if err != nil {
// TODO [nice to have]: automaticaly delete corrupt databases
// but for now we can just error and let the operator delete.
return nil, xerrors.Errorf("error opening msgindex database: %w", err)
}
if mkdb {
err = createTables(db)
if err != nil {
return nil, xerrors.Errorf("error creating msgindex database: %w", err)
}
} else {
err = reconcileIndex(db, cs)
if err != nil {
return nil, xerrors.Errorf("error reconciling msgindex database: %w", err)
}
}
2023-03-11 17:11:08 +00:00
ctx, cancel := context.WithCancel(context.Background())
msgIndex := &msgIndex{
db: db,
cs: cs,
sema: make(chan struct{}, 1),
cancel: cancel,
}
2023-03-11 14:49:07 +00:00
err = msgIndex.prepareStatements()
if err != nil {
err2 := db.Close()
if err2 != nil {
log.Errorf("error closing msgindex database: %s", err2)
}
return nil, xerrors.Errorf("error preparing msgindex database statements: %w", err)
}
rnf := store.WrapHeadChangeCoalescer(
msgIndex.onHeadChange,
coalesceMinDelay,
coalesceMaxDelay,
coalesceMergeInterval,
)
cs.SubscribeHeadChanges(rnf)
2023-03-11 17:11:08 +00:00
go msgIndex.background(ctx)
2023-03-11 14:49:07 +00:00
return msgIndex, nil
}
// init utilities
// createTables sets up the schema of a fresh index database and returns the
// error from executing the DDL, if any.
//
// There is just a single table for now; since this is an index, it is kept
// denormalized so that lookups need no joins.
func createTables(db *sql.DB) error {
	const schema = "CREATE TABLE Messages (cid VARCHAR(80) PRIMARY KEY, tipset VARCHAR(80), xepoch INTEGER, xindex INTEGER)"

	// TODO Should we add an index for tipset to speed up deletion on revert?
	_, err := db.Exec(schema)
	return err
}
2023-03-11 15:55:48 +00:00
func reconcileIndex(db *sql.DB, cs ChainStore) error {
2023-03-11 14:49:07 +00:00
// TODO
return errors.New("TODO: index.reconcileIndex")
}
func (x *msgIndex) prepareStatements() error {
2023-03-11 16:21:16 +00:00
stmt, err := x.db.Prepare("SELECT (tipset, xepoch, xindex) FROM Messages WHERE cid = ?")
if err != nil {
return err
}
x.selectMsgStmt = stmt
2023-03-11 17:11:08 +00:00
stmt, err = x.db.Prepare("INSERT INTO Messages VALUES (?, ?, ?, ?)")
if err != nil {
return err
}
x.insertMsgStmt = stmt
2023-03-11 16:21:16 +00:00
stmt, err = x.db.Prepare("DELETE FROM Messages WHERE tipset = ?")
if err != nil {
return err
}
x.deleteTipSetStmt = stmt
// TODO reconciliation stmts
return nil
2023-03-11 14:49:07 +00:00
}
// head change notifee
func (x *msgIndex) onHeadChange(rev, app []*types.TipSet) error {
2023-03-11 17:11:08 +00:00
// do it in the background to avoid blocking head change processing
x.mx.Lock()
x.pend = append(x.pend, headChange{rev: rev, app: app})
// TODO log loudly if this is building backlog (it shouldn't but better be safe on this)
x.mx.Unlock()
select {
case x.sema <- struct{}{}:
default:
}
return nil
}
// background is the body of the indexing goroutine. Each signal on x.sema
// triggers one processHeadChanges run; failures are logged and the loop keeps
// going. It returns once ctx is done.
func (x *msgIndex) background(ctx context.Context) {
	for {
		select {
		case <-ctx.Done():
			return

		case <-x.sema:
			if err := x.processHeadChanges(ctx); err != nil {
				// TODO should we shut down the index altogether? we just log for now.
				log.Errorf("error processing head change notifications: %s", err)
			}
		}
	}
}
func (x *msgIndex) processHeadChanges(ctx context.Context) error {
x.mx.Lock()
pend := x.pend
x.pend = nil
x.mx.Unlock()
txn, err := x.db.Begin()
if err != nil {
return xerrors.Errorf("error creating transaction: %w", err)
}
for _, hc := range pend {
for _, ts := range hc.rev {
if err := x.doRevert(ctx, ts); err != nil {
txn.Rollback()
return xerrors.Errorf("error reverting %s: %w", ts, err)
}
}
for _, ts := range hc.app {
if err := x.doApply(ctx, ts); err != nil {
txn.Rollback()
return xerrors.Errorf("error applying %s: %w", ts, err)
}
}
}
return txn.Commit()
}
func (x *msgIndex) doRevert(ctx context.Context, ts *types.TipSet) error {
tskey, err := ts.Key().Cid()
if err != nil {
return xerrors.Errorf("error computing tipset cid: %w", err)
}
key := tskey.String()
_, err = x.deleteTipSetStmt.Exec(key)
return err
}
func (x *msgIndex) doApply(ctx context.Context, ts *types.TipSet) error {
tscid, err := ts.Key().Cid()
if err != nil {
return xerrors.Errorf("error computing tipset cid: %w", err)
}
tskey := tscid.String()
xepoch := int64(ts.Height())
var xindex int64
seen := make(map[string]struct{})
insert := func(key string) error {
if _, ok := seen[key]; ok {
return nil
}
if _, err := x.insertMsgStmt.Exec(key, tskey, xepoch, xindex); err != nil {
return err
}
seen[key] = struct{}{}
xindex++
return nil
}
for _, blk := range ts.Blocks() {
bmsgs, smsgs, err := x.cs.MessagesForBlock(ctx, blk)
if err != nil {
return xerrors.Errorf("error retrieving messages for block %s in %s: %w", blk, ts, err)
}
for _, m := range bmsgs {
key := m.Cid().String()
if err := insert(key); err != nil {
return err
}
}
for _, m := range smsgs {
key := m.Cid().String()
if err := insert(key); err != nil {
return err
}
}
}
return nil
2023-03-11 14:49:07 +00:00
}
// interface
func (x *msgIndex) GetMsgInfo(ctx context.Context, m cid.Cid) (MsgInfo, error) {
2023-03-11 16:21:16 +00:00
var (
tipset string
epoch int64
index int64
)
key := m.String()
row := x.selectMsgStmt.QueryRow(key)
err := row.Scan(&tipset, &epoch, &index)
switch {
case err == sql.ErrNoRows:
return MsgInfo{}, ErrNotFound
case err != nil:
return MsgInfo{}, xerrors.Errorf("error querying msgindex database: %w", err)
}
tipsetCid, err := cid.Decode(tipset)
if err != nil {
return MsgInfo{}, xerrors.Errorf("error decoding tipset cid: %w", err)
}
return MsgInfo{
Message: m,
Tipset: tipsetCid,
Epoch: abi.ChainEpoch(epoch),
Index: int(index),
}, nil
2023-03-11 14:49:07 +00:00
}
// Close is not implemented yet: it always returns an error and releases
// nothing. In particular it neither calls x.cancel nor closes x.db, so the
// background goroutine and the database handle stay alive after it returns.
func (x *msgIndex) Close() error {
	// TODO
	return errors.New("TODO: msgIndex.Close")
}