2023-11-03 12:51:01 +00:00
package lpmessage
import (
2023-11-29 15:22:20 +00:00
"bytes"
2023-11-03 12:51:01 +00:00
"context"
2023-11-29 15:22:20 +00:00
"time"
2023-11-04 10:04:46 +00:00
"github.com/google/uuid"
"github.com/ipfs/go-cid"
logging "github.com/ipfs/go-log/v2"
2023-11-29 15:22:20 +00:00
"go.uber.org/multierr"
2023-11-04 10:04:46 +00:00
"golang.org/x/xerrors"
2023-11-03 12:51:01 +00:00
"github.com/filecoin-project/go-address"
"github.com/filecoin-project/go-state-types/big"
2023-11-04 10:04:46 +00:00
2023-11-03 12:51:01 +00:00
"github.com/filecoin-project/lotus/api"
"github.com/filecoin-project/lotus/chain/types"
"github.com/filecoin-project/lotus/lib/harmony/harmonydb"
2023-11-29 15:22:20 +00:00
"github.com/filecoin-project/lotus/lib/harmony/harmonytask"
"github.com/filecoin-project/lotus/lib/harmony/resources"
"github.com/filecoin-project/lotus/lib/promise"
2023-11-03 12:51:01 +00:00
)
2023-11-03 21:40:28 +00:00
var log = logging . Logger ( "lpmessage" )
2023-11-30 17:29:10 +00:00
var SendLockedWait = 100 * time . Millisecond
2023-11-03 12:51:01 +00:00
type SenderAPI interface {
StateAccountKey ( ctx context . Context , addr address . Address , tsk types . TipSetKey ) ( address . Address , error )
GasEstimateMessageGas ( ctx context . Context , msg * types . Message , spec * api . MessageSendSpec , tsk types . TipSetKey ) ( * types . Message , error )
WalletBalance ( ctx context . Context , addr address . Address ) ( big . Int , error )
MpoolGetNonce ( context . Context , address . Address ) ( uint64 , error )
2023-11-03 21:40:28 +00:00
MpoolPush ( context . Context , * types . SignedMessage ) ( cid . Cid , error )
2023-11-03 12:51:01 +00:00
}
type SignerAPI interface {
WalletSignMessage ( context . Context , address . Address , * types . Message ) ( * types . SignedMessage , error )
}
// Sender abstracts away highly-available message sending with coordination through
// HarmonyDB. It make sure that nonces are assigned transactionally, and that
2023-11-29 15:22:20 +00:00
// messages are correctly broadcasted to the network. It ensures that messages
// are sent serially, and that failures to send don't cause nonce gaps.
2023-11-03 12:51:01 +00:00
type Sender struct {
2023-11-29 15:22:20 +00:00
api SenderAPI
sendTask * SendTask
db * harmonydb . DB
}
type SendTask struct {
sendTF promise . Promise [ harmonytask . AddTaskFunc ]
2023-11-03 12:51:01 +00:00
api SenderAPI
signer SignerAPI
2023-11-21 00:05:59 +00:00
db * harmonydb . DB
2023-11-03 12:51:01 +00:00
}
2023-11-29 15:22:20 +00:00
func ( s * SendTask ) Do ( taskID harmonytask . TaskID , stillOwned func ( ) bool ) ( done bool , err error ) {
ctx := context . TODO ( )
// get message from db
var dbMsg struct {
FromKey string ` db:"from_key" `
ToAddr string ` db:"to_addr" `
UnsignedData [ ] byte ` db:"unsigned_data" `
UnsignedCid string ` db:"unsigned_cid" `
// may not be null if we have somehow already signed but failed to send this message
Nonce * uint64 ` db:"nonce" `
SignedData [ ] byte ` db:"signed_data" `
}
2023-12-05 19:45:08 +00:00
err = s . db . QueryRow ( ctx , `
SELECT from_key , nonce , to_addr , unsigned_data , unsigned_cid
FROM message_sends
WHERE send_task_id = $ 1 ` , taskID ) . Scan (
& dbMsg . FromKey , & dbMsg . Nonce , & dbMsg . ToAddr , & dbMsg . UnsignedData , & dbMsg . UnsignedCid )
2023-11-29 15:22:20 +00:00
if err != nil {
return false , xerrors . Errorf ( "getting message from db: %w" , err )
}
// deserialize the message
var msg types . Message
err = msg . UnmarshalCBOR ( bytes . NewReader ( dbMsg . UnsignedData ) )
if err != nil {
return false , xerrors . Errorf ( "unmarshaling unsigned db message: %w" , err )
}
// get db send lock
for {
// check if we still own the task
if ! stillOwned ( ) {
return false , xerrors . Errorf ( "lost ownership of task" )
}
// try to acquire lock
2023-12-05 19:45:08 +00:00
cn , err := s . db . Exec ( ctx , `
INSERT INTO message_send_locks ( from_key , task_id , claimed_at )
VALUES ( $ 1 , $ 2 , CURRENT_TIMESTAMP ) ON CONFLICT ( from_key ) DO UPDATE
SET task_id = EXCLUDED . task_id , claimed_at = CURRENT_TIMESTAMP
WHERE message_send_locks . task_id = $ 2 ; ` , dbMsg . FromKey , taskID )
2023-11-29 15:22:20 +00:00
if err != nil {
return false , xerrors . Errorf ( "acquiring send lock: %w" , err )
}
if cn == 1 {
// we got the lock
break
}
// we didn't get the lock, wait a bit and try again
log . Infow ( "waiting for send lock" , "task_id" , taskID , "from" , dbMsg . FromKey )
2023-11-30 17:29:10 +00:00
time . Sleep ( SendLockedWait )
2023-11-29 15:22:20 +00:00
}
// defer release db send lock
defer func ( ) {
2023-12-05 19:45:08 +00:00
_ , err2 := s . db . Exec ( ctx , `
DELETE from message_send_locks WHERE from_key = $ 1 AND task_id = $ 2 ` , dbMsg . FromKey , taskID )
2023-12-01 22:06:21 +00:00
if err2 != nil {
log . Errorw ( "releasing send lock" , "task_id" , taskID , "from" , dbMsg . FromKey , "error" , err2 )
2023-11-29 15:22:20 +00:00
// make sure harmony retries this task so that we eventually release this lock
done = false
2023-12-01 22:06:21 +00:00
err = multierr . Append ( err , xerrors . Errorf ( "releasing send lock: %w" , err2 ) )
2023-11-29 15:22:20 +00:00
}
} ( )
// assign nonce IF NOT ASSIGNED (max(api.MpoolGetNonce, db nonce+1))
var sigMsg * types . SignedMessage
if dbMsg . Nonce == nil {
msgNonce , err := s . api . MpoolGetNonce ( ctx , msg . From )
if err != nil {
return false , xerrors . Errorf ( "getting nonce from mpool: %w" , err )
}
// get nonce from db
var dbNonce * uint64
2023-12-05 19:45:08 +00:00
r := s . db . QueryRow ( ctx , `
SELECT MAX ( nonce ) FROM message_sends WHERE from_key = $ 1 AND send_success = true ` , msg . From . String ( ) )
2023-11-29 15:22:20 +00:00
if err := r . Scan ( & dbNonce ) ; err != nil {
return false , xerrors . Errorf ( "getting nonce from db: %w" , err )
}
if dbNonce != nil && * dbNonce + 1 > msgNonce {
msgNonce = * dbNonce + 1
}
msg . Nonce = msgNonce
// sign message
sigMsg , err = s . signer . WalletSignMessage ( ctx , msg . From , & msg )
if err != nil {
return false , xerrors . Errorf ( "signing message: %w" , err )
}
data , err := sigMsg . Serialize ( )
if err != nil {
return false , xerrors . Errorf ( "serializing message: %w" , err )
}
jsonBytes , err := sigMsg . MarshalJSON ( )
if err != nil {
return false , xerrors . Errorf ( "marshaling message: %w" , err )
}
// write to db
2023-12-05 19:45:08 +00:00
n , err := s . db . Exec ( ctx , `
UPDATE message_sends SET nonce = $ 1 , signed_data = $ 2 , signed_json = $ 3 , signed_cid = $ 4
WHERE send_task_id = $ 5 ` ,
2023-11-29 15:22:20 +00:00
msg . Nonce , data , string ( jsonBytes ) , sigMsg . Cid ( ) . String ( ) , taskID )
if err != nil {
return false , xerrors . Errorf ( "updating db record: %w" , err )
}
if n != 1 {
log . Errorw ( "updating db record: expected 1 row to be affected, got %d" , n )
return false , xerrors . Errorf ( "updating db record: expected 1 row to be affected, got %d" , n )
}
} else {
// Note: this handles an unlikely edge-case:
// We have previously signed the message but either failed to send it or failed to update the db
// note that when that happens the likely cause is the provider process losing its db connection
// or getting killed before it can update the db. In that case the message lock will still be held
// so it will be safe to rebroadcast the signed message
// deserialize the signed message
sigMsg = new ( types . SignedMessage )
err = sigMsg . UnmarshalCBOR ( bytes . NewReader ( dbMsg . SignedData ) )
if err != nil {
return false , xerrors . Errorf ( "unmarshaling signed db message: %w" , err )
}
}
// send!
_ , err = s . api . MpoolPush ( ctx , sigMsg )
// persist send result
var sendSuccess = err == nil
var sendError string
if err != nil {
sendError = err . Error ( )
}
2023-12-05 19:45:08 +00:00
_ , err = s . db . Exec ( ctx , `
UPDATE message_sends SET send_success = $ 1 , send_error = $ 2 , send_time = CURRENT_TIMESTAMP
WHERE send_task_id = $ 3 ` , sendSuccess , sendError , taskID )
2023-11-29 15:22:20 +00:00
if err != nil {
return false , xerrors . Errorf ( "updating db record: %w" , err )
}
return true , nil
}
func ( s * SendTask ) CanAccept ( ids [ ] harmonytask . TaskID , engine * harmonytask . TaskEngine ) ( * harmonytask . TaskID , error ) {
if len ( ids ) == 0 {
// probably can't happen, but panicking is bad
return nil , nil
}
if s . signer == nil {
// can't sign messages here
return nil , nil
}
return & ids [ 0 ] , nil
}
func ( s * SendTask ) TypeDetails ( ) harmonytask . TaskTypeDetails {
return harmonytask . TaskTypeDetails {
Max : 1024 ,
Name : "SendMessage" ,
Cost : resources . Resources {
Cpu : 0 ,
Gpu : 0 ,
Ram : 1 << 20 ,
} ,
MaxFailures : 1000 ,
Follows : nil ,
}
}
func ( s * SendTask ) Adder ( taskFunc harmonytask . AddTaskFunc ) {
s . sendTF . Set ( taskFunc )
}
var _ harmonytask . TaskInterface = & SendTask { }
2023-11-03 12:51:01 +00:00
// NewSender creates a new Sender.
2023-11-29 15:22:20 +00:00
func NewSender ( api SenderAPI , signer SignerAPI , db * harmonydb . DB ) ( * Sender , * SendTask ) {
st := & SendTask {
2023-11-03 12:51:01 +00:00
api : api ,
signer : signer ,
2023-11-17 00:22:03 +00:00
db : db ,
2023-11-03 12:51:01 +00:00
}
2023-11-29 15:22:20 +00:00
return & Sender {
api : api ,
db : db ,
sendTask : st ,
} , st
2023-11-03 12:51:01 +00:00
}
// Send atomically assigns a nonce, signs, and pushes a message
// to mempool.
// maxFee is only used when GasFeeCap/GasPremium fields aren't specified
//
// When maxFee is set to 0, Send will guess appropriate fee
// based on current chain conditions
//
// Send behaves much like fullnodeApi.MpoolPushMessage, but it coordinates
// through HarmonyDB, making it safe to broadcast messages from multiple independent
// API nodes
//
// Send is also currently more strict about required parameters than MpoolPushMessage
func ( s * Sender ) Send ( ctx context . Context , msg * types . Message , mss * api . MessageSendSpec , reason string ) ( cid . Cid , error ) {
if mss == nil {
return cid . Undef , xerrors . Errorf ( "MessageSendSpec cannot be nil" )
}
if ( mss . MsgUuid != uuid . UUID { } ) {
return cid . Undef , xerrors . Errorf ( "MessageSendSpec.MsgUuid must be zero" )
}
fromA , err := s . api . StateAccountKey ( ctx , msg . From , types . EmptyTSK )
if err != nil {
return cid . Undef , xerrors . Errorf ( "getting key address: %w" , err )
}
2023-11-04 11:32:27 +00:00
msg . From = fromA
2023-11-03 12:51:01 +00:00
if msg . Nonce != 0 {
return cid . Undef , xerrors . Errorf ( "Send expects message nonce to be 0, was %d" , msg . Nonce )
}
msg , err = s . api . GasEstimateMessageGas ( ctx , msg , mss , types . EmptyTSK )
if err != nil {
return cid . Undef , xerrors . Errorf ( "GasEstimateMessageGas error: %w" , err )
}
b , err := s . api . WalletBalance ( ctx , msg . From )
if err != nil {
return cid . Undef , xerrors . Errorf ( "mpool push: getting origin balance: %w" , err )
}
requiredFunds := big . Add ( msg . Value , msg . RequiredFunds ( ) )
if b . LessThan ( requiredFunds ) {
return cid . Undef , xerrors . Errorf ( "mpool push: not enough funds: %s < %s" , b , requiredFunds )
}
2023-11-29 15:22:20 +00:00
// push the task
taskAdder := s . sendTask . sendTF . Val ( ctx )
unsBytes := new ( bytes . Buffer )
err = msg . MarshalCBOR ( unsBytes )
if err != nil {
return cid . Undef , xerrors . Errorf ( "marshaling message: %w" , err )
}
2023-11-03 12:51:01 +00:00
2023-12-06 19:53:50 +00:00
var sendTaskID * harmonytask . TaskID
2023-11-29 15:22:20 +00:00
taskAdder ( func ( id harmonytask . TaskID , tx * harmonydb . Tx ) ( shouldCommit bool , seriousError error ) {
_ , err := tx . Exec ( ` insert into message_sends (from_key, to_addr, send_reason, unsigned_data, unsigned_cid, send_task_id) values ($1, $2, $3, $4, $5, $6) ` ,
msg . From . String ( ) , msg . To . String ( ) , reason , unsBytes . Bytes ( ) , msg . Cid ( ) . String ( ) , id )
2023-11-03 12:51:01 +00:00
if err != nil {
2023-11-29 15:22:20 +00:00
return false , xerrors . Errorf ( "inserting message into db: %w" , err )
2023-11-03 12:51:01 +00:00
}
2023-12-06 19:53:50 +00:00
sendTaskID = & id
2023-11-29 15:22:20 +00:00
return true , nil
} )
2023-11-03 12:51:01 +00:00
2023-12-06 19:53:50 +00:00
if sendTaskID == nil {
return cid . Undef , xerrors . Errorf ( "failed to add task" )
}
2023-11-29 15:22:20 +00:00
// wait for exec
var (
pollInterval = 50 * time . Millisecond
pollIntervalMul = 2
maxPollInterval = 5 * time . Second
pollLoops = 0
sigCid cid . Cid
sendErr error
)
for {
var err error
2023-12-06 21:54:46 +00:00
var sigCidStr , sendError * string
2023-11-29 15:22:20 +00:00
var sendSuccess * bool
2023-11-03 12:51:01 +00:00
2023-12-06 19:53:50 +00:00
err = s . db . QueryRow ( ctx , ` select signed_cid, send_success, send_error from message_sends where send_task_id = $1 ` , & sendTaskID ) . Scan ( & sigCidStr , & sendSuccess , & sendError )
2023-11-03 12:51:01 +00:00
if err != nil {
2023-11-29 15:22:20 +00:00
return cid . Undef , xerrors . Errorf ( "getting cid for task: %w" , err )
2023-11-03 12:51:01 +00:00
}
2023-11-29 15:22:20 +00:00
if sendSuccess == nil {
2023-11-30 17:29:10 +00:00
time . Sleep ( pollInterval )
pollLoops ++
pollInterval *= time . Duration ( pollIntervalMul )
if pollInterval > maxPollInterval {
pollInterval = maxPollInterval
}
2023-11-29 15:22:20 +00:00
continue
2023-11-03 12:51:01 +00:00
}
2023-12-06 21:54:46 +00:00
if sigCidStr == nil || sendError == nil {
// should never happen because sendSuccess is already not null here
return cid . Undef , xerrors . Errorf ( "got null values for sigCidStr or sendError, this should never happen" )
}
2023-11-29 15:22:20 +00:00
if ! * sendSuccess {
2023-12-06 22:00:53 +00:00
sendErr = xerrors . Errorf ( "send error: %s" , * sendError )
2023-11-29 15:22:20 +00:00
} else {
2023-12-06 22:00:53 +00:00
sigCid , err = cid . Parse ( * sigCidStr )
2023-11-29 15:22:20 +00:00
if err != nil {
return cid . Undef , xerrors . Errorf ( "parsing signed cid: %w" , err )
}
2023-11-03 12:51:01 +00:00
}
2023-11-29 15:22:20 +00:00
break
2023-11-03 12:51:01 +00:00
}
2024-02-11 13:14:42 +00:00
log . Infow ( "sent message" , "cid" , sigCid , "task_id" , sendTaskID , "send_error" , sendErr , "poll_loops" , pollLoops )
2023-11-03 21:40:28 +00:00
2023-11-29 15:22:20 +00:00
return sigCid , sendErr
2023-11-03 12:51:01 +00:00
}