2019-11-21 14:10:51 +00:00
|
|
|
package main
|
2019-11-21 00:52:59 +00:00
|
|
|
|
|
|
|
import (
|
2020-03-13 01:37:38 +00:00
|
|
|
"context"
|
2020-03-16 18:46:02 +00:00
|
|
|
"encoding/json"
|
2020-06-17 15:23:07 +00:00
|
|
|
"fmt"
|
2020-03-16 18:46:02 +00:00
|
|
|
"io/ioutil"
|
2020-03-16 17:50:07 +00:00
|
|
|
"net"
|
2020-03-13 01:37:38 +00:00
|
|
|
"net/http"
|
2019-11-21 00:52:59 +00:00
|
|
|
"os"
|
2020-03-16 18:46:02 +00:00
|
|
|
"path/filepath"
|
2020-07-23 03:01:50 +00:00
|
|
|
"strings"
|
2020-06-17 15:23:07 +00:00
|
|
|
"time"
|
2019-12-06 00:27:32 +00:00
|
|
|
|
2020-03-16 18:46:02 +00:00
|
|
|
"github.com/google/uuid"
|
2020-09-14 07:44:55 +00:00
|
|
|
"github.com/ipfs/go-datastore/namespace"
|
2020-01-08 19:10:57 +00:00
|
|
|
logging "github.com/ipfs/go-log/v2"
|
2020-08-30 18:28:58 +00:00
|
|
|
manet "github.com/multiformats/go-multiaddr/net"
|
2020-06-02 18:12:53 +00:00
|
|
|
"github.com/urfave/cli/v2"
|
2020-10-21 08:37:50 +00:00
|
|
|
"go.opencensus.io/stats/view"
|
|
|
|
"go.opencensus.io/tag"
|
2020-06-05 22:59:01 +00:00
|
|
|
"golang.org/x/xerrors"
|
2019-11-21 00:52:59 +00:00
|
|
|
|
2020-05-20 18:23:51 +00:00
|
|
|
"github.com/filecoin-project/go-jsonrpc/auth"
|
2020-03-11 01:57:52 +00:00
|
|
|
paramfetch "github.com/filecoin-project/go-paramfetch"
|
2020-09-14 07:44:55 +00:00
|
|
|
"github.com/filecoin-project/go-statestore"
|
2020-03-23 11:40:02 +00:00
|
|
|
|
2020-03-11 01:57:52 +00:00
|
|
|
"github.com/filecoin-project/lotus/api"
|
2019-11-21 00:52:59 +00:00
|
|
|
"github.com/filecoin-project/lotus/build"
|
2020-03-11 01:57:52 +00:00
|
|
|
lcli "github.com/filecoin-project/lotus/cli"
|
2021-03-05 20:08:14 +00:00
|
|
|
cliutil "github.com/filecoin-project/lotus/cli/util"
|
2022-03-24 22:37:01 +00:00
|
|
|
"github.com/filecoin-project/lotus/cmd/lotus-worker/sealworker"
|
2020-08-17 13:39:33 +00:00
|
|
|
sectorstorage "github.com/filecoin-project/lotus/extern/sector-storage"
|
2020-08-17 13:26:18 +00:00
|
|
|
"github.com/filecoin-project/lotus/extern/sector-storage/sealtasks"
|
|
|
|
"github.com/filecoin-project/lotus/extern/sector-storage/stores"
|
2022-01-18 10:57:04 +00:00
|
|
|
"github.com/filecoin-project/lotus/extern/sector-storage/storiface"
|
2020-01-08 13:49:34 +00:00
|
|
|
"github.com/filecoin-project/lotus/lib/lotuslog"
|
2022-03-28 22:07:54 +00:00
|
|
|
"github.com/filecoin-project/lotus/lib/ulimit"
|
2020-10-21 08:37:50 +00:00
|
|
|
"github.com/filecoin-project/lotus/metrics"
|
2020-09-14 07:44:55 +00:00
|
|
|
"github.com/filecoin-project/lotus/node/modules"
|
2019-12-09 12:36:56 +00:00
|
|
|
"github.com/filecoin-project/lotus/node/repo"
|
2019-11-21 00:52:59 +00:00
|
|
|
)
|
|
|
|
|
|
|
|
var log = logging.Logger("main")
|
|
|
|
|
2020-07-09 03:04:45 +00:00
|
|
|
const FlagWorkerRepo = "worker-repo"
|
2020-07-17 13:18:40 +00:00
|
|
|
|
2020-07-10 12:18:09 +00:00
|
|
|
// TODO remove after deprecation period
|
|
|
|
const FlagWorkerRepoDeprecation = "workerrepo"
|
2020-03-13 01:37:38 +00:00
|
|
|
|
2019-11-21 00:52:59 +00:00
|
|
|
func main() {
|
2021-03-05 21:01:20 +00:00
|
|
|
api.RunningNodeType = api.NodeWorker
|
2020-09-08 18:54:37 +00:00
|
|
|
|
2020-01-08 13:49:34 +00:00
|
|
|
lotuslog.SetupLogLevels()
|
2019-11-21 00:52:59 +00:00
|
|
|
|
|
|
|
local := []*cli.Command{
|
|
|
|
runCmd,
|
2020-08-30 18:28:58 +00:00
|
|
|
infoCmd,
|
|
|
|
storageCmd,
|
2020-10-27 16:28:44 +00:00
|
|
|
setCmd,
|
|
|
|
waitQuietCmd,
|
2021-11-29 15:11:04 +00:00
|
|
|
resourcesCmd,
|
2020-11-26 16:33:22 +00:00
|
|
|
tasksCmd,
|
2019-11-21 00:52:59 +00:00
|
|
|
}
|
|
|
|
|
|
|
|
app := &cli.App{
|
2021-05-24 07:00:47 +00:00
|
|
|
Name: "lotus-worker",
|
|
|
|
Usage: "Remote miner worker",
|
|
|
|
Version: build.UserVersion(),
|
|
|
|
EnableBashCompletion: true,
|
2019-11-21 00:52:59 +00:00
|
|
|
Flags: []cli.Flag{
|
|
|
|
&cli.StringFlag{
|
2020-07-08 10:38:59 +00:00
|
|
|
Name: FlagWorkerRepo,
|
2020-07-10 12:18:09 +00:00
|
|
|
Aliases: []string{FlagWorkerRepoDeprecation},
|
|
|
|
EnvVars: []string{"LOTUS_WORKER_PATH", "WORKER_PATH"},
|
2019-11-21 00:52:59 +00:00
|
|
|
Value: "~/.lotusworker", // TODO: Consider XDG_DATA_HOME
|
2020-07-10 12:18:09 +00:00
|
|
|
Usage: fmt.Sprintf("Specify worker repo path. flag %s and env WORKER_PATH are DEPRECATION, will REMOVE SOON", FlagWorkerRepoDeprecation),
|
2019-11-21 00:52:59 +00:00
|
|
|
},
|
2021-09-17 22:01:54 +00:00
|
|
|
&cli.StringFlag{
|
|
|
|
Name: "panic-reports",
|
|
|
|
EnvVars: []string{"LOTUS_PANIC_REPORT_PATH"},
|
|
|
|
Hidden: true,
|
2021-09-30 13:06:55 +00:00
|
|
|
Value: "~/.lotusworker", // should follow --repo default
|
2021-09-17 22:01:54 +00:00
|
|
|
},
|
2019-11-21 00:52:59 +00:00
|
|
|
&cli.StringFlag{
|
2020-07-08 10:38:59 +00:00
|
|
|
Name: "miner-repo",
|
2020-07-10 12:18:09 +00:00
|
|
|
Aliases: []string{"storagerepo"},
|
|
|
|
EnvVars: []string{"LOTUS_MINER_PATH", "LOTUS_STORAGE_PATH"},
|
2020-07-08 10:38:59 +00:00
|
|
|
Value: "~/.lotusminer", // TODO: Consider XDG_DATA_HOME
|
2020-07-10 12:18:09 +00:00
|
|
|
Usage: fmt.Sprintf("Specify miner repo path. flag storagerepo and env LOTUS_STORAGE_PATH are DEPRECATION, will REMOVE SOON"),
|
2019-11-21 00:52:59 +00:00
|
|
|
},
|
2019-12-07 14:19:46 +00:00
|
|
|
&cli.BoolFlag{
|
|
|
|
Name: "enable-gpu-proving",
|
|
|
|
Usage: "enable use of GPU for mining operations",
|
|
|
|
Value: true,
|
|
|
|
},
|
2019-11-21 00:52:59 +00:00
|
|
|
},
|
|
|
|
|
2021-09-17 22:01:54 +00:00
|
|
|
After: func(c *cli.Context) error {
|
|
|
|
if r := recover(); r != nil {
|
|
|
|
// Generate report in LOTUS_PATH and re-raise panic
|
|
|
|
build.GeneratePanicReport(c.String("panic-reports"), c.String(FlagWorkerRepo), c.App.Name)
|
|
|
|
panic(r)
|
|
|
|
}
|
|
|
|
return nil
|
|
|
|
},
|
2019-11-21 00:52:59 +00:00
|
|
|
Commands: local,
|
|
|
|
}
|
2019-12-09 12:36:56 +00:00
|
|
|
app.Setup()
|
2020-03-25 21:15:10 +00:00
|
|
|
app.Metadata["repoType"] = repo.Worker
|
2019-11-21 00:52:59 +00:00
|
|
|
|
|
|
|
if err := app.Run(os.Args); err != nil {
|
2019-11-21 18:38:43 +00:00
|
|
|
log.Warnf("%+v", err)
|
2019-11-21 00:52:59 +00:00
|
|
|
return
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
var runCmd = &cli.Command{
|
|
|
|
Name: "run",
|
2019-11-21 14:10:51 +00:00
|
|
|
Usage: "Start lotus worker",
|
2020-03-16 17:50:07 +00:00
|
|
|
Flags: []cli.Flag{
|
|
|
|
&cli.StringFlag{
|
2020-08-06 00:54:00 +00:00
|
|
|
Name: "listen",
|
|
|
|
Usage: "host address and port the worker api will listen on",
|
2020-07-24 15:07:31 +00:00
|
|
|
Value: "0.0.0.0:3456",
|
2020-03-16 17:50:07 +00:00
|
|
|
},
|
2020-08-06 00:54:00 +00:00
|
|
|
&cli.StringFlag{
|
|
|
|
Name: "address",
|
|
|
|
Hidden: true,
|
|
|
|
},
|
2020-03-16 18:46:02 +00:00
|
|
|
&cli.BoolFlag{
|
|
|
|
Name: "no-local-storage",
|
|
|
|
Usage: "don't use storageminer repo for sector storage",
|
|
|
|
},
|
2020-09-30 06:23:35 +00:00
|
|
|
&cli.BoolFlag{
|
|
|
|
Name: "no-swap",
|
|
|
|
Usage: "don't use swap",
|
|
|
|
Value: false,
|
|
|
|
},
|
2020-08-14 14:06:53 +00:00
|
|
|
&cli.BoolFlag{
|
|
|
|
Name: "addpiece",
|
|
|
|
Usage: "enable addpiece",
|
|
|
|
Value: true,
|
|
|
|
},
|
2020-03-25 21:15:10 +00:00
|
|
|
&cli.BoolFlag{
|
|
|
|
Name: "precommit1",
|
|
|
|
Usage: "enable precommit1 (32G sectors: 1 core, 128GiB Memory)",
|
|
|
|
Value: true,
|
|
|
|
},
|
2020-08-04 12:32:09 +00:00
|
|
|
&cli.BoolFlag{
|
|
|
|
Name: "unseal",
|
|
|
|
Usage: "enable unsealing (32G sectors: 1 core, 128GiB Memory)",
|
|
|
|
Value: true,
|
|
|
|
},
|
2020-03-25 21:15:10 +00:00
|
|
|
&cli.BoolFlag{
|
|
|
|
Name: "precommit2",
|
|
|
|
Usage: "enable precommit2 (32G sectors: all cores, 96GiB Memory)",
|
|
|
|
Value: true,
|
|
|
|
},
|
|
|
|
&cli.BoolFlag{
|
|
|
|
Name: "commit",
|
|
|
|
Usage: "enable commit (32G sectors: all cores or GPUs, 128GiB Memory + 64GiB swap)",
|
|
|
|
Value: true,
|
|
|
|
},
|
2021-12-08 17:11:19 +00:00
|
|
|
&cli.BoolFlag{
|
|
|
|
Name: "replica-update",
|
|
|
|
Usage: "enable replica update",
|
|
|
|
Value: true,
|
|
|
|
},
|
|
|
|
&cli.BoolFlag{
|
|
|
|
Name: "prove-replica-update2",
|
|
|
|
Usage: "enable prove replica update 2",
|
|
|
|
Value: true,
|
|
|
|
},
|
2022-02-14 18:28:49 +00:00
|
|
|
&cli.BoolFlag{
|
|
|
|
Name: "regen-sector-key",
|
|
|
|
Usage: "enable regen sector key",
|
|
|
|
Value: true,
|
|
|
|
},
|
2021-07-27 03:15:53 +00:00
|
|
|
&cli.BoolFlag{
|
|
|
|
Name: "windowpost",
|
|
|
|
Usage: "enable window post",
|
|
|
|
Value: false,
|
|
|
|
},
|
|
|
|
|
|
|
|
&cli.BoolFlag{
|
|
|
|
Name: "winningpost",
|
|
|
|
Usage: "enable winning post",
|
|
|
|
Value: false,
|
|
|
|
},
|
2022-01-14 13:11:04 +00:00
|
|
|
&cli.IntFlag{
|
|
|
|
Name: "parallel-fetch-limit",
|
|
|
|
Usage: "maximum fetch operations to run in parallel",
|
|
|
|
Value: 5,
|
|
|
|
},
|
2022-03-24 23:42:44 +00:00
|
|
|
&cli.IntFlag{
|
|
|
|
Name: "post-parallel-reads",
|
|
|
|
Usage: "maximum number of parallel challenge reads (0 = no limit)",
|
2022-03-29 17:22:58 +00:00
|
|
|
Value: 128,
|
2022-03-24 23:42:44 +00:00
|
|
|
},
|
|
|
|
&cli.DurationFlag{
|
|
|
|
Name: "post-read-timeout",
|
|
|
|
Usage: "time limit for reading PoSt challenges (0 = no limit)",
|
|
|
|
Value: 0,
|
|
|
|
},
|
2022-01-14 13:11:04 +00:00
|
|
|
&cli.StringFlag{
|
|
|
|
Name: "timeout",
|
|
|
|
Usage: "used when 'listen' is unspecified. must be a valid duration recognized by golang's time.ParseDuration function",
|
|
|
|
Value: "30m",
|
|
|
|
},
|
2020-03-16 17:50:07 +00:00
|
|
|
},
|
2020-08-06 00:54:00 +00:00
|
|
|
Before: func(cctx *cli.Context) error {
|
|
|
|
if cctx.IsSet("address") {
|
|
|
|
log.Warnf("The '--address' flag is deprecated, it has been replaced by '--listen'")
|
|
|
|
if err := cctx.Set("listen", cctx.String("address")); err != nil {
|
|
|
|
return err
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
return nil
|
|
|
|
},
|
2019-11-21 00:52:59 +00:00
|
|
|
Action: func(cctx *cli.Context) error {
|
2020-08-30 18:28:58 +00:00
|
|
|
log.Info("Starting lotus worker")
|
|
|
|
|
2020-03-11 01:57:52 +00:00
|
|
|
if !cctx.Bool("enable-gpu-proving") {
|
2020-05-27 20:53:20 +00:00
|
|
|
if err := os.Setenv("BELLMAN_NO_GPU", "true"); err != nil {
|
|
|
|
return xerrors.Errorf("could not set no-gpu env: %+v", err)
|
|
|
|
}
|
2020-03-11 01:57:52 +00:00
|
|
|
}
|
|
|
|
|
2022-03-28 22:07:54 +00:00
|
|
|
limit, _, err := ulimit.GetLimit()
|
|
|
|
switch {
|
|
|
|
case err == ulimit.ErrUnsupported:
|
|
|
|
log.Errorw("checking file descriptor limit failed", "error", err)
|
|
|
|
case err != nil:
|
|
|
|
return xerrors.Errorf("checking fd limit: %w", err)
|
|
|
|
default:
|
|
|
|
if limit < build.MinerFDLimit {
|
|
|
|
return xerrors.Errorf("soft file descriptor limit (ulimit -n) too low, want %d, current %d", build.MinerFDLimit, limit)
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
2020-03-16 17:50:07 +00:00
|
|
|
// Connect to storage-miner
|
2020-10-18 17:53:23 +00:00
|
|
|
ctx := lcli.ReqContext(cctx)
|
|
|
|
|
2020-06-17 15:23:07 +00:00
|
|
|
var nodeApi api.StorageMiner
|
|
|
|
var closer func()
|
|
|
|
for {
|
2021-03-05 20:08:14 +00:00
|
|
|
nodeApi, closer, err = lcli.GetStorageMinerAPI(cctx, cliutil.StorageMinerUseHttp)
|
2020-06-17 15:23:07 +00:00
|
|
|
if err == nil {
|
2020-10-18 17:53:23 +00:00
|
|
|
_, err = nodeApi.Version(ctx)
|
|
|
|
if err == nil {
|
|
|
|
break
|
|
|
|
}
|
2020-06-17 15:23:07 +00:00
|
|
|
}
|
|
|
|
fmt.Printf("\r\x1b[0KConnecting to miner API... (%s)", err)
|
|
|
|
time.Sleep(time.Second)
|
|
|
|
continue
|
2020-03-11 01:57:52 +00:00
|
|
|
}
|
2020-06-17 15:43:16 +00:00
|
|
|
|
2020-03-11 01:57:52 +00:00
|
|
|
defer closer()
|
2020-03-18 23:23:28 +00:00
|
|
|
ctx, cancel := context.WithCancel(ctx)
|
|
|
|
defer cancel()
|
2020-03-11 01:57:52 +00:00
|
|
|
|
2020-10-21 08:37:50 +00:00
|
|
|
// Register all metric views
|
|
|
|
if err := view.Register(
|
|
|
|
metrics.DefaultViews...,
|
|
|
|
); err != nil {
|
|
|
|
log.Fatalf("Cannot register the view: %v", err)
|
|
|
|
}
|
|
|
|
|
2020-03-11 01:57:52 +00:00
|
|
|
v, err := nodeApi.Version(ctx)
|
|
|
|
if err != nil {
|
|
|
|
return err
|
|
|
|
}
|
2021-04-15 22:19:26 +00:00
|
|
|
if v.APIVersion != api.MinerAPIVersion0 {
|
|
|
|
return xerrors.Errorf("lotus-miner API version doesn't match: expected: %s", api.APIVersion{APIVersion: api.MinerAPIVersion0})
|
2020-03-11 01:57:52 +00:00
|
|
|
}
|
2020-03-13 01:37:38 +00:00
|
|
|
log.Infof("Remote version %s", v)
|
2020-03-11 01:57:52 +00:00
|
|
|
|
2020-03-16 17:50:07 +00:00
|
|
|
// Check params
|
|
|
|
|
2020-03-11 01:57:52 +00:00
|
|
|
act, err := nodeApi.ActorAddress(ctx)
|
|
|
|
if err != nil {
|
|
|
|
return err
|
|
|
|
}
|
|
|
|
ssize, err := nodeApi.ActorSectorSize(ctx, act)
|
|
|
|
if err != nil {
|
|
|
|
return err
|
|
|
|
}
|
|
|
|
|
2020-03-25 21:15:10 +00:00
|
|
|
if cctx.Bool("commit") {
|
2021-03-10 15:16:44 +00:00
|
|
|
if err := paramfetch.GetParams(ctx, build.ParametersJSON(), build.SrsJSON(), uint64(ssize)); err != nil {
|
2020-03-25 21:15:10 +00:00
|
|
|
return xerrors.Errorf("get params: %w", err)
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
var taskTypes []sealtasks.TaskType
|
2022-03-24 22:28:45 +00:00
|
|
|
var workerType string
|
2020-03-25 21:15:10 +00:00
|
|
|
|
2022-01-14 13:11:04 +00:00
|
|
|
if cctx.Bool("windowpost") {
|
2022-03-24 22:28:45 +00:00
|
|
|
workerType = sealtasks.WorkerWindowPoSt
|
2022-01-14 13:11:04 +00:00
|
|
|
taskTypes = append(taskTypes, sealtasks.TTGenerateWindowPoSt)
|
|
|
|
}
|
|
|
|
if cctx.Bool("winningpost") {
|
2022-03-24 22:28:45 +00:00
|
|
|
workerType = sealtasks.WorkerWinningPoSt
|
2022-01-14 13:11:04 +00:00
|
|
|
taskTypes = append(taskTypes, sealtasks.TTGenerateWinningPoSt)
|
|
|
|
}
|
|
|
|
|
2022-03-24 22:28:45 +00:00
|
|
|
if workerType == "" {
|
|
|
|
workerType = sealtasks.WorkerSealing
|
2022-03-09 15:27:03 +00:00
|
|
|
taskTypes = append(taskTypes, sealtasks.TTFetch, sealtasks.TTCommit1, sealtasks.TTProveReplicaUpdate1, sealtasks.TTFinalize, sealtasks.TTFinalizeReplicaUpdate)
|
2022-01-14 13:11:04 +00:00
|
|
|
}
|
2020-04-28 10:57:24 +00:00
|
|
|
|
2022-03-26 20:26:19 +00:00
|
|
|
if (workerType == sealtasks.WorkerSealing || cctx.IsSet("addpiece")) && cctx.Bool("addpiece") {
|
2022-04-26 16:22:52 +00:00
|
|
|
taskTypes = append(taskTypes, sealtasks.TTAddPiece, sealtasks.TTDataCid)
|
2020-08-14 14:06:53 +00:00
|
|
|
}
|
2022-03-26 20:26:19 +00:00
|
|
|
if (workerType == sealtasks.WorkerSealing || cctx.IsSet("precommit1")) && cctx.Bool("precommit1") {
|
2020-03-25 21:15:10 +00:00
|
|
|
taskTypes = append(taskTypes, sealtasks.TTPreCommit1)
|
|
|
|
}
|
2022-03-26 20:26:19 +00:00
|
|
|
if (workerType == sealtasks.WorkerSealing || cctx.IsSet("unseal")) && cctx.Bool("unseal") {
|
2020-08-04 12:32:09 +00:00
|
|
|
taskTypes = append(taskTypes, sealtasks.TTUnseal)
|
|
|
|
}
|
2022-03-26 20:26:19 +00:00
|
|
|
if (workerType == sealtasks.WorkerSealing || cctx.IsSet("precommit2")) && cctx.Bool("precommit2") {
|
2020-03-25 21:15:10 +00:00
|
|
|
taskTypes = append(taskTypes, sealtasks.TTPreCommit2)
|
|
|
|
}
|
2022-03-26 20:26:19 +00:00
|
|
|
if (workerType == sealtasks.WorkerSealing || cctx.IsSet("commit")) && cctx.Bool("commit") {
|
2020-03-25 21:15:10 +00:00
|
|
|
taskTypes = append(taskTypes, sealtasks.TTCommit2)
|
|
|
|
}
|
2022-03-26 20:26:19 +00:00
|
|
|
if (workerType == sealtasks.WorkerSealing || cctx.IsSet("replica-update")) && cctx.Bool("replica-update") {
|
2021-12-08 17:11:19 +00:00
|
|
|
taskTypes = append(taskTypes, sealtasks.TTReplicaUpdate)
|
|
|
|
}
|
2022-03-26 20:26:19 +00:00
|
|
|
if (workerType == sealtasks.WorkerSealing || cctx.IsSet("prove-replica-update2")) && cctx.Bool("prove-replica-update2") {
|
2021-12-08 17:11:19 +00:00
|
|
|
taskTypes = append(taskTypes, sealtasks.TTProveReplicaUpdate2)
|
|
|
|
}
|
2022-03-26 20:26:19 +00:00
|
|
|
if (workerType == sealtasks.WorkerSealing || cctx.IsSet("regen-sector-key")) && cctx.Bool("regen-sector-key") {
|
2022-02-14 18:28:49 +00:00
|
|
|
taskTypes = append(taskTypes, sealtasks.TTRegenSectorKey)
|
|
|
|
}
|
2020-03-25 21:15:10 +00:00
|
|
|
|
|
|
|
if len(taskTypes) == 0 {
|
|
|
|
return xerrors.Errorf("no task types specified")
|
2020-03-11 01:57:52 +00:00
|
|
|
}
|
2022-03-24 22:28:45 +00:00
|
|
|
for _, taskType := range taskTypes {
|
|
|
|
if taskType.WorkerType() != workerType {
|
|
|
|
return xerrors.Errorf("expected all task types to be for %s worker, but task %s is for %s worker", workerType, taskType, taskType.WorkerType())
|
|
|
|
}
|
2022-01-14 13:11:04 +00:00
|
|
|
}
|
2020-03-11 01:57:52 +00:00
|
|
|
|
2020-03-16 17:50:07 +00:00
|
|
|
// Open repo
|
|
|
|
|
2020-07-08 10:38:59 +00:00
|
|
|
repoPath := cctx.String(FlagWorkerRepo)
|
2020-03-13 01:37:38 +00:00
|
|
|
r, err := repo.NewFS(repoPath)
|
|
|
|
if err != nil {
|
|
|
|
return err
|
|
|
|
}
|
|
|
|
|
|
|
|
ok, err := r.Exists()
|
|
|
|
if err != nil {
|
|
|
|
return err
|
|
|
|
}
|
|
|
|
if !ok {
|
2020-03-16 18:46:02 +00:00
|
|
|
if err := r.Init(repo.Worker); err != nil {
|
|
|
|
return err
|
|
|
|
}
|
|
|
|
|
|
|
|
lr, err := r.Lock(repo.Worker)
|
|
|
|
if err != nil {
|
|
|
|
return err
|
|
|
|
}
|
|
|
|
|
2020-03-27 20:08:06 +00:00
|
|
|
var localPaths []stores.LocalPath
|
2020-03-16 18:46:02 +00:00
|
|
|
|
|
|
|
if !cctx.Bool("no-local-storage") {
|
2020-03-19 15:10:19 +00:00
|
|
|
b, err := json.MarshalIndent(&stores.LocalStorageMeta{
|
2022-01-18 10:57:04 +00:00
|
|
|
ID: storiface.ID(uuid.New().String()),
|
2020-03-16 18:46:02 +00:00
|
|
|
Weight: 10,
|
|
|
|
CanSeal: true,
|
|
|
|
CanStore: false,
|
|
|
|
}, "", " ")
|
|
|
|
if err != nil {
|
|
|
|
return xerrors.Errorf("marshaling storage config: %w", err)
|
|
|
|
}
|
|
|
|
|
|
|
|
if err := ioutil.WriteFile(filepath.Join(lr.Path(), "sectorstore.json"), b, 0644); err != nil {
|
|
|
|
return xerrors.Errorf("persisting storage metadata (%s): %w", filepath.Join(lr.Path(), "sectorstore.json"), err)
|
|
|
|
}
|
|
|
|
|
2020-03-27 20:08:06 +00:00
|
|
|
localPaths = append(localPaths, stores.LocalPath{
|
2020-03-16 18:46:02 +00:00
|
|
|
Path: lr.Path(),
|
|
|
|
})
|
|
|
|
}
|
|
|
|
|
2020-03-27 20:08:06 +00:00
|
|
|
if err := lr.SetStorage(func(sc *stores.StorageConfig) {
|
2020-03-16 18:46:02 +00:00
|
|
|
sc.StoragePaths = append(sc.StoragePaths, localPaths...)
|
|
|
|
}); err != nil {
|
|
|
|
return xerrors.Errorf("set storage config: %w", err)
|
|
|
|
}
|
|
|
|
|
2020-03-18 23:23:28 +00:00
|
|
|
{
|
|
|
|
// init datastore for r.Exists
|
2021-01-26 10:25:34 +00:00
|
|
|
_, err := lr.Datastore(context.Background(), "/metadata")
|
2020-03-18 23:23:28 +00:00
|
|
|
if err != nil {
|
|
|
|
return err
|
|
|
|
}
|
|
|
|
}
|
2020-03-16 18:46:02 +00:00
|
|
|
if err := lr.Close(); err != nil {
|
|
|
|
return xerrors.Errorf("close repo: %w", err)
|
|
|
|
}
|
2020-03-13 01:37:38 +00:00
|
|
|
}
|
|
|
|
|
|
|
|
lr, err := r.Lock(repo.Worker)
|
|
|
|
if err != nil {
|
|
|
|
return err
|
|
|
|
}
|
2020-09-23 14:12:15 +00:00
|
|
|
defer func() {
|
|
|
|
if err := lr.Close(); err != nil {
|
|
|
|
log.Error("closing repo", err)
|
|
|
|
}
|
|
|
|
}()
|
2021-01-26 10:25:34 +00:00
|
|
|
ds, err := lr.Datastore(context.Background(), "/metadata")
|
2020-09-23 14:12:15 +00:00
|
|
|
if err != nil {
|
|
|
|
return err
|
|
|
|
}
|
2020-03-13 01:37:38 +00:00
|
|
|
|
2020-03-19 15:10:19 +00:00
|
|
|
log.Info("Opening local storage; connecting to master")
|
2020-07-23 19:29:23 +00:00
|
|
|
const unspecifiedAddress = "0.0.0.0"
|
2020-08-06 00:54:00 +00:00
|
|
|
address := cctx.String("listen")
|
2020-07-23 19:29:23 +00:00
|
|
|
addressSlice := strings.Split(address, ":")
|
|
|
|
if ip := net.ParseIP(addressSlice[0]); ip != nil {
|
|
|
|
if ip.String() == unspecifiedAddress {
|
|
|
|
timeout, err := time.ParseDuration(cctx.String("timeout"))
|
|
|
|
if err != nil {
|
|
|
|
return err
|
|
|
|
}
|
|
|
|
rip, err := extractRoutableIP(timeout)
|
|
|
|
if err != nil {
|
|
|
|
return err
|
|
|
|
}
|
|
|
|
address = rip + ":" + addressSlice[1]
|
|
|
|
}
|
|
|
|
}
|
2020-03-19 15:10:19 +00:00
|
|
|
|
2020-07-23 03:01:50 +00:00
|
|
|
localStore, err := stores.NewLocal(ctx, lr, nodeApi, []string{"http://" + address + "/remote"})
|
2020-03-13 01:37:38 +00:00
|
|
|
if err != nil {
|
|
|
|
return err
|
|
|
|
}
|
|
|
|
|
2020-03-16 17:50:07 +00:00
|
|
|
// Setup remote sector store
|
2020-03-13 01:37:38 +00:00
|
|
|
sminfo, err := lcli.GetAPIInfo(cctx, repo.StorageMiner)
|
|
|
|
if err != nil {
|
|
|
|
return xerrors.Errorf("could not get api info: %w", err)
|
|
|
|
}
|
|
|
|
|
2021-05-20 11:01:25 +00:00
|
|
|
remote := stores.NewRemote(localStore, nodeApi, sminfo.AuthHeader(), cctx.Int("parallel-fetch-limit"),
|
|
|
|
&stores.DefaultPartialFileHandler{})
|
2020-03-13 01:37:38 +00:00
|
|
|
|
2021-05-19 13:50:48 +00:00
|
|
|
fh := &stores.FetchHandler{Local: localStore, PfHandler: &stores.DefaultPartialFileHandler{}}
|
2020-11-25 16:05:45 +00:00
|
|
|
remoteHandler := func(w http.ResponseWriter, r *http.Request) {
|
2021-03-25 14:09:50 +00:00
|
|
|
if !auth.HasPerm(r.Context(), nil, api.PermAdmin) {
|
2020-11-25 16:05:45 +00:00
|
|
|
w.WriteHeader(401)
|
|
|
|
_ = json.NewEncoder(w).Encode(struct{ Error string }{"unauthorized: missing admin permission"})
|
|
|
|
return
|
|
|
|
}
|
|
|
|
|
|
|
|
fh.ServeHTTP(w, r)
|
|
|
|
}
|
|
|
|
|
2020-03-16 17:50:07 +00:00
|
|
|
// Create / expose the worker
|
|
|
|
|
2020-09-23 14:12:15 +00:00
|
|
|
wsts := statestore.New(namespace.Wrap(ds, modules.WorkerCallsPrefix))
|
2020-09-14 07:44:55 +00:00
|
|
|
|
2022-01-14 13:11:04 +00:00
|
|
|
workerApi := &sealworker.Worker{
|
2020-03-23 11:40:02 +00:00
|
|
|
LocalWorker: sectorstorage.NewLocalWorker(sectorstorage.WorkerConfig{
|
2022-03-24 23:42:44 +00:00
|
|
|
TaskTypes: taskTypes,
|
|
|
|
NoSwap: cctx.Bool("no-swap"),
|
|
|
|
MaxParallelChallengeReads: cctx.Int("post-parallel-reads"),
|
|
|
|
ChallengeReadTimeout: cctx.Duration("post-read-timeout"),
|
2020-09-14 07:44:55 +00:00
|
|
|
}, remote, localStore, nodeApi, nodeApi, wsts),
|
2022-01-14 13:11:04 +00:00
|
|
|
LocalStore: localStore,
|
|
|
|
Storage: lr,
|
2020-03-13 01:37:38 +00:00
|
|
|
}
|
|
|
|
|
2020-07-23 03:01:50 +00:00
|
|
|
log.Info("Setting up control endpoint at " + address)
|
2020-03-18 04:40:25 +00:00
|
|
|
|
2020-03-18 23:23:28 +00:00
|
|
|
srv := &http.Server{
|
2022-01-14 13:11:04 +00:00
|
|
|
Handler: sealworker.WorkerHandler(nodeApi.AuthVerify, remoteHandler, workerApi, true),
|
2020-03-18 23:23:28 +00:00
|
|
|
BaseContext: func(listener net.Listener) context.Context {
|
2020-10-21 08:37:50 +00:00
|
|
|
ctx, _ := tag.New(context.Background(), tag.Upsert(metrics.APIInterface, "lotus-worker"))
|
2020-03-18 23:23:28 +00:00
|
|
|
return ctx
|
|
|
|
},
|
|
|
|
}
|
2020-03-13 01:37:38 +00:00
|
|
|
|
|
|
|
go func() {
|
2020-03-18 04:40:25 +00:00
|
|
|
<-ctx.Done()
|
2020-06-02 19:30:45 +00:00
|
|
|
log.Warn("Shutting down...")
|
2020-03-13 01:37:38 +00:00
|
|
|
if err := srv.Shutdown(context.TODO()); err != nil {
|
|
|
|
log.Errorf("shutting down RPC server failed: %s", err)
|
|
|
|
}
|
|
|
|
log.Warn("Graceful shutdown successful")
|
|
|
|
}()
|
2020-03-16 17:50:07 +00:00
|
|
|
|
2020-07-23 03:01:50 +00:00
|
|
|
nl, err := net.Listen("tcp", address)
|
2020-03-16 17:50:07 +00:00
|
|
|
if err != nil {
|
|
|
|
return err
|
|
|
|
}
|
|
|
|
|
2020-08-30 18:28:58 +00:00
|
|
|
{
|
|
|
|
a, err := net.ResolveTCPAddr("tcp", address)
|
|
|
|
if err != nil {
|
|
|
|
return xerrors.Errorf("parsing address: %w", err)
|
|
|
|
}
|
|
|
|
|
|
|
|
ma, err := manet.FromNetAddr(a)
|
|
|
|
if err != nil {
|
|
|
|
return xerrors.Errorf("creating api multiaddress: %w", err)
|
|
|
|
}
|
|
|
|
|
|
|
|
if err := lr.SetAPIEndpoint(ma); err != nil {
|
|
|
|
return xerrors.Errorf("setting api endpoint: %w", err)
|
|
|
|
}
|
|
|
|
|
|
|
|
ainfo, err := lcli.GetAPIInfo(cctx, repo.StorageMiner)
|
|
|
|
if err != nil {
|
|
|
|
return xerrors.Errorf("could not get miner API info: %w", err)
|
|
|
|
}
|
|
|
|
|
|
|
|
// TODO: ideally this would be a token with some permissions dropped
|
|
|
|
if err := lr.SetAPIToken(ainfo.Token); err != nil {
|
|
|
|
return xerrors.Errorf("setting api token: %w", err)
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
2020-10-18 15:56:29 +00:00
|
|
|
minerSession, err := nodeApi.Session(ctx)
|
|
|
|
if err != nil {
|
|
|
|
return xerrors.Errorf("getting miner session: %w", err)
|
|
|
|
}
|
|
|
|
|
2020-10-30 17:00:48 +00:00
|
|
|
waitQuietCh := func() chan struct{} {
|
|
|
|
out := make(chan struct{})
|
|
|
|
go func() {
|
|
|
|
workerApi.LocalWorker.WaitQuiet()
|
|
|
|
close(out)
|
|
|
|
}()
|
|
|
|
return out
|
|
|
|
}
|
|
|
|
|
2020-03-18 23:23:28 +00:00
|
|
|
go func() {
|
2020-10-18 15:56:29 +00:00
|
|
|
heartbeats := time.NewTicker(stores.HeartbeatInterval)
|
|
|
|
defer heartbeats.Stop()
|
|
|
|
|
2020-10-30 17:00:48 +00:00
|
|
|
var redeclareStorage bool
|
|
|
|
var readyCh chan struct{}
|
2020-09-22 16:36:44 +00:00
|
|
|
for {
|
2020-10-18 15:56:29 +00:00
|
|
|
// If we're reconnecting, redeclare storage first
|
2020-10-30 17:00:48 +00:00
|
|
|
if redeclareStorage {
|
2020-09-28 19:11:25 +00:00
|
|
|
log.Info("Redeclaring local storage")
|
|
|
|
|
2020-09-28 19:06:49 +00:00
|
|
|
if err := localStore.Redeclare(ctx); err != nil {
|
|
|
|
log.Errorf("Redeclaring local storage failed: %+v", err)
|
2020-10-18 15:56:29 +00:00
|
|
|
|
|
|
|
select {
|
|
|
|
case <-ctx.Done():
|
|
|
|
return // graceful shutdown
|
|
|
|
case <-heartbeats.C:
|
|
|
|
}
|
|
|
|
continue
|
2020-09-28 19:06:49 +00:00
|
|
|
}
|
|
|
|
}
|
|
|
|
|
2020-09-28 19:11:25 +00:00
|
|
|
// TODO: we could get rid of this, but that requires tracking resources for restarted tasks correctly
|
2020-10-30 17:00:48 +00:00
|
|
|
if readyCh == nil {
|
|
|
|
log.Info("Making sure no local tasks are running")
|
|
|
|
readyCh = waitQuietCh()
|
|
|
|
}
|
2020-09-28 19:11:25 +00:00
|
|
|
|
2020-10-18 15:56:29 +00:00
|
|
|
for {
|
|
|
|
curSession, err := nodeApi.Session(ctx)
|
|
|
|
if err != nil {
|
|
|
|
log.Errorf("heartbeat: checking remote session failed: %+v", err)
|
|
|
|
} else {
|
|
|
|
if curSession != minerSession {
|
|
|
|
minerSession = curSession
|
|
|
|
break
|
|
|
|
}
|
|
|
|
}
|
2020-06-17 15:43:16 +00:00
|
|
|
|
2020-10-18 15:56:29 +00:00
|
|
|
select {
|
2020-10-30 17:00:48 +00:00
|
|
|
case <-readyCh:
|
|
|
|
if err := nodeApi.WorkerConnect(ctx, "http://"+address+"/rpc/v0"); err != nil {
|
|
|
|
log.Errorf("Registering worker failed: %+v", err)
|
|
|
|
cancel()
|
|
|
|
return
|
|
|
|
}
|
|
|
|
|
|
|
|
log.Info("Worker registered successfully, waiting for tasks")
|
|
|
|
|
|
|
|
readyCh = nil
|
|
|
|
case <-heartbeats.C:
|
2020-10-18 15:56:29 +00:00
|
|
|
case <-ctx.Done():
|
|
|
|
return // graceful shutdown
|
|
|
|
}
|
2020-09-22 16:36:44 +00:00
|
|
|
}
|
2020-06-17 15:43:16 +00:00
|
|
|
|
2020-09-22 16:36:44 +00:00
|
|
|
log.Errorf("LOTUS-MINER CONNECTION LOST")
|
2020-09-28 19:06:49 +00:00
|
|
|
|
2020-10-30 17:00:48 +00:00
|
|
|
redeclareStorage = true
|
2020-09-22 16:36:44 +00:00
|
|
|
}
|
|
|
|
}()
|
|
|
|
|
|
|
|
return srv.Serve(nl)
|
|
|
|
},
|
2020-06-17 15:43:16 +00:00
|
|
|
}
|
2020-07-23 03:01:50 +00:00
|
|
|
|
2020-07-23 19:29:23 +00:00
|
|
|
func extractRoutableIP(timeout time.Duration) (string, error) {
|
2020-07-23 03:01:50 +00:00
|
|
|
minerMultiAddrKey := "MINER_API_INFO"
|
|
|
|
deprecatedMinerMultiAddrKey := "STORAGE_API_INFO"
|
|
|
|
env, ok := os.LookupEnv(minerMultiAddrKey)
|
|
|
|
if !ok {
|
|
|
|
// TODO remove after deprecation period
|
2020-08-20 04:49:10 +00:00
|
|
|
_, ok = os.LookupEnv(deprecatedMinerMultiAddrKey)
|
2020-07-23 03:01:50 +00:00
|
|
|
if ok {
|
2020-07-23 19:29:23 +00:00
|
|
|
log.Warnf("Using a deprecated env(%s) value, please use env(%s) instead.", deprecatedMinerMultiAddrKey, minerMultiAddrKey)
|
2020-07-23 03:01:50 +00:00
|
|
|
}
|
|
|
|
return "", xerrors.New("MINER_API_INFO environment variable required to extract IP")
|
|
|
|
}
|
|
|
|
minerAddr := strings.Split(env, "/")
|
2020-07-23 19:29:23 +00:00
|
|
|
conn, err := net.DialTimeout("tcp", minerAddr[2]+":"+minerAddr[4], timeout)
|
2020-07-23 03:01:50 +00:00
|
|
|
if err != nil {
|
|
|
|
return "", err
|
|
|
|
}
|
2020-08-20 04:49:10 +00:00
|
|
|
defer conn.Close() //nolint:errcheck
|
2020-07-23 03:01:50 +00:00
|
|
|
|
|
|
|
localAddr := conn.LocalAddr().(*net.TCPAddr)
|
|
|
|
|
|
|
|
return strings.Split(localAddr.IP.String(), ":")[0], nil
|
|
|
|
}
|