package sealer

import (
	"sync"

	"github.com/filecoin-project/lotus/storage/sealer/sealtasks"
	"github.com/filecoin-project/lotus/storage/sealer/storiface"
)
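
// ActiveResources tracks the resources currently committed to tasks on a
// worker: memory, CPU threads, GPU utilization, and per-task-type counts.
// It also lets callers block until enough resources become free.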
type ActiveResources struct {
	memUsedMin uint64
	memUsedMax uint64
	gpuUsed    float64
	cpuUse     uint64

	taskCounters *taskCounter

	cond    *sync.Cond
	waiting int
}
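
// taskCounter tracks the number of in-flight tasks of each seal task type.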
type taskCounter struct {
	taskCounters map[sealtasks.SealTaskType]int

	// this lock is technically redundant, as ActiveResources is always accessed
	// with the worker lock, but let's not panic if we ever change that
	lk sync.Mutex
}

func newTaskCounter() *taskCounter {
	return &taskCounter{
		taskCounters: map[sealtasks.SealTaskType]int{},
	}
}

func (tc *taskCounter) Add(tt sealtasks.SealTaskType) {
	tc.lk.Lock()
	defer tc.lk.Unlock()
	tc.taskCounters[tt]++
}

func (tc *taskCounter) Free(tt sealtasks.SealTaskType) {
	tc.lk.Lock()
	defer tc.lk.Unlock()
	tc.taskCounters[tt]--
}

func (tc *taskCounter) Get(tt sealtasks.SealTaskType) int {
	tc.lk.Lock()
	defer tc.lk.Unlock()
	return tc.taskCounters[tt]
}

func (tc *taskCounter) Sum() int {
	tc.lk.Lock()
	defer tc.lk.Unlock()
	sum := 0
	for _, v := range tc.taskCounters {
		sum += v
	}
	return sum
}

func (tc *taskCounter) ForEach(cb func(tt sealtasks.SealTaskType, count int)) {
	tc.lk.Lock()
	defer tc.lk.Unlock()
	for tt, count := range tc.taskCounters {
		cb(tt, count)
	}
}
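
// NewActiveResources creates a resource tracker backed by the given task
// counter. Passing the same counter to multiple trackers makes them share
// per-task-type concurrency counts.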
func NewActiveResources(tc *taskCounter) *ActiveResources {
	return &ActiveResources{
		taskCounters: tc,
	}
}
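
// withResources blocks until the worker has enough free resources to run the
// given task, reserves them, runs cb, and then releases them. locker must be
// the lock protecting this ActiveResources, and the caller must hold it when
// calling; it backs the condition variable used while waiting.
//
// A minimal usage sketch (all names other than withResources and
// sealtasks.TTPreCommit1 are hypothetical):
//
//	err := active.withResources(wid, workerInfo, sealtasks.TTPreCommit1, needRes, &schedLk, func() error {
//		return runTask() // executes while the resources are reserved
//	})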
func (a *ActiveResources) withResources(id storiface.WorkerID, wr storiface.WorkerInfo, tt sealtasks.SealTaskType, r storiface.Resources, locker sync.Locker, cb func() error) error {
	for !a.CanHandleRequest(tt, r, id, "withResources", wr) {
		if a.cond == nil {
			a.cond = sync.NewCond(locker)
		}
		a.waiting++
		a.cond.Wait()
		a.waiting--
	}

	a.Add(tt, wr.Resources, r)

	err := cb()

	a.Free(tt, wr.Resources, r)

	return err
}

// must be called with the same lock as the one passed to withResources
func (a *ActiveResources) hasWorkWaiting() bool {
	return a.waiting > 0
}

// Add adds task resources to ActiveResources and returns the utilization difference
func (a *ActiveResources) Add(tt sealtasks.SealTaskType, wr storiface.WorkerResources, r storiface.Resources) float64 {
	startUtil := a.utilization(wr)

	if r.GPUUtilization > 0 {
		a.gpuUsed += r.GPUUtilization
	}
	a.cpuUse += r.Threads(wr.CPUs, len(wr.GPUs))
	a.memUsedMin += r.MinMemory
	a.memUsedMax += r.MaxMemory
	a.taskCounters.Add(tt)

	return a.utilization(wr) - startUtil
}
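
// Free releases the resources previously committed with Add and wakes up any
// goroutines blocked in withResources.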
func (a *ActiveResources) Free(tt sealtasks.SealTaskType, wr storiface.WorkerResources, r storiface.Resources) {
	if r.GPUUtilization > 0 {
		a.gpuUsed -= r.GPUUtilization
	}
	a.cpuUse -= r.Threads(wr.CPUs, len(wr.GPUs))
	a.memUsedMin -= r.MinMemory
	a.memUsedMax -= r.MaxMemory
	a.taskCounters.Free(tt)

	if a.cond != nil {
		a.cond.Broadcast()
	}
}

// CanHandleRequest evaluates if the worker has enough available resources to
// handle the request.
func (a *ActiveResources) CanHandleRequest(tt sealtasks.SealTaskType, needRes storiface.Resources, wid storiface.WorkerID, caller string, info storiface.WorkerInfo) bool {
	if needRes.MaxConcurrent > 0 {
		if a.taskCounters.Get(tt) >= needRes.MaxConcurrent {
			log.Debugf("sched: not scheduling on worker %s for %s; at task limit tt=%s, curcount=%d", wid, caller, tt, a.taskCounters.Get(tt))
			return false
		}
	}

	if info.IgnoreResources {
		// short-circuit; if this worker is ignoring resources, it can always handle the request
		return true
	}

	res := info.Resources

	// TODO: dedupe needRes.BaseMinMemory per task type (don't add if that task is already running)
	memNeeded := needRes.MinMemory + needRes.BaseMinMemory
	memUsed := a.memUsedMin
	// assume that MemUsed can be swapped, so only check it in the vmem check
	memAvail := res.MemPhysical - memUsed
	if memNeeded > memAvail {
		log.Debugf("sched: not scheduling on worker %s for %s; not enough physical memory - need: %dM, have %dM available", wid, caller, memNeeded/mib, memAvail/mib)
		return false
	}

	vmemNeeded := needRes.MaxMemory + needRes.BaseMinMemory
	vmemUsed := a.memUsedMax
	workerMemoryReserved := res.MemUsed + res.MemSwapUsed // memory used outside lotus-worker (used by the OS, etc.)

	if vmemUsed < workerMemoryReserved {
		vmemUsed = workerMemoryReserved
	}
	vmemAvail := (res.MemPhysical + res.MemSwap) - vmemUsed

	if vmemNeeded > vmemAvail {
		log.Debugf("sched: not scheduling on worker %s for %s; not enough virtual memory - need: %dM, have %dM available", wid, caller, vmemNeeded/mib, vmemAvail/mib)
		return false
	}

	if a.cpuUse+needRes.Threads(res.CPUs, len(res.GPUs)) > res.CPUs {
		log.Debugf("sched: not scheduling on worker %s for %s; not enough threads, need %d, %d in use, target %d", wid, caller, needRes.Threads(res.CPUs, len(res.GPUs)), a.cpuUse, res.CPUs)
		return false
	}

	if len(res.GPUs) > 0 && needRes.GPUUtilization > 0 {
		if a.gpuUsed+needRes.GPUUtilization > float64(len(res.GPUs)) {
			log.Debugf("sched: not scheduling on worker %s for %s; GPU(s) in use", wid, caller)
			return false
		}
	}

	return true
}

// utilization returns a number in the 0..1 range indicating the fraction of used resources
func (a *ActiveResources) utilization(wr storiface.WorkerResources) float64 { // todo task type
	var max float64

	cpu := float64(a.cpuUse) / float64(wr.CPUs)
	max = cpu

	memUsed := a.memUsedMin
	if memUsed < wr.MemUsed {
		memUsed = wr.MemUsed
	}
	memMin := float64(memUsed) / float64(wr.MemPhysical)
	if memMin > max {
		max = memMin
	}

	vmemUsed := a.memUsedMax
	if a.memUsedMax < wr.MemUsed+wr.MemSwapUsed {
		vmemUsed = wr.MemUsed + wr.MemSwapUsed
	}
	memMax := float64(vmemUsed) / float64(wr.MemPhysical+wr.MemSwap)
	if memMax > max {
		max = memMax
	}

	if len(wr.GPUs) > 0 {
		gpuMax := a.gpuUsed / float64(len(wr.GPUs))
		if gpuMax > max {
			max = gpuMax
		}
	}

	return max
}
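
// taskCount returns how many tasks of the given type are tracked here; a nil
// task type means the total across all types.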
func (a *ActiveResources) taskCount(tt *sealtasks.SealTaskType) int {
	// nil means all tasks
	if tt == nil {
		return a.taskCounters.Sum()
	}

	return a.taskCounters.Get(*tt)
}
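
// Utilization returns the aggregate resource utilization of this worker,
// summing the active, preparing, and queued (assigned-window) allocations,
// so the result can exceed 1 when work is queued up.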
func (wh *WorkerHandle) Utilization() float64 {
	wh.lk.Lock()
	u := wh.active.utilization(wh.Info.Resources)
	u += wh.preparing.utilization(wh.Info.Resources)
	wh.lk.Unlock()

	wh.wndLk.Lock()
	for _, window := range wh.activeWindows {
		u += window.Allocated.utilization(wh.Info.Resources)
	}
	wh.wndLk.Unlock()

	return u
}
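
// TaskCounts returns the total number of tasks on this worker, across the
// active, preparing, and queued (assigned-window) sets.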
func (wh *WorkerHandle) TaskCounts() int {
	wh.lk.Lock()
	u := wh.active.taskCount(nil)
	u += wh.preparing.taskCount(nil)
	wh.lk.Unlock()

	wh.wndLk.Lock()
	for _, window := range wh.activeWindows {
		u += window.Allocated.taskCount(nil)
	}
	wh.wndLk.Unlock()

	return u
}

func (wh *WorkerHandle) TaskCount(tt *sealtasks.SealTaskType) int {
	wh.lk.Lock()
	u := wh.active.taskCount(tt)
	u += wh.preparing.taskCount(tt)
	wh.lk.Unlock()

	wh.wndLk.Lock()
	for _, window := range wh.activeWindows {
		u += window.Allocated.taskCount(tt)
	}
	wh.wndLk.Unlock()

	return u
}