safing-portmaster/spn/docks/op_capacity.go
Daniel Hååvi 80664d1a27
Restructure modules ()
* Move portbase into monorepo

* Add new simple module mgr

* [WIP] Switch to new simple module mgr

* Add StateMgr and more worker variants

* [WIP] Switch more modules

* [WIP] Switch more modules

* [WIP] switch more modules

* [WIP] switch all SPN modules

* [WIP] switch all service modules

* [WIP] Convert all workers to the new module system

* [WIP] add new task system to module manager

* [WIP] Add second take for scheduling workers

* [WIP] Add FIXME for bugs in new scheduler

* [WIP] Add minor improvements to scheduler

* [WIP] Add new worker scheduler

* [WIP] Fix more bugs related to new module system

* [WIP] Fix start handling of the new module system

* [WIP] Improve startup process

* [WIP] Fix minor issues

* [WIP] Fix missing subsystem in settings

* [WIP] Initialize managers in constructor

* [WIP] Move module event initialization to constructors

* [WIP] Fix setting for enabling and disabling the SPN module

* [WIP] Move API registration into module construction

* [WIP] Update states mgr for all modules

* [WIP] Add CmdLine operation support

* Add state helper methods to module group and instance

* Add notification and module status handling to status package

* Fix starting issues

* Remove pilot widget and update security lock to new status data

* Remove debug logs

* Improve http server shutdown

* Add workaround for cleanly shutting down firewall+netquery

* Improve logging

* Add syncing states with notifications for new module system

* Improve starting, stopping, shutdown; resolve FIXMEs/TODOs

* [WIP] Fix most unit tests

* Review new module system and fix minor issues

* Push shutdown and restart events again via API

* Set sleep mode via interface

* Update example/template module

* [WIP] Fix spn/cabin unit test

* Remove deprecated UI elements

* Make log output more similar for the logging transition phase

* Switch spn hub and observer cmds to new module system

* Fix log sources

* Make worker mgr less error prone

* Fix tests and minor issues

* Fix observation hub

* Improve shutdown and restart handling

* Split up big connection.go source file

* Move varint and dsd packages to structures repo

* Improve expansion test

* Fix linter warnings

* Fix interception module on windows

* Fix linter errors

---------

Co-authored-by: Vladimir Stoilov <vladimir@safing.io>
2024-08-09 18:15:48 +03:00

356 lines
9.3 KiB
Go

package docks
import (
"bytes"
"sync/atomic"
"time"
"github.com/tevino/abool"
"github.com/safing/portmaster/base/log"
"github.com/safing/portmaster/service/mgr"
"github.com/safing/portmaster/spn/terminal"
"github.com/safing/structures/container"
"github.com/safing/structures/dsd"
)
const (
// CapacityTestOpType is the type ID of the capacity test operation.
CapacityTestOpType = "capacity"
// defaultCapacityTestVolume is the test volume used when NewCapacityTestOp
// is called without options.
defaultCapacityTestVolume = 50000000 // 50MB
// maxCapacityTestVolume is the largest test volume that
// startCapacityTestOp accepts from a request.
maxCapacityTestVolume = 100000000 // 100MB
// defaultCapacityTestMaxTime is the max test time used when
// NewCapacityTestOp is called without options.
defaultCapacityTestMaxTime = 5 * time.Second
// maxCapacityTestMaxTime is the longest max test time that
// startCapacityTestOp accepts from a request.
maxCapacityTestMaxTime = 15 * time.Second
// capacityTestTimeout is the overall time limit of the handler worker,
// after which the operation ends with a timeout error.
capacityTestTimeout = 30 * time.Second
// capacityTestMsgSize is the size in bytes of the data chunk that the
// sender transmits repeatedly.
capacityTestMsgSize = 1000
// capacityTestSendTimeout is the timeout passed to every Send call of the
// operation.
capacityTestSendTimeout = 1000 * time.Millisecond
)
var (
// capacityTestSendData is the (zeroed) payload of every test data message.
capacityTestSendData = make([]byte, capacityTestMsgSize)
// capacityTestDataReceivedSignal is sent once the full test volume was
// received and is recognized by the handler on the receiving side.
capacityTestDataReceivedSignal = []byte("ACK")
// capacityTestRunning is the package-wide flag that is used to allow only
// one capacity test at a time.
capacityTestRunning = abool.New()
)
// CapacityTestOp is used for capacity test operations.
// Both sides of the operation use this type: each side sends test data and
// counts what it receives.
type CapacityTestOp struct { //nolint:maligned
terminal.OperationBase
// opts holds the options the test runs with.
opts *CapacityTestOptions
// started is set by the handler when the first message is received.
started bool
// startTime is recorded together with started and is the reference for
// the capacity calculation.
startTime time.Time
// senderStarted guards against starting the sender worker twice.
senderStarted bool
// recvQueue is filled by Deliver and consumed by the handler.
recvQueue chan *terminal.Msg
// dataReceived counts the received data (as reported by msg.Data.Length()).
dataReceived int
// dataReceivedAckWasAckd is set after this side has sent the data received
// signal.
dataReceivedAckWasAckd bool
// dataSent counts the sent data; it is accessed atomically, as both the
// handler and the sender update it.
dataSent *int64
// dataSentWasAckd is set when the data received signal of the other side
// arrives.
dataSentWasAckd *abool.AtomicBool
// testResult is the measured capacity in bit/s, as calculated by
// reportMeasuredCapacity.
testResult int
// result receives the end error in HandleStop and is exposed via Result.
result chan *terminal.Error
}
// CapacityTestOptions holds options for the capacity test.
// The options are serialized and sent to the other side as the request of
// the operation.
type CapacityTestOptions struct {
// TestVolume is the amount of data after which a side stops sending and
// after which the receiving side sends the data received signal.
TestVolume int
// MaxTime is the time after the first received message at which the
// handler ends the test and reports the capacity measured so far.
MaxTime time.Duration
// testing makes NewCapacityTestOp skip the check for an already running
// test. NOTE(review): unexported, so presumably not serialized - confirm.
testing bool
}
// Type reports the type ID under which the capacity test operation is
// registered.
func (op *CapacityTestOp) Type() string {
	const typeID = CapacityTestOpType
	return typeID
}
// init registers the capacity test operation with the terminal package, so
// that incoming requests of this type are started by startCapacityTestOp.
func init() {
	factory := terminal.OperationFactory{
		Type:     CapacityTestOpType,
		Requires: terminal.IsCraneController,
		Start:    startCapacityTestOp,
	}
	terminal.RegisterOpType(factory)
}
// NewCapacityTestOp runs a capacity test.
//
// If opts is nil, the default test volume and max time are used. Unless the
// options are marked as testing, only one capacity test may run at a time and
// ErrTryAgainLater is returned if another one is already in progress.
//
// On success, the request has been sent on the given terminal and the handler
// worker has been started. Use Result() to wait for the end of the operation.
func NewCapacityTestOp(t terminal.Terminal, opts *CapacityTestOptions) (*CapacityTestOp, *terminal.Error) {
	// Check options.
	if opts == nil {
		opts = &CapacityTestOptions{
			TestVolume: defaultCapacityTestVolume,
			MaxTime:    defaultCapacityTestMaxTime,
		}
	}

	// Check if another test is already running.
	// In testing mode the global flag is not claimed, so it must not be
	// released on failure either - it might belong to another test.
	// NOTE(review): the handler worker still clears the flag unconditionally
	// when it ends.
	flagClaimed := false
	if !opts.testing {
		if !capacityTestRunning.SetToIf(false, true) {
			return nil, terminal.ErrTryAgainLater.With("another capacity op is already running")
		}
		flagClaimed = true
	}
	releaseFlag := func() {
		if flagClaimed {
			capacityTestRunning.UnSet()
		}
	}

	// Create and init.
	op := &CapacityTestOp{
		opts:            opts,
		recvQueue:       make(chan *terminal.Msg),
		dataSent:        new(int64),
		dataSentWasAckd: abool.New(),
		result:          make(chan *terminal.Error, 1),
	}

	// Make capacity test request.
	request, err := dsd.Dump(op.opts, dsd.CBOR)
	if err != nil {
		releaseFlag()
		return nil, terminal.ErrInternalError.With("failed to serialize capacity test options: %w", err)
	}

	// Send test request.
	tErr := t.StartOperation(op, container.New(request), 1*time.Second)
	if tErr != nil {
		releaseFlag()
		return nil, tErr
	}

	// Start handler.
	// The sender is started by the handler when the first message arrives.
	module.mgr.Go("op capacity handler", op.handler)

	return op, nil
}
// startCapacityTestOp starts a capacity test operation for an incoming
// request. It claims the global capacity test flag, parses and checks the
// requested options and then starts both the handler and the sender worker.
// The flag is released again if the request is rejected.
// NOTE(review): only upper limits are checked; zero or negative values are
// accepted as is.
func startCapacityTestOp(t terminal.Terminal, opID uint32, data *container.Container) (terminal.Operation, *terminal.Error) {
	// Only one capacity test may run at a time.
	if !capacityTestRunning.SetToIf(false, true) {
		return nil, terminal.ErrTryAgainLater.With("another capacity op is already running")
	}

	// reject releases the claimed flag and passes on the given error.
	reject := func(reason *terminal.Error) (terminal.Operation, *terminal.Error) {
		capacityTestRunning.UnSet()
		return nil, reason
	}

	// Decode the requested options.
	requested := &CapacityTestOptions{}
	if _, err := dsd.Load(data.CompileData(), requested); err != nil {
		return reject(terminal.ErrMalformedData.With("failed to parse options: %w", err))
	}

	// Enforce the limits.
	switch {
	case requested.TestVolume > maxCapacityTestVolume:
		return reject(terminal.ErrInvalidOptions.With("maximum volume exceeded"))
	case requested.MaxTime > maxCapacityTestMaxTime:
		return reject(terminal.ErrInvalidOptions.With("maximum maxtime exceeded"))
	}

	// Build the operation and bind it to the terminal.
	newOp := &CapacityTestOp{
		opts:            requested,
		recvQueue:       make(chan *terminal.Msg, 1000),
		dataSent:        new(int64),
		dataSentWasAckd: abool.New(),
		result:          make(chan *terminal.Error, 1),
	}
	newOp.InitOperationBase(t, opID)

	// This side starts sending right away, so mark the sender as started to
	// keep the handler from starting a second one.
	newOp.senderStarted = true
	module.mgr.Go("op capacity handler", newOp.handler)
	module.mgr.Go("op capacity sender", newOp.sender)

	return newOp, nil
}
// handler is the main worker of the capacity test operation. It consumes the
// messages queued by Deliver until the test is complete, the max test time or
// the operation timeout is reached, or the worker context is canceled.
//
// When it returns, it releases the global capacity test flag and stops the
// operation with the resulting error. The returned worker error is always
// nil, as the outcome is passed to op.Stop instead.
func (op *CapacityTestOp) handler(ctx *mgr.WorkerCtx) error {
	defer capacityTestRunning.UnSet()

	returnErr := terminal.ErrStopping
	defer func() {
		// Linters don't get that returnErr is used when directly used as defer.
		op.Stop(op, returnErr)
	}()

	// The max test time only starts counting when the first message arrives,
	// until then the nil channel blocks forever.
	var maxTestTimeReached <-chan time.Time
	opTimeout := time.After(capacityTestTimeout)

	// Setup unit handling.
	// The deferred call must be a closure: a plain `defer msg.Finish()`
	// evaluates the receiver right here, while msg is still nil, and would
	// never finish the message that is being handled when returning.
	var msg *terminal.Msg
	defer func() {
		msg.Finish()
	}()

	// Handle receives.
	for {
		// Finish the message of the previous iteration and forget it, so that
		// it is not finished a second time when returning.
		msg.Finish()
		msg = nil

		select {
		case <-ctx.Done():
			returnErr = terminal.ErrCanceled
			return nil

		case <-opTimeout:
			returnErr = terminal.ErrTimeout
			return nil

		case <-maxTestTimeReached:
			returnErr = op.reportMeasuredCapacity()
			return nil

		case msg = <-op.recvQueue:
			// Record start time and start sender.
			if !op.started {
				op.started = true
				op.startTime = time.Now()
				maxTestTimeReached = time.After(op.opts.MaxTime)
				if !op.senderStarted {
					op.senderStarted = true
					module.mgr.Go("op capacity sender", op.sender)
				}
			}

			// Add to received data counter.
			op.dataReceived += msg.Data.Length()

			// Check if we received the data received signal.
			if msg.Data.Length() == len(capacityTestDataReceivedSignal) &&
				bytes.Equal(msg.Data.CompileData(), capacityTestDataReceivedSignal) {
				op.dataSentWasAckd.Set()
			}

			// Send the data received signal when we received the full test volume.
			if op.dataReceived >= op.opts.TestVolume && !op.dataReceivedAckWasAckd {
				tErr := op.Send(op.NewMsg(capacityTestDataReceivedSignal), capacityTestSendTimeout)
				if tErr != nil {
					returnErr = tErr.Wrap("failed to send data received signal")
					return nil
				}
				atomic.AddInt64(op.dataSent, int64(len(capacityTestDataReceivedSignal)))
				op.dataReceivedAckWasAckd = true

				// Flush last message.
				op.Flush(10 * time.Second)
			}

			// Check if we can complete the test.
			// This requires that both sides have signaled full reception.
			if op.dataReceivedAckWasAckd &&
				op.dataSentWasAckd.IsSet() {
				returnErr = op.reportMeasuredCapacity()
				return nil
			}
		}
	}
}
// sender is the worker that transmits the test data. It sends high priority
// chunks until the test volume has been sent, the other side has signaled
// that it received everything, or the operation has stopped. A failed send
// stops the operation. The returned worker error is always nil.
func (op *CapacityTestOp) sender(ctx *mgr.WorkerCtx) error {
	for {
		// Transmit one chunk of test data.
		chunk := op.NewMsg(capacityTestSendData)
		chunk.Unit.MakeHighPriority()
		if sendErr := op.Send(chunk, capacityTestSendTimeout); sendErr != nil {
			op.Stop(op, sendErr.Wrap("failed to send capacity test data"))
			return nil
		}

		// Count the chunk, then check the end conditions in order.
		totalSent := atomic.AddInt64(op.dataSent, int64(len(capacityTestSendData)))
		switch {
		case totalSent >= int64(op.opts.TestVolume):
			// The full test volume was sent.
			return nil
		case op.dataSentWasAckd.IsSet():
			// The other side signaled that it received the full volume.
			return nil
		case op.Stopped():
			// The operation has ended.
			return nil
		}
	}
}
// reportMeasuredCapacity calculates the capacity from the data transferred in
// both directions since the start time and stores it as the test result in
// bit/s. If the operation runs on a crane controller terminal with a
// connected hub, the result is saved to the measurements of that hub and
// logged.
// An internal error is returned if the crane is owned by this side but has no
// connected hub, or - outside of tests - if the terminal is not a crane
// controller.
func (op *CapacityTestOp) reportMeasuredCapacity() *terminal.Error {
	// Guard against a division by zero.
	elapsed := time.Since(op.startTime)
	if elapsed <= 0 {
		elapsed = 1
	}

	// Sum up both directions, derive the rate per nanosecond and halve it to
	// get the rate of a single direction per second.
	totalBytes := int64(op.dataReceived) + atomic.LoadInt64(op.dataSent)
	duplexBits := float64(totalBytes * 8)
	duplexBitsPerNS := duplexBits / float64(elapsed)
	op.testResult = int((duplexBitsPerNS / 2) * float64(time.Second))

	// The result can only be saved via a crane controller terminal.
	controller, isController := op.Terminal().(*CraneControllerTerminal)
	if !isController {
		if !runningTests {
			return terminal.ErrInternalError.With("capacity operation was run on terminal that is not a crane controller, but %T", op.Terminal())
		}
		return nil
	}

	// Without a connected hub there is nowhere to save the result to.
	connectedHub := controller.Crane.ConnectedHub
	if connectedHub == nil {
		if controller.Crane.IsMine() {
			return terminal.ErrInternalError.With("capacity operation was run on %s without a connected hub set", controller.Crane)
		}
		return nil
	}

	// Save the result to the crane.
	connectedHub.GetMeasurements().SetCapacity(op.testResult)
	log.Infof(
		"docks: measured capacity to %s: %.2f Mbit/s (%.2fMB down / %.2fMB up in %s)",
		connectedHub,
		float64(op.testResult)/1000000,
		float64(op.dataReceived)/1000000,
		float64(atomic.LoadInt64(op.dataSent))/1000000,
		elapsed,
	)
	return nil
}
// Deliver queues a message for the handler.
// If the queue cannot take the message right away, Deliver waits up to one
// second for space. On timeout, the message is finished and ErrTimeout is
// returned.
func (op *CapacityTestOp) Deliver(msg *terminal.Msg) *terminal.Error {
	// Fast path: hand over without setting up a timer.
	select {
	case op.recvQueue <- msg:
		return nil
	default:
	}

	// Slow path: wait for the queue with a 1s timeout.
	select {
	case op.recvQueue <- msg:
		return nil
	case <-time.After(1 * time.Second):
		msg.Finish()
		return terminal.ErrTimeout
	}
}
// HandleStop gives the operation the ability to cleanly shut down.
// It publishes the end error on the result channel (without blocking) and
// finishes all messages that are still queued for the handler.
// The returned error is the error to send to the other side.
// Should never be called directly. Call Stop() instead.
func (op *CapacityTestOp) HandleStop(tErr *terminal.Error) (errorToSend *terminal.Error) {
	// Hand the result to a waiting routine, if the channel has room for it.
	select {
	case op.result <- tErr:
	default:
	}

	// Empty the recvQueue so that all message units are finished.
	for draining := true; draining; {
		// Take what is immediately available.
		select {
		case queued := <-op.recvQueue:
			queued.Finish()
			continue
		default:
		}

		// Queue looks empty: give late messages a short grace period before
		// giving up.
		select {
		case queued := <-op.recvQueue:
			queued.Finish()
		case <-time.After(3 * time.Millisecond):
			draining = false
		}
	}

	// The error is passed on unchanged.
	return tErr
}
// Result returns a receive-only view of the channel on which HandleStop
// publishes the end error of the operation.
func (op *CapacityTestOp) Result() <-chan *terminal.Error {
	var endErrors <-chan *terminal.Error = op.result
	return endErrors
}