2024-09-07 13:46:59 +00:00
|
|
|
// Package children manages the creation, lifetime, and shutdown of child
|
|
|
|
// processes created by the daemon.
|
|
|
|
package children
|
2024-07-06 13:36:48 +00:00
|
|
|
|
|
|
|
import (
|
2025-01-04 14:50:17 +00:00
|
|
|
"cmp"
|
2024-07-06 13:36:48 +00:00
|
|
|
"context"
|
2024-07-13 12:34:06 +00:00
|
|
|
"errors"
|
2024-07-06 13:36:48 +00:00
|
|
|
"fmt"
|
2025-01-04 14:50:17 +00:00
|
|
|
"slices"
|
2024-07-06 13:36:48 +00:00
|
|
|
|
|
|
|
"code.betamike.com/micropelago/pmux/pmuxlib"
|
2024-10-27 13:31:10 +00:00
|
|
|
"dev.mediocregopher.com/mediocre-go-lib.git/mctx"
|
2024-07-06 13:36:48 +00:00
|
|
|
"dev.mediocregopher.com/mediocre-go-lib.git/mlog"
|
2025-01-04 14:50:17 +00:00
|
|
|
"golang.org/x/exp/maps"
|
2024-09-07 13:46:59 +00:00
|
|
|
|
|
|
|
"isle/bootstrap"
|
|
|
|
"isle/daemon/daecommon"
|
2025-01-04 14:50:17 +00:00
|
|
|
"isle/garage"
|
2024-09-07 13:46:59 +00:00
|
|
|
"isle/secrets"
|
2024-09-09 14:34:00 +00:00
|
|
|
"isle/toolkit"
|
2024-07-06 13:36:48 +00:00
|
|
|
)
|
|
|
|
|
2025-01-04 14:50:17 +00:00
|
|
|
type garageProc struct {
|
|
|
|
*pmuxlib.Process
|
|
|
|
alloc daecommon.ConfigStorageAllocation
|
|
|
|
adminAddr string
|
|
|
|
}
|
|
|
|
|
2025-01-01 11:38:16 +00:00
|
|
|
// Opts are optional fields which can be passed into New. A nil value is
|
|
|
|
// equivalent to a zero value.
|
|
|
|
type Opts struct {
|
|
|
|
// GarageNewCluster should be true if the garage instances being started
|
|
|
|
// are the first instances in a cluster which is being created.
|
|
|
|
GarageNewCluster bool
|
|
|
|
}
|
|
|
|
|
|
|
|
func (o *Opts) withDefaults() *Opts {
|
|
|
|
if o == nil {
|
|
|
|
o = new(Opts)
|
|
|
|
}
|
|
|
|
return o
|
|
|
|
}
|
|
|
|
|
2024-07-06 13:36:48 +00:00
|
|
|
// Children manages all child processes of a network. Child processes are
|
|
|
|
// comprised of:
|
|
|
|
// - nebula
|
|
|
|
// - dnsmasq
|
|
|
|
// - garage (0 or more, depending on configured storage allocations)
|
|
|
|
type Children struct {
|
2024-12-12 21:02:00 +00:00
|
|
|
logger *mlog.Logger
|
|
|
|
binDirPath string
|
|
|
|
runtimeDir toolkit.Dir
|
|
|
|
garageAdminToken string
|
|
|
|
nebulaDeviceNamer *NebulaDeviceNamer
|
2024-10-27 13:31:10 +00:00
|
|
|
|
|
|
|
garageRPCSecret string
|
2024-07-06 13:36:48 +00:00
|
|
|
|
2024-10-29 14:11:13 +00:00
|
|
|
nebulaProc *pmuxlib.Process
|
|
|
|
dnsmasqProc *pmuxlib.Process
|
2025-01-04 14:50:17 +00:00
|
|
|
garageProcs map[string]garageProc
|
2024-07-06 13:36:48 +00:00
|
|
|
}
|
|
|
|
|
2024-09-07 13:46:59 +00:00
|
|
|
// New initializes and returns a Children instance. If initialization fails an
|
|
|
|
// error is returned.
|
|
|
|
func New(
|
2024-07-06 13:36:48 +00:00
|
|
|
ctx context.Context,
|
|
|
|
logger *mlog.Logger,
|
2024-07-13 12:34:06 +00:00
|
|
|
binDirPath string,
|
|
|
|
secretsStore secrets.Store,
|
2024-09-10 20:51:33 +00:00
|
|
|
networkConfig daecommon.NetworkConfig,
|
2024-09-09 14:34:00 +00:00
|
|
|
runtimeDir toolkit.Dir,
|
2024-07-14 10:19:39 +00:00
|
|
|
garageAdminToken string,
|
2024-12-12 21:02:00 +00:00
|
|
|
nebulaDeviceNamer *NebulaDeviceNamer,
|
2024-07-06 13:36:48 +00:00
|
|
|
hostBootstrap bootstrap.Bootstrap,
|
2025-01-01 11:38:16 +00:00
|
|
|
opts *Opts,
|
2024-07-06 13:36:48 +00:00
|
|
|
) (
|
|
|
|
*Children, error,
|
|
|
|
) {
|
2025-01-01 11:38:16 +00:00
|
|
|
opts = opts.withDefaults()
|
|
|
|
|
2024-07-13 12:34:06 +00:00
|
|
|
logger.Info(ctx, "Loading secrets")
|
2024-09-07 13:11:04 +00:00
|
|
|
garageRPCSecret, err := daecommon.GetGarageRPCSecret(ctx, secretsStore)
|
2024-07-13 12:34:06 +00:00
|
|
|
if err != nil && !errors.Is(err, secrets.ErrNotFound) {
|
|
|
|
return nil, fmt.Errorf("loading garage RPC secret: %w", err)
|
|
|
|
}
|
|
|
|
|
2024-07-06 13:36:48 +00:00
|
|
|
c := &Children{
|
2024-12-12 21:02:00 +00:00
|
|
|
logger: logger,
|
|
|
|
binDirPath: binDirPath,
|
|
|
|
runtimeDir: runtimeDir,
|
|
|
|
garageAdminToken: garageAdminToken,
|
|
|
|
nebulaDeviceNamer: nebulaDeviceNamer,
|
|
|
|
garageRPCSecret: garageRPCSecret,
|
2024-07-06 13:36:48 +00:00
|
|
|
}
|
|
|
|
|
2024-10-29 14:11:13 +00:00
|
|
|
if c.nebulaProc, err = nebulaPmuxProc(
|
|
|
|
ctx,
|
|
|
|
c.logger,
|
|
|
|
c.runtimeDir.Path,
|
|
|
|
c.binDirPath,
|
2024-12-12 21:02:00 +00:00
|
|
|
c.nebulaDeviceNamer,
|
2024-10-29 14:11:13 +00:00
|
|
|
networkConfig,
|
|
|
|
hostBootstrap,
|
|
|
|
); err != nil {
|
|
|
|
return nil, fmt.Errorf("starting nebula: %w", err)
|
|
|
|
}
|
|
|
|
|
|
|
|
if err := waitForNebula(ctx, c.logger, hostBootstrap); err != nil {
|
|
|
|
logger.Warn(ctx, "Failed waiting for nebula to initialize, shutting down child processes", err)
|
|
|
|
c.Shutdown()
|
|
|
|
return nil, fmt.Errorf("waiting for nebula to start: %w", err)
|
|
|
|
}
|
|
|
|
|
|
|
|
if c.dnsmasqProc, err = dnsmasqPmuxProc(
|
|
|
|
ctx,
|
|
|
|
c.logger,
|
|
|
|
c.runtimeDir.Path,
|
|
|
|
c.binDirPath,
|
|
|
|
networkConfig,
|
|
|
|
hostBootstrap,
|
|
|
|
); err != nil {
|
|
|
|
logger.Warn(ctx, "Failed to start dnsmasq, shutting down child processes", err)
|
|
|
|
c.Shutdown()
|
|
|
|
return nil, fmt.Errorf("starting dnsmasq: %w", err)
|
|
|
|
}
|
|
|
|
|
|
|
|
if c.garageProcs, err = garagePmuxProcs(
|
2024-07-14 10:19:39 +00:00
|
|
|
ctx,
|
2024-10-29 14:11:13 +00:00
|
|
|
c.logger,
|
2024-07-14 10:19:39 +00:00
|
|
|
garageRPCSecret,
|
2024-10-29 14:11:13 +00:00
|
|
|
c.runtimeDir.Path,
|
|
|
|
c.binDirPath,
|
2024-09-10 20:51:33 +00:00
|
|
|
networkConfig,
|
2024-07-14 10:19:39 +00:00
|
|
|
garageAdminToken,
|
|
|
|
hostBootstrap,
|
2024-10-29 14:11:13 +00:00
|
|
|
); err != nil {
|
|
|
|
logger.Warn(ctx, "Failed to start garage processes, shutting down child processes", err)
|
|
|
|
c.Shutdown()
|
|
|
|
return nil, fmt.Errorf("starting garage processes: %w", err)
|
2024-07-06 13:36:48 +00:00
|
|
|
}
|
|
|
|
|
2024-10-29 14:11:13 +00:00
|
|
|
if err := waitForGarage(
|
2025-01-01 11:38:16 +00:00
|
|
|
ctx,
|
|
|
|
c.logger,
|
|
|
|
garageAdminToken,
|
2025-01-04 14:50:17 +00:00
|
|
|
c.garageProcs,
|
2025-01-01 11:38:16 +00:00
|
|
|
opts.GarageNewCluster,
|
2024-10-29 14:11:13 +00:00
|
|
|
); err != nil {
|
|
|
|
logger.Warn(ctx, "Failed waiting for garage processes to initialize, shutting down child processes", err)
|
2024-07-20 09:07:11 +00:00
|
|
|
c.Shutdown()
|
2024-10-29 14:11:13 +00:00
|
|
|
return nil, fmt.Errorf("waiting for garage processes to initialize: %w", err)
|
2024-07-06 13:36:48 +00:00
|
|
|
}
|
|
|
|
|
|
|
|
return c, nil
|
|
|
|
}
|
|
|
|
|
2024-10-24 19:19:58 +00:00
|
|
|
func (c *Children) reloadDNSMasq(
|
2024-10-27 13:31:10 +00:00
|
|
|
ctx context.Context,
|
2024-10-24 19:19:58 +00:00
|
|
|
networkConfig daecommon.NetworkConfig,
|
|
|
|
hostBootstrap bootstrap.Bootstrap,
|
|
|
|
) error {
|
2024-10-27 13:31:10 +00:00
|
|
|
if _, changed, err := dnsmasqWriteConfig(
|
|
|
|
ctx, c.logger, c.runtimeDir.Path, networkConfig, hostBootstrap,
|
|
|
|
); err != nil {
|
2024-07-19 18:49:04 +00:00
|
|
|
return fmt.Errorf("writing new dnsmasq config: %w", err)
|
2024-10-27 13:31:10 +00:00
|
|
|
} else if !changed {
|
|
|
|
c.logger.Info(ctx, "No changes to dnsmasq config file")
|
|
|
|
return nil
|
2024-07-19 18:49:04 +00:00
|
|
|
}
|
|
|
|
|
2024-10-27 13:31:10 +00:00
|
|
|
c.logger.Info(ctx, "dnsmasq config file has changed, restarting process")
|
2024-10-29 14:11:13 +00:00
|
|
|
c.dnsmasqProc.Restart()
|
2024-10-27 13:31:10 +00:00
|
|
|
|
2024-07-19 18:49:04 +00:00
|
|
|
return nil
|
|
|
|
}
|
|
|
|
|
2024-10-24 19:19:58 +00:00
|
|
|
func (c *Children) reloadNebula(
|
|
|
|
ctx context.Context,
|
|
|
|
networkConfig daecommon.NetworkConfig,
|
|
|
|
hostBootstrap bootstrap.Bootstrap,
|
|
|
|
) error {
|
2024-10-27 13:31:10 +00:00
|
|
|
if _, changed, err := nebulaWriteConfig(
|
2024-12-12 21:02:00 +00:00
|
|
|
ctx,
|
|
|
|
c.logger,
|
|
|
|
c.runtimeDir.Path,
|
|
|
|
c.nebulaDeviceNamer,
|
|
|
|
networkConfig,
|
|
|
|
hostBootstrap,
|
2024-10-27 13:31:10 +00:00
|
|
|
); err != nil {
|
2024-07-19 18:49:04 +00:00
|
|
|
return fmt.Errorf("writing a new nebula config: %w", err)
|
2024-10-27 13:31:10 +00:00
|
|
|
} else if !changed {
|
|
|
|
c.logger.Info(ctx, "No changes to nebula config file")
|
|
|
|
return nil
|
2024-07-19 18:49:04 +00:00
|
|
|
}
|
|
|
|
|
2024-10-27 13:31:10 +00:00
|
|
|
c.logger.Info(ctx, "nebula config file has changed, restarting process")
|
2024-10-29 14:11:13 +00:00
|
|
|
c.nebulaProc.Restart()
|
2024-10-24 19:19:58 +00:00
|
|
|
|
|
|
|
if err := waitForNebula(ctx, c.logger, hostBootstrap); err != nil {
|
|
|
|
return fmt.Errorf("waiting for nebula to start: %w", err)
|
|
|
|
}
|
|
|
|
|
2024-07-19 18:49:04 +00:00
|
|
|
return nil
|
|
|
|
}
|
|
|
|
|
2024-10-27 13:31:10 +00:00
|
|
|
func (c *Children) reloadGarage(
|
|
|
|
ctx context.Context,
|
|
|
|
networkConfig daecommon.NetworkConfig,
|
|
|
|
hostBootstrap bootstrap.Bootstrap,
|
|
|
|
) error {
|
|
|
|
allocs := networkConfig.Storage.Allocations
|
|
|
|
if len(allocs) == 0 {
|
|
|
|
return nil
|
|
|
|
}
|
|
|
|
|
2025-01-04 14:50:17 +00:00
|
|
|
thisHost := hostBootstrap.ThisHost()
|
|
|
|
|
2025-01-01 12:07:35 +00:00
|
|
|
var anyCreated bool
|
2024-10-27 13:31:10 +00:00
|
|
|
for _, alloc := range allocs {
|
|
|
|
var (
|
|
|
|
procName = garagePmuxProcName(alloc)
|
|
|
|
ctx = mctx.Annotate(
|
|
|
|
ctx,
|
|
|
|
"garageProcName", procName,
|
|
|
|
"garageDataPath", alloc.DataPath,
|
|
|
|
)
|
|
|
|
)
|
|
|
|
|
2025-01-01 12:07:35 +00:00
|
|
|
childConfigPath, err := garageWriteChildConfig(
|
2024-10-27 13:31:10 +00:00
|
|
|
ctx,
|
|
|
|
c.logger,
|
|
|
|
c.garageRPCSecret,
|
|
|
|
c.runtimeDir.Path,
|
|
|
|
c.garageAdminToken,
|
|
|
|
hostBootstrap,
|
|
|
|
alloc,
|
|
|
|
)
|
|
|
|
if err != nil {
|
|
|
|
return fmt.Errorf("writing child config file for alloc %+v: %w", alloc, err)
|
|
|
|
}
|
|
|
|
|
2025-01-01 12:07:35 +00:00
|
|
|
if _, ok := c.garageProcs[procName]; ok {
|
|
|
|
c.logger.Info(ctx, "Garage instance already exists")
|
2024-10-29 14:11:13 +00:00
|
|
|
continue
|
|
|
|
}
|
|
|
|
|
2025-01-01 12:07:35 +00:00
|
|
|
anyCreated = true
|
|
|
|
|
|
|
|
c.logger.Info(ctx, "Garage config has been added, creating process")
|
2025-01-04 14:50:17 +00:00
|
|
|
c.garageProcs[procName] = garageProc{
|
|
|
|
Process: garagePmuxProc(
|
|
|
|
ctx, c.logger, c.binDirPath, procName, childConfigPath,
|
|
|
|
),
|
|
|
|
alloc: alloc,
|
|
|
|
adminAddr: garageAllocAdminAddr(thisHost, alloc),
|
|
|
|
}
|
2024-10-27 13:31:10 +00:00
|
|
|
}
|
|
|
|
|
2025-01-01 12:07:35 +00:00
|
|
|
if anyCreated {
|
2024-10-27 13:31:10 +00:00
|
|
|
if err := waitForGarage(
|
2025-01-01 11:38:16 +00:00
|
|
|
ctx,
|
|
|
|
c.logger,
|
|
|
|
c.garageAdminToken,
|
2025-01-04 14:50:17 +00:00
|
|
|
c.garageProcs,
|
2025-01-01 11:38:16 +00:00
|
|
|
false,
|
2024-10-27 13:31:10 +00:00
|
|
|
); err != nil {
|
|
|
|
return fmt.Errorf("waiting for garage to start: %w", err)
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
return nil
|
|
|
|
}
|
|
|
|
|
2024-09-07 13:46:59 +00:00
|
|
|
// Reload applies a ReloadDiff to the Children, using the given bootstrap which
|
|
|
|
// must be the same one which was passed to CalculateReloadDiff.
|
|
|
|
func (c *Children) Reload(
|
2024-10-24 19:19:58 +00:00
|
|
|
ctx context.Context,
|
|
|
|
newNetworkConfig daecommon.NetworkConfig,
|
|
|
|
newBootstrap bootstrap.Bootstrap,
|
2024-09-07 13:46:59 +00:00
|
|
|
) error {
|
2024-10-27 13:31:10 +00:00
|
|
|
if err := c.reloadNebula(ctx, newNetworkConfig, newBootstrap); err != nil {
|
|
|
|
return fmt.Errorf("reloading nebula: %w", err)
|
|
|
|
}
|
|
|
|
|
2024-09-07 13:46:59 +00:00
|
|
|
var errs []error
|
|
|
|
|
2024-10-27 13:31:10 +00:00
|
|
|
if err := c.reloadDNSMasq(ctx, newNetworkConfig, newBootstrap); err != nil {
|
|
|
|
errs = append(errs, fmt.Errorf("reloading dnsmasq: %w", err))
|
2024-09-07 13:46:59 +00:00
|
|
|
}
|
|
|
|
|
2024-10-27 13:31:10 +00:00
|
|
|
if err := c.reloadGarage(ctx, newNetworkConfig, newBootstrap); err != nil {
|
|
|
|
errs = append(errs, fmt.Errorf("reloading garage: %w", err))
|
2024-09-07 13:46:59 +00:00
|
|
|
}
|
|
|
|
|
|
|
|
return errors.Join(errs...)
|
|
|
|
}
|
|
|
|
|
2025-01-04 14:50:17 +00:00
|
|
|
// GarageAdminClient returns an admin client for an active local garage process,
|
|
|
|
// or false if there are no garage processes.
|
|
|
|
func (c *Children) GarageAdminClient() (*garage.AdminClient, bool) {
|
|
|
|
if len(c.garageProcs) == 0 {
|
|
|
|
return nil, false
|
|
|
|
}
|
|
|
|
|
|
|
|
procsSlice := maps.Values(c.garageProcs)
|
|
|
|
slices.SortFunc(procsSlice, func(a, b garageProc) int {
|
|
|
|
return cmp.Compare(a.alloc.RPCPort, b.alloc.RPCPort)
|
|
|
|
})
|
|
|
|
|
|
|
|
return garage.NewAdminClient(
|
|
|
|
garageAdminClientLogger(c.logger),
|
|
|
|
procsSlice[0].adminAddr,
|
|
|
|
c.garageAdminToken,
|
|
|
|
), true
|
|
|
|
}
|
|
|
|
|
|
|
|
// GarageAdminClientForAlloc returns an admin client for a particular allocation
|
|
|
|
// which has a currently running garage instance, or false if there the
|
|
|
|
// allocation has no currently running instance.
|
|
|
|
func (c *Children) GarageAdminClientForAlloc(
|
|
|
|
alloc daecommon.ConfigStorageAllocation,
|
|
|
|
) (
|
|
|
|
*garage.AdminClient, bool,
|
|
|
|
) {
|
|
|
|
procName := garagePmuxProcName(alloc)
|
|
|
|
proc, ok := c.garageProcs[procName]
|
|
|
|
if !ok {
|
|
|
|
return nil, false
|
|
|
|
}
|
|
|
|
|
|
|
|
return garage.NewAdminClient(
|
|
|
|
garageAdminClientLogger(c.logger),
|
|
|
|
proc.adminAddr,
|
|
|
|
c.garageAdminToken,
|
|
|
|
), true
|
|
|
|
}
|
|
|
|
|
2024-07-06 13:36:48 +00:00
|
|
|
// Shutdown blocks until all child processes have gracefully shut themselves
|
|
|
|
// down.
|
2024-07-20 09:07:11 +00:00
|
|
|
func (c *Children) Shutdown() {
|
2024-10-29 14:11:13 +00:00
|
|
|
for _, proc := range c.garageProcs {
|
|
|
|
proc.Stop()
|
|
|
|
}
|
|
|
|
|
|
|
|
if c.dnsmasqProc != nil {
|
|
|
|
c.dnsmasqProc.Stop()
|
|
|
|
}
|
|
|
|
|
|
|
|
if c.nebulaProc != nil {
|
|
|
|
c.nebulaProc.Stop()
|
|
|
|
}
|
2024-07-06 13:36:48 +00:00
|
|
|
}
|