mirror of
https://github.com/edgelesssys/constellation.git
synced 2024-12-11 17:04:22 -05:00
005e865a13
* [wip] use state file in CLI Signed-off-by: Moritz Sanft <58110325+msanft@users.noreply.github.com> tidy Signed-off-by: Moritz Sanft <58110325+msanft@users.noreply.github.com> * use state file in CLI Signed-off-by: Moritz Sanft <58110325+msanft@users.noreply.github.com> take clusterConfig from IDFile for compat Signed-off-by: Moritz Sanft <58110325+msanft@users.noreply.github.com> various fixes Signed-off-by: Moritz Sanft <58110325+msanft@users.noreply.github.com> wip Signed-off-by: Moritz Sanft <58110325+msanft@users.noreply.github.com> * add GCP-specific values in Helm loader test Signed-off-by: Moritz Sanft <58110325+msanft@users.noreply.github.com> * remove unnecessary pointer Signed-off-by: Moritz Sanft <58110325+msanft@users.noreply.github.com> * write ClusterValues in one step Signed-off-by: Moritz Sanft <58110325+msanft@users.noreply.github.com> * move stub to test file Signed-off-by: Moritz Sanft <58110325+msanft@users.noreply.github.com> * remove mention of id-file Signed-off-by: Moritz Sanft <58110325+msanft@users.noreply.github.com> * move output to `migrateTerraform` Signed-off-by: Moritz Sanft <58110325+msanft@users.noreply.github.com> * unconditional assignments converting from idFile Signed-off-by: Moritz Sanft <58110325+msanft@users.noreply.github.com> * move require block in go modules file Signed-off-by: Moritz Sanft <58110325+msanft@users.noreply.github.com> * fall back to id file on upgrade Signed-off-by: Moritz Sanft <58110325+msanft@users.noreply.github.com> * tidy Signed-off-by: Moritz Sanft <58110325+msanft@users.noreply.github.com> * fix linter check Signed-off-by: Moritz Sanft <58110325+msanft@users.noreply.github.com> * add notice to remove Terraform state check on manual migration Signed-off-by: Moritz Sanft <58110325+msanft@users.noreply.github.com> * add `name` field Signed-off-by: Moritz Sanft <58110325+msanft@users.noreply.github.com> fix name tests Signed-off-by: Moritz Sanft <58110325+msanft@users.noreply.github.com> * return 
early if no Terraform diff Signed-off-by: Moritz Sanft <58110325+msanft@users.noreply.github.com> * tidy Signed-off-by: Moritz Sanft <58110325+msanft@users.noreply.github.com> * return infrastructure state even if no diff exists Signed-off-by: Moritz Sanft <58110325+msanft@users.noreply.github.com> * add TODO to remove comment Signed-off-by: Moritz Sanft <58110325+msanft@users.noreply.github.com> * use state-file in miniconstellation Signed-off-by: Moritz Sanft <58110325+msanft@users.noreply.github.com> * cli: remove id-file (#2402) * remove id-file from `constellation create` Signed-off-by: Moritz Sanft <58110325+msanft@users.noreply.github.com> * add file renaming to handler * rename id-file after upgrade * use idFile on `constellation init` Signed-off-by: Moritz Sanft <58110325+msanft@users.noreply.github.com> * remove id-file from `constellation verify` Signed-off-by: Moritz Sanft <58110325+msanft@users.noreply.github.com> * linter fixes Signed-off-by: Moritz Sanft <58110325+msanft@users.noreply.github.com> * remove id-file from `constellation mini` * remove id-file from `constellation recover` * linter fixes * remove id-file from `constellation terminate` * fix initSecret type * fix recover argument precedence * fix terminate test * generate * add TODO to remove id-file removal * Update cli/internal/cmd/init.go Co-authored-by: Adrian Stobbe <stobbe.adrian@gmail.com> * fix verify arg parse logic Signed-off-by: Moritz Sanft <58110325+msanft@users.noreply.github.com> * add version test Signed-off-by: Moritz Sanft <58110325+msanft@users.noreply.github.com> * remove id-file from docs * add file not found log * use state-file in miniconstellation Signed-off-by: Moritz Sanft <58110325+msanft@users.noreply.github.com> * remove id-file from `constellation iam destroy` Signed-off-by: Moritz Sanft <58110325+msanft@users.noreply.github.com> * remove id-file from `cdbg deploy` Signed-off-by: Moritz Sanft <58110325+msanft@users.noreply.github.com> --------- Signed-off-by: 
Moritz Sanft <58110325+msanft@users.noreply.github.com> Co-authored-by: Adrian Stobbe <stobbe.adrian@gmail.com> * use state-file in CI Signed-off-by: Moritz Sanft <58110325+msanft@users.noreply.github.com> * update orchestration docs --------- Signed-off-by: Moritz Sanft <58110325+msanft@users.noreply.github.com> Co-authored-by: Adrian Stobbe <stobbe.adrian@gmail.com>
264 lines
7.9 KiB
Go
264 lines
7.9 KiB
Go
/*
|
|
Copyright (c) Edgeless Systems GmbH
|
|
|
|
SPDX-License-Identifier: AGPL-3.0-only
|
|
*/
|
|
|
|
package cmd
|
|
|
|
import (
|
|
"context"
|
|
"errors"
|
|
"fmt"
|
|
"io"
|
|
"net"
|
|
"sync"
|
|
"time"
|
|
|
|
"github.com/edgelesssys/constellation/v2/cli/internal/cloudcmd"
|
|
"github.com/edgelesssys/constellation/v2/cli/internal/cmd/pathprefix"
|
|
"github.com/edgelesssys/constellation/v2/cli/internal/state"
|
|
"github.com/edgelesssys/constellation/v2/disk-mapper/recoverproto"
|
|
"github.com/edgelesssys/constellation/v2/internal/api/attestationconfigapi"
|
|
"github.com/edgelesssys/constellation/v2/internal/atls"
|
|
"github.com/edgelesssys/constellation/v2/internal/cloud/cloudprovider"
|
|
"github.com/edgelesssys/constellation/v2/internal/config"
|
|
"github.com/edgelesssys/constellation/v2/internal/constants"
|
|
"github.com/edgelesssys/constellation/v2/internal/file"
|
|
"github.com/edgelesssys/constellation/v2/internal/grpc/dialer"
|
|
grpcRetry "github.com/edgelesssys/constellation/v2/internal/grpc/retry"
|
|
"github.com/edgelesssys/constellation/v2/internal/kms/uri"
|
|
"github.com/edgelesssys/constellation/v2/internal/retry"
|
|
"github.com/spf13/afero"
|
|
"github.com/spf13/cobra"
|
|
)
|
|
|
|
// NewRecoverCmd returns a new cobra.Command for the recover command.
|
|
func NewRecoverCmd() *cobra.Command {
|
|
cmd := &cobra.Command{
|
|
Use: "recover",
|
|
Short: "Recover a completely stopped Constellation cluster",
|
|
Long: "Recover a Constellation cluster by sending a recovery key to an instance in the boot stage.\n\n" +
|
|
"This is only required if instances restart without other instances available for bootstrapping.",
|
|
Args: cobra.ExactArgs(0),
|
|
RunE: runRecover,
|
|
}
|
|
cmd.Flags().StringP("endpoint", "e", "", "endpoint of the instance, passed as HOST[:PORT]")
|
|
return cmd
|
|
}
|
|
|
|
type recoverCmd struct {
|
|
log debugLog
|
|
configFetcher attestationconfigapi.Fetcher
|
|
pf pathprefix.PathPrefixer
|
|
}
|
|
|
|
func runRecover(cmd *cobra.Command, _ []string) error {
|
|
log, err := newCLILogger(cmd)
|
|
if err != nil {
|
|
return fmt.Errorf("creating logger: %w", err)
|
|
}
|
|
defer log.Sync()
|
|
fileHandler := file.NewHandler(afero.NewOsFs())
|
|
newDialer := func(validator atls.Validator) *dialer.Dialer {
|
|
return dialer.New(nil, validator, &net.Dialer{})
|
|
}
|
|
r := &recoverCmd{log: log, configFetcher: attestationconfigapi.NewFetcher()}
|
|
return r.recover(cmd, fileHandler, 5*time.Second, &recoverDoer{log: r.log}, newDialer)
|
|
}
|
|
|
|
func (r *recoverCmd) recover(
|
|
cmd *cobra.Command, fileHandler file.Handler, interval time.Duration,
|
|
doer recoverDoerInterface, newDialer func(validator atls.Validator) *dialer.Dialer,
|
|
) error {
|
|
flags, err := r.parseRecoverFlags(cmd, fileHandler)
|
|
if err != nil {
|
|
return err
|
|
}
|
|
r.log.Debugf("Using flags: %+v", flags)
|
|
|
|
var masterSecret uri.MasterSecret
|
|
r.log.Debugf("Loading master secret file from %s", r.pf.PrefixPrintablePath(constants.MasterSecretFilename))
|
|
if err := fileHandler.ReadJSON(constants.MasterSecretFilename, &masterSecret); err != nil {
|
|
return err
|
|
}
|
|
|
|
r.log.Debugf("Loading configuration file from %q", r.pf.PrefixPrintablePath(constants.ConfigFilename))
|
|
conf, err := config.New(fileHandler, constants.ConfigFilename, r.configFetcher, flags.force)
|
|
var configValidationErr *config.ValidationError
|
|
if errors.As(err, &configValidationErr) {
|
|
cmd.PrintErrln(configValidationErr.LongMessage())
|
|
}
|
|
if err != nil {
|
|
return err
|
|
}
|
|
|
|
provider := conf.GetProvider()
|
|
r.log.Debugf("Got provider %s", provider.String())
|
|
if provider == cloudprovider.Azure {
|
|
interval = 20 * time.Second // Azure LB takes a while to remove unhealthy instances
|
|
}
|
|
|
|
conf.UpdateMAAURL(flags.maaURL)
|
|
r.log.Debugf("Creating aTLS Validator for %s", conf.GetAttestationConfig().GetVariant())
|
|
validator, err := cloudcmd.NewValidator(cmd, conf.GetAttestationConfig(), r.log)
|
|
if err != nil {
|
|
return fmt.Errorf("creating new validator: %w", err)
|
|
}
|
|
r.log.Debugf("Created a new validator")
|
|
doer.setDialer(newDialer(validator), flags.endpoint)
|
|
r.log.Debugf("Set dialer for endpoint %s", flags.endpoint)
|
|
doer.setURIs(masterSecret.EncodeToURI(), uri.NoStoreURI)
|
|
r.log.Debugf("Set secrets")
|
|
if err := r.recoverCall(cmd.Context(), cmd.OutOrStdout(), interval, doer); err != nil {
|
|
if grpcRetry.ServiceIsUnavailable(err) {
|
|
return nil
|
|
}
|
|
return fmt.Errorf("recovering cluster: %w", err)
|
|
}
|
|
return nil
|
|
}
|
|
|
|
func (r *recoverCmd) recoverCall(ctx context.Context, out io.Writer, interval time.Duration, doer recoverDoerInterface) error {
|
|
var err error
|
|
ctr := 0
|
|
for {
|
|
once := sync.Once{}
|
|
retryOnceOnFailure := func(err error) bool {
|
|
var retry bool
|
|
// retry transient GCP LB errors
|
|
if grpcRetry.LoadbalancerIsNotReady(err) {
|
|
retry = true
|
|
} else {
|
|
// retry connection errors once
|
|
// this is necessary because Azure's LB takes a while to remove unhealthy instances
|
|
once.Do(func() {
|
|
retry = grpcRetry.ServiceIsUnavailable(err)
|
|
})
|
|
}
|
|
|
|
r.log.Debugf("Encountered error (retriable: %t): %s", retry, err)
|
|
return retry
|
|
}
|
|
|
|
retrier := retry.NewIntervalRetrier(doer, interval, retryOnceOnFailure)
|
|
r.log.Debugf("Created new interval retrier")
|
|
err = retrier.Do(ctx)
|
|
if err != nil {
|
|
break
|
|
}
|
|
fmt.Fprintln(out, "Pushed recovery key.")
|
|
ctr++
|
|
}
|
|
r.log.Debugf("Retry counter is %d", ctr)
|
|
if ctr > 0 {
|
|
fmt.Fprintf(out, "Recovered %d control-plane nodes.\n", ctr)
|
|
} else if grpcRetry.ServiceIsUnavailable(err) {
|
|
fmt.Fprintln(out, "No control-plane nodes in need of recovery found. Exiting.")
|
|
return nil
|
|
}
|
|
return err
|
|
}
|
|
|
|
type recoverDoerInterface interface {
|
|
Do(ctx context.Context) error
|
|
setDialer(dialer grpcDialer, endpoint string)
|
|
setURIs(kmsURI, storageURI string)
|
|
}
|
|
|
|
type recoverDoer struct {
|
|
dialer grpcDialer
|
|
endpoint string
|
|
kmsURI string // encodes masterSecret
|
|
storageURI string
|
|
log debugLog
|
|
}
|
|
|
|
// Do performs the recover streaming rpc.
|
|
func (d *recoverDoer) Do(ctx context.Context) (retErr error) {
|
|
conn, err := d.dialer.Dial(ctx, d.endpoint)
|
|
if err != nil {
|
|
return fmt.Errorf("dialing recovery server: %w", err)
|
|
}
|
|
d.log.Debugf("Dialed recovery server")
|
|
defer conn.Close()
|
|
|
|
protoClient := recoverproto.NewAPIClient(conn)
|
|
d.log.Debugf("Created protoClient")
|
|
|
|
req := &recoverproto.RecoverMessage{
|
|
KmsUri: d.kmsURI,
|
|
StorageUri: d.storageURI,
|
|
}
|
|
|
|
_, err = protoClient.Recover(ctx, req)
|
|
if err != nil {
|
|
return fmt.Errorf("calling recover: %w", err)
|
|
}
|
|
|
|
d.log.Debugf("Received confirmation")
|
|
return nil
|
|
}
|
|
|
|
func (d *recoverDoer) setDialer(dialer grpcDialer, endpoint string) {
|
|
d.dialer = dialer
|
|
d.endpoint = endpoint
|
|
}
|
|
|
|
func (d *recoverDoer) setURIs(kmsURI, storageURI string) {
|
|
d.kmsURI = kmsURI
|
|
d.storageURI = storageURI
|
|
}
|
|
|
|
// recoverFlags is the result of parseRecoverFlags.
type recoverFlags struct {
	// endpoint is the address of the instance to contact, after
	// addPortIfMissing has been applied.
	endpoint string
	// maaURL is the Azure attestation URL taken from the state file; it is
	// empty when the state file has no Azure section or was not read.
	maaURL string
	// force is the value of the "force" flag.
	force bool
}
|
|
|
|
func (r *recoverCmd) parseRecoverFlags(cmd *cobra.Command, fileHandler file.Handler) (recoverFlags, error) {
|
|
workDir, err := cmd.Flags().GetString("workspace")
|
|
if err != nil {
|
|
return recoverFlags{}, fmt.Errorf("parsing config path argument: %w", err)
|
|
}
|
|
r.log.Debugf("Workspace set to %q", workDir)
|
|
r.pf = pathprefix.New(workDir)
|
|
|
|
endpoint, err := cmd.Flags().GetString("endpoint")
|
|
r.log.Debugf("Endpoint flag is %s", endpoint)
|
|
if err != nil {
|
|
return recoverFlags{}, fmt.Errorf("parsing endpoint argument: %w", err)
|
|
}
|
|
|
|
force, err := cmd.Flags().GetBool("force")
|
|
if err != nil {
|
|
return recoverFlags{}, fmt.Errorf("parsing force argument: %w", err)
|
|
}
|
|
|
|
var attestationURL string
|
|
stateFile := state.New()
|
|
if endpoint == "" {
|
|
stateFile, err = state.ReadFromFile(fileHandler, constants.StateFilename)
|
|
if err != nil {
|
|
return recoverFlags{}, fmt.Errorf("reading state file: %w", err)
|
|
}
|
|
endpoint = stateFile.Infrastructure.ClusterEndpoint
|
|
}
|
|
|
|
endpoint, err = addPortIfMissing(endpoint, constants.RecoveryPort)
|
|
if err != nil {
|
|
return recoverFlags{}, fmt.Errorf("validating endpoint argument: %w", err)
|
|
}
|
|
r.log.Debugf("Endpoint value after parsing is %s", endpoint)
|
|
|
|
if stateFile.Infrastructure.Azure != nil {
|
|
attestationURL = stateFile.Infrastructure.Azure.AttestationURL
|
|
}
|
|
|
|
return recoverFlags{
|
|
endpoint: endpoint,
|
|
maaURL: attestationURL,
|
|
force: force,
|
|
}, nil
|
|
}
|