mirror of
https://github.com/edgelesssys/constellation.git
synced 2025-01-27 15:57:04 -05:00
bootstrapper: retry helm chart installation (#1151)
Motivation for this change are intermittent timeout errors while installing cert-manager. Co-authored-by: Paul Meyer <49727155+katexochen@users.noreply.github.com>
This commit is contained in:
parent
c275464634
commit
8b7979c500
@ -21,10 +21,13 @@ import (
|
|||||||
"github.com/edgelesssys/constellation/v2/internal/constants"
|
"github.com/edgelesssys/constellation/v2/internal/constants"
|
||||||
"github.com/edgelesssys/constellation/v2/internal/deploy/helm"
|
"github.com/edgelesssys/constellation/v2/internal/deploy/helm"
|
||||||
"github.com/edgelesssys/constellation/v2/internal/logger"
|
"github.com/edgelesssys/constellation/v2/internal/logger"
|
||||||
|
"github.com/edgelesssys/constellation/v2/internal/retry"
|
||||||
"helm.sh/helm/v3/pkg/action"
|
"helm.sh/helm/v3/pkg/action"
|
||||||
|
"helm.sh/helm/v3/pkg/chart"
|
||||||
"helm.sh/helm/v3/pkg/chart/loader"
|
"helm.sh/helm/v3/pkg/chart/loader"
|
||||||
"helm.sh/helm/v3/pkg/cli"
|
"helm.sh/helm/v3/pkg/cli"
|
||||||
corev1 "k8s.io/api/core/v1"
|
corev1 "k8s.io/api/core/v1"
|
||||||
|
"k8s.io/apimachinery/pkg/util/wait"
|
||||||
)
|
)
|
||||||
|
|
||||||
const (
|
const (
|
||||||
@ -35,6 +38,7 @@ const (
|
|||||||
// Client is used to install microservice during cluster initialization. It is a wrapper for a helm install action.
|
// Client is used to install microservice during cluster initialization. It is a wrapper for a helm install action.
|
||||||
type Client struct {
|
type Client struct {
|
||||||
*action.Install
|
*action.Install
|
||||||
|
log *logger.Logger
|
||||||
}
|
}
|
||||||
|
|
||||||
// New creates a new client with the given logger.
|
// New creates a new client with the given logger.
|
||||||
@ -54,6 +58,7 @@ func New(log *logger.Logger) (*Client, error) {
|
|||||||
|
|
||||||
return &Client{
|
return &Client{
|
||||||
action,
|
action,
|
||||||
|
log,
|
||||||
}, nil
|
}, nil
|
||||||
}
|
}
|
||||||
|
|
||||||
@ -178,6 +183,9 @@ func (h *Client) installCiliumGCP(ctx context.Context, kubectl k8sapi.Client, re
|
|||||||
return nil
|
return nil
|
||||||
}
|
}
|
||||||
|
|
||||||
|
// install tries to install the given chart and aborts after ~5 tries.
|
||||||
|
// The function will wait 30 seconds before retrying a failed installation attempt.
|
||||||
|
// After 5 minutes the retrier will be canceld and the function returns with an error.
|
||||||
func (h *Client) install(ctx context.Context, chartRaw []byte, values map[string]any) error {
|
func (h *Client) install(ctx context.Context, chartRaw []byte, values map[string]any) error {
|
||||||
reader := bytes.NewReader(chartRaw)
|
reader := bytes.NewReader(chartRaw)
|
||||||
chart, err := loader.LoadArchive(reader)
|
chart, err := loader.LoadArchive(reader)
|
||||||
@ -185,9 +193,43 @@ func (h *Client) install(ctx context.Context, chartRaw []byte, values map[string
|
|||||||
return fmt.Errorf("helm load archive: %w", err)
|
return fmt.Errorf("helm load archive: %w", err)
|
||||||
}
|
}
|
||||||
|
|
||||||
_, err = h.RunWithContext(ctx, chart, values)
|
doer := installDoer{
|
||||||
if err != nil {
|
h,
|
||||||
|
chart,
|
||||||
|
values,
|
||||||
|
h.log,
|
||||||
|
}
|
||||||
|
retrier := retry.NewIntervalRetrier(doer, 30*time.Second, isTimeoutErr)
|
||||||
|
|
||||||
|
// Since we have no precise retry condition we want to stop retrying after 5 minutes.
|
||||||
|
// The helm library only reports a timeout error in the error cases we currently know.
|
||||||
|
// Other errors will not be retried.
|
||||||
|
newCtx, cancel := context.WithTimeout(ctx, 5*time.Minute)
|
||||||
|
defer cancel()
|
||||||
|
if err := retrier.Do(newCtx); err != nil {
|
||||||
return fmt.Errorf("helm install: %w", err)
|
return fmt.Errorf("helm install: %w", err)
|
||||||
}
|
}
|
||||||
return nil
|
return nil
|
||||||
}
|
}
|
||||||
|
|
||||||
|
// installDoer is a help struct to enable retrying helm's install action.
|
||||||
|
type installDoer struct {
|
||||||
|
client *Client
|
||||||
|
chart *chart.Chart
|
||||||
|
values map[string]any
|
||||||
|
log *logger.Logger
|
||||||
|
}
|
||||||
|
|
||||||
|
// Do logs which chart is installed and tries to install it.
|
||||||
|
func (i installDoer) Do(ctx context.Context) error {
|
||||||
|
i.log.Debugf("trying helm install for chart %s", i.chart.Name())
|
||||||
|
|
||||||
|
_, err := i.client.RunWithContext(ctx, i.chart, i.values)
|
||||||
|
|
||||||
|
return err
|
||||||
|
}
|
||||||
|
|
||||||
|
// isTimeoutErr checks if the given error is a timeout error from k8s.io/apimachinery.
|
||||||
|
func isTimeoutErr(err error) bool {
|
||||||
|
return errors.Is(err, wait.ErrWaitTimeout)
|
||||||
|
}
|
||||||
|
Loading…
x
Reference in New Issue
Block a user