From 496d541822e1b3fcd58a47e7c528a6bb467f27ee Mon Sep 17 00:00:00 2001 From: Vishal Dalwadi <51291657+VishalDalwadi@users.noreply.github.com> Date: Tue, 10 Dec 2024 11:45:54 +0530 Subject: [PATCH] NET-1833: add retries to license key validation. (#3222) * feat(go): add retries to license key validation. * feat(go): increase the number of retries. --- pro/license.go | 119 ++++++++++++++++++++++++++++++------------------- utils/utils.go | 41 +++++++++++++++++ 2 files changed, 114 insertions(+), 46 deletions(-) create mode 100644 utils/utils.go diff --git a/pro/license.go b/pro/license.go index 50825d8a3..c623a2409 100644 --- a/pro/license.go +++ b/pro/license.go @@ -9,6 +9,7 @@ import ( "encoding/json" "errors" "fmt" + "github.com/gravitl/netmaker/utils" "io" "net/http" "time" @@ -205,55 +206,81 @@ func validateLicenseKey(encryptedData []byte, publicKey *[32]byte) ([]byte, bool return nil, false, err } - req, err := http.NewRequest( - http.MethodPost, - proLogic.GetAccountsHost()+"/api/v1/license/validate", - bytes.NewReader(requestBody), - ) - if err != nil { - return nil, false, err - } - req.Header.Add("Content-Type", "application/json") - req.Header.Add("Accept", "application/json") - client := &http.Client{} - validateResponse, err := client.Do(req) - if err != nil { // check cache - slog.Warn("proceeding with cached response, Netmaker API may be down") - cachedResp, err := getCachedResponse() - return cachedResp, false, err - } - defer validateResponse.Body.Close() - code := validateResponse.StatusCode - - // if we received a 200, cache the response locally - if code == http.StatusOK { - body, err := io.ReadAll(validateResponse.Body) - if err != nil { - slog.Warn("failed to parse response", "error", err) - return nil, false, err - } - if err := cacheResponse(body); err != nil { - slog.Warn("failed to cache response", "error", err) - } - return body, false, nil + var validateResponse *http.Response + var validationResponse []byte + var timedOut bool + + validationRetries := utils.RetryStrategy{ + WaitTime: time.Second * 5, + WaitTimeIncrease: time.Second * 2, + MaxTries: 15, + Wait: func(duration time.Duration) { + time.Sleep(duration) + }, + Try: func() error { + req, err := http.NewRequest( + http.MethodPost, + proLogic.GetAccountsHost()+"/api/v1/license/validate", + bytes.NewReader(requestBody), + ) + if err != nil { + return err + } + req.Header.Add("Content-Type", "application/json") + req.Header.Add("Accept", "application/json") + client := &http.Client{} + + validateResponse, err = client.Do(req) + if err != nil { + slog.Warn(fmt.Sprintf("error while validating license key: %v", err)) + return err + } + + if validateResponse.StatusCode == http.StatusServiceUnavailable || + validateResponse.StatusCode == http.StatusGatewayTimeout || + validateResponse.StatusCode == http.StatusBadGateway { + timedOut = true + return errors.New("failed to reach netmaker api") + } + + return nil + }, + OnMaxTries: func() { + slog.Warn("proceeding with cached response, Netmaker API may be down") + validationResponse, err = getCachedResponse() + timedOut = false + }, + OnSuccess: func() { + defer validateResponse.Body.Close() + + // if we received a 200, cache the response locally + if validateResponse.StatusCode == http.StatusOK { + validationResponse, err = io.ReadAll(validateResponse.Body) + if err != nil { + slog.Warn("failed to parse response", "error", err) + validationResponse = nil + timedOut = false + return + } + + if err := cacheResponse(validationResponse); err != nil { + slog.Warn("failed to cache response", "error", err) + } + } else { + // at this point the backend returned some undesired state + + // inform failure via logs + body, _ := io.ReadAll(validateResponse.Body) + err = fmt.Errorf("could not validate license with validation backend (status={%d}, body={%s})", + validateResponse.StatusCode, string(body)) + slog.Warn(err.Error()) + } + }, } - // at this point the backend returned some undesired state - - // inform failure via logs - body, _ := io.ReadAll(validateResponse.Body) - err = fmt.Errorf("could not validate license with validation backend (status={%d}, body={%s})", - validateResponse.StatusCode, string(body)) - slog.Warn(err.Error()) - - // try to use cache if we had a temporary error - if code == http.StatusServiceUnavailable || code == http.StatusGatewayTimeout || code == http.StatusBadGateway { - slog.Warn("Netmaker API may be down, will retry later...", "code", code) - return nil, true, nil - } + validationRetries.DoStrategy() - // at this point the error is irreversible, return it - return nil, false, err + return validationResponse, timedOut, err } func cacheResponse(response []byte) error { diff --git a/utils/utils.go b/utils/utils.go new file mode 100644 index 000000000..cb8c41d89 --- /dev/null +++ b/utils/utils.go @@ -0,0 +1,41 @@ +package utils + +import "time" + +// RetryStrategy specifies a strategy to retry an operation after waiting a while, +// with hooks for successful and unsuccessful (>=max) tries. +type RetryStrategy struct { + Wait func(time.Duration) + WaitTime time.Duration + WaitTimeIncrease time.Duration + MaxTries int + Try func() error + OnMaxTries func() + OnSuccess func() +} + +// DoStrategy does the retry strategy specified in the struct, waiting before retrying an operator, +// up to a max number of tries, and if executes a success "finalizer" operation if a retry is successful +func (rs RetryStrategy) DoStrategy() { + err := rs.Try() + if err == nil { + rs.OnSuccess() + return + } + + tries := 1 + for { + if tries >= rs.MaxTries { + rs.OnMaxTries() + return + } + rs.Wait(rs.WaitTime) + if err := rs.Try(); err != nil { + tries++ // we tried, increase count + rs.WaitTime += rs.WaitTimeIncrease // for the next time, sleep more + continue // retry + } + rs.OnSuccess() + return + } +}