Skip to content

Commit

Permalink
feat(konnect): handle BadRequest errors and other unrecoverable error…
Browse files Browse the repository at this point in the history
…s to prevent endless reconciliation
  • Loading branch information
pmalek committed Oct 24, 2024
1 parent 924f43f commit a1f22eb
Show file tree
Hide file tree
Showing 3 changed files with 360 additions and 63 deletions.
49 changes: 44 additions & 5 deletions controller/konnect/ops/ops.go
Original file line number Diff line number Diff line change
Expand Up @@ -6,6 +6,7 @@ import (
"fmt"
"time"

sdkkonnecterrs "github.com/Kong/sdk-konnect-go/models/sdkerrors"
metav1 "k8s.io/apimachinery/pkg/apis/meta/v1"
ctrl "sigs.k8s.io/controller-runtime"
"sigs.k8s.io/controller-runtime/pkg/client"
Expand Down Expand Up @@ -102,7 +103,10 @@ func Create[
return nil, fmt.Errorf("unsupported entity type %T", ent)
}

var errRelationsFailed KonnectEntityCreatedButRelationsFailedError
var (
errRelationsFailed KonnectEntityCreatedButRelationsFailedError
errSDK *sdkkonnecterrs.SDKError
)
switch {
case ErrorIsCreateConflict(err):
// If there was a conflict on the create request, we can assume the entity already exists.
Expand Down Expand Up @@ -161,8 +165,17 @@ func Create[
} else {
SetKonnectEntityProgrammedConditionFalse(e, consts.KonnectEntitiesFailedToCreateReason, err.Error())
}

case errors.As(err, &errSDK):
switch {
case ErrorIsSDKErrorTypeField(err):
SetKonnectEntityProgrammedConditionFalse(e, consts.KonnectEntitiesFailedToCreateReason, errSDK.Error())
default:
SetKonnectEntityProgrammedConditionFalse(e, consts.KonnectEntitiesFailedToCreateReason, err.Error())
}

case errors.As(err, &errRelationsFailed):
SetKonnectEntityProgrammedConditionFalse(e, errRelationsFailed.Reason, err.Error())
SetKonnectEntityProgrammedConditionFalse(e, errRelationsFailed.Reason, errRelationsFailed.Err.Error())
case err != nil:
SetKonnectEntityProgrammedConditionFalse(e, consts.KonnectEntitiesFailedToCreateReason, err.Error())
default:
Expand All @@ -171,6 +184,14 @@ func Create[

logOpComplete(ctx, start, CreateOp, e, err)

// If the error is a type field error or bad request error, then don't propagate
// it to the caller.
// We cannot recover from this error as this requires user to change object's
// manifest. The entity's status is already updated with the error.
if ErrorIsSDKErrorTypeField(err) || ErrorIsSDKBadRequestError(err) {
err = nil
}

return e, err
}

Expand Down Expand Up @@ -242,7 +263,7 @@ func Delete[
return fmt.Errorf("unsupported entity type %T", ent)
}

logOpComplete[T, TEnt](ctx, start, DeleteOp, ent, err)
logOpComplete(ctx, start, DeleteOp, ent, err)

return err
}
Expand Down Expand Up @@ -360,8 +381,18 @@ func Update[
return ctrl.Result{}, fmt.Errorf("unsupported entity type %T", ent)
}

var errRelationsFailed KonnectEntityCreatedButRelationsFailedError
var (
errRelationsFailed KonnectEntityCreatedButRelationsFailedError
errSDK *sdkkonnecterrs.SDKError
)
switch {
case errors.As(err, &errSDK):
switch {
case ErrorIsSDKErrorTypeField(err):
SetKonnectEntityProgrammedConditionFalse(e, consts.KonnectEntitiesFailedToUpdateReason, errSDK.Body)
default:
SetKonnectEntityProgrammedConditionFalse(e, consts.KonnectEntitiesFailedToUpdateReason, err.Error())
}
case errors.As(err, &errRelationsFailed):
e.SetKonnectID(errRelationsFailed.KonnectID)
SetKonnectEntityProgrammedConditionFalse(e, errRelationsFailed.Reason, err.Error())
Expand All @@ -371,7 +402,15 @@ func Update[
SetKonnectEntityProgrammedCondition(e)
}

logOpComplete[T, TEnt](ctx, now, UpdateOp, e, err)
logOpComplete(ctx, now, UpdateOp, e, err)

// If the error is a type field error or bad request error, then don't propagate
// it to the caller.
// We cannot recover from this error as this requires user to change object's
// manifest. The entity's status is already updated with the error.
if ErrorIsSDKErrorTypeField(err) || ErrorIsSDKBadRequestError(err) {
err = nil
}

return ctrl.Result{}, err
}
Expand Down
140 changes: 82 additions & 58 deletions controller/konnect/ops/ops_errors.go
Original file line number Diff line number Diff line change
Expand Up @@ -6,6 +6,7 @@ import (
"errors"
"fmt"
"net/http"
"slices"

sdkkonnecterrs "github.com/Kong/sdk-konnect-go/models/sdkerrors"
"sigs.k8s.io/controller-runtime/pkg/client"
Expand Down Expand Up @@ -51,15 +52,17 @@ func (e CantPerformOperationWithoutControlPlaneIDError) Error() string {
)
}

type sdkErrorDetails struct {
TypeAt string `json:"@type"`
Type string `json:"type"`
Field string `json:"field"`
Messages []string `json:"messages"`
}

type sdkErrorBody struct {
Code int `json:"code"`
Message string `json:"message"`
Details []struct {
TypeAt string `json:"@type"`
Type string `json:"type"`
Field string `json:"field"`
Messages []string `json:"messages"`
} `json:"details"`
Code int `json:"code"`
Message string `json:"message"`
Details []sdkErrorDetails `json:"details"`
}

// ParseSDKErrorBody parses the body of an SDK error response.
Expand Down Expand Up @@ -88,6 +91,62 @@ func ParseSDKErrorBody(body string) (sdkErrorBody, error) {
return sdkErr, nil
}

const (
dataConstraintMesasge = "data constraint error"
validationErrorMessage = "validation error"
)

// ErrorIsSDKErrorTypeField returns true if the provided error is a type field error.
// These types of errors are unrecoverable and should be covered by CEL validation
// rules on CRDs but just in case some of those are left unhandled we can handle
// them by reacting to SDKErrors of type ERROR_TYPE_FIELD.
//
// Exemplary body:
//
// {
// "code": 3,
// "message": "validation error",
// "details": [
// {
// "@type": "type.googleapis.com/kong.admin.model.v1.ErrorDetail",
// "type": "ERROR_TYPE_FIELD",
// "field": "tags[0]",
// "messages": [
// "length must be <= 128, but got 138"
// ]
// }
// ]
// }
func ErrorIsSDKErrorTypeField(err error) bool {
var errSDK *sdkkonnecterrs.SDKError
if !errors.As(err, &errSDK) {
return false
}

errSDKBody, err := ParseSDKErrorBody(errSDK.Body)
if err != nil {
return false
}

if errSDKBody.Message != validationErrorMessage {
return false
}

if !slices.ContainsFunc(errSDKBody.Details, func(d sdkErrorDetails) bool {
return d.Type == "ERROR_TYPE_FIELD"
}) {
return false
}

return true
}

// ErrorIsSDKBadRequestError returns true if the provided error is a BadRequestError.
func ErrorIsSDKBadRequestError(err error) bool {
var errSDK *sdkkonnecterrs.BadRequestError
return errors.As(err, &errSDK)
}

// ErrorIsCreateConflict returns true if the provided error is a Konnect conflict error.
//
// NOTE: Konnect APIs specific for Konnect only APIs like Gateway Control Planes
Expand All @@ -114,10 +173,6 @@ func SDKErrorIsConflict(sdkError *sdkkonnecterrs.SDKError) bool {
return false
}

const (
dataConstraintMesasge = "data constraint error"
)

if sdkErrorBody.Message != dataConstraintMesasge {
return false
}
Expand All @@ -129,6 +184,15 @@ func SDKErrorIsConflict(sdkError *sdkkonnecterrs.SDKError) bool {
return false
}

func errIsNotFound(err error) bool {
var (
notFoundError *sdkkonnecterrs.NotFoundError
sdkError *sdkkonnecterrs.SDKError
)
return errors.As(err, &notFoundError) ||
errors.As(err, &sdkError) && sdkError.StatusCode == http.StatusNotFound
}

// handleUpdateError handles errors that occur during an update operation.
// If the entity is not found, then it uses the provided create function to
// recreate the it.
Expand All @@ -141,41 +205,17 @@ func handleUpdateError[
ent TEnt,
createFunc func(ctx context.Context) error,
) error {
var (
sdkError *sdkkonnecterrs.SDKError
id = ent.GetKonnectStatus().GetKonnectID()
)
if errors.As(err, &sdkError) {
switch sdkError.StatusCode {
case http.StatusNotFound:
logEntityNotFoundRecreating(ctx, ent, id)
if err := createFunc(ctx); err != nil {
return FailedKonnectOpError[T]{
Op: UpdateOp,
Err: err,
}
}
return nil
default:
return FailedKonnectOpError[T]{
Op: UpdateOp,
Err: sdkError,
}
}
}

var notFoundError *sdkkonnecterrs.NotFoundError
if errors.As(err, &notFoundError) {
if errIsNotFound(err) {
id := ent.GetKonnectStatus().GetKonnectID()
logEntityNotFoundRecreating(ctx, ent, id)
if err := createFunc(ctx); err != nil {
if createErr := createFunc(ctx); createErr != nil {
return FailedKonnectOpError[T]{
Op: UpdateOp,
Err: err,
Op: CreateOp,
Err: fmt.Errorf("failed to create %s %s: %w", ent.GetTypeName(), id, createErr),
}
}
return nil
}

return FailedKonnectOpError[T]{
Op: UpdateOp,
Err: err,
Expand All @@ -189,32 +229,16 @@ func handleDeleteError[
T constraints.SupportedKonnectEntityType,
TEnt constraints.EntityType[T],
](ctx context.Context, err error, ent TEnt) error {
logDeleteSkipped := func() {
if errIsNotFound(err) {
ctrllog.FromContext(ctx).
Info("entity not found in Konnect, skipping delete",
"op", DeleteOp,
"type", ent.GetTypeName(),
"id", ent.GetKonnectStatus().GetKonnectID(),
)
}

var sdkNotFoundError *sdkkonnecterrs.NotFoundError
if errors.As(err, &sdkNotFoundError) {
logDeleteSkipped()
return nil
}

var sdkError *sdkkonnecterrs.SDKError
if errors.As(err, &sdkError) {
if sdkError.StatusCode == http.StatusNotFound {
logDeleteSkipped()
return nil
}
return FailedKonnectOpError[T]{
Op: DeleteOp,
Err: sdkError,
}
}
return FailedKonnectOpError[T]{
Op: DeleteOp,
Err: err,
Expand Down
Loading

0 comments on commit a1f22eb

Please sign in to comment.