Files
open-cluster-management/pkg/registration/clientcert/cert_controller.go
Jian Qiu e810520961 🌱 Refactor code to fix lint warning (#218)
* Refactor code to fix lint warning

Signed-off-by: Jian Qiu <jqiu@redhat.com>

* enable lint for testing files

Signed-off-by: Jian Qiu <jqiu@redhat.com>

---------

Signed-off-by: Jian Qiu <jqiu@redhat.com>
2023-07-25 07:12:34 +02:00

420 lines
14 KiB
Go

package clientcert
import (
"context"
"crypto/tls"
"crypto/x509/pkix"
"fmt"
"math/rand"
"reflect"
"time"
"github.com/openshift/library-go/pkg/controller/factory"
"github.com/openshift/library-go/pkg/operator/events"
corev1 "k8s.io/api/core/v1"
apierrors "k8s.io/apimachinery/pkg/api/errors"
"k8s.io/apimachinery/pkg/api/meta"
metav1 "k8s.io/apimachinery/pkg/apis/meta/v1"
"k8s.io/apimachinery/pkg/runtime"
corev1informers "k8s.io/client-go/informers/core/v1"
corev1client "k8s.io/client-go/kubernetes/typed/core/v1"
certutil "k8s.io/client-go/util/cert"
"k8s.io/client-go/util/keyutil"
"k8s.io/klog/v2"
)
const (
// KubeconfigFile is the name of the kubeconfig file in kubeconfigSecret
KubeconfigFile = "kubeconfig"
// TLSKeyFile is the name of tls key file in kubeconfigSecret
TLSKeyFile = "tls.key"
// TLSCertFile is the name of the tls cert file in kubeconfigSecret
TLSCertFile = "tls.crt"
ClusterNameFile = "cluster-name"
AgentNameFile = "agent-name"
// ClusterCertificateRotatedCondition is a condition type that client certificate is rotated
ClusterCertificateRotatedCondition = "ClusterCertificateRotated"
)
// ControllerResyncInterval is exposed so that integration tests can crank up the constroller sync speed.
var ControllerResyncInterval = 5 * time.Minute
// CSROption includes options that is used to create and monitor csrs
type CSROption struct {
// ObjectMeta is the ObjectMeta shared by all created csrs. It should use GenerateName instead of Name
// to generate random csr names
ObjectMeta metav1.ObjectMeta
// Subject represents the subject of the client certificate used to create csrs
Subject *pkix.Name
// DNSNames represents DNS names used to create the client certificate
DNSNames []string
// SignerName is the name of the signer specified in the created csrs
SignerName string
// ExpirationSeconds is the requested duration of validity of the issued
// certificate.
// Certificate signers may not honor this field for various reasons:
//
// 1. Old signer that is unaware of the field (such as the in-tree
// implementations prior to v1.22)
// 2. Signer whose configured maximum is shorter than the requested duration
// 3. Signer whose configured minimum is longer than the requested duration
//
// The minimum valid value for expirationSeconds is 3600, i.e. 1 hour.
ExpirationSeconds *int32
// EventFilterFunc matches csrs created with above options
EventFilterFunc factory.EventFilterFunc
// HaltCSRCreation halt the csr creation
HaltCSRCreation func() bool
}
// ClientCertOption includes options that is used to create client certificate
type ClientCertOption struct {
// SecretNamespace is the namespace of the secret containing client certificate.
SecretNamespace string
// SecretName is the name of the secret containing client certificate. The secret will be created if
// it does not exist.
SecretName string
// AdditonalSecretData contains data that will be added into client certificate secret besides tls.key/tls.crt
AdditionalSecretData map[string][]byte
// AdditonalSecretDataSensitive is true indicates the client cert is sensitive to the AdditonalSecretData.
// That means once AdditonalSecretData changes, the client cert will be recreated.
AdditionalSecretDataSensitive bool
}
type StatusUpdateFunc func(ctx context.Context, cond metav1.Condition) error
// clientCertificateController implements the common logic of hub client certification creation/rotation. It
// creates a client certificate and rotates it before it becomes expired by using csrs. The client
// certificate generated is stored in a specific secret with the keys below:
// 1). tls.key: tls key file
// 2). tls.crt: tls cert file
type clientCertificateController struct {
ClientCertOption
CSROption
csrControl CSRControl
// managementCoreClient is used to create/delete hub kubeconfig secret on the management cluster
managementCoreClient corev1client.CoreV1Interface
controllerName string
// csrName is the name of csr created by controller and waiting for approval.
csrName string
// keyData is the private key data used to created a csr
// csrName and keyData store the internal state of the controller. They are set after controller creates a new csr
// and cleared once the csr is approved and processed by controller. There are 4 combination of their values:
// 1. csrName empty, keyData empty: means we aren't trying to create a new client cert, our current one is valid
// 2. csrName set, keyData empty: there was bug
// 3. csrName set, keyData set: we are waiting for a new cert to be signed.
// 4. csrName empty, keydata set: the CSR failed to create, this shouldn't happen, it's a bug.
keyData []byte
statusUpdater StatusUpdateFunc
}
// NewClientCertificateController return an instance of clientCertificateController
func NewClientCertificateController(
clientCertOption ClientCertOption,
csrOption CSROption,
csrControl CSRControl,
managementSecretInformer corev1informers.SecretInformer,
managementCoreClient corev1client.CoreV1Interface,
statusUpdater StatusUpdateFunc,
recorder events.Recorder,
controllerName string,
) factory.Controller {
c := clientCertificateController{
ClientCertOption: clientCertOption,
CSROption: csrOption,
csrControl: csrControl,
managementCoreClient: managementCoreClient,
controllerName: controllerName,
statusUpdater: statusUpdater,
}
return factory.New().
WithFilteredEventsInformersQueueKeyFunc(func(obj runtime.Object) string {
return factory.DefaultQueueKey
}, func(obj interface{}) bool {
accessor, err := meta.Accessor(obj)
if err != nil {
return false
}
// only enqueue a specific secret
if accessor.GetNamespace() == c.SecretNamespace && accessor.GetName() == c.SecretName {
return true
}
return false
}, managementSecretInformer.Informer()).
WithFilteredEventsInformersQueueKeyFunc(func(obj runtime.Object) string {
return factory.DefaultQueueKey
}, c.EventFilterFunc, csrControl.Informer()).
WithSync(c.sync).
ResyncEvery(ControllerResyncInterval).
ToController(controllerName, recorder)
}
func (c *clientCertificateController) sync(ctx context.Context, syncCtx factory.SyncContext) error {
// get secret containing client certificate
secret, err := c.managementCoreClient.Secrets(c.SecretNamespace).Get(ctx, c.SecretName, metav1.GetOptions{})
switch {
case apierrors.IsNotFound(err):
secret = &corev1.Secret{
ObjectMeta: metav1.ObjectMeta{
Namespace: c.SecretNamespace,
Name: c.SecretName,
},
}
case err != nil:
return fmt.Errorf("unable to get secret %q: %w", c.SecretNamespace+"/"+c.SecretName, err)
}
// reconcile pending csr if exists
if len(c.csrName) > 0 {
// build a secret data map if the csr is approved
newSecretConfig, err := func() (map[string][]byte, error) {
// skip if there is no ongoing csr
if len(c.csrName) == 0 {
return nil, fmt.Errorf("no ongoing csr")
}
// skip if csr is not approved yet
isApproved, err := c.csrControl.isApproved(c.csrName)
if err != nil {
return nil, err
}
if !isApproved {
return nil, nil
}
// skip if csr is not issued
certData, err := c.csrControl.getIssuedCertificate(c.csrName)
if err != nil {
return nil, err
}
if len(certData) == 0 {
return nil, nil
}
klog.V(4).Infof("Sync csr %v", c.csrName)
// check if cert in csr status matches with the corresponding private key
if c.keyData == nil {
return nil, fmt.Errorf("no private key found for certificate in csr: %s", c.csrName)
}
_, err = tls.X509KeyPair(certData, c.keyData)
if err != nil {
return nil, fmt.Errorf("private key does not match with the certificate in csr: %s", c.csrName)
}
data := map[string][]byte{
TLSCertFile: certData,
TLSKeyFile: c.keyData,
}
return data, nil
}()
if err != nil {
c.reset()
if updateErr := c.statusUpdater(ctx, metav1.Condition{
Type: "ClusterCertificateRotated",
Status: metav1.ConditionFalse,
Reason: "ClientCertificateUpdateFailed",
Message: fmt.Sprintf("Failed to rotated client certificate %v", err),
}); updateErr != nil {
return updateErr
}
return err
}
if len(newSecretConfig) == 0 {
return nil
}
// append additional data into client certificate secret
for k, v := range c.AdditionalSecretData {
newSecretConfig[k] = v
}
secret.Data = newSecretConfig
// save the changes into secret
if err := saveSecret(c.managementCoreClient, c.SecretNamespace, secret); err != nil {
if updateErr := c.statusUpdater(ctx, metav1.Condition{
Type: "ClusterCertificateRotated",
Status: metav1.ConditionFalse,
Reason: "ClientCertificateUpdateFailed",
Message: fmt.Sprintf("Failed to rotated client certificate %v", err),
}); updateErr != nil {
return updateErr
}
return err
}
notBefore, notAfter, err := getCertValidityPeriod(secret)
cond := metav1.Condition{
Type: "ClusterCertificateRotated",
Status: metav1.ConditionTrue,
Reason: "ClientCertificateUpdated",
Message: fmt.Sprintf("client certificate rotated starting from %v to %v", *notBefore, *notAfter),
}
if err != nil {
cond = metav1.Condition{
Type: "ClusterCertificateRotated",
Status: metav1.ConditionFalse,
Reason: "ClientCertificateUpdateFailed",
Message: fmt.Sprintf("Failed to rotated client certificate %v", err),
}
}
if updateErr := c.statusUpdater(ctx, cond); updateErr != nil {
return updateErr
}
if err != nil {
c.reset()
return err
}
syncCtx.Recorder().Eventf("ClientCertificateCreated", "A new client certificate for %s is available", c.controllerName)
c.reset()
return nil
}
// create a csr to request new client certificate if
// a. there is no valid client certificate issued for the current cluster/agent;
// b. client certificate is sensitive to the additional secret data and the data changes;
// c. client certificate exists and has less than a random percentage range from 20% to 25% of its life remaining;
shouldCreate, err := shouldCreateCSR(
c.controllerName,
secret,
syncCtx.Recorder(),
c.Subject,
c.AdditionalSecretDataSensitive,
c.AdditionalSecretData)
if err != nil {
return err
}
if !shouldCreate {
return nil
}
shouldHalt := c.CSROption.HaltCSRCreation()
if shouldHalt {
if updateErr := c.statusUpdater(ctx, metav1.Condition{
Type: "ClusterCertificateRotated",
Status: metav1.ConditionFalse,
Reason: "ClientCertificateUpdateFailed",
Message: "Stop creating csr since there are too many csr created already on hub",
}); updateErr != nil {
return updateErr
}
return nil
}
// create a new private key
keyData, err := keyutil.MakeEllipticPrivateKeyPEM()
if err != nil {
return err
}
privateKey, err := keyutil.ParsePrivateKeyPEM(keyData)
if err != nil {
return fmt.Errorf("invalid private key for certificate request: %w", err)
}
csrData, err := certutil.MakeCSR(privateKey, c.Subject, c.DNSNames, nil)
if err != nil {
return fmt.Errorf("unable to generate certificate request: %w", err)
}
createdCSRName, err := c.csrControl.create(ctx, syncCtx.Recorder(), c.ObjectMeta, csrData, c.SignerName, c.ExpirationSeconds)
if err != nil {
return err
}
c.keyData = keyData
c.csrName = createdCSRName
return nil
}
func saveSecret(spokeCoreClient corev1client.CoreV1Interface, secretNamespace string, secret *corev1.Secret) error {
var err error
if secret.ResourceVersion == "" {
_, err = spokeCoreClient.Secrets(secretNamespace).Create(context.Background(), secret, metav1.CreateOptions{})
return err
}
_, err = spokeCoreClient.Secrets(secretNamespace).Update(context.Background(), secret, metav1.UpdateOptions{})
return err
}
func (c *clientCertificateController) reset() {
c.csrName = ""
c.keyData = nil
}
func shouldCreateCSR(
controllerName string,
secret *corev1.Secret,
recorder events.Recorder,
subject *pkix.Name,
additionalSecretDataSensitive bool,
additionalSecretData map[string][]byte) (bool, error) {
switch {
case !hasValidClientCertificate(subject, secret):
recorder.Eventf("NoValidCertificateFound",
"No valid client certificate for %s is found. Bootstrap is required", controllerName)
case additionalSecretDataSensitive && !hasAdditionalSecretData(additionalSecretData, secret):
recorder.Eventf("AdditonalSecretDataChanged",
"The additional secret data is changed. Re-create the client certificate for %s", controllerName)
default:
notBefore, notAfter, err := getCertValidityPeriod(secret)
if err != nil {
return false, err
}
total := notAfter.Sub(*notBefore)
remaining := time.Until(*notAfter)
klog.V(4).Infof("Client certificate for %s: time total=%v, remaining=%v, remaining/total=%v",
controllerName, total, remaining, remaining.Seconds()/total.Seconds())
threshold := jitter(0.2, 0.25)
if remaining.Seconds()/total.Seconds() > threshold {
// Do nothing if the client certificate is valid and has more than a random percentage range from 20% to 25% of its life remaining
klog.V(4).Infof("Client certificate for %s is valid and has more than %.2f%% of its life remaining", controllerName, threshold*100)
return false, nil
}
recorder.Eventf("CertificateRotationStarted",
"The current client certificate for %s expires in %v. Start certificate rotation",
controllerName, remaining.Round(time.Second))
}
return true, nil
}
// hasAdditonalSecretData checks if the secret includes the expected additional secret data.
func hasAdditionalSecretData(additionalSecretData map[string][]byte, secret *corev1.Secret) bool {
for k, v := range additionalSecretData {
value, ok := secret.Data[k]
if !ok {
return false
}
if !reflect.DeepEqual(v, value) {
return false
}
}
return true
}
func jitter(percentage float64, maxFactor float64) float64 {
if maxFactor <= 0.0 {
maxFactor = 1.0
}
newPercentage := percentage + percentage*rand.Float64()*maxFactor //#nosec G404
return newPercentage
}
func hasValidClientCertificate(subject *pkix.Name, secret *corev1.Secret) bool {
if valid, err := IsCertificateValid(secret.Data[TLSCertFile], subject); err == nil {
return valid
}
return false
}