add health probe that detects skew between 'real' system clock and 'monotonic' internal clock
Signed-off-by: Tim Ramlot <42113979+inteon@users.noreply.github.com>
This commit is contained in:
parent
d03c56f670
commit
8d75a003e9
@ -284,7 +284,7 @@ topologySpreadConstraints: []
|
||||
# controller-manager. See:
|
||||
# https://github.com/kubernetes/kubernetes/blob/806b30170c61a38fedd54cc9ede4cd6275a1ad3b/cmd/kubeadm/app/util/staticpod/utils.go#L241-L245
|
||||
livenessProbe:
|
||||
enabled: false
|
||||
enabled: true
|
||||
initialDelaySeconds: 10
|
||||
periodSeconds: 10
|
||||
timeoutSeconds: 15
|
||||
|
||||
64
pkg/healthz/clock_health.go
Normal file
64
pkg/healthz/clock_health.go
Normal file
@ -0,0 +1,64 @@
|
||||
/*
|
||||
Copyright 2020 The cert-manager Authors.
|
||||
|
||||
Licensed under the Apache License, Version 2.0 (the "License");
|
||||
you may not use this file except in compliance with the License.
|
||||
You may obtain a copy of the License at
|
||||
|
||||
http://www.apache.org/licenses/LICENSE-2.0
|
||||
|
||||
Unless required by applicable law or agreed to in writing, software
|
||||
distributed under the License is distributed on an "AS IS" BASIS,
|
||||
WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
|
||||
See the License for the specific language governing permissions and
|
||||
limitations under the License.
|
||||
*/
|
||||
|
||||
package healthz
|
||||
|
||||
import (
|
||||
"fmt"
|
||||
"net/http"
|
||||
"time"
|
||||
|
||||
"k8s.io/utils/clock"
|
||||
)
|
||||
|
||||
type clockHealthAdaptor struct {
|
||||
clock clock.Clock
|
||||
startTimeReal time.Time
|
||||
startTimeMonotonic time.Time
|
||||
}
|
||||
|
||||
func NewClockHealthAdaptor(c clock.Clock) *clockHealthAdaptor {
|
||||
return &clockHealthAdaptor{
|
||||
clock: c,
|
||||
startTimeReal: c.Now().Round(0), // .Round(0) removes the monotonic part from the time
|
||||
startTimeMonotonic: c.Now(),
|
||||
}
|
||||
}
|
||||
|
||||
func (c *clockHealthAdaptor) skew() time.Duration {
|
||||
realDuration := c.clock.Since(c.startTimeReal)
|
||||
monotonicDuration := c.clock.Since(c.startTimeMonotonic)
|
||||
|
||||
if monotonicDuration > realDuration {
|
||||
return monotonicDuration - realDuration
|
||||
}
|
||||
|
||||
return realDuration - monotonicDuration
|
||||
}
|
||||
|
||||
// Name returns the name of the health check we are implementing.
|
||||
func (l *clockHealthAdaptor) Name() string {
|
||||
return "clockHealth"
|
||||
}
|
||||
|
||||
// Check is called by the healthz endpoint handler.
|
||||
// It fails (returns an error) if we own the lease but had not been able to renew it.
|
||||
func (l *clockHealthAdaptor) Check(req *http.Request) error {
|
||||
if skew := l.skew(); skew > 1*time.Minute {
|
||||
return fmt.Errorf("the system clock is out of sync with the internal monotonic clock by %v, which is more than the allowed 1m", skew)
|
||||
}
|
||||
return nil
|
||||
}
|
||||
@ -26,6 +26,7 @@ import (
|
||||
"golang.org/x/sync/errgroup"
|
||||
"k8s.io/apiserver/pkg/server/healthz"
|
||||
"k8s.io/client-go/tools/leaderelection"
|
||||
"k8s.io/utils/clock"
|
||||
)
|
||||
|
||||
const (
|
||||
@ -51,8 +52,9 @@ type Server struct {
|
||||
// leader lease time, the leader election will be considered to have failed.
|
||||
func NewServer(leaderElectionHealthzAdaptorTimeout time.Duration) *Server {
|
||||
leaderHealthzAdaptor := leaderelection.NewLeaderHealthzAdaptor(leaderElectionHealthzAdaptorTimeout)
|
||||
clockHealthAdaptor := NewClockHealthAdaptor(clock.RealClock{})
|
||||
mux := http.NewServeMux()
|
||||
healthz.InstallLivezHandler(mux, leaderHealthzAdaptor)
|
||||
healthz.InstallLivezHandler(mux, leaderHealthzAdaptor, clockHealthAdaptor)
|
||||
return &Server{
|
||||
server: &http.Server{
|
||||
ReadTimeout: healthzServerReadTimeout,
|
||||
|
||||
Loading…
Reference in New Issue
Block a user