Merge pull request #5148 from yifan-gu/clean_prober

Refactor pkg/kubelet/kubelet.go: probeContainer().
This commit is contained in:
Victor Marmol 2015-03-06 17:04:57 -08:00
commit 798513844c
3 changed files with 297 additions and 92 deletions

View File

@ -1202,36 +1202,17 @@ func (kl *Kubelet) syncPod(pod *api.BoundPod, containersInPod dockertools.Docker
// look for changes in the container. // look for changes in the container.
containerChanged := hash != 0 && hash != expectedHash containerChanged := hash != 0 && hash != expectedHash
if !containerChanged { if !containerChanged {
// TODO: This should probably be separated out into a separate goroutine. result, err := kl.probeContainer(pod, podStatus, container, dockerContainer)
// If the container's liveness probe is unsuccessful, set readiness to false. If liveness is successful, do a readiness check and set
// readiness accordingly. If the initial delay since container creation on the liveness probe has not passed, the probe will return Success.
// If the initial delay on the readiness probe has not passed the probe will return Failure.
ready := probe.Unknown
live, err := kl.probeContainer(container.LivenessProbe, podFullName, uid, podStatus, container, dockerContainer, probe.Success)
if live == probe.Success {
ready, _ = kl.probeContainer(container.ReadinessProbe, podFullName, uid, podStatus, container, dockerContainer, probe.Failure)
}
if err != nil { if err != nil {
glog.V(1).Infof("liveness/readiness probe errored: %v", err) glog.V(1).Infof("liveness/readiness probe errored: %v", err)
containersInPod.RemoveContainerWithID(containerID) containersInPod.RemoveContainerWithID(containerID)
continue continue
} }
if ready == probe.Success { if result == probe.Success {
kl.readiness.set(dockerContainer.ID, true)
} else {
kl.readiness.set(dockerContainer.ID, false)
}
if live == probe.Success {
containersInPod.RemoveContainerWithID(containerID) containersInPod.RemoveContainerWithID(containerID)
continue continue
} }
ref, ok := kl.getRef(containerID) glog.Infof("pod %q container %q is unhealthy (probe result: %v). Container will be killed and re-created.", podFullName, container.Name, result)
if !ok {
glog.Warningf("No ref for pod '%v' - '%v'", containerID, container.Name)
} else {
kl.recorder.Eventf(ref, "unhealthy", "Liveness Probe Failed %v - %v", containerID, container.Name)
}
glog.Infof("pod %q container %q is unhealthy (probe result: %v). Container will be killed and re-created.", podFullName, container.Name, live)
} else { } else {
glog.Infof("pod %q container %q hash changed (%d vs %d). Container will be killed and re-created.", podFullName, container.Name, hash, expectedHash) glog.Infof("pod %q container %q hash changed (%d vs %d). Container will be killed and re-created.", podFullName, container.Name, hash, expectedHash)
// Also kill associated pod infra container if the container changed. // Also kill associated pod infra container if the container changed.

View File

@ -24,53 +24,102 @@ import (
"time" "time"
"github.com/GoogleCloudPlatform/kubernetes/pkg/api" "github.com/GoogleCloudPlatform/kubernetes/pkg/api"
"github.com/GoogleCloudPlatform/kubernetes/pkg/kubelet/dockertools"
"github.com/GoogleCloudPlatform/kubernetes/pkg/probe" "github.com/GoogleCloudPlatform/kubernetes/pkg/probe"
execprobe "github.com/GoogleCloudPlatform/kubernetes/pkg/probe/exec" execprobe "github.com/GoogleCloudPlatform/kubernetes/pkg/probe/exec"
httprobe "github.com/GoogleCloudPlatform/kubernetes/pkg/probe/http" httprobe "github.com/GoogleCloudPlatform/kubernetes/pkg/probe/http"
tcprobe "github.com/GoogleCloudPlatform/kubernetes/pkg/probe/tcp" tcprobe "github.com/GoogleCloudPlatform/kubernetes/pkg/probe/tcp"
"github.com/GoogleCloudPlatform/kubernetes/pkg/types"
"github.com/GoogleCloudPlatform/kubernetes/pkg/util" "github.com/GoogleCloudPlatform/kubernetes/pkg/util"
"github.com/GoogleCloudPlatform/kubernetes/pkg/util/exec" "github.com/GoogleCloudPlatform/kubernetes/pkg/util/exec"
"github.com/fsouza/go-dockerclient" "github.com/fsouza/go-dockerclient"
"github.com/golang/glog" "github.com/golang/glog"
) )
const maxProbeRetries = 3 const maxProbeRetries = 3
// probeContainer executes the given probe on a container and returns the result. // probeContainer probes the liveness/readiness of the given container.
// If the probe is nil this returns Success. If the probe's initial delay has not passed // If the container's liveness probe is unsuccessful, set readiness to false.
// since the creation of the container, this returns the defaultResult. It will then attempt // If liveness is successful, do a readiness check and set readiness accordingly.
// to execute the probe repeatedly up to maxProbeRetries times, and return on the first func (kl *Kubelet) probeContainer(pod *api.BoundPod, status api.PodStatus, container api.Container, dockerContainer *docker.APIContainers) (probe.Result, error) {
// successful result, else returning the last unsucessful result and error. // Probe liveness.
func (kl *Kubelet) probeContainer(p *api.Probe, live, err := kl.probeContainerLiveness(pod, status, container, dockerContainer)
podFullName string, if err != nil {
podUID types.UID, glog.V(1).Infof("liveness probe errored: %v", err)
status api.PodStatus, kl.readiness.set(dockerContainer.ID, false)
container api.Container, return probe.Unknown, err
dockerContainer *docker.APIContainers, }
defaultResult probe.Result) (probe.Result, error) { if live != probe.Success {
var err error glog.V(1).Infof("liveness probe unsuccessful: %v", live)
result := probe.Unknown kl.readiness.set(dockerContainer.ID, false)
return live, nil
}
// Probe readiness.
ready, err := kl.probeContainerReadiness(pod, status, container, dockerContainer)
if err == nil && ready == probe.Success {
glog.V(1).Infof("readiness probe successful: %v", ready)
kl.readiness.set(dockerContainer.ID, true)
return probe.Success, nil
}
glog.V(1).Infof("readiness probe failed/errored: %v, %v", ready, err)
kl.readiness.set(dockerContainer.ID, false)
containerID := dockertools.DockerID(dockerContainer.ID)
ref, ok := kl.getRef(containerID)
if !ok {
glog.Warningf("No ref for pod '%v' - '%v'", containerID, container.Name)
} else {
kl.recorder.Eventf(ref, "unhealthy", "Liveness Probe Failed %v - %v", containerID, container.Name)
}
return ready, err
}
// probeContainerLiveness probes the liveness of a container.
// If the liveness probe's initial delay since container creation has not yet passed, the probe returns probe.Success.
func (kl *Kubelet) probeContainerLiveness(pod *api.BoundPod, status api.PodStatus, container api.Container, dockerContainer *docker.APIContainers) (probe.Result, error) {
p := container.LivenessProbe
if p == nil { if p == nil {
return probe.Success, nil return probe.Success, nil
} }
if time.Now().Unix()-dockerContainer.Created < p.InitialDelaySeconds { if time.Now().Unix()-dockerContainer.Created < p.InitialDelaySeconds {
return defaultResult, nil return probe.Success, nil
} }
for i := 0; i < maxProbeRetries; i++ { return kl.runProbeWithRetries(p, pod, status, container, maxProbeRetries)
result, err = kl.runProbe(p, podFullName, podUID, status, container) }
// probeContainerReadiness probes the readiness of a container.
// It returns probe.Success when the container declares no readiness probe, and
// probe.Failure while the readiness probe's initial delay has not yet passed.
// Otherwise it runs the readiness probe through runProbeWithRetries, bounded by
// maxProbeRetries, and returns that call's result and error.
func (kl *Kubelet) probeContainerReadiness(pod *api.BoundPod, status api.PodStatus, container api.Container, dockerContainer *docker.APIContainers) (probe.Result, error) {
p := container.ReadinessProbe
if p == nil {
// No readiness probe configured for this container.
return probe.Success, nil
}
// Seconds elapsed since dockerContainer.Created, compared against the probe's InitialDelaySeconds.
if time.Now().Unix()-dockerContainer.Created < p.InitialDelaySeconds {
// Still inside the initial delay window: report Failure without running the probe.
return probe.Failure, nil
}
return kl.runProbeWithRetries(p, pod, status, container, maxProbeRetries)
}
// runProbeWithRetries probes the container up to the given number of times, returning as soon as
// a probe succeeds; if none succeeds, it returns the last result and error.
func (kl *Kubelet) runProbeWithRetries(p *api.Probe, pod *api.BoundPod, status api.PodStatus, container api.Container, retires int) (probe.Result, error) {
var err error
var result probe.Result
for i := 0; i < retires; i++ {
result, err = kl.runProbe(p, pod, status, container)
if result == probe.Success { if result == probe.Success {
return result, err return probe.Success, nil
} }
} }
return result, err return result, err
} }
func (kl *Kubelet) runProbe(p *api.Probe, podFullName string, podUID types.UID, status api.PodStatus, container api.Container) (probe.Result, error) { func (kl *Kubelet) runProbe(p *api.Probe, pod *api.BoundPod, status api.PodStatus, container api.Container) (probe.Result, error) {
timeout := time.Duration(p.TimeoutSeconds) * time.Second timeout := time.Duration(p.TimeoutSeconds) * time.Second
if p.Exec != nil { if p.Exec != nil {
return kl.prober.exec.Probe(kl.newExecInContainer(podFullName, podUID, container)) return kl.prober.exec.Probe(kl.newExecInContainer(pod, container))
} }
if p.HTTPGet != nil { if p.HTTPGet != nil {
port, err := extractPort(p.HTTPGet.Port, container) port, err := extractPort(p.HTTPGet.Port, container)
@ -141,9 +190,11 @@ type execInContainer struct {
run func() ([]byte, error) run func() ([]byte, error)
} }
func (kl *Kubelet) newExecInContainer(podFullName string, podUID types.UID, container api.Container) exec.Cmd { func (kl *Kubelet) newExecInContainer(pod *api.BoundPod, container api.Container) exec.Cmd {
uid := pod.UID
podFullName := GetPodFullName(pod)
return execInContainer{func() ([]byte, error) { return execInContainer{func() ([]byte, error) {
return kl.RunInContainer(podFullName, podUID, container.Name, container.LivenessProbe.Exec.Command) return kl.RunInContainer(podFullName, uid, container.Name, container.LivenessProbe.Exec.Command)
}} }}
} }

View File

@ -23,7 +23,6 @@ import (
"github.com/GoogleCloudPlatform/kubernetes/pkg/api" "github.com/GoogleCloudPlatform/kubernetes/pkg/api"
"github.com/GoogleCloudPlatform/kubernetes/pkg/probe" "github.com/GoogleCloudPlatform/kubernetes/pkg/probe"
"github.com/GoogleCloudPlatform/kubernetes/pkg/types"
"github.com/GoogleCloudPlatform/kubernetes/pkg/util" "github.com/GoogleCloudPlatform/kubernetes/pkg/util"
"github.com/GoogleCloudPlatform/kubernetes/pkg/util/exec" "github.com/GoogleCloudPlatform/kubernetes/pkg/util/exec"
@ -147,6 +146,7 @@ func (p fakeExecProber) Probe(_ exec.Cmd) (probe.Result, error) {
func makeTestKubelet(result probe.Result, err error) *Kubelet { func makeTestKubelet(result probe.Result, err error) *Kubelet {
return &Kubelet{ return &Kubelet{
readiness: newReadinessStates(),
prober: probeHolder{ prober: probeHolder{
exec: fakeExecProber{ exec: fakeExecProber{
result: result, result: result,
@ -156,68 +156,239 @@ func makeTestKubelet(result probe.Result, err error) *Kubelet {
} }
} }
// TestProbeContainer tests the functionality of probeContainer.
// Test cases are:
//
// No probe.
// Only LivenessProbe.
// Only ReadinessProbe.
// Both probes.
//
// Also, for each probe, there will be several cases covering whether the initial
// delay has passed, whether the probe handler will return Success, Failure,
// Unknown or error.
//
func TestProbeContainer(t *testing.T) { func TestProbeContainer(t *testing.T) {
dc := &docker.APIContainers{Created: time.Now().Unix()} dc := &docker.APIContainers{
ID: "foobar",
Created: time.Now().Unix(),
}
tests := []struct { tests := []struct {
p *api.Probe testContainer api.Container
defaultResult probe.Result
expectError bool expectError bool
expectedResult probe.Result expectedResult probe.Result
expectedReadiness bool
}{ }{
// No probes.
{ {
defaultResult: probe.Success, testContainer: api.Container{},
expectedResult: probe.Success, expectedResult: probe.Success,
expectedReadiness: true,
}, },
// Only LivenessProbe.
{ {
defaultResult: probe.Failure, testContainer: api.Container{
LivenessProbe: &api.Probe{InitialDelaySeconds: 100},
},
expectedResult: probe.Success, expectedResult: probe.Success,
expectedReadiness: true,
}, },
{ {
p: &api.Probe{InitialDelaySeconds: 100}, testContainer: api.Container{
defaultResult: probe.Failure, LivenessProbe: &api.Probe{InitialDelaySeconds: -100},
expectError: false,
expectedResult: probe.Failure,
}, },
{
p: &api.Probe{
InitialDelaySeconds: -100,
},
defaultResult: probe.Failure,
expectError: false,
expectedResult: probe.Unknown, expectedResult: probe.Unknown,
expectedReadiness: false,
}, },
{ {
p: &api.Probe{ testContainer: api.Container{
LivenessProbe: &api.Probe{
InitialDelaySeconds: -100, InitialDelaySeconds: -100,
Handler: api.Handler{ Handler: api.Handler{
Exec: &api.ExecAction{}, Exec: &api.ExecAction{},
}, },
}, },
defaultResult: probe.Failure, },
expectError: false, expectedResult: probe.Failure,
expectedReadiness: false,
},
{
testContainer: api.Container{
LivenessProbe: &api.Probe{
InitialDelaySeconds: -100,
Handler: api.Handler{
Exec: &api.ExecAction{},
},
},
},
expectedResult: probe.Success, expectedResult: probe.Success,
expectedReadiness: true,
}, },
{ {
p: &api.Probe{ testContainer: api.Container{
LivenessProbe: &api.Probe{
InitialDelaySeconds: -100, InitialDelaySeconds: -100,
Handler: api.Handler{ Handler: api.Handler{
Exec: &api.ExecAction{}, Exec: &api.ExecAction{},
}, },
}, },
defaultResult: probe.Failure, },
expectedResult: probe.Unknown,
expectedReadiness: false,
},
{
testContainer: api.Container{
LivenessProbe: &api.Probe{
InitialDelaySeconds: -100,
Handler: api.Handler{
Exec: &api.ExecAction{},
},
},
},
expectError: true, expectError: true,
expectedResult: probe.Unknown, expectedResult: probe.Unknown,
expectedReadiness: false,
},
// Only ReadinessProbe.
{
testContainer: api.Container{
ReadinessProbe: &api.Probe{InitialDelaySeconds: 100},
},
expectedResult: probe.Failure,
expectedReadiness: false,
}, },
{ {
p: &api.Probe{ testContainer: api.Container{
ReadinessProbe: &api.Probe{InitialDelaySeconds: -100},
},
expectedResult: probe.Unknown,
expectedReadiness: false,
},
{
testContainer: api.Container{
ReadinessProbe: &api.Probe{
InitialDelaySeconds: -100, InitialDelaySeconds: -100,
Handler: api.Handler{ Handler: api.Handler{
Exec: &api.ExecAction{}, Exec: &api.ExecAction{},
}, },
}, },
defaultResult: probe.Success, },
expectError: false,
expectedResult: probe.Failure, expectedResult: probe.Failure,
expectedReadiness: false,
},
{
testContainer: api.Container{
ReadinessProbe: &api.Probe{
InitialDelaySeconds: -100,
Handler: api.Handler{
Exec: &api.ExecAction{},
},
},
},
expectedResult: probe.Success,
expectedReadiness: true,
},
{
testContainer: api.Container{
ReadinessProbe: &api.Probe{
InitialDelaySeconds: -100,
Handler: api.Handler{
Exec: &api.ExecAction{},
},
},
},
expectedResult: probe.Unknown,
expectedReadiness: false,
},
{
testContainer: api.Container{
ReadinessProbe: &api.Probe{
InitialDelaySeconds: -100,
Handler: api.Handler{
Exec: &api.ExecAction{},
},
},
},
expectError: true,
expectedResult: probe.Unknown,
expectedReadiness: false,
},
// Both LivenessProbe and ReadinessProbe.
{
testContainer: api.Container{
LivenessProbe: &api.Probe{InitialDelaySeconds: 100},
ReadinessProbe: &api.Probe{InitialDelaySeconds: 100},
},
expectedResult: probe.Failure,
expectedReadiness: false,
},
{
testContainer: api.Container{
LivenessProbe: &api.Probe{InitialDelaySeconds: 100},
ReadinessProbe: &api.Probe{InitialDelaySeconds: -100},
},
expectedResult: probe.Unknown,
expectedReadiness: false,
},
{
testContainer: api.Container{
LivenessProbe: &api.Probe{InitialDelaySeconds: -100},
ReadinessProbe: &api.Probe{InitialDelaySeconds: 100},
},
expectedResult: probe.Unknown,
expectedReadiness: false,
},
{
testContainer: api.Container{
LivenessProbe: &api.Probe{InitialDelaySeconds: -100},
ReadinessProbe: &api.Probe{InitialDelaySeconds: -100},
},
expectedResult: probe.Unknown,
expectedReadiness: false,
},
{
testContainer: api.Container{
LivenessProbe: &api.Probe{
InitialDelaySeconds: -100,
Handler: api.Handler{
Exec: &api.ExecAction{},
},
},
ReadinessProbe: &api.Probe{InitialDelaySeconds: -100},
},
expectedResult: probe.Unknown,
expectedReadiness: false,
},
{
testContainer: api.Container{
LivenessProbe: &api.Probe{
InitialDelaySeconds: -100,
Handler: api.Handler{
Exec: &api.ExecAction{},
},
},
ReadinessProbe: &api.Probe{InitialDelaySeconds: -100},
},
expectedResult: probe.Failure,
expectedReadiness: false,
},
{
testContainer: api.Container{
LivenessProbe: &api.Probe{
InitialDelaySeconds: -100,
Handler: api.Handler{
Exec: &api.ExecAction{},
},
},
ReadinessProbe: &api.Probe{
InitialDelaySeconds: -100,
Handler: api.Handler{
Exec: &api.ExecAction{},
},
},
},
expectedResult: probe.Success,
expectedReadiness: true,
}, },
} }
@ -229,8 +400,7 @@ func TestProbeContainer(t *testing.T) {
} else { } else {
kl = makeTestKubelet(test.expectedResult, nil) kl = makeTestKubelet(test.expectedResult, nil)
} }
result, err := kl.probeContainer(&api.BoundPod{}, api.PodStatus{}, test.testContainer, dc)
result, err := kl.probeContainer(test.p, "", types.UID(""), api.PodStatus{}, api.Container{}, dc, test.defaultResult)
if test.expectError && err == nil { if test.expectError && err == nil {
t.Error("Expected error but did no error was returned.") t.Error("Expected error but did no error was returned.")
} }
@ -240,5 +410,8 @@ func TestProbeContainer(t *testing.T) {
if test.expectedResult != result { if test.expectedResult != result {
t.Errorf("Expected result was %v but probeContainer() returned %v", test.expectedResult, result) t.Errorf("Expected result was %v but probeContainer() returned %v", test.expectedResult, result)
} }
if test.expectedReadiness != kl.readiness.get(dc.ID) {
t.Errorf("Expected readiness was %v but probeContainer() set %v", test.expectedReadiness, kl.readiness.get(dc.ID))
}
} }
} }