mirror of
https://github.com/k3s-io/kubernetes.git
synced 2025-08-01 07:47:56 +00:00
Increase the timeout on apiserver requests to fetch node stats.
This commit is contained in:
parent
e186582272
commit
e1147184d5
@ -25,6 +25,12 @@ import (
|
|||||||
. "github.com/onsi/ginkgo"
|
. "github.com/onsi/ginkgo"
|
||||||
)
|
)
|
||||||
|
|
||||||
|
const (
|
||||||
|
timeout = 1 * time.Minute
|
||||||
|
maxRetries = 10
|
||||||
|
sleepDuration = time.Minute
|
||||||
|
)
|
||||||
|
|
||||||
var _ = Describe("Cadvisor", func() {
|
var _ = Describe("Cadvisor", func() {
|
||||||
var c *client.Client
|
var c *client.Client
|
||||||
|
|
||||||
@ -44,14 +50,15 @@ func CheckCadvisorHealthOnAllNodes(c *client.Client, timeout time.Duration) {
|
|||||||
nodeList, err := c.Nodes().List()
|
nodeList, err := c.Nodes().List()
|
||||||
expectNoError(err)
|
expectNoError(err)
|
||||||
var errors []error
|
var errors []error
|
||||||
for start := time.Now(); time.Since(start) < timeout; time.Sleep(5 * time.Second) {
|
retries := maxRetries
|
||||||
|
for {
|
||||||
errors = []error{}
|
errors = []error{}
|
||||||
for _, node := range nodeList.Items {
|
for _, node := range nodeList.Items {
|
||||||
// cadvisor is not accessible directly unless its port (4194 by default) is exposed.
|
// cadvisor is not accessible directly unless its port (4194 by default) is exposed.
|
||||||
// Here, we access '/stats/' REST endpoint on the kubelet which polls cadvisor internally.
|
// Here, we access '/stats/' REST endpoint on the kubelet which polls cadvisor internally.
|
||||||
statsResource := fmt.Sprintf("api/v1beta1/proxy/minions/%s/stats/", node.Name)
|
statsResource := fmt.Sprintf("api/v1beta1/proxy/minions/%s/stats/", node.Name)
|
||||||
By(fmt.Sprintf("Querying stats from node %s using url %s", node.Name, statsResource))
|
By(fmt.Sprintf("Querying stats from node %s using url %s", node.Name, statsResource))
|
||||||
_, err = c.Get().AbsPath(statsResource).Timeout(1 * time.Second).Do().Raw()
|
_, err = c.Get().AbsPath(statsResource).Timeout(timeout).Do().Raw()
|
||||||
if err != nil {
|
if err != nil {
|
||||||
errors = append(errors, err)
|
errors = append(errors, err)
|
||||||
}
|
}
|
||||||
@ -59,6 +66,11 @@ func CheckCadvisorHealthOnAllNodes(c *client.Client, timeout time.Duration) {
|
|||||||
if len(errors) == 0 {
|
if len(errors) == 0 {
|
||||||
return
|
return
|
||||||
}
|
}
|
||||||
|
if retries--; retries <= 0 {
|
||||||
|
break
|
||||||
}
|
}
|
||||||
Failf("Timed out after %v waiting for cadvisor to be healthy on all nodes. Errors:\n%v", timeout, errors)
|
Logf("failed to retrieve kubelet stats -\n %v", errors)
|
||||||
|
time.Sleep(sleepDuration)
|
||||||
|
}
|
||||||
|
Failf("Failed after retrying %d times for cadvisor to be healthy on all nodes. Errors:\n%v", maxRetries, errors)
|
||||||
}
|
}
|
||||||
|
Loading…
Reference in New Issue
Block a user