cluster_upgrade.go 8.0 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230
  1. /*
  2. Copyright 2016 The Kubernetes Authors.
  3. Licensed under the Apache License, Version 2.0 (the "License");
  4. you may not use this file except in compliance with the License.
  5. You may obtain a copy of the License at
  6. http://www.apache.org/licenses/LICENSE-2.0
  7. Unless required by applicable law or agreed to in writing, software
  8. distributed under the License is distributed on an "AS IS" BASIS,
  9. WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
  10. See the License for the specific language governing permissions and
  11. limitations under the License.
  12. */
  13. package e2e
  14. import (
  15. "fmt"
  16. "path"
  17. "strings"
  18. "k8s.io/kubernetes/pkg/api"
  19. client "k8s.io/kubernetes/pkg/client/unversioned"
  20. "k8s.io/kubernetes/pkg/util/wait"
  21. "k8s.io/kubernetes/test/e2e/chaosmonkey"
  22. "k8s.io/kubernetes/test/e2e/framework"
  23. . "github.com/onsi/ginkgo"
  24. )
  25. // TODO(mikedanese): Add setup, validate, and teardown for:
  26. // - secrets
  27. // - volumes
  28. // - persistent volumes
  29. var _ = framework.KubeDescribe("Upgrade [Feature:Upgrade]", func() {
  30. f := framework.NewDefaultFramework("cluster-upgrade")
  31. framework.KubeDescribe("master upgrade", func() {
  32. It("should maintain responsive services [Feature:MasterUpgrade]", func() {
  33. cm := chaosmonkey.New(func() {
  34. v, err := realVersion(framework.TestContext.UpgradeTarget)
  35. framework.ExpectNoError(err)
  36. framework.ExpectNoError(framework.MasterUpgrade(v))
  37. framework.ExpectNoError(checkMasterVersion(f.Client, v))
  38. })
  39. cm.Register(func(sem *chaosmonkey.Semaphore) {
  40. // Close over f.
  41. testServiceRemainsUp(f, sem)
  42. })
  43. cm.Do()
  44. })
  45. })
  46. framework.KubeDescribe("node upgrade", func() {
  47. It("should maintain a functioning cluster [Feature:NodeUpgrade]", func() {
  48. cm := chaosmonkey.New(func() {
  49. v, err := realVersion(framework.TestContext.UpgradeTarget)
  50. framework.ExpectNoError(err)
  51. framework.ExpectNoError(framework.NodeUpgrade(f, v))
  52. framework.ExpectNoError(checkNodesVersions(f.Client, v))
  53. })
  54. cm.Register(func(sem *chaosmonkey.Semaphore) {
  55. // Close over f.
  56. testServiceUpBeforeAndAfter(f, sem)
  57. })
  58. cm.Do()
  59. })
  60. It("should maintain responsive services [Feature:ExperimentalNodeUpgrade]", func() {
  61. cm := chaosmonkey.New(func() {
  62. v, err := realVersion(framework.TestContext.UpgradeTarget)
  63. framework.ExpectNoError(err)
  64. framework.ExpectNoError(framework.NodeUpgrade(f, v))
  65. framework.ExpectNoError(checkNodesVersions(f.Client, v))
  66. })
  67. cm.Register(func(sem *chaosmonkey.Semaphore) {
  68. // Close over f.
  69. testServiceRemainsUp(f, sem)
  70. })
  71. cm.Do()
  72. })
  73. })
  74. framework.KubeDescribe("cluster upgrade", func() {
  75. It("should maintain a functioning cluster [Feature:ClusterUpgrade]", func() {
  76. cm := chaosmonkey.New(func() {
  77. v, err := realVersion(framework.TestContext.UpgradeTarget)
  78. framework.ExpectNoError(err)
  79. framework.ExpectNoError(framework.MasterUpgrade(v))
  80. framework.ExpectNoError(checkMasterVersion(f.Client, v))
  81. framework.ExpectNoError(framework.NodeUpgrade(f, v))
  82. framework.ExpectNoError(checkNodesVersions(f.Client, v))
  83. })
  84. cm.Register(func(sem *chaosmonkey.Semaphore) {
  85. // Close over f.
  86. testServiceUpBeforeAndAfter(f, sem)
  87. })
  88. cm.Do()
  89. })
  90. It("should maintain responsive services [Feature:ExperimentalClusterUpgrade]", func() {
  91. cm := chaosmonkey.New(func() {
  92. v, err := realVersion(framework.TestContext.UpgradeTarget)
  93. framework.ExpectNoError(err)
  94. framework.ExpectNoError(framework.MasterUpgrade(v))
  95. framework.ExpectNoError(checkMasterVersion(f.Client, v))
  96. framework.ExpectNoError(framework.NodeUpgrade(f, v))
  97. framework.ExpectNoError(checkNodesVersions(f.Client, v))
  98. })
  99. cm.Register(func(sem *chaosmonkey.Semaphore) {
  100. // Close over f.
  101. testServiceRemainsUp(f, sem)
  102. })
  103. cm.Do()
  104. })
  105. })
  106. })
  107. // realVersion turns a version constant s into a version string deployable on
  108. // GKE. See hack/get-build.sh for more information.
  109. func realVersion(s string) (string, error) {
  110. framework.Logf(fmt.Sprintf("Getting real version for %q", s))
  111. v, _, err := framework.RunCmd(path.Join(framework.TestContext.RepoRoot, "hack/get-build.sh"), "-v", s)
  112. if err != nil {
  113. return v, err
  114. }
  115. framework.Logf("Version for %q is %q", s, v)
  116. return strings.TrimPrefix(strings.TrimSpace(v), "v"), nil
  117. }
  118. func testServiceUpBeforeAndAfter(f *framework.Framework, sem *chaosmonkey.Semaphore) {
  119. testService(f, sem, false)
  120. }
  121. func testServiceRemainsUp(f *framework.Framework, sem *chaosmonkey.Semaphore) {
  122. testService(f, sem, true)
  123. }
  124. // testService is a helper for testServiceUpBeforeAndAfter and testServiceRemainsUp with a flag for testDuringDisruption
  125. //
  126. // TODO(ihmccreery) remove this abstraction once testServiceUpBeforeAndAfter is no longer needed, because node upgrades
  127. // maintain a responsive service.
  128. func testService(f *framework.Framework, sem *chaosmonkey.Semaphore, testDuringDisruption bool) {
  129. // Setup
  130. serviceName := "service-test"
  131. jig := NewServiceTestJig(f.Client, serviceName)
  132. // nodeIP := pickNodeIP(jig.Client) // for later
  133. By("creating a TCP service " + serviceName + " with type=LoadBalancer in namespace " + f.Namespace.Name)
  134. // TODO it's weird that we have to do this and then wait WaitForLoadBalancer which changes
  135. // tcpService.
  136. tcpService := jig.CreateTCPServiceOrFail(f.Namespace.Name, func(s *api.Service) {
  137. s.Spec.Type = api.ServiceTypeLoadBalancer
  138. })
  139. tcpService = jig.WaitForLoadBalancerOrFail(f.Namespace.Name, tcpService.Name, loadBalancerCreateTimeoutDefault)
  140. jig.SanityCheckService(tcpService, api.ServiceTypeLoadBalancer)
  141. // Get info to hit it with
  142. tcpIngressIP := getIngressPoint(&tcpService.Status.LoadBalancer.Ingress[0])
  143. svcPort := int(tcpService.Spec.Ports[0].Port)
  144. By("creating pod to be part of service " + serviceName)
  145. // TODO newRCTemplate only allows for the creation of one replica... that probably won't
  146. // work so well.
  147. jig.RunOrFail(f.Namespace.Name, nil)
  148. // Hit it once before considering ourselves ready
  149. By("hitting the pod through the service's LoadBalancer")
  150. jig.TestReachableHTTP(tcpIngressIP, svcPort, loadBalancerLagTimeoutDefault)
  151. sem.Ready()
  152. if testDuringDisruption {
  153. // Continuous validation
  154. wait.Until(func() {
  155. By("hitting the pod through the service's LoadBalancer")
  156. jig.TestReachableHTTP(tcpIngressIP, svcPort, framework.Poll)
  157. }, framework.Poll, sem.StopCh)
  158. } else {
  159. // Block until chaosmonkey is done
  160. By("waiting for upgrade to finish without checking if service remains up")
  161. <-sem.StopCh
  162. }
  163. // Sanity check and hit it once more
  164. By("hitting the pod through the service's LoadBalancer")
  165. jig.TestReachableHTTP(tcpIngressIP, svcPort, loadBalancerLagTimeoutDefault)
  166. jig.SanityCheckService(tcpService, api.ServiceTypeLoadBalancer)
  167. }
  168. func checkMasterVersion(c *client.Client, want string) error {
  169. framework.Logf("Checking master version")
  170. v, err := c.Discovery().ServerVersion()
  171. if err != nil {
  172. return fmt.Errorf("checkMasterVersion() couldn't get the master version: %v", err)
  173. }
  174. // We do prefix trimming and then matching because:
  175. // want looks like: 0.19.3-815-g50e67d4
  176. // got looks like: v0.19.3-815-g50e67d4034e858-dirty
  177. got := strings.TrimPrefix(v.GitVersion, "v")
  178. if !strings.HasPrefix(got, want) {
  179. return fmt.Errorf("master had kube-apiserver version %s which does not start with %s",
  180. got, want)
  181. }
  182. framework.Logf("Master is at version %s", want)
  183. return nil
  184. }
  185. func checkNodesVersions(c *client.Client, want string) error {
  186. l := framework.GetReadySchedulableNodesOrDie(c)
  187. for _, n := range l.Items {
  188. // We do prefix trimming and then matching because:
  189. // want looks like: 0.19.3-815-g50e67d4
  190. // kv/kvp look like: v0.19.3-815-g50e67d4034e858-dirty
  191. kv, kpv := strings.TrimPrefix(n.Status.NodeInfo.KubeletVersion, "v"),
  192. strings.TrimPrefix(n.Status.NodeInfo.KubeProxyVersion, "v")
  193. if !strings.HasPrefix(kv, want) {
  194. return fmt.Errorf("node %s had kubelet version %s which does not start with %s",
  195. n.ObjectMeta.Name, kv, want)
  196. }
  197. if !strings.HasPrefix(kpv, want) {
  198. return fmt.Errorf("node %s had kube-proxy version %s which does not start with %s",
  199. n.ObjectMeta.Name, kpv, want)
  200. }
  201. }
  202. return nil
  203. }