autoscaling_utils.go 14 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398
  1. /*
  2. Copyright 2015 The Kubernetes Authors.
  3. Licensed under the Apache License, Version 2.0 (the "License");
  4. you may not use this file except in compliance with the License.
  5. You may obtain a copy of the License at
  6. http://www.apache.org/licenses/LICENSE-2.0
  7. Unless required by applicable law or agreed to in writing, software
  8. distributed under the License is distributed on an "AS IS" BASIS,
  9. WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
  10. See the License for the specific language governing permissions and
  11. limitations under the License.
  12. */
  13. package e2e
  14. import (
  15. "fmt"
  16. "strconv"
  17. "time"
  18. "k8s.io/kubernetes/pkg/api"
  19. client "k8s.io/kubernetes/pkg/client/unversioned"
  20. "k8s.io/kubernetes/pkg/util/intstr"
  21. "k8s.io/kubernetes/test/e2e/framework"
  22. . "github.com/onsi/ginkgo"
  23. )
// Shared settings for the resource consumer helpers in this file.
const (
	// Consumption durations, in seconds, passed to newResourceConsumer by
	// NewDynamicResourceConsumer and NewStaticResourceConsumer respectively.
	dynamicConsumptionTimeInSeconds = 30
	staticConsumptionTimeInSeconds  = 3600

	// Per-request sizes NewDynamicResourceConsumer passes to newResourceConsumer.
	dynamicRequestSizeInMillicores = 20
	dynamicRequestSizeInMegabytes  = 100
	dynamicRequestSizeCustomMetric = 10

	// Service port and target port used for both the consumer service and
	// the controller service.
	port       = 80
	targetPort = 8080

	// Timeout set on the RCConfig of the consumer workload and of the controller.
	timeoutRC = 120 * time.Second

	// NOTE(review): not referenced in the visible part of this file;
	// presumably used elsewhere in the package - confirm.
	startServiceTimeout  = time.Minute
	startServiceInterval = 5 * time.Second

	// Container images for the consumer workload and for its controller.
	resourceConsumerImage           = "gcr.io/google_containers/resource_consumer:beta4"
	resourceConsumerControllerImage = "gcr.io/google_containers/resource_consumer/controller:beta4"

	// Failure messages passed to framework.Failf.
	rcIsNil         = "ERROR: replicationController = nil"
	deploymentIsNil = "ERROR: deployment = nil"
	rsIsNil         = "ERROR: replicaset = nil"
	invalidKind     = "ERROR: invalid workload kind for resource consumer"

	// Value of the "metric" parameter sent with BumpMetric requests.
	customMetricName = "QPS"
)
/*
ResourceConsumer is a tool for testing. It helps create specified usage of CPU or memory (Warning: memory not supported)
typical use case:

	rc.ConsumeCPU(600)
	// ... check your assumption here
	rc.ConsumeCPU(300)
	// ... check your assumption here
*/
type ResourceConsumer struct {
	// name is the name of the consumer workload and of its service;
	// controllerName (name + "-ctrl") is the service the consume requests
	// are addressed to; kind selects the workload type inspected by
	// GetReplicas.
	name           string
	controllerName string
	kind           string
	framework      *framework.Framework

	// Unbuffered channels carrying a new total target to the matching
	// makeConsume* goroutine.
	cpu          chan int
	mem          chan int
	customMetric chan int

	// Channels on which CleanUp tells the makeConsume* goroutines to return.
	stopCPU          chan int
	stopMem          chan int
	stopCustomMetric chan int

	// consumptionTimeInSeconds is sent as the "durationSec" request
	// parameter; sleepTime is the same duration and is the pause between
	// repeated requests in the makeConsume* loops.
	consumptionTimeInSeconds int
	sleepTime                time.Duration

	// Per-request sizes sent as the "requestSizeMillicores",
	// "requestSizeMegabytes" and "requestSizeMetrics" request parameters.
	requestSizeInMillicores int
	requestSizeInMegabytes  int
	requestSizeCustomMetric int
}
  68. func NewDynamicResourceConsumer(name, kind string, replicas, initCPUTotal, initMemoryTotal, initCustomMetric int, cpuLimit, memLimit int64, f *framework.Framework) *ResourceConsumer {
  69. return newResourceConsumer(name, kind, replicas, initCPUTotal, initMemoryTotal, initCustomMetric, dynamicConsumptionTimeInSeconds,
  70. dynamicRequestSizeInMillicores, dynamicRequestSizeInMegabytes, dynamicRequestSizeCustomMetric, cpuLimit, memLimit, f)
  71. }
  72. // TODO this still defaults to replication controller
  73. func NewStaticResourceConsumer(name string, replicas, initCPUTotal, initMemoryTotal, initCustomMetric int, cpuLimit, memLimit int64, f *framework.Framework) *ResourceConsumer {
  74. return newResourceConsumer(name, kindRC, replicas, initCPUTotal, initMemoryTotal, initCustomMetric, staticConsumptionTimeInSeconds,
  75. initCPUTotal/replicas, initMemoryTotal/replicas, initCustomMetric/replicas, cpuLimit, memLimit, f)
  76. }
  77. /*
  78. NewResourceConsumer creates new ResourceConsumer
  79. initCPUTotal argument is in millicores
  80. initMemoryTotal argument is in megabytes
  81. memLimit argument is in megabytes, memLimit is a maximum amount of memory that can be consumed by a single pod
  82. cpuLimit argument is in millicores, cpuLimit is a maximum amount of cpu that can be consumed by a single pod
  83. */
  84. func newResourceConsumer(name, kind string, replicas, initCPUTotal, initMemoryTotal, initCustomMetric, consumptionTimeInSeconds, requestSizeInMillicores,
  85. requestSizeInMegabytes int, requestSizeCustomMetric int, cpuLimit, memLimit int64, f *framework.Framework) *ResourceConsumer {
  86. runServiceAndWorkloadForResourceConsumer(f.Client, f.Namespace.Name, name, kind, replicas, cpuLimit, memLimit)
  87. rc := &ResourceConsumer{
  88. name: name,
  89. controllerName: name + "-ctrl",
  90. kind: kind,
  91. framework: f,
  92. cpu: make(chan int),
  93. mem: make(chan int),
  94. customMetric: make(chan int),
  95. stopCPU: make(chan int),
  96. stopMem: make(chan int),
  97. stopCustomMetric: make(chan int),
  98. consumptionTimeInSeconds: consumptionTimeInSeconds,
  99. sleepTime: time.Duration(consumptionTimeInSeconds) * time.Second,
  100. requestSizeInMillicores: requestSizeInMillicores,
  101. requestSizeInMegabytes: requestSizeInMegabytes,
  102. requestSizeCustomMetric: requestSizeCustomMetric,
  103. }
  104. go rc.makeConsumeCPURequests()
  105. rc.ConsumeCPU(initCPUTotal)
  106. go rc.makeConsumeMemRequests()
  107. rc.ConsumeMem(initMemoryTotal)
  108. go rc.makeConsumeCustomMetric()
  109. rc.ConsumeCustomMetric(initCustomMetric)
  110. return rc
  111. }
// ConsumeCPU sets the total amount of CPU, in millicores, that should be
// consumed. The value is logged and then sent on rc.cpu, where the goroutine
// running makeConsumeCPURequests picks it up; the channel is unbuffered, so
// the call blocks until that goroutine has received the value.
func (rc *ResourceConsumer) ConsumeCPU(millicores int) {
	framework.Logf("RC %s: consume %v millicores in total", rc.name, millicores)
	rc.cpu <- millicores
}
// ConsumeMem sets the total amount of memory, in megabytes, that should be
// consumed. The value is logged and then sent on rc.mem, where the goroutine
// running makeConsumeMemRequests picks it up; the channel is unbuffered, so
// the call blocks until that goroutine has received the value.
func (rc *ResourceConsumer) ConsumeMem(megabytes int) {
	framework.Logf("RC %s: consume %v MB in total", rc.name, megabytes)
	rc.mem <- megabytes
}
// ConsumeCustomMetric sets the total amount of the custom metric that should
// be generated. The value is logged and then sent on rc.customMetric, where
// the goroutine running makeConsumeCustomMetric receives it; the channel is
// unbuffered, so the call blocks until that goroutine has received the value.
func (rc *ResourceConsumer) ConsumeCustomMetric(amount int) {
	framework.Logf("RC %s: consume custom metric %v in total", rc.name, amount)
	rc.customMetric <- amount
}
  127. func (rc *ResourceConsumer) makeConsumeCPURequests() {
  128. defer GinkgoRecover()
  129. sleepTime := time.Duration(0)
  130. millicores := 0
  131. for {
  132. select {
  133. case millicores = <-rc.cpu:
  134. framework.Logf("RC %s: setting consumption to %v millicores in total", rc.name, millicores)
  135. case <-time.After(sleepTime):
  136. framework.Logf("RC %s: sending request to consume %d millicores", rc.name, millicores)
  137. rc.sendConsumeCPURequest(millicores)
  138. sleepTime = rc.sleepTime
  139. case <-rc.stopCPU:
  140. return
  141. }
  142. }
  143. }
  144. func (rc *ResourceConsumer) makeConsumeMemRequests() {
  145. defer GinkgoRecover()
  146. sleepTime := time.Duration(0)
  147. megabytes := 0
  148. for {
  149. select {
  150. case megabytes = <-rc.mem:
  151. framework.Logf("RC %s: setting consumption to %v MB in total", rc.name, megabytes)
  152. case <-time.After(sleepTime):
  153. framework.Logf("RC %s: sending request to consume %d MB", rc.name, megabytes)
  154. rc.sendConsumeMemRequest(megabytes)
  155. sleepTime = rc.sleepTime
  156. case <-rc.stopMem:
  157. return
  158. }
  159. }
  160. }
  161. func (rc *ResourceConsumer) makeConsumeCustomMetric() {
  162. defer GinkgoRecover()
  163. sleepTime := time.Duration(0)
  164. delta := 0
  165. for {
  166. select {
  167. case delta := <-rc.customMetric:
  168. framework.Logf("RC %s: setting bump of metric %s to %d in total", rc.name, customMetricName, delta)
  169. case <-time.After(sleepTime):
  170. framework.Logf("RC %s: sending request to consume %d of custom metric %s", rc.name, delta, customMetricName)
  171. rc.sendConsumeCustomMetric(delta)
  172. sleepTime = rc.sleepTime
  173. case <-rc.stopCustomMetric:
  174. return
  175. }
  176. }
  177. }
  178. func (rc *ResourceConsumer) sendConsumeCPURequest(millicores int) {
  179. proxyRequest, err := framework.GetServicesProxyRequest(rc.framework.Client, rc.framework.Client.Post())
  180. framework.ExpectNoError(err)
  181. req := proxyRequest.Namespace(rc.framework.Namespace.Name).
  182. Name(rc.controllerName).
  183. Suffix("ConsumeCPU").
  184. Param("millicores", strconv.Itoa(millicores)).
  185. Param("durationSec", strconv.Itoa(rc.consumptionTimeInSeconds)).
  186. Param("requestSizeMillicores", strconv.Itoa(rc.requestSizeInMillicores))
  187. framework.Logf("URL: %v", *req.URL())
  188. _, err = req.DoRaw()
  189. framework.ExpectNoError(err)
  190. }
  191. // sendConsumeMemRequest sends POST request for memory consumption
  192. func (rc *ResourceConsumer) sendConsumeMemRequest(megabytes int) {
  193. proxyRequest, err := framework.GetServicesProxyRequest(rc.framework.Client, rc.framework.Client.Post())
  194. framework.ExpectNoError(err)
  195. req := proxyRequest.Namespace(rc.framework.Namespace.Name).
  196. Name(rc.controllerName).
  197. Suffix("ConsumeMem").
  198. Param("megabytes", strconv.Itoa(megabytes)).
  199. Param("durationSec", strconv.Itoa(rc.consumptionTimeInSeconds)).
  200. Param("requestSizeMegabytes", strconv.Itoa(rc.requestSizeInMegabytes))
  201. framework.Logf("URL: %v", *req.URL())
  202. _, err = req.DoRaw()
  203. framework.ExpectNoError(err)
  204. }
  205. // sendConsumeCustomMetric sends POST request for custom metric consumption
  206. func (rc *ResourceConsumer) sendConsumeCustomMetric(delta int) {
  207. proxyRequest, err := framework.GetServicesProxyRequest(rc.framework.Client, rc.framework.Client.Post())
  208. framework.ExpectNoError(err)
  209. req := proxyRequest.Namespace(rc.framework.Namespace.Name).
  210. Name(rc.controllerName).
  211. Suffix("BumpMetric").
  212. Param("metric", customMetricName).
  213. Param("delta", strconv.Itoa(delta)).
  214. Param("durationSec", strconv.Itoa(rc.consumptionTimeInSeconds)).
  215. Param("requestSizeMetrics", strconv.Itoa(rc.requestSizeCustomMetric))
  216. framework.Logf("URL: %v", *req.URL())
  217. _, err = req.DoRaw()
  218. framework.ExpectNoError(err)
  219. }
  220. func (rc *ResourceConsumer) GetReplicas() int {
  221. switch rc.kind {
  222. case kindRC:
  223. replicationController, err := rc.framework.Client.ReplicationControllers(rc.framework.Namespace.Name).Get(rc.name)
  224. framework.ExpectNoError(err)
  225. if replicationController == nil {
  226. framework.Failf(rcIsNil)
  227. }
  228. return int(replicationController.Status.Replicas)
  229. case kindDeployment:
  230. deployment, err := rc.framework.Client.Deployments(rc.framework.Namespace.Name).Get(rc.name)
  231. framework.ExpectNoError(err)
  232. if deployment == nil {
  233. framework.Failf(deploymentIsNil)
  234. }
  235. return int(deployment.Status.Replicas)
  236. case kindReplicaSet:
  237. rs, err := rc.framework.Client.ReplicaSets(rc.framework.Namespace.Name).Get(rc.name)
  238. framework.ExpectNoError(err)
  239. if rs == nil {
  240. framework.Failf(rsIsNil)
  241. }
  242. return int(rs.Status.Replicas)
  243. default:
  244. framework.Failf(invalidKind)
  245. }
  246. return 0
  247. }
  248. func (rc *ResourceConsumer) WaitForReplicas(desiredReplicas int) {
  249. timeout := 15 * time.Minute
  250. for start := time.Now(); time.Since(start) < timeout; time.Sleep(20 * time.Second) {
  251. if desiredReplicas == rc.GetReplicas() {
  252. framework.Logf("%s: current replicas number is equal to desired replicas number: %d", rc.kind, desiredReplicas)
  253. return
  254. } else {
  255. framework.Logf("%s: current replicas number %d waiting to be %d", rc.kind, rc.GetReplicas(), desiredReplicas)
  256. }
  257. }
  258. framework.Failf("timeout waiting %v for pods size to be %d", timeout, desiredReplicas)
  259. }
  260. func (rc *ResourceConsumer) EnsureDesiredReplicas(desiredReplicas int, timeout time.Duration) {
  261. for start := time.Now(); time.Since(start) < timeout; time.Sleep(10 * time.Second) {
  262. actual := rc.GetReplicas()
  263. if desiredReplicas != actual {
  264. framework.Failf("Number of replicas has changed: expected %v, got %v", desiredReplicas, actual)
  265. }
  266. framework.Logf("Number of replicas is as expected")
  267. }
  268. framework.Logf("Number of replicas was stable over %v", timeout)
  269. }
  270. func (rc *ResourceConsumer) CleanUp() {
  271. By(fmt.Sprintf("Removing consuming RC %s", rc.name))
  272. rc.stopCPU <- 0
  273. rc.stopMem <- 0
  274. rc.stopCustomMetric <- 0
  275. // Wait some time to ensure all child goroutines are finished.
  276. time.Sleep(10 * time.Second)
  277. framework.ExpectNoError(framework.DeleteRCAndPods(rc.framework.Client, rc.framework.Namespace.Name, rc.name))
  278. framework.ExpectNoError(rc.framework.Client.Services(rc.framework.Namespace.Name).Delete(rc.name))
  279. framework.ExpectNoError(framework.DeleteRCAndPods(rc.framework.Client, rc.framework.Namespace.Name, rc.controllerName))
  280. framework.ExpectNoError(rc.framework.Client.Services(rc.framework.Namespace.Name).Delete(rc.controllerName))
  281. }
  282. func runServiceAndWorkloadForResourceConsumer(c *client.Client, ns, name, kind string, replicas int, cpuLimitMillis, memLimitMb int64) {
  283. By(fmt.Sprintf("Running consuming RC %s via %s with %v replicas", name, kind, replicas))
  284. _, err := c.Services(ns).Create(&api.Service{
  285. ObjectMeta: api.ObjectMeta{
  286. Name: name,
  287. },
  288. Spec: api.ServiceSpec{
  289. Ports: []api.ServicePort{{
  290. Port: port,
  291. TargetPort: intstr.FromInt(targetPort),
  292. }},
  293. Selector: map[string]string{
  294. "name": name,
  295. },
  296. },
  297. })
  298. framework.ExpectNoError(err)
  299. rcConfig := framework.RCConfig{
  300. Client: c,
  301. Image: resourceConsumerImage,
  302. Name: name,
  303. Namespace: ns,
  304. Timeout: timeoutRC,
  305. Replicas: replicas,
  306. CpuRequest: cpuLimitMillis,
  307. CpuLimit: cpuLimitMillis,
  308. MemRequest: memLimitMb * 1024 * 1024, // MemLimit is in bytes
  309. MemLimit: memLimitMb * 1024 * 1024,
  310. }
  311. switch kind {
  312. case kindRC:
  313. framework.ExpectNoError(framework.RunRC(rcConfig))
  314. break
  315. case kindDeployment:
  316. dpConfig := framework.DeploymentConfig{
  317. RCConfig: rcConfig,
  318. }
  319. framework.ExpectNoError(framework.RunDeployment(dpConfig))
  320. break
  321. case kindReplicaSet:
  322. rsConfig := framework.ReplicaSetConfig{
  323. RCConfig: rcConfig,
  324. }
  325. framework.ExpectNoError(framework.RunReplicaSet(rsConfig))
  326. break
  327. default:
  328. framework.Failf(invalidKind)
  329. }
  330. By(fmt.Sprintf("Running controller"))
  331. controllerName := name + "-ctrl"
  332. _, err = c.Services(ns).Create(&api.Service{
  333. ObjectMeta: api.ObjectMeta{
  334. Name: controllerName,
  335. },
  336. Spec: api.ServiceSpec{
  337. Ports: []api.ServicePort{{
  338. Port: port,
  339. TargetPort: intstr.FromInt(targetPort),
  340. }},
  341. Selector: map[string]string{
  342. "name": controllerName,
  343. },
  344. },
  345. })
  346. framework.ExpectNoError(err)
  347. dnsClusterFirst := api.DNSClusterFirst
  348. controllerRcConfig := framework.RCConfig{
  349. Client: c,
  350. Image: resourceConsumerControllerImage,
  351. Name: controllerName,
  352. Namespace: ns,
  353. Timeout: timeoutRC,
  354. Replicas: 1,
  355. Command: []string{"/controller", "--consumer-service-name=" + name, "--consumer-service-namespace=" + ns, "--consumer-port=80"},
  356. DNSPolicy: &dnsClusterFirst,
  357. }
  358. framework.ExpectNoError(framework.RunRC(controllerRcConfig))
  359. // Make sure endpoints are propagated.
  360. // TODO(piosz): replace sleep with endpoints watch.
  361. time.Sleep(10 * time.Second)
  362. }