12345678910111213141516171819202122232425262728293031323334353637383940414243444546474849505152535455565758596061626364656667686970717273747576777879808182838485868788899091929394959697989910010110210310410510610710810911011111211311411511611711811912012112212312412512612712812913013113213313413513613713813914014114214314414514614714814915015115215315415515615715815916016116216316416516616716816917017117217317417517617717817918018118218318418518618718818919019119219319419519619719819920020120220320420520620720820921021121221321421521621721821922022122222322422522622722822923023123223323423523623723823924024124224324424524624724824925025125225325425525625725825926026126226326426526626726826927027127227327427527627727827928028128228328428528628728828929029129229329429529629729829930030130230330430530630730830931031131231331431531631731831932032132232332432532632732832933033133233333433533633733833934034134234334434534634734834935035135235335435535635735835936036136236336436536636736836937037137237337437537637737837938038138238338438538638738838939039139239339439539639739839940040140240340440540640740840941041141241341441541641741841942042142242342442542642742842943043143243343443543643743843944044144244344444544644744844945045145245345445545645745845946046146246346446546646746846947047147247347447547647747847948048148248348448548648748848949049149249349449549649749849950050150250350450550650750850951051151251351451551651751851952052152252352452552652752852953053153253353453553653753853954054154254354454554654754854955055155255355455555655755855956056156256356456556656756856957057157257357457557657757857958058158258358458558658758858959059159259359459559659759859960060160260360460560660760860961061161261361461561661761861962062162262362462562662762862963063163263363463563663763863964064164264364464564664764864965065165265365465565665765865966066166266366466566666766866967067167267367467567667767867968068168268368468568668768868969069169269369469569669769869970070170270
37047057067077087097107117127137147157167177187197207217227237247257267277287297307317327337347357367377387397407417427437447457467477487497507517527537547557567577587597607617627637647657667677687697707717727737747757767777787797807817827837847857867877887897907917927937947957967977987998008018028038048058068078088098108118128138148158168178188198208218228238248258268278288298308318328338348358368378388398408418428438448458468478488498508518528538548558568578588598608618628638648658668678688698708718728738748758768778788798808818828838848858868878888898908918928938948958968978988999009019029039049059069079089099109119129139149159169179189199209219229239249259269279289299309319329339349359369379389399409419429439449459469479489499509519529539549559569579589599609619629639649659669679689699709719729739749759769779789799809819829839849859869879889899909919929939949959969979989991000100110021003100410051006100710081009101010111012101310141015101610171018101910201021102210231024102510261027102810291030103110321033103410351036103710381039104010411042104310441045104610471048104910501051105210531054105510561057105810591060106110621063106410651066106710681069107010711072107310741075107610771078107910801081108210831084108510861087108810891090109110921093109410951096109710981099110011011102110311041105110611071108110911101111111211131114111511161117111811191120112111221123112411251126112711281129113011311132113311341135113611371138113911401141114211431144114511461147114811491150115111521153115411551156115711581159116011611162116311641165116611671168116911701171117211731174117511761177117811791180118111821183118411851186118711881189119011911192119311941195119611971198119912001201120212031204120512061207120812091210121112121213121412151216121712181219122012211222122312241225122612271228122912301231123212331234123512361237123812391240124112421243124412451246124712481249125012511252125312541255125612571258125912601261126212631264126512661267126812691270127112721273127412751276127
71278127912801281128212831284128512861287128812891290129112921293129412951296129712981299130013011302130313041305130613071308130913101311131213131314131513161317131813191320132113221323132413251326132713281329133013311332133313341335133613371338133913401341134213431344134513461347134813491350135113521353135413551356135713581359136013611362136313641365136613671368136913701371137213731374137513761377137813791380138113821383138413851386138713881389139013911392139313941395139613971398139914001401140214031404140514061407140814091410141114121413141414151416141714181419142014211422142314241425142614271428142914301431143214331434143514361437143814391440144114421443144414451446144714481449145014511452145314541455145614571458145914601461146214631464146514661467146814691470147114721473147414751476147714781479148014811482148314841485148614871488148914901491149214931494149514961497149814991500150115021503150415051506150715081509151015111512151315141515151615171518151915201521152215231524152515261527152815291530153115321533153415351536153715381539154015411542154315441545154615471548154915501551155215531554155515561557155815591560156115621563156415651566156715681569157015711572157315741575157615771578157915801581158215831584158515861587158815891590159115921593159415951596159715981599160016011602160316041605160616071608160916101611161216131614161516161617161816191620162116221623162416251626162716281629163016311632163316341635163616371638163916401641164216431644164516461647164816491650165116521653165416551656165716581659166016611662166316641665166616671668166916701671167216731674167516761677167816791680168116821683168416851686168716881689169016911692169316941695169616971698169917001701170217031704170517061707170817091710171117121713171417151716171717181719172017211722172317241725172617271728172917301731173217331734173517361737173817391740174117421743174417451746174717481749175017511752175317541755175617571758175917601761176217631764176517661767176817691770177117721773177417751776177
71778177917801781178217831784178517861787178817891790179117921793179417951796179717981799180018011802180318041805180618071808180918101811181218131814181518161817181818191820182118221823182418251826182718281829183018311832183318341835183618371838183918401841184218431844184518461847184818491850185118521853185418551856185718581859186018611862186318641865186618671868186918701871187218731874187518761877187818791880188118821883188418851886188718881889189018911892189318941895189618971898189919001901190219031904190519061907190819091910191119121913191419151916191719181919192019211922192319241925192619271928192919301931193219331934193519361937193819391940194119421943194419451946194719481949195019511952195319541955195619571958195919601961196219631964196519661967196819691970197119721973197419751976197719781979198019811982198319841985198619871988198919901991199219931994199519961997199819992000200120022003200420052006200720082009201020112012201320142015201620172018201920202021202220232024202520262027202820292030203120322033203420352036203720382039204020412042204320442045204620472048204920502051205220532054205520562057205820592060206120622063206420652066206720682069207020712072207320742075207620772078207920802081208220832084208520862087208820892090209120922093209420952096209720982099210021012102210321042105210621072108210921102111211221132114211521162117211821192120212121222123212421252126212721282129213021312132213321342135213621372138213921402141214221432144214521462147214821492150215121522153215421552156215721582159216021612162216321642165216621672168216921702171217221732174217521762177217821792180218121822183218421852186218721882189219021912192219321942195219621972198219922002201220222032204220522062207220822092210221122122213221422152216221722182219222022212222222322242225222622272228222922302231223222332234223522362237223822392240224122422243224422452246224722482249225022512252225322542255225622572258225922602261226222632264226522662267226822692270227122722273227422752276227
72278227922802281228222832284228522862287228822892290229122922293229422952296229722982299230023012302230323042305230623072308230923102311231223132314231523162317231823192320232123222323232423252326232723282329233023312332233323342335233623372338233923402341234223432344234523462347234823492350235123522353235423552356235723582359236023612362236323642365236623672368236923702371237223732374237523762377237823792380238123822383238423852386238723882389239023912392239323942395239623972398239924002401240224032404240524062407240824092410241124122413241424152416241724182419242024212422242324242425242624272428242924302431243224332434243524362437243824392440244124422443244424452446244724482449245024512452245324542455245624572458245924602461246224632464246524662467246824692470247124722473247424752476247724782479248024812482248324842485248624872488248924902491249224932494249524962497249824992500250125022503250425052506250725082509251025112512251325142515251625172518251925202521252225232524252525262527252825292530253125322533253425352536253725382539254025412542254325442545254625472548254925502551255225532554255525562557255825592560256125622563256425652566256725682569257025712572257325742575257625772578257925802581258225832584258525862587258825892590259125922593259425952596259725982599260026012602260326042605260626072608260926102611261226132614261526162617261826192620262126222623262426252626262726282629263026312632263326342635263626372638263926402641264226432644264526462647264826492650265126522653265426552656265726582659266026612662266326642665266626672668266926702671267226732674267526762677267826792680268126822683268426852686268726882689269026912692269326942695269626972698269927002701270227032704270527062707270827092710271127122713271427152716271727182719272027212722272327242725272627272728272927302731273227332734273527362737273827392740274127422743274427452746274727482749275027512752275327542755275627572758275927602761276227632764276527662767276827692770277127722773277427752776277
72778277927802781278227832784278527862787278827892790279127922793279427952796279727982799280028012802280328042805280628072808280928102811281228132814281528162817281828192820282128222823282428252826282728282829283028312832283328342835283628372838283928402841284228432844284528462847284828492850285128522853285428552856285728582859286028612862286328642865286628672868286928702871287228732874287528762877287828792880288128822883288428852886288728882889289028912892289328942895289628972898289929002901290229032904290529062907290829092910291129122913291429152916291729182919292029212922292329242925292629272928292929302931293229332934293529362937293829392940294129422943294429452946294729482949295029512952295329542955295629572958295929602961296229632964296529662967296829692970297129722973297429752976297729782979298029812982298329842985298629872988298929902991299229932994299529962997299829993000300130023003300430053006300730083009301030113012301330143015301630173018301930203021302230233024302530263027302830293030303130323033303430353036303730383039304030413042304330443045304630473048304930503051305230533054305530563057305830593060306130623063306430653066306730683069307030713072307330743075307630773078307930803081308230833084308530863087308830893090309130923093309430953096309730983099310031013102310331043105310631073108310931103111311231133114311531163117311831193120312131223123312431253126312731283129313031313132313331343135313631373138313931403141314231433144314531463147314831493150315131523153315431553156315731583159316031613162316331643165316631673168316931703171317231733174317531763177317831793180318131823183318431853186318731883189319031913192319331943195319631973198319932003201320232033204320532063207320832093210321132123213321432153216321732183219322032213222322332243225322632273228322932303231323232333234323532363237323832393240324132423243324432453246324732483249325032513252325332543255325632573258325932603261326232633264326532663267326832693270327132723273327432753276327
73278327932803281328232833284328532863287328832893290329132923293329432953296329732983299330033013302330333043305330633073308330933103311331233133314331533163317331833193320332133223323332433253326332733283329333033313332333333343335333633373338333933403341334233433344334533463347334833493350335133523353335433553356335733583359336033613362336333643365336633673368336933703371337233733374337533763377337833793380338133823383338433853386338733883389339033913392339333943395339633973398339934003401340234033404340534063407340834093410341134123413341434153416341734183419342034213422342334243425342634273428342934303431343234333434343534363437343834393440344134423443344434453446344734483449345034513452345334543455345634573458345934603461346234633464346534663467346834693470347134723473347434753476347734783479348034813482348334843485348634873488348934903491349234933494349534963497349834993500350135023503350435053506350735083509351035113512351335143515351635173518351935203521352235233524352535263527352835293530353135323533353435353536353735383539354035413542354335443545354635473548354935503551355235533554355535563557355835593560356135623563356435653566356735683569357035713572357335743575357635773578357935803581358235833584358535863587358835893590359135923593359435953596359735983599360036013602360336043605360636073608360936103611361236133614361536163617361836193620362136223623362436253626362736283629363036313632363336343635363636373638363936403641364236433644364536463647364836493650365136523653365436553656365736583659366036613662366336643665366636673668366936703671367236733674367536763677367836793680368136823683368436853686368736883689369036913692369336943695369636973698369937003701370237033704370537063707370837093710371137123713371437153716371737183719372037213722372337243725372637273728372937303731373237333734373537363737373837393740374137423743374437453746374737483749375037513752375337543755375637573758375937603761376237633764376537663767376837693770377137723773377437753776377
73778377937803781378237833784378537863787378837893790379137923793379437953796379737983799380038013802380338043805380638073808380938103811381238133814381538163817381838193820382138223823382438253826382738283829383038313832383338343835383638373838383938403841384238433844384538463847384838493850385138523853385438553856385738583859386038613862386338643865386638673868386938703871387238733874387538763877387838793880388138823883388438853886388738883889389038913892389338943895389638973898389939003901390239033904390539063907390839093910391139123913391439153916391739183919392039213922392339243925392639273928392939303931393239333934393539363937393839393940394139423943394439453946394739483949395039513952395339543955395639573958395939603961396239633964396539663967396839693970397139723973397439753976397739783979398039813982398339843985398639873988398939903991399239933994399539963997399839994000400140024003400440054006400740084009401040114012401340144015401640174018401940204021402240234024402540264027402840294030403140324033403440354036403740384039404040414042404340444045404640474048404940504051405240534054405540564057405840594060406140624063406440654066406740684069407040714072407340744075407640774078407940804081408240834084408540864087408840894090409140924093409440954096409740984099410041014102410341044105410641074108410941104111411241134114411541164117411841194120412141224123412441254126412741284129413041314132413341344135413641374138413941404141414241434144414541464147414841494150415141524153415441554156415741584159416041614162416341644165416641674168416941704171417241734174417541764177417841794180418141824183418441854186418741884189419041914192419341944195419641974198419942004201420242034204420542064207420842094210421142124213421442154216421742184219422042214222422342244225422642274228422942304231423242334234423542364237423842394240424142424243424442454246424742484249425042514252425342544255425642574258425942604261426242634264426542664267426842694270427142724273427442754276427
74278427942804281428242834284428542864287428842894290429142924293429442954296429742984299430043014302430343044305430643074308430943104311431243134314431543164317431843194320432143224323432443254326432743284329433043314332433343344335433643374338433943404341434243434344434543464347434843494350435143524353435443554356435743584359436043614362436343644365436643674368436943704371437243734374437543764377437843794380438143824383438443854386438743884389439043914392439343944395439643974398439944004401440244034404440544064407440844094410441144124413441444154416441744184419442044214422442344244425442644274428442944304431443244334434443544364437443844394440444144424443444444454446444744484449445044514452445344544455445644574458445944604461446244634464446544664467446844694470447144724473447444754476447744784479448044814482448344844485448644874488448944904491449244934494449544964497449844994500450145024503450445054506450745084509451045114512451345144515451645174518451945204521452245234524452545264527452845294530453145324533453445354536453745384539454045414542454345444545454645474548454945504551455245534554455545564557455845594560456145624563456445654566456745684569457045714572457345744575457645774578457945804581458245834584458545864587458845894590459145924593459445954596459745984599460046014602460346044605460646074608460946104611461246134614461546164617461846194620462146224623462446254626462746284629463046314632463346344635463646374638463946404641464246434644464546464647464846494650465146524653465446554656465746584659466046614662466346644665466646674668466946704671467246734674467546764677467846794680468146824683468446854686468746884689469046914692469346944695469646974698469947004701470247034704470547064707470847094710471147124713471447154716471747184719472047214722472347244725472647274728472947304731473247334734473547364737473847394740474147424743474447454746474747484749475047514752475347544755475647574758475947604761476247634764476547664767476847694770477147724773477447754776477
7477847794780478147824783478447854786478747884789479047914792479347944795479647974798479948004801480248034804480548064807480848094810481148124813481448154816481748184819482048214822482348244825482648274828482948304831483248334834483548364837483848394840484148424843484448454846484748484849485048514852485348544855485648574858485948604861486248634864486548664867486848694870487148724873487448754876487748784879488048814882488348844885488648874888488948904891489248934894489548964897489848994900490149024903490449054906490749084909491049114912491349144915491649174918491949204921492249234924492549264927492849294930493149324933493449354936493749384939494049414942494349444945494649474948494949504951495249534954495549564957495849594960496149624963496449654966496749684969497049714972497349744975497649774978497949804981498249834984498549864987498849894990499149924993499449954996499749984999500050015002500350045005500650075008500950105011501250135014501550165017501850195020502150225023502450255026502750285029503050315032503350345035503650375038503950405041504250435044504550465047504850495050505150525053505450555056505750585059506050615062506350645065506650675068506950705071507250735074507550765077507850795080508150825083508450855086508750885089509050915092509350945095 |
- /*
- Copyright 2014 The Kubernetes Authors.
- Licensed under the Apache License, Version 2.0 (the "License");
- you may not use this file except in compliance with the License.
- You may obtain a copy of the License at
- http://www.apache.org/licenses/LICENSE-2.0
- Unless required by applicable law or agreed to in writing, software
- distributed under the License is distributed on an "AS IS" BASIS,
- WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
- See the License for the specific language governing permissions and
- limitations under the License.
- */
- package framework
- import (
- "bytes"
- "encoding/json"
- "fmt"
- "io"
- "io/ioutil"
- "math"
- "math/rand"
- "net"
- "net/http"
- "net/url"
- "os"
- "os/exec"
- "path"
- "path/filepath"
- "regexp"
- goRuntime "runtime"
- "sort"
- "strconv"
- "strings"
- "sync"
- "syscall"
- "time"
- "k8s.io/kubernetes/federation/client/clientset_generated/federation_release_1_4"
- "k8s.io/kubernetes/pkg/api"
- apierrs "k8s.io/kubernetes/pkg/api/errors"
- "k8s.io/kubernetes/pkg/api/resource"
- "k8s.io/kubernetes/pkg/api/unversioned"
- "k8s.io/kubernetes/pkg/api/v1"
- "k8s.io/kubernetes/pkg/apis/extensions"
- "k8s.io/kubernetes/pkg/client/cache"
- clientset "k8s.io/kubernetes/pkg/client/clientset_generated/internalclientset"
- "k8s.io/kubernetes/pkg/client/restclient"
- "k8s.io/kubernetes/pkg/client/typed/discovery"
- "k8s.io/kubernetes/pkg/client/typed/dynamic"
- client "k8s.io/kubernetes/pkg/client/unversioned"
- "k8s.io/kubernetes/pkg/client/unversioned/clientcmd"
- clientcmdapi "k8s.io/kubernetes/pkg/client/unversioned/clientcmd/api"
- gcecloud "k8s.io/kubernetes/pkg/cloudprovider/providers/gce"
- "k8s.io/kubernetes/pkg/controller"
- deploymentutil "k8s.io/kubernetes/pkg/controller/deployment/util"
- "k8s.io/kubernetes/pkg/fields"
- "k8s.io/kubernetes/pkg/kubectl"
- "k8s.io/kubernetes/pkg/kubelet/util/format"
- "k8s.io/kubernetes/pkg/labels"
- "k8s.io/kubernetes/pkg/master/ports"
- "k8s.io/kubernetes/pkg/runtime"
- sshutil "k8s.io/kubernetes/pkg/ssh"
- "k8s.io/kubernetes/pkg/types"
- uexec "k8s.io/kubernetes/pkg/util/exec"
- labelsutil "k8s.io/kubernetes/pkg/util/labels"
- "k8s.io/kubernetes/pkg/util/sets"
- "k8s.io/kubernetes/pkg/util/system"
- "k8s.io/kubernetes/pkg/util/uuid"
- "k8s.io/kubernetes/pkg/util/wait"
- utilyaml "k8s.io/kubernetes/pkg/util/yaml"
- "k8s.io/kubernetes/pkg/version"
- "k8s.io/kubernetes/pkg/watch"
- "github.com/blang/semver"
- "golang.org/x/crypto/ssh"
- "golang.org/x/net/websocket"
- . "github.com/onsi/ginkgo"
- . "github.com/onsi/gomega"
- gomegatypes "github.com/onsi/gomega/types"
- )
// Timeouts, polling intervals and other tunables shared by the e2e framework.
const (
	// PodListTimeout is how long to wait for a pod to become listable.
	PodListTimeout = time.Minute

	// PodStartTimeout is how long to wait for a pod to start. Initial pod
	// start can be delayed O(minutes) by slow docker pulls.
	// TODO: Make this 30 seconds once #4566 is resolved.
	PodStartTimeout = 5 * time.Minute

	// podNoLongerRunningTimeout is how long to wait for a pod to stop running.
	podNoLongerRunningTimeout = 30 * time.Second

	// NamespaceCleanupTimeout is how long to wait for orphaned namespaces to
	// be cleaned up. If there are any, the test is running on a long-lived
	// cluster, and a long wait here is preferable to spurious test failures
	// caused by resources leaked from a previous test run.
	NamespaceCleanupTimeout = 15 * time.Minute

	// slowPodStartTimeout is for pods that can take much longer to get ready
	// due to volume attach/detach latency.
	slowPodStartTimeout = 15 * time.Minute

	// ServiceStartTimeout is how long to wait for a service endpoint to be
	// resolvable.
	ServiceStartTimeout = 1 * time.Minute

	// nonExist is the string used to mark pod deletion.
	nonExist = "NonExist"

	// Poll is how often to poll pods, nodes and claims.
	Poll = 2 * time.Second

	// ServiceAccountProvisionTimeout is how long to wait for a service account.
	// Service accounts are provisioned after namespace creation, and one is
	// required to support pod creation in a namespace as part of admission
	// control.
	ServiceAccountProvisionTimeout = 2 * time.Minute

	// SingleCallTimeout is how long to keep trying single API calls (like
	// 'get' or 'list'). Used to prevent transient failures from failing tests.
	// TODO: client should not apply this timeout to Watch calls. Increased
	// from 30s until that is fixed.
	SingleCallTimeout = 5 * time.Minute

	// NodeReadyInitialTimeout is how long nodes have to be "ready" when a test
	// begins. They should already be "ready" before the test starts, so this
	// is small.
	NodeReadyInitialTimeout = 20 * time.Second

	// PodReadyBeforeTimeout is how long pods have to be "ready" when a test
	// begins.
	PodReadyBeforeTimeout = 5 * time.Minute

	// podScheduledBeforeTimeout is how long pods have to become scheduled
	// onto nodes.
	podScheduledBeforeTimeout = PodListTimeout + (20 * time.Second)

	podRespondingTimeout     = 2 * time.Minute
	ServiceRespondingTimeout = 2 * time.Minute
	EndpointRegisterTimeout  = time.Minute

	// ClaimProvisionTimeout is how long claims have to become dynamically
	// provisioned.
	ClaimProvisionTimeout = 5 * time.Minute

	// Name and version of the pod infra ("pause") container image.
	// When these values are updated, also update
	// cmd/kubelet/app/options/options.go.
	currentPodInfraContainerImageName    = "gcr.io/google_containers/pause"
	currentPodInfraContainerImageVersion = "3.0"

	// RestartPerNodeTimeout is how long each node is given during a process
	// that restarts all nodes before the test is considered failed. (Note
	// that the total time to restart all nodes will be this number times the
	// number of nodes.)
	RestartPerNodeTimeout = 5 * time.Minute

	// RestartPoll is how often to poll the status of a restart.
	RestartPoll = 20 * time.Second

	// RestartNodeReadyAgainTimeout is how long a node is allowed to take to
	// become "Ready" after it is restarted before the test is considered
	// failed.
	RestartNodeReadyAgainTimeout = 5 * time.Minute

	// RestartPodReadyAgainTimeout is how long a pod is allowed to take to
	// become "running" and "ready" after a node restart before the test is
	// considered failed.
	RestartPodReadyAgainTimeout = 5 * time.Minute

	// UpdateRetries is the number of times to retry Updates in case of
	// conflict.
	UpdateRetries = 5
)
var (
	// ImagePullerLabels is the label set allocated to the image puller static
	// pod that runs on each node before e2es.
	ImagePullerLabels = map[string]string{
		"name": "e2e-image-puller",
	}

	// gitVersionRegexp captures the GitVersion value; it is used for parsing
	// the Kubectl version for version-skewed testing.
	gitVersionRegexp = regexp.MustCompile(`GitVersion:"(v.+?)"`)

	// requiredPerNodePods holds regexps for names of pods that have to be
	// running to consider a Node "healthy".
	requiredPerNodePods = []*regexp.Regexp{
		regexp.MustCompile(`.*kube-proxy.*`),
		regexp.MustCompile(`.*fluentd-elasticsearch.*`),
		regexp.MustCompile(`.*node-problem-detector.*`),
	}
)
- // GetServerArchitecture fetches the architecture of the cluster's apiserver.
- func GetServerArchitecture(c *client.Client) string {
- arch := ""
- sVer, err := c.Discovery().ServerVersion()
- if err != nil || sVer.Platform == "" {
- // If we failed to get the server version for some reason, default to amd64.
- arch = "amd64"
- } else {
- // Split the platform string into OS and Arch separately.
- // The platform string may for example be "linux/amd64", "linux/arm" or "windows/amd64".
- osArchArray := strings.Split(sVer.Platform, "/")
- arch = osArchArray[1]
- }
- return arch
- }
- // GetPauseImageName fetches the pause image name for the same architecture as the apiserver.
- func GetPauseImageName(c *client.Client) string {
- return currentPodInfraContainerImageName + "-" + GetServerArchitecture(c) + ":" + currentPodInfraContainerImageVersion
- }
- // GetPauseImageNameForHostArch fetches the pause image name for the same architecture the test is running on.
- func GetPauseImageNameForHostArch() string {
- return currentPodInfraContainerImageName + "-" + goRuntime.GOARCH + ":" + currentPodInfraContainerImageVersion
- }
- // SubResource proxy should have been functional in v1.0.0, but SubResource
- // proxy via tunneling is known to be broken in v1.0. See
- // https://github.com/kubernetes/kubernetes/pull/15224#issuecomment-146769463
- //
- // TODO(ihmccreery): remove once we don't care about v1.0 anymore, (tentatively
- // in v1.3).
- var SubResourcePodProxyVersion = version.MustParse("v1.1.0")
- var subResourceServiceAndNodeProxyVersion = version.MustParse("v1.2.0")
- func GetServicesProxyRequest(c *client.Client, request *restclient.Request) (*restclient.Request, error) {
- subResourceProxyAvailable, err := ServerVersionGTE(subResourceServiceAndNodeProxyVersion, c)
- if err != nil {
- return nil, err
- }
- if subResourceProxyAvailable {
- return request.Resource("services").SubResource("proxy"), nil
- }
- return request.Prefix("proxy").Resource("services"), nil
- }
- // unique identifier of the e2e run
- var RunId = uuid.NewUUID()
- type CreateTestingNSFn func(baseName string, c *client.Client, labels map[string]string) (*api.Namespace, error)
- type ContainerFailures struct {
- status *api.ContainerStateTerminated
- Restarts int
- }
- func GetMasterHost() string {
- masterUrl, err := url.Parse(TestContext.Host)
- ExpectNoError(err)
- return masterUrl.Host
- }
- // Convenient wrapper around cache.Store that returns list of api.Pod instead of interface{}.
- type PodStore struct {
- cache.Store
- stopCh chan struct{}
- reflector *cache.Reflector
- }
- func NewPodStore(c *client.Client, namespace string, label labels.Selector, field fields.Selector) *PodStore {
- lw := &cache.ListWatch{
- ListFunc: func(options api.ListOptions) (runtime.Object, error) {
- options.LabelSelector = label
- options.FieldSelector = field
- return c.Pods(namespace).List(options)
- },
- WatchFunc: func(options api.ListOptions) (watch.Interface, error) {
- options.LabelSelector = label
- options.FieldSelector = field
- return c.Pods(namespace).Watch(options)
- },
- }
- store := cache.NewStore(cache.MetaNamespaceKeyFunc)
- stopCh := make(chan struct{})
- reflector := cache.NewReflector(lw, &api.Pod{}, store, 0)
- reflector.RunUntil(stopCh)
- return &PodStore{store, stopCh, reflector}
- }
- func (s *PodStore) List() []*api.Pod {
- objects := s.Store.List()
- pods := make([]*api.Pod, 0)
- for _, o := range objects {
- pods = append(pods, o.(*api.Pod))
- }
- return pods
- }
- func (s *PodStore) Stop() {
- close(s.stopCh)
- }
- type RCConfig struct {
- Client *client.Client
- Image string
- Command []string
- Name string
- Namespace string
- PollInterval time.Duration
- Timeout time.Duration
- PodStatusFile *os.File
- Replicas int
- CpuRequest int64 // millicores
- CpuLimit int64 // millicores
- MemRequest int64 // bytes
- MemLimit int64 // bytes
- ReadinessProbe *api.Probe
- DNSPolicy *api.DNSPolicy
- // Env vars, set the same for every pod.
- Env map[string]string
- // Extra labels added to every pod.
- Labels map[string]string
- // Node selector for pods in the RC.
- NodeSelector map[string]string
- // Ports to declare in the container (map of name to containerPort).
- Ports map[string]int
- // Ports to declare in the container as host and container ports.
- HostPorts map[string]int
- Volumes []api.Volume
- VolumeMounts []api.VolumeMount
- // Pointer to a list of pods; if non-nil, will be set to a list of pods
- // created by this RC by RunRC.
- CreatedPods *[]*api.Pod
- // Maximum allowable container failures. If exceeded, RunRC returns an error.
- // Defaults to replicas*0.1 if unspecified.
- MaxContainerFailures *int
- // If set to false starting RC will print progress, otherwise only errors will be printed.
- Silent bool
- }
- type DeploymentConfig struct {
- RCConfig
- }
- type ReplicaSetConfig struct {
- RCConfig
- }
// nowStamp returns the current local time formatted with time.StampMilli
// ("Jan _2 15:04:05.000").
func nowStamp() string {
	now := time.Now()
	return now.Format(time.StampMilli)
}
- func log(level string, format string, args ...interface{}) {
- fmt.Fprintf(GinkgoWriter, nowStamp()+": "+level+": "+format+"\n", args...)
- }
- func Logf(format string, args ...interface{}) {
- log("INFO", format, args...)
- }
- func Failf(format string, args ...interface{}) {
- msg := fmt.Sprintf(format, args...)
- log("INFO", msg)
- Fail(nowStamp()+": "+msg, 1)
- }
- func Skipf(format string, args ...interface{}) {
- msg := fmt.Sprintf(format, args...)
- log("INFO", msg)
- Skip(nowStamp() + ": " + msg)
- }
- func SkipUnlessNodeCountIsAtLeast(minNodeCount int) {
- if TestContext.CloudConfig.NumNodes < minNodeCount {
- Skipf("Requires at least %d nodes (not %d)", minNodeCount, TestContext.CloudConfig.NumNodes)
- }
- }
- func SkipUnlessAtLeast(value int, minValue int, message string) {
- if value < minValue {
- Skipf(message)
- }
- }
- func SkipIfProviderIs(unsupportedProviders ...string) {
- if ProviderIs(unsupportedProviders...) {
- Skipf("Not supported for providers %v (found %s)", unsupportedProviders, TestContext.Provider)
- }
- }
- func SkipUnlessProviderIs(supportedProviders ...string) {
- if !ProviderIs(supportedProviders...) {
- Skipf("Only supported for providers %v (not %s)", supportedProviders, TestContext.Provider)
- }
- }
- func SkipIfContainerRuntimeIs(runtimes ...string) {
- for _, runtime := range runtimes {
- if runtime == TestContext.ContainerRuntime {
- Skipf("Not supported under container runtime %s", runtime)
- }
- }
- }
- func ProviderIs(providers ...string) bool {
- for _, provider := range providers {
- if strings.ToLower(provider) == strings.ToLower(TestContext.Provider) {
- return true
- }
- }
- return false
- }
- func SkipUnlessServerVersionGTE(v semver.Version, c discovery.ServerVersionInterface) {
- gte, err := ServerVersionGTE(v, c)
- if err != nil {
- Failf("Failed to get server version: %v", err)
- }
- if !gte {
- Skipf("Not supported for server versions before %q", v)
- }
- }
- // Detects whether the federation namespace exists in the underlying cluster
- func SkipUnlessFederated(c *client.Client) {
- federationNS := os.Getenv("FEDERATION_NAMESPACE")
- if federationNS == "" {
- federationNS = "federation"
- }
- _, err := c.Namespaces().Get(federationNS)
- if err != nil {
- if apierrs.IsNotFound(err) {
- Skipf("Could not find federation namespace %s: skipping federated test", federationNS)
- } else {
- Failf("Unexpected error getting namespace: %v", err)
- }
- }
- }
var (
	// ProvidersWithSSH lists the providers where each node is accessible
	// with SSH.
	ProvidersWithSSH = []string{"gce", "gke", "aws"}

	// providersWithMasterSSH lists the providers where the master node is
	// accessible with SSH.
	providersWithMasterSSH = []string{"gce", "gke", "kubemark", "aws"}
)
- type podCondition func(pod *api.Pod) (bool, error)
- // podReady returns whether pod has a condition of Ready with a status of true.
- // TODO: should be replaced with api.IsPodReady
- func podReady(pod *api.Pod) bool {
- for _, cond := range pod.Status.Conditions {
- if cond.Type == api.PodReady && cond.Status == api.ConditionTrue {
- return true
- }
- }
- return false
- }
- // logPodStates logs basic info of provided pods for debugging.
- func logPodStates(pods []api.Pod) {
- // Find maximum widths for pod, node, and phase strings for column printing.
- maxPodW, maxNodeW, maxPhaseW, maxGraceW := len("POD"), len("NODE"), len("PHASE"), len("GRACE")
- for i := range pods {
- pod := &pods[i]
- if len(pod.ObjectMeta.Name) > maxPodW {
- maxPodW = len(pod.ObjectMeta.Name)
- }
- if len(pod.Spec.NodeName) > maxNodeW {
- maxNodeW = len(pod.Spec.NodeName)
- }
- if len(pod.Status.Phase) > maxPhaseW {
- maxPhaseW = len(pod.Status.Phase)
- }
- }
- // Increase widths by one to separate by a single space.
- maxPodW++
- maxNodeW++
- maxPhaseW++
- maxGraceW++
- // Log pod info. * does space padding, - makes them left-aligned.
- Logf("%-[1]*[2]s %-[3]*[4]s %-[5]*[6]s %-[7]*[8]s %[9]s",
- maxPodW, "POD", maxNodeW, "NODE", maxPhaseW, "PHASE", maxGraceW, "GRACE", "CONDITIONS")
- for _, pod := range pods {
- grace := ""
- if pod.DeletionGracePeriodSeconds != nil {
- grace = fmt.Sprintf("%ds", *pod.DeletionGracePeriodSeconds)
- }
- Logf("%-[1]*[2]s %-[3]*[4]s %-[5]*[6]s %-[7]*[8]s %[9]s",
- maxPodW, pod.ObjectMeta.Name, maxNodeW, pod.Spec.NodeName, maxPhaseW, pod.Status.Phase, maxGraceW, grace, pod.Status.Conditions)
- }
- Logf("") // Final empty line helps for readability.
- }
- // PodRunningReady checks whether pod p's phase is running and it has a ready
- // condition of status true.
- func PodRunningReady(p *api.Pod) (bool, error) {
- // Check the phase is running.
- if p.Status.Phase != api.PodRunning {
- return false, fmt.Errorf("want pod '%s' on '%s' to be '%v' but was '%v'",
- p.ObjectMeta.Name, p.Spec.NodeName, api.PodRunning, p.Status.Phase)
- }
- // Check the ready condition is true.
- if !podReady(p) {
- return false, fmt.Errorf("pod '%s' on '%s' didn't have condition {%v %v}; conditions: %v",
- p.ObjectMeta.Name, p.Spec.NodeName, api.PodReady, api.ConditionTrue, p.Status.Conditions)
- }
- return true, nil
- }
- func PodRunningReadyOrSucceeded(p *api.Pod) (bool, error) {
- // Check if the phase is succeeded.
- if p.Status.Phase == api.PodSucceeded {
- return true, nil
- }
- return PodRunningReady(p)
- }
- // PodNotReady checks whether pod p's has a ready condition of status false.
- func PodNotReady(p *api.Pod) (bool, error) {
- // Check the ready condition is false.
- if podReady(p) {
- return false, fmt.Errorf("pod '%s' on '%s' didn't have condition {%v %v}; conditions: %v",
- p.ObjectMeta.Name, p.Spec.NodeName, api.PodReady, api.ConditionFalse, p.Status.Conditions)
- }
- return true, nil
- }
- // check if a Pod is controlled by a Replication Controller in the List
- func hasReplicationControllersForPod(rcs *api.ReplicationControllerList, pod api.Pod) bool {
- for _, rc := range rcs.Items {
- selector := labels.SelectorFromSet(rc.Spec.Selector)
- if selector.Matches(labels.Set(pod.ObjectMeta.Labels)) {
- return true
- }
- }
- return false
- }
- // WaitForPodsSuccess waits till all labels matching the given selector enter
- // the Success state. The caller is expected to only invoke this method once the
- // pods have been created.
- func WaitForPodsSuccess(c *client.Client, ns string, successPodLabels map[string]string, timeout time.Duration) error {
- successPodSelector := labels.SelectorFromSet(successPodLabels)
- start, badPods := time.Now(), []api.Pod{}
- if wait.PollImmediate(30*time.Second, timeout, func() (bool, error) {
- podList, err := c.Pods(ns).List(api.ListOptions{LabelSelector: successPodSelector})
- if err != nil {
- Logf("Error getting pods in namespace %q: %v", ns, err)
- return false, nil
- }
- if len(podList.Items) == 0 {
- Logf("Waiting for pods to enter Success, but no pods in %q match label %v", ns, successPodLabels)
- return true, nil
- }
- badPods = []api.Pod{}
- for _, pod := range podList.Items {
- if pod.Status.Phase != api.PodSucceeded {
- badPods = append(badPods, pod)
- }
- }
- successPods := len(podList.Items) - len(badPods)
- Logf("%d / %d pods in namespace %q are in Success state (%d seconds elapsed)",
- successPods, len(podList.Items), ns, int(time.Since(start).Seconds()))
- if len(badPods) == 0 {
- return true, nil
- }
- return false, nil
- }) != nil {
- logPodStates(badPods)
- LogPodsWithLabels(c, ns, successPodLabels)
- return fmt.Errorf("Not all pods in namespace %q are successful within %v", ns, timeout)
- }
- return nil
- }
- // WaitForPodsRunningReady waits up to timeout to ensure that all pods in
- // namespace ns are either running and ready, or failed but controlled by a
- // replication controller. Also, it ensures that at least minPods are running
- // and ready. It has separate behavior from other 'wait for' pods functions in
- // that it requires the list of pods on every iteration. This is useful, for
- // example, in cluster startup, because the number of pods increases while
- // waiting.
- // If ignoreLabels is not empty, pods matching this selector are ignored and
- // this function waits for minPods to enter Running/Ready and for all pods
- // matching ignoreLabels to enter Success phase. Otherwise an error is returned
- // even if there are minPods pods, some of which are in Running/Ready
- // and some in Success. This is to allow the client to decide if "Success"
- // means "Ready" or not.
- func WaitForPodsRunningReady(c *client.Client, ns string, minPods int32, timeout time.Duration, ignoreLabels map[string]string) error {
- ignoreSelector := labels.SelectorFromSet(ignoreLabels)
- start := time.Now()
- Logf("Waiting up to %v for all pods (need at least %d) in namespace '%s' to be running and ready",
- timeout, minPods, ns)
- wg := sync.WaitGroup{}
- wg.Add(1)
- var waitForSuccessError error
- go func() {
- waitForSuccessError = WaitForPodsSuccess(c, ns, ignoreLabels, timeout)
- wg.Done()
- }()
- if wait.PollImmediate(Poll, timeout, func() (bool, error) {
- // We get the new list of pods and replication controllers in every
- // iteration because more pods come online during startup and we want to
- // ensure they are also checked.
- rcList, err := c.ReplicationControllers(ns).List(api.ListOptions{})
- if err != nil {
- Logf("Error getting replication controllers in namespace '%s': %v", ns, err)
- return false, nil
- }
- replicas := int32(0)
- for _, rc := range rcList.Items {
- replicas += rc.Spec.Replicas
- }
- podList, err := c.Pods(ns).List(api.ListOptions{})
- if err != nil {
- Logf("Error getting pods in namespace '%s': %v", ns, err)
- return false, nil
- }
- nOk, replicaOk, badPods := int32(0), int32(0), []api.Pod{}
- for _, pod := range podList.Items {
- if len(ignoreLabels) != 0 && ignoreSelector.Matches(labels.Set(pod.Labels)) {
- Logf("%v in state %v, ignoring", pod.Name, pod.Status.Phase)
- continue
- }
- if res, err := PodRunningReady(&pod); res && err == nil {
- nOk++
- if hasReplicationControllersForPod(rcList, pod) {
- replicaOk++
- }
- } else {
- if pod.Status.Phase != api.PodFailed {
- Logf("The status of Pod %s is %s, waiting for it to be either Running or Failed", pod.ObjectMeta.Name, pod.Status.Phase)
- badPods = append(badPods, pod)
- } else if !hasReplicationControllersForPod(rcList, pod) {
- Logf("Pod %s is Failed, but it's not controlled by a ReplicationController", pod.ObjectMeta.Name)
- badPods = append(badPods, pod)
- }
- //ignore failed pods that are controlled by a replication controller
- }
- }
- Logf("%d / %d pods in namespace '%s' are running and ready (%d seconds elapsed)",
- nOk, len(podList.Items), ns, int(time.Since(start).Seconds()))
- Logf("expected %d pod replicas in namespace '%s', %d are Running and Ready.", replicas, ns, replicaOk)
- if replicaOk == replicas && nOk >= minPods && len(badPods) == 0 {
- return true, nil
- }
- logPodStates(badPods)
- return false, nil
- }) != nil {
- return fmt.Errorf("Not all pods in namespace '%s' running and ready within %v", ns, timeout)
- }
- wg.Wait()
- if waitForSuccessError != nil {
- return waitForSuccessError
- }
- return nil
- }
- func podFromManifest(filename string) (*api.Pod, error) {
- var pod api.Pod
- Logf("Parsing pod from %v", filename)
- data := ReadOrDie(filename)
- json, err := utilyaml.ToJSON(data)
- if err != nil {
- return nil, err
- }
- if err := runtime.DecodeInto(api.Codecs.UniversalDecoder(), json, &pod); err != nil {
- return nil, err
- }
- return &pod, nil
- }
- // Run a test container to try and contact the Kubernetes api-server from a pod, wait for it
- // to flip to Ready, log its output and delete it.
- func RunKubernetesServiceTestContainer(c *client.Client, ns string) {
- path := "test/images/clusterapi-tester/pod.yaml"
- p, err := podFromManifest(path)
- if err != nil {
- Logf("Failed to parse clusterapi-tester from manifest %v: %v", path, err)
- return
- }
- p.Namespace = ns
- if _, err := c.Pods(ns).Create(p); err != nil {
- Logf("Failed to create %v: %v", p.Name, err)
- return
- }
- defer func() {
- if err := c.Pods(ns).Delete(p.Name, nil); err != nil {
- Logf("Failed to delete pod %v: %v", p.Name, err)
- }
- }()
- timeout := 5 * time.Minute
- if err := waitForPodCondition(c, ns, p.Name, "clusterapi-tester", timeout, PodRunningReady); err != nil {
- Logf("Pod %v took longer than %v to enter running/ready: %v", p.Name, timeout, err)
- return
- }
- logs, err := GetPodLogs(c, ns, p.Name, p.Spec.Containers[0].Name)
- if err != nil {
- Logf("Failed to retrieve logs from %v: %v", p.Name, err)
- } else {
- Logf("Output of clusterapi-tester:\n%v", logs)
- }
- }
- func kubectlLogPod(c *client.Client, pod api.Pod, containerNameSubstr string) {
- for _, container := range pod.Spec.Containers {
- if strings.Contains(container.Name, containerNameSubstr) {
- // Contains() matches all strings if substr is empty
- logs, err := GetPodLogs(c, pod.Namespace, pod.Name, container.Name)
- if err != nil {
- logs, err = getPreviousPodLogs(c, pod.Namespace, pod.Name, container.Name)
- if err != nil {
- Logf("Failed to get logs of pod %v, container %v, err: %v", pod.Name, container.Name, err)
- }
- }
- By(fmt.Sprintf("Logs of %v/%v:%v on node %v", pod.Namespace, pod.Name, container.Name, pod.Spec.NodeName))
- Logf("%s : STARTLOG\n%s\nENDLOG for container %v:%v:%v", containerNameSubstr, logs, pod.Namespace, pod.Name, container.Name)
- }
- }
- }
- func LogFailedContainers(c *client.Client, ns string) {
- podList, err := c.Pods(ns).List(api.ListOptions{})
- if err != nil {
- Logf("Error getting pods in namespace '%s': %v", ns, err)
- return
- }
- Logf("Running kubectl logs on non-ready containers in %v", ns)
- for _, pod := range podList.Items {
- if res, err := PodRunningReady(&pod); !res || err != nil {
- kubectlLogPod(c, pod, "")
- }
- }
- }
- func LogPodsWithLabels(c *client.Client, ns string, match map[string]string) {
- podList, err := c.Pods(ns).List(api.ListOptions{LabelSelector: labels.SelectorFromSet(match)})
- if err != nil {
- Logf("Error getting pods in namespace %q: %v", ns, err)
- return
- }
- Logf("Running kubectl logs on pods with labels %v in %v", match, ns)
- for _, pod := range podList.Items {
- kubectlLogPod(c, pod, "")
- }
- }
- func LogContainersInPodsWithLabels(c *client.Client, ns string, match map[string]string, containerSubstr string) {
- podList, err := c.Pods(ns).List(api.ListOptions{LabelSelector: labels.SelectorFromSet(match)})
- if err != nil {
- Logf("Error getting pods in namespace %q: %v", ns, err)
- return
- }
- for _, pod := range podList.Items {
- kubectlLogPod(c, pod, containerSubstr)
- }
- }
- // DeleteNamespaces deletes all namespaces that match the given delete and skip filters.
- // Filter is by simple strings.Contains; first skip filter, then delete filter.
- // Returns the list of deleted namespaces or an error.
- func DeleteNamespaces(c *client.Client, deleteFilter, skipFilter []string) ([]string, error) {
- By("Deleting namespaces")
- nsList, err := c.Namespaces().List(api.ListOptions{})
- Expect(err).NotTo(HaveOccurred())
- var deleted []string
- var wg sync.WaitGroup
- OUTER:
- for _, item := range nsList.Items {
- if skipFilter != nil {
- for _, pattern := range skipFilter {
- if strings.Contains(item.Name, pattern) {
- continue OUTER
- }
- }
- }
- if deleteFilter != nil {
- var shouldDelete bool
- for _, pattern := range deleteFilter {
- if strings.Contains(item.Name, pattern) {
- shouldDelete = true
- break
- }
- }
- if !shouldDelete {
- continue OUTER
- }
- }
- wg.Add(1)
- deleted = append(deleted, item.Name)
- go func(nsName string) {
- defer wg.Done()
- defer GinkgoRecover()
- Expect(c.Namespaces().Delete(nsName)).To(Succeed())
- Logf("namespace : %v api call to delete is complete ", nsName)
- }(item.Name)
- }
- wg.Wait()
- return deleted, nil
- }
- func WaitForNamespacesDeleted(c *client.Client, namespaces []string, timeout time.Duration) error {
- By("Waiting for namespaces to vanish")
- nsMap := map[string]bool{}
- for _, ns := range namespaces {
- nsMap[ns] = true
- }
- //Now POLL until all namespaces have been eradicated.
- return wait.Poll(2*time.Second, timeout,
- func() (bool, error) {
- nsList, err := c.Namespaces().List(api.ListOptions{})
- if err != nil {
- return false, err
- }
- for _, item := range nsList.Items {
- if _, ok := nsMap[item.Name]; ok {
- return false, nil
- }
- }
- return true, nil
- })
- }
- func waitForServiceAccountInNamespace(c *client.Client, ns, serviceAccountName string, timeout time.Duration) error {
- w, err := c.ServiceAccounts(ns).Watch(api.SingleObject(api.ObjectMeta{Name: serviceAccountName}))
- if err != nil {
- return err
- }
- _, err = watch.Until(timeout, w, client.ServiceAccountHasSecrets)
- return err
- }
- func waitForPodCondition(c *client.Client, ns, podName, desc string, timeout time.Duration, condition podCondition) error {
- Logf("Waiting up to %[1]v for pod %[2]s status to be %[3]s", timeout, podName, desc)
- for start := time.Now(); time.Since(start) < timeout; time.Sleep(Poll) {
- pod, err := c.Pods(ns).Get(podName)
- if err != nil {
- if apierrs.IsNotFound(err) {
- Logf("Pod %q in namespace %q disappeared. Error: %v", podName, ns, err)
- return err
- }
- // Aligning this text makes it much more readable
- Logf("Get pod %[1]s in namespace '%[2]s' failed, ignoring for %[3]v. Error: %[4]v",
- podName, ns, Poll, err)
- continue
- }
- done, err := condition(pod)
- if done {
- return err
- }
- Logf("Waiting for pod %[1]s in namespace '%[2]s' status to be '%[3]s'"+
- "(found phase: %[4]q, readiness: %[5]t) (%[6]v elapsed)",
- podName, ns, desc, pod.Status.Phase, podReady(pod), time.Since(start))
- }
- return fmt.Errorf("gave up waiting for pod '%s' to be '%s' after %v", podName, desc, timeout)
- }
- // WaitForMatchPodsCondition finds match pods based on the input ListOptions.
- // waits and checks if all match pods are in the given podCondition
- func WaitForMatchPodsCondition(c *client.Client, opts api.ListOptions, desc string, timeout time.Duration, condition podCondition) error {
- Logf("Waiting up to %v for matching pods' status to be %s", timeout, desc)
- for start := time.Now(); time.Since(start) < timeout; time.Sleep(Poll) {
- pods, err := c.Pods(api.NamespaceAll).List(opts)
- if err != nil {
- return err
- }
- conditionNotMatch := []string{}
- for _, pod := range pods.Items {
- done, err := condition(&pod)
- if done && err != nil {
- return fmt.Errorf("Unexpected error: %v", err)
- }
- if !done {
- conditionNotMatch = append(conditionNotMatch, format.Pod(&pod))
- }
- }
- if len(conditionNotMatch) <= 0 {
- return err
- }
- Logf("%d pods are not %s", len(conditionNotMatch), desc)
- }
- return fmt.Errorf("gave up waiting for matching pods to be '%s' after %v", desc, timeout)
- }
- // WaitForDefaultServiceAccountInNamespace waits for the default service account to be provisioned
- // the default service account is what is associated with pods when they do not specify a service account
- // as a result, pods are not able to be provisioned in a namespace until the service account is provisioned
- func WaitForDefaultServiceAccountInNamespace(c *client.Client, namespace string) error {
- return waitForServiceAccountInNamespace(c, namespace, "default", ServiceAccountProvisionTimeout)
- }
- // WaitForFederationApiserverReady waits for the federation apiserver to be ready.
- // It tests the readiness by sending a GET request and expecting a non error response.
- func WaitForFederationApiserverReady(c *federation_release_1_4.Clientset) error {
- return wait.PollImmediate(time.Second, 1*time.Minute, func() (bool, error) {
- _, err := c.Federation().Clusters().List(api.ListOptions{})
- if err != nil {
- return false, nil
- }
- return true, nil
- })
- }
- // WaitForPersistentVolumePhase waits for a PersistentVolume to be in a specific phase or until timeout occurs, whichever comes first.
- func WaitForPersistentVolumePhase(phase api.PersistentVolumePhase, c *client.Client, pvName string, Poll, timeout time.Duration) error {
- Logf("Waiting up to %v for PersistentVolume %s to have phase %s", timeout, pvName, phase)
- for start := time.Now(); time.Since(start) < timeout; time.Sleep(Poll) {
- pv, err := c.PersistentVolumes().Get(pvName)
- if err != nil {
- Logf("Get persistent volume %s in failed, ignoring for %v: %v", pvName, Poll, err)
- continue
- } else {
- if pv.Status.Phase == phase {
- Logf("PersistentVolume %s found and phase=%s (%v)", pvName, phase, time.Since(start))
- return nil
- } else {
- Logf("PersistentVolume %s found but phase is %s instead of %s.", pvName, pv.Status.Phase, phase)
- }
- }
- }
- return fmt.Errorf("PersistentVolume %s not in phase %s within %v", pvName, phase, timeout)
- }
- // WaitForPersistentVolumeDeleted waits for a PersistentVolume to get deleted or until timeout occurs, whichever comes first.
- func WaitForPersistentVolumeDeleted(c *client.Client, pvName string, Poll, timeout time.Duration) error {
- Logf("Waiting up to %v for PersistentVolume %s to get deleted", timeout, pvName)
- for start := time.Now(); time.Since(start) < timeout; time.Sleep(Poll) {
- pv, err := c.PersistentVolumes().Get(pvName)
- if err == nil {
- Logf("PersistentVolume %s found and phase=%s (%v)", pvName, pv.Status.Phase, time.Since(start))
- continue
- } else {
- if apierrs.IsNotFound(err) {
- Logf("PersistentVolume %s was removed", pvName)
- return nil
- } else {
- Logf("Get persistent volume %s in failed, ignoring for %v: %v", pvName, Poll, err)
- }
- }
- }
- return fmt.Errorf("PersistentVolume %s still exists within %v", pvName, timeout)
- }
- // WaitForPersistentVolumeClaimPhase waits for a PersistentVolumeClaim to be in a specific phase or until timeout occurs, whichever comes first.
- func WaitForPersistentVolumeClaimPhase(phase api.PersistentVolumeClaimPhase, c *client.Client, ns string, pvcName string, Poll, timeout time.Duration) error {
- Logf("Waiting up to %v for PersistentVolumeClaim %s to have phase %s", timeout, pvcName, phase)
- for start := time.Now(); time.Since(start) < timeout; time.Sleep(Poll) {
- pvc, err := c.PersistentVolumeClaims(ns).Get(pvcName)
- if err != nil {
- Logf("Get persistent volume claim %s in failed, ignoring for %v: %v", pvcName, Poll, err)
- continue
- } else {
- if pvc.Status.Phase == phase {
- Logf("PersistentVolumeClaim %s found and phase=%s (%v)", pvcName, phase, time.Since(start))
- return nil
- } else {
- Logf("PersistentVolumeClaim %s found but phase is %s instead of %s.", pvcName, pvc.Status.Phase, phase)
- }
- }
- }
- return fmt.Errorf("PersistentVolumeClaim %s not in phase %s within %v", pvcName, phase, timeout)
- }
- // CreateTestingNS should be used by every test, note that we append a common prefix to the provided test name.
- // Please see NewFramework instead of using this directly.
- func CreateTestingNS(baseName string, c *client.Client, labels map[string]string) (*api.Namespace, error) {
- if labels == nil {
- labels = map[string]string{}
- }
- labels["e2e-run"] = string(RunId)
- namespaceObj := &api.Namespace{
- ObjectMeta: api.ObjectMeta{
- GenerateName: fmt.Sprintf("e2e-tests-%v-", baseName),
- Namespace: "",
- Labels: labels,
- },
- Status: api.NamespaceStatus{},
- }
- // Be robust about making the namespace creation call.
- var got *api.Namespace
- if err := wait.PollImmediate(Poll, SingleCallTimeout, func() (bool, error) {
- var err error
- got, err = c.Namespaces().Create(namespaceObj)
- if err != nil {
- Logf("Unexpected error while creating namespace: %v", err)
- return false, nil
- }
- return true, nil
- }); err != nil {
- return nil, err
- }
- if TestContext.VerifyServiceAccount {
- if err := WaitForDefaultServiceAccountInNamespace(c, got.Name); err != nil {
- return nil, err
- }
- }
- return got, nil
- }
- // CheckTestingNSDeletedExcept checks whether all e2e based existing namespaces are in the Terminating state
- // and waits until they are finally deleted. It ignores namespace skip.
- func CheckTestingNSDeletedExcept(c *client.Client, skip string) error {
- // TODO: Since we don't have support for bulk resource deletion in the API,
- // while deleting a namespace we are deleting all objects from that namespace
- // one by one (one deletion == one API call). This basically exposes us to
- // throttling - currently controller-manager has a limit of max 20 QPS.
- // Once #10217 is implemented and used in namespace-controller, deleting all
- // object from a given namespace should be much faster and we will be able
- // to lower this timeout.
- // However, now Density test is producing ~26000 events and Load capacity test
- // is producing ~35000 events, thus assuming there are no other requests it will
- // take ~30 minutes to fully delete the namespace. Thus I'm setting it to 60
- // minutes to avoid any timeouts here.
- timeout := 60 * time.Minute
- Logf("Waiting for terminating namespaces to be deleted...")
- for start := time.Now(); time.Since(start) < timeout; time.Sleep(15 * time.Second) {
- namespaces, err := c.Namespaces().List(api.ListOptions{})
- if err != nil {
- Logf("Listing namespaces failed: %v", err)
- continue
- }
- terminating := 0
- for _, ns := range namespaces.Items {
- if strings.HasPrefix(ns.ObjectMeta.Name, "e2e-tests-") && ns.ObjectMeta.Name != skip {
- if ns.Status.Phase == api.NamespaceActive {
- return fmt.Errorf("Namespace %s is active", ns.ObjectMeta.Name)
- }
- terminating++
- }
- }
- if terminating == 0 {
- return nil
- }
- }
- return fmt.Errorf("Waiting for terminating namespaces to be deleted timed out")
- }
- // deleteNS deletes the provided namespace, waits for it to be completely deleted, and then checks
- // whether there are any pods remaining in a non-terminating state.
- func deleteNS(c *client.Client, clientPool dynamic.ClientPool, namespace string, timeout time.Duration) error {
- if err := c.Namespaces().Delete(namespace); err != nil {
- return err
- }
- // wait for namespace to delete or timeout.
- err := wait.PollImmediate(5*time.Second, timeout, func() (bool, error) {
- if _, err := c.Namespaces().Get(namespace); err != nil {
- if apierrs.IsNotFound(err) {
- return true, nil
- }
- Logf("Error while waiting for namespace to be terminated: %v", err)
- return false, nil
- }
- return false, nil
- })
- // verify there is no more remaining content in the namespace
- remainingContent, cerr := hasRemainingContent(c, clientPool, namespace)
- if cerr != nil {
- return cerr
- }
- // if content remains, let's dump information about the namespace, and system for flake debugging.
- remainingPods := 0
- missingTimestamp := 0
- if remainingContent {
- // log information about namespace, and set of namespaces in api server to help flake detection
- logNamespace(c, namespace)
- logNamespaces(c, namespace)
- // if we can, check if there were pods remaining with no timestamp.
- remainingPods, missingTimestamp, _ = countRemainingPods(c, namespace)
- }
- // a timeout waiting for namespace deletion happened!
- if err != nil {
- // some content remains in the namespace
- if remainingContent {
- // pods remain
- if remainingPods > 0 {
- // but they were all undergoing deletion (kubelet is probably culprit)
- if missingTimestamp == 0 {
- return fmt.Errorf("namespace %v was not deleted with limit: %v, pods remaining: %v, pods missing deletion timestamp: %v", namespace, err, remainingPods, missingTimestamp)
- }
- // pods remained, but were not undergoing deletion (namespace controller is probably culprit)
- return fmt.Errorf("namespace %v was not deleted with limit: %v, pods remaining: %v", namespace, err, remainingPods)
- }
- // other content remains (namespace controller is probably screwed up)
- return fmt.Errorf("namespace %v was not deleted with limit: %v, namespaced content other than pods remain", namespace, err)
- }
- // no remaining content, but namespace was not deleted (namespace controller is probably wedged)
- return fmt.Errorf("namespace %v was not deleted with limit: %v, namespace is empty but is not yet removed", namespace, err)
- }
- return nil
- }
- // logNamespaces logs the number of namespaces by phase
- // namespace is the namespace the test was operating against that failed to delete so it can be grepped in logs
- func logNamespaces(c *client.Client, namespace string) {
- namespaceList, err := c.Namespaces().List(api.ListOptions{})
- if err != nil {
- Logf("namespace: %v, unable to list namespaces: %v", namespace, err)
- return
- }
- numActive := 0
- numTerminating := 0
- for _, namespace := range namespaceList.Items {
- if namespace.Status.Phase == api.NamespaceActive {
- numActive++
- } else {
- numTerminating++
- }
- }
- Logf("namespace: %v, total namespaces: %v, active: %v, terminating: %v", namespace, len(namespaceList.Items), numActive, numTerminating)
- }
- // logNamespace logs detail about a namespace
- func logNamespace(c *client.Client, namespace string) {
- ns, err := c.Namespaces().Get(namespace)
- if err != nil {
- if apierrs.IsNotFound(err) {
- Logf("namespace: %v no longer exists", namespace)
- return
- }
- Logf("namespace: %v, unable to get namespace due to error: %v", namespace, err)
- return
- }
- Logf("namespace: %v, DeletionTimetamp: %v, Finalizers: %v, Phase: %v", ns.Name, ns.DeletionTimestamp, ns.Spec.Finalizers, ns.Status.Phase)
- }
- // countRemainingPods queries the server to count number of remaining pods, and number of pods that had a missing deletion timestamp.
- func countRemainingPods(c *client.Client, namespace string) (int, int, error) {
- // check for remaining pods
- pods, err := c.Pods(namespace).List(api.ListOptions{})
- if err != nil {
- return 0, 0, err
- }
- // nothing remains!
- if len(pods.Items) == 0 {
- return 0, 0, nil
- }
- // stuff remains, log about it
- logPodStates(pods.Items)
- // check if there were any pods with missing deletion timestamp
- numPods := len(pods.Items)
- missingTimestamp := 0
- for _, pod := range pods.Items {
- if pod.DeletionTimestamp == nil {
- missingTimestamp++
- }
- }
- return numPods, missingTimestamp, nil
- }
- // hasRemainingContent checks if there is remaining content in the namespace via API discovery
- func hasRemainingContent(c *client.Client, clientPool dynamic.ClientPool, namespace string) (bool, error) {
- // some tests generate their own framework.Client rather than the default
- // TODO: ensure every test call has a configured clientPool
- if clientPool == nil {
- return false, nil
- }
- // find out what content is supported on the server
- groupVersionResources, err := c.Discovery().ServerPreferredNamespacedResources()
- if err != nil {
- return false, err
- }
- // TODO: temporary hack for https://github.com/kubernetes/kubernetes/issues/31798
- ignoredResources := sets.NewString("bindings")
- contentRemaining := false
- // dump how many of resource type is on the server in a log.
- for _, gvr := range groupVersionResources {
- // get a client for this group version...
- dynamicClient, err := clientPool.ClientForGroupVersion(gvr.GroupVersion())
- if err != nil {
- // not all resource types support list, so some errors here are normal depending on the resource type.
- Logf("namespace: %s, unable to get client - gvr: %v, error: %v", namespace, gvr, err)
- continue
- }
- // get the api resource
- apiResource := unversioned.APIResource{Name: gvr.Resource, Namespaced: true}
- // TODO: temporary hack for https://github.com/kubernetes/kubernetes/issues/31798
- if ignoredResources.Has(apiResource.Name) {
- Logf("namespace: %s, resource: %s, ignored listing per whitelist", namespace, apiResource.Name)
- continue
- }
- obj, err := dynamicClient.Resource(&apiResource, namespace).List(&v1.ListOptions{})
- if err != nil {
- // not all resources support list, so we ignore those
- if apierrs.IsMethodNotSupported(err) || apierrs.IsNotFound(err) || apierrs.IsForbidden(err) {
- continue
- }
- return false, err
- }
- unstructuredList, ok := obj.(*runtime.UnstructuredList)
- if !ok {
- return false, fmt.Errorf("namespace: %s, resource: %s, expected *runtime.UnstructuredList, got %#v", namespace, apiResource.Name, obj)
- }
- if len(unstructuredList.Items) > 0 {
- Logf("namespace: %s, resource: %s, items remaining: %v", namespace, apiResource.Name, len(unstructuredList.Items))
- contentRemaining = true
- }
- }
- return contentRemaining, nil
- }
- func ContainerInitInvariant(older, newer runtime.Object) error {
- oldPod := older.(*api.Pod)
- newPod := newer.(*api.Pod)
- if len(oldPod.Spec.InitContainers) == 0 {
- return nil
- }
- if len(oldPod.Spec.InitContainers) != len(newPod.Spec.InitContainers) {
- return fmt.Errorf("init container list changed")
- }
- if oldPod.UID != newPod.UID {
- return fmt.Errorf("two different pods exist in the condition: %s vs %s", oldPod.UID, newPod.UID)
- }
- if err := initContainersInvariants(oldPod); err != nil {
- return err
- }
- if err := initContainersInvariants(newPod); err != nil {
- return err
- }
- oldInit, _, _ := podInitialized(oldPod)
- newInit, _, _ := podInitialized(newPod)
- if oldInit && !newInit {
- // TODO: we may in the future enable resetting PodInitialized = false if the kubelet needs to restart it
- // from scratch
- return fmt.Errorf("pod cannot be initialized and then regress to not being initialized")
- }
- return nil
- }
- func podInitialized(pod *api.Pod) (ok bool, failed bool, err error) {
- allInit := true
- initFailed := false
- for _, s := range pod.Status.InitContainerStatuses {
- switch {
- case initFailed && s.State.Waiting == nil:
- return allInit, initFailed, fmt.Errorf("container %s is after a failed container but isn't waiting", s.Name)
- case allInit && s.State.Waiting == nil:
- return allInit, initFailed, fmt.Errorf("container %s is after an initializing container but isn't waiting", s.Name)
- case s.State.Terminated == nil:
- allInit = false
- case s.State.Terminated.ExitCode != 0:
- allInit = false
- initFailed = true
- case !s.Ready:
- return allInit, initFailed, fmt.Errorf("container %s initialized but isn't marked as ready", s.Name)
- }
- }
- return allInit, initFailed, nil
- }
- func initContainersInvariants(pod *api.Pod) error {
- allInit, initFailed, err := podInitialized(pod)
- if err != nil {
- return err
- }
- if !allInit || initFailed {
- for _, s := range pod.Status.ContainerStatuses {
- if s.State.Waiting == nil || s.RestartCount != 0 {
- return fmt.Errorf("container %s is not waiting but initialization not complete", s.Name)
- }
- if s.State.Waiting.Reason != "PodInitializing" {
- return fmt.Errorf("container %s should have reason PodInitializing: %s", s.Name, s.State.Waiting.Reason)
- }
- }
- }
- _, c := api.GetPodCondition(&pod.Status, api.PodInitialized)
- if c == nil {
- return fmt.Errorf("pod does not have initialized condition")
- }
- if c.LastTransitionTime.IsZero() {
- return fmt.Errorf("PodInitialized condition should always have a transition time")
- }
- switch {
- case c.Status == api.ConditionUnknown:
- return fmt.Errorf("PodInitialized condition should never be Unknown")
- case c.Status == api.ConditionTrue && (initFailed || !allInit):
- return fmt.Errorf("PodInitialized condition was True but all not all containers initialized")
- case c.Status == api.ConditionFalse && (!initFailed && allInit):
- return fmt.Errorf("PodInitialized condition was False but all containers initialized")
- }
- return nil
- }
- type InvariantFunc func(older, newer runtime.Object) error
- func CheckInvariants(events []watch.Event, fns ...InvariantFunc) error {
- errs := sets.NewString()
- for i := range events {
- j := i + 1
- if j >= len(events) {
- continue
- }
- for _, fn := range fns {
- if err := fn(events[i].Object, events[j].Object); err != nil {
- errs.Insert(err.Error())
- }
- }
- }
- if errs.Len() > 0 {
- return fmt.Errorf("invariants violated:\n* %s", strings.Join(errs.List(), "\n* "))
- }
- return nil
- }
- // Waits default amount of time (PodStartTimeout) for the specified pod to become running.
- // Returns an error if timeout occurs first, or pod goes in to failed state.
- func WaitForPodRunningInNamespace(c *client.Client, pod *api.Pod) error {
- // this short-cicuit is needed for cases when we pass a list of pods instead
- // of newly created pod (eg. VerifyPods) which means we are getting already
- // running pod for which waiting does not make sense and will always fail
- if pod.Status.Phase == api.PodRunning {
- return nil
- }
- return waitTimeoutForPodRunningInNamespace(c, pod.Name, pod.Namespace, pod.ResourceVersion, PodStartTimeout)
- }
- // Waits default amount of time (PodStartTimeout) for the specified pod to become running.
- // Returns an error if timeout occurs first, or pod goes in to failed state.
- func WaitForPodNameRunningInNamespace(c *client.Client, podName, namespace string) error {
- return waitTimeoutForPodRunningInNamespace(c, podName, namespace, "", PodStartTimeout)
- }
- // Waits an extended amount of time (slowPodStartTimeout) for the specified pod to become running.
- // The resourceVersion is used when Watching object changes, it tells since when we care
- // about changes to the pod. Returns an error if timeout occurs first, or pod goes in to failed state.
- func waitForPodRunningInNamespaceSlow(c *client.Client, podName, namespace, resourceVersion string) error {
- return waitTimeoutForPodRunningInNamespace(c, podName, namespace, resourceVersion, slowPodStartTimeout)
- }
- func waitTimeoutForPodRunningInNamespace(c *client.Client, podName, namespace, resourceVersion string, timeout time.Duration) error {
- w, err := c.Pods(namespace).Watch(api.SingleObject(api.ObjectMeta{Name: podName, ResourceVersion: resourceVersion}))
- if err != nil {
- return err
- }
- _, err = watch.Until(timeout, w, client.PodRunning)
- return err
- }
- // Waits default amount of time (podNoLongerRunningTimeout) for the specified pod to stop running.
- // Returns an error if timeout occurs first.
- func WaitForPodNoLongerRunningInNamespace(c *client.Client, podName, namespace, resourceVersion string) error {
- return WaitTimeoutForPodNoLongerRunningInNamespace(c, podName, namespace, resourceVersion, podNoLongerRunningTimeout)
- }
- func WaitTimeoutForPodNoLongerRunningInNamespace(c *client.Client, podName, namespace, resourceVersion string, timeout time.Duration) error {
- w, err := c.Pods(namespace).Watch(api.SingleObject(api.ObjectMeta{Name: podName, ResourceVersion: resourceVersion}))
- if err != nil {
- return err
- }
- _, err = watch.Until(timeout, w, client.PodCompleted)
- return err
- }
- func waitTimeoutForPodReadyInNamespace(c *client.Client, podName, namespace, resourceVersion string, timeout time.Duration) error {
- w, err := c.Pods(namespace).Watch(api.SingleObject(api.ObjectMeta{Name: podName, ResourceVersion: resourceVersion}))
- if err != nil {
- return err
- }
- _, err = watch.Until(timeout, w, client.PodRunningAndReady)
- return err
- }
- // WaitForPodNotPending returns an error if it took too long for the pod to go out of pending state.
- // The resourceVersion is used when Watching object changes, it tells since when we care
- // about changes to the pod.
- func WaitForPodNotPending(c *client.Client, ns, podName, resourceVersion string) error {
- w, err := c.Pods(ns).Watch(api.SingleObject(api.ObjectMeta{Name: podName, ResourceVersion: resourceVersion}))
- if err != nil {
- return err
- }
- _, err = watch.Until(PodStartTimeout, w, client.PodNotPending)
- return err
- }
- // waitForPodTerminatedInNamespace returns an error if it took too long for the pod
- // to terminate or if the pod terminated with an unexpected reason.
- func waitForPodTerminatedInNamespace(c *client.Client, podName, reason, namespace string) error {
- return waitForPodCondition(c, namespace, podName, "terminated due to deadline exceeded", PodStartTimeout, func(pod *api.Pod) (bool, error) {
- if pod.Status.Phase == api.PodFailed {
- if pod.Status.Reason == reason {
- return true, nil
- } else {
- return true, fmt.Errorf("Expected pod %v in namespace %v to be terminated with reason %v, got reason: %v", podName, namespace, reason, pod.Status.Reason)
- }
- }
- return false, nil
- })
- }
- // waitForPodSuccessInNamespaceTimeout returns nil if the pod reached state success, or an error if it reached failure or ran too long.
- func waitForPodSuccessInNamespaceTimeout(c *client.Client, podName string, contName string, namespace string, timeout time.Duration) error {
- return waitForPodCondition(c, namespace, podName, "success or failure", timeout, func(pod *api.Pod) (bool, error) {
- // Cannot use pod.Status.Phase == api.PodSucceeded/api.PodFailed due to #2632
- ci, ok := api.GetContainerStatus(pod.Status.ContainerStatuses, contName)
- if !ok {
- Logf("No Status.Info for container '%s' in pod '%s' yet", contName, podName)
- } else {
- if ci.State.Terminated != nil {
- if ci.State.Terminated.ExitCode == 0 {
- By("Saw pod success")
- return true, nil
- }
- return true, fmt.Errorf("pod '%s' terminated with failure: %+v", podName, ci.State.Terminated)
- }
- Logf("Nil State.Terminated for container '%s' in pod '%s' in namespace '%s' so far", contName, podName, namespace)
- }
- return false, nil
- })
- }
- // WaitForPodSuccessInNamespace returns nil if the pod reached state success, or an error if it reached failure or until podStartupTimeout.
- func WaitForPodSuccessInNamespace(c *client.Client, podName string, contName string, namespace string) error {
- return waitForPodSuccessInNamespaceTimeout(c, podName, contName, namespace, PodStartTimeout)
- }
- // WaitForPodSuccessInNamespaceSlow returns nil if the pod reached state success, or an error if it reached failure or until slowPodStartupTimeout.
- func WaitForPodSuccessInNamespaceSlow(c *client.Client, podName string, contName string, namespace string) error {
- return waitForPodSuccessInNamespaceTimeout(c, podName, contName, namespace, slowPodStartTimeout)
- }
- // waitForRCPodOnNode returns the pod from the given replication controller (described by rcName) which is scheduled on the given node.
- // In case of failure or too long waiting time, an error is returned.
- func waitForRCPodOnNode(c *client.Client, ns, rcName, node string) (*api.Pod, error) {
- label := labels.SelectorFromSet(labels.Set(map[string]string{"name": rcName}))
- var p *api.Pod = nil
- err := wait.PollImmediate(10*time.Second, 5*time.Minute, func() (bool, error) {
- Logf("Waiting for pod %s to appear on node %s", rcName, node)
- options := api.ListOptions{LabelSelector: label}
- pods, err := c.Pods(ns).List(options)
- if err != nil {
- return false, err
- }
- for _, pod := range pods.Items {
- if pod.Spec.NodeName == node {
- Logf("Pod %s found on node %s", pod.Name, node)
- p = &pod
- return true, nil
- }
- }
- return false, nil
- })
- return p, err
- }
- // WaitForRCToStabilize waits till the RC has a matching generation/replica count between spec and status.
- func WaitForRCToStabilize(c *client.Client, ns, name string, timeout time.Duration) error {
- options := api.ListOptions{FieldSelector: fields.Set{
- "metadata.name": name,
- "metadata.namespace": ns,
- }.AsSelector()}
- w, err := c.ReplicationControllers(ns).Watch(options)
- if err != nil {
- return err
- }
- _, err = watch.Until(timeout, w, func(event watch.Event) (bool, error) {
- switch event.Type {
- case watch.Deleted:
- return false, apierrs.NewNotFound(unversioned.GroupResource{Resource: "replicationcontrollers"}, "")
- }
- switch rc := event.Object.(type) {
- case *api.ReplicationController:
- if rc.Name == name && rc.Namespace == ns &&
- rc.Generation <= rc.Status.ObservedGeneration &&
- rc.Spec.Replicas == rc.Status.Replicas {
- return true, nil
- }
- Logf("Waiting for rc %s to stabilize, generation %v observed generation %v spec.replicas %d status.replicas %d",
- name, rc.Generation, rc.Status.ObservedGeneration, rc.Spec.Replicas, rc.Status.Replicas)
- }
- return false, nil
- })
- return err
- }
- func WaitForPodToDisappear(c *client.Client, ns, podName string, label labels.Selector, interval, timeout time.Duration) error {
- return wait.PollImmediate(interval, timeout, func() (bool, error) {
- Logf("Waiting for pod %s to disappear", podName)
- options := api.ListOptions{LabelSelector: label}
- pods, err := c.Pods(ns).List(options)
- if err != nil {
- return false, err
- }
- found := false
- for _, pod := range pods.Items {
- if pod.Name == podName {
- Logf("Pod %s still exists", podName)
- found = true
- }
- }
- if !found {
- Logf("Pod %s no longer exists", podName)
- return true, nil
- }
- return false, nil
- })
- }
- // WaitForRCPodToDisappear returns nil if the pod from the given replication controller (described by rcName) no longer exists.
- // In case of failure or too long waiting time, an error is returned.
- func WaitForRCPodToDisappear(c *client.Client, ns, rcName, podName string) error {
- label := labels.SelectorFromSet(labels.Set(map[string]string{"name": rcName}))
- // NodeController evicts pod after 5 minutes, so we need timeout greater than that.
- // Additionally, there can be non-zero grace period, so we are setting 10 minutes
- // to be on the safe size.
- return WaitForPodToDisappear(c, ns, podName, label, 20*time.Second, 10*time.Minute)
- }
- // WaitForService waits until the service appears (exist == true), or disappears (exist == false)
- func WaitForService(c *client.Client, namespace, name string, exist bool, interval, timeout time.Duration) error {
- err := wait.PollImmediate(interval, timeout, func() (bool, error) {
- _, err := c.Services(namespace).Get(name)
- switch {
- case err == nil:
- if !exist {
- return false, nil
- }
- Logf("Service %s in namespace %s found.", name, namespace)
- return true, nil
- case apierrs.IsNotFound(err):
- if exist {
- return false, nil
- }
- Logf("Service %s in namespace %s disappeared.", name, namespace)
- return true, nil
- default:
- Logf("Get service %s in namespace %s failed: %v", name, namespace, err)
- return false, nil
- }
- })
- if err != nil {
- stateMsg := map[bool]string{true: "to appear", false: "to disappear"}
- return fmt.Errorf("error waiting for service %s/%s %s: %v", namespace, name, stateMsg[exist], err)
- }
- return nil
- }
- //WaitForServiceEndpointsNum waits until the amount of endpoints that implement service to expectNum.
- func WaitForServiceEndpointsNum(c *client.Client, namespace, serviceName string, expectNum int, interval, timeout time.Duration) error {
- return wait.Poll(interval, timeout, func() (bool, error) {
- Logf("Waiting for amount of service:%s endpoints to be %d", serviceName, expectNum)
- list, err := c.Endpoints(namespace).List(api.ListOptions{})
- if err != nil {
- return false, err
- }
- for _, e := range list.Items {
- if e.Name == serviceName && countEndpointsNum(&e) == expectNum {
- return true, nil
- }
- }
- return false, nil
- })
- }
- func countEndpointsNum(e *api.Endpoints) int {
- num := 0
- for _, sub := range e.Subsets {
- num += len(sub.Addresses)
- }
- return num
- }
- // WaitForReplicationController waits until the RC appears (exist == true), or disappears (exist == false)
- func WaitForReplicationController(c *client.Client, namespace, name string, exist bool, interval, timeout time.Duration) error {
- err := wait.PollImmediate(interval, timeout, func() (bool, error) {
- _, err := c.ReplicationControllers(namespace).Get(name)
- if err != nil {
- Logf("Get ReplicationController %s in namespace %s failed (%v).", name, namespace, err)
- return !exist, nil
- } else {
- Logf("ReplicationController %s in namespace %s found.", name, namespace)
- return exist, nil
- }
- })
- if err != nil {
- stateMsg := map[bool]string{true: "to appear", false: "to disappear"}
- return fmt.Errorf("error waiting for ReplicationController %s/%s %s: %v", namespace, name, stateMsg[exist], err)
- }
- return nil
- }
- func WaitForEndpoint(c *client.Client, ns, name string) error {
- for t := time.Now(); time.Since(t) < EndpointRegisterTimeout; time.Sleep(Poll) {
- endpoint, err := c.Endpoints(ns).Get(name)
- Expect(err).NotTo(HaveOccurred())
- if len(endpoint.Subsets) == 0 || len(endpoint.Subsets[0].Addresses) == 0 {
- Logf("Endpoint %s/%s is not ready yet", ns, name)
- continue
- } else {
- return nil
- }
- }
- return fmt.Errorf("Failed to get endpoints for %s/%s", ns, name)
- }
- // Context for checking pods responses by issuing GETs to them (via the API
- // proxy) and verifying that they answer with ther own pod name.
- type podProxyResponseChecker struct {
- c *client.Client
- ns string
- label labels.Selector
- controllerName string
- respondName bool // Whether the pod should respond with its own name.
- pods *api.PodList
- }
- func PodProxyResponseChecker(c *client.Client, ns string, label labels.Selector, controllerName string, respondName bool, pods *api.PodList) podProxyResponseChecker {
- return podProxyResponseChecker{c, ns, label, controllerName, respondName, pods}
- }
- // CheckAllResponses issues GETs to all pods in the context and verify they
- // reply with their own pod name.
- func (r podProxyResponseChecker) CheckAllResponses() (done bool, err error) {
- successes := 0
- options := api.ListOptions{LabelSelector: r.label}
- currentPods, err := r.c.Pods(r.ns).List(options)
- Expect(err).NotTo(HaveOccurred())
- for i, pod := range r.pods.Items {
- // Check that the replica list remains unchanged, otherwise we have problems.
- if !isElementOf(pod.UID, currentPods) {
- return false, fmt.Errorf("pod with UID %s is no longer a member of the replica set. Must have been restarted for some reason. Current replica set: %v", pod.UID, currentPods)
- }
- subResourceProxyAvailable, err := ServerVersionGTE(SubResourcePodProxyVersion, r.c)
- if err != nil {
- return false, err
- }
- var body []byte
- if subResourceProxyAvailable {
- body, err = r.c.Get().
- Namespace(r.ns).
- Resource("pods").
- SubResource("proxy").
- Name(string(pod.Name)).
- Do().
- Raw()
- } else {
- body, err = r.c.Get().
- Prefix("proxy").
- Namespace(r.ns).
- Resource("pods").
- Name(string(pod.Name)).
- Do().
- Raw()
- }
- if err != nil {
- Logf("Controller %s: Failed to GET from replica %d [%s]: %v:", r.controllerName, i+1, pod.Name, err)
- continue
- }
- // The response checker expects the pod's name unless !respondName, in
- // which case it just checks for a non-empty response.
- got := string(body)
- what := ""
- if r.respondName {
- what = "expected"
- want := pod.Name
- if got != want {
- Logf("Controller %s: Replica %d [%s] expected response %q but got %q",
- r.controllerName, i+1, pod.Name, want, got)
- continue
- }
- } else {
- what = "non-empty"
- if len(got) == 0 {
- Logf("Controller %s: Replica %d [%s] expected non-empty response",
- r.controllerName, i+1, pod.Name)
- continue
- }
- }
- successes++
- Logf("Controller %s: Got %s result from replica %d [%s]: %q, %d of %d required successes so far",
- r.controllerName, what, i+1, pod.Name, got, successes, len(r.pods.Items))
- }
- if successes < len(r.pods.Items) {
- return false, nil
- }
- return true, nil
- }
- // ServerVersionGTE returns true if v is greater than or equal to the server
- // version.
- //
- // TODO(18726): This should be incorporated into client.VersionInterface.
- func ServerVersionGTE(v semver.Version, c discovery.ServerVersionInterface) (bool, error) {
- serverVersion, err := c.ServerVersion()
- if err != nil {
- return false, fmt.Errorf("Unable to get server version: %v", err)
- }
- sv, err := version.Parse(serverVersion.GitVersion)
- if err != nil {
- return false, fmt.Errorf("Unable to parse server version %q: %v", serverVersion.GitVersion, err)
- }
- return sv.GTE(v), nil
- }
- // KubectlVersionGTE returns true if the kubectl version is greater than or
- // equal to v.
- func KubectlVersionGTE(v semver.Version) (bool, error) {
- kv, err := KubectlVersion()
- if err != nil {
- return false, err
- }
- return kv.GTE(v), nil
- }
- // KubectlVersion gets the version of kubectl that's currently being used (see
- // --kubectl-path in e2e.go to use an alternate kubectl).
- func KubectlVersion() (semver.Version, error) {
- output := RunKubectlOrDie("version", "--client")
- matches := gitVersionRegexp.FindStringSubmatch(output)
- if len(matches) != 2 {
- return semver.Version{}, fmt.Errorf("Could not find kubectl version in output %v", output)
- }
- // Don't use the full match, as it contains "GitVersion:\"" and a
- // trailing "\"". Just use the submatch.
- return version.Parse(matches[1])
- }
- func PodsResponding(c *client.Client, ns, name string, wantName bool, pods *api.PodList) error {
- By("trying to dial each unique pod")
- label := labels.SelectorFromSet(labels.Set(map[string]string{"name": name}))
- return wait.PollImmediate(Poll, podRespondingTimeout, PodProxyResponseChecker(c, ns, label, name, wantName, pods).CheckAllResponses)
- }
- func PodsCreated(c *client.Client, ns, name string, replicas int32) (*api.PodList, error) {
- timeout := 2 * time.Minute
- // List the pods, making sure we observe all the replicas.
- label := labels.SelectorFromSet(labels.Set(map[string]string{"name": name}))
- for start := time.Now(); time.Since(start) < timeout; time.Sleep(5 * time.Second) {
- options := api.ListOptions{LabelSelector: label}
- pods, err := c.Pods(ns).List(options)
- if err != nil {
- return nil, err
- }
- created := []api.Pod{}
- for _, pod := range pods.Items {
- if pod.DeletionTimestamp != nil {
- continue
- }
- created = append(created, pod)
- }
- Logf("Pod name %s: Found %d pods out of %d", name, len(created), replicas)
- if int32(len(created)) == replicas {
- pods.Items = created
- return pods, nil
- }
- }
- return nil, fmt.Errorf("Pod name %s: Gave up waiting %v for %d pods to come up", name, timeout, replicas)
- }
- func podsRunning(c *client.Client, pods *api.PodList) []error {
- // Wait for the pods to enter the running state. Waiting loops until the pods
- // are running so non-running pods cause a timeout for this test.
- By("ensuring each pod is running")
- e := []error{}
- error_chan := make(chan error)
- for _, pod := range pods.Items {
- go func(p api.Pod) {
- error_chan <- WaitForPodRunningInNamespace(c, &p)
- }(pod)
- }
- for range pods.Items {
- err := <-error_chan
- if err != nil {
- e = append(e, err)
- }
- }
- return e
- }
- func VerifyPods(c *client.Client, ns, name string, wantName bool, replicas int32) error {
- pods, err := PodsCreated(c, ns, name, replicas)
- if err != nil {
- return err
- }
- e := podsRunning(c, pods)
- if len(e) > 0 {
- return fmt.Errorf("failed to wait for pods running: %v", e)
- }
- err = PodsResponding(c, ns, name, wantName, pods)
- if err != nil {
- return fmt.Errorf("failed to wait for pods responding: %v", err)
- }
- return nil
- }
- func ServiceResponding(c *client.Client, ns, name string) error {
- By(fmt.Sprintf("trying to dial the service %s.%s via the proxy", ns, name))
- return wait.PollImmediate(Poll, ServiceRespondingTimeout, func() (done bool, err error) {
- proxyRequest, errProxy := GetServicesProxyRequest(c, c.Get())
- if errProxy != nil {
- Logf("Failed to get services proxy request: %v:", errProxy)
- return false, nil
- }
- body, err := proxyRequest.Namespace(ns).
- Name(name).
- Do().
- Raw()
- if err != nil {
- Logf("Failed to GET from service %s: %v:", name, err)
- return false, nil
- }
- got := string(body)
- if len(got) == 0 {
- Logf("Service %s: expected non-empty response", name)
- return false, err // stop polling
- }
- Logf("Service %s: found nonempty answer: %s", name, got)
- return true, nil
- })
- }
- func restclientConfig(kubeContext string) (*clientcmdapi.Config, error) {
- Logf(">>> kubeConfig: %s\n", TestContext.KubeConfig)
- if TestContext.KubeConfig == "" {
- return nil, fmt.Errorf("KubeConfig must be specified to load client config")
- }
- c, err := clientcmd.LoadFromFile(TestContext.KubeConfig)
- if err != nil {
- return nil, fmt.Errorf("error loading KubeConfig: %v", err.Error())
- }
- if kubeContext != "" {
- Logf(">>> kubeContext: %s\n", kubeContext)
- c.CurrentContext = kubeContext
- }
- return c, nil
- }
- type ClientConfigGetter func() (*restclient.Config, error)
- func LoadConfig() (*restclient.Config, error) {
- if TestContext.NodeName != "" {
- // This is a node e2e test, apply the node e2e configuration
- return &restclient.Config{Host: TestContext.Host}, nil
- }
- c, err := restclientConfig(TestContext.KubeContext)
- if err != nil {
- return nil, err
- }
- return clientcmd.NewDefaultClientConfig(*c, &clientcmd.ConfigOverrides{ClusterInfo: clientcmdapi.Cluster{Server: TestContext.Host}}).ClientConfig()
- }
- func LoadFederatedConfig(overrides *clientcmd.ConfigOverrides) (*restclient.Config, error) {
- c, err := restclientConfig(federatedKubeContext)
- if err != nil {
- return nil, fmt.Errorf("error creating federation client config: %v", err.Error())
- }
- cfg, err := clientcmd.NewDefaultClientConfig(*c, overrides).ClientConfig()
- if cfg != nil {
- //TODO(colhom): this is only here because https://github.com/kubernetes/kubernetes/issues/25422
- cfg.NegotiatedSerializer = api.Codecs
- }
- if err != nil {
- return cfg, fmt.Errorf("error creating federation client config: %v", err.Error())
- }
- return cfg, nil
- }
- func loadClientFromConfig(config *restclient.Config) (*client.Client, error) {
- c, err := client.New(config)
- if err != nil {
- return nil, fmt.Errorf("error creating client: %v", err.Error())
- }
- if c.Client.Timeout == 0 {
- c.Client.Timeout = SingleCallTimeout
- }
- return c, nil
- }
- func setTimeouts(cs ...*http.Client) {
- for _, client := range cs {
- if client.Timeout == 0 {
- client.Timeout = SingleCallTimeout
- }
- }
- }
- func LoadFederationClientset_1_4() (*federation_release_1_4.Clientset, error) {
- config, err := LoadFederatedConfig(&clientcmd.ConfigOverrides{})
- if err != nil {
- return nil, err
- }
- c, err := federation_release_1_4.NewForConfig(config)
- if err != nil {
- return nil, fmt.Errorf("error creating federation clientset: %v", err.Error())
- }
- // Set timeout for each client in the set.
- setTimeouts(c.DiscoveryClient.Client, c.FederationClient.Client, c.CoreClient.Client, c.ExtensionsClient.Client)
- return c, nil
- }
- func LoadClient() (*client.Client, error) {
- config, err := LoadConfig()
- if err != nil {
- return nil, fmt.Errorf("error creating client: %v", err.Error())
- }
- return loadClientFromConfig(config)
- }
// randomSuffix provides a random string to append to pods,services,rcs.
// The result is the decimal form of a number in [0, 9999], drawn from a
// generator freshly seeded with the current time in nanoseconds.
// TODO: Allow service names to have the same form as names
// for pods and replication controllers so we don't
// need to use such a function and can instead
// use the UUID utility function.
func randomSuffix() string {
	seed := time.Now().UnixNano()
	n := rand.New(rand.NewSource(seed)).Int() % 10000
	return strconv.Itoa(n)
}
- func ExpectNoError(err error, explain ...interface{}) {
- if err != nil {
- Logf("Unexpected error occurred: %v", err)
- }
- ExpectWithOffset(1, err).NotTo(HaveOccurred(), explain...)
- }
- func ExpectNoErrorWithRetries(fn func() error, maxRetries int, explain ...interface{}) {
- var err error
- for i := 0; i < maxRetries; i++ {
- err = fn()
- if err == nil {
- return
- }
- Logf("(Attempt %d of %d) Unexpected error occurred: %v", i+1, maxRetries, err)
- }
- ExpectWithOffset(1, err).NotTo(HaveOccurred(), explain...)
- }
- // Stops everything from filePath from namespace ns and checks if everything matching selectors from the given namespace is correctly stopped.
- func Cleanup(filePath, ns string, selectors ...string) {
- By("using delete to clean up resources")
- var nsArg string
- if ns != "" {
- nsArg = fmt.Sprintf("--namespace=%s", ns)
- }
- RunKubectlOrDie("delete", "--grace-period=0", "-f", filePath, nsArg)
- AssertCleanup(ns, selectors...)
- }
- // Asserts that cleanup of a namespace wrt selectors occurred.
- func AssertCleanup(ns string, selectors ...string) {
- var nsArg string
- if ns != "" {
- nsArg = fmt.Sprintf("--namespace=%s", ns)
- }
- for _, selector := range selectors {
- resources := RunKubectlOrDie("get", "rc,svc", "-l", selector, "--no-headers", nsArg)
- if resources != "" {
- Failf("Resources left running after stop:\n%s", resources)
- }
- pods := RunKubectlOrDie("get", "pods", "-l", selector, nsArg, "-o", "go-template={{ range .items }}{{ if not .metadata.deletionTimestamp }}{{ .metadata.name }}{{ \"\\n\" }}{{ end }}{{ end }}")
- if pods != "" {
- Failf("Pods left unterminated after stop:\n%s", pods)
- }
- }
- }
- // validatorFn is the function which is individual tests will implement.
- // we may want it to return more than just an error, at some point.
- type validatorFn func(c *client.Client, podID string) error
- // ValidateController is a generic mechanism for testing RC's that are running.
- // It takes a container name, a test name, and a validator function which is plugged in by a specific test.
- // "containername": this is grepped for.
- // "containerImage" : this is the name of the image we expect to be launched. Not to confuse w/ images (kitten.jpg) which are validated.
- // "testname": which gets bubbled up to the logging/failure messages if errors happen.
- // "validator" function: This function is given a podID and a client, and it can do some specific validations that way.
- func ValidateController(c *client.Client, containerImage string, replicas int, containername string, testname string, validator validatorFn, ns string) {
- getPodsTemplate := "--template={{range.items}}{{.metadata.name}} {{end}}"
- // NB: kubectl adds the "exists" function to the standard template functions.
- // This lets us check to see if the "running" entry exists for each of the containers
- // we care about. Exists will never return an error and it's safe to check a chain of
- // things, any one of which may not exist. In the below template, all of info,
- // containername, and running might be nil, so the normal index function isn't very
- // helpful.
- // This template is unit-tested in kubectl, so if you change it, update the unit test.
- // You can read about the syntax here: http://golang.org/pkg/text/template/.
- getContainerStateTemplate := fmt.Sprintf(`--template={{if (exists . "status" "containerStatuses")}}{{range .status.containerStatuses}}{{if (and (eq .name "%s") (exists . "state" "running"))}}true{{end}}{{end}}{{end}}`, containername)
- getImageTemplate := fmt.Sprintf(`--template={{if (exists . "status" "containerStatuses")}}{{range .status.containerStatuses}}{{if eq .name "%s"}}{{.image}}{{end}}{{end}}{{end}}`, containername)
- By(fmt.Sprintf("waiting for all containers in %s pods to come up.", testname)) //testname should be selector
- waitLoop:
- for start := time.Now(); time.Since(start) < PodStartTimeout; time.Sleep(5 * time.Second) {
- getPodsOutput := RunKubectlOrDie("get", "pods", "-o", "template", getPodsTemplate, "-l", testname, fmt.Sprintf("--namespace=%v", ns))
- pods := strings.Fields(getPodsOutput)
- if numPods := len(pods); numPods != replicas {
- By(fmt.Sprintf("Replicas for %s: expected=%d actual=%d", testname, replicas, numPods))
- continue
- }
- var runningPods []string
- for _, podID := range pods {
- running := RunKubectlOrDie("get", "pods", podID, "-o", "template", getContainerStateTemplate, fmt.Sprintf("--namespace=%v", ns))
- if running != "true" {
- Logf("%s is created but not running", podID)
- continue waitLoop
- }
- currentImage := RunKubectlOrDie("get", "pods", podID, "-o", "template", getImageTemplate, fmt.Sprintf("--namespace=%v", ns))
- if currentImage != containerImage {
- Logf("%s is created but running wrong image; expected: %s, actual: %s", podID, containerImage, currentImage)
- continue waitLoop
- }
- // Call the generic validator function here.
- // This might validate for example, that (1) getting a url works and (2) url is serving correct content.
- if err := validator(c, podID); err != nil {
- Logf("%s is running right image but validator function failed: %v", podID, err)
- continue waitLoop
- }
- Logf("%s is verified up and running", podID)
- runningPods = append(runningPods, podID)
- }
- // If we reach here, then all our checks passed.
- if len(runningPods) == replicas {
- return
- }
- }
- // Reaching here means that one of more checks failed multiple times. Assuming its not a race condition, something is broken.
- Failf("Timed out after %v seconds waiting for %s pods to reach valid state", PodStartTimeout.Seconds(), testname)
- }
- // KubectlCmd runs the kubectl executable through the wrapper script.
- func KubectlCmd(args ...string) *exec.Cmd {
- defaultArgs := []string{}
- // Reference a --server option so tests can run anywhere.
- if TestContext.Host != "" {
- defaultArgs = append(defaultArgs, "--"+clientcmd.FlagAPIServer+"="+TestContext.Host)
- }
- if TestContext.KubeConfig != "" {
- defaultArgs = append(defaultArgs, "--"+clientcmd.RecommendedConfigPathFlag+"="+TestContext.KubeConfig)
- // Reference the KubeContext
- if TestContext.KubeContext != "" {
- defaultArgs = append(defaultArgs, "--"+clientcmd.FlagContext+"="+TestContext.KubeContext)
- }
- } else {
- if TestContext.CertDir != "" {
- defaultArgs = append(defaultArgs,
- fmt.Sprintf("--certificate-authority=%s", filepath.Join(TestContext.CertDir, "ca.crt")),
- fmt.Sprintf("--client-certificate=%s", filepath.Join(TestContext.CertDir, "kubecfg.crt")),
- fmt.Sprintf("--client-key=%s", filepath.Join(TestContext.CertDir, "kubecfg.key")))
- }
- }
- kubectlArgs := append(defaultArgs, args...)
- //We allow users to specify path to kubectl, so you can test either "kubectl" or "cluster/kubectl.sh"
- //and so on.
- cmd := exec.Command(TestContext.KubectlPath, kubectlArgs...)
- //caller will invoke this and wait on it.
- return cmd
- }
- // kubectlBuilder is used to build, customize and execute a kubectl Command.
- // Add more functions to customize the builder as needed.
- type kubectlBuilder struct {
- cmd *exec.Cmd
- timeout <-chan time.Time
- }
- func NewKubectlCommand(args ...string) *kubectlBuilder {
- b := new(kubectlBuilder)
- b.cmd = KubectlCmd(args...)
- return b
- }
- func (b *kubectlBuilder) WithEnv(env []string) *kubectlBuilder {
- b.cmd.Env = env
- return b
- }
- func (b *kubectlBuilder) WithTimeout(t <-chan time.Time) *kubectlBuilder {
- b.timeout = t
- return b
- }
- func (b kubectlBuilder) WithStdinData(data string) *kubectlBuilder {
- b.cmd.Stdin = strings.NewReader(data)
- return &b
- }
- func (b kubectlBuilder) WithStdinReader(reader io.Reader) *kubectlBuilder {
- b.cmd.Stdin = reader
- return &b
- }
- func (b kubectlBuilder) ExecOrDie() string {
- str, err := b.Exec()
- Logf("stdout: %q", str)
- // In case of i/o timeout error, try talking to the apiserver again after 2s before dying.
- // Note that we're still dying after retrying so that we can get visibility to triage it further.
- if isTimeout(err) {
- Logf("Hit i/o timeout error, talking to the server 2s later to see if it's temporary.")
- time.Sleep(2 * time.Second)
- retryStr, retryErr := RunKubectl("version")
- Logf("stdout: %q", retryStr)
- Logf("err: %v", retryErr)
- }
- Expect(err).NotTo(HaveOccurred())
- return str
- }
// isTimeout reports whether err is a network timeout: either a net.Error whose
// Timeout method returns true, or a *url.Error wrapping such a net.Error.
// A nil error is not a timeout.
func isTimeout(err error) bool {
	// A net.Error is judged solely by its own Timeout result.
	if netErr, ok := err.(net.Error); ok {
		return netErr.Timeout()
	}
	// Otherwise look one level inside a *url.Error.
	if urlErr, ok := err.(*url.Error); ok {
		if inner, ok := urlErr.Err.(net.Error); ok {
			return inner.Timeout()
		}
	}
	return false
}
- func (b kubectlBuilder) Exec() (string, error) {
- var stdout, stderr bytes.Buffer
- cmd := b.cmd
- cmd.Stdout, cmd.Stderr = &stdout, &stderr
- Logf("Running '%s %s'", cmd.Path, strings.Join(cmd.Args[1:], " ")) // skip arg[0] as it is printed separately
- if err := cmd.Start(); err != nil {
- return "", fmt.Errorf("error starting %v:\nCommand stdout:\n%v\nstderr:\n%v\nerror:\n%v\n", cmd, cmd.Stdout, cmd.Stderr, err)
- }
- errCh := make(chan error, 1)
- go func() {
- errCh <- cmd.Wait()
- }()
- select {
- case err := <-errCh:
- if err != nil {
- var rc int = 127
- if ee, ok := err.(*exec.ExitError); ok {
- Logf("rc: %d", rc)
- rc = int(ee.Sys().(syscall.WaitStatus).ExitStatus())
- }
- return "", uexec.CodeExitError{
- Err: fmt.Errorf("error running %v:\nCommand stdout:\n%v\nstderr:\n%v\nerror:\n%v\n", cmd, cmd.Stdout, cmd.Stderr, err),
- Code: rc,
- }
- }
- case <-b.timeout:
- b.cmd.Process.Kill()
- return "", fmt.Errorf("timed out waiting for command %v:\nCommand stdout:\n%v\nstderr:\n%v\n", cmd, cmd.Stdout, cmd.Stderr)
- }
- Logf("stderr: %q", stderr.String())
- return stdout.String(), nil
- }
- // RunKubectlOrDie is a convenience wrapper over kubectlBuilder
- func RunKubectlOrDie(args ...string) string {
- return NewKubectlCommand(args...).ExecOrDie()
- }
- // RunKubectl is a convenience wrapper over kubectlBuilder
- func RunKubectl(args ...string) (string, error) {
- return NewKubectlCommand(args...).Exec()
- }
- // RunKubectlOrDieInput is a convenience wrapper over kubectlBuilder that takes input to stdin
- func RunKubectlOrDieInput(data string, args ...string) string {
- return NewKubectlCommand(args...).WithStdinData(data).ExecOrDie()
- }
- func StartCmdAndStreamOutput(cmd *exec.Cmd) (stdout, stderr io.ReadCloser, err error) {
- stdout, err = cmd.StdoutPipe()
- if err != nil {
- return
- }
- stderr, err = cmd.StderrPipe()
- if err != nil {
- return
- }
- Logf("Asynchronously running '%s %s'", cmd.Path, strings.Join(cmd.Args, " "))
- err = cmd.Start()
- return
- }
- // Rough equivalent of ctrl+c for cleaning up processes. Intended to be run in defer.
- func TryKill(cmd *exec.Cmd) {
- if err := cmd.Process.Kill(); err != nil {
- Logf("ERROR failed to kill command %v! The process may leak", cmd)
- }
- }
- // testContainerOutputMatcher runs the given pod in the given namespace and waits
- // for all of the containers in the podSpec to move into the 'Success' status, and tests
- // the specified container log against the given expected output using the given matcher.
- func (f *Framework) testContainerOutputMatcher(scenarioName string,
- pod *api.Pod,
- containerIndex int,
- expectedOutput []string,
- matcher func(string, ...interface{}) gomegatypes.GomegaMatcher) {
- By(fmt.Sprintf("Creating a pod to test %v", scenarioName))
- if containerIndex < 0 || containerIndex >= len(pod.Spec.Containers) {
- Failf("Invalid container index: %d", containerIndex)
- }
- ExpectNoError(f.MatchContainerOutput(pod, pod.Spec.Containers[containerIndex].Name, expectedOutput, matcher))
- }
- // MatchContainerOutput creates a pod and waits for all it's containers to exit with success.
- // It then tests that the matcher with each expectedOutput matches the output of the specified container.
- func (f *Framework) MatchContainerOutput(
- pod *api.Pod,
- containerName string,
- expectedOutput []string,
- matcher func(string, ...interface{}) gomegatypes.GomegaMatcher) error {
- podClient := f.PodClient()
- ns := f.Namespace.Name
- defer podClient.Delete(pod.Name, api.NewDeleteOptions(0))
- podClient.Create(pod)
- // Wait for client pod to complete. All containers should succeed.
- for _, container := range pod.Spec.Containers {
- if err := WaitForPodSuccessInNamespace(f.Client, pod.Name, container.Name, ns); err != nil {
- return fmt.Errorf("expected container %s success: %v", container.Name, err)
- }
- }
- // Grab its logs. Get host first.
- podStatus, err := podClient.Get(pod.Name)
- if err != nil {
- return fmt.Errorf("failed to get pod status: %v", err)
- }
- Logf("Trying to get logs from node %s pod %s container %s: %v",
- podStatus.Spec.NodeName, podStatus.Name, containerName, err)
- // Sometimes the actual containers take a second to get started, try to get logs for 60s
- logs, err := GetPodLogs(f.Client, ns, pod.Name, containerName)
- if err != nil {
- Logf("Failed to get logs from node %q pod %q container %q. %v",
- podStatus.Spec.NodeName, podStatus.Name, containerName, err)
- return fmt.Errorf("failed to get logs from %s for %s: %v", podStatus.Name, containerName, err)
- }
- for _, expected := range expectedOutput {
- m := matcher(expected)
- matches, err := m.Match(logs)
- if err != nil {
- return fmt.Errorf("expected %q in container output: %v", expected, err)
- } else if !matches {
- return fmt.Errorf("expected %q in container output: %s", expected, m.FailureMessage(logs))
- }
- }
- return nil
- }
type (
	// podInfo records a pod's host and phase at two points in time, which is
	// useful when debugging e2e tests.
	podInfo struct {
		// oldHostname and oldPhase describe the pod in the earlier listing.
		oldHostname string
		oldPhase    string
		// hostname and phase describe the pod in the later listing.
		hostname string
		phase    string
	}

	// PodDiff maps a pod name to the podInfo collected for that pod.
	PodDiff map[string]*podInfo
)
- // Print formats and prints the give PodDiff.
- func (p PodDiff) Print(ignorePhases sets.String) {
- for name, info := range p {
- if ignorePhases.Has(info.phase) {
- continue
- }
- if info.phase == nonExist {
- Logf("Pod %v was deleted, had phase %v and host %v", name, info.oldPhase, info.oldHostname)
- continue
- }
- phaseChange, hostChange := false, false
- msg := fmt.Sprintf("Pod %v ", name)
- if info.oldPhase != info.phase {
- phaseChange = true
- if info.oldPhase == nonExist {
- msg += fmt.Sprintf("in phase %v ", info.phase)
- } else {
- msg += fmt.Sprintf("went from phase: %v -> %v ", info.oldPhase, info.phase)
- }
- }
- if info.oldHostname != info.hostname {
- hostChange = true
- if info.oldHostname == nonExist || info.oldHostname == "" {
- msg += fmt.Sprintf("assigned host %v ", info.hostname)
- } else {
- msg += fmt.Sprintf("went from host: %v -> %v ", info.oldHostname, info.hostname)
- }
- }
- if phaseChange || hostChange {
- Logf(msg)
- }
- }
- }
- // Diff computes a PodDiff given 2 lists of pods.
- func Diff(oldPods []*api.Pod, curPods []*api.Pod) PodDiff {
- podInfoMap := PodDiff{}
- // New pods will show up in the curPods list but not in oldPods. They have oldhostname/phase == nonexist.
- for _, pod := range curPods {
- podInfoMap[pod.Name] = &podInfo{hostname: pod.Spec.NodeName, phase: string(pod.Status.Phase), oldHostname: nonExist, oldPhase: nonExist}
- }
- // Deleted pods will show up in the oldPods list but not in curPods. They have a hostname/phase == nonexist.
- for _, pod := range oldPods {
- if info, ok := podInfoMap[pod.Name]; ok {
- info.oldHostname, info.oldPhase = pod.Spec.NodeName, string(pod.Status.Phase)
- } else {
- podInfoMap[pod.Name] = &podInfo{hostname: nonExist, phase: nonExist, oldHostname: pod.Spec.NodeName, oldPhase: string(pod.Status.Phase)}
- }
- }
- return podInfoMap
- }
- // RunDeployment Launches (and verifies correctness) of a Deployment
- // and will wait for all pods it spawns to become "Running".
- // It's the caller's responsibility to clean up externally (i.e. use the
- // namespace lifecycle for handling Cleanup).
- func RunDeployment(config DeploymentConfig) error {
- err := config.create()
- if err != nil {
- return err
- }
- return config.start()
- }
- func (config *DeploymentConfig) create() error {
- By(fmt.Sprintf("creating deployment %s in namespace %s", config.Name, config.Namespace))
- deployment := &extensions.Deployment{
- ObjectMeta: api.ObjectMeta{
- Name: config.Name,
- },
- Spec: extensions.DeploymentSpec{
- Replicas: int32(config.Replicas),
- Selector: &unversioned.LabelSelector{
- MatchLabels: map[string]string{
- "name": config.Name,
- },
- },
- Template: api.PodTemplateSpec{
- ObjectMeta: api.ObjectMeta{
- Labels: map[string]string{"name": config.Name},
- },
- Spec: api.PodSpec{
- Containers: []api.Container{
- {
- Name: config.Name,
- Image: config.Image,
- Command: config.Command,
- Ports: []api.ContainerPort{{ContainerPort: 80}},
- },
- },
- },
- },
- },
- }
- config.applyTo(&deployment.Spec.Template)
- _, err := config.Client.Deployments(config.Namespace).Create(deployment)
- if err != nil {
- return fmt.Errorf("Error creating deployment: %v", err)
- }
- Logf("Created deployment with name: %v, namespace: %v, replica count: %v", deployment.Name, config.Namespace, deployment.Spec.Replicas)
- return nil
- }
- // RunReplicaSet launches (and verifies correctness) of a ReplicaSet
- // and waits until all the pods it launches to reach the "Running" state.
- // It's the caller's responsibility to clean up externally (i.e. use the
- // namespace lifecycle for handling Cleanup).
- func RunReplicaSet(config ReplicaSetConfig) error {
- err := config.create()
- if err != nil {
- return err
- }
- return config.start()
- }
- func (config *ReplicaSetConfig) create() error {
- By(fmt.Sprintf("creating replicaset %s in namespace %s", config.Name, config.Namespace))
- rs := &extensions.ReplicaSet{
- ObjectMeta: api.ObjectMeta{
- Name: config.Name,
- },
- Spec: extensions.ReplicaSetSpec{
- Replicas: int32(config.Replicas),
- Selector: &unversioned.LabelSelector{
- MatchLabels: map[string]string{
- "name": config.Name,
- },
- },
- Template: api.PodTemplateSpec{
- ObjectMeta: api.ObjectMeta{
- Labels: map[string]string{"name": config.Name},
- },
- Spec: api.PodSpec{
- Containers: []api.Container{
- {
- Name: config.Name,
- Image: config.Image,
- Command: config.Command,
- Ports: []api.ContainerPort{{ContainerPort: 80}},
- },
- },
- },
- },
- },
- }
- config.applyTo(&rs.Spec.Template)
- _, err := config.Client.ReplicaSets(config.Namespace).Create(rs)
- if err != nil {
- return fmt.Errorf("Error creating replica set: %v", err)
- }
- Logf("Created replica set with name: %v, namespace: %v, replica count: %v", rs.Name, config.Namespace, rs.Spec.Replicas)
- return nil
- }
- // RunRC Launches (and verifies correctness) of a Replication Controller
- // and will wait for all pods it spawns to become "Running".
- // It's the caller's responsibility to clean up externally (i.e. use the
- // namespace lifecycle for handling Cleanup).
- func RunRC(config RCConfig) error {
- err := config.create()
- if err != nil {
- return err
- }
- return config.start()
- }
- func (config *RCConfig) create() error {
- By(fmt.Sprintf("creating replication controller %s in namespace %s", config.Name, config.Namespace))
- dnsDefault := api.DNSDefault
- if config.DNSPolicy == nil {
- config.DNSPolicy = &dnsDefault
- }
- rc := &api.ReplicationController{
- ObjectMeta: api.ObjectMeta{
- Name: config.Name,
- },
- Spec: api.ReplicationControllerSpec{
- Replicas: int32(config.Replicas),
- Selector: map[string]string{
- "name": config.Name,
- },
- Template: &api.PodTemplateSpec{
- ObjectMeta: api.ObjectMeta{
- Labels: map[string]string{"name": config.Name},
- },
- Spec: api.PodSpec{
- Containers: []api.Container{
- {
- Name: config.Name,
- Image: config.Image,
- Command: config.Command,
- Ports: []api.ContainerPort{{ContainerPort: 80}},
- ReadinessProbe: config.ReadinessProbe,
- },
- },
- DNSPolicy: *config.DNSPolicy,
- NodeSelector: config.NodeSelector,
- },
- },
- },
- }
- config.applyTo(rc.Spec.Template)
- _, err := config.Client.ReplicationControllers(config.Namespace).Create(rc)
- if err != nil {
- return fmt.Errorf("Error creating replication controller: %v", err)
- }
- Logf("Created replication controller with name: %v, namespace: %v, replica count: %v", rc.Name, config.Namespace, rc.Spec.Replicas)
- return nil
- }
- func (config *RCConfig) applyTo(template *api.PodTemplateSpec) {
- if config.Env != nil {
- for k, v := range config.Env {
- c := &template.Spec.Containers[0]
- c.Env = append(c.Env, api.EnvVar{Name: k, Value: v})
- }
- }
- if config.Labels != nil {
- for k, v := range config.Labels {
- template.ObjectMeta.Labels[k] = v
- }
- }
- if config.NodeSelector != nil {
- template.Spec.NodeSelector = make(map[string]string)
- for k, v := range config.NodeSelector {
- template.Spec.NodeSelector[k] = v
- }
- }
- if config.Ports != nil {
- for k, v := range config.Ports {
- c := &template.Spec.Containers[0]
- c.Ports = append(c.Ports, api.ContainerPort{Name: k, ContainerPort: int32(v)})
- }
- }
- if config.HostPorts != nil {
- for k, v := range config.HostPorts {
- c := &template.Spec.Containers[0]
- c.Ports = append(c.Ports, api.ContainerPort{Name: k, ContainerPort: int32(v), HostPort: int32(v)})
- }
- }
- if config.CpuLimit > 0 || config.MemLimit > 0 {
- template.Spec.Containers[0].Resources.Limits = api.ResourceList{}
- }
- if config.CpuLimit > 0 {
- template.Spec.Containers[0].Resources.Limits[api.ResourceCPU] = *resource.NewMilliQuantity(config.CpuLimit, resource.DecimalSI)
- }
- if config.MemLimit > 0 {
- template.Spec.Containers[0].Resources.Limits[api.ResourceMemory] = *resource.NewQuantity(config.MemLimit, resource.DecimalSI)
- }
- if config.CpuRequest > 0 || config.MemRequest > 0 {
- template.Spec.Containers[0].Resources.Requests = api.ResourceList{}
- }
- if config.CpuRequest > 0 {
- template.Spec.Containers[0].Resources.Requests[api.ResourceCPU] = *resource.NewMilliQuantity(config.CpuRequest, resource.DecimalSI)
- }
- if config.MemRequest > 0 {
- template.Spec.Containers[0].Resources.Requests[api.ResourceMemory] = *resource.NewQuantity(config.MemRequest, resource.DecimalSI)
- }
- if len(config.Volumes) > 0 {
- template.Spec.Volumes = config.Volumes
- }
- if len(config.VolumeMounts) > 0 {
- template.Spec.Containers[0].VolumeMounts = config.VolumeMounts
- }
- }
- type RCStartupStatus struct {
- Expected int
- Terminating int
- Running int
- RunningButNotReady int
- Waiting int
- Pending int
- Unknown int
- Inactive int
- FailedContainers int
- Created []*api.Pod
- ContainerRestartNodes sets.String
- }
- func (s *RCStartupStatus) Print(name string) {
- Logf("%v Pods: %d out of %d created, %d running, %d pending, %d waiting, %d inactive, %d terminating, %d unknown, %d runningButNotReady ",
- name, len(s.Created), s.Expected, s.Running, s.Pending, s.Waiting, s.Inactive, s.Terminating, s.Unknown, s.RunningButNotReady)
- }
- func ComputeRCStartupStatus(pods []*api.Pod, expected int) RCStartupStatus {
- startupStatus := RCStartupStatus{
- Expected: expected,
- Created: make([]*api.Pod, 0, expected),
- ContainerRestartNodes: sets.NewString(),
- }
- for _, p := range pods {
- if p.DeletionTimestamp != nil {
- startupStatus.Terminating++
- continue
- }
- startupStatus.Created = append(startupStatus.Created, p)
- if p.Status.Phase == api.PodRunning {
- ready := false
- for _, c := range p.Status.Conditions {
- if c.Type == api.PodReady && c.Status == api.ConditionTrue {
- ready = true
- break
- }
- }
- if ready {
- // Only count a pod is running when it is also ready.
- startupStatus.Running++
- } else {
- startupStatus.RunningButNotReady++
- }
- for _, v := range FailedContainers(p) {
- startupStatus.FailedContainers = startupStatus.FailedContainers + v.Restarts
- startupStatus.ContainerRestartNodes.Insert(p.Spec.NodeName)
- }
- } else if p.Status.Phase == api.PodPending {
- if p.Spec.NodeName == "" {
- startupStatus.Waiting++
- } else {
- startupStatus.Pending++
- }
- } else if p.Status.Phase == api.PodSucceeded || p.Status.Phase == api.PodFailed {
- startupStatus.Inactive++
- } else if p.Status.Phase == api.PodUnknown {
- startupStatus.Unknown++
- }
- }
- return startupStatus
- }
- func (config *RCConfig) start() error {
- // Don't force tests to fail if they don't care about containers restarting.
- var maxContainerFailures int
- if config.MaxContainerFailures == nil {
- maxContainerFailures = int(math.Max(1.0, float64(config.Replicas)*.01))
- } else {
- maxContainerFailures = *config.MaxContainerFailures
- }
- label := labels.SelectorFromSet(labels.Set(map[string]string{"name": config.Name}))
- PodStore := NewPodStore(config.Client, config.Namespace, label, fields.Everything())
- defer PodStore.Stop()
- interval := config.PollInterval
- if interval <= 0 {
- interval = 10 * time.Second
- }
- timeout := config.Timeout
- if timeout <= 0 {
- timeout = 5 * time.Minute
- }
- oldPods := make([]*api.Pod, 0)
- oldRunning := 0
- lastChange := time.Now()
- for oldRunning != config.Replicas {
- time.Sleep(interval)
- pods := PodStore.List()
- startupStatus := ComputeRCStartupStatus(pods, config.Replicas)
- pods = startupStatus.Created
- if config.CreatedPods != nil {
- *config.CreatedPods = pods
- }
- if !config.Silent {
- startupStatus.Print(config.Name)
- }
- promPushRunningPending(startupStatus.Running, startupStatus.Pending)
- if config.PodStatusFile != nil {
- fmt.Fprintf(config.PodStatusFile, "%d, running, %d, pending, %d, waiting, %d, inactive, %d, unknown, %d, runningButNotReady\n", startupStatus.Running, startupStatus.Pending, startupStatus.Waiting, startupStatus.Inactive, startupStatus.Unknown, startupStatus.RunningButNotReady)
- }
- if startupStatus.FailedContainers > maxContainerFailures {
- DumpNodeDebugInfo(config.Client, startupStatus.ContainerRestartNodes.List())
- // Get the logs from the failed containers to help diagnose what caused them to fail
- LogFailedContainers(config.Client, config.Namespace)
- return fmt.Errorf("%d containers failed which is more than allowed %d", startupStatus.FailedContainers, maxContainerFailures)
- }
- if len(pods) < len(oldPods) || len(pods) > config.Replicas {
- // This failure mode includes:
- // kubelet is dead, so node controller deleted pods and rc creates more
- // - diagnose by noting the pod diff below.
- // pod is unhealthy, so replication controller creates another to take its place
- // - diagnose by comparing the previous "2 Pod states" lines for inactive pods
- errorStr := fmt.Sprintf("Number of reported pods for %s changed: %d vs %d", config.Name, len(pods), len(oldPods))
- Logf("%v, pods that changed since the last iteration:", errorStr)
- Diff(oldPods, pods).Print(sets.NewString())
- return fmt.Errorf(errorStr)
- }
- if len(pods) > len(oldPods) || startupStatus.Running > oldRunning {
- lastChange = time.Now()
- }
- oldPods = pods
- oldRunning = startupStatus.Running
- if time.Since(lastChange) > timeout {
- dumpPodDebugInfo(config.Client, pods)
- break
- }
- }
- if oldRunning != config.Replicas {
- // List only pods from a given replication controller.
- options := api.ListOptions{LabelSelector: label}
- if pods, err := config.Client.Pods(api.NamespaceAll).List(options); err == nil {
- for _, pod := range pods.Items {
- Logf("Pod %s\t%s\t%s\t%s", pod.Name, pod.Spec.NodeName, pod.Status.Phase, pod.DeletionTimestamp)
- }
- } else {
- Logf("Can't list pod debug info: %v", err)
- }
- return fmt.Errorf("Only %d pods started out of %d", oldRunning, config.Replicas)
- }
- return nil
- }
- // Simplified version of RunRC, that does not create RC, but creates plain Pods.
- // Optionally waits for pods to start running (if waitForRunning == true).
- // The number of replicas must be non-zero.
- func StartPods(c *client.Client, replicas int, namespace string, podNamePrefix string, pod api.Pod, waitForRunning bool) {
- // no pod to start
- if replicas < 1 {
- panic("StartPods: number of replicas must be non-zero")
- }
- startPodsID := string(uuid.NewUUID()) // So that we can label and find them
- for i := 0; i < replicas; i++ {
- podName := fmt.Sprintf("%v-%v", podNamePrefix, i)
- pod.ObjectMeta.Name = podName
- pod.ObjectMeta.Labels["name"] = podName
- pod.ObjectMeta.Labels["startPodsID"] = startPodsID
- pod.Spec.Containers[0].Name = podName
- _, err := c.Pods(namespace).Create(&pod)
- ExpectNoError(err)
- }
- Logf("Waiting for running...")
- if waitForRunning {
- label := labels.SelectorFromSet(labels.Set(map[string]string{"startPodsID": startPodsID}))
- err := WaitForPodsWithLabelRunning(c, namespace, label)
- ExpectNoError(err, "Error waiting for %d pods to be running - probably a timeout", replicas)
- }
- }
- func dumpPodDebugInfo(c *client.Client, pods []*api.Pod) {
- badNodes := sets.NewString()
- for _, p := range pods {
- if p.Status.Phase != api.PodRunning {
- if p.Spec.NodeName != "" {
- Logf("Pod %v assigned to host %v (IP: %v) in %v", p.Name, p.Spec.NodeName, p.Status.HostIP, p.Status.Phase)
- badNodes.Insert(p.Spec.NodeName)
- } else {
- Logf("Pod %v still unassigned", p.Name)
- }
- }
- }
- DumpNodeDebugInfo(c, badNodes.List())
- }
- func DumpAllNamespaceInfo(c *client.Client, namespace string) {
- By(fmt.Sprintf("Collecting events from namespace %q.", namespace))
- events, err := c.Events(namespace).List(api.ListOptions{})
- Expect(err).NotTo(HaveOccurred())
- // Sort events by their first timestamp
- sortedEvents := events.Items
- if len(sortedEvents) > 1 {
- sort.Sort(byFirstTimestamp(sortedEvents))
- }
- for _, e := range sortedEvents {
- Logf("At %v - event for %v: %v %v: %v", e.FirstTimestamp, e.InvolvedObject.Name, e.Source, e.Reason, e.Message)
- }
- // Note that we don't wait for any Cleanup to propagate, which means
- // that if you delete a bunch of pods right before ending your test,
- // you may or may not see the killing/deletion/Cleanup events.
- // If cluster is large, then the following logs are basically useless, because:
- // 1. it takes tens of minutes or hours to grab all of them
- // 2. there are so many of them that working with them are mostly impossible
- // So we dump them only if the cluster is relatively small.
- maxNodesForDump := 20
- if nodes, err := c.Nodes().List(api.ListOptions{}); err == nil {
- if len(nodes.Items) <= maxNodesForDump {
- dumpAllPodInfo(c)
- dumpAllNodeInfo(c)
- } else {
- Logf("skipping dumping cluster info - cluster too large")
- }
- } else {
- Logf("unable to fetch node list: %v", err)
- }
- }
- // byFirstTimestamp sorts a slice of events by first timestamp, using their involvedObject's name as a tie breaker.
- type byFirstTimestamp []api.Event
- func (o byFirstTimestamp) Len() int { return len(o) }
- func (o byFirstTimestamp) Swap(i, j int) { o[i], o[j] = o[j], o[i] }
- func (o byFirstTimestamp) Less(i, j int) bool {
- if o[i].FirstTimestamp.Equal(o[j].FirstTimestamp) {
- return o[i].InvolvedObject.Name < o[j].InvolvedObject.Name
- }
- return o[i].FirstTimestamp.Before(o[j].FirstTimestamp)
- }
- func dumpAllPodInfo(c *client.Client) {
- pods, err := c.Pods("").List(api.ListOptions{})
- if err != nil {
- Logf("unable to fetch pod debug info: %v", err)
- }
- logPodStates(pods.Items)
- }
- func dumpAllNodeInfo(c *client.Client) {
- // It should be OK to list unschedulable Nodes here.
- nodes, err := c.Nodes().List(api.ListOptions{})
- if err != nil {
- Logf("unable to fetch node list: %v", err)
- return
- }
- names := make([]string, len(nodes.Items))
- for ix := range nodes.Items {
- names[ix] = nodes.Items[ix].Name
- }
- DumpNodeDebugInfo(c, names)
- }
- func DumpNodeDebugInfo(c *client.Client, nodeNames []string) {
- for _, n := range nodeNames {
- Logf("\nLogging node info for node %v", n)
- node, err := c.Nodes().Get(n)
- if err != nil {
- Logf("Error getting node info %v", err)
- }
- Logf("Node Info: %v", node)
- Logf("\nLogging kubelet events for node %v", n)
- for _, e := range getNodeEvents(c, n) {
- Logf("source %v type %v message %v reason %v first ts %v last ts %v, involved obj %+v",
- e.Source, e.Type, e.Message, e.Reason, e.FirstTimestamp, e.LastTimestamp, e.InvolvedObject)
- }
- Logf("\nLogging pods the kubelet thinks is on node %v", n)
- podList, err := GetKubeletPods(c, n)
- if err != nil {
- Logf("Unable to retrieve kubelet pods for node %v", n)
- continue
- }
- for _, p := range podList.Items {
- Logf("%v started at %v (%d+%d container statuses recorded)", p.Name, p.Status.StartTime, len(p.Status.InitContainerStatuses), len(p.Status.ContainerStatuses))
- for _, c := range p.Status.InitContainerStatuses {
- Logf("\tInit container %v ready: %v, restart count %v",
- c.Name, c.Ready, c.RestartCount)
- }
- for _, c := range p.Status.ContainerStatuses {
- Logf("\tContainer %v ready: %v, restart count %v",
- c.Name, c.Ready, c.RestartCount)
- }
- }
- HighLatencyKubeletOperations(c, 10*time.Second, n)
- // TODO: Log node resource info
- }
- }
- // logNodeEvents logs kubelet events from the given node. This includes kubelet
- // restart and node unhealthy events. Note that listing events like this will mess
- // with latency metrics, beware of calling it during a test.
- func getNodeEvents(c *client.Client, nodeName string) []api.Event {
- selector := fields.Set{
- "involvedObject.kind": "Node",
- "involvedObject.name": nodeName,
- "involvedObject.namespace": api.NamespaceAll,
- "source": "kubelet",
- }.AsSelector()
- options := api.ListOptions{FieldSelector: selector}
- events, err := c.Events(api.NamespaceSystem).List(options)
- if err != nil {
- Logf("Unexpected error retrieving node events %v", err)
- return []api.Event{}
- }
- return events.Items
- }
- // waitListSchedulableNodesOrDie is a wrapper around listing nodes supporting retries.
- func waitListSchedulableNodesOrDie(c *client.Client) *api.NodeList {
- var nodes *api.NodeList
- var err error
- if wait.PollImmediate(Poll, SingleCallTimeout, func() (bool, error) {
- nodes, err = c.Nodes().List(api.ListOptions{FieldSelector: fields.Set{
- "spec.unschedulable": "false",
- }.AsSelector()})
- return err == nil, nil
- }) != nil {
- ExpectNoError(err, "Timed out while listing nodes for e2e cluster.")
- }
- return nodes
- }
- // Node is schedulable if:
- // 1) doesn't have "unschedulable" field set
- // 2) it's Ready condition is set to true
- // 3) doesn't have NetworkUnavailable condition set to true
- func isNodeSchedulable(node *api.Node) bool {
- nodeReady := IsNodeConditionSetAsExpected(node, api.NodeReady, true)
- networkReady := IsNodeConditionUnset(node, api.NodeNetworkUnavailable) ||
- IsNodeConditionSetAsExpectedSilent(node, api.NodeNetworkUnavailable, false)
- return !node.Spec.Unschedulable && nodeReady && networkReady
- }
- // GetReadySchedulableNodesOrDie addresses the common use case of getting nodes you can do work on.
- // 1) Needs to be schedulable.
- // 2) Needs to be ready.
- // If EITHER 1 or 2 is not true, most tests will want to ignore the node entirely.
- func GetReadySchedulableNodesOrDie(c *client.Client) (nodes *api.NodeList) {
- nodes = waitListSchedulableNodesOrDie(c)
- // previous tests may have cause failures of some nodes. Let's skip
- // 'Not Ready' nodes, just in case (there is no need to fail the test).
- FilterNodes(nodes, func(node api.Node) bool {
- return isNodeSchedulable(&node)
- })
- return nodes
- }
- func WaitForAllNodesSchedulable(c *client.Client) error {
- return wait.PollImmediate(30*time.Second, 4*time.Hour, func() (bool, error) {
- opts := api.ListOptions{
- ResourceVersion: "0",
- FieldSelector: fields.Set{"spec.unschedulable": "false"}.AsSelector(),
- }
- nodes, err := c.Nodes().List(opts)
- if err != nil {
- Logf("Unexpected error listing nodes: %v", err)
- // Ignore the error here - it will be retried.
- return false, nil
- }
- schedulable := 0
- for _, node := range nodes.Items {
- if isNodeSchedulable(&node) {
- schedulable++
- }
- }
- if schedulable != len(nodes.Items) {
- Logf("%d/%d nodes schedulable (polling after 30s)", schedulable, len(nodes.Items))
- return false, nil
- }
- return true, nil
- })
- }
- func AddOrUpdateLabelOnNode(c *client.Client, nodeName string, labelKey string, labelValue string) {
- patch := fmt.Sprintf(`{"metadata":{"labels":{"%s":"%s"}}}`, labelKey, labelValue)
- var err error
- for attempt := 0; attempt < UpdateRetries; attempt++ {
- err = c.Patch(api.MergePatchType).Resource("nodes").Name(nodeName).Body([]byte(patch)).Do().Error()
- if err != nil {
- if !apierrs.IsConflict(err) {
- ExpectNoError(err)
- } else {
- Logf("Conflict when trying to add a label %v:%v to %v", labelKey, labelValue, nodeName)
- }
- } else {
- break
- }
- time.Sleep(100 * time.Millisecond)
- }
- ExpectNoError(err)
- }
- func ExpectNodeHasLabel(c *client.Client, nodeName string, labelKey string, labelValue string) {
- By("verifying the node has the label " + labelKey + " " + labelValue)
- node, err := c.Nodes().Get(nodeName)
- ExpectNoError(err)
- Expect(node.Labels[labelKey]).To(Equal(labelValue))
- }
- // RemoveLabelOffNode is for cleaning up labels temporarily added to node,
- // won't fail if target label doesn't exist or has been removed.
- func RemoveLabelOffNode(c *client.Client, nodeName string, labelKey string) {
- By("removing the label " + labelKey + " off the node " + nodeName)
- var nodeUpdated *api.Node
- var node *api.Node
- var err error
- for attempt := 0; attempt < UpdateRetries; attempt++ {
- node, err = c.Nodes().Get(nodeName)
- ExpectNoError(err)
- if node.Labels == nil || len(node.Labels[labelKey]) == 0 {
- return
- }
- delete(node.Labels, labelKey)
- nodeUpdated, err = c.Nodes().Update(node)
- if err != nil {
- if !apierrs.IsConflict(err) {
- ExpectNoError(err)
- } else {
- Logf("Conflict when trying to remove a label %v from %v", labelKey, nodeName)
- }
- } else {
- break
- }
- time.Sleep(100 * time.Millisecond)
- }
- ExpectNoError(err)
- By("verifying the node doesn't have the label " + labelKey)
- if nodeUpdated.Labels != nil && len(nodeUpdated.Labels[labelKey]) != 0 {
- Failf("Failed removing label " + labelKey + " of the node " + nodeName)
- }
- }
- func AddOrUpdateTaintOnNode(c *client.Client, nodeName string, taint api.Taint) {
- for attempt := 0; attempt < UpdateRetries; attempt++ {
- node, err := c.Nodes().Get(nodeName)
- ExpectNoError(err)
- nodeTaints, err := api.GetTaintsFromNodeAnnotations(node.Annotations)
- ExpectNoError(err)
- var newTaints []api.Taint
- updated := false
- for _, existingTaint := range nodeTaints {
- if existingTaint.Key == taint.Key {
- newTaints = append(newTaints, taint)
- updated = true
- continue
- }
- newTaints = append(newTaints, existingTaint)
- }
- if !updated {
- newTaints = append(newTaints, taint)
- }
- taintsData, err := json.Marshal(newTaints)
- ExpectNoError(err)
- if node.Annotations == nil {
- node.Annotations = make(map[string]string)
- }
- node.Annotations[api.TaintsAnnotationKey] = string(taintsData)
- _, err = c.Nodes().Update(node)
- if err != nil {
- if !apierrs.IsConflict(err) {
- ExpectNoError(err)
- } else {
- Logf("Conflict when trying to add/update taint %v to %v", taint, nodeName)
- }
- } else {
- break
- }
- time.Sleep(100 * time.Millisecond)
- }
- }
- func taintExists(taints []api.Taint, taintKey string) bool {
- for _, taint := range taints {
- if taint.Key == taintKey {
- return true
- }
- }
- return false
- }
- func ExpectNodeHasTaint(c *client.Client, nodeName string, taintKey string) {
- By("verifying the node has the taint " + taintKey)
- node, err := c.Nodes().Get(nodeName)
- ExpectNoError(err)
- nodeTaints, err := api.GetTaintsFromNodeAnnotations(node.Annotations)
- ExpectNoError(err)
- if len(nodeTaints) == 0 || !taintExists(nodeTaints, taintKey) {
- Failf("Failed to find taint %s on node %s", taintKey, nodeName)
- }
- }
- func deleteTaintByKey(taints []api.Taint, taintKey string) ([]api.Taint, error) {
- newTaints := []api.Taint{}
- found := false
- for _, taint := range taints {
- if taint.Key == taintKey {
- found = true
- continue
- }
- newTaints = append(newTaints, taint)
- }
- if !found {
- return nil, fmt.Errorf("taint key=\"%s\" not found.", taintKey)
- }
- return newTaints, nil
- }
- // RemoveTaintOffNode is for cleaning up taints temporarily added to node,
- // won't fail if target taint doesn't exist or has been removed.
- func RemoveTaintOffNode(c *client.Client, nodeName string, taintKey string) {
- By("removing the taint " + taintKey + " off the node " + nodeName)
- for attempt := 0; attempt < UpdateRetries; attempt++ {
- node, err := c.Nodes().Get(nodeName)
- ExpectNoError(err)
- nodeTaints, err := api.GetTaintsFromNodeAnnotations(node.Annotations)
- ExpectNoError(err)
- if len(nodeTaints) == 0 {
- return
- }
- if !taintExists(nodeTaints, taintKey) {
- return
- }
- newTaints, err := deleteTaintByKey(nodeTaints, taintKey)
- ExpectNoError(err)
- taintsData, err := json.Marshal(newTaints)
- ExpectNoError(err)
- node.Annotations[api.TaintsAnnotationKey] = string(taintsData)
- _, err = c.Nodes().Update(node)
- if err != nil {
- if !apierrs.IsConflict(err) {
- ExpectNoError(err)
- } else {
- Logf("Conflict when trying to add/update taint %v to %v", taintKey, nodeName)
- }
- } else {
- break
- }
- time.Sleep(100 * time.Millisecond)
- }
- nodeUpdated, err := c.Nodes().Get(nodeName)
- ExpectNoError(err)
- By("verifying the node doesn't have the taint " + taintKey)
- taintsGot, err := api.GetTaintsFromNodeAnnotations(nodeUpdated.Annotations)
- ExpectNoError(err)
- if taintExists(taintsGot, taintKey) {
- Failf("Failed removing taint " + taintKey + " of the node " + nodeName)
- }
- }
- func ScaleRC(c *client.Client, ns, name string, size uint, wait bool) error {
- By(fmt.Sprintf("Scaling replication controller %s in namespace %s to %d", name, ns, size))
- scaler, err := kubectl.ScalerFor(api.Kind("ReplicationController"), c)
- if err != nil {
- return err
- }
- waitForScale := kubectl.NewRetryParams(5*time.Second, 1*time.Minute)
- waitForReplicas := kubectl.NewRetryParams(5*time.Second, 5*time.Minute)
- if err = scaler.Scale(ns, name, size, nil, waitForScale, waitForReplicas); err != nil {
- return fmt.Errorf("error while scaling RC %s to %d replicas: %v", name, size, err)
- }
- if !wait {
- return nil
- }
- return WaitForRCPodsRunning(c, ns, name)
- }
- // Wait up to 10 minutes for pods to become Running.
- func WaitForRCPodsRunning(c *client.Client, ns, rcName string) error {
- rc, err := c.ReplicationControllers(ns).Get(rcName)
- if err != nil {
- return err
- }
- selector := labels.SelectorFromSet(labels.Set(rc.Spec.Selector))
- err = WaitForPodsWithLabelRunning(c, ns, selector)
- if err != nil {
- return fmt.Errorf("Error while waiting for replication controller %s pods to be running: %v", rcName, err)
- }
- return nil
- }
- // Wait up to 10 minutes for all matching pods to become Running and at least one
- // matching pod exists.
- func WaitForPodsWithLabelRunning(c *client.Client, ns string, label labels.Selector) error {
- running := false
- PodStore := NewPodStore(c, ns, label, fields.Everything())
- defer PodStore.Stop()
- waitLoop:
- for start := time.Now(); time.Since(start) < 10*time.Minute; time.Sleep(5 * time.Second) {
- pods := PodStore.List()
- if len(pods) == 0 {
- continue waitLoop
- }
- for _, p := range pods {
- if p.Status.Phase != api.PodRunning {
- continue waitLoop
- }
- }
- running = true
- break
- }
- if !running {
- return fmt.Errorf("Timeout while waiting for pods with labels %q to be running", label.String())
- }
- return nil
- }
- // Returns true if all the specified pods are scheduled, else returns false.
- func podsWithLabelScheduled(c *client.Client, ns string, label labels.Selector) (bool, error) {
- PodStore := NewPodStore(c, ns, label, fields.Everything())
- defer PodStore.Stop()
- pods := PodStore.List()
- if len(pods) == 0 {
- return false, nil
- }
- for _, pod := range pods {
- if pod.Spec.NodeName == "" {
- return false, nil
- }
- }
- return true, nil
- }
- // Wait for all matching pods to become scheduled and at least one
- // matching pod exists. Return the list of matching pods.
- func WaitForPodsWithLabelScheduled(c *client.Client, ns string, label labels.Selector) (pods *api.PodList, err error) {
- err = wait.PollImmediate(Poll, podScheduledBeforeTimeout,
- func() (bool, error) {
- pods, err = WaitForPodsWithLabel(c, ns, label)
- if err != nil {
- return false, err
- }
- for _, pod := range pods.Items {
- if pod.Spec.NodeName == "" {
- return false, nil
- }
- }
- return true, nil
- })
- return pods, err
- }
- // Wait up to PodListTimeout for getting pods with certain label
- func WaitForPodsWithLabel(c *client.Client, ns string, label labels.Selector) (pods *api.PodList, err error) {
- for t := time.Now(); time.Since(t) < PodListTimeout; time.Sleep(Poll) {
- options := api.ListOptions{LabelSelector: label}
- pods, err = c.Pods(ns).List(options)
- Expect(err).NotTo(HaveOccurred())
- if len(pods.Items) > 0 {
- break
- }
- }
- if pods == nil || len(pods.Items) == 0 {
- err = fmt.Errorf("Timeout while waiting for pods with label %v", label)
- }
- return
- }
- // DeleteRCAndPods a Replication Controller and all pods it spawned
- func DeleteRCAndPods(c *client.Client, ns, name string) error {
- By(fmt.Sprintf("deleting replication controller %s in namespace %s", name, ns))
- rc, err := c.ReplicationControllers(ns).Get(name)
- if err != nil {
- if apierrs.IsNotFound(err) {
- Logf("RC %s was already deleted: %v", name, err)
- return nil
- }
- return err
- }
- reaper, err := kubectl.ReaperForReplicationController(c, 10*time.Minute)
- if err != nil {
- if apierrs.IsNotFound(err) {
- Logf("RC %s was already deleted: %v", name, err)
- return nil
- }
- return err
- }
- ps, err := podStoreForRC(c, rc)
- if err != nil {
- return err
- }
- defer ps.Stop()
- startTime := time.Now()
- err = reaper.Stop(ns, name, 0, nil)
- if apierrs.IsNotFound(err) {
- Logf("RC %s was already deleted: %v", name, err)
- return nil
- }
- if err != nil {
- return fmt.Errorf("error while stopping RC: %s: %v", name, err)
- }
- deleteRCTime := time.Now().Sub(startTime)
- Logf("Deleting RC %s took: %v", name, deleteRCTime)
- err = waitForPodsInactive(ps, 10*time.Millisecond, 10*time.Minute)
- if err != nil {
- return fmt.Errorf("error while waiting for pods to become inactive %s: %v", name, err)
- }
- terminatePodTime := time.Now().Sub(startTime) - deleteRCTime
- Logf("Terminating RC %s pods took: %v", name, terminatePodTime)
- // this is to relieve namespace controller's pressure when deleting the
- // namespace after a test.
- err = waitForPodsGone(ps, 10*time.Second, 10*time.Minute)
- if err != nil {
- return fmt.Errorf("error while waiting for pods gone %s: %v", name, err)
- }
- return nil
- }
- // DeleteRCAndWaitForGC deletes only the Replication Controller and waits for GC to delete the pods.
- func DeleteRCAndWaitForGC(c *client.Client, ns, name string) error {
- By(fmt.Sprintf("deleting replication controller %s in namespace %s, will wait for the garbage collector to delete the pods", name, ns))
- rc, err := c.ReplicationControllers(ns).Get(name)
- if err != nil {
- if apierrs.IsNotFound(err) {
- Logf("RC %s was already deleted: %v", name, err)
- return nil
- }
- return err
- }
- ps, err := podStoreForRC(c, rc)
- if err != nil {
- return err
- }
- defer ps.Stop()
- startTime := time.Now()
- falseVar := false
- deleteOption := &api.DeleteOptions{OrphanDependents: &falseVar}
- err = c.ReplicationControllers(ns).Delete(name, deleteOption)
- if err != nil && apierrs.IsNotFound(err) {
- Logf("RC %s was already deleted: %v", name, err)
- return nil
- }
- if err != nil {
- return err
- }
- deleteRCTime := time.Now().Sub(startTime)
- Logf("Deleting RC %s took: %v", name, deleteRCTime)
- var interval, timeout time.Duration
- switch {
- case rc.Spec.Replicas < 100:
- interval = 10 * time.Millisecond
- timeout = 10 * time.Minute
- case rc.Spec.Replicas < 1000:
- interval = 1 * time.Second
- timeout = 10 * time.Minute
- case rc.Spec.Replicas < 10000:
- interval = 10 * time.Second
- timeout = 10 * time.Minute
- default:
- interval = 10 * time.Second
- timeout = 40 * time.Minute
- }
- err = waitForPodsInactive(ps, interval, timeout)
- if err != nil {
- return fmt.Errorf("error while waiting for pods to become inactive %s: %v", name, err)
- }
- terminatePodTime := time.Now().Sub(startTime) - deleteRCTime
- Logf("Terminating RC %s pods took: %v", name, terminatePodTime)
- err = waitForPodsGone(ps, 10*time.Second, 10*time.Minute)
- if err != nil {
- return fmt.Errorf("error while waiting for pods gone %s: %v", name, err)
- }
- return nil
- }
- // podStoreForRC creates a PodStore that monitors pods belong to the rc. It
- // waits until the reflector does a List() before returning.
- func podStoreForRC(c *client.Client, rc *api.ReplicationController) (*PodStore, error) {
- labels := labels.SelectorFromSet(rc.Spec.Selector)
- ps := NewPodStore(c, rc.Namespace, labels, fields.Everything())
- err := wait.Poll(1*time.Second, 1*time.Minute, func() (bool, error) {
- if len(ps.reflector.LastSyncResourceVersion()) != 0 {
- return true, nil
- }
- return false, nil
- })
- return ps, err
- }
- // waitForPodsInactive waits until there are no active pods left in the PodStore.
- // This is to make a fair comparison of deletion time between DeleteRCAndPods
- // and DeleteRCAndWaitForGC, because the RC controller decreases status.replicas
- // when the pod is inactvie.
- func waitForPodsInactive(ps *PodStore, interval, timeout time.Duration) error {
- return wait.PollImmediate(interval, timeout, func() (bool, error) {
- pods := ps.List()
- for _, pod := range pods {
- if controller.IsPodActive(pod) {
- return false, nil
- }
- }
- return true, nil
- })
- }
- // waitForPodsGone waits until there are no pods left in the PodStore.
- func waitForPodsGone(ps *PodStore, interval, timeout time.Duration) error {
- return wait.PollImmediate(interval, timeout, func() (bool, error) {
- if pods := ps.List(); len(pods) == 0 {
- return true, nil
- }
- return false, nil
- })
- }
- // Delete a ReplicaSet and all pods it spawned
- func DeleteReplicaSet(c *client.Client, ns, name string) error {
- By(fmt.Sprintf("deleting ReplicaSet %s in namespace %s", name, ns))
- rc, err := c.Extensions().ReplicaSets(ns).Get(name)
- if err != nil {
- if apierrs.IsNotFound(err) {
- Logf("ReplicaSet %s was already deleted: %v", name, err)
- return nil
- }
- return err
- }
- reaper, err := kubectl.ReaperFor(extensions.Kind("ReplicaSet"), c)
- if err != nil {
- if apierrs.IsNotFound(err) {
- Logf("ReplicaSet %s was already deleted: %v", name, err)
- return nil
- }
- return err
- }
- startTime := time.Now()
- err = reaper.Stop(ns, name, 0, nil)
- if apierrs.IsNotFound(err) {
- Logf("ReplicaSet %s was already deleted: %v", name, err)
- return nil
- }
- deleteRSTime := time.Now().Sub(startTime)
- Logf("Deleting RS %s took: %v", name, deleteRSTime)
- if err == nil {
- err = waitForReplicaSetPodsGone(c, rc)
- }
- terminatePodTime := time.Now().Sub(startTime) - deleteRSTime
- Logf("Terminating ReplicaSet %s pods took: %v", name, terminatePodTime)
- return err
- }
- // waitForReplicaSetPodsGone waits until there are no pods reported under a
- // ReplicaSet selector (because the pods have completed termination).
- func waitForReplicaSetPodsGone(c *client.Client, rs *extensions.ReplicaSet) error {
- return wait.PollImmediate(Poll, 2*time.Minute, func() (bool, error) {
- selector, err := unversioned.LabelSelectorAsSelector(rs.Spec.Selector)
- ExpectNoError(err)
- options := api.ListOptions{LabelSelector: selector}
- if pods, err := c.Pods(rs.Namespace).List(options); err == nil && len(pods.Items) == 0 {
- return true, nil
- }
- return false, nil
- })
- }
- // Waits for the deployment status to become valid (i.e. max unavailable and max surge aren't violated anymore).
- // Note that the status should stay valid at all times unless shortly after a scaling event or the deployment is just created.
- // To verify that the deployment status is valid and wait for the rollout to finish, use WaitForDeploymentStatus instead.
- func WaitForDeploymentStatusValid(c clientset.Interface, d *extensions.Deployment) error {
- var (
- oldRSs, allOldRSs, allRSs []*extensions.ReplicaSet
- newRS *extensions.ReplicaSet
- deployment *extensions.Deployment
- reason string
- )
- err := wait.Poll(Poll, 2*time.Minute, func() (bool, error) {
- var err error
- deployment, err = c.Extensions().Deployments(d.Namespace).Get(d.Name)
- if err != nil {
- return false, err
- }
- oldRSs, allOldRSs, newRS, err = deploymentutil.GetAllReplicaSets(deployment, c)
- if err != nil {
- return false, err
- }
- if newRS == nil {
- // New RC hasn't been created yet.
- reason = "new replica set hasn't been created yet"
- Logf(reason)
- return false, nil
- }
- allRSs = append(oldRSs, newRS)
- // The old/new ReplicaSets need to contain the pod-template-hash label
- for i := range allRSs {
- if !labelsutil.SelectorHasLabel(allRSs[i].Spec.Selector, extensions.DefaultDeploymentUniqueLabelKey) {
- reason = "all replica sets need to contain the pod-template-hash label"
- Logf(reason)
- return false, nil
- }
- }
- totalCreated := deploymentutil.GetReplicaCountForReplicaSets(allRSs)
- totalAvailable, err := deploymentutil.GetAvailablePodsForDeployment(c, deployment)
- if err != nil {
- return false, err
- }
- maxCreated := deployment.Spec.Replicas + deploymentutil.MaxSurge(*deployment)
- if totalCreated > maxCreated {
- reason = fmt.Sprintf("total pods created: %d, more than the max allowed: %d", totalCreated, maxCreated)
- Logf(reason)
- return false, nil
- }
- minAvailable := deploymentutil.MinAvailable(deployment)
- if totalAvailable < minAvailable {
- reason = fmt.Sprintf("total pods available: %d, less than the min required: %d", totalAvailable, minAvailable)
- Logf(reason)
- return false, nil
- }
- return true, nil
- })
- if err == wait.ErrWaitTimeout {
- logReplicaSetsOfDeployment(deployment, allOldRSs, newRS)
- logPodsOfDeployment(c, deployment)
- err = fmt.Errorf("%s", reason)
- }
- if err != nil {
- return fmt.Errorf("error waiting for deployment %q status to match expectation: %v", d.Name, err)
- }
- return nil
- }
- // Waits for the deployment to reach desired state.
- // Returns an error if the deployment's rolling update strategy (max unavailable or max surge) is broken at any times.
- func WaitForDeploymentStatus(c clientset.Interface, d *extensions.Deployment) error {
- var (
- oldRSs, allOldRSs, allRSs []*extensions.ReplicaSet
- newRS *extensions.ReplicaSet
- deployment *extensions.Deployment
- )
- err := wait.Poll(Poll, 5*time.Minute, func() (bool, error) {
- var err error
- deployment, err = c.Extensions().Deployments(d.Namespace).Get(d.Name)
- if err != nil {
- return false, err
- }
- oldRSs, allOldRSs, newRS, err = deploymentutil.GetAllReplicaSets(deployment, c)
- if err != nil {
- return false, err
- }
- if newRS == nil {
- // New RS hasn't been created yet.
- return false, nil
- }
- allRSs = append(oldRSs, newRS)
- // The old/new ReplicaSets need to contain the pod-template-hash label
- for i := range allRSs {
- if !labelsutil.SelectorHasLabel(allRSs[i].Spec.Selector, extensions.DefaultDeploymentUniqueLabelKey) {
- return false, nil
- }
- }
- totalCreated := deploymentutil.GetReplicaCountForReplicaSets(allRSs)
- totalAvailable, err := deploymentutil.GetAvailablePodsForDeployment(c, deployment)
- if err != nil {
- return false, err
- }
- maxCreated := deployment.Spec.Replicas + deploymentutil.MaxSurge(*deployment)
- if totalCreated > maxCreated {
- logReplicaSetsOfDeployment(deployment, allOldRSs, newRS)
- logPodsOfDeployment(c, deployment)
- return false, fmt.Errorf("total pods created: %d, more than the max allowed: %d", totalCreated, maxCreated)
- }
- minAvailable := deploymentutil.MinAvailable(deployment)
- if totalAvailable < minAvailable {
- logReplicaSetsOfDeployment(deployment, allOldRSs, newRS)
- logPodsOfDeployment(c, deployment)
- return false, fmt.Errorf("total pods available: %d, less than the min required: %d", totalAvailable, minAvailable)
- }
- // When the deployment status and its underlying resources reach the desired state, we're done
- if deployment.Status.Replicas == deployment.Spec.Replicas &&
- deployment.Status.UpdatedReplicas == deployment.Spec.Replicas &&
- deploymentutil.GetReplicaCountForReplicaSets(oldRSs) == 0 &&
- deploymentutil.GetReplicaCountForReplicaSets([]*extensions.ReplicaSet{newRS}) == deployment.Spec.Replicas {
- return true, nil
- }
- return false, nil
- })
- if err == wait.ErrWaitTimeout {
- logReplicaSetsOfDeployment(deployment, allOldRSs, newRS)
- logPodsOfDeployment(c, deployment)
- }
- if err != nil {
- return fmt.Errorf("error waiting for deployment %q status to match expectation: %v", d.Name, err)
- }
- return nil
- }
- // WaitForDeploymentUpdatedReplicasLTE waits for given deployment to be observed by the controller and has at least a number of updatedReplicas
- func WaitForDeploymentUpdatedReplicasLTE(c clientset.Interface, ns, deploymentName string, minUpdatedReplicas int, desiredGeneration int64) error {
- err := wait.Poll(Poll, 5*time.Minute, func() (bool, error) {
- deployment, err := c.Extensions().Deployments(ns).Get(deploymentName)
- if err != nil {
- return false, err
- }
- if deployment.Status.ObservedGeneration >= desiredGeneration && deployment.Status.UpdatedReplicas >= int32(minUpdatedReplicas) {
- return true, nil
- }
- return false, nil
- })
- if err != nil {
- return fmt.Errorf("error waiting for deployment %s to have at least %d updpatedReplicas: %v", deploymentName, minUpdatedReplicas, err)
- }
- return nil
- }
- // WaitForDeploymentRollbackCleared waits for given deployment either started rolling back or doesn't need to rollback.
- // Note that rollback should be cleared shortly, so we only wait for 1 minute here to fail early.
- func WaitForDeploymentRollbackCleared(c clientset.Interface, ns, deploymentName string) error {
- err := wait.Poll(Poll, 1*time.Minute, func() (bool, error) {
- deployment, err := c.Extensions().Deployments(ns).Get(deploymentName)
- if err != nil {
- return false, err
- }
- // Rollback not set or is kicked off
- if deployment.Spec.RollbackTo == nil {
- return true, nil
- }
- return false, nil
- })
- if err != nil {
- return fmt.Errorf("error waiting for deployment %s rollbackTo to be cleared: %v", deploymentName, err)
- }
- return nil
- }
- // WaitForDeploymentRevisionAndImage waits for the deployment's and its new RS's revision and container image to match the given revision and image.
- // Note that deployment revision and its new RS revision should be updated shortly, so we only wait for 1 minute here to fail early.
- func WaitForDeploymentRevisionAndImage(c clientset.Interface, ns, deploymentName string, revision, image string) error {
- var deployment *extensions.Deployment
- var newRS *extensions.ReplicaSet
- err := wait.Poll(Poll, 1*time.Minute, func() (bool, error) {
- var err error
- deployment, err = c.Extensions().Deployments(ns).Get(deploymentName)
- if err != nil {
- return false, err
- }
- // The new ReplicaSet needs to be non-nil and contain the pod-template-hash label
- newRS, err = deploymentutil.GetNewReplicaSet(deployment, c)
- if err != nil || newRS == nil || !labelsutil.SelectorHasLabel(newRS.Spec.Selector, extensions.DefaultDeploymentUniqueLabelKey) {
- return false, err
- }
- // Check revision of this deployment, and of the new replica set of this deployment
- if deployment.Annotations == nil || deployment.Annotations[deploymentutil.RevisionAnnotation] != revision ||
- newRS.Annotations == nil || newRS.Annotations[deploymentutil.RevisionAnnotation] != revision ||
- deployment.Spec.Template.Spec.Containers[0].Image != image || newRS.Spec.Template.Spec.Containers[0].Image != image {
- return false, nil
- }
- return true, nil
- })
- if err == wait.ErrWaitTimeout {
- logReplicaSetsOfDeployment(deployment, nil, newRS)
- }
- if newRS == nil {
- return fmt.Errorf("deployment %s failed to create new RS: %v", deploymentName, err)
- }
- if err != nil {
- return fmt.Errorf("error waiting for deployment %s (got %s / %s) and new RS %s (got %s / %s) revision and image to match expectation (expected %s / %s): %v", deploymentName, deployment.Annotations[deploymentutil.RevisionAnnotation], deployment.Spec.Template.Spec.Containers[0].Image, newRS.Name, newRS.Annotations[deploymentutil.RevisionAnnotation], newRS.Spec.Template.Spec.Containers[0].Image, revision, image, err)
- }
- return nil
- }
- func WaitForOverlappingAnnotationMatch(c clientset.Interface, ns, deploymentName, expected string) error {
- return wait.Poll(Poll, 1*time.Minute, func() (bool, error) {
- deployment, err := c.Extensions().Deployments(ns).Get(deploymentName)
- if err != nil {
- return false, err
- }
- if deployment.Annotations[deploymentutil.OverlapAnnotation] == expected {
- return true, nil
- }
- return false, nil
- })
- }
- // CheckNewRSAnnotations check if the new RS's annotation is as expected
- func CheckNewRSAnnotations(c clientset.Interface, ns, deploymentName string, expectedAnnotations map[string]string) error {
- deployment, err := c.Extensions().Deployments(ns).Get(deploymentName)
- if err != nil {
- return err
- }
- newRS, err := deploymentutil.GetNewReplicaSet(deployment, c)
- if err != nil {
- return err
- }
- for k, v := range expectedAnnotations {
- // Skip checking revision annotations
- if k != deploymentutil.RevisionAnnotation && v != newRS.Annotations[k] {
- return fmt.Errorf("Expected new RS annotations = %+v, got %+v", expectedAnnotations, newRS.Annotations)
- }
- }
- return nil
- }
- func WaitForPodsReady(c *clientset.Clientset, ns, name string, minReadySeconds int) error {
- label := labels.SelectorFromSet(labels.Set(map[string]string{"name": name}))
- options := api.ListOptions{LabelSelector: label}
- return wait.Poll(Poll, 5*time.Minute, func() (bool, error) {
- pods, err := c.Pods(ns).List(options)
- if err != nil {
- return false, nil
- }
- for _, pod := range pods.Items {
- if !deploymentutil.IsPodAvailable(&pod, int32(minReadySeconds), time.Now()) {
- return false, nil
- }
- }
- return true, nil
- })
- }
- // Waits for the deployment to clean up old rcs.
- func WaitForDeploymentOldRSsNum(c *clientset.Clientset, ns, deploymentName string, desiredRSNum int) error {
- return wait.Poll(Poll, 5*time.Minute, func() (bool, error) {
- deployment, err := c.Extensions().Deployments(ns).Get(deploymentName)
- if err != nil {
- return false, err
- }
- _, oldRSs, err := deploymentutil.GetOldReplicaSets(deployment, c)
- if err != nil {
- return false, err
- }
- return len(oldRSs) == desiredRSNum, nil
- })
- }
- func logReplicaSetsOfDeployment(deployment *extensions.Deployment, allOldRSs []*extensions.ReplicaSet, newRS *extensions.ReplicaSet) {
- Logf("Deployment: %+v. Selector = %+v", *deployment, deployment.Spec.Selector)
- for i := range allOldRSs {
- Logf("All old ReplicaSets (%d/%d) of deployment %s: %+v. Selector = %+v", i+1, len(allOldRSs), deployment.Name, *allOldRSs[i], allOldRSs[i].Spec.Selector)
- }
- if newRS != nil {
- Logf("New ReplicaSet of deployment %s: %+v. Selector = %+v", deployment.Name, *newRS, newRS.Spec.Selector)
- } else {
- Logf("New ReplicaSet of deployment %s is nil.", deployment.Name)
- }
- }
- func WaitForObservedDeployment(c *clientset.Clientset, ns, deploymentName string, desiredGeneration int64) error {
- return deploymentutil.WaitForObservedDeployment(func() (*extensions.Deployment, error) { return c.Extensions().Deployments(ns).Get(deploymentName) }, desiredGeneration, Poll, 1*time.Minute)
- }
- func logPodsOfDeployment(c clientset.Interface, deployment *extensions.Deployment) {
- minReadySeconds := deployment.Spec.MinReadySeconds
- podList, err := deploymentutil.ListPods(deployment,
- func(namespace string, options api.ListOptions) (*api.PodList, error) {
- return c.Core().Pods(namespace).List(options)
- })
- if err != nil {
- Logf("Failed to list pods of deployment %s: %v", deployment.Name, err)
- return
- }
- if err == nil {
- for _, pod := range podList.Items {
- availability := "not available"
- if deploymentutil.IsPodAvailable(&pod, minReadySeconds, time.Now()) {
- availability = "available"
- }
- Logf("Pod %s is %s: %+v", pod.Name, availability, pod)
- }
- }
- }
- // Waits for the number of events on the given object to reach a desired count.
- func WaitForEvents(c *client.Client, ns string, objOrRef runtime.Object, desiredEventsCount int) error {
- return wait.Poll(Poll, 5*time.Minute, func() (bool, error) {
- events, err := c.Events(ns).Search(objOrRef)
- if err != nil {
- return false, fmt.Errorf("error in listing events: %s", err)
- }
- eventsCount := len(events.Items)
- if eventsCount == desiredEventsCount {
- return true, nil
- }
- if eventsCount < desiredEventsCount {
- return false, nil
- }
- // Number of events has exceeded the desired count.
- return false, fmt.Errorf("number of events has exceeded the desired count, eventsCount: %d, desiredCount: %d", eventsCount, desiredEventsCount)
- })
- }
- // Waits for the number of events on the given object to be at least a desired count.
- func WaitForPartialEvents(c *client.Client, ns string, objOrRef runtime.Object, atLeastEventsCount int) error {
- return wait.Poll(Poll, 5*time.Minute, func() (bool, error) {
- events, err := c.Events(ns).Search(objOrRef)
- if err != nil {
- return false, fmt.Errorf("error in listing events: %s", err)
- }
- eventsCount := len(events.Items)
- if eventsCount >= atLeastEventsCount {
- return true, nil
- }
- return false, nil
- })
- }
- type updateDeploymentFunc func(d *extensions.Deployment)
- func UpdateDeploymentWithRetries(c *clientset.Clientset, namespace, name string, applyUpdate updateDeploymentFunc) (deployment *extensions.Deployment, err error) {
- deployments := c.Extensions().Deployments(namespace)
- err = wait.Poll(10*time.Millisecond, 1*time.Minute, func() (bool, error) {
- if deployment, err = deployments.Get(name); err != nil {
- return false, err
- }
- // Apply the update, then attempt to push it to the apiserver.
- applyUpdate(deployment)
- if deployment, err = deployments.Update(deployment); err == nil {
- Logf("Updating deployment %s", name)
- return true, nil
- }
- return false, nil
- })
- return deployment, err
- }
- // FailedContainers inspects all containers in a pod and returns failure
- // information for containers that have failed or been restarted.
- // A map is returned where the key is the containerID and the value is a
- // struct containing the restart and failure information
- func FailedContainers(pod *api.Pod) map[string]ContainerFailures {
- var state ContainerFailures
- states := make(map[string]ContainerFailures)
- statuses := pod.Status.ContainerStatuses
- if len(statuses) == 0 {
- return nil
- } else {
- for _, status := range statuses {
- if status.State.Terminated != nil {
- states[status.ContainerID] = ContainerFailures{status: status.State.Terminated}
- } else if status.LastTerminationState.Terminated != nil {
- states[status.ContainerID] = ContainerFailures{status: status.LastTerminationState.Terminated}
- }
- if status.RestartCount > 0 {
- var ok bool
- if state, ok = states[status.ContainerID]; !ok {
- state = ContainerFailures{}
- }
- state.Restarts = int(status.RestartCount)
- states[status.ContainerID] = state
- }
- }
- }
- return states
- }
- // Prints the histogram of the events and returns the number of bad events.
- func BadEvents(events []*api.Event) int {
- type histogramKey struct {
- reason string
- source string
- }
- histogram := make(map[histogramKey]int)
- for _, e := range events {
- histogram[histogramKey{reason: e.Reason, source: e.Source.Component}]++
- }
- for key, number := range histogram {
- Logf("- reason: %s, source: %s -> %d", key.reason, key.source, number)
- }
- badPatterns := []string{"kill", "fail"}
- badEvents := 0
- for key, number := range histogram {
- for _, s := range badPatterns {
- if strings.Contains(key.reason, s) {
- Logf("WARNING %d events from %s with reason: %s", number, key.source, key.reason)
- badEvents += number
- break
- }
- }
- }
- return badEvents
- }
- // NodeAddresses returns the first address of the given type of each node.
- func NodeAddresses(nodelist *api.NodeList, addrType api.NodeAddressType) []string {
- hosts := []string{}
- for _, n := range nodelist.Items {
- for _, addr := range n.Status.Addresses {
- // Use the first external IP address we find on the node, and
- // use at most one per node.
- // TODO(roberthbailey): Use the "preferred" address for the node, once
- // such a thing is defined (#2462).
- if addr.Type == addrType {
- hosts = append(hosts, addr.Address)
- break
- }
- }
- }
- return hosts
- }
- // NodeSSHHosts returns SSH-able host names for all schedulable nodes - this excludes master node.
- // It returns an error if it can't find an external IP for every node, though it still returns all
- // hosts that it found in that case.
- func NodeSSHHosts(c *client.Client) ([]string, error) {
- nodelist := waitListSchedulableNodesOrDie(c)
- // TODO(roberthbailey): Use the "preferred" address for the node, once such a thing is defined (#2462).
- hosts := NodeAddresses(nodelist, api.NodeExternalIP)
- // Error if any node didn't have an external IP.
- if len(hosts) != len(nodelist.Items) {
- return hosts, fmt.Errorf(
- "only found %d external IPs on nodes, but found %d nodes. Nodelist: %v",
- len(hosts), len(nodelist.Items), nodelist)
- }
- sshHosts := make([]string, 0, len(hosts))
- for _, h := range hosts {
- sshHosts = append(sshHosts, net.JoinHostPort(h, "22"))
- }
- return sshHosts, nil
- }
// SSHResult describes one command run over SSH: who ran what where, and what
// came back.
type SSHResult struct {
	// User is the login name the command was run as.
	User string
	// Host is the host the command was run on.
	Host string
	// Cmd is the command that was run.
	Cmd string
	// Stdout and Stderr hold the command's captured output streams.
	Stdout string
	Stderr string
	// Code is the command's exit code.
	Code int
}
- // SSH synchronously SSHs to a node running on provider and runs cmd. If there
- // is no error performing the SSH, the stdout, stderr, and exit code are
- // returned.
- func SSH(cmd, host, provider string) (SSHResult, error) {
- result := SSHResult{Host: host, Cmd: cmd}
- // Get a signer for the provider.
- signer, err := GetSigner(provider)
- if err != nil {
- return result, fmt.Errorf("error getting signer for provider %s: '%v'", provider, err)
- }
- // RunSSHCommand will default to Getenv("USER") if user == "", but we're
- // defaulting here as well for logging clarity.
- result.User = os.Getenv("KUBE_SSH_USER")
- if result.User == "" {
- result.User = os.Getenv("USER")
- }
- stdout, stderr, code, err := sshutil.RunSSHCommand(cmd, result.User, host, signer)
- result.Stdout = stdout
- result.Stderr = stderr
- result.Code = code
- return result, err
- }
- func LogSSHResult(result SSHResult) {
- remote := fmt.Sprintf("%s@%s", result.User, result.Host)
- Logf("ssh %s: command: %s", remote, result.Cmd)
- Logf("ssh %s: stdout: %q", remote, result.Stdout)
- Logf("ssh %s: stderr: %q", remote, result.Stderr)
- Logf("ssh %s: exit code: %d", remote, result.Code)
- }
- func IssueSSHCommand(cmd, provider string, node *api.Node) error {
- Logf("Getting external IP address for %s", node.Name)
- host := ""
- for _, a := range node.Status.Addresses {
- if a.Type == api.NodeExternalIP {
- host = a.Address + ":22"
- break
- }
- }
- if host == "" {
- return fmt.Errorf("couldn't find external IP address for node %s", node.Name)
- }
- Logf("Calling %s on %s(%s)", cmd, node.Name, host)
- result, err := SSH(cmd, host, provider)
- LogSSHResult(result)
- if result.Code != 0 || err != nil {
- return fmt.Errorf("failed running %q: %v (exit code %d)", cmd, err, result.Code)
- }
- return nil
- }
- // NewHostExecPodSpec returns the pod spec of hostexec pod
- func NewHostExecPodSpec(ns, name string) *api.Pod {
- pod := &api.Pod{
- ObjectMeta: api.ObjectMeta{
- Name: name,
- Namespace: ns,
- },
- Spec: api.PodSpec{
- Containers: []api.Container{
- {
- Name: "hostexec",
- Image: "gcr.io/google_containers/hostexec:1.2",
- ImagePullPolicy: api.PullIfNotPresent,
- },
- },
- SecurityContext: &api.PodSecurityContext{
- HostNetwork: true,
- },
- },
- }
- return pod
- }
- // RunHostCmd runs the given cmd in the context of the given pod using `kubectl exec`
- // inside of a shell.
- func RunHostCmd(ns, name, cmd string) (string, error) {
- return RunKubectl("exec", fmt.Sprintf("--namespace=%v", ns), name, "--", "/bin/sh", "-c", cmd)
- }
- // RunHostCmdOrDie calls RunHostCmd and dies on error.
- func RunHostCmdOrDie(ns, name, cmd string) string {
- stdout, err := RunHostCmd(ns, name, cmd)
- Logf("stdout: %v", stdout)
- ExpectNoError(err)
- return stdout
- }
- // LaunchHostExecPod launches a hostexec pod in the given namespace and waits
- // until it's Running
- func LaunchHostExecPod(client *client.Client, ns, name string) *api.Pod {
- hostExecPod := NewHostExecPodSpec(ns, name)
- pod, err := client.Pods(ns).Create(hostExecPod)
- ExpectNoError(err)
- err = WaitForPodRunningInNamespace(client, pod)
- ExpectNoError(err)
- return pod
- }
- // GetSigner returns an ssh.Signer for the provider ("gce", etc.) that can be
- // used to SSH to their nodes.
- func GetSigner(provider string) (ssh.Signer, error) {
- // Get the directory in which SSH keys are located.
- keydir := filepath.Join(os.Getenv("HOME"), ".ssh")
- // Select the key itself to use. When implementing more providers here,
- // please also add them to any SSH tests that are disabled because of signer
- // support.
- keyfile := ""
- switch provider {
- case "gce", "gke", "kubemark":
- keyfile = "google_compute_engine"
- case "aws":
- // If there is an env. variable override, use that.
- aws_keyfile := os.Getenv("AWS_SSH_KEY")
- if len(aws_keyfile) != 0 {
- return sshutil.MakePrivateKeySignerFromFile(aws_keyfile)
- }
- // Otherwise revert to home dir
- keyfile = "kube_aws_rsa"
- default:
- return nil, fmt.Errorf("GetSigner(...) not implemented for %s", provider)
- }
- key := filepath.Join(keydir, keyfile)
- return sshutil.MakePrivateKeySignerFromFile(key)
- }
- // CheckPodsRunningReady returns whether all pods whose names are listed in
- // podNames in namespace ns are running and ready, using c and waiting at most
- // timeout.
- func CheckPodsRunningReady(c *client.Client, ns string, podNames []string, timeout time.Duration) bool {
- return CheckPodsCondition(c, ns, podNames, timeout, PodRunningReady, "running and ready")
- }
- // CheckPodsRunningReadyOrSucceeded returns whether all pods whose names are
- // listed in podNames in namespace ns are running and ready, or succeeded; use
- // c and waiting at most timeout.
- func CheckPodsRunningReadyOrSucceeded(c *client.Client, ns string, podNames []string, timeout time.Duration) bool {
- return CheckPodsCondition(c, ns, podNames, timeout, PodRunningReadyOrSucceeded, "running and ready, or succeeded")
- }
- // CheckPodsCondition returns whether all pods whose names are listed in podNames
- // in namespace ns are in the condition, using c and waiting at most timeout.
- func CheckPodsCondition(c *client.Client, ns string, podNames []string, timeout time.Duration, condition podCondition, desc string) bool {
- np := len(podNames)
- Logf("Waiting up to %v for %d pods to be %s: %s", timeout, np, desc, podNames)
- result := make(chan bool, len(podNames))
- for ix := range podNames {
- // Launch off pod readiness checkers.
- go func(name string) {
- err := waitForPodCondition(c, ns, name, desc, timeout, condition)
- result <- err == nil
- }(podNames[ix])
- }
- // Wait for them all to finish.
- success := true
- // TODO(a-robinson): Change to `for range` syntax and remove logging once we
- // support only Go >= 1.4.
- for _, podName := range podNames {
- if !<-result {
- Logf("Pod %[1]s failed to be %[2]s.", podName, desc)
- success = false
- }
- }
- Logf("Wanted all %d pods to be %s. Result: %t. Pods: %v", np, desc, success, podNames)
- return success
- }
- // WaitForNodeToBeReady returns whether node name is ready within timeout.
- func WaitForNodeToBeReady(c *client.Client, name string, timeout time.Duration) bool {
- return WaitForNodeToBe(c, name, api.NodeReady, true, timeout)
- }
- // WaitForNodeToBeNotReady returns whether node name is not ready (i.e. the
- // readiness condition is anything but ready, e.g false or unknown) within
- // timeout.
- func WaitForNodeToBeNotReady(c *client.Client, name string, timeout time.Duration) bool {
- return WaitForNodeToBe(c, name, api.NodeReady, false, timeout)
- }
- func isNodeConditionSetAsExpected(node *api.Node, conditionType api.NodeConditionType, wantTrue, silent bool) bool {
- // Check the node readiness condition (logging all).
- for _, cond := range node.Status.Conditions {
- // Ensure that the condition type and the status matches as desired.
- if cond.Type == conditionType {
- if (cond.Status == api.ConditionTrue) == wantTrue {
- return true
- } else {
- if !silent {
- Logf("Condition %s of node %s is %v instead of %t. Reason: %v, message: %v",
- conditionType, node.Name, cond.Status == api.ConditionTrue, wantTrue, cond.Reason, cond.Message)
- }
- return false
- }
- }
- }
- if !silent {
- Logf("Couldn't find condition %v on node %v", conditionType, node.Name)
- }
- return false
- }
- func IsNodeConditionSetAsExpected(node *api.Node, conditionType api.NodeConditionType, wantTrue bool) bool {
- return isNodeConditionSetAsExpected(node, conditionType, wantTrue, false)
- }
- func IsNodeConditionSetAsExpectedSilent(node *api.Node, conditionType api.NodeConditionType, wantTrue bool) bool {
- return isNodeConditionSetAsExpected(node, conditionType, wantTrue, true)
- }
- func IsNodeConditionUnset(node *api.Node, conditionType api.NodeConditionType) bool {
- for _, cond := range node.Status.Conditions {
- if cond.Type == conditionType {
- return false
- }
- }
- return true
- }
- // WaitForNodeToBe returns whether node "name's" condition state matches wantTrue
- // within timeout. If wantTrue is true, it will ensure the node condition status
- // is ConditionTrue; if it's false, it ensures the node condition is in any state
- // other than ConditionTrue (e.g. not true or unknown).
- func WaitForNodeToBe(c *client.Client, name string, conditionType api.NodeConditionType, wantTrue bool, timeout time.Duration) bool {
- Logf("Waiting up to %v for node %s condition %s to be %t", timeout, name, conditionType, wantTrue)
- for start := time.Now(); time.Since(start) < timeout; time.Sleep(Poll) {
- node, err := c.Nodes().Get(name)
- if err != nil {
- Logf("Couldn't get node %s", name)
- continue
- }
- if IsNodeConditionSetAsExpected(node, conditionType, wantTrue) {
- return true
- }
- }
- Logf("Node %s didn't reach desired %s condition status (%t) within %v", name, conditionType, wantTrue, timeout)
- return false
- }
- // Checks whether all registered nodes are ready.
- // TODO: we should change the AllNodesReady call in AfterEach to WaitForAllNodesHealthy,
- // and figure out how to do it in a configurable way, as we can't expect all setups to run
- // default test add-ons.
- func AllNodesReady(c *client.Client, timeout time.Duration) error {
- Logf("Waiting up to %v for all nodes to be ready", timeout)
- var notReady []api.Node
- err := wait.PollImmediate(Poll, timeout, func() (bool, error) {
- notReady = nil
- // It should be OK to list unschedulable Nodes here.
- nodes, err := c.Nodes().List(api.ListOptions{})
- if err != nil {
- return false, err
- }
- for _, node := range nodes.Items {
- if !IsNodeConditionSetAsExpected(&node, api.NodeReady, true) {
- notReady = append(notReady, node)
- }
- }
- return len(notReady) == 0, nil
- })
- if err != nil && err != wait.ErrWaitTimeout {
- return err
- }
- if len(notReady) > 0 {
- return fmt.Errorf("Not ready nodes: %v", notReady)
- }
- return nil
- }
- // checks whether all registered nodes are ready and all required Pods are running on them.
- func WaitForAllNodesHealthy(c *client.Client, timeout time.Duration) error {
- Logf("Waiting up to %v for all nodes to be ready", timeout)
- var notReady []api.Node
- var missingPodsPerNode map[string][]string
- err := wait.PollImmediate(Poll, timeout, func() (bool, error) {
- notReady = nil
- // It should be OK to list unschedulable Nodes here.
- nodes, err := c.Nodes().List(api.ListOptions{ResourceVersion: "0"})
- if err != nil {
- return false, err
- }
- for _, node := range nodes.Items {
- if !IsNodeConditionSetAsExpected(&node, api.NodeReady, true) {
- notReady = append(notReady, node)
- }
- }
- pods, err := c.Pods(api.NamespaceAll).List(api.ListOptions{ResourceVersion: "0"})
- if err != nil {
- return false, err
- }
- systemPodsPerNode := make(map[string][]string)
- for _, pod := range pods.Items {
- if pod.Namespace == api.NamespaceSystem && pod.Status.Phase == api.PodRunning {
- if pod.Spec.NodeName != "" {
- systemPodsPerNode[pod.Spec.NodeName] = append(systemPodsPerNode[pod.Spec.NodeName], pod.Name)
- }
- }
- }
- missingPodsPerNode = make(map[string][]string)
- for _, node := range nodes.Items {
- if !system.IsMasterNode(&node) {
- for _, requiredPod := range requiredPerNodePods {
- foundRequired := false
- for _, presentPod := range systemPodsPerNode[node.Name] {
- if requiredPod.MatchString(presentPod) {
- foundRequired = true
- break
- }
- }
- if !foundRequired {
- missingPodsPerNode[node.Name] = append(missingPodsPerNode[node.Name], requiredPod.String())
- }
- }
- }
- }
- return len(notReady) == 0 && len(missingPodsPerNode) == 0, nil
- })
- if err != nil && err != wait.ErrWaitTimeout {
- return err
- }
- if len(notReady) > 0 {
- return fmt.Errorf("Not ready nodes: %v", notReady)
- }
- if len(missingPodsPerNode) > 0 {
- return fmt.Errorf("Not running system Pods: %v", missingPodsPerNode)
- }
- return nil
- }
- // Filters nodes in NodeList in place, removing nodes that do not
- // satisfy the given condition
- // TODO: consider merging with pkg/client/cache.NodeLister
- func FilterNodes(nodeList *api.NodeList, fn func(node api.Node) bool) {
- var l []api.Node
- for _, node := range nodeList.Items {
- if fn(node) {
- l = append(l, node)
- }
- }
- nodeList.Items = l
- }
// ParseKVLines scans output line by line for a line of the form "<key>:<val>"
// and returns <val> with surrounding whitespace trimmed for the first line
// whose text up to the first ':' is exactly key. It returns the empty string
// when no line matches.
func ParseKVLines(output, key string) string {
	const delim = ":"
	want := key + delim
	for _, line := range strings.Split(output, "\n") {
		idx := strings.Index(line, delim)
		if idx < 0 {
			// No delimiter on this line, so it cannot be a key/value pair.
			continue
		}
		split := idx + len(delim)
		if line[:split] == want {
			return strings.TrimSpace(line[split:])
		}
	}
	return ""
}
- func RestartKubeProxy(host string) error {
- // TODO: Make it work for all providers.
- if !ProviderIs("gce", "gke", "aws") {
- return fmt.Errorf("unsupported provider: %s", TestContext.Provider)
- }
- // kubelet will restart the kube-proxy since it's running in a static pod
- result, err := SSH("sudo pkill kube-proxy", host, TestContext.Provider)
- if err != nil || result.Code != 0 {
- LogSSHResult(result)
- return fmt.Errorf("couldn't restart kube-proxy: %v", err)
- }
- // wait for kube-proxy to come back up
- err = wait.Poll(5*time.Second, 60*time.Second, func() (bool, error) {
- result, err := SSH("sudo /bin/sh -c 'pgrep kube-proxy | wc -l'", host, TestContext.Provider)
- if err != nil {
- return false, err
- }
- if result.Code != 0 {
- LogSSHResult(result)
- return false, fmt.Errorf("failed to run command, exited %d", result.Code)
- }
- if result.Stdout == "0\n" {
- return false, nil
- }
- Logf("kube-proxy is back up.")
- return true, nil
- })
- if err != nil {
- return fmt.Errorf("kube-proxy didn't recover: %v", err)
- }
- return nil
- }
- func RestartApiserver(c *client.Client) error {
- // TODO: Make it work for all providers.
- if !ProviderIs("gce", "gke", "aws") {
- return fmt.Errorf("unsupported provider: %s", TestContext.Provider)
- }
- if ProviderIs("gce", "aws") {
- return sshRestartMaster()
- }
- // GKE doesn't allow ssh access, so use a same-version master
- // upgrade to teardown/recreate master.
- v, err := c.ServerVersion()
- if err != nil {
- return err
- }
- return masterUpgradeGKE(v.GitVersion[1:]) // strip leading 'v'
- }
- func sshRestartMaster() error {
- if !ProviderIs("gce", "aws") {
- return fmt.Errorf("unsupported provider: %s", TestContext.Provider)
- }
- var command string
- if ProviderIs("gce") {
- command = "sudo docker ps | grep /kube-apiserver | cut -d ' ' -f 1 | xargs sudo docker kill"
- } else {
- command = "sudo /etc/init.d/kube-apiserver restart"
- }
- result, err := SSH(command, GetMasterHost()+":22", TestContext.Provider)
- if err != nil || result.Code != 0 {
- LogSSHResult(result)
- return fmt.Errorf("couldn't restart apiserver: %v", err)
- }
- return nil
- }
- func WaitForApiserverUp(c *client.Client) error {
- for start := time.Now(); time.Since(start) < time.Minute; time.Sleep(5 * time.Second) {
- body, err := c.Get().AbsPath("/healthz").Do().Raw()
- if err == nil && string(body) == "ok" {
- return nil
- }
- }
- return fmt.Errorf("waiting for apiserver timed out")
- }
- // WaitForClusterSize waits until the cluster has desired size and there is no not-ready nodes in it.
- // By cluster size we mean number of Nodes excluding Master Node.
- func WaitForClusterSize(c *client.Client, size int, timeout time.Duration) error {
- for start := time.Now(); time.Since(start) < timeout; time.Sleep(20 * time.Second) {
- nodes, err := c.Nodes().List(api.ListOptions{FieldSelector: fields.Set{
- "spec.unschedulable": "false",
- }.AsSelector()})
- if err != nil {
- Logf("Failed to list nodes: %v", err)
- continue
- }
- numNodes := len(nodes.Items)
- // Filter out not-ready nodes.
- FilterNodes(nodes, func(node api.Node) bool {
- return IsNodeConditionSetAsExpected(&node, api.NodeReady, true)
- })
- numReady := len(nodes.Items)
- if numNodes == size && numReady == size {
- Logf("Cluster has reached the desired size %d", size)
- return nil
- }
- Logf("Waiting for cluster size %d, current size %d, not ready nodes %d", size, numNodes, numNodes-numReady)
- }
- return fmt.Errorf("timeout waiting %v for cluster size to be %d", timeout, size)
- }
- // GetHostExternalAddress gets the node for a pod and returns the first External
- // address. Returns an error if the node the pod is on doesn't have an External
- // address.
- func GetHostExternalAddress(client *client.Client, p *api.Pod) (externalAddress string, err error) {
- node, err := client.Nodes().Get(p.Spec.NodeName)
- if err != nil {
- return "", err
- }
- for _, address := range node.Status.Addresses {
- if address.Type == api.NodeExternalIP {
- if address.Address != "" {
- externalAddress = address.Address
- break
- }
- }
- }
- if externalAddress == "" {
- err = fmt.Errorf("No external address for pod %v on node %v",
- p.Name, p.Spec.NodeName)
- }
- return
- }
// extractRT is a stub round tripper that records the headers of the request
// it is given instead of sending it anywhere.
type extractRT struct {
	http.Header
}

// RoundTrip stores req's headers on rt and answers with an empty response and
// a nil error; no network traffic takes place.
func (rt *extractRT) RoundTrip(req *http.Request) (*http.Response, error) {
	rt.Header = req.Header
	return new(http.Response), nil
}
- // headersForConfig extracts any http client logic necessary for the provided
- // config.
- func headersForConfig(c *restclient.Config) (http.Header, error) {
- extract := &extractRT{}
- rt, err := restclient.HTTPWrappersForConfig(c, extract)
- if err != nil {
- return nil, err
- }
- if _, err := rt.RoundTrip(&http.Request{}); err != nil {
- return nil, err
- }
- return extract.Header, nil
- }
- // OpenWebSocketForURL constructs a websocket connection to the provided URL, using the client
- // config, with the specified protocols.
- func OpenWebSocketForURL(url *url.URL, config *restclient.Config, protocols []string) (*websocket.Conn, error) {
- tlsConfig, err := restclient.TLSConfigFor(config)
- if err != nil {
- return nil, fmt.Errorf("failed to create tls config: %v", err)
- }
- if tlsConfig != nil {
- url.Scheme = "wss"
- if !strings.Contains(url.Host, ":") {
- url.Host += ":443"
- }
- } else {
- url.Scheme = "ws"
- if !strings.Contains(url.Host, ":") {
- url.Host += ":80"
- }
- }
- headers, err := headersForConfig(config)
- if err != nil {
- return nil, fmt.Errorf("failed to load http headers: %v", err)
- }
- cfg, err := websocket.NewConfig(url.String(), "http://localhost")
- if err != nil {
- return nil, fmt.Errorf("failed to create websocket config: %v", err)
- }
- cfg.Header = headers
- cfg.TlsConfig = tlsConfig
- cfg.Protocol = protocols
- return websocket.DialConfig(cfg)
- }
- // getIngressAddress returns the ips/hostnames associated with the Ingress.
- func getIngressAddress(client *client.Client, ns, name string) ([]string, error) {
- ing, err := client.Extensions().Ingress(ns).Get(name)
- if err != nil {
- return nil, err
- }
- addresses := []string{}
- for _, a := range ing.Status.LoadBalancer.Ingress {
- if a.IP != "" {
- addresses = append(addresses, a.IP)
- }
- if a.Hostname != "" {
- addresses = append(addresses, a.Hostname)
- }
- }
- return addresses, nil
- }
- // WaitForIngressAddress waits for the Ingress to acquire an address.
- func WaitForIngressAddress(c *client.Client, ns, ingName string, timeout time.Duration) (string, error) {
- var address string
- err := wait.PollImmediate(10*time.Second, timeout, func() (bool, error) {
- ipOrNameList, err := getIngressAddress(c, ns, ingName)
- if err != nil || len(ipOrNameList) == 0 {
- Logf("Waiting for Ingress %v to acquire IP, error %v", ingName, err)
- return false, nil
- }
- address = ipOrNameList[0]
- return true, nil
- })
- return address, err
- }
- // Looks for the given string in the log of a specific pod container
- func LookForStringInLog(ns, podName, container, expectedString string, timeout time.Duration) (result string, err error) {
- return LookForString(expectedString, timeout, func() string {
- return RunKubectlOrDie("logs", podName, container, fmt.Sprintf("--namespace=%v", ns))
- })
- }
- // Looks for the given string in a file in a specific pod container
- func LookForStringInFile(ns, podName, container, file, expectedString string, timeout time.Duration) (result string, err error) {
- return LookForString(expectedString, timeout, func() string {
- return RunKubectlOrDie("exec", podName, "-c", container, fmt.Sprintf("--namespace=%v", ns), "--", "cat", file)
- })
- }
- // Looks for the given string in the output of a command executed in a specific pod container
- func LookForStringInPodExec(ns, podName string, command []string, expectedString string, timeout time.Duration) (result string, err error) {
- return LookForString(expectedString, timeout, func() string {
- // use the first container
- args := []string{"exec", podName, fmt.Sprintf("--namespace=%v", ns), "--"}
- args = append(args, command...)
- return RunKubectlOrDie(args...)
- })
- }
- // Looks for the given string in the output of fn, repeatedly calling fn until
- // the timeout is reached or the string is found. Returns last log and possibly
- // error if the string was not found.
- func LookForString(expectedString string, timeout time.Duration, fn func() string) (result string, err error) {
- for t := time.Now(); time.Since(t) < timeout; time.Sleep(Poll) {
- result = fn()
- if strings.Contains(result, expectedString) {
- return
- }
- }
- err = fmt.Errorf("Failed to find \"%s\", last result: \"%s\"", expectedString, result)
- return
- }
- // getSvcNodePort returns the node port for the given service:port.
- func getSvcNodePort(client *client.Client, ns, name string, svcPort int) (int, error) {
- svc, err := client.Services(ns).Get(name)
- if err != nil {
- return 0, err
- }
- for _, p := range svc.Spec.Ports {
- if p.Port == int32(svcPort) {
- if p.NodePort != 0 {
- return int(p.NodePort), nil
- }
- }
- }
- return 0, fmt.Errorf(
- "No node port found for service %v, port %v", name, svcPort)
- }
- // GetNodePortURL returns the url to a nodeport Service.
- func GetNodePortURL(client *client.Client, ns, name string, svcPort int) (string, error) {
- nodePort, err := getSvcNodePort(client, ns, name, svcPort)
- if err != nil {
- return "", err
- }
- // This list of nodes must not include the master, which is marked
- // unschedulable, since the master doesn't run kube-proxy. Without
- // kube-proxy NodePorts won't work.
- var nodes *api.NodeList
- if wait.PollImmediate(Poll, SingleCallTimeout, func() (bool, error) {
- nodes, err = client.Nodes().List(api.ListOptions{FieldSelector: fields.Set{
- "spec.unschedulable": "false",
- }.AsSelector()})
- return err == nil, nil
- }) != nil {
- return "", err
- }
- if len(nodes.Items) == 0 {
- return "", fmt.Errorf("Unable to list nodes in cluster.")
- }
- for _, node := range nodes.Items {
- for _, address := range node.Status.Addresses {
- if address.Type == api.NodeExternalIP {
- if address.Address != "" {
- return fmt.Sprintf("http://%v:%v", address.Address, nodePort), nil
- }
- }
- }
- }
- return "", fmt.Errorf("Failed to find external address for service %v", name)
- }
- // ScaleRCByLabels scales an RC via ns/label lookup. If replicas == 0 it waits till
- // none are running, otherwise it does what a synchronous scale operation would do.
- func ScaleRCByLabels(client *client.Client, ns string, l map[string]string, replicas uint) error {
- listOpts := api.ListOptions{LabelSelector: labels.SelectorFromSet(labels.Set(l))}
- rcs, err := client.ReplicationControllers(ns).List(listOpts)
- if err != nil {
- return err
- }
- if len(rcs.Items) == 0 {
- return fmt.Errorf("RC with labels %v not found in ns %v", l, ns)
- }
- Logf("Scaling %v RCs with labels %v in ns %v to %v replicas.", len(rcs.Items), l, ns, replicas)
- for _, labelRC := range rcs.Items {
- name := labelRC.Name
- if err := ScaleRC(client, ns, name, replicas, false); err != nil {
- return err
- }
- rc, err := client.ReplicationControllers(ns).Get(name)
- if err != nil {
- return err
- }
- if replicas == 0 {
- ps, err := podStoreForRC(client, rc)
- if err != nil {
- return err
- }
- defer ps.Stop()
- if err = waitForPodsGone(ps, 10*time.Second, 10*time.Minute); err != nil {
- return fmt.Errorf("error while waiting for pods gone %s: %v", name, err)
- }
- } else {
- if err := WaitForPodsWithLabelRunning(
- client, ns, labels.SelectorFromSet(labels.Set(rc.Spec.Selector))); err != nil {
- return err
- }
- }
- }
- return nil
- }
- // TODO(random-liu): Change this to be a member function of the framework.
- func GetPodLogs(c *client.Client, namespace, podName, containerName string) (string, error) {
- return getPodLogsInternal(c, namespace, podName, containerName, false)
- }
- func getPreviousPodLogs(c *client.Client, namespace, podName, containerName string) (string, error) {
- return getPodLogsInternal(c, namespace, podName, containerName, true)
- }
- // utility function for gomega Eventually
- func getPodLogsInternal(c *client.Client, namespace, podName, containerName string, previous bool) (string, error) {
- logs, err := c.Get().
- Resource("pods").
- Namespace(namespace).
- Name(podName).SubResource("log").
- Param("container", containerName).
- Param("previous", strconv.FormatBool(previous)).
- Do().
- Raw()
- if err != nil {
- return "", err
- }
- if err == nil && strings.Contains(string(logs), "Internal Error") {
- return "", fmt.Errorf("Fetched log contains \"Internal Error\": %q.", string(logs))
- }
- return string(logs), err
- }
- // EnsureLoadBalancerResourcesDeleted ensures that cloud load balancer resources that were created
- // are actually cleaned up. Currently only implemented for GCE/GKE.
- func EnsureLoadBalancerResourcesDeleted(ip, portRange string) error {
- if TestContext.Provider == "gce" || TestContext.Provider == "gke" {
- return ensureGCELoadBalancerResourcesDeleted(ip, portRange)
- }
- return nil
- }
- func ensureGCELoadBalancerResourcesDeleted(ip, portRange string) error {
- gceCloud, ok := TestContext.CloudConfig.Provider.(*gcecloud.GCECloud)
- if !ok {
- return fmt.Errorf("failed to convert CloudConfig.Provider to GCECloud: %#v", TestContext.CloudConfig.Provider)
- }
- project := TestContext.CloudConfig.ProjectID
- region, err := gcecloud.GetGCERegion(TestContext.CloudConfig.Zone)
- if err != nil {
- return fmt.Errorf("could not get region for zone %q: %v", TestContext.CloudConfig.Zone, err)
- }
- return wait.Poll(10*time.Second, 5*time.Minute, func() (bool, error) {
- service := gceCloud.GetComputeService()
- list, err := service.ForwardingRules.List(project, region).Do()
- if err != nil {
- return false, err
- }
- for ix := range list.Items {
- item := list.Items[ix]
- if item.PortRange == portRange && item.IPAddress == ip {
- Logf("found a load balancer: %v", item)
- return false, nil
- }
- }
- return true, nil
- })
- }
- // The following helper functions can block/unblock network from source
- // host to destination host by manipulating iptable rules.
- // This function assumes it can ssh to the source host.
- //
- // Caution:
- // Recommend to input IP instead of hostnames. Using hostnames will cause iptables to
- // do a DNS lookup to resolve the name to an IP address, which will
- // slow down the test and cause it to fail if DNS is absent or broken.
- //
- // Suggested usage pattern:
- // func foo() {
- // ...
- // defer UnblockNetwork(from, to)
- // BlockNetwork(from, to)
- // ...
- // }
- //
- func BlockNetwork(from string, to string) {
- Logf("block network traffic from %s to %s", from, to)
- iptablesRule := fmt.Sprintf("OUTPUT --destination %s --jump REJECT", to)
- dropCmd := fmt.Sprintf("sudo iptables --insert %s", iptablesRule)
- if result, err := SSH(dropCmd, from, TestContext.Provider); result.Code != 0 || err != nil {
- LogSSHResult(result)
- Failf("Unexpected error: %v", err)
- }
- }
- func UnblockNetwork(from string, to string) {
- Logf("Unblock network traffic from %s to %s", from, to)
- iptablesRule := fmt.Sprintf("OUTPUT --destination %s --jump REJECT", to)
- undropCmd := fmt.Sprintf("sudo iptables --delete %s", iptablesRule)
- // Undrop command may fail if the rule has never been created.
- // In such case we just lose 30 seconds, but the cluster is healthy.
- // But if the rule had been created and removing it failed, the node is broken and
- // not coming back. Subsequent tests will run or fewer nodes (some of the tests
- // may fail). Manual intervention is required in such case (recreating the
- // cluster solves the problem too).
- err := wait.Poll(time.Millisecond*100, time.Second*30, func() (bool, error) {
- result, err := SSH(undropCmd, from, TestContext.Provider)
- if result.Code == 0 && err == nil {
- return true, nil
- }
- LogSSHResult(result)
- if err != nil {
- Logf("Unexpected error: %v", err)
- }
- return false, nil
- })
- if err != nil {
- Failf("Failed to remove the iptable REJECT rule. Manual intervention is "+
- "required on host %s: remove rule %s, if exists", from, iptablesRule)
- }
- }
- func isElementOf(podUID types.UID, pods *api.PodList) bool {
- for _, pod := range pods.Items {
- if pod.UID == podUID {
- return true
- }
- }
- return false
- }
- func CheckRSHashLabel(rs *extensions.ReplicaSet) error {
- if len(rs.Labels[extensions.DefaultDeploymentUniqueLabelKey]) == 0 ||
- len(rs.Spec.Selector.MatchLabels[extensions.DefaultDeploymentUniqueLabelKey]) == 0 ||
- len(rs.Spec.Template.Labels[extensions.DefaultDeploymentUniqueLabelKey]) == 0 {
- return fmt.Errorf("unexpected RS missing required pod-hash-template: %+v, selector = %+v, template = %+v", rs, rs.Spec.Selector, rs.Spec.Template)
- }
- return nil
- }
- func CheckPodHashLabel(pods *api.PodList) error {
- invalidPod := ""
- for _, pod := range pods.Items {
- if len(pod.Labels[extensions.DefaultDeploymentUniqueLabelKey]) == 0 {
- if len(invalidPod) == 0 {
- invalidPod = "unexpected pods missing required pod-hash-template:"
- }
- invalidPod = fmt.Sprintf("%s %+v;", invalidPod, pod)
- }
- }
- if len(invalidPod) > 0 {
- return fmt.Errorf("%s", invalidPod)
- }
- return nil
- }
- // timeout for proxy requests.
- const proxyTimeout = 2 * time.Minute
- // NodeProxyRequest performs a get on a node proxy endpoint given the nodename and rest client.
- func NodeProxyRequest(c *client.Client, node, endpoint string) (restclient.Result, error) {
- // proxy tends to hang in some cases when Node is not ready. Add an artificial timeout for this call.
- // This will leak a goroutine if proxy hangs. #22165
- subResourceProxyAvailable, err := ServerVersionGTE(subResourceServiceAndNodeProxyVersion, c)
- if err != nil {
- return restclient.Result{}, err
- }
- var result restclient.Result
- finished := make(chan struct{})
- go func() {
- if subResourceProxyAvailable {
- result = c.Get().
- Resource("nodes").
- SubResource("proxy").
- Name(fmt.Sprintf("%v:%v", node, ports.KubeletPort)).
- Suffix(endpoint).
- Do()
- } else {
- result = c.Get().
- Prefix("proxy").
- Resource("nodes").
- Name(fmt.Sprintf("%v:%v", node, ports.KubeletPort)).
- Suffix(endpoint).
- Do()
- }
- finished <- struct{}{}
- }()
- select {
- case <-finished:
- return result, nil
- case <-time.After(proxyTimeout):
- return restclient.Result{}, nil
- }
- }
- // GetKubeletPods retrieves the list of pods on the kubelet
- func GetKubeletPods(c *client.Client, node string) (*api.PodList, error) {
- return getKubeletPods(c, node, "pods")
- }
- // GetKubeletRunningPods retrieves the list of running pods on the kubelet. The pods
- // includes necessary information (e.g., UID, name, namespace for
- // pods/containers), but do not contain the full spec.
- func GetKubeletRunningPods(c *client.Client, node string) (*api.PodList, error) {
- return getKubeletPods(c, node, "runningpods")
- }
- func getKubeletPods(c *client.Client, node, resource string) (*api.PodList, error) {
- result := &api.PodList{}
- client, err := NodeProxyRequest(c, node, resource)
- if err != nil {
- return &api.PodList{}, err
- }
- if err = client.Into(result); err != nil {
- return &api.PodList{}, err
- }
- return result, nil
- }
- // LaunchWebserverPod launches a pod serving http on port 8080 to act
- // as the target for networking connectivity checks. The ip address
- // of the created pod will be returned if the pod is launched
- // successfully.
- func LaunchWebserverPod(f *Framework, podName, nodeName string) (ip string) {
- containerName := fmt.Sprintf("%s-container", podName)
- port := 8080
- pod := &api.Pod{
- ObjectMeta: api.ObjectMeta{
- Name: podName,
- },
- Spec: api.PodSpec{
- Containers: []api.Container{
- {
- Name: containerName,
- Image: "gcr.io/google_containers/porter:cd5cb5791ebaa8641955f0e8c2a9bed669b1eaab",
- Env: []api.EnvVar{{Name: fmt.Sprintf("SERVE_PORT_%d", port), Value: "foo"}},
- Ports: []api.ContainerPort{{ContainerPort: int32(port)}},
- },
- },
- NodeName: nodeName,
- RestartPolicy: api.RestartPolicyNever,
- },
- }
- podClient := f.Client.Pods(f.Namespace.Name)
- _, err := podClient.Create(pod)
- ExpectNoError(err)
- ExpectNoError(f.WaitForPodRunning(podName))
- createdPod, err := podClient.Get(podName)
- ExpectNoError(err)
- ip = fmt.Sprintf("%s:%d", createdPod.Status.PodIP, port)
- Logf("Target pod IP:port is %s", ip)
- return
- }
- // CheckConnectivityToHost launches a pod running wget on the
- // specified node to test connectivity to the specified host. An
- // error will be returned if the host is not reachable from the pod.
- func CheckConnectivityToHost(f *Framework, nodeName, podName, host string, timeout int) error {
- contName := fmt.Sprintf("%s-container", podName)
- pod := &api.Pod{
- ObjectMeta: api.ObjectMeta{
- Name: podName,
- },
- Spec: api.PodSpec{
- Containers: []api.Container{
- {
- Name: contName,
- Image: "gcr.io/google_containers/busybox:1.24",
- Command: []string{"wget", fmt.Sprintf("--timeout=%d", timeout), "-s", host},
- },
- },
- NodeName: nodeName,
- RestartPolicy: api.RestartPolicyNever,
- },
- }
- podClient := f.Client.Pods(f.Namespace.Name)
- _, err := podClient.Create(pod)
- if err != nil {
- return err
- }
- defer podClient.Delete(podName, nil)
- err = WaitForPodSuccessInNamespace(f.Client, podName, contName, f.Namespace.Name)
- if err != nil {
- logs, logErr := GetPodLogs(f.Client, f.Namespace.Name, pod.Name, contName)
- if logErr != nil {
- Logf("Warning: Failed to get logs from pod %q: %v", pod.Name, logErr)
- } else {
- Logf("pod %s/%s \"wget\" logs:\n%s", f.Namespace.Name, pod.Name, logs)
- }
- }
- return err
- }
- // CoreDump SSHs to the master and all nodes and dumps their logs into dir.
- // It shells out to cluster/log-dump.sh to accomplish this.
- func CoreDump(dir string) {
- cmd := exec.Command(path.Join(TestContext.RepoRoot, "cluster", "log-dump.sh"), dir)
- cmd.Stdout = os.Stdout
- cmd.Stderr = os.Stderr
- if err := cmd.Run(); err != nil {
- Logf("Error running cluster/log-dump.sh: %v", err)
- }
- }
- func UpdatePodWithRetries(client *client.Client, ns, name string, update func(*api.Pod)) (*api.Pod, error) {
- for i := 0; i < 3; i++ {
- pod, err := client.Pods(ns).Get(name)
- if err != nil {
- return nil, fmt.Errorf("Failed to get pod %q: %v", name, err)
- }
- update(pod)
- pod, err = client.Pods(ns).Update(pod)
- if err == nil {
- return pod, nil
- }
- if !apierrs.IsConflict(err) && !apierrs.IsServerTimeout(err) {
- return nil, fmt.Errorf("Failed to update pod %q: %v", name, err)
- }
- }
- return nil, fmt.Errorf("Too many retries updating Pod %q", name)
- }
- func GetPodsInNamespace(c *client.Client, ns string, ignoreLabels map[string]string) ([]*api.Pod, error) {
- pods, err := c.Pods(ns).List(api.ListOptions{})
- if err != nil {
- return []*api.Pod{}, err
- }
- ignoreSelector := labels.SelectorFromSet(ignoreLabels)
- filtered := []*api.Pod{}
- for _, p := range pods.Items {
- if len(ignoreLabels) != 0 && ignoreSelector.Matches(labels.Set(p.Labels)) {
- continue
- }
- filtered = append(filtered, &p)
- }
- return filtered, nil
- }
- // RunCmd runs cmd using args and returns its stdout and stderr. It also outputs
- // cmd's stdout and stderr to their respective OS streams.
- func RunCmd(command string, args ...string) (string, string, error) {
- Logf("Running %s %v", command, args)
- var bout, berr bytes.Buffer
- cmd := exec.Command(command, args...)
- // We also output to the OS stdout/stderr to aid in debugging in case cmd
- // hangs and never returns before the test gets killed.
- //
- // This creates some ugly output because gcloud doesn't always provide
- // newlines.
- cmd.Stdout = io.MultiWriter(os.Stdout, &bout)
- cmd.Stderr = io.MultiWriter(os.Stderr, &berr)
- err := cmd.Run()
- stdout, stderr := bout.String(), berr.String()
- if err != nil {
- return "", "", fmt.Errorf("error running %s %v; got error %v, stdout %q, stderr %q",
- command, args, err, stdout, stderr)
- }
- return stdout, stderr, nil
- }
- // retryCmd runs cmd using args and retries it for up to SingleCallTimeout if
- // it returns an error. It returns stdout and stderr.
- func retryCmd(command string, args ...string) (string, string, error) {
- var err error
- stdout, stderr := "", ""
- wait.Poll(Poll, SingleCallTimeout, func() (bool, error) {
- stdout, stderr, err = RunCmd(command, args...)
- if err != nil {
- Logf("Got %v", err)
- return false, nil
- }
- return true, nil
- })
- return stdout, stderr, err
- }
- // GetPodsScheduled returns a number of currently scheduled and not scheduled Pods.
- func GetPodsScheduled(masterNodes sets.String, pods *api.PodList) (scheduledPods, notScheduledPods []api.Pod) {
- for _, pod := range pods.Items {
- if !masterNodes.Has(pod.Spec.NodeName) {
- if pod.Spec.NodeName != "" {
- _, scheduledCondition := api.GetPodCondition(&pod.Status, api.PodScheduled)
- Expect(scheduledCondition != nil).To(Equal(true))
- Expect(scheduledCondition.Status).To(Equal(api.ConditionTrue))
- scheduledPods = append(scheduledPods, pod)
- } else {
- _, scheduledCondition := api.GetPodCondition(&pod.Status, api.PodScheduled)
- Expect(scheduledCondition != nil).To(Equal(true))
- Expect(scheduledCondition.Status).To(Equal(api.ConditionFalse))
- if scheduledCondition.Reason == "Unschedulable" {
- notScheduledPods = append(notScheduledPods, pod)
- }
- }
- }
- }
- return
- }
- // WaitForStableCluster waits until all existing pods are scheduled and returns their amount.
- func WaitForStableCluster(c *client.Client, masterNodes sets.String) int {
- timeout := 10 * time.Minute
- startTime := time.Now()
- allPods, err := c.Pods(api.NamespaceAll).List(api.ListOptions{})
- ExpectNoError(err)
- // API server returns also Pods that succeeded. We need to filter them out.
- currentPods := make([]api.Pod, 0, len(allPods.Items))
- for _, pod := range allPods.Items {
- if pod.Status.Phase != api.PodSucceeded && pod.Status.Phase != api.PodFailed {
- currentPods = append(currentPods, pod)
- }
- }
- allPods.Items = currentPods
- scheduledPods, currentlyNotScheduledPods := GetPodsScheduled(masterNodes, allPods)
- for len(currentlyNotScheduledPods) != 0 {
- time.Sleep(2 * time.Second)
- allPods, err := c.Pods(api.NamespaceAll).List(api.ListOptions{})
- ExpectNoError(err)
- scheduledPods, currentlyNotScheduledPods = GetPodsScheduled(masterNodes, allPods)
- if startTime.Add(timeout).Before(time.Now()) {
- Failf("Timed out after %v waiting for stable cluster.", timeout)
- break
- }
- }
- return len(scheduledPods)
- }
- // GetMasterAndWorkerNodesOrDie will return a list masters and schedulable worker nodes
- func GetMasterAndWorkerNodesOrDie(c *client.Client) (sets.String, *api.NodeList) {
- nodes := &api.NodeList{}
- masters := sets.NewString()
- all, _ := c.Nodes().List(api.ListOptions{})
- for _, n := range all.Items {
- if system.IsMasterNode(&n) {
- masters.Insert(n.Name)
- } else if isNodeSchedulable(&n) {
- nodes.Items = append(nodes.Items, n)
- }
- }
- return masters, nodes
- }
- func CreateFileForGoBinData(gobindataPath, outputFilename string) error {
- data := ReadOrDie(gobindataPath)
- if len(data) == 0 {
- return fmt.Errorf("Failed to read gobindata from %v", gobindataPath)
- }
- fullPath := filepath.Join(TestContext.OutputDir, outputFilename)
- err := os.MkdirAll(filepath.Dir(fullPath), 0777)
- if err != nil {
- return fmt.Errorf("Error while creating directory %v: %v", filepath.Dir(fullPath), err)
- }
- err = ioutil.WriteFile(fullPath, data, 0644)
- if err != nil {
- return fmt.Errorf("Error while trying to write to file %v: %v", fullPath, err)
- }
- return nil
- }
|