// etcd.go (9.6 KB)
  1. // Copyright 2015 CoreOS, Inc.
  2. //
  3. // Licensed under the Apache License, Version 2.0 (the "License");
  4. // you may not use this file except in compliance with the License.
  5. // You may obtain a copy of the License at
  6. //
  7. // http://www.apache.org/licenses/LICENSE-2.0
  8. //
  9. // Unless required by applicable law or agreed to in writing, software
  10. // distributed under the License is distributed on an "AS IS" BASIS,
  11. // WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
  12. // See the License for the specific language governing permissions and
  13. // limitations under the License.
  14. package subnet
  15. import (
  16. "encoding/json"
  17. "errors"
  18. "fmt"
  19. "net"
  20. "regexp"
  21. "strconv"
  22. "time"
  23. "github.com/coreos/flannel/Godeps/_workspace/src/github.com/coreos/go-etcd/etcd"
  24. log "github.com/coreos/flannel/Godeps/_workspace/src/github.com/golang/glog"
  25. "github.com/coreos/flannel/Godeps/_workspace/src/golang.org/x/net/context"
  26. "github.com/coreos/flannel/pkg/ip"
  27. )
  // Lease acquisition tunables.
  const (
  	// registerRetries caps how many times acquireLeaseOnce calls
  	// tryAcquireLease before giving up.
  	registerRetries = 10

  	// subnetTTL is the TTL value passed to the registry whenever a subnet
  	// lease is created or updated. NOTE(review): presumably expressed in
  	// seconds (24 hours) -- confirm against the Registry implementation.
  	subnetTTL = 24 * 60 * 60
  )
  // Error codes reported by etcd; they are compared against the ErrorCode
  // field of *etcd.EtcdError values returned by the registry.
  const (
  	// etcdKeyNotFound: getLeases treats it as "no leases yet".
  	etcdKeyNotFound = 100

  	// etcdKeyAlreadyExists: tryAcquireLease treats it as "try again".
  	etcdKeyAlreadyExists = 105

  	// etcdEventIndexCleared: isIndexTooSmall reports true for it, which
  	// makes WatchLeases fall back to a full snapshot.
  	etcdEventIndexCleared = 401
  )
  38. type EtcdManager struct {
  39. registry Registry
  40. }
  var (
  	// subnetRegex picks the dotted-quad address (group 1) and the prefix
  	// length (group 2) out of a subnet key such as "10.3.4.0-24".
  	// Every dot is escaped so that only a literal '.' may separate the
  	// octets; an unescaped '.' would accept any character there.
  	// The pattern is intentionally unanchored because parseSubnetKey is fed
  	// node keys and uses FindStringSubmatch to locate the subnet inside them.
  	subnetRegex = regexp.MustCompile(`(\d+\.\d+\.\d+\.\d+)-(\d+)`)
  )
  // watchCursor carries the etcd index that WatchLeases passes to the
  // registry as the starting point of the next watch.
  type watchCursor struct {
  	index uint64
  }

  // String returns the cursor's index formatted as a base-10 number, the same
  // textual form WatchLeases accepts back as a string cursor.
  func (c watchCursor) String() string {
  	const base = 10
  	return strconv.FormatUint(c.index, base)
  }
  50. func NewEtcdManager(config *EtcdConfig) (Manager, error) {
  51. r, err := newEtcdSubnetRegistry(config)
  52. if err != nil {
  53. return nil, err
  54. }
  55. return &EtcdManager{r}, nil
  56. }
  57. func newEtcdManager(r Registry) Manager {
  58. return &EtcdManager{r}
  59. }
  60. func (m *EtcdManager) GetNetworkConfig(ctx context.Context, network string) (*Config, error) {
  61. cfgResp, err := m.registry.getConfig(ctx, network)
  62. if err != nil {
  63. return nil, err
  64. }
  65. return ParseConfig(cfgResp.Node.Value)
  66. }
  67. func (m *EtcdManager) AcquireLease(ctx context.Context, network string, attrs *LeaseAttrs) (*Lease, error) {
  68. config, err := m.GetNetworkConfig(ctx, network)
  69. if err != nil {
  70. return nil, err
  71. }
  72. for {
  73. l, err := m.acquireLeaseOnce(ctx, network, config, attrs)
  74. switch {
  75. case err == nil:
  76. log.Info("Subnet lease acquired: ", l.Subnet)
  77. return l, nil
  78. case err == context.Canceled, err == context.DeadlineExceeded:
  79. return nil, err
  80. default:
  81. log.Error("Failed to acquire subnet: ", err)
  82. }
  83. select {
  84. case <-time.After(time.Second):
  85. case <-ctx.Done():
  86. return nil, ctx.Err()
  87. }
  88. }
  89. }
  90. func findLeaseByIP(leases []Lease, pubIP ip.IP4) *Lease {
  91. for _, l := range leases {
  92. if pubIP == l.Attrs.PublicIP {
  93. return &l
  94. }
  95. }
  96. return nil
  97. }
  98. func (m *EtcdManager) tryAcquireLease(ctx context.Context, network string, config *Config, extIaddr ip.IP4, attrs *LeaseAttrs) (*Lease, error) {
  99. var err error
  100. leases, _, err := m.getLeases(ctx, network)
  101. if err != nil {
  102. return nil, err
  103. }
  104. attrBytes, err := json.Marshal(attrs)
  105. if err != nil {
  106. return nil, err
  107. }
  108. // try to reuse a subnet if there's one that matches our IP
  109. if l := findLeaseByIP(leases, extIaddr); l != nil {
  110. // make sure the existing subnet is still within the configured network
  111. if isSubnetConfigCompat(config, l.Subnet) {
  112. log.Infof("Found lease (%v) for current IP (%v), reusing", l.Subnet, extIaddr)
  113. resp, err := m.registry.updateSubnet(ctx, network, l.Key(), string(attrBytes), subnetTTL)
  114. if err != nil {
  115. return nil, err
  116. }
  117. l.Attrs = attrs
  118. l.Expiration = *resp.Node.Expiration
  119. return l, nil
  120. } else {
  121. log.Infof("Found lease (%v) for current IP (%v) but not compatible with current config, deleting", l.Subnet, extIaddr)
  122. if _, err := m.registry.deleteSubnet(ctx, network, l.Key()); err != nil {
  123. return nil, err
  124. }
  125. }
  126. }
  127. // no existing match, grab a new one
  128. sn, err := m.allocateSubnet(config, leases)
  129. if err != nil {
  130. return nil, err
  131. }
  132. resp, err := m.registry.createSubnet(ctx, network, sn.StringSep(".", "-"), string(attrBytes), subnetTTL)
  133. switch {
  134. case err == nil:
  135. return &Lease{
  136. Subnet: sn,
  137. Attrs: attrs,
  138. Expiration: *resp.Node.Expiration,
  139. }, nil
  140. // if etcd returned Key Already Exists, try again.
  141. case err.(*etcd.EtcdError).ErrorCode == etcdKeyAlreadyExists:
  142. return nil, nil
  143. default:
  144. return nil, err
  145. }
  146. }
  147. func (m *EtcdManager) acquireLeaseOnce(ctx context.Context, network string, config *Config, attrs *LeaseAttrs) (*Lease, error) {
  148. for i := 0; i < registerRetries; i++ {
  149. l, err := m.tryAcquireLease(ctx, network, config, attrs.PublicIP, attrs)
  150. switch {
  151. case err != nil:
  152. return nil, err
  153. case l != nil:
  154. return l, nil
  155. }
  156. // before moving on, check for cancel
  157. // TODO(eyakubovich): propogate ctx deeper into registry
  158. select {
  159. case <-ctx.Done():
  160. return nil, ctx.Err()
  161. default:
  162. }
  163. }
  164. return nil, errors.New("Max retries reached trying to acquire a subnet")
  165. }
  166. func parseSubnetKey(s string) (ip.IP4Net, error) {
  167. if parts := subnetRegex.FindStringSubmatch(s); len(parts) == 3 {
  168. snIp := net.ParseIP(parts[1]).To4()
  169. prefixLen, err := strconv.ParseUint(parts[2], 10, 5)
  170. if snIp != nil && err == nil {
  171. return ip.IP4Net{IP: ip.FromIP(snIp), PrefixLen: uint(prefixLen)}, nil
  172. }
  173. }
  174. return ip.IP4Net{}, errors.New("Error parsing IP Subnet")
  175. }
  176. func (m *EtcdManager) allocateSubnet(config *Config, leases []Lease) (ip.IP4Net, error) {
  177. log.Infof("Picking subnet in range %s ... %s", config.SubnetMin, config.SubnetMax)
  178. var bag []ip.IP4
  179. sn := ip.IP4Net{IP: config.SubnetMin, PrefixLen: config.SubnetLen}
  180. OuterLoop:
  181. for ; sn.IP <= config.SubnetMax && len(bag) < 100; sn = sn.Next() {
  182. for _, l := range leases {
  183. if sn.Overlaps(l.Subnet) {
  184. continue OuterLoop
  185. }
  186. }
  187. bag = append(bag, sn.IP)
  188. }
  189. if len(bag) == 0 {
  190. return ip.IP4Net{}, errors.New("out of subnets")
  191. } else {
  192. i := randInt(0, len(bag))
  193. return ip.IP4Net{IP: bag[i], PrefixLen: config.SubnetLen}, nil
  194. }
  195. }
  196. // getLeases queries etcd to get a list of currently allocated leases for a given network.
  197. // It returns the leases along with the "as-of" etcd-index that can be used as the starting
  198. // point for etcd watch.
  199. func (m *EtcdManager) getLeases(ctx context.Context, network string) ([]Lease, uint64, error) {
  200. resp, err := m.registry.getSubnets(ctx, network)
  201. leases := []Lease{}
  202. index := uint64(0)
  203. switch {
  204. case err == nil:
  205. for _, node := range resp.Node.Nodes {
  206. sn, err := parseSubnetKey(node.Key)
  207. if err == nil {
  208. attrs := &LeaseAttrs{}
  209. if err = json.Unmarshal([]byte(node.Value), attrs); err == nil {
  210. exp := time.Time{}
  211. if node.Expiration != nil {
  212. exp = *node.Expiration
  213. }
  214. lease := Lease{
  215. Subnet: sn,
  216. Attrs: attrs,
  217. Expiration: exp,
  218. }
  219. leases = append(leases, lease)
  220. }
  221. }
  222. }
  223. index = resp.EtcdIndex
  224. case err.(*etcd.EtcdError).ErrorCode == etcdKeyNotFound:
  225. // key not found: treat it as empty set
  226. index = err.(*etcd.EtcdError).Index
  227. default:
  228. return nil, 0, err
  229. }
  230. return leases, index, nil
  231. }
  232. func (m *EtcdManager) RenewLease(ctx context.Context, network string, lease *Lease) error {
  233. attrBytes, err := json.Marshal(lease.Attrs)
  234. if err != nil {
  235. return err
  236. }
  237. // TODO(eyakubovich): propogate ctx into registry
  238. resp, err := m.registry.updateSubnet(ctx, network, lease.Key(), string(attrBytes), subnetTTL)
  239. if err != nil {
  240. return err
  241. }
  242. lease.Expiration = *resp.Node.Expiration
  243. return nil
  244. }
  245. func (m *EtcdManager) WatchLeases(ctx context.Context, network string, cursor interface{}) (WatchResult, error) {
  246. if cursor == nil {
  247. return m.watchReset(ctx, network)
  248. }
  249. nextIndex := uint64(0)
  250. if wc, ok := cursor.(watchCursor); ok {
  251. nextIndex = wc.index
  252. } else if s, ok := cursor.(string); ok {
  253. var err error
  254. nextIndex, err = strconv.ParseUint(s, 10, 64)
  255. if err != nil {
  256. return WatchResult{}, fmt.Errorf("failed to parse cursor: %v", err)
  257. }
  258. } else {
  259. return WatchResult{}, fmt.Errorf("internal error: watch cursor is of unknown type")
  260. }
  261. resp, err := m.registry.watchSubnets(ctx, network, nextIndex)
  262. switch {
  263. case err == nil:
  264. return parseSubnetWatchResponse(resp)
  265. case isIndexTooSmall(err):
  266. log.Warning("Watch of subnet leases failed because etcd index outside history window")
  267. return m.watchReset(ctx, network)
  268. default:
  269. return WatchResult{}, err
  270. }
  271. }
  272. func isIndexTooSmall(err error) bool {
  273. etcdErr, ok := err.(*etcd.EtcdError)
  274. return ok && etcdErr.ErrorCode == etcdEventIndexCleared
  275. }
  276. func parseSubnetWatchResponse(resp *etcd.Response) (WatchResult, error) {
  277. sn, err := parseSubnetKey(resp.Node.Key)
  278. if err != nil {
  279. return WatchResult{}, fmt.Errorf("error parsing subnet IP: %s", resp.Node.Key)
  280. }
  281. evt := Event{}
  282. switch resp.Action {
  283. case "delete", "expire":
  284. evt = Event{
  285. SubnetRemoved,
  286. Lease{Subnet: sn},
  287. }
  288. default:
  289. attrs := &LeaseAttrs{}
  290. err := json.Unmarshal([]byte(resp.Node.Value), attrs)
  291. if err != nil {
  292. return WatchResult{}, err
  293. }
  294. exp := time.Time{}
  295. if resp.Node.Expiration != nil {
  296. exp = *resp.Node.Expiration
  297. }
  298. evt = Event{
  299. SubnetAdded,
  300. Lease{
  301. Subnet: sn,
  302. Attrs: attrs,
  303. Expiration: exp,
  304. },
  305. }
  306. }
  307. cursor := watchCursor{resp.Node.ModifiedIndex + 1}
  308. return WatchResult{
  309. Cursor: cursor,
  310. Events: []Event{evt},
  311. }, nil
  312. }
  313. // watchReset is called when incremental watch failed and we need to grab a snapshot
  314. func (m *EtcdManager) watchReset(ctx context.Context, network string) (WatchResult, error) {
  315. wr := WatchResult{}
  316. leases, index, err := m.getLeases(ctx, network)
  317. if err != nil {
  318. return wr, fmt.Errorf("failed to retrieve subnet leases: %v", err)
  319. }
  320. cursor := watchCursor{index + 1}
  321. wr.Snapshot = leases
  322. wr.Cursor = cursor
  323. return wr, nil
  324. }
  325. func isSubnetConfigCompat(config *Config, sn ip.IP4Net) bool {
  326. if sn.IP < config.SubnetMin || sn.IP > config.SubnetMax {
  327. return false
  328. }
  329. return sn.PrefixLen == config.SubnetLen
  330. }