vxlan.go 6.0 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277
  1. package vxlan
  2. import (
  3. "encoding/json"
  4. "fmt"
  5. "net"
  6. "sync"
  7. log "github.com/coreos/flannel/Godeps/_workspace/src/github.com/golang/glog"
  8. "github.com/coreos/flannel/Godeps/_workspace/src/github.com/vishvananda/netlink"
  9. "github.com/coreos/flannel/backend"
  10. "github.com/coreos/flannel/subnet"
  11. "github.com/coreos/flannel/pkg/ip"
  12. "github.com/coreos/flannel/pkg/task"
  13. )
  // defaultVNI is the VXLAN network identifier that New stores in the backend
  // configuration before any user-supplied configuration is decoded.
  const defaultVNI = 1
  17. type VXLANBackend struct {
  18. sm *subnet.SubnetManager
  19. rawCfg json.RawMessage
  20. cfg struct {
  21. Vni int
  22. Port int
  23. }
  24. dev *vxlanDevice
  25. stop chan bool
  26. wg sync.WaitGroup
  27. rts routes
  28. }
  29. func New(sm *subnet.SubnetManager, config json.RawMessage) backend.Backend {
  30. vb := &VXLANBackend{
  31. sm: sm,
  32. rawCfg: config,
  33. stop: make(chan bool),
  34. }
  35. vb.cfg.Vni = defaultVNI
  36. return vb
  37. }
  38. func newSubnetAttrs(pubIP net.IP, mac net.HardwareAddr) (*subnet.LeaseAttrs, error) {
  39. sa := subnet.LeaseAttrs{
  40. PublicIP: ip.FromIP(pubIP),
  41. BackendType: "vxlan",
  42. }
  43. data, err := json.Marshal(vxlanLeaseAttrs{hardwareAddr(mac)})
  44. if err != nil {
  45. return nil, err
  46. }
  47. err = sa.BackendData.UnmarshalJSON(data)
  48. if err != nil {
  49. return nil, err
  50. }
  51. return &sa, nil
  52. }
  53. func (vb *VXLANBackend) Init(extIface *net.Interface, extIP net.IP, ipMasq bool) (*backend.SubnetDef, error) {
  54. // Parse our configuration
  55. if len(vb.rawCfg) > 0 {
  56. if err := json.Unmarshal(vb.rawCfg, &vb.cfg); err != nil {
  57. return nil, fmt.Errorf("error decoding UDP backend config: %v", err)
  58. }
  59. }
  60. devAttrs := vxlanDeviceAttrs{
  61. vni: uint32(vb.cfg.Vni),
  62. name: fmt.Sprintf("flannel.%v", vb.cfg.Vni),
  63. vtepIndex: extIface.Index,
  64. vtepAddr: extIP,
  65. vtepPort: vb.cfg.Port,
  66. }
  67. var err error
  68. vb.dev, err = newVXLANDevice(&devAttrs)
  69. if err != nil {
  70. return nil, err
  71. }
  72. sa, err := newSubnetAttrs(extIP, vb.dev.MACAddr())
  73. if err != nil {
  74. return nil, err
  75. }
  76. sn, err := vb.sm.AcquireLease(sa, vb.stop)
  77. if err != nil {
  78. if err == task.ErrCanceled {
  79. return nil, err
  80. } else {
  81. return nil, fmt.Errorf("failed to acquire lease: %v", err)
  82. }
  83. }
  84. // vxlan's subnet is that of the whole overlay network (e.g. /16)
  85. // and not that of the individual host (e.g. /24)
  86. vxlanNet := ip.IP4Net{
  87. IP: sn.IP,
  88. PrefixLen: vb.sm.GetConfig().Network.PrefixLen,
  89. }
  90. if err = vb.dev.Configure(vxlanNet); err != nil {
  91. return nil, err
  92. }
  93. return &backend.SubnetDef{sn, vb.dev.MTU()}, nil
  94. }
  95. func (vb *VXLANBackend) Run() {
  96. vb.wg.Add(1)
  97. go func() {
  98. vb.sm.LeaseRenewer(vb.stop)
  99. vb.wg.Done()
  100. }()
  101. log.Info("Watching for L2/L3 misses")
  102. misses := make(chan *netlink.Neigh, 100)
  103. // Unfortunately MonitorMisses does not take a cancel channel
  104. // as there's no wait to interrupt netlink socket recv
  105. go vb.dev.MonitorMisses(misses)
  106. log.Info("Watching for new subnet leases")
  107. evts := make(chan subnet.EventBatch)
  108. vb.wg.Add(1)
  109. go func() {
  110. vb.sm.WatchLeases(evts, vb.stop)
  111. vb.wg.Done()
  112. }()
  113. defer vb.wg.Wait()
  114. for {
  115. select {
  116. case miss := <-misses:
  117. vb.handleMiss(miss)
  118. case evtBatch := <-evts:
  119. vb.handleSubnetEvents(evtBatch)
  120. case <-vb.stop:
  121. return
  122. }
  123. }
  124. }
  125. func (vb *VXLANBackend) Stop() {
  126. close(vb.stop)
  127. }
  128. func (vb *VXLANBackend) Name() string {
  129. return "VXLAN"
  130. }
  // hardwareAddr is a net.HardwareAddr that can be JSON (un)marshaled. Its
  // JSON form is a string holding the textual MAC address, for example
  // "0a:1b:2c:3d:4e:5f".
  type hardwareAddr net.HardwareAddr

  // MarshalJSON encodes hw as a JSON string containing the text produced by
  // net.HardwareAddr.String.
  func (hw hardwareAddr) MarshalJSON() ([]byte, error) {
  	return json.Marshal(net.HardwareAddr(hw).String())
  }

  // UnmarshalJSON decodes a JSON string holding a MAC address into hw.
  //
  // JSON null is a no-op that leaves hw unchanged, following the
  // json.Unmarshaler convention. Any other non-string value, or a string
  // that net.ParseMAC rejects, yields an error and leaves hw unchanged.
  func (hw *hardwareAddr) UnmarshalJSON(b []byte) error {
  	if string(b) == "null" {
  		return nil
  	}

  	// Decode through encoding/json rather than stripping the quotes by
  	// hand so that escape sequences inside the string are honoured.
  	var text string
  	if err := json.Unmarshal(b, &text); err != nil {
  		return fmt.Errorf("error parsing hardware addr: %v", err)
  	}

  	mac, err := net.ParseMAC(text)
  	if err != nil {
  		return err
  	}

  	*hw = hardwareAddr(mac)
  	return nil
  }
  148. type vxlanLeaseAttrs struct {
  149. VtepMAC hardwareAddr
  150. }
  151. func (vb *VXLANBackend) handleSubnetEvents(batch subnet.EventBatch) {
  152. for _, evt := range batch {
  153. switch evt.Type {
  154. case subnet.SubnetAdded:
  155. log.Info("Subnet added: ", evt.Lease.Network)
  156. if evt.Lease.Attrs.BackendType != "vxlan" {
  157. log.Warningf("Ignoring non-vxlan subnet: type=%v", evt.Lease.Attrs.BackendType)
  158. continue
  159. }
  160. var attrs vxlanLeaseAttrs
  161. if err := json.Unmarshal(evt.Lease.Attrs.BackendData, &attrs); err != nil {
  162. log.Error("Error decoding subnet lease JSON: ", err)
  163. continue
  164. }
  165. vb.rts.set(evt.Lease.Network, evt.Lease.Attrs.PublicIP.ToIP(), net.HardwareAddr(attrs.VtepMAC))
  166. case subnet.SubnetRemoved:
  167. log.Info("Subnet removed: ", evt.Lease.Network)
  168. vb.rts.remove(evt.Lease.Network)
  169. if evt.Lease.Attrs.BackendType != "vxlan" {
  170. log.Warningf("Ignoring non-vxlan subnet: type=%v", evt.Lease.Attrs.BackendType)
  171. continue
  172. }
  173. var attrs vxlanLeaseAttrs
  174. if err := json.Unmarshal(evt.Lease.Attrs.BackendData, &attrs); err != nil {
  175. log.Error("Error decoding subnet lease JSON: ", err)
  176. continue
  177. }
  178. if len(attrs.VtepMAC) > 0 {
  179. vb.dev.DelL2(net.HardwareAddr(attrs.VtepMAC), evt.Lease.Attrs.PublicIP.ToIP())
  180. }
  181. default:
  182. log.Error("Internal error: unknown event type: ", int(evt.Type))
  183. }
  184. }
  185. }
  186. func (vb *VXLANBackend) handleMiss(miss *netlink.Neigh) {
  187. switch {
  188. case len(miss.IP) == 0 && len(miss.HardwareAddr) == 0:
  189. log.Info("Ignoring nil miss")
  190. case len(miss.IP) == 0:
  191. vb.handleL2Miss(miss)
  192. case len(miss.HardwareAddr) == 0:
  193. vb.handleL3Miss(miss)
  194. default:
  195. log.Infof("Ignoring not a miss: %v, %v", miss.HardwareAddr, miss.IP)
  196. }
  197. }
  198. func (vb *VXLANBackend) handleL2Miss(miss *netlink.Neigh) {
  199. log.Infof("L2 miss: %v", miss.HardwareAddr)
  200. rt := vb.rts.findByVtepMAC(miss.HardwareAddr)
  201. if rt == nil {
  202. log.Infof("Route for %v not found", miss.HardwareAddr)
  203. return
  204. }
  205. if err := vb.dev.AddL2(miss.HardwareAddr, rt.vtepIP); err != nil {
  206. log.Errorf("AddL2 failed: %v", err)
  207. } else {
  208. log.Info("AddL2 succeeded")
  209. }
  210. }
  211. func (vb *VXLANBackend) handleL3Miss(miss *netlink.Neigh) {
  212. log.Infof("L3 miss: %v", miss.IP)
  213. rt := vb.rts.findByNetwork(ip.FromIP(miss.IP))
  214. if rt == nil {
  215. log.Infof("Route for %v not found", miss.IP)
  216. return
  217. }
  218. if err := vb.dev.AddL3(miss.IP, rt.vtepMAC); err != nil {
  219. log.Errorf("AddL3 failed: %v", err)
  220. } else {
  221. log.Info("AddL3 succeeded")
  222. }
  223. }