123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300 |
- /*
- Copyright 2015 The Kubernetes Authors.
- Licensed under the Apache License, Version 2.0 (the "License");
- you may not use this file except in compliance with the License.
- You may obtain a copy of the License at
- http://www.apache.org/licenses/LICENSE-2.0
- Unless required by applicable law or agreed to in writing, software
- distributed under the License is distributed on an "AS IS" BASIS,
- WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
- See the License for the specific language governing permissions and
- limitations under the License.
- */
- package userspace
- import (
- "fmt"
- "io"
- "net"
- "strconv"
- "strings"
- "sync"
- "time"
- "github.com/golang/glog"
- "k8s.io/kubernetes/pkg/api"
- "k8s.io/kubernetes/pkg/proxy"
- "k8s.io/kubernetes/pkg/util/runtime"
- )
- // Abstraction over TCP/UDP sockets which are proxied.
- type proxySocket interface {
- // Addr gets the net.Addr for a proxySocket.
- Addr() net.Addr
- // Close stops the proxySocket from accepting incoming connections.
- // Each implementation should comment on the impact of calling Close
- // while sessions are active.
- Close() error
- // ProxyLoop proxies incoming connections for the specified service to the service endpoints.
- ProxyLoop(service proxy.ServicePortName, info *serviceInfo, proxier *Proxier)
- // ListenPort returns the host port that the proxySocket is listening on
- ListenPort() int
- }
- func newProxySocket(protocol api.Protocol, ip net.IP, port int) (proxySocket, error) {
- host := ""
- if ip != nil {
- host = ip.String()
- }
- switch strings.ToUpper(string(protocol)) {
- case "TCP":
- listener, err := net.Listen("tcp", net.JoinHostPort(host, strconv.Itoa(port)))
- if err != nil {
- return nil, err
- }
- return &tcpProxySocket{Listener: listener, port: port}, nil
- case "UDP":
- addr, err := net.ResolveUDPAddr("udp", net.JoinHostPort(host, strconv.Itoa(port)))
- if err != nil {
- return nil, err
- }
- conn, err := net.ListenUDP("udp", addr)
- if err != nil {
- return nil, err
- }
- return &udpProxySocket{UDPConn: conn, port: port}, nil
- }
- return nil, fmt.Errorf("unknown protocol %q", protocol)
- }
// endpointDialTimeout is the schedule of dial timeouts used when connecting to
// a backend: tryConnect makes one attempt per entry, in order, using that
// entry as the timeout for the attempt.
var endpointDialTimeout = []time.Duration{
	250 * time.Millisecond,
	500 * time.Millisecond,
	1 * time.Second,
	2 * time.Second,
}
// tcpProxySocket implements proxySocket for TCP. Addr and Close are provided
// by the embedded net.Listener: once Close has been called no new connections
// are accepted, but connections that already exist are left untouched.
type tcpProxySocket struct {
	net.Listener
	port int
}

// ListenPort returns the port number recorded in the socket when it was
// constructed.
func (tcp *tcpProxySocket) ListenPort() int {
	return tcp.port
}
- func tryConnect(service proxy.ServicePortName, srcAddr net.Addr, protocol string, proxier *Proxier) (out net.Conn, err error) {
- sessionAffinityReset := false
- for _, dialTimeout := range endpointDialTimeout {
- endpoint, err := proxier.loadBalancer.NextEndpoint(service, srcAddr, sessionAffinityReset)
- if err != nil {
- glog.Errorf("Couldn't find an endpoint for %s: %v", service, err)
- return nil, err
- }
- glog.V(3).Infof("Mapped service %q to endpoint %s", service, endpoint)
- // TODO: This could spin up a new goroutine to make the outbound connection,
- // and keep accepting inbound traffic.
- outConn, err := net.DialTimeout(protocol, endpoint, dialTimeout)
- if err != nil {
- if isTooManyFDsError(err) {
- panic("Dial failed: " + err.Error())
- }
- glog.Errorf("Dial failed: %v", err)
- sessionAffinityReset = true
- continue
- }
- return outConn, nil
- }
- return nil, fmt.Errorf("failed to connect to an endpoint.")
- }
- func (tcp *tcpProxySocket) ProxyLoop(service proxy.ServicePortName, myInfo *serviceInfo, proxier *Proxier) {
- for {
- if !myInfo.isAlive() {
- // The service port was closed or replaced.
- return
- }
- // Block until a connection is made.
- inConn, err := tcp.Accept()
- if err != nil {
- if isTooManyFDsError(err) {
- panic("Accept failed: " + err.Error())
- }
- if isClosedError(err) {
- return
- }
- if !myInfo.isAlive() {
- // Then the service port was just closed so the accept failure is to be expected.
- return
- }
- glog.Errorf("Accept failed: %v", err)
- continue
- }
- glog.V(3).Infof("Accepted TCP connection from %v to %v", inConn.RemoteAddr(), inConn.LocalAddr())
- outConn, err := tryConnect(service, inConn.(*net.TCPConn).RemoteAddr(), "tcp", proxier)
- if err != nil {
- glog.Errorf("Failed to connect to balancer: %v", err)
- inConn.Close()
- continue
- }
- // Spin up an async copy loop.
- go proxyTCP(inConn.(*net.TCPConn), outConn.(*net.TCPConn))
- }
- }
- // proxyTCP proxies data bi-directionally between in and out.
- func proxyTCP(in, out *net.TCPConn) {
- var wg sync.WaitGroup
- wg.Add(2)
- glog.V(4).Infof("Creating proxy between %v <-> %v <-> %v <-> %v",
- in.RemoteAddr(), in.LocalAddr(), out.LocalAddr(), out.RemoteAddr())
- go copyBytes("from backend", in, out, &wg)
- go copyBytes("to backend", out, in, &wg)
- wg.Wait()
- }
- func copyBytes(direction string, dest, src *net.TCPConn, wg *sync.WaitGroup) {
- defer wg.Done()
- glog.V(4).Infof("Copying %s: %s -> %s", direction, src.RemoteAddr(), dest.RemoteAddr())
- n, err := io.Copy(dest, src)
- if err != nil {
- if !isClosedError(err) {
- glog.Errorf("I/O error: %v", err)
- }
- }
- glog.V(4).Infof("Copied %d bytes %s: %s -> %s", n, direction, src.RemoteAddr(), dest.RemoteAddr())
- dest.Close()
- src.Close()
- }
// udpProxySocket implements proxySocket for UDP. Close is provided by the
// embedded *net.UDPConn: once Close has been called no new connections are
// allowed and existing connections are broken.
// TODO: We could lame-duck this ourselves, if it becomes important.
type udpProxySocket struct {
	*net.UDPConn
	port int
}

// ListenPort returns the port number recorded in the socket when it was
// constructed.
func (udp *udpProxySocket) ListenPort() int {
	return udp.port
}

// Addr returns the local address of the underlying UDP connection.
func (udp *udpProxySocket) Addr() net.Addr {
	return udp.LocalAddr()
}
// clientCache holds all the known UDP clients that have not timed out.
type clientCache struct {
	mu      sync.Mutex
	clients map[string]net.Conn // client address string -> backend connection
}

// newClientCache returns a clientCache with an empty, initialized client map.
func newClientCache() *clientCache {
	cache := &clientCache{}
	cache.clients = make(map[string]net.Conn)
	return cache
}
- func (udp *udpProxySocket) ProxyLoop(service proxy.ServicePortName, myInfo *serviceInfo, proxier *Proxier) {
- var buffer [4096]byte // 4KiB should be enough for most whole-packets
- for {
- if !myInfo.isAlive() {
- // The service port was closed or replaced.
- break
- }
- // Block until data arrives.
- // TODO: Accumulate a histogram of n or something, to fine tune the buffer size.
- n, cliAddr, err := udp.ReadFrom(buffer[0:])
- if err != nil {
- if e, ok := err.(net.Error); ok {
- if e.Temporary() {
- glog.V(1).Infof("ReadFrom had a temporary failure: %v", err)
- continue
- }
- }
- glog.Errorf("ReadFrom failed, exiting ProxyLoop: %v", err)
- break
- }
- // If this is a client we know already, reuse the connection and goroutine.
- svrConn, err := udp.getBackendConn(myInfo.activeClients, cliAddr, proxier, service, myInfo.timeout)
- if err != nil {
- continue
- }
- // TODO: It would be nice to let the goroutine handle this write, but we don't
- // really want to copy the buffer. We could do a pool of buffers or something.
- _, err = svrConn.Write(buffer[0:n])
- if err != nil {
- if !logTimeout(err) {
- glog.Errorf("Write failed: %v", err)
- // TODO: Maybe tear down the goroutine for this client/server pair?
- }
- continue
- }
- err = svrConn.SetDeadline(time.Now().Add(myInfo.timeout))
- if err != nil {
- glog.Errorf("SetDeadline failed: %v", err)
- continue
- }
- }
- }
- func (udp *udpProxySocket) getBackendConn(activeClients *clientCache, cliAddr net.Addr, proxier *Proxier, service proxy.ServicePortName, timeout time.Duration) (net.Conn, error) {
- activeClients.mu.Lock()
- defer activeClients.mu.Unlock()
- svrConn, found := activeClients.clients[cliAddr.String()]
- if !found {
- // TODO: This could spin up a new goroutine to make the outbound connection,
- // and keep accepting inbound traffic.
- glog.V(3).Infof("New UDP connection from %s", cliAddr)
- var err error
- svrConn, err = tryConnect(service, cliAddr, "udp", proxier)
- if err != nil {
- return nil, err
- }
- if err = svrConn.SetDeadline(time.Now().Add(timeout)); err != nil {
- glog.Errorf("SetDeadline failed: %v", err)
- return nil, err
- }
- activeClients.clients[cliAddr.String()] = svrConn
- go func(cliAddr net.Addr, svrConn net.Conn, activeClients *clientCache, timeout time.Duration) {
- defer runtime.HandleCrash()
- udp.proxyClient(cliAddr, svrConn, activeClients, timeout)
- }(cliAddr, svrConn, activeClients, timeout)
- }
- return svrConn, nil
- }
- // This function is expected to be called as a goroutine.
- // TODO: Track and log bytes copied, like TCP
- func (udp *udpProxySocket) proxyClient(cliAddr net.Addr, svrConn net.Conn, activeClients *clientCache, timeout time.Duration) {
- defer svrConn.Close()
- var buffer [4096]byte
- for {
- n, err := svrConn.Read(buffer[0:])
- if err != nil {
- if !logTimeout(err) {
- glog.Errorf("Read failed: %v", err)
- }
- break
- }
- err = svrConn.SetDeadline(time.Now().Add(timeout))
- if err != nil {
- glog.Errorf("SetDeadline failed: %v", err)
- break
- }
- n, err = udp.WriteTo(buffer[0:n], cliAddr)
- if err != nil {
- if !logTimeout(err) {
- glog.Errorf("WriteTo failed: %v", err)
- }
- break
- }
- }
- activeClients.mu.Lock()
- delete(activeClients.clients, cliAddr.String())
- activeClients.mu.Unlock()
- }
|