network.go 8.9 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368
  1. package docker
  2. import (
  3. "bytes"
  4. "encoding/binary"
  5. "errors"
  6. "fmt"
  7. "log"
  8. "net"
  9. "os/exec"
  10. "strconv"
  11. "strings"
  12. )
  13. const (
  14. networkBridgeIface = "lxcbr0"
  15. portRangeStart = 49153
  16. portRangeEnd = 65535
  17. )
  18. // Calculates the first and last IP addresses in an IPNet
  19. func networkRange(network *net.IPNet) (net.IP, net.IP) {
  20. netIP := network.IP.To4()
  21. firstIP := netIP.Mask(network.Mask)
  22. lastIP := net.IPv4(0, 0, 0, 0).To4()
  23. for i := 0; i < len(lastIP); i++ {
  24. lastIP[i] = netIP[i] | ^network.Mask[i]
  25. }
  26. return firstIP, lastIP
  27. }
  28. // Converts a 4 bytes IP into a 32 bit integer
  29. func ipToInt(ip net.IP) (int32, error) {
  30. buf := bytes.NewBuffer(ip.To4())
  31. var n int32
  32. if err := binary.Read(buf, binary.BigEndian, &n); err != nil {
  33. return 0, err
  34. }
  35. return n, nil
  36. }
  37. // Converts 32 bit integer into a 4 bytes IP address
  38. func intToIp(n int32) (net.IP, error) {
  39. var buf bytes.Buffer
  40. if err := binary.Write(&buf, binary.BigEndian, &n); err != nil {
  41. return net.IP{}, err
  42. }
  43. ip := net.IPv4(0, 0, 0, 0).To4()
  44. for i := 0; i < net.IPv4len; i++ {
  45. ip[i] = buf.Bytes()[i]
  46. }
  47. return ip, nil
  48. }
  49. // Given a netmask, calculates the number of available hosts
  50. func networkSize(mask net.IPMask) (int32, error) {
  51. m := net.IPv4Mask(0, 0, 0, 0)
  52. for i := 0; i < net.IPv4len; i++ {
  53. m[i] = ^mask[i]
  54. }
  55. buf := bytes.NewBuffer(m)
  56. var n int32
  57. if err := binary.Read(buf, binary.BigEndian, &n); err != nil {
  58. return 0, err
  59. }
  60. return n + 1, nil
  61. }
  62. // Wrapper around the iptables command
  63. func iptables(args ...string) error {
  64. path, err := exec.LookPath("iptables")
  65. if err != nil {
  66. return fmt.Errorf("command not found: iptables")
  67. }
  68. if err := exec.Command(path, args...).Run(); err != nil {
  69. return fmt.Errorf("iptables failed: iptables %v", strings.Join(args, " "))
  70. }
  71. return nil
  72. }
  73. // Return the IPv4 address of a network interface
  74. func getIfaceAddr(name string) (net.Addr, error) {
  75. iface, err := net.InterfaceByName(name)
  76. if err != nil {
  77. return nil, err
  78. }
  79. addrs, err := iface.Addrs()
  80. if err != nil {
  81. return nil, err
  82. }
  83. var addrs4 []net.Addr
  84. for _, addr := range addrs {
  85. ip := (addr.(*net.IPNet)).IP
  86. if ip4 := ip.To4(); len(ip4) == net.IPv4len {
  87. addrs4 = append(addrs4, addr)
  88. }
  89. }
  90. switch {
  91. case len(addrs4) == 0:
  92. return nil, fmt.Errorf("Interface %v has no IP addresses", name)
  93. case len(addrs4) > 1:
  94. fmt.Printf("Interface %v has more than 1 IPv4 address. Defaulting to using %v\n",
  95. name, (addrs4[0].(*net.IPNet)).IP)
  96. }
  97. return addrs4[0], nil
  98. }
  99. // Port mapper takes care of mapping external ports to containers by setting
  100. // up iptables rules.
  101. // It keeps track of all mappings and is able to unmap at will
  102. type PortMapper struct {
  103. mapping map[int]net.TCPAddr
  104. }
  105. func (mapper *PortMapper) cleanup() error {
  106. // Ignore errors - This could mean the chains were never set up
  107. iptables("-t", "nat", "-D", "PREROUTING", "-j", "DOCKER")
  108. iptables("-t", "nat", "-D", "OUTPUT", "-j", "DOCKER")
  109. iptables("-t", "nat", "-F", "DOCKER")
  110. iptables("-t", "nat", "-X", "DOCKER")
  111. mapper.mapping = make(map[int]net.TCPAddr)
  112. return nil
  113. }
  114. func (mapper *PortMapper) setup() error {
  115. if err := iptables("-t", "nat", "-N", "DOCKER"); err != nil {
  116. return fmt.Errorf("Failed to create DOCKER chain: %s", err)
  117. }
  118. if err := iptables("-t", "nat", "-A", "PREROUTING", "-j", "DOCKER"); err != nil {
  119. return fmt.Errorf("Failed to inject docker in PREROUTING chain: %s", err)
  120. }
  121. if err := iptables("-t", "nat", "-A", "OUTPUT", "-j", "DOCKER"); err != nil {
  122. return fmt.Errorf("Failed to inject docker in OUTPUT chain: %s", err)
  123. }
  124. return nil
  125. }
  126. func (mapper *PortMapper) iptablesForward(rule string, port int, dest net.TCPAddr) error {
  127. return iptables("-t", "nat", rule, "DOCKER", "-p", "tcp", "--dport", strconv.Itoa(port),
  128. "-j", "DNAT", "--to-destination", net.JoinHostPort(dest.IP.String(), strconv.Itoa(dest.Port)))
  129. }
  130. func (mapper *PortMapper) Map(port int, dest net.TCPAddr) error {
  131. if err := mapper.iptablesForward("-A", port, dest); err != nil {
  132. return err
  133. }
  134. mapper.mapping[port] = dest
  135. return nil
  136. }
  137. func (mapper *PortMapper) Unmap(port int) error {
  138. dest, ok := mapper.mapping[port]
  139. if !ok {
  140. return errors.New("Port is not mapped")
  141. }
  142. if err := mapper.iptablesForward("-D", port, dest); err != nil {
  143. return err
  144. }
  145. delete(mapper.mapping, port)
  146. return nil
  147. }
  148. func newPortMapper() (*PortMapper, error) {
  149. mapper := &PortMapper{}
  150. if err := mapper.cleanup(); err != nil {
  151. return nil, err
  152. }
  153. if err := mapper.setup(); err != nil {
  154. return nil, err
  155. }
  156. return mapper, nil
  157. }
  158. // Port allocator: Atomatically allocate and release networking ports
  159. type PortAllocator struct {
  160. ports chan (int)
  161. }
  162. func (alloc *PortAllocator) populate(start, end int) {
  163. alloc.ports = make(chan int, end-start)
  164. for port := start; port < end; port++ {
  165. alloc.ports <- port
  166. }
  167. }
  168. func (alloc *PortAllocator) Acquire() (int, error) {
  169. select {
  170. case port := <-alloc.ports:
  171. return port, nil
  172. default:
  173. return -1, errors.New("No more ports available")
  174. }
  175. return -1, nil
  176. }
  177. func (alloc *PortAllocator) Release(port int) error {
  178. select {
  179. case alloc.ports <- port:
  180. return nil
  181. default:
  182. return errors.New("Too many ports have been released")
  183. }
  184. return nil
  185. }
  186. func newPortAllocator(start, end int) (*PortAllocator, error) {
  187. allocator := &PortAllocator{}
  188. allocator.populate(start, end)
  189. return allocator, nil
  190. }
  191. // IP allocator: Atomatically allocate and release networking ports
  192. type IPAllocator struct {
  193. network *net.IPNet
  194. queue chan (net.IP)
  195. }
  196. func (alloc *IPAllocator) populate() error {
  197. firstIP, _ := networkRange(alloc.network)
  198. size, err := networkSize(alloc.network.Mask)
  199. if err != nil {
  200. return err
  201. }
  202. // The queue size should be the network size - 3
  203. // -1 for the network address, -1 for the broadcast address and
  204. // -1 for the gateway address
  205. alloc.queue = make(chan net.IP, size-3)
  206. for i := int32(1); i < size-1; i++ {
  207. ipNum, err := ipToInt(firstIP)
  208. if err != nil {
  209. return err
  210. }
  211. ip, err := intToIp(ipNum + int32(i))
  212. if err != nil {
  213. return err
  214. }
  215. // Discard the network IP (that's the host IP address)
  216. if ip.Equal(alloc.network.IP) {
  217. continue
  218. }
  219. alloc.queue <- ip
  220. }
  221. return nil
  222. }
  223. func (alloc *IPAllocator) Acquire() (net.IP, error) {
  224. select {
  225. case ip := <-alloc.queue:
  226. return ip, nil
  227. default:
  228. return net.IP{}, errors.New("No more IP addresses available")
  229. }
  230. return net.IP{}, nil
  231. }
  232. func (alloc *IPAllocator) Release(ip net.IP) error {
  233. select {
  234. case alloc.queue <- ip:
  235. return nil
  236. default:
  237. return errors.New("Too many IP addresses have been released")
  238. }
  239. return nil
  240. }
  241. func newIPAllocator(network *net.IPNet) (*IPAllocator, error) {
  242. alloc := &IPAllocator{
  243. network: network,
  244. }
  245. if err := alloc.populate(); err != nil {
  246. return nil, err
  247. }
  248. return alloc, nil
  249. }
  250. // Network interface represents the networking stack of a container
  251. type NetworkInterface struct {
  252. IPNet net.IPNet
  253. Gateway net.IP
  254. manager *NetworkManager
  255. extPorts []int
  256. }
  257. // Allocate an external TCP port and map it to the interface
  258. func (iface *NetworkInterface) AllocatePort(port int) (int, error) {
  259. extPort, err := iface.manager.portAllocator.Acquire()
  260. if err != nil {
  261. return -1, err
  262. }
  263. if err := iface.manager.portMapper.Map(extPort, net.TCPAddr{IP: iface.IPNet.IP, Port: port}); err != nil {
  264. iface.manager.portAllocator.Release(extPort)
  265. return -1, err
  266. }
  267. iface.extPorts = append(iface.extPorts, extPort)
  268. return extPort, nil
  269. }
  270. // Release: Network cleanup - release all resources
  271. func (iface *NetworkInterface) Release() error {
  272. for _, port := range iface.extPorts {
  273. if err := iface.manager.portMapper.Unmap(port); err != nil {
  274. log.Printf("Unable to unmap port %v: %v", port, err)
  275. }
  276. if err := iface.manager.portAllocator.Release(port); err != nil {
  277. log.Printf("Unable to release port %v: %v", port, err)
  278. }
  279. }
  280. return iface.manager.ipAllocator.Release(iface.IPNet.IP)
  281. }
  282. // Network Manager manages a set of network interfaces
  283. // Only *one* manager per host machine should be used
  284. type NetworkManager struct {
  285. bridgeIface string
  286. bridgeNetwork *net.IPNet
  287. ipAllocator *IPAllocator
  288. portAllocator *PortAllocator
  289. portMapper *PortMapper
  290. }
  291. // Allocate a network interface
  292. func (manager *NetworkManager) Allocate() (*NetworkInterface, error) {
  293. ip, err := manager.ipAllocator.Acquire()
  294. if err != nil {
  295. return nil, err
  296. }
  297. iface := &NetworkInterface{
  298. IPNet: net.IPNet{IP: ip, Mask: manager.bridgeNetwork.Mask},
  299. Gateway: manager.bridgeNetwork.IP,
  300. manager: manager,
  301. }
  302. return iface, nil
  303. }
  304. func newNetworkManager(bridgeIface string) (*NetworkManager, error) {
  305. addr, err := getIfaceAddr(bridgeIface)
  306. if err != nil {
  307. return nil, err
  308. }
  309. network := addr.(*net.IPNet)
  310. ipAllocator, err := newIPAllocator(network)
  311. if err != nil {
  312. return nil, err
  313. }
  314. portAllocator, err := newPortAllocator(portRangeStart, portRangeEnd)
  315. if err != nil {
  316. return nil, err
  317. }
  318. portMapper, err := newPortMapper()
  319. if err != nil {
  320. return nil, err
  321. }
  322. manager := &NetworkManager{
  323. bridgeIface: bridgeIface,
  324. bridgeNetwork: network,
  325. ipAllocator: ipAllocator,
  326. portAllocator: portAllocator,
  327. portMapper: portMapper,
  328. }
  329. return manager, nil
  330. }