2013-02-21 01:47:09 +00:00
|
|
|
package docker
|
|
|
|
|
|
|
|
import (
|
2013-02-22 02:33:23 +00:00
|
|
|
"encoding/binary"
|
2013-02-25 18:45:23 +00:00
|
|
|
"errors"
|
2013-02-21 02:20:18 +00:00
|
|
|
"fmt"
|
2013-02-28 19:50:02 +00:00
|
|
|
"log"
|
2013-02-21 01:47:09 +00:00
|
|
|
"net"
|
2013-02-28 19:50:02 +00:00
|
|
|
"os/exec"
|
|
|
|
"strconv"
|
|
|
|
"strings"
|
2013-02-21 01:47:09 +00:00
|
|
|
)
|
|
|
|
|
|
|
|
const (
	// networkBridgeIface is the name of the host bridge interface.
	networkBridgeIface = "lxcbr0"

	// portRangeStart and portRangeEnd delimit the pool of external ports.
	portRangeStart = 49153
	portRangeEnd   = 65535
)
|
|
|
|
|
2013-02-28 19:50:02 +00:00
|
|
|
// networkRange calculates the first and last IPv4 addresses of an IPNet.
//
// The first address is the network IP with the host bits cleared, the last
// one is the network IP with all host bits set. A 16-byte mask describing an
// IPv4 network (96 or more leading ones out of 128 bits) is reduced to its
// 4-byte form first, so both results are computed from the same mask bytes.
func networkRange(network *net.IPNet) (net.IP, net.IP) {
	mask := network.Mask
	if ones, bits := mask.Size(); bits == 8*net.IPv6len && ones >= 8*(net.IPv6len-net.IPv4len) {
		mask = net.CIDRMask(ones-8*(net.IPv6len-net.IPv4len), 8*net.IPv4len)
	}

	netIP := network.IP.To4()
	firstIP := netIP.Mask(mask)

	lastIP := make(net.IP, net.IPv4len)
	for i := range lastIP {
		// Setting every host bit yields the highest address of the network.
		lastIP[i] = netIP[i] | ^mask[i]
	}
	return firstIP, lastIP
}
|
|
|
|
|
2013-02-28 19:50:02 +00:00
|
|
|
// ipToInt converts an IPv4 address into a 32 bit integer, reading the four
// address bytes in big-endian order. Addresses whose first byte is 128 or
// above come out negative because the result is signed.
func ipToInt(ip net.IP) int32 {
	v4 := ip.To4()
	raw := binary.BigEndian.Uint32(v4)
	return int32(raw)
}
|
|
|
|
|
2013-02-28 19:50:02 +00:00
|
|
|
// intToIp converts a 32 bit integer into a 4-byte IP address, writing the
// integer in big-endian order.
func intToIp(n int32) net.IP {
	var quad [net.IPv4len]byte
	binary.BigEndian.PutUint32(quad[:], uint32(n))
	return net.IP(quad[:])
}
|
|
|
|
|
2013-02-28 19:50:02 +00:00
|
|
|
// networkSize returns the number of addresses covered by an IPv4 netmask
// (network and broadcast addresses included).
//
// A 16-byte mask describing an IPv4 network (96 or more leading ones out of
// 128 bits) is reduced to its 4-byte form before the host bits are counted;
// otherwise only the all-ones prefix bytes would be looked at.
func networkSize(mask net.IPMask) int32 {
	if ones, bits := mask.Size(); bits == 8*net.IPv6len && ones >= 8*(net.IPv6len-net.IPv4len) {
		mask = net.CIDRMask(ones-8*(net.IPv6len-net.IPv4len), 8*net.IPv4len)
	}

	// Inverting the mask leaves exactly the host bits set; read as an
	// integer that is the highest host offset, hence the +1.
	hostBits := make([]byte, net.IPv4len)
	for i := range hostBits {
		hostBits[i] = ^mask[i]
	}
	return int32(binary.BigEndian.Uint32(hostBits)) + 1
}
|
|
|
|
|
2013-02-28 19:50:02 +00:00
|
|
|
// iptables is a wrapper around the iptables command.
//
// It looks the binary up in PATH, runs it with args and returns nil when the
// command exits successfully. On failure the returned error names the
// attempted command line and carries both the execution error and whatever
// the command printed, so the cause can be diagnosed by the caller.
func iptables(args ...string) error {
	path, err := exec.LookPath("iptables")
	if err != nil {
		return fmt.Errorf("command not found: iptables")
	}
	output, err := exec.Command(path, args...).CombinedOutput()
	if err != nil {
		return fmt.Errorf("iptables failed: iptables %v: %v (%s)",
			strings.Join(args, " "), err, strings.TrimSpace(string(output)))
	}
	return nil
}
|
|
|
|
|
|
|
|
// getIfaceAddr returns the IPv4 address of a network interface.
//
// Only addresses reported as *net.IPNet with an IPv4 IP are considered; any
// other kind of net.Addr is skipped instead of being force-cast. When the
// interface carries several IPv4 addresses a notice is printed and the first
// one is used. An error is returned when the interface cannot be looked up,
// its addresses cannot be listed, or it has no IPv4 address at all.
func getIfaceAddr(name string) (net.Addr, error) {
	iface, err := net.InterfaceByName(name)
	if err != nil {
		return nil, err
	}
	addrs, err := iface.Addrs()
	if err != nil {
		return nil, err
	}

	var addrs4 []*net.IPNet
	for _, addr := range addrs {
		ipNet, ok := addr.(*net.IPNet)
		if !ok {
			// Not an IP network address; nothing to pick from it.
			continue
		}
		if ipNet.IP.To4() != nil {
			addrs4 = append(addrs4, ipNet)
		}
	}

	switch {
	case len(addrs4) == 0:
		return nil, fmt.Errorf("Interface %v has no IP addresses", name)
	case len(addrs4) > 1:
		fmt.Printf("Interface %v has more than 1 IPv4 address. Defaulting to using %v\n",
			name, addrs4[0].IP)
	}
	return addrs4[0], nil
}
|
|
|
|
|
2013-02-28 19:50:02 +00:00
|
|
|
// Port mapper takes care of mapping external ports to containers by setting
|
|
|
|
// up iptables rules.
|
|
|
|
// It keeps track of all mappings and is able to unmap at will
|
|
|
|
type PortMapper struct {
|
|
|
|
mapping map[int]net.TCPAddr
|
|
|
|
}
|
|
|
|
|
|
|
|
func (mapper *PortMapper) cleanup() error {
|
|
|
|
// Ignore errors - This could mean the chains were never set up
|
2013-04-03 22:32:46 +00:00
|
|
|
iptables("-t", "nat", "-D", "PREROUTING", "-m", "addrtype", "--dst-type", "LOCAL", "-j", "DOCKER")
|
2013-04-04 19:56:37 +00:00
|
|
|
iptables("-t", "nat", "-D", "OUTPUT", "-m", "addrtype", "--dst-type", "LOCAL", "-j", "DOCKER")
|
2013-04-04 22:16:42 +00:00
|
|
|
// Also cleanup rules created by older versions, or -X might fail.
|
|
|
|
iptables("-t", "nat", "-D", "PREROUTING", "-j", "DOCKER")
|
|
|
|
iptables("-t", "nat", "-D", "OUTPUT", "-j", "DOCKER")
|
2013-02-28 19:50:02 +00:00
|
|
|
iptables("-t", "nat", "-F", "DOCKER")
|
|
|
|
iptables("-t", "nat", "-X", "DOCKER")
|
|
|
|
mapper.mapping = make(map[int]net.TCPAddr)
|
|
|
|
return nil
|
|
|
|
}
|
|
|
|
|
|
|
|
func (mapper *PortMapper) setup() error {
|
|
|
|
if err := iptables("-t", "nat", "-N", "DOCKER"); err != nil {
|
2013-03-28 19:44:54 +00:00
|
|
|
return fmt.Errorf("Failed to create DOCKER chain: %s", err)
|
2013-02-21 02:20:18 +00:00
|
|
|
}
|
2013-04-03 22:32:46 +00:00
|
|
|
if err := iptables("-t", "nat", "-A", "PREROUTING", "-m", "addrtype", "--dst-type", "LOCAL", "-j", "DOCKER"); err != nil {
|
2013-03-28 19:44:54 +00:00
|
|
|
return fmt.Errorf("Failed to inject docker in PREROUTING chain: %s", err)
|
2013-02-28 19:50:02 +00:00
|
|
|
}
|
2013-04-04 19:56:37 +00:00
|
|
|
if err := iptables("-t", "nat", "-A", "OUTPUT", "-m", "addrtype", "--dst-type", "LOCAL", "-j", "DOCKER"); err != nil {
|
2013-03-28 19:44:54 +00:00
|
|
|
return fmt.Errorf("Failed to inject docker in OUTPUT chain: %s", err)
|
2013-03-22 14:06:14 +00:00
|
|
|
}
|
2013-02-28 19:50:02 +00:00
|
|
|
return nil
|
|
|
|
}
|
|
|
|
|
|
|
|
func (mapper *PortMapper) iptablesForward(rule string, port int, dest net.TCPAddr) error {
|
|
|
|
return iptables("-t", "nat", rule, "DOCKER", "-p", "tcp", "--dport", strconv.Itoa(port),
|
|
|
|
"-j", "DNAT", "--to-destination", net.JoinHostPort(dest.IP.String(), strconv.Itoa(dest.Port)))
|
|
|
|
}
|
|
|
|
|
|
|
|
func (mapper *PortMapper) Map(port int, dest net.TCPAddr) error {
|
|
|
|
if err := mapper.iptablesForward("-A", port, dest); err != nil {
|
|
|
|
return err
|
|
|
|
}
|
|
|
|
mapper.mapping[port] = dest
|
|
|
|
return nil
|
|
|
|
}
|
2013-02-25 22:06:22 +00:00
|
|
|
|
2013-02-28 19:50:02 +00:00
|
|
|
func (mapper *PortMapper) Unmap(port int) error {
|
|
|
|
dest, ok := mapper.mapping[port]
|
|
|
|
if !ok {
|
|
|
|
return errors.New("Port is not mapped")
|
|
|
|
}
|
|
|
|
if err := mapper.iptablesForward("-D", port, dest); err != nil {
|
|
|
|
return err
|
2013-02-22 02:33:23 +00:00
|
|
|
}
|
2013-02-28 19:50:02 +00:00
|
|
|
delete(mapper.mapping, port)
|
|
|
|
return nil
|
|
|
|
}
|
|
|
|
|
|
|
|
func newPortMapper() (*PortMapper, error) {
|
|
|
|
mapper := &PortMapper{}
|
|
|
|
if err := mapper.cleanup(); err != nil {
|
2013-02-25 22:06:22 +00:00
|
|
|
return nil, err
|
2013-02-21 01:47:09 +00:00
|
|
|
}
|
2013-02-28 19:50:02 +00:00
|
|
|
if err := mapper.setup(); err != nil {
|
|
|
|
return nil, err
|
|
|
|
}
|
|
|
|
return mapper, nil
|
2013-02-21 01:47:09 +00:00
|
|
|
}
|
2013-02-25 18:45:23 +00:00
|
|
|
|
2013-02-28 19:50:02 +00:00
|
|
|
// PortAllocator automatically allocates and releases networking ports.
//
// The free ports live in a buffered channel; Acquire takes one out and
// Release puts one back. Both use a non-blocking select, so neither call
// ever blocks.
type PortAllocator struct {
	ports chan (int)
}

// populate replaces the pool with every port from start up to, but not
// including, end.
func (alloc *PortAllocator) populate(start, end int) {
	alloc.ports = make(chan int, end-start)
	for port := start; port < end; port++ {
		alloc.ports <- port
	}
}

// Acquire takes a free port out of the pool. It returns -1 and an error when
// the pool is empty.
func (alloc *PortAllocator) Acquire() (int, error) {
	select {
	case port := <-alloc.ports:
		return port, nil
	default:
		return -1, errors.New("No more ports available")
	}
}

// Release puts port back into the pool. It returns an error when the pool is
// already full, i.e. more ports were released than acquired.
func (alloc *PortAllocator) Release(port int) error {
	select {
	case alloc.ports <- port:
		return nil
	default:
		return errors.New("Too many ports have been released")
	}
}

// newPortAllocator returns an allocator holding the ports from start up to,
// but not including, end. It returns an error when start is greater than
// end, since no pool can be built for such a range.
func newPortAllocator(start, end int) (*PortAllocator, error) {
	if start > end {
		return nil, fmt.Errorf("invalid port range: start %d is greater than end %d", start, end)
	}
	allocator := &PortAllocator{}
	allocator.populate(start, end)
	return allocator, nil
}
|
|
|
|
|
|
|
|
// IP allocator: Atomatically allocate and release networking ports
|
|
|
|
type IPAllocator struct {
|
2013-03-30 22:32:10 +00:00
|
|
|
network *net.IPNet
|
|
|
|
queueAlloc chan allocatedIP
|
|
|
|
queueReleased chan net.IP
|
|
|
|
inUse map[int32]struct{}
|
|
|
|
}
|
|
|
|
|
|
|
|
type allocatedIP struct {
|
|
|
|
ip net.IP
|
|
|
|
err error
|
2013-02-28 19:50:02 +00:00
|
|
|
}
|
|
|
|
|
2013-03-30 22:32:10 +00:00
|
|
|
func (alloc *IPAllocator) run() {
|
2013-02-28 19:50:02 +00:00
|
|
|
firstIP, _ := networkRange(alloc.network)
|
2013-03-30 22:32:10 +00:00
|
|
|
ipNum := ipToInt(firstIP)
|
|
|
|
ownIP := ipToInt(alloc.network.IP)
|
|
|
|
size := networkSize(alloc.network.Mask)
|
|
|
|
|
|
|
|
pos := int32(1)
|
|
|
|
max := size - 2 // -1 for the broadcast address, -1 for the gateway address
|
|
|
|
for {
|
|
|
|
var (
|
|
|
|
newNum int32
|
|
|
|
inUse bool
|
|
|
|
)
|
|
|
|
|
|
|
|
// Find first unused IP, give up after one whole round
|
|
|
|
for attempt := int32(0); attempt < max; attempt++ {
|
|
|
|
newNum = ipNum + pos
|
|
|
|
|
|
|
|
pos = pos%max + 1
|
|
|
|
|
|
|
|
// The network's IP is never okay to use
|
|
|
|
if newNum == ownIP {
|
|
|
|
continue
|
|
|
|
}
|
|
|
|
|
|
|
|
if _, inUse = alloc.inUse[newNum]; !inUse {
|
|
|
|
// We found an unused IP
|
|
|
|
break
|
|
|
|
}
|
2013-02-25 18:45:23 +00:00
|
|
|
}
|
2013-03-30 22:32:10 +00:00
|
|
|
|
|
|
|
ip := allocatedIP{ip: intToIp(newNum)}
|
|
|
|
if inUse {
|
|
|
|
ip.err = errors.New("No unallocated IP available")
|
2013-02-25 18:45:23 +00:00
|
|
|
}
|
2013-03-30 22:32:10 +00:00
|
|
|
|
|
|
|
select {
|
|
|
|
case alloc.queueAlloc <- ip:
|
|
|
|
alloc.inUse[newNum] = struct{}{}
|
|
|
|
case released := <-alloc.queueReleased:
|
|
|
|
r := ipToInt(released)
|
|
|
|
delete(alloc.inUse, r)
|
|
|
|
|
|
|
|
if inUse {
|
|
|
|
// If we couldn't allocate a new IP, the released one
|
|
|
|
// will be the only free one now, so instantly use it
|
|
|
|
// next time
|
|
|
|
pos = r - ipNum
|
|
|
|
} else {
|
|
|
|
// Use same IP as last time
|
|
|
|
if pos == 1 {
|
|
|
|
pos = max
|
|
|
|
} else {
|
|
|
|
pos--
|
|
|
|
}
|
|
|
|
}
|
2013-02-25 18:45:23 +00:00
|
|
|
}
|
2013-02-28 19:50:02 +00:00
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
func (alloc *IPAllocator) Acquire() (net.IP, error) {
|
2013-03-30 22:32:10 +00:00
|
|
|
ip := <-alloc.queueAlloc
|
|
|
|
return ip.ip, ip.err
|
2013-02-28 19:50:02 +00:00
|
|
|
}
|
|
|
|
|
2013-03-30 22:32:10 +00:00
|
|
|
func (alloc *IPAllocator) Release(ip net.IP) {
|
|
|
|
alloc.queueReleased <- ip
|
2013-02-25 18:45:23 +00:00
|
|
|
}
|
|
|
|
|
2013-03-30 22:32:10 +00:00
|
|
|
func newIPAllocator(network *net.IPNet) *IPAllocator {
|
2013-02-28 19:50:02 +00:00
|
|
|
alloc := &IPAllocator{
|
2013-03-30 22:32:10 +00:00
|
|
|
network: network,
|
|
|
|
queueAlloc: make(chan allocatedIP),
|
|
|
|
queueReleased: make(chan net.IP),
|
|
|
|
inUse: make(map[int32]struct{}),
|
2013-02-28 19:50:02 +00:00
|
|
|
}
|
2013-03-30 22:32:10 +00:00
|
|
|
|
|
|
|
go alloc.run()
|
|
|
|
|
|
|
|
return alloc
|
2013-02-28 19:50:02 +00:00
|
|
|
}
|
|
|
|
|
|
|
|
// Network interface represents the networking stack of a container
|
|
|
|
type NetworkInterface struct {
|
|
|
|
IPNet net.IPNet
|
|
|
|
Gateway net.IP
|
|
|
|
|
|
|
|
manager *NetworkManager
|
|
|
|
extPorts []int
|
|
|
|
}
|
|
|
|
|
|
|
|
// Allocate an external TCP port and map it to the interface
|
|
|
|
func (iface *NetworkInterface) AllocatePort(port int) (int, error) {
|
|
|
|
extPort, err := iface.manager.portAllocator.Acquire()
|
|
|
|
if err != nil {
|
|
|
|
return -1, err
|
|
|
|
}
|
2013-03-21 03:11:16 +00:00
|
|
|
if err := iface.manager.portMapper.Map(extPort, net.TCPAddr{IP: iface.IPNet.IP, Port: port}); err != nil {
|
2013-02-28 19:50:02 +00:00
|
|
|
iface.manager.portAllocator.Release(extPort)
|
|
|
|
return -1, err
|
|
|
|
}
|
|
|
|
iface.extPorts = append(iface.extPorts, extPort)
|
|
|
|
return extPort, nil
|
|
|
|
}
|
|
|
|
|
|
|
|
// Release: Network cleanup - release all resources
|
2013-03-30 22:32:10 +00:00
|
|
|
func (iface *NetworkInterface) Release() {
|
2013-02-28 19:50:02 +00:00
|
|
|
for _, port := range iface.extPorts {
|
|
|
|
if err := iface.manager.portMapper.Unmap(port); err != nil {
|
|
|
|
log.Printf("Unable to unmap port %v: %v", port, err)
|
|
|
|
}
|
|
|
|
if err := iface.manager.portAllocator.Release(port); err != nil {
|
|
|
|
log.Printf("Unable to release port %v: %v", port, err)
|
|
|
|
}
|
|
|
|
|
|
|
|
}
|
2013-03-30 22:32:10 +00:00
|
|
|
|
|
|
|
iface.manager.ipAllocator.Release(iface.IPNet.IP)
|
2013-02-28 19:50:02 +00:00
|
|
|
}
|
|
|
|
|
|
|
|
// Network Manager manages a set of network interfaces
|
|
|
|
// Only *one* manager per host machine should be used
|
|
|
|
type NetworkManager struct {
|
|
|
|
bridgeIface string
|
|
|
|
bridgeNetwork *net.IPNet
|
|
|
|
|
|
|
|
ipAllocator *IPAllocator
|
|
|
|
portAllocator *PortAllocator
|
|
|
|
portMapper *PortMapper
|
|
|
|
}
|
|
|
|
|
|
|
|
// Allocate a network interface
|
|
|
|
func (manager *NetworkManager) Allocate() (*NetworkInterface, error) {
|
|
|
|
ip, err := manager.ipAllocator.Acquire()
|
2013-02-25 18:45:23 +00:00
|
|
|
if err != nil {
|
2013-02-25 22:06:22 +00:00
|
|
|
return nil, err
|
2013-02-25 18:45:23 +00:00
|
|
|
}
|
2013-02-25 22:06:22 +00:00
|
|
|
iface := &NetworkInterface{
|
2013-03-20 13:02:25 +00:00
|
|
|
IPNet: net.IPNet{IP: ip, Mask: manager.bridgeNetwork.Mask},
|
2013-02-28 19:50:02 +00:00
|
|
|
Gateway: manager.bridgeNetwork.IP,
|
|
|
|
manager: manager,
|
2013-02-25 22:06:22 +00:00
|
|
|
}
|
|
|
|
return iface, nil
|
|
|
|
}
|
|
|
|
|
2013-02-28 19:50:02 +00:00
|
|
|
func newNetworkManager(bridgeIface string) (*NetworkManager, error) {
|
|
|
|
addr, err := getIfaceAddr(bridgeIface)
|
|
|
|
if err != nil {
|
|
|
|
return nil, err
|
|
|
|
}
|
|
|
|
network := addr.(*net.IPNet)
|
|
|
|
|
2013-03-30 22:32:10 +00:00
|
|
|
ipAllocator := newIPAllocator(network)
|
2013-02-28 19:50:02 +00:00
|
|
|
|
|
|
|
portAllocator, err := newPortAllocator(portRangeStart, portRangeEnd)
|
|
|
|
if err != nil {
|
|
|
|
return nil, err
|
|
|
|
}
|
|
|
|
|
|
|
|
portMapper, err := newPortMapper()
|
2013-03-23 04:43:31 +00:00
|
|
|
if err != nil {
|
|
|
|
return nil, err
|
|
|
|
}
|
2013-02-28 19:50:02 +00:00
|
|
|
|
|
|
|
manager := &NetworkManager{
|
|
|
|
bridgeIface: bridgeIface,
|
|
|
|
bridgeNetwork: network,
|
|
|
|
ipAllocator: ipAllocator,
|
|
|
|
portAllocator: portAllocator,
|
|
|
|
portMapper: portMapper,
|
|
|
|
}
|
|
|
|
return manager, nil
|
2013-02-25 18:45:23 +00:00
|
|
|
}
|