
If makeVeth fails as a peer exists, the existing peer name should be included in the error message. Signed-off-by: Samuel Karp <samuelkarp@google.com>
259 lines
7.6 KiB
Go
259 lines
7.6 KiB
Go
// Copyright 2015 CNI authors
|
|
//
|
|
// Licensed under the Apache License, Version 2.0 (the "License");
|
|
// you may not use this file except in compliance with the License.
|
|
// You may obtain a copy of the License at
|
|
//
|
|
// http://www.apache.org/licenses/LICENSE-2.0
|
|
//
|
|
// Unless required by applicable law or agreed to in writing, software
|
|
// distributed under the License is distributed on an "AS IS" BASIS,
|
|
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
|
|
// See the License for the specific language governing permissions and
|
|
// limitations under the License.
|
|
|
|
package ip
|
|
|
|
import (
|
|
"crypto/rand"
|
|
"errors"
|
|
"fmt"
|
|
"net"
|
|
"os"
|
|
|
|
"github.com/safchain/ethtool"
|
|
"github.com/vishvananda/netlink"
|
|
|
|
"github.com/containernetworking/plugins/pkg/ns"
|
|
"github.com/containernetworking/plugins/pkg/utils/sysctl"
|
|
)
|
|
|
|
var ErrLinkNotFound = errors.New("link not found")
|
|
|
|
// makeVethPair is called from within the container's network namespace
|
|
func makeVethPair(name, peer string, mtu int, mac string, hostNS ns.NetNS) (netlink.Link, error) {
|
|
veth := &netlink.Veth{
|
|
LinkAttrs: netlink.LinkAttrs{
|
|
Name: name,
|
|
MTU: mtu,
|
|
},
|
|
PeerName: peer,
|
|
PeerNamespace: netlink.NsFd(int(hostNS.Fd())),
|
|
}
|
|
if mac != "" {
|
|
m, err := net.ParseMAC(mac)
|
|
if err != nil {
|
|
return nil, err
|
|
}
|
|
veth.LinkAttrs.HardwareAddr = m
|
|
}
|
|
if err := netlink.LinkAdd(veth); err != nil {
|
|
return nil, err
|
|
}
|
|
// Re-fetch the container link to get its creation-time parameters, e.g. index and mac
|
|
veth2, err := netlink.LinkByName(name)
|
|
if err != nil {
|
|
netlink.LinkDel(veth) // try and clean up the link if possible.
|
|
return nil, err
|
|
}
|
|
|
|
return veth2, nil
|
|
}
|
|
|
|
func peerExists(name string) bool {
|
|
if _, err := netlink.LinkByName(name); err != nil {
|
|
return false
|
|
}
|
|
return true
|
|
}
|
|
|
|
func makeVeth(name, vethPeerName string, mtu int, mac string, hostNS ns.NetNS) (string, netlink.Link, error) {
|
|
var peerName string
|
|
var veth netlink.Link
|
|
var err error
|
|
for i := 0; i < 10; i++ {
|
|
if vethPeerName != "" {
|
|
peerName = vethPeerName
|
|
} else {
|
|
peerName, err = RandomVethName()
|
|
if err != nil {
|
|
return peerName, nil, err
|
|
}
|
|
}
|
|
|
|
veth, err = makeVethPair(name, peerName, mtu, mac, hostNS)
|
|
switch {
|
|
case err == nil:
|
|
return peerName, veth, nil
|
|
|
|
case os.IsExist(err):
|
|
if peerExists(peerName) && vethPeerName == "" {
|
|
continue
|
|
}
|
|
return peerName, veth, fmt.Errorf("container veth name (%q) peer provided (%q) already exists", name, peerName)
|
|
default:
|
|
return peerName, veth, fmt.Errorf("failed to make veth pair: %v", err)
|
|
}
|
|
}
|
|
|
|
// should really never be hit
|
|
return peerName, nil, fmt.Errorf("failed to find a unique veth name")
|
|
}
|
|
|
|
// RandomVethName returns string "veth" with random prefix (hashed from entropy)
|
|
func RandomVethName() (string, error) {
|
|
entropy := make([]byte, 4)
|
|
_, err := rand.Read(entropy)
|
|
if err != nil {
|
|
return "", fmt.Errorf("failed to generate random veth name: %v", err)
|
|
}
|
|
|
|
// NetworkManager (recent versions) will ignore veth devices that start with "veth"
|
|
return fmt.Sprintf("veth%x", entropy), nil
|
|
}
|
|
|
|
func RenameLink(curName, newName string) error {
|
|
link, err := netlink.LinkByName(curName)
|
|
if err == nil {
|
|
err = netlink.LinkSetName(link, newName)
|
|
}
|
|
return err
|
|
}
|
|
|
|
func ifaceFromNetlinkLink(l netlink.Link) net.Interface {
|
|
a := l.Attrs()
|
|
return net.Interface{
|
|
Index: a.Index,
|
|
MTU: a.MTU,
|
|
Name: a.Name,
|
|
HardwareAddr: a.HardwareAddr,
|
|
Flags: a.Flags,
|
|
}
|
|
}
|
|
|
|
// SetupVethWithName sets up a pair of virtual ethernet devices.
|
|
// Call SetupVethWithName from inside the container netns. It will create both veth
|
|
// devices and move the host-side veth into the provided hostNS namespace.
|
|
// hostVethName: If hostVethName is not specified, the host-side veth name will use a random string.
|
|
// On success, SetupVethWithName returns (hostVeth, containerVeth, nil)
|
|
func SetupVethWithName(contVethName, hostVethName string, mtu int, contVethMac string, hostNS ns.NetNS) (net.Interface, net.Interface, error) {
|
|
hostVethName, contVeth, err := makeVeth(contVethName, hostVethName, mtu, contVethMac, hostNS)
|
|
if err != nil {
|
|
return net.Interface{}, net.Interface{}, err
|
|
}
|
|
|
|
var hostVeth netlink.Link
|
|
err = hostNS.Do(func(_ ns.NetNS) error {
|
|
hostVeth, err = netlink.LinkByName(hostVethName)
|
|
if err != nil {
|
|
return fmt.Errorf("failed to lookup %q in %q: %v", hostVethName, hostNS.Path(), err)
|
|
}
|
|
|
|
if err = netlink.LinkSetUp(hostVeth); err != nil {
|
|
return fmt.Errorf("failed to set %q up: %v", hostVethName, err)
|
|
}
|
|
|
|
// we want to own the routes for this interface
|
|
_, _ = sysctl.Sysctl(fmt.Sprintf("net/ipv6/conf/%s/accept_ra", hostVethName), "0")
|
|
return nil
|
|
})
|
|
if err != nil {
|
|
return net.Interface{}, net.Interface{}, err
|
|
}
|
|
return ifaceFromNetlinkLink(hostVeth), ifaceFromNetlinkLink(contVeth), nil
|
|
}
|
|
|
|
// SetupVeth sets up a pair of virtual ethernet devices.
|
|
// Call SetupVeth from inside the container netns. It will create both veth
|
|
// devices and move the host-side veth into the provided hostNS namespace.
|
|
// On success, SetupVeth returns (hostVeth, containerVeth, nil)
|
|
func SetupVeth(contVethName string, mtu int, contVethMac string, hostNS ns.NetNS) (net.Interface, net.Interface, error) {
|
|
return SetupVethWithName(contVethName, "", mtu, contVethMac, hostNS)
|
|
}
|
|
|
|
// DelLinkByName removes an interface link.
|
|
func DelLinkByName(ifName string) error {
|
|
iface, err := netlink.LinkByName(ifName)
|
|
if err != nil {
|
|
if _, ok := err.(netlink.LinkNotFoundError); ok {
|
|
return ErrLinkNotFound
|
|
}
|
|
return fmt.Errorf("failed to lookup %q: %v", ifName, err)
|
|
}
|
|
|
|
if err = netlink.LinkDel(iface); err != nil {
|
|
return fmt.Errorf("failed to delete %q: %v", ifName, err)
|
|
}
|
|
|
|
return nil
|
|
}
|
|
|
|
// DelLinkByNameAddr remove an interface and returns its addresses
|
|
func DelLinkByNameAddr(ifName string) ([]*net.IPNet, error) {
|
|
iface, err := netlink.LinkByName(ifName)
|
|
if err != nil {
|
|
if _, ok := err.(netlink.LinkNotFoundError); ok {
|
|
return nil, ErrLinkNotFound
|
|
}
|
|
return nil, fmt.Errorf("failed to lookup %q: %v", ifName, err)
|
|
}
|
|
|
|
addrs, err := netlink.AddrList(iface, netlink.FAMILY_ALL)
|
|
if err != nil {
|
|
return nil, fmt.Errorf("failed to get IP addresses for %q: %v", ifName, err)
|
|
}
|
|
|
|
if err = netlink.LinkDel(iface); err != nil {
|
|
return nil, fmt.Errorf("failed to delete %q: %v", ifName, err)
|
|
}
|
|
|
|
out := []*net.IPNet{}
|
|
for _, addr := range addrs {
|
|
if addr.IP.IsGlobalUnicast() {
|
|
out = append(out, addr.IPNet)
|
|
}
|
|
}
|
|
|
|
return out, nil
|
|
}
|
|
|
|
// GetVethPeerIfindex returns the veth link object, the peer ifindex of the
|
|
// veth, or an error. This peer ifindex will only be valid in the peer's
|
|
// network namespace.
|
|
func GetVethPeerIfindex(ifName string) (netlink.Link, int, error) {
|
|
link, err := netlink.LinkByName(ifName)
|
|
if err != nil {
|
|
return nil, -1, fmt.Errorf("could not look up %q: %v", ifName, err)
|
|
}
|
|
if _, ok := link.(*netlink.Veth); !ok {
|
|
return nil, -1, fmt.Errorf("interface %q was not a veth interface", ifName)
|
|
}
|
|
|
|
// veth supports IFLA_LINK (what vishvananda/netlink calls ParentIndex)
|
|
// on 4.1 and higher kernels
|
|
peerIndex := link.Attrs().ParentIndex
|
|
if peerIndex <= 0 {
|
|
// Fall back to ethtool for 4.0 and earlier kernels
|
|
e, err := ethtool.NewEthtool()
|
|
if err != nil {
|
|
return nil, -1, fmt.Errorf("failed to initialize ethtool: %v", err)
|
|
}
|
|
defer e.Close()
|
|
|
|
stats, err := e.Stats(link.Attrs().Name)
|
|
if err != nil {
|
|
return nil, -1, fmt.Errorf("failed to request ethtool stats: %v", err)
|
|
}
|
|
n, ok := stats["peer_ifindex"]
|
|
if !ok {
|
|
return nil, -1, fmt.Errorf("failed to find 'peer_ifindex' in ethtool stats")
|
|
}
|
|
if n > 32767 || n == 0 {
|
|
return nil, -1, fmt.Errorf("invalid 'peer_ifindex' %d", n)
|
|
}
|
|
peerIndex = int(n)
|
|
}
|
|
|
|
return link, peerIndex, nil
|
|
}
|