link_linux.go 7.5 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261
  1. // Copyright 2015 CNI authors
  2. //
  3. // Licensed under the Apache License, Version 2.0 (the "License");
  4. // you may not use this file except in compliance with the License.
  5. // You may obtain a copy of the License at
  6. //
  7. // http://www.apache.org/licenses/LICENSE-2.0
  8. //
  9. // Unless required by applicable law or agreed to in writing, software
  10. // distributed under the License is distributed on an "AS IS" BASIS,
  11. // WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
  12. // See the License for the specific language governing permissions and
  13. // limitations under the License.
  14. package ip
  15. import (
  16. "crypto/rand"
  17. "errors"
  18. "fmt"
  19. "net"
  20. "os"
  21. "github.com/safchain/ethtool"
  22. "github.com/vishvananda/netlink"
  23. "github.com/containernetworking/plugins/pkg/ns"
  24. "github.com/containernetworking/plugins/pkg/utils/sysctl"
  25. )
  26. var (
  27. ErrLinkNotFound = errors.New("link not found")
  28. )
  29. // makeVethPair is called from within the container's network namespace
  30. func makeVethPair(name, peer string, mtu int, mac string, hostNS ns.NetNS) (netlink.Link, error) {
  31. veth := &netlink.Veth{
  32. LinkAttrs: netlink.LinkAttrs{
  33. Name: name,
  34. MTU: mtu,
  35. },
  36. PeerName: peer,
  37. PeerNamespace: netlink.NsFd(int(hostNS.Fd())),
  38. }
  39. if mac != "" {
  40. m, err := net.ParseMAC(mac)
  41. if err != nil {
  42. return nil, err
  43. }
  44. veth.LinkAttrs.HardwareAddr = m
  45. }
  46. if err := netlink.LinkAdd(veth); err != nil {
  47. return nil, err
  48. }
  49. // Re-fetch the container link to get its creation-time parameters, e.g. index and mac
  50. veth2, err := netlink.LinkByName(name)
  51. if err != nil {
  52. netlink.LinkDel(veth) // try and clean up the link if possible.
  53. return nil, err
  54. }
  55. return veth2, nil
  56. }
  57. func peerExists(name string) bool {
  58. if _, err := netlink.LinkByName(name); err != nil {
  59. return false
  60. }
  61. return true
  62. }
  63. func makeVeth(name, vethPeerName string, mtu int, mac string, hostNS ns.NetNS) (peerName string, veth netlink.Link, err error) {
  64. for i := 0; i < 10; i++ {
  65. if vethPeerName != "" {
  66. peerName = vethPeerName
  67. } else {
  68. peerName, err = RandomVethName()
  69. if err != nil {
  70. return
  71. }
  72. }
  73. veth, err = makeVethPair(name, peerName, mtu, mac, hostNS)
  74. switch {
  75. case err == nil:
  76. return
  77. case os.IsExist(err):
  78. if peerExists(peerName) && vethPeerName == "" {
  79. continue
  80. }
  81. err = fmt.Errorf("container veth name provided (%v) already exists", name)
  82. return
  83. default:
  84. err = fmt.Errorf("failed to make veth pair: %v", err)
  85. return
  86. }
  87. }
  88. // should really never be hit
  89. err = fmt.Errorf("failed to find a unique veth name")
  90. return
  91. }
  92. // RandomVethName returns string "veth" with random prefix (hashed from entropy)
  93. func RandomVethName() (string, error) {
  94. entropy := make([]byte, 4)
  95. _, err := rand.Read(entropy)
  96. if err != nil {
  97. return "", fmt.Errorf("failed to generate random veth name: %v", err)
  98. }
  99. // NetworkManager (recent versions) will ignore veth devices that start with "veth"
  100. return fmt.Sprintf("veth%x", entropy), nil
  101. }
  102. func RenameLink(curName, newName string) error {
  103. link, err := netlink.LinkByName(curName)
  104. if err == nil {
  105. err = netlink.LinkSetName(link, newName)
  106. }
  107. return err
  108. }
  109. func ifaceFromNetlinkLink(l netlink.Link) net.Interface {
  110. a := l.Attrs()
  111. return net.Interface{
  112. Index: a.Index,
  113. MTU: a.MTU,
  114. Name: a.Name,
  115. HardwareAddr: a.HardwareAddr,
  116. Flags: a.Flags,
  117. }
  118. }
  119. // SetupVethWithName sets up a pair of virtual ethernet devices.
  120. // Call SetupVethWithName from inside the container netns. It will create both veth
  121. // devices and move the host-side veth into the provided hostNS namespace.
  122. // hostVethName: If hostVethName is not specified, the host-side veth name will use a random string.
  123. // On success, SetupVethWithName returns (hostVeth, containerVeth, nil)
  124. func SetupVethWithName(contVethName, hostVethName string, mtu int, contVethMac string, hostNS ns.NetNS) (net.Interface, net.Interface, error) {
  125. hostVethName, contVeth, err := makeVeth(contVethName, hostVethName, mtu, contVethMac, hostNS)
  126. if err != nil {
  127. return net.Interface{}, net.Interface{}, err
  128. }
  129. var hostVeth netlink.Link
  130. err = hostNS.Do(func(_ ns.NetNS) error {
  131. hostVeth, err = netlink.LinkByName(hostVethName)
  132. if err != nil {
  133. return fmt.Errorf("failed to lookup %q in %q: %v", hostVethName, hostNS.Path(), err)
  134. }
  135. if err = netlink.LinkSetUp(hostVeth); err != nil {
  136. return fmt.Errorf("failed to set %q up: %v", hostVethName, err)
  137. }
  138. // we want to own the routes for this interface
  139. _, _ = sysctl.Sysctl(fmt.Sprintf("net/ipv6/conf/%s/accept_ra", hostVethName), "0")
  140. return nil
  141. })
  142. if err != nil {
  143. return net.Interface{}, net.Interface{}, err
  144. }
  145. return ifaceFromNetlinkLink(hostVeth), ifaceFromNetlinkLink(contVeth), nil
  146. }
  147. // SetupVeth sets up a pair of virtual ethernet devices.
  148. // Call SetupVeth from inside the container netns. It will create both veth
  149. // devices and move the host-side veth into the provided hostNS namespace.
  150. // On success, SetupVeth returns (hostVeth, containerVeth, nil)
  151. func SetupVeth(contVethName string, mtu int, contVethMac string, hostNS ns.NetNS) (net.Interface, net.Interface, error) {
  152. return SetupVethWithName(contVethName, "", mtu, contVethMac, hostNS)
  153. }
  154. // DelLinkByName removes an interface link.
  155. func DelLinkByName(ifName string) error {
  156. iface, err := netlink.LinkByName(ifName)
  157. if err != nil {
  158. if _, ok := err.(netlink.LinkNotFoundError); ok {
  159. return ErrLinkNotFound
  160. }
  161. return fmt.Errorf("failed to lookup %q: %v", ifName, err)
  162. }
  163. if err = netlink.LinkDel(iface); err != nil {
  164. return fmt.Errorf("failed to delete %q: %v", ifName, err)
  165. }
  166. return nil
  167. }
  168. // DelLinkByNameAddr remove an interface and returns its addresses
  169. func DelLinkByNameAddr(ifName string) ([]*net.IPNet, error) {
  170. iface, err := netlink.LinkByName(ifName)
  171. if err != nil {
  172. if _, ok := err.(netlink.LinkNotFoundError); ok {
  173. return nil, ErrLinkNotFound
  174. }
  175. return nil, fmt.Errorf("failed to lookup %q: %v", ifName, err)
  176. }
  177. addrs, err := netlink.AddrList(iface, netlink.FAMILY_ALL)
  178. if err != nil {
  179. return nil, fmt.Errorf("failed to get IP addresses for %q: %v", ifName, err)
  180. }
  181. if err = netlink.LinkDel(iface); err != nil {
  182. return nil, fmt.Errorf("failed to delete %q: %v", ifName, err)
  183. }
  184. out := []*net.IPNet{}
  185. for _, addr := range addrs {
  186. if addr.IP.IsGlobalUnicast() {
  187. out = append(out, addr.IPNet)
  188. }
  189. }
  190. return out, nil
  191. }
  192. // GetVethPeerIfindex returns the veth link object, the peer ifindex of the
  193. // veth, or an error. This peer ifindex will only be valid in the peer's
  194. // network namespace.
  195. func GetVethPeerIfindex(ifName string) (netlink.Link, int, error) {
  196. link, err := netlink.LinkByName(ifName)
  197. if err != nil {
  198. return nil, -1, fmt.Errorf("could not look up %q: %v", ifName, err)
  199. }
  200. if _, ok := link.(*netlink.Veth); !ok {
  201. return nil, -1, fmt.Errorf("interface %q was not a veth interface", ifName)
  202. }
  203. // veth supports IFLA_LINK (what vishvananda/netlink calls ParentIndex)
  204. // on 4.1 and higher kernels
  205. peerIndex := link.Attrs().ParentIndex
  206. if peerIndex <= 0 {
  207. // Fall back to ethtool for 4.0 and earlier kernels
  208. e, err := ethtool.NewEthtool()
  209. if err != nil {
  210. return nil, -1, fmt.Errorf("failed to initialize ethtool: %v", err)
  211. }
  212. defer e.Close()
  213. stats, err := e.Stats(link.Attrs().Name)
  214. if err != nil {
  215. return nil, -1, fmt.Errorf("failed to request ethtool stats: %v", err)
  216. }
  217. n, ok := stats["peer_ifindex"]
  218. if !ok {
  219. return nil, -1, fmt.Errorf("failed to find 'peer_ifindex' in ethtool stats")
  220. }
  221. if n > 32767 || n == 0 {
  222. return nil, -1, fmt.Errorf("invalid 'peer_ifindex' %d", n)
  223. }
  224. peerIndex = int(n)
  225. }
  226. return link, peerIndex, nil
  227. }