2017-01-09 20:33:55 +01:00
|
|
|
package netlink
|
|
|
|
|
|
|
|
import (
|
|
|
|
"errors"
|
2017-11-02 12:30:34 +01:00
|
|
|
"io"
|
2017-02-28 22:59:37 +01:00
|
|
|
"math/rand"
|
2017-11-02 12:30:34 +01:00
|
|
|
"os"
|
2017-01-09 20:33:55 +01:00
|
|
|
"sync/atomic"
|
2017-02-28 22:59:37 +01:00
|
|
|
|
|
|
|
"golang.org/x/net/bpf"
|
2017-01-09 20:33:55 +01:00
|
|
|
)
|
|
|
|
|
|
|
|
// Error messages which can be returned by Validate.
|
|
|
|
var (
|
|
|
|
errMismatchedSequence = errors.New("mismatched sequence in netlink reply")
|
|
|
|
errMismatchedPID = errors.New("mismatched PID in netlink reply")
|
|
|
|
errShortErrorMessage = errors.New("not enough data for netlink error code")
|
|
|
|
)
|
|
|
|
|
2017-11-02 12:30:34 +01:00
|
|
|
// Errors which can be returned by a Socket that does not implement
|
|
|
|
// all exposed methods of Conn.
|
|
|
|
var (
|
|
|
|
errReadWriteCloserNotSupported = errors.New("raw read/write/closer not supported")
|
|
|
|
errMulticastGroupsNotSupported = errors.New("multicast groups not supported")
|
|
|
|
errBPFFiltersNotSupported = errors.New("BPF filters not supported")
|
|
|
|
)
|
|
|
|
|
2017-01-09 20:33:55 +01:00
|
|
|
// A Conn is a connection to netlink. A Conn can be used to send and
|
|
|
|
// receives messages to and from netlink.
|
2018-01-25 18:20:39 +01:00
|
|
|
//
|
|
|
|
// A Conn is safe for concurrent use, but to avoid contention in
|
|
|
|
// high-throughput applications, the caller should almost certainly create a
|
|
|
|
// pool of Conns and distribute them among workers.
|
2017-01-09 20:33:55 +01:00
|
|
|
type Conn struct {
|
2017-11-02 12:30:34 +01:00
|
|
|
// sock is the operating system-specific implementation of
|
2017-01-09 20:33:55 +01:00
|
|
|
// a netlink sockets connection.
|
2017-11-02 12:30:34 +01:00
|
|
|
sock Socket
|
2017-01-09 20:33:55 +01:00
|
|
|
|
|
|
|
// seq is an atomically incremented integer used to provide sequence
|
|
|
|
// numbers when Conn.Send is called.
|
|
|
|
seq *uint32
|
2017-01-12 18:41:35 +01:00
|
|
|
|
2017-03-10 18:32:29 +01:00
|
|
|
// pid is the PID assigned by netlink.
|
|
|
|
pid uint32
|
2017-01-09 20:33:55 +01:00
|
|
|
}
|
|
|
|
|
2017-11-02 12:30:34 +01:00
|
|
|
// A Socket is an operating-system specific implementation of netlink
|
2017-01-09 20:33:55 +01:00
|
|
|
// sockets used by Conn.
|
2017-11-02 12:30:34 +01:00
|
|
|
type Socket interface {
|
2017-01-09 20:33:55 +01:00
|
|
|
Close() error
|
|
|
|
Send(m Message) error
|
|
|
|
Receive() ([]Message, error)
|
|
|
|
}
|
|
|
|
|
2017-11-02 12:30:34 +01:00
|
|
|
// Dial dials a connection to netlink, using the specified netlink family.
|
2017-01-09 20:33:55 +01:00
|
|
|
// Config specifies optional configuration for Conn. If config is nil, a default
|
|
|
|
// configuration will be used.
|
2017-11-02 12:30:34 +01:00
|
|
|
func Dial(family int, config *Config) (*Conn, error) {
|
|
|
|
// Use OS-specific dial() to create Socket
|
|
|
|
c, pid, err := dial(family, config)
|
2017-01-09 20:33:55 +01:00
|
|
|
if err != nil {
|
|
|
|
return nil, err
|
|
|
|
}
|
|
|
|
|
2017-11-02 12:30:34 +01:00
|
|
|
return NewConn(c, pid), nil
|
2017-01-09 20:33:55 +01:00
|
|
|
}
|
|
|
|
|
2017-11-02 12:30:34 +01:00
|
|
|
// NewConn creates a Conn using the specified Socket and PID for netlink
|
|
|
|
// communications.
|
|
|
|
//
|
|
|
|
// NewConn is primarily useful for tests. Most applications should use
|
|
|
|
// Dial instead.
|
|
|
|
func NewConn(c Socket, pid uint32) *Conn {
|
2017-02-28 22:59:37 +01:00
|
|
|
seq := rand.Uint32()
|
|
|
|
|
2017-01-09 20:33:55 +01:00
|
|
|
return &Conn{
|
2017-11-02 12:30:34 +01:00
|
|
|
sock: c,
|
|
|
|
seq: &seq,
|
|
|
|
pid: pid,
|
2017-01-09 20:33:55 +01:00
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
// Close closes the connection.
|
|
|
|
func (c *Conn) Close() error {
|
2017-11-02 12:30:34 +01:00
|
|
|
return c.sock.Close()
|
2017-01-09 20:33:55 +01:00
|
|
|
}
|
|
|
|
|
|
|
|
// Execute sends a single Message to netlink using Conn.Send, receives one or more
|
|
|
|
// replies using Conn.Receive, and then checks the validity of the replies against
|
|
|
|
// the request using Validate.
|
|
|
|
//
|
|
|
|
// See the documentation of Conn.Send, Conn.Receive, and Validate for details about
|
|
|
|
// each function.
|
|
|
|
func (c *Conn) Execute(m Message) ([]Message, error) {
|
|
|
|
req, err := c.Send(m)
|
|
|
|
if err != nil {
|
|
|
|
return nil, err
|
|
|
|
}
|
|
|
|
|
|
|
|
replies, err := c.Receive()
|
|
|
|
if err != nil {
|
|
|
|
return nil, err
|
|
|
|
}
|
|
|
|
|
|
|
|
if err := Validate(req, replies); err != nil {
|
|
|
|
return nil, err
|
|
|
|
}
|
|
|
|
|
|
|
|
return replies, nil
|
|
|
|
}
|
|
|
|
|
|
|
|
// Send sends a single Message to netlink. In most cases, m.Header's Length,
|
|
|
|
// Sequence, and PID fields should be set to 0, so they can be populated
|
|
|
|
// automatically before the Message is sent. On success, Send returns a copy
|
|
|
|
// of the Message with all parameters populated, for later validation.
|
|
|
|
//
|
|
|
|
// If m.Header.Length is 0, it will be automatically populated using the
|
|
|
|
// correct length for the Message, including its payload.
|
|
|
|
//
|
|
|
|
// If m.Header.Sequence is 0, it will be automatically populated using the
|
|
|
|
// next sequence number for this connection.
|
|
|
|
//
|
2017-01-12 18:41:35 +01:00
|
|
|
// If m.Header.PID is 0, it will be automatically populated using a PID
|
|
|
|
// assigned by netlink.
|
2017-01-09 20:33:55 +01:00
|
|
|
func (c *Conn) Send(m Message) (Message, error) {
|
|
|
|
ml := nlmsgLength(len(m.Data))
|
|
|
|
|
2017-01-09 20:37:59 +01:00
|
|
|
// TODO(mdlayher): fine-tune this limit.
|
|
|
|
if ml > (1024 * 32) {
|
2017-01-09 20:33:55 +01:00
|
|
|
return Message{}, errors.New("netlink message data too large")
|
|
|
|
}
|
|
|
|
|
|
|
|
if m.Header.Length == 0 {
|
|
|
|
m.Header.Length = uint32(nlmsgAlign(ml))
|
|
|
|
}
|
|
|
|
|
|
|
|
if m.Header.Sequence == 0 {
|
|
|
|
m.Header.Sequence = c.nextSequence()
|
|
|
|
}
|
|
|
|
|
|
|
|
if m.Header.PID == 0 {
|
2017-03-10 18:32:29 +01:00
|
|
|
m.Header.PID = c.pid
|
2017-01-09 20:33:55 +01:00
|
|
|
}
|
|
|
|
|
2017-11-02 12:30:34 +01:00
|
|
|
if err := c.sock.Send(m); err != nil {
|
2017-01-09 20:33:55 +01:00
|
|
|
return Message{}, err
|
|
|
|
}
|
|
|
|
|
|
|
|
return m, nil
|
|
|
|
}
|
|
|
|
|
|
|
|
// Receive receives one or more messages from netlink. Multi-part messages are
|
|
|
|
// handled transparently and returned as a single slice of Messages, with the
|
2017-01-12 18:41:35 +01:00
|
|
|
// final empty "multi-part done" message removed.
|
|
|
|
//
|
|
|
|
// If any of the messages indicate a netlink error, that error will be returned.
|
2017-01-09 20:33:55 +01:00
|
|
|
func (c *Conn) Receive() ([]Message, error) {
|
|
|
|
msgs, err := c.receive()
|
|
|
|
if err != nil {
|
|
|
|
return nil, err
|
|
|
|
}
|
|
|
|
|
2017-11-02 12:30:34 +01:00
|
|
|
// When using nltest, it's possible for zero messages to be returned by receive.
|
|
|
|
if len(msgs) == 0 {
|
|
|
|
return msgs, nil
|
|
|
|
}
|
|
|
|
|
2017-01-09 20:33:55 +01:00
|
|
|
// Trim the final message with multi-part done indicator if
|
2017-11-02 12:30:34 +01:00
|
|
|
// present.
|
2017-01-09 20:33:55 +01:00
|
|
|
if m := msgs[len(msgs)-1]; m.Header.Flags&HeaderFlagsMulti != 0 && m.Header.Type == HeaderTypeDone {
|
|
|
|
return msgs[:len(msgs)-1], nil
|
|
|
|
}
|
|
|
|
|
|
|
|
return msgs, nil
|
|
|
|
}
|
|
|
|
|
|
|
|
// receive is the internal implementation of Conn.Receive, which can be called
|
|
|
|
// recursively to handle multi-part messages.
|
|
|
|
func (c *Conn) receive() ([]Message, error) {
|
2017-11-02 12:30:34 +01:00
|
|
|
msgs, err := c.sock.Receive()
|
2017-01-09 20:33:55 +01:00
|
|
|
if err != nil {
|
|
|
|
return nil, err
|
|
|
|
}
|
|
|
|
|
|
|
|
// If this message is multi-part, we will need to perform an recursive call
|
|
|
|
// to continue draining the socket
|
|
|
|
var multi bool
|
|
|
|
|
|
|
|
for _, m := range msgs {
|
|
|
|
// Is this a multi-part message and is it not done yet?
|
|
|
|
if m.Header.Flags&HeaderFlagsMulti != 0 && m.Header.Type != HeaderTypeDone {
|
|
|
|
multi = true
|
|
|
|
}
|
|
|
|
|
|
|
|
if err := checkMessage(m); err != nil {
|
|
|
|
return nil, err
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
if !multi {
|
|
|
|
return msgs, nil
|
|
|
|
}
|
|
|
|
|
|
|
|
// More messages waiting
|
|
|
|
mmsgs, err := c.receive()
|
|
|
|
if err != nil {
|
|
|
|
return nil, err
|
|
|
|
}
|
|
|
|
|
|
|
|
return append(msgs, mmsgs...), nil
|
|
|
|
}
|
|
|
|
|
2017-11-02 12:30:34 +01:00
|
|
|
// An fder is a Socket that supports retrieving its raw file descriptor.
|
|
|
|
type fder interface {
|
|
|
|
Socket
|
|
|
|
FD() int
|
|
|
|
}
|
|
|
|
|
|
|
|
var _ io.ReadWriteCloser = &fileReadWriteCloser{}
|
|
|
|
|
|
|
|
// A fileReadWriteCloser is a limited *os.File which only allows access to its
|
|
|
|
// Read and Write methods.
|
|
|
|
type fileReadWriteCloser struct {
|
|
|
|
f *os.File
|
|
|
|
}
|
|
|
|
|
|
|
|
// Read implements io.ReadWriteCloser.
|
|
|
|
func (rwc *fileReadWriteCloser) Read(b []byte) (int, error) { return rwc.f.Read(b) }
|
|
|
|
|
|
|
|
// Write implements io.ReadWriteCloser.
|
|
|
|
func (rwc *fileReadWriteCloser) Write(b []byte) (int, error) { return rwc.f.Write(b) }
|
|
|
|
|
|
|
|
// Close implements io.ReadWriteCloser.
|
|
|
|
func (rwc *fileReadWriteCloser) Close() error { return rwc.f.Close() }
|
|
|
|
|
|
|
|
// ReadWriteCloser returns a raw io.ReadWriteCloser backed by the connection
|
|
|
|
// of the Conn.
|
|
|
|
//
|
|
|
|
// ReadWriteCloser is intended for advanced use cases, such as those that do
|
|
|
|
// not involve standard netlink message passing.
|
|
|
|
//
|
|
|
|
// Once invoked, it is the caller's responsibility to ensure that operations
|
|
|
|
// performed using Conn and the raw io.ReadWriteCloser do not conflict with
|
|
|
|
// each other. In almost all scenarios, only one of the two should be used.
|
|
|
|
func (c *Conn) ReadWriteCloser() (io.ReadWriteCloser, error) {
|
|
|
|
fc, ok := c.sock.(fder)
|
|
|
|
if !ok {
|
|
|
|
return nil, errReadWriteCloserNotSupported
|
|
|
|
}
|
|
|
|
|
|
|
|
return &fileReadWriteCloser{
|
|
|
|
// Backing the io.ReadWriteCloser with an *os.File enables easy reading
|
|
|
|
// and writing without more system call boilerplate.
|
|
|
|
f: os.NewFile(uintptr(fc.FD()), "netlink"),
|
|
|
|
}, nil
|
|
|
|
}
|
|
|
|
|
|
|
|
// A groupJoinLeaver is a Socket that supports joining and leaving
|
|
|
|
// netlink multicast groups.
|
|
|
|
type groupJoinLeaver interface {
|
|
|
|
Socket
|
|
|
|
JoinGroup(group uint32) error
|
|
|
|
LeaveGroup(group uint32) error
|
|
|
|
}
|
|
|
|
|
2017-01-09 20:33:55 +01:00
|
|
|
// JoinGroup joins a netlink multicast group by its ID.
|
|
|
|
func (c *Conn) JoinGroup(group uint32) error {
|
2017-11-02 12:30:34 +01:00
|
|
|
gc, ok := c.sock.(groupJoinLeaver)
|
|
|
|
if !ok {
|
|
|
|
return errMulticastGroupsNotSupported
|
|
|
|
}
|
|
|
|
|
|
|
|
return gc.JoinGroup(group)
|
2017-01-09 20:33:55 +01:00
|
|
|
}
|
|
|
|
|
|
|
|
// LeaveGroup leaves a netlink multicast group by its ID.
|
|
|
|
func (c *Conn) LeaveGroup(group uint32) error {
|
2017-11-02 12:30:34 +01:00
|
|
|
gc, ok := c.sock.(groupJoinLeaver)
|
|
|
|
if !ok {
|
|
|
|
return errMulticastGroupsNotSupported
|
|
|
|
}
|
|
|
|
|
|
|
|
return gc.LeaveGroup(group)
|
|
|
|
}
|
|
|
|
|
|
|
|
// A bpfSetter is a Socket that supports setting BPF filters.
|
|
|
|
type bpfSetter interface {
|
|
|
|
Socket
|
|
|
|
bpf.Setter
|
2017-01-09 20:33:55 +01:00
|
|
|
}
|
|
|
|
|
2017-02-28 22:59:37 +01:00
|
|
|
// SetBPF attaches an assembled BPF program to a Conn.
|
|
|
|
func (c *Conn) SetBPF(filter []bpf.RawInstruction) error {
|
2017-11-02 12:30:34 +01:00
|
|
|
bc, ok := c.sock.(bpfSetter)
|
|
|
|
if !ok {
|
|
|
|
return errBPFFiltersNotSupported
|
|
|
|
}
|
|
|
|
|
|
|
|
return bc.SetBPF(filter)
|
2017-02-28 22:59:37 +01:00
|
|
|
}
|
|
|
|
|
2017-01-09 20:33:55 +01:00
|
|
|
// nextSequence atomically increments Conn's sequence number and returns
|
|
|
|
// the incremented value.
|
|
|
|
func (c *Conn) nextSequence() uint32 {
|
|
|
|
return atomic.AddUint32(c.seq, 1)
|
|
|
|
}
|
|
|
|
|
|
|
|
// Validate validates one or more reply Messages against a request Message,
|
|
|
|
// ensuring that they contain matching sequence numbers and PIDs.
|
|
|
|
func Validate(request Message, replies []Message) error {
|
|
|
|
for _, m := range replies {
|
2017-01-12 18:41:35 +01:00
|
|
|
// Check for mismatched sequence, unless:
|
|
|
|
// - request had no sequence, meaning we are probably validating
|
|
|
|
// a multicast reply
|
|
|
|
if m.Header.Sequence != request.Header.Sequence && request.Header.Sequence != 0 {
|
2017-01-09 20:33:55 +01:00
|
|
|
return errMismatchedSequence
|
|
|
|
}
|
2017-01-12 18:41:35 +01:00
|
|
|
|
|
|
|
// Check for mismatched PID, unless:
|
|
|
|
// - request had no PID, meaning we are either:
|
|
|
|
// - validating a multicast reply
|
|
|
|
// - netlink has not yet assigned us a PID
|
|
|
|
// - response had no PID, meaning it's from the kernel as a multicast reply
|
|
|
|
if m.Header.PID != request.Header.PID && request.Header.PID != 0 && m.Header.PID != 0 {
|
2017-01-09 20:33:55 +01:00
|
|
|
return errMismatchedPID
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
return nil
|
|
|
|
}
|
|
|
|
|
|
|
|
// Config contains options for a Conn.
|
|
|
|
type Config struct {
|
|
|
|
// Groups is a bitmask which specifies multicast groups. If set to 0,
|
|
|
|
// no multicast group subscriptions will be made.
|
|
|
|
Groups uint32
|
2018-01-25 18:20:39 +01:00
|
|
|
|
|
|
|
// Experimental: do not lock the internal system call handling goroutine
|
|
|
|
// to its OS thread. This may result in a speed-up of system call handling,
|
|
|
|
// but may cause unexpected behavior when sending and receiving a large number
|
|
|
|
// of messages.
|
|
|
|
//
|
|
|
|
// This should almost certainly be set to false, but if you come up with a
|
|
|
|
// valid reason for using this, please file an issue at
|
|
|
|
// https://github.com/mdlayher/netlink to discuss your thoughts.
|
|
|
|
NoLockThread bool
|
2017-01-09 20:33:55 +01:00
|
|
|
}
|