package tio import ( "io" "github.com/slackhq/nebula/wire" ) // QueueSet holds one or many Queue objects and helps close them in an orderly way. type QueueSet interface { io.Closer Queues() []Queue // Add takes a tun fd, adds it to the set, and prepares it for use as a Queue. Add(fd int) error } // Capabilities advertises which kernel offload features a Queue successfully negotiated. // Callers consult this to decide which coalescers to wire onto the write path. type Capabilities struct { // TSO means the FD was opened with IFF_VNET_HDR and the kernel agreed // to TUN_F_TSO4|TSO6 — i.e. WriteGSO with GSOProtoTCP is safe. TSO bool // USO means the kernel additionally agreed to TUN_F_USO4|USO6, so // WriteGSO with GSOProtoUDP is safe. Linux ≥ 6.2. USO bool } // Queue is a readable/writable Poll queue. One Queue is driven by a single // read goroutine plus a single writer (see Write below). type Queue interface { io.Closer // Read will read at least 1 packet from the tun (up to len(p)). // mem will be used to provide the backing for each of p[n].Bytes. // Callers should size mem and p to avoid exhausting mem before p. // Returns the number of packets actually read, or error. Read(p []wire.TunPacket, mem []byte) (int, error) // Write emits a single packet on the plaintext (outside→inside) // delivery path. Write(p []byte) (int, error) // Capabilities returns the Queue's negotiated offload capabilities, // or the zero value when q does not advertise any. Capabilities() Capabilities } // GSOInfo describes a kernel-supplied superpacket sitting in Packet.Bytes. // The zero value means "not a superpacket" — Bytes is one regular IP // datagram and no segmentation is required. type GSOInfo struct { // Size is the GSO segment size: max payload bytes per segment // (== TCP MSS for TSO, == UDP payload chunk for USO). Zero means // not a superpacket. Size uint16 // HdrLen is the total L3+L4 header length within Bytes (already // corrected via correctHdrLen, so safe to slice on). HdrLen uint16 // CsumStart is the L4 header offset inside Bytes (== L3 header // length). CsumStart uint16 // Proto picks the L4 protocol (TCP or UDP) so the segmenter knows // which checksum/header layout to apply. Proto GSOProto } // GSOProto selects the L4 protocol for a GSO superpacket. Determines which // VIRTIO_NET_HDR_GSO_* type the writer stamps and which checksum offset // inside the transport header virtio NEEDS_CSUM expects. type GSOProto uint8 const ( GSOProtoNone GSOProto = iota GSOProtoTCP GSOProtoUDP ) // GSOWriter is implemented by Queues that can emit a TCP or UDP superpacket // assembled from a header prefix plus one or more borrowed payload // fragments, in a single vectored write (writev with a leading // virtio_net_hdr). This lets the coalescer avoid copying payload bytes // between the caller's decrypt buffer and the TUN. Backends without GSO // support do not implement this interface and coalescing is skipped. // // hdr contains the IPv4/IPv6 header prefix (mutable - callers will have // filled in total length and IP csum). transportHdr is the TCP or UDP // header (mutable - the L4 checksum field must hold the pseudo-header // partial, single-fold not inverted, per virtio NEEDS_CSUM semantics). // pays are non-overlapping payload fragments whose concatenation is the // full superpacket payload; they are read-only from the writer's // perspective and must remain valid until the call returns. Every segment // in pays except possibly the last is exactly the same size. proto picks // the L4 protocol so the writer knows which GSOType / CsumOffset to set. // // Callers should also consult CapsProvider (via SupportsGSO or // QueueCapabilities) for the per-protocol negotiated capability; an // implementation of GSOWriter is necessary but not sufficient since USO // may not have been negotiated even when TSO was. type GSOWriter interface { WriteGSO(hdr []byte, transportHdr []byte, pays [][]byte, proto GSOProto) error } // SupportsGSO reports whether w implements GSOWriter and the underlying // queue advertises the negotiated capability for `want`. A writer that // implements GSOWriter but not CapsProvider is treated as permissive // (used by tests and fakes that don't negotiate). func SupportsGSO(w Queue, want GSOProto) (GSOWriter, bool) { gw, ok := w.(GSOWriter) if !ok { return nil, false } caps := w.Capabilities() switch want { case GSOProtoTCP: return gw, caps.TSO case GSOProtoUDP: return gw, caps.USO default: return gw, false } }