mirror of
https://git.FreeBSD.org/src.git
synced 2025-01-24 16:10:11 +00:00
d0728d7174
network stacks, VNET_SYSINIT: - Add VNET_SYSINIT and VNET_SYSUNINIT macros to declare events that will occur each time a network stack is instantiated and destroyed. In the !VIMAGE case, these are simply mapped into regular SYSINIT/SYSUNINIT. For the VIMAGE case, we instead use SYSINIT's to track their order and properties on registration, using them for each vnet when created/ destroyed, or immediately on module load for already-started vnets. - Remove vnet_modinfo mechanism that existed to serve this purpose previously, as well as its dependency scheme: we now just use the SYSINIT ordering scheme. - Implement VNET_DOMAIN_SET() to allow protocol domains to declare that they want init functions to be called for each virtual network stack rather than just once at boot, compiling down to DOMAIN_SET() in the non-VIMAGE case. - Walk all virtualized kernel subsystems and make use of these instead of modinfo or DOMAIN_SET() for init/uninit events. In some cases, convert modular components from using modevent to using sysinit (where appropriate). In some cases, do minor rejuggling of SYSINIT ordering to make room for or better manage events. Portions submitted by: jhb (VNET_SYSINIT), bz (cleanup) Discussed with: jhb, bz, julian, zec Reviewed by: bz Approved by: re (VIMAGE blanket)
414 lines
11 KiB
C
414 lines
11 KiB
C
/*-
|
|
* Copyright (c) 1982, 1986, 1993
|
|
* The Regents of the University of California. All rights reserved.
|
|
*
|
|
* Redistribution and use in source and binary forms, with or without
|
|
* modification, are permitted provided that the following conditions
|
|
* are met:
|
|
* 1. Redistributions of source code must retain the above copyright
|
|
* notice, this list of conditions and the following disclaimer.
|
|
* 2. Redistributions in binary form must reproduce the above copyright
|
|
* notice, this list of conditions and the following disclaimer in the
|
|
* documentation and/or other materials provided with the distribution.
|
|
* 4. Neither the name of the University nor the names of its contributors
|
|
* may be used to endorse or promote products derived from this software
|
|
* without specific prior written permission.
|
|
*
|
|
* THIS SOFTWARE IS PROVIDED BY THE REGENTS AND CONTRIBUTORS ``AS IS'' AND
|
|
* ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
|
|
* IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
|
|
* ARE DISCLAIMED. IN NO EVENT SHALL THE REGENTS OR CONTRIBUTORS BE LIABLE
|
|
* FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
|
|
* DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS
|
|
* OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
|
|
* HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
|
|
* LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
|
|
* OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
|
|
* SUCH DAMAGE.
|
|
*
|
|
* @(#)in_proto.c 8.2 (Berkeley) 2/9/95
|
|
*/
|
|
|
|
#include <sys/cdefs.h>
|
|
__FBSDID("$FreeBSD$");
|
|
|
|
#include "opt_ipx.h"
|
|
#include "opt_mrouting.h"
|
|
#include "opt_ipsec.h"
|
|
#include "opt_inet6.h"
|
|
#include "opt_pf.h"
|
|
#include "opt_carp.h"
|
|
#include "opt_sctp.h"
|
|
#include "opt_mpath.h"
|
|
|
|
#include <sys/param.h>
|
|
#include <sys/systm.h>
|
|
#include <sys/kernel.h>
|
|
#include <sys/socket.h>
|
|
#include <sys/domain.h>
|
|
#include <sys/proc.h>
|
|
#include <sys/protosw.h>
|
|
#include <sys/queue.h>
|
|
#include <sys/sysctl.h>
|
|
#include <sys/vimage.h>
|
|
|
|
#include <net/if.h>
|
|
#include <net/route.h>
|
|
#ifdef RADIX_MPATH
|
|
#include <net/radix_mpath.h>
|
|
#endif
|
|
|
|
#include <netinet/in.h>
|
|
#include <netinet/in_systm.h>
|
|
#include <netinet/in_var.h>
|
|
#include <netinet/ip.h>
|
|
#include <netinet/ip_var.h>
|
|
#include <netinet/ip_icmp.h>
|
|
#include <netinet/igmp_var.h>
|
|
#include <netinet/tcp.h>
|
|
#include <netinet/tcp_timer.h>
|
|
#include <netinet/tcp_var.h>
|
|
#include <netinet/udp.h>
|
|
#include <netinet/udp_var.h>
|
|
#include <netinet/ip_encap.h>
|
|
|
|
/*
|
|
* TCP/IP protocol family: IP, ICMP, UDP, TCP.
|
|
*/
|
|
|
|
static struct pr_usrreqs nousrreqs;
|
|
|
|
#ifdef IPSEC
|
|
#include <netipsec/ipsec.h>
|
|
#endif /* IPSEC */
|
|
|
|
#ifdef SCTP
|
|
#include <netinet/in_pcb.h>
|
|
#include <netinet/sctp_pcb.h>
|
|
#include <netinet/sctp.h>
|
|
#include <netinet/sctp_var.h>
|
|
#endif /* SCTP */
|
|
|
|
#ifdef DEV_PFSYNC
|
|
#include <net/pfvar.h>
|
|
#include <net/if_pfsync.h>
|
|
#endif
|
|
|
|
#ifdef DEV_CARP
|
|
#include <netinet/ip_carp.h>
|
|
#endif
|
|
|
|
extern struct domain inetdomain;
|
|
|
|
/* Spacer for loadable protocols. */
|
|
#define IPPROTOSPACER \
|
|
{ \
|
|
.pr_domain = &inetdomain, \
|
|
.pr_protocol = PROTO_SPACER, \
|
|
.pr_usrreqs = &nousrreqs \
|
|
}
|
|
|
|
struct protosw inetsw[] = {
|
|
{
|
|
.pr_type = 0,
|
|
.pr_domain = &inetdomain,
|
|
.pr_protocol = IPPROTO_IP,
|
|
.pr_init = ip_init,
|
|
.pr_slowtimo = ip_slowtimo,
|
|
.pr_drain = ip_drain,
|
|
.pr_usrreqs = &nousrreqs
|
|
},
|
|
{
|
|
.pr_type = SOCK_DGRAM,
|
|
.pr_domain = &inetdomain,
|
|
.pr_protocol = IPPROTO_UDP,
|
|
.pr_flags = PR_ATOMIC|PR_ADDR,
|
|
.pr_input = udp_input,
|
|
.pr_ctlinput = udp_ctlinput,
|
|
.pr_ctloutput = udp_ctloutput,
|
|
.pr_init = udp_init,
|
|
#ifdef VIMAGE
|
|
.pr_destroy = udp_destroy,
|
|
#endif
|
|
.pr_usrreqs = &udp_usrreqs
|
|
},
|
|
{
|
|
.pr_type = SOCK_STREAM,
|
|
.pr_domain = &inetdomain,
|
|
.pr_protocol = IPPROTO_TCP,
|
|
.pr_flags = PR_CONNREQUIRED|PR_IMPLOPCL|PR_WANTRCVD,
|
|
.pr_input = tcp_input,
|
|
.pr_ctlinput = tcp_ctlinput,
|
|
.pr_ctloutput = tcp_ctloutput,
|
|
.pr_init = tcp_init,
|
|
#ifdef VIMAGE
|
|
.pr_destroy = tcp_destroy,
|
|
#endif
|
|
.pr_slowtimo = tcp_slowtimo,
|
|
.pr_drain = tcp_drain,
|
|
.pr_usrreqs = &tcp_usrreqs
|
|
},
|
|
#ifdef SCTP
|
|
{
|
|
.pr_type = SOCK_DGRAM,
|
|
.pr_domain = &inetdomain,
|
|
.pr_protocol = IPPROTO_SCTP,
|
|
.pr_flags = PR_WANTRCVD,
|
|
.pr_input = sctp_input,
|
|
.pr_ctlinput = sctp_ctlinput,
|
|
.pr_ctloutput = sctp_ctloutput,
|
|
.pr_init = sctp_init,
|
|
.pr_drain = sctp_drain,
|
|
.pr_usrreqs = &sctp_usrreqs
|
|
},
|
|
{
|
|
.pr_type = SOCK_SEQPACKET,
|
|
.pr_domain = &inetdomain,
|
|
.pr_protocol = IPPROTO_SCTP,
|
|
.pr_flags = PR_WANTRCVD,
|
|
.pr_input = sctp_input,
|
|
.pr_ctlinput = sctp_ctlinput,
|
|
.pr_ctloutput = sctp_ctloutput,
|
|
.pr_drain = sctp_drain,
|
|
.pr_usrreqs = &sctp_usrreqs
|
|
},
|
|
|
|
{
|
|
.pr_type = SOCK_STREAM,
|
|
.pr_domain = &inetdomain,
|
|
.pr_protocol = IPPROTO_SCTP,
|
|
.pr_flags = PR_WANTRCVD,
|
|
.pr_input = sctp_input,
|
|
.pr_ctlinput = sctp_ctlinput,
|
|
.pr_ctloutput = sctp_ctloutput,
|
|
.pr_drain = sctp_drain,
|
|
.pr_usrreqs = &sctp_usrreqs
|
|
},
|
|
#endif /* SCTP */
|
|
{
|
|
.pr_type = SOCK_RAW,
|
|
.pr_domain = &inetdomain,
|
|
.pr_protocol = IPPROTO_RAW,
|
|
.pr_flags = PR_ATOMIC|PR_ADDR,
|
|
.pr_input = rip_input,
|
|
.pr_ctlinput = rip_ctlinput,
|
|
.pr_ctloutput = rip_ctloutput,
|
|
.pr_usrreqs = &rip_usrreqs
|
|
},
|
|
{
|
|
.pr_type = SOCK_RAW,
|
|
.pr_domain = &inetdomain,
|
|
.pr_protocol = IPPROTO_ICMP,
|
|
.pr_flags = PR_ATOMIC|PR_ADDR|PR_LASTHDR,
|
|
.pr_input = icmp_input,
|
|
.pr_ctloutput = rip_ctloutput,
|
|
.pr_init = icmp_init,
|
|
.pr_usrreqs = &rip_usrreqs
|
|
},
|
|
{
|
|
.pr_type = SOCK_RAW,
|
|
.pr_domain = &inetdomain,
|
|
.pr_protocol = IPPROTO_IGMP,
|
|
.pr_flags = PR_ATOMIC|PR_ADDR|PR_LASTHDR,
|
|
.pr_input = igmp_input,
|
|
.pr_ctloutput = rip_ctloutput,
|
|
.pr_fasttimo = igmp_fasttimo,
|
|
.pr_slowtimo = igmp_slowtimo,
|
|
.pr_usrreqs = &rip_usrreqs
|
|
},
|
|
{
|
|
.pr_type = SOCK_RAW,
|
|
.pr_domain = &inetdomain,
|
|
.pr_protocol = IPPROTO_RSVP,
|
|
.pr_flags = PR_ATOMIC|PR_ADDR|PR_LASTHDR,
|
|
.pr_input = rsvp_input,
|
|
.pr_ctloutput = rip_ctloutput,
|
|
.pr_usrreqs = &rip_usrreqs
|
|
},
|
|
#ifdef IPSEC
|
|
{
|
|
.pr_type = SOCK_RAW,
|
|
.pr_domain = &inetdomain,
|
|
.pr_protocol = IPPROTO_AH,
|
|
.pr_flags = PR_ATOMIC|PR_ADDR,
|
|
.pr_input = ah4_input,
|
|
.pr_ctlinput = ah4_ctlinput,
|
|
.pr_usrreqs = &nousrreqs
|
|
},
|
|
{
|
|
.pr_type = SOCK_RAW,
|
|
.pr_domain = &inetdomain,
|
|
.pr_protocol = IPPROTO_ESP,
|
|
.pr_flags = PR_ATOMIC|PR_ADDR,
|
|
.pr_input = esp4_input,
|
|
.pr_ctlinput = esp4_ctlinput,
|
|
.pr_usrreqs = &nousrreqs
|
|
},
|
|
{
|
|
.pr_type = SOCK_RAW,
|
|
.pr_domain = &inetdomain,
|
|
.pr_protocol = IPPROTO_IPCOMP,
|
|
.pr_flags = PR_ATOMIC|PR_ADDR,
|
|
.pr_input = ipcomp4_input,
|
|
.pr_usrreqs = &nousrreqs
|
|
},
|
|
#endif /* IPSEC */
|
|
{
|
|
.pr_type = SOCK_RAW,
|
|
.pr_domain = &inetdomain,
|
|
.pr_protocol = IPPROTO_IPV4,
|
|
.pr_flags = PR_ATOMIC|PR_ADDR|PR_LASTHDR,
|
|
.pr_input = encap4_input,
|
|
.pr_ctloutput = rip_ctloutput,
|
|
.pr_init = encap_init,
|
|
.pr_usrreqs = &rip_usrreqs
|
|
},
|
|
{
|
|
.pr_type = SOCK_RAW,
|
|
.pr_domain = &inetdomain,
|
|
.pr_protocol = IPPROTO_MOBILE,
|
|
.pr_flags = PR_ATOMIC|PR_ADDR|PR_LASTHDR,
|
|
.pr_input = encap4_input,
|
|
.pr_ctloutput = rip_ctloutput,
|
|
.pr_init = encap_init,
|
|
.pr_usrreqs = &rip_usrreqs
|
|
},
|
|
{
|
|
.pr_type = SOCK_RAW,
|
|
.pr_domain = &inetdomain,
|
|
.pr_protocol = IPPROTO_ETHERIP,
|
|
.pr_flags = PR_ATOMIC|PR_ADDR|PR_LASTHDR,
|
|
.pr_input = encap4_input,
|
|
.pr_ctloutput = rip_ctloutput,
|
|
.pr_init = encap_init,
|
|
.pr_usrreqs = &rip_usrreqs
|
|
},
|
|
{
|
|
.pr_type = SOCK_RAW,
|
|
.pr_domain = &inetdomain,
|
|
.pr_protocol = IPPROTO_GRE,
|
|
.pr_flags = PR_ATOMIC|PR_ADDR|PR_LASTHDR,
|
|
.pr_input = encap4_input,
|
|
.pr_ctloutput = rip_ctloutput,
|
|
.pr_init = encap_init,
|
|
.pr_usrreqs = &rip_usrreqs
|
|
},
|
|
# ifdef INET6
|
|
{
|
|
.pr_type = SOCK_RAW,
|
|
.pr_domain = &inetdomain,
|
|
.pr_protocol = IPPROTO_IPV6,
|
|
.pr_flags = PR_ATOMIC|PR_ADDR|PR_LASTHDR,
|
|
.pr_input = encap4_input,
|
|
.pr_ctloutput = rip_ctloutput,
|
|
.pr_init = encap_init,
|
|
.pr_usrreqs = &rip_usrreqs
|
|
},
|
|
#endif
|
|
{
|
|
.pr_type = SOCK_RAW,
|
|
.pr_domain = &inetdomain,
|
|
.pr_protocol = IPPROTO_PIM,
|
|
.pr_flags = PR_ATOMIC|PR_ADDR|PR_LASTHDR,
|
|
.pr_input = encap4_input,
|
|
.pr_ctloutput = rip_ctloutput,
|
|
.pr_usrreqs = &rip_usrreqs
|
|
},
|
|
#ifdef DEV_PFSYNC
|
|
{
|
|
.pr_type = SOCK_RAW,
|
|
.pr_domain = &inetdomain,
|
|
.pr_protocol = IPPROTO_PFSYNC,
|
|
.pr_flags = PR_ATOMIC|PR_ADDR,
|
|
.pr_input = pfsync_input,
|
|
.pr_ctloutput = rip_ctloutput,
|
|
.pr_usrreqs = &rip_usrreqs
|
|
},
|
|
#endif /* DEV_PFSYNC */
|
|
#ifdef DEV_CARP
|
|
{
|
|
.pr_type = SOCK_RAW,
|
|
.pr_domain = &inetdomain,
|
|
.pr_protocol = IPPROTO_CARP,
|
|
.pr_flags = PR_ATOMIC|PR_ADDR,
|
|
.pr_input = carp_input,
|
|
.pr_output = (pr_output_t*)rip_output,
|
|
.pr_ctloutput = rip_ctloutput,
|
|
.pr_usrreqs = &rip_usrreqs
|
|
},
|
|
#endif /* DEV_CARP */
|
|
/* Spacer n-times for loadable protocols. */
|
|
IPPROTOSPACER,
|
|
IPPROTOSPACER,
|
|
IPPROTOSPACER,
|
|
IPPROTOSPACER,
|
|
IPPROTOSPACER,
|
|
IPPROTOSPACER,
|
|
IPPROTOSPACER,
|
|
IPPROTOSPACER,
|
|
/* raw wildcard */
|
|
{
|
|
.pr_type = SOCK_RAW,
|
|
.pr_domain = &inetdomain,
|
|
.pr_flags = PR_ATOMIC|PR_ADDR,
|
|
.pr_input = rip_input,
|
|
.pr_ctloutput = rip_ctloutput,
|
|
.pr_init = rip_init,
|
|
#ifdef VIMAGE
|
|
.pr_destroy = rip_destroy,
|
|
#endif
|
|
.pr_usrreqs = &rip_usrreqs
|
|
},
|
|
};
|
|
|
|
extern int in_inithead(void **, int);
|
|
extern int in_detachhead(void **, int);
|
|
|
|
struct domain inetdomain = {
|
|
.dom_family = AF_INET,
|
|
.dom_name = "internet",
|
|
.dom_protosw = inetsw,
|
|
.dom_protoswNPROTOSW = &inetsw[sizeof(inetsw)/sizeof(inetsw[0])],
|
|
#ifdef RADIX_MPATH
|
|
.dom_rtattach = rn4_mpath_inithead,
|
|
#else
|
|
.dom_rtattach = in_inithead,
|
|
#endif
|
|
#ifdef VIMAGE
|
|
.dom_rtdetach = in_detachhead,
|
|
#endif
|
|
.dom_rtoffset = 32,
|
|
.dom_maxrtkey = sizeof(struct sockaddr_in),
|
|
.dom_ifattach = in_domifattach,
|
|
.dom_ifdetach = in_domifdetach
|
|
};
|
|
|
|
VNET_DOMAIN_SET(inet);
|
|
|
|
SYSCTL_NODE(_net, PF_INET, inet, CTLFLAG_RW, 0,
|
|
"Internet Family");
|
|
|
|
SYSCTL_NODE(_net_inet, IPPROTO_IP, ip, CTLFLAG_RW, 0, "IP");
|
|
SYSCTL_NODE(_net_inet, IPPROTO_ICMP, icmp, CTLFLAG_RW, 0, "ICMP");
|
|
SYSCTL_NODE(_net_inet, IPPROTO_UDP, udp, CTLFLAG_RW, 0, "UDP");
|
|
SYSCTL_NODE(_net_inet, IPPROTO_TCP, tcp, CTLFLAG_RW, 0, "TCP");
|
|
#ifdef SCTP
|
|
SYSCTL_NODE(_net_inet, IPPROTO_SCTP, sctp, CTLFLAG_RW, 0, "SCTP");
|
|
#endif
|
|
SYSCTL_NODE(_net_inet, IPPROTO_IGMP, igmp, CTLFLAG_RW, 0, "IGMP");
|
|
#ifdef IPSEC
|
|
/* XXX no protocol # to use, pick something "reserved" */
|
|
SYSCTL_NODE(_net_inet, 253, ipsec, CTLFLAG_RW, 0, "IPSEC");
|
|
SYSCTL_NODE(_net_inet, IPPROTO_AH, ah, CTLFLAG_RW, 0, "AH");
|
|
SYSCTL_NODE(_net_inet, IPPROTO_ESP, esp, CTLFLAG_RW, 0, "ESP");
|
|
SYSCTL_NODE(_net_inet, IPPROTO_IPCOMP, ipcomp, CTLFLAG_RW, 0, "IPCOMP");
|
|
SYSCTL_NODE(_net_inet, IPPROTO_IPIP, ipip, CTLFLAG_RW, 0, "IPIP");
|
|
#endif /* IPSEC */
|
|
SYSCTL_NODE(_net_inet, IPPROTO_RAW, raw, CTLFLAG_RW, 0, "RAW");
|
|
#ifdef DEV_PFSYNC
|
|
SYSCTL_NODE(_net_inet, IPPROTO_PFSYNC, pfsync, CTLFLAG_RW, 0, "PFSYNC");
|
|
#endif
|
|
#ifdef DEV_CARP
|
|
SYSCTL_NODE(_net_inet, IPPROTO_CARP, carp, CTLFLAG_RW, 0, "CARP");
|
|
#endif
|