1/* SPDX-License-Identifier: GPL-2.0-or-later */
2/*
3 * NET		An implementation of the SOCKET network access protocol.
4 *		This is the master header file for the Linux NET layer,
5 *		or, in plain English: the networking handling part of the
6 *		kernel.
7 *
8 * Version:	@(#)net.h	1.0.3	05/25/93
9 *
10 * Authors:	Orest Zborowski, <obz@Kodak.COM>
11 *		Ross Biro
12 *		Fred N. van Kempen, <waltje@uWalt.NL.Mugnet.ORG>
13 */
14#ifndef _LINUX_NET_H
15#define _LINUX_NET_H
16
17#include <linux/stringify.h>
18#include <linux/random.h>
19#include <linux/wait.h>
20#include <linux/fcntl.h>	/* For O_CLOEXEC and O_NONBLOCK */
21#include <linux/rcupdate.h>
22#include <linux/once.h>
23#include <linux/fs.h>
24#include <linux/mm.h>
25#include <linux/sockptr.h>
26
27#include <uapi/linux/net.h>
28
29struct poll_table_struct;
30struct pipe_inode_info;
31struct inode;
32struct file;
33struct net;
34
/*
 * Bit numbers for the socket flag words.
 *
 * SOCKWQ_ASYNC_NOSPACE and SOCKWQ_ASYNC_WAITDATA used to live in
 * sock->flags; they were moved into sk->sk_wq->flags so that they are
 * RCU protected.  The plan is for all flags to end up in
 * sk->sk_wq->flags eventually.
 */

/* Flags kept in struct socket_wq::flags */
#define SOCKWQ_ASYNC_NOSPACE	0
#define SOCKWQ_ASYNC_WAITDATA	1

/* Flags kept in struct socket::flags */
#define SOCK_NOSPACE		2
#define SOCK_PASSCRED		3
#define SOCK_PASSSEC		4
#define SOCK_SUPPORT_ZC		5
#define SOCK_CUSTOM_SOCKOPT	6
#define SOCK_PASSPIDFD		7
47
48#ifndef ARCH_HAS_SOCKET_TYPES
/**
 * enum sock_type - Socket types
 * @SOCK_STREAM: stream (connection-oriented) socket
 * @SOCK_DGRAM: datagram (connectionless) socket
 * @SOCK_RAW: raw socket
 * @SOCK_RDM: reliably-delivered message
 * @SOCK_SEQPACKET: sequential packet socket
 * @SOCK_DCCP: Datagram Congestion Control Protocol socket
 * @SOCK_PACKET: Linux-specific way of getting packets at the device level,
 *		 e.g. for writing RARP and similar things at user level.
 *
 * Before adding a new socket type, grep for ARCH_HAS_SOCKET_TYPES in the
 * architecture socket.h headers (historically include/asm-<arch>/socket.h):
 * at least MIPS overrides this enum for binary compatibility reasons.
 */
enum sock_type {
	SOCK_STREAM = 1,
	SOCK_DGRAM = 2,
	SOCK_RAW = 3,
	SOCK_RDM = 4,
	SOCK_SEQPACKET = 5,
	SOCK_DCCP = 6,
	/* values 7..9 are not assigned by this enum */
	SOCK_PACKET = 10,
};
73
/* One more than the highest socket type value (SOCK_PACKET). */
#define SOCK_MAX	(SOCK_PACKET + 1)

/*
 * Mask which covers at least every type value up to SOCK_MAX - 1.
 * The remaining bits are used as flags.
 */
#define SOCK_TYPE_MASK	0xf

/* Flags for socket(), socketpair() and accept4() */
#define SOCK_CLOEXEC	O_CLOEXEC
#ifndef SOCK_NONBLOCK
#define SOCK_NONBLOCK	O_NONBLOCK
#endif
84
85#endif /* ARCH_HAS_SOCKET_TYPES */
86
/**
 * enum sock_shutdown_cmd - Shutdown types
 * @SHUT_RD: shut down the receiving side
 * @SHUT_WR: shut down the transmitting side
 * @SHUT_RDWR: shut down both receiving and transmitting sides
 */
enum sock_shutdown_cmd {
	SHUT_RD = 0,
	SHUT_WR = 1,
	SHUT_RDWR = 2,
};
98
99struct socket_wq {
100	/* Note: wait MUST be first field of socket_wq */
101	wait_queue_head_t	wait;
102	struct fasync_struct	*fasync_list;
103	unsigned long		flags; /* %SOCKWQ_ASYNC_NOSPACE, etc */
104	struct rcu_head		rcu;
105} ____cacheline_aligned_in_smp;
106
107/**
108 *  struct socket - general BSD socket
109 *  @state: socket state (%SS_CONNECTED, etc)
110 *  @type: socket type (%SOCK_STREAM, etc)
111 *  @flags: socket flags (%SOCK_NOSPACE, etc)
112 *  @ops: protocol specific socket operations
113 *  @file: File back pointer for gc
114 *  @sk: internal networking protocol agnostic socket representation
115 *  @wq: wait queue for several uses
116 */
117struct socket {
118	socket_state		state;
119
120	short			type;
121
122	unsigned long		flags;
123
124	struct file		*file;
125	struct sock		*sk;
126	const struct proto_ops	*ops; /* Might change with IPV6_ADDRFORM or MPTCP. */
127
128	struct socket_wq	wq;
129};
130
131/*
132 * "descriptor" for what we're up to with a read.
133 * This allows us to use the same read code yet
134 * have multiple different users of the data that
135 * we read from a file.
136 *
137 * The simplest case just copies the data to user
138 * mode.
139 */
140typedef struct {
141	size_t written;
142	size_t count;
143	union {
144		char __user *buf;
145		void *data;
146	} arg;
147	int error;
148} read_descriptor_t;
149
150struct vm_area_struct;
151struct page;
152struct sockaddr;
153struct msghdr;
154struct module;
155struct sk_buff;
156typedef int (*sk_read_actor_t)(read_descriptor_t *, struct sk_buff *,
157			       unsigned int, size_t);
158typedef int (*skb_read_actor_t)(struct sock *, struct sk_buff *);
159
160
161struct proto_ops {
162	int		family;
163	struct module	*owner;
164	int		(*release)   (struct socket *sock);
165	int		(*bind)	     (struct socket *sock,
166				      struct sockaddr *myaddr,
167				      int sockaddr_len);
168	int		(*connect)   (struct socket *sock,
169				      struct sockaddr *vaddr,
170				      int sockaddr_len, int flags);
171	int		(*socketpair)(struct socket *sock1,
172				      struct socket *sock2);
173	int		(*accept)    (struct socket *sock,
174				      struct socket *newsock, int flags, bool kern);
175	int		(*getname)   (struct socket *sock,
176				      struct sockaddr *addr,
177				      int peer);
178	__poll_t	(*poll)	     (struct file *file, struct socket *sock,
179				      struct poll_table_struct *wait);
180	int		(*ioctl)     (struct socket *sock, unsigned int cmd,
181				      unsigned long arg);
182#ifdef CONFIG_COMPAT
183	int	 	(*compat_ioctl) (struct socket *sock, unsigned int cmd,
184				      unsigned long arg);
185#endif
186	int		(*gettstamp) (struct socket *sock, void __user *userstamp,
187				      bool timeval, bool time32);
188	int		(*listen)    (struct socket *sock, int len);
189	int		(*shutdown)  (struct socket *sock, int flags);
190	int		(*setsockopt)(struct socket *sock, int level,
191				      int optname, sockptr_t optval,
192				      unsigned int optlen);
193	int		(*getsockopt)(struct socket *sock, int level,
194				      int optname, char __user *optval, int __user *optlen);
195	void		(*show_fdinfo)(struct seq_file *m, struct socket *sock);
196	int		(*sendmsg)   (struct socket *sock, struct msghdr *m,
197				      size_t total_len);
198	/* Notes for implementing recvmsg:
199	 * ===============================
200	 * msg->msg_namelen should get updated by the recvmsg handlers
201	 * iff msg_name != NULL. It is by default 0 to prevent
202	 * returning uninitialized memory to user space.  The recvfrom
203	 * handlers can assume that msg.msg_name is either NULL or has
204	 * a minimum size of sizeof(struct sockaddr_storage).
205	 */
206	int		(*recvmsg)   (struct socket *sock, struct msghdr *m,
207				      size_t total_len, int flags);
208	int		(*mmap)	     (struct file *file, struct socket *sock,
209				      struct vm_area_struct * vma);
210	ssize_t 	(*splice_read)(struct socket *sock,  loff_t *ppos,
211				       struct pipe_inode_info *pipe, size_t len, unsigned int flags);
212	void		(*splice_eof)(struct socket *sock);
213	int		(*set_peek_off)(struct sock *sk, int val);
214	int		(*peek_len)(struct socket *sock);
215
216	/* The following functions are called internally by kernel with
217	 * sock lock already held.
218	 */
219	int		(*read_sock)(struct sock *sk, read_descriptor_t *desc,
220				     sk_read_actor_t recv_actor);
221	/* This is different from read_sock(), it reads an entire skb at a time. */
222	int		(*read_skb)(struct sock *sk, skb_read_actor_t recv_actor);
223	int		(*sendmsg_locked)(struct sock *sk, struct msghdr *msg,
224					  size_t size);
225	int		(*set_rcvlowat)(struct sock *sk, int val);
226};
227
/*
 * DECLARE_SOCKADDR - declare @dst with type @type, initialised from @src.
 *
 * sizeof(*dst) is handed to __sockaddr_check_size() before @src is cast
 * to @type.  @src is parenthesised so that the cast applies to the whole
 * argument expression rather than only to its first operand (for example
 * when the caller passes "base + 1").
 */
#define DECLARE_SOCKADDR(type, dst, src)	\
	type dst = ({ __sockaddr_check_size(sizeof(*dst)); (type)(src); })
230
/*
 * Description of one protocol family, as handed to sock_register():
 * the family number, the socket creation hook and the owning module.
 */
struct net_proto_family {
	int family;
	int (*create)(struct net *net, struct socket *sock, int protocol,
		      int kern);
	struct module *owner;
};
237
struct iovec;
struct kvec;

/* SOCK_WAKE_* constants; NOTE(review): presumably the "how" argument of sock_wake_async() - confirm. */
enum {
	SOCK_WAKE_IO = 0,
	SOCK_WAKE_WAITD = 1,
	SOCK_WAKE_SPACE = 2,
	SOCK_WAKE_URG = 3,
};
247
/* Socket core entry points; the definitions live outside this header. */

/* Asynchronous wakeup and protocol family registration */
int sock_wake_async(struct socket_wq *sk_wq, int how, int band);
int sock_register(const struct net_proto_family *fam);
void sock_unregister(int family);
bool sock_is_registered(int family);

/* Socket creation and release */
int __sock_create(struct net *net, int family, int type, int proto,
		  struct socket **res, int kern);
int sock_create(int family, int type, int proto, struct socket **res);
int sock_create_kern(struct net *net, int family, int type, int proto,
		     struct socket **res);
int sock_create_lite(int family, int type, int proto, struct socket **res);
struct socket *sock_alloc(void);
void sock_release(struct socket *sock);

/* Message transfer */
int sock_sendmsg(struct socket *sock, struct msghdr *msg);
int sock_recvmsg(struct socket *sock, struct msghdr *msg, int flags);

/* Conversions between sockets, files and file descriptors */
struct file *sock_alloc_file(struct socket *sock, int flags,
			     const char *dname);
struct socket *sockfd_lookup(int fd, int *err);
struct socket *sock_from_file(struct file *file);
/*
 * sockfd_put - call fput() on the file attached to @sock.
 *
 * @sock is parenthesised so that any pointer expression, not only a
 * plain identifier, can be passed (e.g. sockfd_put(socks + 1)).
 * NOTE(review): presumably the counterpart of sockfd_lookup() - confirm.
 */
#define sockfd_put(sock)	fput((sock)->file)
/* Rate-limit gate: a non-zero return lets the guarded call go ahead. */
int net_ratelimit(void);

/*
 * Invoke function(args...) only when net_ratelimit() allows it.
 * Wrapped in do { } while (0) so it behaves as a single statement.
 */
#define net_ratelimited_function(function, ...)	\
	do {						\
		if (net_ratelimit()) {			\
			function(__VA_ARGS__);		\
		}					\
	} while (0)
272
/*
 * Rate-limited printing helpers, one per log level: each forwards its
 * format string and arguments to the matching pr_<level>() through
 * net_ratelimited_function().
 */
#define net_emerg_ratelimited(fmt, ...) \
	net_ratelimited_function(pr_emerg, fmt, ##__VA_ARGS__)

#define net_alert_ratelimited(fmt, ...) \
	net_ratelimited_function(pr_alert, fmt, ##__VA_ARGS__)

#define net_crit_ratelimited(fmt, ...) \
	net_ratelimited_function(pr_crit, fmt, ##__VA_ARGS__)

#define net_err_ratelimited(fmt, ...) \
	net_ratelimited_function(pr_err, fmt, ##__VA_ARGS__)

#define net_notice_ratelimited(fmt, ...) \
	net_ratelimited_function(pr_notice, fmt, ##__VA_ARGS__)

#define net_warn_ratelimited(fmt, ...) \
	net_ratelimited_function(pr_warn, fmt, ##__VA_ARGS__)

#define net_info_ratelimited(fmt, ...) \
	net_ratelimited_function(pr_info, fmt, ##__VA_ARGS__)
/*
 * net_dbg_ratelimited() comes in three flavours:
 *  - dynamic debug available: the message goes through a dynamic debug
 *    descriptor and is printed only if that branch is enabled and
 *    net_ratelimit() allows it;
 *  - otherwise, with DEBUG defined: rate-limited pr_debug();
 *  - otherwise: no_printk(), which receives the same arguments.
 */
#if defined(CONFIG_DYNAMIC_DEBUG) || \
	(defined(CONFIG_DYNAMIC_DEBUG_CORE) && defined(DYNAMIC_DEBUG_MODULE))
#define net_dbg_ratelimited(fmt, ...)					\
do {									\
	DEFINE_DYNAMIC_DEBUG_METADATA(descriptor, fmt);			\
	if (DYNAMIC_DEBUG_BRANCH(descriptor) && net_ratelimit())	\
		__dynamic_pr_debug(&descriptor, pr_fmt(fmt),		\
				   ##__VA_ARGS__);			\
} while (0)
#elif defined(DEBUG)
#define net_dbg_ratelimited(fmt, ...) \
	net_ratelimited_function(pr_debug, fmt, ##__VA_ARGS__)
#else
#define net_dbg_ratelimited(fmt, ...) \
	no_printk(KERN_DEBUG pr_fmt(fmt), ##__VA_ARGS__)
#endif
304
/* Networking alias for get_random_once(); both arguments pass through. */
#define net_get_random_once(buf, nbytes) get_random_once((buf), (nbytes))
307
/*
 * sendpage_ok - check whether @page may be handed to send_page.
 *
 * Some pages must not go down that path: e.g. XFS meta- & log-data in
 * slab pages, bcache meta data pages, or other high order pages
 * allocated by __get_free_pages() without __GFP_COMP.  Such pages have
 * a page_count of 0 and/or have PageSlab() set.  send_page does
 * get_page(); put_page(); on them, which would either trigger a VM_BUG
 * directly or __page_cache_release a page that is still referenced by
 * someone, leading to an obscure delayed Oops somewhere else.
 *
 * Returns true only for a non-slab page with a page_count of at least 1.
 */
static inline bool sendpage_ok(struct page *page)
{
	/* Slab pages are rejected before the reference count is read. */
	if (PageSlab(page))
		return false;

	return page_count(page) >= 1;
}
322
323int kernel_sendmsg(struct socket *sock, struct msghdr *msg, struct kvec *vec,
324		   size_t num, size_t len);
325int kernel_sendmsg_locked(struct sock *sk, struct msghdr *msg,
326			  struct kvec *vec, size_t num, size_t len);
327int kernel_recvmsg(struct socket *sock, struct msghdr *msg, struct kvec *vec,
328		   size_t num, size_t len, int flags);
329
330int kernel_bind(struct socket *sock, struct sockaddr *addr, int addrlen);
331int kernel_listen(struct socket *sock, int backlog);
332int kernel_accept(struct socket *sock, struct socket **newsock, int flags);
333int kernel_connect(struct socket *sock, struct sockaddr *addr, int addrlen,
334		   int flags);
335int kernel_getsockname(struct socket *sock, struct sockaddr *addr);
336int kernel_getpeername(struct socket *sock, struct sockaddr *addr);
337int kernel_sock_shutdown(struct socket *sock, enum sock_shutdown_cmd how);
338
339/* Routine returns the IP overhead imposed by a (caller-protected) socket. */
340u32 kernel_sock_ip_overhead(struct sock *sk);
341
/*
 * Module alias helpers for network protocol modules.  The alias strings
 * built are:
 *
 *   MODULE_ALIAS_NETPROTO(proto)              "net-pf-<proto>"
 *   MODULE_ALIAS_NET_PF_PROTO(pf, proto)      "net-pf-<pf>-proto-<proto>"
 *   MODULE_ALIAS_NET_PF_PROTO_TYPE(pf, proto, type)
 *                                 "net-pf-<pf>-proto-<proto>-type-<type>"
 *   MODULE_ALIAS_NET_PF_PROTO_NAME(pf, proto, name)
 *                                 "net-pf-<pf>-proto-<proto><name>"
 *
 * Note that @name is a string literal appended as-is, so it has to
 * carry its own separator.
 */
#define MODULE_ALIAS_NETPROTO(proto)					\
	MODULE_ALIAS("net-pf-" __stringify(proto))

#define MODULE_ALIAS_NET_PF_PROTO(pf, proto)				\
	MODULE_ALIAS("net-pf-" __stringify(pf)				\
		     "-proto-" __stringify(proto))

#define MODULE_ALIAS_NET_PF_PROTO_TYPE(pf, proto, type)			\
	MODULE_ALIAS("net-pf-" __stringify(pf)				\
		     "-proto-" __stringify(proto)			\
		     "-type-" __stringify(type))

#define MODULE_ALIAS_NET_PF_PROTO_NAME(pf, proto, name)			\
	MODULE_ALIAS("net-pf-" __stringify(pf)				\
		     "-proto-" __stringify(proto)			\
		     name)
355#endif	/* _LINUX_NET_H */
356