| /* |
| * CDDL HEADER START |
| * |
| * The contents of this file are subject to the terms of the |
| * Common Development and Distribution License (the "License"). |
| * You may not use this file except in compliance with the License. |
| * |
| * You can obtain a copy of the license at usr/src/OPENSOLARIS.LICENSE |
| * or http://www.opensolaris.org/os/licensing. |
| * See the License for the specific language governing permissions |
| * and limitations under the License. |
| * |
| * When distributing Covered Code, include this CDDL HEADER in each |
| * file and include the License file at usr/src/OPENSOLARIS.LICENSE. |
| * If applicable, add the following below this CDDL HEADER, with the |
| * fields enclosed by brackets "[]" replaced with your own identifying |
| * information: Portions Copyright [yyyy] [name of copyright owner] |
| * |
| * CDDL HEADER END |
| */ |
| |
| /* |
| * Copyright 2009 Sun Microsystems, Inc. All rights reserved. |
| * Use is subject to license terms. |
| */ |
| |
| /* Copyright (c) 1983, 1984, 1985, 1986, 1987, 1988, 1989 AT&T */ |
| /* All Rights Reserved */ |
| |
| /* |
| * University Copyright- Copyright (c) 1982, 1986, 1988 |
| * The Regents of the University of California |
| * All Rights Reserved |
| * |
| * University Acknowledgment- Portions of this document are derived from |
| * software developed by the University of California, Berkeley, and its |
| * contributors. |
| */ |
| |
| #ifndef _SYS_SOCKETVAR_H |
| #define _SYS_SOCKETVAR_H |
| |
| #include <sys/types.h> |
| #include <sys/stream.h> |
| #include <sys/t_lock.h> |
| #include <sys/cred.h> |
| #include <sys/vnode.h> |
| #include <sys/file.h> |
| #include <sys/param.h> |
| #include <sys/zone.h> |
| #include <sys/sdt.h> |
| #include <sys/modctl.h> |
| #include <sys/atomic.h> |
| #include <sys/socket.h> |
| #include <sys/ksocket.h> |
| #include <sys/sodirect.h> |
| |
| #ifdef __cplusplus |
| extern "C" { |
| #endif |
| |
| /* |
| * Internal representation of the address used to represent addresses |
| * in the loopback transport for AF_UNIX. While the sockaddr_un is used |
| * as the sockfs layer address for AF_UNIX the pathnames contained in |
| * these addresses are not unique (due to relative pathnames) thus can not |
| * be used in the transport. |
| * |
| * The transport level address consists of a magic number (used to separate the |
| * name space for specific and implicit binds). For a specific bind |
| * this is followed by a "vnode *" which ensures that all specific binds |
| * have a unique transport level address. For implicit binds the latter |
| * part of the address is a byte string (of the same length as a pointer) |
| * that is assigned by the loopback transport. |
| * |
| * The uniqueness assumes that the loopback transport has a separate namespace |
| * for sockets in order to avoid name conflicts with e.g. TLI use of the |
| * same transport. |
| */ |
| struct so_ux_addr { |
| void *soua_vp; /* vnode pointer or assigned by tl */ |
| uint_t soua_magic; /* See below */ |
| }; |
| |
/* Values for soua_magic; each one spells a four character ASCII tag. */
#define	SOU_MAGIC_EXPLICIT	0x75787670	/* "uxvp" */
#define	SOU_MAGIC_IMPLICIT	0x616e6f6e	/* "anon" */
| |
| struct sockaddr_ux { |
| sa_family_t sou_family; /* AF_UNIX */ |
| struct so_ux_addr sou_addr; |
| }; |
| |
| #if defined(_KERNEL) || defined(_KMEMUSER) |
| |
| #include <sys/socket_proto.h> |
| |
/* Short names for the socket node and its operations vector. */
typedef struct sonodeops	sonodeops_t;
typedef struct sonode		sonode_t;
| |
| /* |
| * The sonode represents a socket. A sonode never exist in the file system |
| * name space and can not be opened using open() - only the socket, socketpair |
| * and accept calls create sonodes. |
| * |
| * The locking of sockfs uses the so_lock mutex plus the SOLOCKED and |
| * SOREADLOCKED flags in so_flag. The mutex protects all the state in the |
| * sonode. It is expected that the underlying transport protocol serializes |
| * socket operations, so sockfs will not normally not single-thread |
| * operations. However, certain sockets, including TPI based ones, can only |
| * handle one control operation at a time. The SOLOCKED flag is used to |
| * single-thread operations from sockfs users to prevent e.g. multiple bind() |
| * calls to operate on the same sonode concurrently. The SOREADLOCKED flag is |
| * used to ensure that only one thread sleeps in kstrgetmsg for a given |
| * sonode. This is needed to ensure atomic operation for things like |
| * MSG_WAITALL. |
| * |
| * The so_fallback_rwlock is used to ensure that for sockets that can |
| * fall back to TPI, the fallback is not initiated until all pending |
| * operations have completed. |
| * |
| * Note that so_lock is sometimes held across calls that might go to sleep |
| * (kmem_alloc and soallocproto*). This implies that no other lock in |
| * the system should be held when calling into sockfs; from the system call |
| * side or from strrput (in case of TPI based sockets). If locks are held |
| * while calling into sockfs the system might hang when running low on memory. |
| */ |
| struct sonode { |
| struct vnode *so_vnode; /* vnode associated with this sonode */ |
| |
| sonodeops_t *so_ops; /* operations vector for this sonode */ |
| void *so_priv; /* sonode private data */ |
| |
| krwlock_t so_fallback_rwlock; |
| kmutex_t so_lock; /* protects sonode fields */ |
| |
| kcondvar_t so_state_cv; /* synchronize state changes */ |
| kcondvar_t so_want_cv; /* wait due to SOLOCKED */ |
| |
| /* These fields are protected by so_lock */ |
| |
| uint_t so_state; /* internal state flags SS_*, below */ |
| uint_t so_mode; /* characteristics on socket. SM_* */ |
| ushort_t so_flag; /* flags, see below */ |
| int so_count; /* count of opened references */ |
| |
| sock_connid_t so_proto_connid; /* protocol generation number */ |
| |
| ushort_t so_error; /* error affecting connection */ |
| |
| struct sockparams *so_sockparams; /* vnode or socket module */ |
| /* Needed to recreate the same socket for accept */ |
| short so_family; |
| short so_type; |
| short so_protocol; |
| short so_version; /* From so_socket call */ |
| |
| /* Accept queue */ |
| kmutex_t so_acceptq_lock; /* protects accept queue */ |
| struct sonode *so_acceptq_next; /* acceptq list node */ |
| struct sonode *so_acceptq_head; |
| struct sonode **so_acceptq_tail; |
| unsigned int so_acceptq_len; |
| unsigned int so_backlog; /* Listen backlog */ |
| kcondvar_t so_acceptq_cv; /* wait for new conn. */ |
| |
| /* Options */ |
| short so_options; /* From socket call, see socket.h */ |
| struct linger so_linger; /* SO_LINGER value */ |
| #define so_sndbuf so_proto_props.sopp_txhiwat /* SO_SNDBUF value */ |
| #define so_sndlowat so_proto_props.sopp_txlowat /* tx low water mark */ |
| #define so_rcvbuf so_proto_props.sopp_rxhiwat /* SO_RCVBUF value */ |
| #define so_rcvlowat so_proto_props.sopp_rxlowat /* rx low water mark */ |
| #define so_max_addr_len so_proto_props.sopp_maxaddrlen |
| #define so_minpsz so_proto_props.sopp_minpsz |
| #define so_maxpsz so_proto_props.sopp_maxpsz |
| |
| int so_xpg_rcvbuf; /* SO_RCVBUF value for XPG4 socket */ |
| clock_t so_sndtimeo; /* send timeout */ |
| clock_t so_rcvtimeo; /* recv timeout */ |
| |
| mblk_t *so_oobmsg; /* outofline oob data */ |
| ssize_t so_oobmark; /* offset of the oob data */ |
| |
| pid_t so_pgrp; /* pgrp for signals */ |
| |
| cred_t *so_peercred; /* connected socket peer cred */ |
| pid_t so_cpid; /* connected socket peer cached pid */ |
| zoneid_t so_zoneid; /* opener's zoneid */ |
| |
| struct pollhead so_poll_list; /* common pollhead */ |
| short so_pollev; /* events that should be generated */ |
| |
| /* Receive */ |
| unsigned int so_rcv_queued; /* # bytes on both rcv lists */ |
| mblk_t *so_rcv_q_head; /* processing/copyout rcv queue */ |
| mblk_t *so_rcv_q_last_head; |
| mblk_t *so_rcv_head; /* protocol prequeue */ |
| mblk_t *so_rcv_last_head; /* last mblk in b_next chain */ |
| kcondvar_t so_rcv_cv; /* wait for data */ |
| uint_t so_rcv_wanted; /* # of bytes wanted by app */ |
| timeout_id_t so_rcv_timer_tid; |
| |
| #define so_rcv_thresh so_proto_props.sopp_rcvthresh |
| #define so_rcv_timer_interval so_proto_props.sopp_rcvtimer |
| |
| kcondvar_t so_snd_cv; /* wait for snd buffers */ |
| uint32_t |
| so_snd_qfull: 1, /* Transmit full */ |
| so_rcv_wakeup: 1, |
| so_snd_wakeup: 1, |
| so_not_str: 1, /* B_TRUE if not streams based socket */ |
| so_pad_to_bit_31: 28; |
| |
| /* Communication channel with protocol */ |
| sock_lower_handle_t so_proto_handle; |
| sock_downcalls_t *so_downcalls; |
| |
| struct sock_proto_props so_proto_props; /* protocol settings */ |
| boolean_t so_flowctrld; /* Flow controlled */ |
| uint_t so_copyflag; /* Copy related flag */ |
| kcondvar_t so_copy_cv; /* Copy cond variable */ |
| |
| /* kernel sockets */ |
| ksocket_callbacks_t so_ksock_callbacks; |
| void *so_ksock_cb_arg; /* callback argument */ |
| kcondvar_t so_closing_cv; |
| |
| /* != NULL for sodirect_t enabled socket */ |
| sodirect_t *so_direct; |
| }; |
| |
/*
 * Evaluates to non-zero when either
 *  - no receive timer is pending (so_rcv_timer_tid == 0) and at least one
 *    of the two receive lists is non-empty, or
 *  - SS_CANTRCVMORE is set in so_state.
 *
 * For the (tid == 0) case we must check so_rcv_{q_,}head rather than
 * (so_rcv_queued > 0), since the latter does not take into account mblks
 * with only control/name information.
 *
 * The whole expansion is parenthesized so the macro can be negated or
 * combined with other operators without changing its meaning.  `so' is
 * evaluated more than once and must not have side effects.
 */
#define	SO_HAVE_DATA(so)						\
	((((so)->so_rcv_timer_tid == 0) &&				\
	((so)->so_rcv_head != NULL || (so)->so_rcv_q_head != NULL)) ||	\
	(((so)->so_state & SS_CANTRCVMORE) != 0))
| |
/*
 * Poll events that are handled by the protocol (in case sd_poll is set).
 */
#define	SO_PROTO_POLLEV		(POLLIN | POLLRDNORM | POLLRDBAND)
| |
| |
| #endif /* _KERNEL || _KMEMUSER */ |
| |
/*
 * Bits kept in so_flag.
 */
#define	SOMOD		0x0001	/* update socket modification time */
#define	SOACC		0x0002	/* update socket access time */

#define	SOLOCKED	0x0010	/* use to serialize open/closes */
#define	SOREADLOCKED	0x0020	/* serialize kstrgetmsg calls */
#define	SOWANT		0x0040	/* some process waiting on lock */
#define	SOCLONE		0x0080	/* child of clone driver */
#define	SOASYNC_UNBIND	0x0100	/* wait for ACK of async unbind */

/* Non-zero when the so_not_str bit of the sonode is set. */
#define	SOCK_IS_NONSTR(so)	((so)->so_not_str)
| |
/*
 * Socket state bits (so_state).
 */
#define	SS_ISCONNECTED		0x00000001 /* socket connected to a peer */
#define	SS_ISCONNECTING		0x00000002 /* in process, connecting to peer */
#define	SS_ISDISCONNECTING	0x00000004 /* in process of disconnecting */
#define	SS_CANTSENDMORE		0x00000008 /* can't send more data to peer */

#define	SS_CANTRCVMORE		0x00000010 /* can't receive more data */
#define	SS_ISBOUND		0x00000020 /* socket is bound */
#define	SS_NDELAY		0x00000040 /* FNDELAY non-blocking */
#define	SS_NONBLOCK		0x00000080 /* O_NONBLOCK non-blocking */

#define	SS_ASYNC		0x00000100 /* async i/o notify */
#define	SS_ACCEPTCONN		0x00000200 /* listen done */
/*	unused			0x00000400 */ /* was SS_HASCONNIND */
#define	SS_SAVEDEOR		0x00000800 /* Saved MSG_EOR rcv side state */

#define	SS_RCVATMARK		0x00001000 /* at mark on input */
#define	SS_OOBPEND		0x00002000 /* OOB pending or present - poll */
#define	SS_HAVEOOBDATA		0x00004000 /* OOB data present */
#define	SS_HADOOBDATA		0x00008000 /* OOB data consumed */
#define	SS_CLOSING		0x00010000 /* in process of closing */

/*	unused			0x00020000 */ /* was SS_FADDR_NOXLATE */
/*	unused			0x00040000 */ /* was SS_HASDATA */
/*	unused			0x00080000 */ /* was SS_DONEREAD */
/*	unused			0x00100000 */ /* was SS_MOREDATA */
/*	unused			0x00200000 */ /* was SS_DIRECT */

#define	SS_SODIRECT		0x00400000 /* transport supports sodirect */

#define	SS_SENTLASTREADSIG	0x01000000 /* last rx signal has been sent */
#define	SS_SENTLASTWRITESIG	0x02000000 /* last tx signal has been sent */

#define	SS_FALLBACK_DRAIN	0x20000000 /* data was/is being drained */
#define	SS_FALLBACK_PENDING	0x40000000 /* fallback is pending */
#define	SS_FALLBACK_COMP	0x80000000 /* fallback has completed */

/* Set of states in which the socket can't be rebound */
#define	SS_CANTREBIND		\
	(SS_ISCONNECTED |	\
	SS_ISCONNECTING |	\
	SS_ISDISCONNECTING |	\
	SS_CANTSENDMORE |	\
	SS_CANTRCVMORE |	\
	SS_ACCEPTCONN)
| |
/*
 * Sockets that can fall back to TPI must ensure that fall back is not
 * initiated while a thread is using a socket.
 *
 * SO_BLOCK_FALLBACK asserts that so_lock is not held and then takes
 * so_fallback_rwlock as a reader.  If SS_FALLBACK_COMP is already set the
 * lock is dropped again and the macro executes "return (fn)" in the
 * enclosing function; otherwise the lock remains held until
 * SO_UNBLOCK_FALLBACK releases it.
 */
#define	SO_BLOCK_FALLBACK(so, fn) {				\
	ASSERT(MUTEX_NOT_HELD(&(so)->so_lock));			\
	rw_enter(&(so)->so_fallback_rwlock, RW_READER);		\
	if (((so)->so_state & SS_FALLBACK_COMP) != 0) {		\
		rw_exit(&(so)->so_fallback_rwlock);		\
		return (fn);					\
	}							\
}

#define	SO_UNBLOCK_FALLBACK(so) {				\
	rw_exit(&(so)->so_fallback_rwlock);			\
}
| |
/*
 * Poll event bits.
 */
#define	SO_POLLEV_IN		0x1	/* POLLIN wakeup needed */
#define	SO_POLLEV_ALWAYS	0x2	/* wakeups */
| |
/*
 * Socket characteristics (so_mode).  These are fixed once the socket has
 * been created.
 */
#define	SM_PRIV		0x001	/* privileged for broadcast, raw... */
#define	SM_ATOMIC	0x002	/* atomic data transmission */
#define	SM_ADDR		0x004	/* addresses given with messages */
#define	SM_CONNREQUIRED	0x008	/* connection required by protocol */

#define	SM_FDPASSING	0x010	/* passes file descriptors */
#define	SM_EXDATA	0x020	/* Can handle T_EXDATA_REQ */
#define	SM_OPTDATA	0x040	/* Can handle T_OPTDATA_REQ */
#define	SM_BYTESTREAM	0x080	/* Byte stream - can use M_DATA */

#define	SM_ACCEPTOR_ID	0x100	/* so_acceptor_id is valid */

#define	SM_KERNEL	0x200	/* kernel socket */

/* The modes below are only for non-streams sockets */
#define	SM_ACCEPTSUPP	0x400	/* can handle accept() */
#define	SM_SENDFILESUPP	0x800	/* Private: proto supp sendfile */
| |
/*
 * Socket versions, passed by the socket library to _so_socket().
 */
#define	SOV_STREAM	0	/* Not a socket - just a stream */
#define	SOV_DEFAULT	1	/* Select based on so_default_version */
#define	SOV_SOCKSTREAM	2	/* Socket plus streams operations */
#define	SOV_SOCKBSD	3	/* Socket with no streams operations */
#define	SOV_XPG4_2	4	/* Xnet socket */
| |
| #if defined(_KERNEL) || defined(_KMEMUSER) |
| |
| /* |
| * sonode create and destroy functions. |
| */ |
| typedef struct sonode *(*so_create_func_t)(struct sockparams *, |
| int, int, int, int, int, int *, cred_t *); |
| typedef void (*so_destroy_func_t)(struct sonode *); |
| |
| /* STREAM device information */ |
| typedef struct sdev_info { |
| char *sd_devpath; |
| int sd_devpathlen; /* Is 0 if sp_devpath is a static string */ |
| vnode_t *sd_vnode; |
| } sdev_info_t; |
| |
/* Socket module interface version */
#define	SOCKMOD_VERSION		1

/* Name of the TPI pseudo socket module */
#define	SOTPI_SMOD_NAME		"socktpi"
| |
| typedef struct __smod_priv_s { |
| so_create_func_t smodp_sock_create_func; |
| so_destroy_func_t smodp_sock_destroy_func; |
| so_proto_fallback_func_t smodp_proto_fallback_func; |
| } __smod_priv_t; |
| |
| /* |
| * Socket module register information |
| */ |
| typedef struct smod_reg_s { |
| int smod_version; |
| char *smod_name; |
| size_t smod_uc_version; |
| size_t smod_dc_version; |
| so_proto_create_func_t smod_proto_create_func; |
| |
| /* __smod_priv_data must be NULL */ |
| __smod_priv_t *__smod_priv; |
| } smod_reg_t; |
| |
| /* |
| * Socket module information |
| */ |
| typedef struct smod_info { |
| int smod_version; |
| char *smod_name; |
| uint_t smod_refcnt; /* # of entries */ |
| size_t smod_uc_version; /* upcall version */ |
| size_t smod_dc_version; /* down call version */ |
| so_proto_create_func_t smod_proto_create_func; |
| so_proto_fallback_func_t smod_proto_fallback_func; |
| so_create_func_t smod_sock_create_func; |
| so_destroy_func_t smod_sock_destroy_func; |
| list_node_t smod_node; |
| } smod_info_t; |
| |
| /* |
| * sockparams |
| * |
| * Used for mapping family/type/protocol to module |
| */ |
| struct sockparams { |
| /* |
| * The family, type, protocol, sdev_info and smod_info are |
| * set when the entry is created, and they will never change |
| * thereafter. |
| */ |
| int sp_family; |
| int sp_type; |
| int sp_protocol; |
| |
| sdev_info_t sp_sdev_info; /* STREAM device */ |
| char *sp_smod_name; /* socket module name */ |
| smod_info_t *sp_smod_info; /* socket module */ |
| |
| kmutex_t sp_lock; /* lock for refcnt */ |
| uint64_t sp_refcnt; /* entry reference count */ |
| |
| /* |
| * The entries below are only modified while holding |
| * splist_lock as a writer. |
| */ |
| int sp_flags; /* see below */ |
| list_node_t sp_node; |
| }; |
| |
| |
/*
 * Flags stored in sp_flags.
 */
#define	SOCKPARAMS_EPHEMERAL	0x1	/* temp. entry, not on global list */
| |
| extern void sockparams_init(void); |
| extern struct sockparams *sockparams_hold_ephemeral_bydev(int, int, int, |
| const char *, int, int *); |
| extern struct sockparams *sockparams_hold_ephemeral_bymod(int, int, int, |
| const char *, int, int *); |
| extern void sockparams_ephemeral_drop_last_ref(struct sockparams *); |
| |
| extern void smod_init(void); |
| extern void smod_add(smod_info_t *); |
| extern int smod_register(const smod_reg_t *); |
| extern int smod_unregister(const char *); |
| extern smod_info_t *smod_lookup_byname(const char *); |
| |
/* Non-zero when the entry carries a STREAM device path. */
#define	SOCKPARAMS_HAS_DEVICE(sp)	\
	(NULL != (sp)->sp_sdev_info.sd_devpath)
| |
/*
 * Take a reference on a smod_info_t: fires the smodinfo__inc__ref probe
 * and then atomically increments smod_refcnt.
 */
#define	SMOD_INC_REF(smodp) {						\
	ASSERT(NULL != (smodp));					\
	DTRACE_PROBE1(smodinfo__inc__ref, struct smod_info *, (smodp));	\
	atomic_inc_uint(&(smodp)->smod_refcnt);				\
}
| |
/*
 * Decrease the socket module entry reference count.
 *
 * When nothing maps to the entry any more we try to unload the module from
 * the kernel.  If the module can't be unloaded, the module entry is simply
 * left with a zero refcnt.
 *
 * The count is re-read after the atomic decrement rather than using the
 * decrement's return value.  That is sufficient because the socket module
 * framework verifies that no one is using the module before unloading it;
 * the worst that can happen is multiple calls to mod_remove_by_name(),
 * which is OK.
 */
#define	SMOD_DEC_REF(sp, smodp) {					\
	ASSERT(NULL != (smodp));					\
	ASSERT(0 != (smodp)->smod_refcnt);				\
	atomic_dec_uint(&(smodp)->smod_refcnt);				\
	if (0 == (smodp)->smod_refcnt)					\
		(void) mod_remove_by_name((sp)->sp_smod_name);		\
}
| |
/*
 * Take a reference on a sockparams entry.  sp_refcnt is bumped under
 * sp_lock; the trailing ASSERT catches the counter wrapping to zero.
 */
#define	SOCKPARAMS_INC_REF(sp) {					\
	ASSERT(NULL != (sp));						\
	DTRACE_PROBE1(sockparams__inc__ref, struct sockparams *, (sp));	\
	mutex_enter(&(sp)->sp_lock);					\
	(sp)->sp_refcnt += 1;						\
	ASSERT(0 != (sp)->sp_refcnt);					\
	mutex_exit(&(sp)->sp_lock);					\
}
| |
/*
 * Drop a reference on a sockparams entry.
 *
 * Three cases, all decided under sp_lock:
 *  - not the last reference: just decrement;
 *  - last reference on an ephemeral entry: the count is left untouched,
 *    the lock is dropped and sockparams_ephemeral_drop_last_ref() is
 *    called, so the thread dropping the last ref destroys the entry;
 *  - last reference on a regular entry: decrement, release the socket
 *    module reference (if any) and clear sp_smod_info.
 */
#define	SOCKPARAMS_DEC_REF(sp) {					\
	ASSERT(NULL != (sp));						\
	DTRACE_PROBE1(sockparams__dec__ref, struct sockparams *, (sp));	\
	mutex_enter(&(sp)->sp_lock);					\
	ASSERT((sp)->sp_refcnt > 0);					\
	if ((sp)->sp_refcnt != 1) {					\
		(sp)->sp_refcnt--;					\
		mutex_exit(&(sp)->sp_lock);				\
	} else if (((sp)->sp_flags & SOCKPARAMS_EPHEMERAL) != 0) {	\
		mutex_exit(&(sp)->sp_lock);				\
		sockparams_ephemeral_drop_last_ref((sp));		\
	} else {							\
		(sp)->sp_refcnt--;					\
		if ((sp)->sp_smod_info != NULL) {			\
			SMOD_DEC_REF(sp, (sp)->sp_smod_info);		\
		}							\
		(sp)->sp_smod_info = NULL;				\
		mutex_exit(&(sp)->sp_lock);				\
	}								\
}
| |
| /* |
| * Used to traverse the list of AF_UNIX sockets to construct the kstat |
| * for netstat(1m). |
| */ |
| struct socklist { |
| kmutex_t sl_lock; |
| struct sonode *sl_list; |
| }; |
| |
| extern struct socklist socklist; |
/*
 * sendfile counters.
 *
 * ss_full_waits counts how often the reader thread waits because the queue
 * is full; ss_empty_waits counts how often the consumer thread waits
 * because the queue is empty.  They are updated without locks since they
 * are only indicators of whether disk or network or both is slow or fast.
 */
struct sendfile_stats {
	uint32_t	ss_file_cached;
	uint32_t	ss_file_not_cached;
	uint32_t	ss_full_waits;
	uint32_t	ss_empty_waits;
	uint32_t	ss_file_segmap;
};
| |
| /* |
| * A single sendfile request is represented by snf_req. |
| */ |
| typedef struct snf_req { |
| struct snf_req *sr_next; |
| mblk_t *sr_mp_head; |
| mblk_t *sr_mp_tail; |
| kmutex_t sr_lock; |
| kcondvar_t sr_cv; |
| uint_t sr_qlen; |
| int sr_hiwat; |
| int sr_lowat; |
| int sr_operation; |
| struct vnode *sr_vp; |
| file_t *sr_fp; |
| ssize_t sr_maxpsz; |
| u_offset_t sr_file_off; |
| u_offset_t sr_file_size; |
| #define SR_READ_DONE 0x80000000 |
| int sr_read_error; |
| int sr_write_error; |
| } snf_req_t; |
| |
| /* A queue of sendfile requests */ |
| struct sendfile_queue { |
| snf_req_t *snfq_req_head; |
| snf_req_t *snfq_req_tail; |
| kmutex_t snfq_lock; |
| kcondvar_t snfq_cv; |
| int snfq_svc_threads; /* # of service threads */ |
| int snfq_idle_cnt; /* # of idling threads */ |
| int snfq_max_threads; |
| int snfq_req_cnt; /* Number of requests */ |
| }; |
| |
#define	READ_OP		1

/* 5 minutes, expressed in clock ticks (hz ticks per second) */
#define	SNFQ_TIMEOUT	(60 * 5 * hz)
| |
| /* Socket network operations switch */ |
| struct sonodeops { |
| int (*sop_init)(struct sonode *, struct sonode *, cred_t *, |
| int); |
| int (*sop_accept)(struct sonode *, int, cred_t *, struct sonode **); |
| int (*sop_bind)(struct sonode *, struct sockaddr *, socklen_t, |
| int, cred_t *); |
| int (*sop_listen)(struct sonode *, int, cred_t *); |
| int (*sop_connect)(struct sonode *, const struct sockaddr *, |
| socklen_t, int, int, cred_t *); |
| int (*sop_recvmsg)(struct sonode *, struct msghdr *, |
| struct uio *, cred_t *); |
| int (*sop_sendmsg)(struct sonode *, struct msghdr *, |
| struct uio *, cred_t *); |
| int (*sop_sendmblk)(struct sonode *, struct msghdr *, int, |
| cred_t *, mblk_t **); |
| int (*sop_getpeername)(struct sonode *, struct sockaddr *, |
| socklen_t *, boolean_t, cred_t *); |
| int (*sop_getsockname)(struct sonode *, struct sockaddr *, |
| socklen_t *, cred_t *); |
| int (*sop_shutdown)(struct sonode *, int, cred_t *); |
| int (*sop_getsockopt)(struct sonode *, int, int, void *, |
| socklen_t *, int, cred_t *); |
| int (*sop_setsockopt)(struct sonode *, int, int, const void *, |
| socklen_t, cred_t *); |
| int (*sop_ioctl)(struct sonode *, int, intptr_t, int, |
| cred_t *, int32_t *); |
| int (*sop_poll)(struct sonode *, short, int, short *, |
| struct pollhead **); |
| int (*sop_close)(struct sonode *, int, cred_t *); |
| }; |
| |
/*
 * Dispatch wrappers: each SOP_X(so, ...) calls so->so_ops->sop_x(so, ...)
 * with the remaining arguments passed through unchanged.  `so' is evaluated
 * twice, so it must not have side effects.
 */
#define	SOP_INIT(so, pso, cr, flags)	\
	((so)->so_ops->sop_init((so), (pso), (cr), (flags)))
#define	SOP_ACCEPT(so, fflag, cr, nsop)	\
	((so)->so_ops->sop_accept((so), (fflag), (cr), (nsop)))
#define	SOP_BIND(so, name, namelen, flags, cr)	\
	((so)->so_ops->sop_bind((so), (name), (namelen), (flags), (cr)))
#define	SOP_LISTEN(so, backlog, cr)	\
	((so)->so_ops->sop_listen((so), (backlog), (cr)))
#define	SOP_CONNECT(so, name, namelen, fflag, flags, cr)	\
	((so)->so_ops->sop_connect((so), (name), (namelen), (fflag),	\
	    (flags), (cr)))
#define	SOP_RECVMSG(so, msg, uiop, cr)	\
	((so)->so_ops->sop_recvmsg((so), (msg), (uiop), (cr)))
#define	SOP_SENDMSG(so, msg, uiop, cr)	\
	((so)->so_ops->sop_sendmsg((so), (msg), (uiop), (cr)))
#define	SOP_SENDMBLK(so, msg, size, cr, mpp)	\
	((so)->so_ops->sop_sendmblk((so), (msg), (size), (cr), (mpp)))
#define	SOP_GETPEERNAME(so, addr, addrlen, accept, cr)	\
	((so)->so_ops->sop_getpeername((so), (addr), (addrlen),	\
	    (accept), (cr)))
#define	SOP_GETSOCKNAME(so, addr, addrlen, cr)	\
	((so)->so_ops->sop_getsockname((so), (addr), (addrlen), (cr)))
#define	SOP_SHUTDOWN(so, how, cr)	\
	((so)->so_ops->sop_shutdown((so), (how), (cr)))
#define	SOP_GETSOCKOPT(so, level, optname, optval, optlenp, flags, cr)	\
	((so)->so_ops->sop_getsockopt((so), (level), (optname),	\
	    (optval), (optlenp), (flags), (cr)))
#define	SOP_SETSOCKOPT(so, level, optname, optval, optlen, cr)	\
	((so)->so_ops->sop_setsockopt((so), (level), (optname),	\
	    (optval), (optlen), (cr)))
#define	SOP_IOCTL(so, cmd, arg, mode, cr, rvalp)	\
	((so)->so_ops->sop_ioctl((so), (cmd), (arg), (mode), (cr), (rvalp)))
#define	SOP_POLL(so, events, anyyet, reventsp, phpp)	\
	((so)->so_ops->sop_poll((so), (events), (anyyet), (reventsp), (phpp)))
#define	SOP_CLOSE(so, flag, cr)	\
	((so)->so_ops->sop_close((so), (flag), (cr)))
| |
| #endif /* defined(_KERNEL) || defined(_KMEMUSER) */ |
| |
| #ifdef _KERNEL |
| |
/* True when addr is aligned on a _CMSG_HDR_ALIGNMENT boundary. */
#define	ISALIGNED_cmsghdr(addr)	\
	(((uintptr_t)(addr) & (_CMSG_HDR_ALIGNMENT - 1)) == 0)

/* Round len up to the next multiple of _CMSG_HDR_ALIGNMENT. */
#define	ROUNDUP_cmsglen(len)	\
	(((len) + _CMSG_HDR_ALIGNMENT - 1) & ~(_CMSG_HDR_ALIGNMENT - 1))

/* True for a VSOCK vnode that has no stream attached. */
#define	IS_NON_STREAM_SOCK(vp)	\
	((vp)->v_type == VSOCK && (vp)->v_stream == NULL)

/*
 * Macros that operate on struct cmsghdr.
 * Used in parsing msg_control.
 *
 * CMSG_NEXT	   - header following cmsg, i.e. cmsg advanced by its
 *		     alignment-rounded cmsg_len.  The expansion is fully
 *		     parenthesized so that CMSG_NEXT(c)->cmsg_len works.
 * CMSG_CONTENT	   - address of the bytes right after the header.
 * CMSG_CONTENTLEN - cmsg_len minus the header size.
 * CMSG_VALID	   - cmsg is aligned, lies inside [start, end), is at least
 *		     a header long and ends at or before `end'.  It does not
 *		     assume that the last option buffer is padded.  The end
 *		     check compares cmsg_len against the space remaining
 *		     (end - cmsg) instead of computing cmsg + cmsg_len, so a
 *		     huge cmsg_len cannot wrap the address and be accepted.
 */
#define	CMSG_NEXT(cmsg)	\
	((struct cmsghdr *)((uintptr_t)(cmsg) +	\
	    ROUNDUP_cmsglen((cmsg)->cmsg_len)))
#define	CMSG_CONTENT(cmsg)	(&((cmsg)[1]))
#define	CMSG_CONTENTLEN(cmsg)	((cmsg)->cmsg_len - sizeof (struct cmsghdr))
#define	CMSG_VALID(cmsg, start, end)	\
	(ISALIGNED_cmsghdr(cmsg) &&	\
	((uintptr_t)(cmsg) >= (uintptr_t)(start)) &&	\
	((uintptr_t)(cmsg) < (uintptr_t)(end)) &&	\
	((cmsg)->cmsg_len >= sizeof (struct cmsghdr)) &&	\
	((cmsg)->cmsg_len <= (uintptr_t)(end) - (uintptr_t)(cmsg)))
| |
/*
 * Upper bound on the size of any argument that is copied in (addresses,
 * options, access rights).  MUST be at least MAXPATHLEN + 3.
 * BSD and SunOS 4.X limited this to MLEN or MCLBYTES.
 */
#define	SO_MAXARGSIZE	8192
| |
/*
 * Convert between vnode and sonode: the vnode's v_data points at the
 * sonode, and the sonode's so_vnode points back at the vnode.
 */
#define	VTOSO(vp)	((struct sonode *)((vp)->v_data))
#define	SOTOV(so)	((so)->so_vnode)
| |
/*
 * Internal flags for sobind()
 */
#define	_SOBIND_REBIND		0x01	/* Bind to existing local address */
#define	_SOBIND_UNSPEC		0x02	/* Bind to unspecified address */
#define	_SOBIND_LOCK_HELD	0x04	/* so_excl_lock held by caller */
#define	_SOBIND_NOXLATE		0x08	/* No addr translation for AF_UNIX */
#define	_SOBIND_XPG4_2		0x10	/* xpg4.2 semantics */
#define	_SOBIND_SOCKBSD		0x20	/* BSD semantics */
#define	_SOBIND_LISTEN		0x40	/* Make into SS_ACCEPTCONN */
/* Internal flag for so_socketpair() to enable listen with backlog = 1 */
#define	_SOBIND_SOCKETPAIR	0x80

/*
 * Internal flags for sounbind()
 */
#define	_SOUNBIND_REBIND	0x01	/* Don't clear fields - will rebind */

/*
 * Internal flags for soconnect()
 */
#define	_SOCONNECT_NOXLATE	0x01	/* No addr translation for AF_UNIX */
#define	_SOCONNECT_DID_BIND	0x02	/* Unbind when connect fails */
#define	_SOCONNECT_XPG4_2	0x04	/* xpg4.2 semantics */

/*
 * Internal flags for sodisconnect()
 */
#define	_SODISCONNECT_LOCK_HELD	0x01	/* so_excl_lock held by caller */

/*
 * Internal flags for sotpi_getsockopt().
 */
#define	_SOGETSOCKOPT_XPG4_2	0x01	/* xpg4.2 semantics */

/*
 * Internal flags for soallocproto*()
 */
#define	_ALLOC_NOSLEEP		0	/* Don't sleep for memory */
#define	_ALLOC_INTR		1	/* Sleep until interrupt */
#define	_ALLOC_SLEEP		2	/* Sleep forever */
| |
| /* |
| * Internal structure for handling AF_UNIX file descriptor passing |
| */ |
| struct fdbuf { |
| int fd_size; /* In bytes, for kmem_free */ |
| int fd_numfd; /* Number of elements below */ |
| char *fd_ebuf; /* Extra buffer to free */ |
| int fd_ebuflen; |
| frtn_t fd_frtn; |
| struct file *fd_fds[1]; /* One or more */ |
| }; |
| #define FDBUF_HDRSIZE (sizeof (struct fdbuf) - sizeof (struct file *)) |
| |
/*
 * Patchable variable that selects which version of socket socket() will
 * create.
 */
extern int	so_default_version;
| |
/*
 * DEBUG support.
 *
 * On DEBUG kernels SOCK_TEST and SOCK_DEBUG are defined, the pr_*() and
 * so_verify_oobstate() helpers are declared, and the printing macros below
 * are live.  On non-DEBUG kernels every printing macro expands to an empty
 * block and its arguments are not evaluated.
 *
 * For eprint, eprintso, dprint and dprintso, `args' must be a complete,
 * parenthesized printf argument list, e.g. dprint(1, ("x = %d\n", x)).
 *
 *   eprint(args)		always prints
 *   eprintso(so, args)		prints if sockprinterr is set and the
 *				socket has SO_DEBUG in so_options
 *   eprintline(error)		prints error with file/line unless error is
 *				EINTR; needs sockprinterr or sockdebug > 0
 *   eprintsoline(so, error)	like eprintso, printing error and file/line
 *   dprint(level, args)	prints if sockdebug > level
 *   dprintso(so, level, args)	dprint restricted to SO_DEBUG sockets
 */
#ifdef DEBUG

/* Turn on extra testing capabilities */
#define	SOCK_TEST
#define	SOCK_DEBUG

char	*pr_state(uint_t, uint_t);
char	*pr_addr(int, struct sockaddr *, t_uscalar_t);
int	so_verify_oobstate(struct sonode *);

extern int	sockdebug;
extern int	sockprinterr;

#define	eprint(args)	printf args
#define	eprintso(so, args)	\
{ if (sockprinterr && ((so)->so_options & SO_DEBUG)) printf args; }
#define	eprintline(error)	\
{	\
	if ((error) != EINTR && (sockprinterr || sockdebug > 0))	\
		printf("socket error %d: line %d file %s\n",	\
		    (error), __LINE__, __FILE__);	\
}

#define	eprintsoline(so, error)	\
{ if (sockprinterr && ((so)->so_options & SO_DEBUG))	\
	printf("socket(%p) error %d: line %d file %s\n",	\
	    (void *)(so), (error), __LINE__, __FILE__);	\
}
#define	dprint(level, args)	{ if (sockdebug > (level)) printf args; }
#define	dprintso(so, level, args)	\
{ if (sockdebug > (level) && ((so)->so_options & SO_DEBUG)) printf args; }

#else	/* !DEBUG */

#define	eprint(args)			{}
#define	eprintso(so, args)		{}
#define	eprintline(error)		{}
#define	eprintsoline(so, error)		{}
#define	dprint(level, args)		{}
#define	dprintso(so, level, args)	{}

#endif	/* DEBUG */
| |
| extern struct vfsops sock_vfsops; |
| extern struct vnodeops *socket_vnodeops; |
| extern const struct fs_operation_def socket_vnodeops_template[]; |
| |
| extern dev_t sockdev; |
| |
| /* |
| * sockfs functions |
| */ |
| extern int sock_getmsg(vnode_t *, struct strbuf *, struct strbuf *, |
| uchar_t *, int *, int, rval_t *); |
| extern int sock_putmsg(vnode_t *, struct strbuf *, struct strbuf *, |
| uchar_t, int, int); |
| extern int sogetvp(char *, vnode_t **, int); |
| extern int sockinit(int, char *); |
| extern int soconfig(int, int, int, char *, int, char *); |
| extern int solookup(int, int, int, struct sockparams **); |
| extern void so_lock_single(struct sonode *); |
| extern void so_unlock_single(struct sonode *, int); |
| extern int so_lock_read(struct sonode *, int); |
| extern int so_lock_read_intr(struct sonode *, int); |
| extern void so_unlock_read(struct sonode *); |
| extern void *sogetoff(mblk_t *, t_uscalar_t, t_uscalar_t, uint_t); |
| extern void so_getopt_srcaddr(void *, t_uscalar_t, |
| void **, t_uscalar_t *); |
| extern int so_getopt_unix_close(void *, t_uscalar_t); |
| extern void fdbuf_free(struct fdbuf *); |
| extern mblk_t *fdbuf_allocmsg(int, struct fdbuf *); |
| extern int fdbuf_create(void *, int, struct fdbuf **); |
| extern void so_closefds(void *, t_uscalar_t, int, int); |
| extern int so_getfdopt(void *, t_uscalar_t, int, void **, int *); |
| t_uscalar_t so_optlen(void *, t_uscalar_t, int); |
| extern void so_cmsg2opt(void *, t_uscalar_t, int, mblk_t *); |
| extern t_uscalar_t |
| so_cmsglen(mblk_t *, void *, t_uscalar_t, int); |
| extern int so_opt2cmsg(mblk_t *, void *, t_uscalar_t, int, |
| void *, t_uscalar_t); |
| extern void soisconnecting(struct sonode *); |
| extern void soisconnected(struct sonode *); |
| extern void soisdisconnected(struct sonode *, int); |
| extern void socantsendmore(struct sonode *); |
| extern void socantrcvmore(struct sonode *); |
| extern void soseterror(struct sonode *, int); |
| extern int sogeterr(struct sonode *, boolean_t); |
| extern int sowaitconnected(struct sonode *, int, int); |
| |
| extern ssize_t soreadfile(file_t *, uchar_t *, u_offset_t, int *, size_t); |
| extern void *sock_kstat_init(zoneid_t); |
| extern void sock_kstat_fini(zoneid_t, void *); |
| extern struct sonode *getsonode(int, int *, file_t **); |
| /* |
| * Function wrappers (mostly around the sonode switch) for |
| * backward compatibility. |
| */ |
| extern int soaccept(struct sonode *, int, struct sonode **); |
| extern int sobind(struct sonode *, struct sockaddr *, socklen_t, |
| int, int); |
| extern int solisten(struct sonode *, int); |
| extern int soconnect(struct sonode *, const struct sockaddr *, socklen_t, |
| int, int); |
| extern int sorecvmsg(struct sonode *, struct nmsghdr *, struct uio *); |
| extern int sosendmsg(struct sonode *, struct nmsghdr *, struct uio *); |
| extern int soshutdown(struct sonode *, int); |
| extern int sogetsockopt(struct sonode *, int, int, void *, socklen_t *, |
| int); |
| extern int sosetsockopt(struct sonode *, int, int, const void *, |
| t_uscalar_t); |
| |
| extern struct sonode *socreate(struct sockparams *, int, int, int, int, |
| int *); |
| |
| extern int so_copyin(const void *, void *, size_t, int); |
| extern int so_copyout(const void *, void *, size_t, int); |
| |
| #endif |
| |
| /* |
| * Internal structure for obtaining sonode information from the socklist. |
| * These types match those corresponding in the sonode structure. |
| * This is not a published interface, and may change at any time. |
| */ |
| struct sockinfo { |
| uint_t si_size; /* real length of this struct */ |
| short si_family; |
| short si_type; |
| ushort_t si_flag; |
| uint_t si_state; |
| uint_t si_ux_laddr_sou_magic; |
| uint_t si_ux_faddr_sou_magic; |
| t_scalar_t si_serv_type; |
| t_uscalar_t si_laddr_soa_len; |
| t_uscalar_t si_faddr_soa_len; |
| uint16_t si_laddr_family; |
| uint16_t si_faddr_family; |
| char si_laddr_sun_path[MAXPATHLEN + 1]; /* NULL terminated */ |
| char si_faddr_sun_path[MAXPATHLEN + 1]; |
| boolean_t si_faddr_noxlate; |
| zoneid_t si_szoneid; |
| }; |
| |
/* Directory where sockmods are stored */
#define	SOCKMOD_PATH	"socketmod"
| |
| #ifdef __cplusplus |
| } |
| #endif |
| |
| #endif /* _SYS_SOCKETVAR_H */ |