version 1.170, 2008/08/04 03:55:47 |
version 1.177.4.3.2.1, 2011/08/08 19:47:01 |
|
|
/* $NetBSD$ */ |
/* $NetBSD$ */ |
|
|
/*- |
/*- |
* Copyright (c) 2002, 2007, 2008 The NetBSD Foundation, Inc. |
* Copyright (c) 2002, 2007, 2008, 2009 The NetBSD Foundation, Inc. |
* All rights reserved. |
* All rights reserved. |
* |
* |
* This code is derived from software contributed to The NetBSD Foundation |
* This code is derived from software contributed to The NetBSD Foundation |
* by Jason R. Thorpe of Wasabi Systems, Inc. |
* by Jason R. Thorpe of Wasabi Systems, Inc, and by Andrew Doran. |
* |
* |
* Redistribution and use in source and binary forms, with or without |
* Redistribution and use in source and binary forms, with or without |
* modification, are permitted provided that the following conditions |
* modification, are permitted provided that the following conditions |
|
|
#include <sys/cdefs.h> |
#include <sys/cdefs.h> |
__KERNEL_RCSID(0, "$NetBSD$"); |
__KERNEL_RCSID(0, "$NetBSD$"); |
|
|
#include "opt_inet.h" |
|
#include "opt_sock_counters.h" |
#include "opt_sock_counters.h" |
#include "opt_sosend_loan.h" |
#include "opt_sosend_loan.h" |
#include "opt_mbuftrace.h" |
#include "opt_mbuftrace.h" |
Line 77 __KERNEL_RCSID(0, "$NetBSD$"); |
|
Line 76 __KERNEL_RCSID(0, "$NetBSD$"); |
|
#include <sys/proc.h> |
#include <sys/proc.h> |
#include <sys/file.h> |
#include <sys/file.h> |
#include <sys/filedesc.h> |
#include <sys/filedesc.h> |
#include <sys/malloc.h> |
#include <sys/kmem.h> |
#include <sys/mbuf.h> |
#include <sys/mbuf.h> |
#include <sys/domain.h> |
#include <sys/domain.h> |
#include <sys/kernel.h> |
#include <sys/kernel.h> |
Line 86 __KERNEL_RCSID(0, "$NetBSD$"); |
|
Line 85 __KERNEL_RCSID(0, "$NetBSD$"); |
|
#include <sys/socketvar.h> |
#include <sys/socketvar.h> |
#include <sys/signalvar.h> |
#include <sys/signalvar.h> |
#include <sys/resourcevar.h> |
#include <sys/resourcevar.h> |
|
#include <sys/uidinfo.h> |
#include <sys/event.h> |
#include <sys/event.h> |
#include <sys/poll.h> |
#include <sys/poll.h> |
#include <sys/kauth.h> |
#include <sys/kauth.h> |
#include <sys/mutex.h> |
#include <sys/mutex.h> |
#include <sys/condvar.h> |
#include <sys/condvar.h> |
|
#include <sys/kthread.h> |
|
|
#include <uvm/uvm.h> |
#include <uvm/uvm.h> |
|
|
Line 136 int sock_loan_thresh = 4096; |
|
Line 137 int sock_loan_thresh = 4096; |
|
#endif |
#endif |
|
|
static kmutex_t so_pendfree_lock; |
static kmutex_t so_pendfree_lock; |
static struct mbuf *so_pendfree; |
static struct mbuf *so_pendfree = NULL; |
|
|
#ifndef SOMAXKVA |
#ifndef SOMAXKVA |
#define SOMAXKVA (16 * 1024 * 1024) |
#define SOMAXKVA (16 * 1024 * 1024) |
Line 147 static kcondvar_t socurkva_cv; |
|
Line 148 static kcondvar_t socurkva_cv; |
|
|
|
#define SOCK_LOAN_CHUNK 65536 |
#define SOCK_LOAN_CHUNK 65536 |
|
|
static size_t sodopendfree(void); |
static void sopendfree_thread(void *); |
static size_t sodopendfreel(void); |
static kcondvar_t pendfree_thread_cv; |
|
static lwp_t *sopendfree_lwp; |
|
|
static vsize_t |
static vsize_t |
sokvareserve(struct socket *so, vsize_t len) |
sokvareserve(struct socket *so, vsize_t len) |
Line 157 sokvareserve(struct socket *so, vsize_t |
|
Line 159 sokvareserve(struct socket *so, vsize_t |
|
|
|
mutex_enter(&so_pendfree_lock); |
mutex_enter(&so_pendfree_lock); |
while (socurkva + len > somaxkva) { |
while (socurkva + len > somaxkva) { |
size_t freed; |
|
|
|
/* |
|
* try to do pendfree. |
|
*/ |
|
|
|
freed = sodopendfreel(); |
|
|
|
/* |
|
* if some kva was freed, try again. |
|
*/ |
|
|
|
if (freed) |
|
continue; |
|
|
|
SOSEND_COUNTER_INCR(&sosend_kvalimit); |
SOSEND_COUNTER_INCR(&sosend_kvalimit); |
error = cv_wait_sig(&socurkva_cv, &so_pendfree_lock); |
error = cv_wait_sig(&socurkva_cv, &so_pendfree_lock); |
if (error) { |
if (error) { |
Line 264 sodoloanfree(struct vm_page **pgs, void |
|
Line 251 sodoloanfree(struct vm_page **pgs, void |
|
sokvafree(sva, len); |
sokvafree(sva, len); |
} |
} |
|
|
static size_t |
|
sodopendfree(void) |
|
{ |
|
size_t rv; |
|
|
|
if (__predict_true(so_pendfree == NULL)) |
|
return 0; |
|
|
|
mutex_enter(&so_pendfree_lock); |
|
rv = sodopendfreel(); |
|
mutex_exit(&so_pendfree_lock); |
|
|
|
return rv; |
|
} |
|
|
|
/* |
/* |
* sodopendfreel: free mbufs on "pendfree" list. |
* sopendfree_thread: free mbufs on "pendfree" list. |
* unlock and relock so_pendfree_lock when freeing mbufs. |
* unlock and relock so_pendfree_lock when freeing mbufs. |
* |
|
* => called with so_pendfree_lock held. |
|
*/ |
*/ |
|
|
static size_t |
static void |
sodopendfreel(void) |
sopendfree_thread(void *v) |
{ |
{ |
struct mbuf *m, *next; |
struct mbuf *m, *next; |
size_t rv = 0; |
size_t rv; |
|
|
KASSERT(mutex_owned(&so_pendfree_lock)); |
|
|
|
while (so_pendfree != NULL) { |
mutex_enter(&so_pendfree_lock); |
m = so_pendfree; |
|
so_pendfree = NULL; |
|
mutex_exit(&so_pendfree_lock); |
|
|
|
for (; m != NULL; m = next) { |
for (;;) { |
next = m->m_next; |
rv = 0; |
KASSERT((~m->m_flags & (M_EXT|M_EXT_PAGES)) == 0); |
while (so_pendfree != NULL) { |
KASSERT(m->m_ext.ext_refcnt == 0); |
m = so_pendfree; |
|
so_pendfree = NULL; |
|
mutex_exit(&so_pendfree_lock); |
|
|
|
for (; m != NULL; m = next) { |
|
next = m->m_next; |
|
KASSERT((~m->m_flags & (M_EXT|M_EXT_PAGES)) == 0); |
|
KASSERT(m->m_ext.ext_refcnt == 0); |
|
|
|
rv += m->m_ext.ext_size; |
|
sodoloanfree(m->m_ext.ext_pgs, m->m_ext.ext_buf, |
|
m->m_ext.ext_size); |
|
pool_cache_put(mb_cache, m); |
|
} |
|
|
rv += m->m_ext.ext_size; |
mutex_enter(&so_pendfree_lock); |
sodoloanfree(m->m_ext.ext_pgs, m->m_ext.ext_buf, |
|
m->m_ext.ext_size); |
|
pool_cache_put(mb_cache, m); |
|
} |
} |
|
if (rv) |
mutex_enter(&so_pendfree_lock); |
cv_broadcast(&socurkva_cv); |
|
cv_wait(&pendfree_thread_cv, &so_pendfree_lock); |
} |
} |
|
panic("sopendfree_thread"); |
return (rv); |
/* NOTREACHED */ |
} |
} |
|
|
void |
void |
Line 332 soloanfree(struct mbuf *m, void *buf, si |
|
Line 308 soloanfree(struct mbuf *m, void *buf, si |
|
mutex_enter(&so_pendfree_lock); |
mutex_enter(&so_pendfree_lock); |
m->m_next = so_pendfree; |
m->m_next = so_pendfree; |
so_pendfree = m; |
so_pendfree = m; |
cv_broadcast(&socurkva_cv); |
cv_signal(&pendfree_thread_cv); |
mutex_exit(&so_pendfree_lock); |
mutex_exit(&so_pendfree_lock); |
} |
} |
|
|
Line 402 sokva_reclaim_callback(struct callback_e |
|
Line 378 sokva_reclaim_callback(struct callback_e |
|
KASSERT(ce == &sokva_reclaimerentry); |
KASSERT(ce == &sokva_reclaimerentry); |
KASSERT(obj == NULL); |
KASSERT(obj == NULL); |
|
|
sodopendfree(); |
|
if (!vm_map_starved_p(kernel_map)) { |
if (!vm_map_starved_p(kernel_map)) { |
return CALLBACK_CHAIN_ABORT; |
return CALLBACK_CHAIN_ABORT; |
} |
} |
Line 419 getsombuf(struct socket *so, int type) |
|
Line 394 getsombuf(struct socket *so, int type) |
|
return m; |
return m; |
} |
} |
|
|
struct mbuf * |
|
m_intopt(struct socket *so, int val) |
|
{ |
|
struct mbuf *m; |
|
|
|
m = getsombuf(so, MT_SOOPTS); |
|
m->m_len = sizeof(int); |
|
*mtod(m, int *) = val; |
|
return m; |
|
} |
|
|
|
void |
void |
soinit(void) |
soinit() |
{ |
{ |
|
|
mutex_init(&so_pendfree_lock, MUTEX_DEFAULT, IPL_VM); |
mutex_init(&so_pendfree_lock, MUTEX_DEFAULT, IPL_VM); |
softnet_lock = mutex_obj_alloc(MUTEX_DEFAULT, IPL_NONE); |
softnet_lock = mutex_obj_alloc(MUTEX_DEFAULT, IPL_NONE); |
cv_init(&socurkva_cv, "sokva"); |
cv_init(&socurkva_cv, "sokva"); |
|
cv_init(&pendfree_thread_cv, "sopendfr"); |
soinit2(); |
soinit2(); |
|
|
|
|
/* Set the initial adjusted socket buffer size. */ |
/* Set the initial adjusted socket buffer size. */ |
if (sb_max_set(sb_max)) |
if (sb_max_set(sb_max)) |
panic("bad initial sb_max value: %lu", sb_max); |
panic("bad initial sb_max value: %lu", sb_max); |
|
|
&sokva_reclaimerentry, NULL, sokva_reclaim_callback); |
&sokva_reclaimerentry, NULL, sokva_reclaim_callback); |
} |
} |
|
|
|
void |
|
soinit1(void) |
|
{ |
|
int error = kthread_create(PRI_NONE, KTHREAD_MPSAFE, NULL, |
|
sopendfree_thread, NULL, &sopendfree_lwp, "sopendfree"); |
|
if (error) |
|
panic("soinit1 %d", error); |
|
} |
|
|
/* |
/* |
* Socket operation routines. |
* Socket operation routines. |
* These routines are called by the routines in |
* These routines are called by the routines in |
Line 625 sofree(struct socket *so) |
|
Line 599 sofree(struct socket *so) |
|
KASSERT(!cv_has_waiters(&so->so_snd.sb_cv)); |
KASSERT(!cv_has_waiters(&so->so_snd.sb_cv)); |
sorflush(so); |
sorflush(so); |
refs = so->so_aborting; /* XXX */ |
refs = so->so_aborting; /* XXX */ |
#ifdef INET |
/* Remove accept filter if one is present. */ |
/* remove accept filter if one is present. */ |
|
if (so->so_accf != NULL) |
if (so->so_accf != NULL) |
do_setopt_accept_filter(so, NULL); |
(void)accept_filt_clear(so); |
#endif |
|
sounlock(so); |
sounlock(so); |
if (refs == 0) /* XXX */ |
if (refs == 0) /* XXX */ |
soput(so); |
soput(so); |
Line 650 soclose(struct socket *so) |
|
Line 622 soclose(struct socket *so) |
|
error = 0; |
error = 0; |
solock(so); |
solock(so); |
if (so->so_options & SO_ACCEPTCONN) { |
if (so->so_options & SO_ACCEPTCONN) { |
do { |
for (;;) { |
while ((so2 = TAILQ_FIRST(&so->so_q0)) != 0) { |
if ((so2 = TAILQ_FIRST(&so->so_q0)) != 0) { |
KASSERT(solocked2(so, so2)); |
KASSERT(solocked2(so, so2)); |
(void) soqremque(so2, 0); |
(void) soqremque(so2, 0); |
/* soabort drops the lock. */ |
/* soabort drops the lock. */ |
(void) soabort(so2); |
(void) soabort(so2); |
solock(so); |
solock(so); |
|
continue; |
} |
} |
while ((so2 = TAILQ_FIRST(&so->so_q)) != 0) { |
if ((so2 = TAILQ_FIRST(&so->so_q)) != 0) { |
KASSERT(solocked2(so, so2)); |
KASSERT(solocked2(so, so2)); |
(void) soqremque(so2, 1); |
(void) soqremque(so2, 1); |
/* soabort drops the lock. */ |
/* soabort drops the lock. */ |
(void) soabort(so2); |
(void) soabort(so2); |
solock(so); |
solock(so); |
|
continue; |
} |
} |
} while (!TAILQ_EMPTY(&so->so_q0)); |
break; |
|
} |
} |
} |
if (so->so_pcb == 0) |
if (so->so_pcb == 0) |
goto discard; |
goto discard; |
Line 679 soclose(struct socket *so) |
|
Line 654 soclose(struct socket *so) |
|
if ((so->so_state & SS_ISDISCONNECTING) && so->so_nbio) |
if ((so->so_state & SS_ISDISCONNECTING) && so->so_nbio) |
goto drop; |
goto drop; |
while (so->so_state & SS_ISCONNECTED) { |
while (so->so_state & SS_ISCONNECTED) { |
error = sowait(so, so->so_linger * hz); |
error = sowait(so, true, so->so_linger * hz); |
if (error) |
if (error) |
break; |
break; |
} |
} |
Line 797 sodisconnect(struct socket *so) |
|
Line 772 sodisconnect(struct socket *so) |
|
error = (*so->so_proto->pr_usrreq)(so, PRU_DISCONNECT, |
error = (*so->so_proto->pr_usrreq)(so, PRU_DISCONNECT, |
NULL, NULL, NULL, NULL); |
NULL, NULL, NULL, NULL); |
} |
} |
sodopendfree(); |
|
return (error); |
return (error); |
} |
} |
|
|
Line 829 sosend(struct socket *so, struct mbuf *a |
|
Line 803 sosend(struct socket *so, struct mbuf *a |
|
int error, s, dontroute, atomic; |
int error, s, dontroute, atomic; |
|
|
p = l->l_proc; |
p = l->l_proc; |
sodopendfree(); |
|
clen = 0; |
clen = 0; |
|
|
/* |
/* |
Line 1098 soreceive(struct socket *so, struct mbuf |
|
Line 1071 soreceive(struct socket *so, struct mbuf |
|
else |
else |
flags = 0; |
flags = 0; |
|
|
if ((flags & MSG_DONTWAIT) == 0) |
|
sodopendfree(); |
|
|
|
if (flags & MSG_OOB) { |
if (flags & MSG_OOB) { |
m = m_get(M_WAIT, MT_DATA); |
m = m_get(M_WAIT, MT_DATA); |
solock(so); |
solock(so); |
Line 1546 soshutdown(struct socket *so, int how) |
|
Line 1516 soshutdown(struct socket *so, int how) |
|
return error; |
return error; |
} |
} |
|
|
|
int |
|
sodrain(struct socket *so) |
|
{ |
|
int error; |
|
|
|
solock(so); |
|
so->so_state |= SS_ISDRAINING; |
|
cv_broadcast(&so->so_cv); |
|
error = soshutdown(so, SHUT_RDWR); |
|
sounlock(so); |
|
|
|
return error; |
|
} |
|
|
void |
void |
sorflush(struct socket *so) |
sorflush(struct socket *so) |
{ |
{ |
Line 1575 sorflush(struct socket *so) |
|
Line 1559 sorflush(struct socket *so) |
|
sbrelease(&asb, so); |
sbrelease(&asb, so); |
} |
} |
|
|
|
/* |
|
* internal set SOL_SOCKET options |
|
*/ |
static int |
static int |
sosetopt1(struct socket *so, int level, int optname, struct mbuf *m) |
sosetopt1(struct socket *so, const struct sockopt *sopt) |
{ |
{ |
#ifdef INET |
int error, optval; |
int error, optval, val; |
struct linger l; |
#else |
struct timeval tv; |
int optval, val; |
|
#endif |
|
struct linger *l; |
|
struct sockbuf *sb; |
|
struct timeval *tv; |
|
|
|
switch (optname) { |
switch (sopt->sopt_name) { |
|
|
#ifdef INET |
|
case SO_ACCEPTFILTER: |
case SO_ACCEPTFILTER: |
error = do_setopt_accept_filter(so, m); |
error = accept_filt_setopt(so, sopt); |
if (error) |
KASSERT(solocked(so)); |
return error; |
|
break; |
break; |
#endif |
|
|
|
case SO_LINGER: |
case SO_LINGER: |
if (m == NULL || m->m_len != sizeof(struct linger)) |
error = sockopt_get(sopt, &l, sizeof(l)); |
return EINVAL; |
solock(so); |
l = mtod(m, struct linger *); |
if (error) |
if (l->l_linger < 0 || l->l_linger > USHRT_MAX || |
break; |
l->l_linger > (INT_MAX / hz)) |
if (l.l_linger < 0 || l.l_linger > USHRT_MAX || |
return EDOM; |
l.l_linger > (INT_MAX / hz)) { |
so->so_linger = l->l_linger; |
error = EDOM; |
if (l->l_onoff) |
break; |
so->so_options |= SO_LINGER; |
} |
else |
so->so_linger = l.l_linger; |
so->so_options &= ~SO_LINGER; |
if (l.l_onoff) |
break; |
so->so_options |= SO_LINGER; |
|
else |
|
so->so_options &= ~SO_LINGER; |
|
break; |
|
|
case SO_DEBUG: |
case SO_DEBUG: |
case SO_KEEPALIVE: |
case SO_KEEPALIVE: |
Line 1620 sosetopt1(struct socket *so, int level, |
|
Line 1602 sosetopt1(struct socket *so, int level, |
|
case SO_REUSEPORT: |
case SO_REUSEPORT: |
case SO_OOBINLINE: |
case SO_OOBINLINE: |
case SO_TIMESTAMP: |
case SO_TIMESTAMP: |
if (m == NULL || m->m_len < sizeof(int)) |
error = sockopt_getint(sopt, &optval); |
return EINVAL; |
solock(so); |
if (*mtod(m, int *)) |
if (error) |
so->so_options |= optname; |
break; |
|
if (optval) |
|
so->so_options |= sopt->sopt_name; |
else |
else |
so->so_options &= ~optname; |
so->so_options &= ~sopt->sopt_name; |
break; |
break; |
|
|
case SO_SNDBUF: |
case SO_SNDBUF: |
case SO_RCVBUF: |
case SO_RCVBUF: |
case SO_SNDLOWAT: |
case SO_SNDLOWAT: |
case SO_RCVLOWAT: |
case SO_RCVLOWAT: |
if (m == NULL || m->m_len < sizeof(int)) |
error = sockopt_getint(sopt, &optval); |
return EINVAL; |
solock(so); |
|
if (error) |
|
break; |
|
|
/* |
/* |
* Values < 1 make no sense for any of these |
* Values < 1 make no sense for any of these |
* options, so disallow them. |
* options, so disallow them. |
*/ |
*/ |
optval = *mtod(m, int *); |
if (optval < 1) { |
if (optval < 1) |
error = EINVAL; |
return EINVAL; |
break; |
|
} |
switch (optname) { |
|
|
|
|
switch (sopt->sopt_name) { |
case SO_SNDBUF: |
case SO_SNDBUF: |
|
if (sbreserve(&so->so_snd, (u_long)optval, so) == 0) { |
|
error = ENOBUFS; |
|
break; |
|
} |
|
so->so_snd.sb_flags &= ~SB_AUTOSIZE; |
|
break; |
|
|
case SO_RCVBUF: |
case SO_RCVBUF: |
sb = (optname == SO_SNDBUF) ? |
if (sbreserve(&so->so_rcv, (u_long)optval, so) == 0) { |
&so->so_snd : &so->so_rcv; |
error = ENOBUFS; |
if (sbreserve(sb, (u_long)optval, so) == 0) |
break; |
return ENOBUFS; |
} |
sb->sb_flags &= ~SB_AUTOSIZE; |
so->so_rcv.sb_flags &= ~SB_AUTOSIZE; |
break; |
break; |
|
|
/* |
/* |
Line 1659 sosetopt1(struct socket *so, int level, |
|
Line 1652 sosetopt1(struct socket *so, int level, |
|
* the high-water. |
* the high-water. |
*/ |
*/ |
case SO_SNDLOWAT: |
case SO_SNDLOWAT: |
so->so_snd.sb_lowat = |
if (optval > so->so_snd.sb_hiwat) |
(optval > so->so_snd.sb_hiwat) ? |
optval = so->so_snd.sb_hiwat; |
so->so_snd.sb_hiwat : optval; |
|
|
so->so_snd.sb_lowat = optval; |
break; |
break; |
|
|
case SO_RCVLOWAT: |
case SO_RCVLOWAT: |
so->so_rcv.sb_lowat = |
if (optval > so->so_rcv.sb_hiwat) |
(optval > so->so_rcv.sb_hiwat) ? |
optval = so->so_rcv.sb_hiwat; |
so->so_rcv.sb_hiwat : optval; |
|
|
so->so_rcv.sb_lowat = optval; |
break; |
break; |
} |
} |
break; |
break; |
|
|
case SO_SNDTIMEO: |
case SO_SNDTIMEO: |
case SO_RCVTIMEO: |
case SO_RCVTIMEO: |
if (m == NULL || m->m_len < sizeof(*tv)) |
error = sockopt_get(sopt, &tv, sizeof(tv)); |
return EINVAL; |
solock(so); |
tv = mtod(m, struct timeval *); |
if (error) |
if (tv->tv_sec > (INT_MAX - tv->tv_usec / tick) / hz) |
break; |
return EDOM; |
|
val = tv->tv_sec * hz + tv->tv_usec / tick; |
|
if (val == 0 && tv->tv_usec != 0) |
|
val = 1; |
|
|
|
switch (optname) { |
if (tv.tv_sec > (INT_MAX - tv.tv_usec / tick) / hz) { |
|
error = EDOM; |
|
break; |
|
} |
|
|
|
optval = tv.tv_sec * hz + tv.tv_usec / tick; |
|
if (optval == 0 && tv.tv_usec != 0) |
|
optval = 1; |
|
|
|
switch (sopt->sopt_name) { |
case SO_SNDTIMEO: |
case SO_SNDTIMEO: |
so->so_snd.sb_timeo = val; |
so->so_snd.sb_timeo = optval; |
break; |
break; |
case SO_RCVTIMEO: |
case SO_RCVTIMEO: |
so->so_rcv.sb_timeo = val; |
so->so_rcv.sb_timeo = optval; |
break; |
break; |
} |
} |
break; |
break; |
|
|
default: |
default: |
return ENOPROTOOPT; |
solock(so); |
|
error = ENOPROTOOPT; |
|
break; |
} |
} |
return 0; |
KASSERT(solocked(so)); |
|
return error; |
} |
} |
|
|
int |
int |
sosetopt(struct socket *so, int level, int optname, struct mbuf *m) |
sosetopt(struct socket *so, struct sockopt *sopt) |
{ |
{ |
int error, prerr; |
int error, prerr; |
|
|
solock(so); |
if (sopt->sopt_level == SOL_SOCKET) { |
if (level == SOL_SOCKET) |
error = sosetopt1(so, sopt); |
error = sosetopt1(so, level, optname, m); |
KASSERT(solocked(so)); |
else |
} else { |
error = ENOPROTOOPT; |
error = ENOPROTOOPT; |
|
solock(so); |
|
} |
|
|
if ((error == 0 || error == ENOPROTOOPT) && |
if ((error == 0 || error == ENOPROTOOPT) && |
so->so_proto != NULL && so->so_proto->pr_ctloutput != NULL) { |
so->so_proto != NULL && so->so_proto->pr_ctloutput != NULL) { |
/* give the protocol stack a shot */ |
/* give the protocol stack a shot */ |
prerr = (*so->so_proto->pr_ctloutput)(PRCO_SETOPT, so, level, |
prerr = (*so->so_proto->pr_ctloutput)(PRCO_SETOPT, so, sopt); |
optname, &m); |
|
if (prerr == 0) |
if (prerr == 0) |
error = 0; |
error = 0; |
else if (prerr != ENOPROTOOPT) |
else if (prerr != ENOPROTOOPT) |
error = prerr; |
error = prerr; |
} else if (m != NULL) |
} |
(void)m_free(m); |
|
sounlock(so); |
sounlock(so); |
return error; |
return error; |
} |
} |
|
|
|
/* |
|
* so_setsockopt() is a wrapper providing a sockopt structure for sosetopt() |
|
*/ |
|
int |
|
so_setsockopt(struct lwp *l, struct socket *so, int level, int name, |
|
const void *val, size_t valsize) |
|
{ |
|
struct sockopt sopt; |
|
int error; |
|
|
|
KASSERT(valsize == 0 || val != NULL); |
|
|
|
sockopt_init(&sopt, level, name, valsize); |
|
sockopt_set(&sopt, val, valsize); |
|
|
|
error = sosetopt(so, &sopt); |
|
|
|
sockopt_destroy(&sopt); |
|
|
|
return error; |
|
} |
|
|
|
/* |
|
* internal get SOL_SOCKET options |
|
*/ |
|
static int |
|
sogetopt1(struct socket *so, struct sockopt *sopt) |
|
{ |
|
int error, optval; |
|
struct linger l; |
|
struct timeval tv; |
|
|
|
switch (sopt->sopt_name) { |
|
|
|
case SO_ACCEPTFILTER: |
|
error = accept_filt_getopt(so, sopt); |
|
break; |
|
|
|
case SO_LINGER: |
|
l.l_onoff = (so->so_options & SO_LINGER) ? 1 : 0; |
|
l.l_linger = so->so_linger; |
|
|
|
error = sockopt_set(sopt, &l, sizeof(l)); |
|
break; |
|
|
|
case SO_USELOOPBACK: |
|
case SO_DONTROUTE: |
|
case SO_DEBUG: |
|
case SO_KEEPALIVE: |
|
case SO_REUSEADDR: |
|
case SO_REUSEPORT: |
|
case SO_BROADCAST: |
|
case SO_OOBINLINE: |
|
case SO_TIMESTAMP: |
|
error = sockopt_setint(sopt, |
|
(so->so_options & sopt->sopt_name) ? 1 : 0); |
|
break; |
|
|
|
case SO_TYPE: |
|
error = sockopt_setint(sopt, so->so_type); |
|
break; |
|
|
|
case SO_ERROR: |
|
error = sockopt_setint(sopt, so->so_error); |
|
so->so_error = 0; |
|
break; |
|
|
|
case SO_SNDBUF: |
|
error = sockopt_setint(sopt, so->so_snd.sb_hiwat); |
|
break; |
|
|
|
case SO_RCVBUF: |
|
error = sockopt_setint(sopt, so->so_rcv.sb_hiwat); |
|
break; |
|
|
|
case SO_SNDLOWAT: |
|
error = sockopt_setint(sopt, so->so_snd.sb_lowat); |
|
break; |
|
|
|
case SO_RCVLOWAT: |
|
error = sockopt_setint(sopt, so->so_rcv.sb_lowat); |
|
break; |
|
|
|
case SO_SNDTIMEO: |
|
case SO_RCVTIMEO: |
|
optval = (sopt->sopt_name == SO_SNDTIMEO ? |
|
so->so_snd.sb_timeo : so->so_rcv.sb_timeo); |
|
|
|
tv.tv_sec = optval / hz; |
|
tv.tv_usec = (optval % hz) * tick; |
|
|
|
error = sockopt_set(sopt, &tv, sizeof(tv)); |
|
break; |
|
|
|
case SO_OVERFLOWED: |
|
error = sockopt_setint(sopt, so->so_rcv.sb_overflowed); |
|
break; |
|
|
|
default: |
|
error = ENOPROTOOPT; |
|
break; |
|
} |
|
|
|
return (error); |
|
} |
|
|
int |
int |
sogetopt(struct socket *so, int level, int optname, struct mbuf **mp) |
sogetopt(struct socket *so, struct sockopt *sopt) |
{ |
{ |
struct mbuf *m; |
|
int error; |
int error; |
|
|
solock(so); |
solock(so); |
if (level != SOL_SOCKET) { |
if (sopt->sopt_level != SOL_SOCKET) { |
if (so->so_proto && so->so_proto->pr_ctloutput) { |
if (so->so_proto && so->so_proto->pr_ctloutput) { |
error = ((*so->so_proto->pr_ctloutput) |
error = ((*so->so_proto->pr_ctloutput) |
(PRCO_GETOPT, so, level, optname, mp)); |
(PRCO_GETOPT, so, sopt)); |
} else |
} else |
error = (ENOPROTOOPT); |
error = (ENOPROTOOPT); |
} else { |
} else { |
m = m_get(M_WAIT, MT_SOOPTS); |
error = sogetopt1(so, sopt); |
m->m_len = sizeof(int); |
} |
|
sounlock(so); |
|
return (error); |
|
} |
|
|
switch (optname) { |
/* |
|
* alloc sockopt data buffer |
|
* - will be released at destroy |
|
*/ |
|
static int |
|
sockopt_alloc(struct sockopt *sopt, size_t len, km_flag_t kmflag) |
|
{ |
|
|
#ifdef INET |
KASSERT(sopt->sopt_size == 0); |
case SO_ACCEPTFILTER: |
|
error = do_getopt_accept_filter(so, m); |
|
break; |
|
#endif |
|
|
|
case SO_LINGER: |
if (len > sizeof(sopt->sopt_buf)) { |
m->m_len = sizeof(struct linger); |
sopt->sopt_data = kmem_zalloc(len, kmflag); |
mtod(m, struct linger *)->l_onoff = |
if (sopt->sopt_data == NULL) |
(so->so_options & SO_LINGER) ? 1 : 0; |
return ENOMEM; |
mtod(m, struct linger *)->l_linger = so->so_linger; |
} else |
break; |
sopt->sopt_data = sopt->sopt_buf; |
|
|
case SO_USELOOPBACK: |
sopt->sopt_size = len; |
case SO_DONTROUTE: |
return 0; |
case SO_DEBUG: |
} |
case SO_KEEPALIVE: |
|
case SO_REUSEADDR: |
|
case SO_REUSEPORT: |
|
case SO_BROADCAST: |
|
case SO_OOBINLINE: |
|
case SO_TIMESTAMP: |
|
*mtod(m, int *) = (so->so_options & optname) ? 1 : 0; |
|
break; |
|
|
|
case SO_TYPE: |
/* |
*mtod(m, int *) = so->so_type; |
* initialise sockopt storage |
break; |
* - MAY sleep during allocation |
|
*/ |
|
void |
|
sockopt_init(struct sockopt *sopt, int level, int name, size_t size) |
|
{ |
|
|
case SO_ERROR: |
memset(sopt, 0, sizeof(*sopt)); |
*mtod(m, int *) = so->so_error; |
|
so->so_error = 0; |
|
break; |
|
|
|
case SO_SNDBUF: |
sopt->sopt_level = level; |
*mtod(m, int *) = so->so_snd.sb_hiwat; |
sopt->sopt_name = name; |
break; |
(void)sockopt_alloc(sopt, size, KM_SLEEP); |
|
} |
|
|
case SO_RCVBUF: |
/* |
*mtod(m, int *) = so->so_rcv.sb_hiwat; |
* destroy sockopt storage |
break; |
* - will release any held memory references |
|
*/ |
|
void |
|
sockopt_destroy(struct sockopt *sopt) |
|
{ |
|
|
case SO_SNDLOWAT: |
if (sopt->sopt_data != sopt->sopt_buf) |
*mtod(m, int *) = so->so_snd.sb_lowat; |
kmem_free(sopt->sopt_data, sopt->sopt_size); |
break; |
|
|
|
case SO_RCVLOWAT: |
memset(sopt, 0, sizeof(*sopt)); |
*mtod(m, int *) = so->so_rcv.sb_lowat; |
} |
break; |
|
|
|
case SO_SNDTIMEO: |
/* |
case SO_RCVTIMEO: |
* set sockopt value |
{ |
* - value is copied into sockopt |
int val = (optname == SO_SNDTIMEO ? |
* - memory is allocated when necessary, will not sleep |
so->so_snd.sb_timeo : so->so_rcv.sb_timeo); |
*/ |
|
int |
m->m_len = sizeof(struct timeval); |
sockopt_set(struct sockopt *sopt, const void *buf, size_t len) |
mtod(m, struct timeval *)->tv_sec = val / hz; |
{ |
mtod(m, struct timeval *)->tv_usec = |
int error; |
(val % hz) * tick; |
|
break; |
|
} |
|
|
|
case SO_OVERFLOWED: |
if (sopt->sopt_size == 0) { |
*mtod(m, int *) = so->so_rcv.sb_overflowed; |
error = sockopt_alloc(sopt, len, KM_NOSLEEP); |
break; |
if (error) |
|
return error; |
|
} |
|
|
default: |
KASSERT(sopt->sopt_size == len); |
sounlock(so); |
memcpy(sopt->sopt_data, buf, len); |
(void)m_free(m); |
return 0; |
return (ENOPROTOOPT); |
} |
|
|
|
/*
 * sockopt_setint: store an integer as the sockopt value.
 *
 * Shorthand for sockopt_set() with an int-sized payload; returns
 * whatever sockopt_set() returns.
 */
int
sockopt_setint(struct sockopt *sopt, int val)
{
	int rc;

	rc = sockopt_set(sopt, &val, sizeof(val));
	return rc;
}
|
|
|
/* |
|
* get sockopt value |
|
* - correct size must be given |
|
*/ |
|
int |
|
sockopt_get(const struct sockopt *sopt, void *buf, size_t len) |
|
{ |
|
|
|
if (sopt->sopt_size != len) |
|
return EINVAL; |
|
|
|
memcpy(buf, sopt->sopt_data, len); |
|
return 0; |
|
} |
|
|
|
/*
 * sockopt_getint: fetch the sockopt value as an integer.
 *
 * Shorthand for sockopt_get() with an int-sized destination; returns
 * whatever sockopt_get() returns.
 */
int
sockopt_getint(const struct sockopt *sopt, int *valp)
{
	int rc;

	rc = sockopt_get(sopt, valp, sizeof(*valp));
	return rc;
}
|
|
|
/* |
|
* set sockopt value from mbuf |
|
* - ONLY for legacy code |
|
* - mbuf is released by sockopt |
|
* - will not sleep |
|
*/ |
|
int |
|
sockopt_setmbuf(struct sockopt *sopt, struct mbuf *m) |
|
{ |
|
size_t len; |
|
int error; |
|
|
|
len = m_length(m); |
|
|
|
if (sopt->sopt_size == 0) { |
|
error = sockopt_alloc(sopt, len, KM_NOSLEEP); |
|
if (error) |
|
return error; |
|
} |
|
|
|
KASSERT(sopt->sopt_size == len); |
|
m_copydata(m, 0, len, sopt->sopt_data); |
|
m_freem(m); |
|
|
|
return 0; |
|
} |
|
|
|
/* |
|
* get sockopt value into mbuf |
|
* - ONLY for legacy code |
|
* - mbuf to be released by the caller |
|
* - will not sleep |
|
*/ |
|
struct mbuf * |
|
sockopt_getmbuf(const struct sockopt *sopt) |
|
{ |
|
struct mbuf *m; |
|
|
|
if (sopt->sopt_size > MCLBYTES) |
|
return NULL; |
|
|
|
m = m_get(M_DONTWAIT, MT_SOOPTS); |
|
if (m == NULL) |
|
return NULL; |
|
|
|
if (sopt->sopt_size > MLEN) { |
|
MCLGET(m, M_DONTWAIT); |
|
if ((m->m_flags & M_EXT) == 0) { |
|
m_free(m); |
|
return NULL; |
} |
} |
*mp = m; |
|
error = 0; |
|
} |
} |
|
|
sounlock(so); |
memcpy(mtod(m, void *), sopt->sopt_data, sopt->sopt_size); |
return (error); |
m->m_len = sopt->sopt_size; |
|
|
|
return m; |
} |
} |
|
|
void |
void |
Line 1829 sohasoutofband(struct socket *so) |
|
Line 2023 sohasoutofband(struct socket *so) |
|
{ |
{ |
|
|
fownsignal(so->so_pgid, SIGURG, POLL_PRI, POLLPRI|POLLRDBAND, so); |
fownsignal(so->so_pgid, SIGURG, POLL_PRI, POLLPRI|POLLRDBAND, so); |
selnotify(&so->so_rcv.sb_sel, POLLPRI | POLLRDBAND, 0); |
selnotify(&so->so_rcv.sb_sel, POLLPRI | POLLRDBAND, NOTE_SUBMIT); |
} |
} |
|
|
static void |
static void |