diff options
Diffstat (limited to 'net/core/sock.c')
| -rw-r--r-- | net/core/sock.c | 255 | 
1 files changed, 192 insertions, 63 deletions
diff --git a/net/core/sock.c b/net/core/sock.c index 6aa2e7e0b4fb..782343bb925b 100644 --- a/net/core/sock.c +++ b/net/core/sock.c @@ -335,14 +335,68 @@ int __sk_backlog_rcv(struct sock *sk, struct sk_buff *skb)  }  EXPORT_SYMBOL(__sk_backlog_rcv); -static int sock_set_timeout(long *timeo_p, char __user *optval, int optlen) +static int sock_get_timeout(long timeo, void *optval, bool old_timeval)  { -	struct timeval tv; +	struct __kernel_sock_timeval tv; +	int size; -	if (optlen < sizeof(tv)) -		return -EINVAL; -	if (copy_from_user(&tv, optval, sizeof(tv))) -		return -EFAULT; +	if (timeo == MAX_SCHEDULE_TIMEOUT) { +		tv.tv_sec = 0; +		tv.tv_usec = 0; +	} else { +		tv.tv_sec = timeo / HZ; +		tv.tv_usec = ((timeo % HZ) * USEC_PER_SEC) / HZ; +	} + +	if (in_compat_syscall() && !COMPAT_USE_64BIT_TIME) { +		struct old_timeval32 tv32 = { tv.tv_sec, tv.tv_usec }; +		*(struct old_timeval32 *)optval = tv32; +		return sizeof(tv32); +	} + +	if (old_timeval) { +		struct __kernel_old_timeval old_tv; +		old_tv.tv_sec = tv.tv_sec; +		old_tv.tv_usec = tv.tv_usec; +		*(struct __kernel_old_timeval *)optval = old_tv; +		size = sizeof(old_tv); +	} else { +		*(struct __kernel_sock_timeval *)optval = tv; +		size = sizeof(tv); +	} + +	return size; +} + +static int sock_set_timeout(long *timeo_p, char __user *optval, int optlen, bool old_timeval) +{ +	struct __kernel_sock_timeval tv; + +	if (in_compat_syscall() && !COMPAT_USE_64BIT_TIME) { +		struct old_timeval32 tv32; + +		if (optlen < sizeof(tv32)) +			return -EINVAL; + +		if (copy_from_user(&tv32, optval, sizeof(tv32))) +			return -EFAULT; +		tv.tv_sec = tv32.tv_sec; +		tv.tv_usec = tv32.tv_usec; +	} else if (old_timeval) { +		struct __kernel_old_timeval old_tv; + +		if (optlen < sizeof(old_tv)) +			return -EINVAL; +		if (copy_from_user(&old_tv, optval, sizeof(old_tv))) +			return -EFAULT; +		tv.tv_sec = old_tv.tv_sec; +		tv.tv_usec = old_tv.tv_usec; +	} else { +		if (optlen < sizeof(tv)) +			return -EINVAL; +		if (copy_from_user(&tv, optval, sizeof(tv))) +			return -EFAULT; +	}  	if (tv.tv_usec < 0 || tv.tv_usec >= USEC_PER_SEC)  		return -EDOM; @@ -360,8 +414,8 @@ static int sock_set_timeout(long *timeo_p, char __user *optval, int optlen)  	*timeo_p = MAX_SCHEDULE_TIMEOUT;  	if (tv.tv_sec == 0 && tv.tv_usec == 0)  		return 0; -	if (tv.tv_sec < (MAX_SCHEDULE_TIMEOUT/HZ - 1)) -		*timeo_p = tv.tv_sec * HZ + DIV_ROUND_UP(tv.tv_usec, USEC_PER_SEC / HZ); +	if (tv.tv_sec < (MAX_SCHEDULE_TIMEOUT / HZ - 1)) +		*timeo_p = tv.tv_sec * HZ + DIV_ROUND_UP((unsigned long)tv.tv_usec, USEC_PER_SEC / HZ);  	return 0;  } @@ -520,14 +574,11 @@ struct dst_entry *sk_dst_check(struct sock *sk, u32 cookie)  }  EXPORT_SYMBOL(sk_dst_check); -static int sock_setbindtodevice(struct sock *sk, char __user *optval, -				int optlen) +static int sock_setbindtodevice_locked(struct sock *sk, int ifindex)  {  	int ret = -ENOPROTOOPT;  #ifdef CONFIG_NETDEVICES  	struct net *net = sock_net(sk); -	char devname[IFNAMSIZ]; -	int index;  	/* Sorry... */  	ret = -EPERM; @@ -535,6 +586,32 @@ static int sock_setbindtodevice(struct sock *sk, char __user *optval,  		goto out;  	ret = -EINVAL; +	if (ifindex < 0) +		goto out; + +	sk->sk_bound_dev_if = ifindex; +	if (sk->sk_prot->rehash) +		sk->sk_prot->rehash(sk); +	sk_dst_reset(sk); + +	ret = 0; + +out: +#endif + +	return ret; +} + +static int sock_setbindtodevice(struct sock *sk, char __user *optval, +				int optlen) +{ +	int ret = -ENOPROTOOPT; +#ifdef CONFIG_NETDEVICES +	struct net *net = sock_net(sk); +	char devname[IFNAMSIZ]; +	int index; + +	ret = -EINVAL;  	if (optlen < 0)  		goto out; @@ -566,14 +643,9 @@ static int sock_setbindtodevice(struct sock *sk, char __user *optval,  	}  	lock_sock(sk); -	sk->sk_bound_dev_if = index; -	if (sk->sk_prot->rehash) -		sk->sk_prot->rehash(sk); -	sk_dst_reset(sk); +	ret = sock_setbindtodevice_locked(sk, index);  	release_sock(sk); -	ret = 0; -  out:  #endif @@ -713,6 +785,10 @@ int sock_setsockopt(struct socket *sock, int level, int optname,  		 */  		val = min_t(u32, val, sysctl_wmem_max);  set_sndbuf: +		/* Ensure val * 2 fits into an int, to prevent max_t() +		 * from treating it as a negative value. +		 */ +		val = min_t(int, val, INT_MAX / 2);  		sk->sk_userlocks |= SOCK_SNDBUF_LOCK;  		sk->sk_sndbuf = max_t(int, val * 2, SOCK_MIN_SNDBUF);  		/* Wake up sending tasks if we upped the value. */ @@ -724,6 +800,12 @@ set_sndbuf:  			ret = -EPERM;  			break;  		} + +		/* No negative values (to prevent underflow, as val will be +		 * multiplied by 2). +		 */ +		if (val < 0) +			val = 0;  		goto set_sndbuf;  	case SO_RCVBUF: @@ -734,6 +816,10 @@ set_sndbuf:  		 */  		val = min_t(u32, val, sysctl_rmem_max);  set_rcvbuf: +		/* Ensure val * 2 fits into an int, to prevent max_t() +		 * from treating it as a negative value. +		 */ +		val = min_t(int, val, INT_MAX / 2);  		sk->sk_userlocks |= SOCK_RCVBUF_LOCK;  		/*  		 * We double it on the way in to account for @@ -758,6 +844,12 @@ set_rcvbuf:  			ret = -EPERM;  			break;  		} + +		/* No negative values (to prevent underflow, as val will be +		 * multiplied by 2). +		 */ +		if (val < 0) +			val = 0;  		goto set_rcvbuf;  	case SO_KEEPALIVE: @@ -815,10 +907,17 @@ set_rcvbuf:  			clear_bit(SOCK_PASSCRED, &sock->flags);  		break; -	case SO_TIMESTAMP: -	case SO_TIMESTAMPNS: +	case SO_TIMESTAMP_OLD: +	case SO_TIMESTAMP_NEW: +	case SO_TIMESTAMPNS_OLD: +	case SO_TIMESTAMPNS_NEW:  		if (valbool)  { -			if (optname == SO_TIMESTAMP) +			if (optname == SO_TIMESTAMP_NEW || optname == SO_TIMESTAMPNS_NEW) +				sock_set_flag(sk, SOCK_TSTAMP_NEW); +			else +				sock_reset_flag(sk, SOCK_TSTAMP_NEW); + +			if (optname == SO_TIMESTAMP_OLD || optname == SO_TIMESTAMP_NEW)  				sock_reset_flag(sk, SOCK_RCVTSTAMPNS);  			else  				sock_set_flag(sk, SOCK_RCVTSTAMPNS); @@ -827,10 +926,14 @@ set_rcvbuf:  		} else {  			sock_reset_flag(sk, SOCK_RCVTSTAMP);  			sock_reset_flag(sk, SOCK_RCVTSTAMPNS); +			sock_reset_flag(sk, SOCK_TSTAMP_NEW);  		}  		break; -	case SO_TIMESTAMPING: +	case SO_TIMESTAMPING_NEW: +		sock_set_flag(sk, SOCK_TSTAMP_NEW); +		/* fall through */ +	case SO_TIMESTAMPING_OLD:  		if (val & ~SOF_TIMESTAMPING_MASK) {  			ret = -EINVAL;  			break; @@ -861,9 +964,13 @@ set_rcvbuf:  		if (val & SOF_TIMESTAMPING_RX_SOFTWARE)  			sock_enable_timestamp(sk,  					      SOCK_TIMESTAMPING_RX_SOFTWARE); -		else +		else { +			if (optname == SO_TIMESTAMPING_NEW) +				sock_reset_flag(sk, SOCK_TSTAMP_NEW); +  			sock_disable_timestamp(sk,  					       (1UL << SOCK_TIMESTAMPING_RX_SOFTWARE)); +		}  		break;  	case SO_RCVLOWAT: @@ -875,12 +982,14 @@ set_rcvbuf:  			sk->sk_rcvlowat = val ? : 1;  		break; -	case SO_RCVTIMEO: -		ret = sock_set_timeout(&sk->sk_rcvtimeo, optval, optlen); +	case SO_RCVTIMEO_OLD: +	case SO_RCVTIMEO_NEW: +		ret = sock_set_timeout(&sk->sk_rcvtimeo, optval, optlen, optname == SO_RCVTIMEO_OLD);  		break; -	case SO_SNDTIMEO: -		ret = sock_set_timeout(&sk->sk_sndtimeo, optval, optlen); +	case SO_SNDTIMEO_OLD: +	case SO_SNDTIMEO_NEW: +		ret = sock_set_timeout(&sk->sk_sndtimeo, optval, optlen, optname == SO_SNDTIMEO_OLD);  		break;  	case SO_ATTACH_FILTER: @@ -999,15 +1108,23 @@ set_rcvbuf:  #endif  	case SO_MAX_PACING_RATE: -		if (val != ~0U) +		{ +		unsigned long ulval = (val == ~0U) ? ~0UL : val; + +		if (sizeof(ulval) != sizeof(val) && +		    optlen >= sizeof(ulval) && +		    get_user(ulval, (unsigned long __user *)optval)) { +			ret = -EFAULT; +			break; +		} +		if (ulval != ~0UL)  			cmpxchg(&sk->sk_pacing_status,  				SK_PACING_NONE,  				SK_PACING_NEEDED); -		sk->sk_max_pacing_rate = (val == ~0U) ? ~0UL : val; -		sk->sk_pacing_rate = min(sk->sk_pacing_rate, -					 sk->sk_max_pacing_rate); +		sk->sk_max_pacing_rate = ulval; +		sk->sk_pacing_rate = min(sk->sk_pacing_rate, ulval);  		break; - +		}  	case SO_INCOMING_CPU:  		sk->sk_incoming_cpu = val;  		break; @@ -1055,6 +1172,10 @@ set_rcvbuf:  		}  		break; +	case SO_BINDTOIFINDEX: +		ret = sock_setbindtodevice_locked(sk, val); +		break; +  	default:  		ret = -ENOPROTOOPT;  		break; @@ -1098,8 +1219,11 @@ int sock_getsockopt(struct socket *sock, int level, int optname,  	union {  		int val;  		u64 val64; +		unsigned long ulval;  		struct linger ling; -		struct timeval tm; +		struct old_timeval32 tm32; +		struct __kernel_old_timeval tm; +		struct  __kernel_sock_timeval stm;  		struct sock_txtime txtime;  	} v; @@ -1186,39 +1310,36 @@ int sock_getsockopt(struct socket *sock, int level, int optname,  		sock_warn_obsolete_bsdism("getsockopt");  		break; -	case SO_TIMESTAMP: +	case SO_TIMESTAMP_OLD:  		v.val = sock_flag(sk, SOCK_RCVTSTAMP) && +				!sock_flag(sk, SOCK_TSTAMP_NEW) &&  				!sock_flag(sk, SOCK_RCVTSTAMPNS);  		break; -	case SO_TIMESTAMPNS: -		v.val = sock_flag(sk, SOCK_RCVTSTAMPNS); +	case SO_TIMESTAMPNS_OLD: +		v.val = sock_flag(sk, SOCK_RCVTSTAMPNS) && !sock_flag(sk, SOCK_TSTAMP_NEW);  		break; -	case SO_TIMESTAMPING: +	case SO_TIMESTAMP_NEW: +		v.val = sock_flag(sk, SOCK_RCVTSTAMP) && sock_flag(sk, SOCK_TSTAMP_NEW); +		break; + +	case SO_TIMESTAMPNS_NEW: +		v.val = sock_flag(sk, SOCK_RCVTSTAMPNS) && sock_flag(sk, SOCK_TSTAMP_NEW); +		break; + +	case SO_TIMESTAMPING_OLD:  		v.val = sk->sk_tsflags;  		break; -	case SO_RCVTIMEO: -		lv = sizeof(struct timeval); -		if (sk->sk_rcvtimeo == MAX_SCHEDULE_TIMEOUT) { -			v.tm.tv_sec = 0; -			v.tm.tv_usec = 0; -		} else { -			v.tm.tv_sec = sk->sk_rcvtimeo / HZ; -			v.tm.tv_usec = ((sk->sk_rcvtimeo % HZ) * USEC_PER_SEC) / HZ; -		} +	case SO_RCVTIMEO_OLD: +	case SO_RCVTIMEO_NEW: +		lv = sock_get_timeout(sk->sk_rcvtimeo, &v, SO_RCVTIMEO_OLD == optname);  		break; -	case SO_SNDTIMEO: -		lv = sizeof(struct timeval); -		if (sk->sk_sndtimeo == MAX_SCHEDULE_TIMEOUT) { -			v.tm.tv_sec = 0; -			v.tm.tv_usec = 0; -		} else { -			v.tm.tv_sec = sk->sk_sndtimeo / HZ; -			v.tm.tv_usec = ((sk->sk_sndtimeo % HZ) * USEC_PER_SEC) / HZ; -		} +	case SO_SNDTIMEO_OLD: +	case SO_SNDTIMEO_NEW: +		lv = sock_get_timeout(sk->sk_sndtimeo, &v, SO_SNDTIMEO_OLD == optname);  		break;  	case SO_RCVLOWAT: @@ -1344,8 +1465,13 @@ int sock_getsockopt(struct socket *sock, int level, int optname,  #endif  	case SO_MAX_PACING_RATE: -		/* 32bit version */ -		v.val = min_t(unsigned long, sk->sk_max_pacing_rate, ~0U); +		if (sizeof(v.ulval) != sizeof(v.val) && len >= sizeof(v.ulval)) { +			lv = sizeof(v.ulval); +			v.ulval = sk->sk_max_pacing_rate; +		} else { +			/* 32bit version */ +			v.val = min_t(unsigned long, sk->sk_max_pacing_rate, ~0U); +		}  		break;  	case SO_INCOMING_CPU: @@ -1399,6 +1525,10 @@ int sock_getsockopt(struct socket *sock, int level, int optname,  				  SOF_TXTIME_REPORT_ERRORS : 0;  		break; +	case SO_BINDTOIFINDEX: +		v.val = sk->sk_bound_dev_if; +		break; +  	default:  		/* We implement the SO_SNDLOWAT etc to not be settable  		 * (1003.1g 7). @@ -1726,7 +1856,6 @@ struct sock *sk_clone_lock(const struct sock *sk, const gfp_t priority)  		newsk->sk_err_soft = 0;  		newsk->sk_priority = 0;  		newsk->sk_incoming_cpu = raw_smp_processor_id(); -		atomic64_set(&newsk->sk_cookie, 0);  		if (likely(newsk->sk_net_refcnt))  			sock_inuse_add(sock_net(newsk), 1); @@ -1750,7 +1879,7 @@ struct sock *sk_clone_lock(const struct sock *sk, const gfp_t priority)  		 */  		sk_refcnt_debug_inc(newsk);  		sk_set_socket(newsk, NULL); -		newsk->sk_wq = NULL; +		RCU_INIT_POINTER(newsk->sk_wq, NULL);  		if (newsk->sk_prot->sockets_allocated)  			sk_sockets_allocated_inc(newsk); @@ -2122,7 +2251,7 @@ int __sock_cmsg_send(struct sock *sk, struct msghdr *msg, struct cmsghdr *cmsg,  			return -EINVAL;  		sockc->mark = *(u32 *)CMSG_DATA(cmsg);  		break; -	case SO_TIMESTAMPING: +	case SO_TIMESTAMPING_OLD:  		if (cmsg->cmsg_len != CMSG_LEN(sizeof(u32)))  			return -EINVAL; @@ -2380,7 +2509,7 @@ int __sk_mem_raise_allocated(struct sock *sk, int size, int amt, int kind)  	}  	if (sk_has_memory_pressure(sk)) { -		int alloc; +		u64 alloc;  		if (!sk_under_memory_pressure(sk))  			return 1; @@ -2713,11 +2842,11 @@ void sock_init_data(struct socket *sock, struct sock *sk)  	if (sock) {  		sk->sk_type	=	sock->type; -		sk->sk_wq	=	sock->wq; +		RCU_INIT_POINTER(sk->sk_wq, sock->wq);  		sock->sk	=	sk;  		sk->sk_uid	=	SOCK_INODE(sock)->i_uid;  	} else { -		sk->sk_wq	=	NULL; +		RCU_INIT_POINTER(sk->sk_wq, NULL);  		sk->sk_uid	=	make_kuid(sock_net(sk)->user_ns, 0);  	}  |