Skip to content

Commit 95766ff

Browse files
Hideo Aoki authored and davem330 committed
[UDP]: Add memory accounting.
Signed-off-by: Takahiro Yasui <[email protected]> Signed-off-by: Hideo Aoki <[email protected]> Signed-off-by: David S. Miller <[email protected]>
1 parent 3ab224b commit 95766ff

File tree

7 files changed

+157
-7
lines changed

7 files changed

+157
-7
lines changed

Documentation/networking/ip-sysctl.txt

Lines changed: 27 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -446,6 +446,33 @@ tcp_dma_copybreak - INTEGER
446446
and CONFIG_NET_DMA is enabled.
447447
Default: 4096
448448

449+
UDP variables:
450+
451+
udp_mem - vector of 3 INTEGERs: min, pressure, max
452+
Number of pages allowed for queueing by all UDP sockets.
453+
454+
min: Below this number of pages UDP is not bothered about its
455+
memory appetite. When the amount of memory allocated by UDP exceeds
456+
this number, UDP starts to moderate memory usage.
457+
458+
pressure: This value was introduced to follow the format of tcp_mem.
459+
460+
max: Number of pages allowed for queueing by all UDP sockets.
461+
462+
Default is calculated at boot time from amount of available memory.
463+
464+
udp_rmem_min - INTEGER
465+
Minimal size of receive buffer used by UDP sockets in moderation.
466+
Each UDP socket is able to use this size for receiving data, even if
467+
total pages of UDP sockets exceed udp_mem pressure. The unit is bytes.
468+
Default: 4096
469+
470+
udp_wmem_min - INTEGER
471+
Minimal size of send buffer used by UDP sockets in moderation.
472+
Each UDP socket is able to use this size for sending data, even if
473+
total pages of UDP sockets exceed udp_mem pressure. The unit is bytes.
474+
Default: 4096
475+
449476
CIPSOv4 Variables:
450477

451478
cipso_cache_enable - BOOLEAN

include/net/udp.h

Lines changed: 9 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -65,6 +65,13 @@ extern rwlock_t udp_hash_lock;
6565

6666
extern struct proto udp_prot;
6767

68+
extern atomic_t udp_memory_allocated;
69+
70+
/* sysctl variables for udp */
71+
extern int sysctl_udp_mem[3];
72+
extern int sysctl_udp_rmem_min;
73+
extern int sysctl_udp_wmem_min;
74+
6875
struct sk_buff;
6976

7077
/*
@@ -198,4 +205,6 @@ extern void udp_proc_unregister(struct udp_seq_afinfo *afinfo);
198205
extern int udp4_proc_init(void);
199206
extern void udp4_proc_exit(void);
200207
#endif
208+
209+
extern void udp_init(void);
201210
#endif /* _UDP_H */

net/ipv4/af_inet.c

Lines changed: 5 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -139,6 +139,8 @@ void inet_sock_destruct(struct sock *sk)
139139
__skb_queue_purge(&sk->sk_receive_queue);
140140
__skb_queue_purge(&sk->sk_error_queue);
141141

142+
sk_mem_reclaim(sk);
143+
142144
if (sk->sk_type == SOCK_STREAM && sk->sk_state != TCP_CLOSE) {
143145
printk("Attempt to release TCP socket in state %d %p\n",
144146
sk->sk_state, sk);
@@ -1417,6 +1419,9 @@ static int __init inet_init(void)
14171419
/* Setup TCP slab cache for open requests. */
14181420
tcp_init();
14191421

1422+
/* Setup UDP memory threshold */
1423+
udp_init();
1424+
14201425
/* Add UDP-Lite (RFC 3828) */
14211426
udplite4_register();
14221427

net/ipv4/proc.c

Lines changed: 2 additions & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -56,7 +56,8 @@ static int sockstat_seq_show(struct seq_file *seq, void *v)
5656
sock_prot_inuse(&tcp_prot), atomic_read(&tcp_orphan_count),
5757
tcp_death_row.tw_count, atomic_read(&tcp_sockets_allocated),
5858
atomic_read(&tcp_memory_allocated));
59-
seq_printf(seq, "UDP: inuse %d\n", sock_prot_inuse(&udp_prot));
59+
seq_printf(seq, "UDP: inuse %d mem %d\n", sock_prot_inuse(&udp_prot),
60+
atomic_read(&udp_memory_allocated));
6061
seq_printf(seq, "UDPLITE: inuse %d\n", sock_prot_inuse(&udplite_prot));
6162
seq_printf(seq, "RAW: inuse %d\n", sock_prot_inuse(&raw_prot));
6263
seq_printf(seq, "FRAG: inuse %d memory %d\n",

net/ipv4/sysctl_net_ipv4.c

Lines changed: 31 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -19,6 +19,7 @@
1919
#include <net/ip.h>
2020
#include <net/route.h>
2121
#include <net/tcp.h>
22+
#include <net/udp.h>
2223
#include <net/cipso_ipv4.h>
2324
#include <net/inet_frag.h>
2425

@@ -812,6 +813,36 @@ static struct ctl_table ipv4_table[] = {
812813
.mode = 0644,
813814
.proc_handler = &proc_dointvec,
814815
},
816+
{
817+
.ctl_name = CTL_UNNUMBERED,
818+
.procname = "udp_mem",
819+
.data = &sysctl_udp_mem,
820+
.maxlen = sizeof(sysctl_udp_mem),
821+
.mode = 0644,
822+
.proc_handler = &proc_dointvec_minmax,
823+
.strategy = &sysctl_intvec,
824+
.extra1 = &zero
825+
},
826+
{
827+
.ctl_name = CTL_UNNUMBERED,
828+
.procname = "udp_rmem_min",
829+
.data = &sysctl_udp_rmem_min,
830+
.maxlen = sizeof(sysctl_udp_rmem_min),
831+
.mode = 0644,
832+
.proc_handler = &proc_dointvec_minmax,
833+
.strategy = &sysctl_intvec,
834+
.extra1 = &zero
835+
},
836+
{
837+
.ctl_name = CTL_UNNUMBERED,
838+
.procname = "udp_wmem_min",
839+
.data = &sysctl_udp_wmem_min,
840+
.maxlen = sizeof(sysctl_udp_wmem_min),
841+
.mode = 0644,
842+
.proc_handler = &proc_dointvec_minmax,
843+
.strategy = &sysctl_intvec,
844+
.extra1 = &zero
845+
},
815846
{ .ctl_name = 0 }
816847
};
817848

net/ipv4/udp.c

Lines changed: 55 additions & 2 deletions
Original file line numberDiff line numberDiff line change
@@ -82,6 +82,7 @@
8282
#include <asm/system.h>
8383
#include <asm/uaccess.h>
8484
#include <asm/ioctls.h>
85+
#include <linux/bootmem.h>
8586
#include <linux/types.h>
8687
#include <linux/fcntl.h>
8788
#include <linux/module.h>
@@ -118,6 +119,17 @@ EXPORT_SYMBOL(udp_stats_in6);
118119
struct hlist_head udp_hash[UDP_HTABLE_SIZE];
119120
DEFINE_RWLOCK(udp_hash_lock);
120121

122+
int sysctl_udp_mem[3] __read_mostly;
123+
int sysctl_udp_rmem_min __read_mostly;
124+
int sysctl_udp_wmem_min __read_mostly;
125+
126+
EXPORT_SYMBOL(sysctl_udp_mem);
127+
EXPORT_SYMBOL(sysctl_udp_rmem_min);
128+
EXPORT_SYMBOL(sysctl_udp_wmem_min);
129+
130+
atomic_t udp_memory_allocated;
131+
EXPORT_SYMBOL(udp_memory_allocated);
132+
121133
static inline int __udp_lib_lport_inuse(__u16 num,
122134
const struct hlist_head udptable[])
123135
{
@@ -901,13 +913,17 @@ int udp_recvmsg(struct kiocb *iocb, struct sock *sk, struct msghdr *msg,
901913
err = ulen;
902914

903915
out_free:
916+
lock_sock(sk);
904917
skb_free_datagram(sk, skb);
918+
release_sock(sk);
905919
out:
906920
return err;
907921

908922
csum_copy_err:
923+
lock_sock(sk);
909924
if (!skb_kill_datagram(sk, skb, flags))
910925
UDP_INC_STATS_USER(UDP_MIB_INERRORS, is_udplite);
926+
release_sock(sk);
911927

912928
if (noblock)
913929
return -EAGAIN;
@@ -1072,7 +1088,15 @@ static int __udp4_lib_mcast_deliver(struct sk_buff *skb,
10721088
skb1 = skb_clone(skb, GFP_ATOMIC);
10731089

10741090
if (skb1) {
1075-
int ret = udp_queue_rcv_skb(sk, skb1);
1091+
int ret = 0;
1092+
1093+
bh_lock_sock_nested(sk);
1094+
if (!sock_owned_by_user(sk))
1095+
ret = udp_queue_rcv_skb(sk, skb1);
1096+
else
1097+
sk_add_backlog(sk, skb1);
1098+
bh_unlock_sock(sk);
1099+
10761100
if (ret > 0)
10771101
/* we should probably re-process instead
10781102
* of dropping packets here. */
@@ -1165,7 +1189,13 @@ int __udp4_lib_rcv(struct sk_buff *skb, struct hlist_head udptable[],
11651189
inet_iif(skb), udptable);
11661190

11671191
if (sk != NULL) {
1168-
int ret = udp_queue_rcv_skb(sk, skb);
1192+
int ret = 0;
1193+
bh_lock_sock_nested(sk);
1194+
if (!sock_owned_by_user(sk))
1195+
ret = udp_queue_rcv_skb(sk, skb);
1196+
else
1197+
sk_add_backlog(sk, skb);
1198+
bh_unlock_sock(sk);
11691199
sock_put(sk);
11701200

11711201
/* a return value > 0 means to resubmit the input, but
@@ -1460,6 +1490,10 @@ struct proto udp_prot = {
14601490
.hash = udp_lib_hash,
14611491
.unhash = udp_lib_unhash,
14621492
.get_port = udp_v4_get_port,
1493+
.memory_allocated = &udp_memory_allocated,
1494+
.sysctl_mem = sysctl_udp_mem,
1495+
.sysctl_wmem = &sysctl_udp_wmem_min,
1496+
.sysctl_rmem = &sysctl_udp_rmem_min,
14631497
.obj_size = sizeof(struct udp_sock),
14641498
#ifdef CONFIG_COMPAT
14651499
.compat_setsockopt = compat_udp_setsockopt,
@@ -1655,6 +1689,25 @@ void udp4_proc_exit(void)
16551689
}
16561690
#endif /* CONFIG_PROC_FS */
16571691

1692+
/*
 * udp_init - compute the boot-time defaults for the UDP memory sysctls.
 *
 * Fills sysctl_udp_mem[] (documented as min, pressure, max, in pages) from
 * nr_all_pages and sets sysctl_udp_rmem_min / sysctl_udp_wmem_min to
 * SK_MEM_QUANTUM. Takes no arguments and returns nothing; it only writes
 * those globals.
 */
void __init udp_init(void)
1693+
{
1694+
unsigned long limit;
1695+
1696+
/* Set the pressure threshold using the same strategy as TCP. It is a
1697+
* fraction of global memory that is 1/2 at 256 MB and above, decreasing
1698+
* toward zero below that (roughly total_MB/512), with a floor of 128 pages.
1699+
*/
1700+
limit = min(nr_all_pages, 1UL<<(28-PAGE_SHIFT)) >> (20-PAGE_SHIFT);
1701+
limit = (limit * (nr_all_pages >> (20-PAGE_SHIFT))) >> (PAGE_SHIFT-11);
1702+
limit = max(limit, 128UL);
/* min = 3/4 of limit (integer division happens first), pressure = limit,
 * max = 2 * min, i.e. about 1.5 * limit.
 */
1703+
sysctl_udp_mem[0] = limit / 4 * 3;
1704+
sysctl_udp_mem[1] = limit;
1705+
sysctl_udp_mem[2] = sysctl_udp_mem[0] * 2;
1706+
1707+
/* Per-socket minimum receive/send buffer sizes default to one quantum. */
sysctl_udp_rmem_min = SK_MEM_QUANTUM;
1708+
sysctl_udp_wmem_min = SK_MEM_QUANTUM;
1709+
}
1710+
16581711
EXPORT_SYMBOL(udp_disconnect);
16591712
EXPORT_SYMBOL(udp_hash);
16601713
EXPORT_SYMBOL(udp_hash_lock);

net/ipv6/udp.c

Lines changed: 28 additions & 4 deletions
Original file line numberDiff line numberDiff line change
@@ -204,13 +204,17 @@ int udpv6_recvmsg(struct kiocb *iocb, struct sock *sk,
204204
err = ulen;
205205

206206
out_free:
207+
lock_sock(sk);
207208
skb_free_datagram(sk, skb);
209+
release_sock(sk);
208210
out:
209211
return err;
210212

211213
csum_copy_err:
214+
lock_sock(sk);
212215
if (!skb_kill_datagram(sk, skb, flags))
213216
UDP6_INC_STATS_USER(UDP_MIB_INERRORS, is_udplite);
217+
release_sock(sk);
214218

215219
if (flags & MSG_DONTWAIT)
216220
return -EAGAIN;
@@ -366,10 +370,21 @@ static int __udp6_lib_mcast_deliver(struct sk_buff *skb, struct in6_addr *saddr,
366370
while ((sk2 = udp_v6_mcast_next(sk_next(sk2), uh->dest, daddr,
367371
uh->source, saddr, dif))) {
368372
struct sk_buff *buff = skb_clone(skb, GFP_ATOMIC);
369-
if (buff)
370-
udpv6_queue_rcv_skb(sk2, buff);
373+
if (buff) {
374+
bh_lock_sock_nested(sk2);
375+
if (!sock_owned_by_user(sk2))
376+
udpv6_queue_rcv_skb(sk2, buff);
377+
else
378+
sk_add_backlog(sk2, buff);
379+
bh_unlock_sock(sk2);
380+
}
371381
}
372-
udpv6_queue_rcv_skb(sk, skb);
382+
bh_lock_sock_nested(sk);
383+
if (!sock_owned_by_user(sk))
384+
udpv6_queue_rcv_skb(sk, skb);
385+
else
386+
sk_add_backlog(sk, skb);
387+
bh_unlock_sock(sk);
373388
out:
374389
read_unlock(&udp_hash_lock);
375390
return 0;
@@ -482,7 +497,12 @@ int __udp6_lib_rcv(struct sk_buff *skb, struct hlist_head udptable[],
482497

483498
/* deliver */
484499

485-
udpv6_queue_rcv_skb(sk, skb);
500+
bh_lock_sock_nested(sk);
501+
if (!sock_owned_by_user(sk))
502+
udpv6_queue_rcv_skb(sk, skb);
503+
else
504+
sk_add_backlog(sk, skb);
505+
bh_unlock_sock(sk);
486506
sock_put(sk);
487507
return 0;
488508

@@ -994,6 +1014,10 @@ struct proto udpv6_prot = {
9941014
.hash = udp_lib_hash,
9951015
.unhash = udp_lib_unhash,
9961016
.get_port = udp_v6_get_port,
1017+
.memory_allocated = &udp_memory_allocated,
1018+
.sysctl_mem = sysctl_udp_mem,
1019+
.sysctl_wmem = &sysctl_udp_wmem_min,
1020+
.sysctl_rmem = &sysctl_udp_rmem_min,
9971021
.obj_size = sizeof(struct udp6_sock),
9981022
#ifdef CONFIG_COMPAT
9991023
.compat_setsockopt = compat_udpv6_setsockopt,

0 commit comments

Comments
 (0)