[PATCH 31/33] nfs: enable swap on NFS
Provide an a_ops->swapfile() implementation for NFS. This will set the NFS socket to SOCK_MEMALLOC and run socket reconnect under PF_MEMALLOC as well as reset SOCK_MEMALLOC before engaging the protocol ->connect() method. PF_MEMALLOC should allow the allocation of struct socket and related objects and the early (re)setting of SOCK_MEMALLOC should allow us to receive the packets required for the TCP connection buildup. (swapping continues over a server reset during heavy network traffic) Signed-off-by: Peter Zijlstra <[EMAIL PROTECTED]> --- fs/Kconfig | 18 fs/nfs/file.c | 10 ++ include/linux/sunrpc/xprt.h |5 ++- net/sunrpc/sched.c |9 -- net/sunrpc/xprtsock.c | 63 5 files changed, 102 insertions(+), 3 deletions(-) Index: linux-2.6/fs/nfs/file.c === --- linux-2.6.orig/fs/nfs/file.c +++ linux-2.6/fs/nfs/file.c @@ -371,6 +371,13 @@ static int nfs_launder_page(struct page return nfs_wb_page(page_file_mapping(page)->host, page); } +#ifdef CONFIG_NFS_SWAP +static int nfs_swapfile(struct address_space *mapping, int enable) +{ + return xs_swapper(NFS_CLIENT(mapping->host)->cl_xprt, enable); +} +#endif + const struct address_space_operations nfs_file_aops = { .readpage = nfs_readpage, .readpages = nfs_readpages, @@ -385,6 +392,9 @@ const struct address_space_operations nf .direct_IO = nfs_direct_IO, #endif .launder_page = nfs_launder_page, +#ifdef CONFIG_NFS_SWAP + .swapfile = nfs_swapfile, +#endif }; static int nfs_vm_page_mkwrite(struct vm_area_struct *vma, struct page *page) Index: linux-2.6/include/linux/sunrpc/xprt.h === --- linux-2.6.orig/include/linux/sunrpc/xprt.h +++ linux-2.6/include/linux/sunrpc/xprt.h @@ -143,7 +143,9 @@ struct rpc_xprt { unsigned intmax_reqs; /* total slots */ unsigned long state; /* transport state */ unsigned char shutdown : 1, /* being shut down */ - resvport : 1; /* use a reserved port */ + resvport : 1, /* use a reserved port */ + swapper: 1; /* we're swapping over this + transport */ unsigned intbind_index; /* bind function index */ /* @@ -246,6 +248,7 @@ struct rpc_rqst * xprt_lookup_rqst(struc void xprt_complete_rqst(struct rpc_task *task, int copied); void xprt_release_rqst_cong(struct rpc_task *task); void xprt_disconnect(struct rpc_xprt *xprt); +intxs_swapper(struct rpc_xprt *xprt, int enable); /* * Reserved bit positions in xprt->state Index: linux-2.6/net/sunrpc/sched.c === --- linux-2.6.orig/net/sunrpc/sched.c +++ linux-2.6/net/sunrpc/sched.c @@ -761,7 +761,10 @@ struct rpc_buffer { void *rpc_malloc(struct rpc_task *task, size_t size) { struct rpc_buffer *buf; - gfp_t gfp = RPC_IS_SWAPPER(task) ? GFP_ATOMIC : GFP_NOWAIT; + gfp_t gfp = GFP_NOWAIT; + + if (RPC_IS_SWAPPER(task)) + gfp |= __GFP_MEMALLOC; size += sizeof(struct rpc_buffer); if (size <= RPC_BUFFER_MAXSIZE) @@ -817,6 +820,8 @@ void rpc_init_task(struct rpc_task *task atomic_set(>tk_count, 1); task->tk_client = clnt; task->tk_flags = flags; + if (clnt->cl_xprt->swapper) + task->tk_flags |= RPC_TASK_SWAPPER; task->tk_ops = tk_ops; if (tk_ops->rpc_call_prepare != NULL) task->tk_action = rpc_prepare_task; @@ -853,7 +858,7 @@ void rpc_init_task(struct rpc_task *task static struct rpc_task * rpc_alloc_task(void) { - return (struct rpc_task *)mempool_alloc(rpc_task_mempool, GFP_NOFS); + return (struct rpc_task *)mempool_alloc(rpc_task_mempool, GFP_NOIO); } static void rpc_free_task(struct rcu_head *rcu) Index: linux-2.6/net/sunrpc/xprtsock.c === --- linux-2.6.orig/net/sunrpc/xprtsock.c +++ linux-2.6/net/sunrpc/xprtsock.c @@ -1397,6 +1397,9 @@ static void xs_udp_finish_connecting(str transport->sock = sock; transport->inet = sk; + if (xprt->swapper) + sk_set_memalloc(sk); + write_unlock_bh(>sk_callback_lock); } xs_udp_do_set_buffer_size(xprt); @@ -1414,11 +1417,15 @@ static void xs_udp_connect_worker4(struc container_of(work, struct sock_xprt, connect_worker.work); struct rpc_xprt *xprt = >xprt; struct socket *sock = transport->sock; + unsigned long
[PATCH 31/33] nfs: enable swap on NFS
Provide an a_ops-swapfile() implementation for NFS. This will set the NFS socket to SOCK_MEMALLOC and run socket reconnect under PF_MEMALLOC as well as reset SOCK_MEMALLOC before engaging the protocol -connect() method. PF_MEMALLOC should allow the allocation of struct socket and related objects and the early (re)setting of SOCK_MEMALLOC should allow us to receive the packets required for the TCP connection buildup. (swapping continues over a server reset during heavy network traffic) Signed-off-by: Peter Zijlstra [EMAIL PROTECTED] --- fs/Kconfig | 18 fs/nfs/file.c | 10 ++ include/linux/sunrpc/xprt.h |5 ++- net/sunrpc/sched.c |9 -- net/sunrpc/xprtsock.c | 63 5 files changed, 102 insertions(+), 3 deletions(-) Index: linux-2.6/fs/nfs/file.c === --- linux-2.6.orig/fs/nfs/file.c +++ linux-2.6/fs/nfs/file.c @@ -371,6 +371,13 @@ static int nfs_launder_page(struct page return nfs_wb_page(page_file_mapping(page)-host, page); } +#ifdef CONFIG_NFS_SWAP +static int nfs_swapfile(struct address_space *mapping, int enable) +{ + return xs_swapper(NFS_CLIENT(mapping-host)-cl_xprt, enable); +} +#endif + const struct address_space_operations nfs_file_aops = { .readpage = nfs_readpage, .readpages = nfs_readpages, @@ -385,6 +392,9 @@ const struct address_space_operations nf .direct_IO = nfs_direct_IO, #endif .launder_page = nfs_launder_page, +#ifdef CONFIG_NFS_SWAP + .swapfile = nfs_swapfile, +#endif }; static int nfs_vm_page_mkwrite(struct vm_area_struct *vma, struct page *page) Index: linux-2.6/include/linux/sunrpc/xprt.h === --- linux-2.6.orig/include/linux/sunrpc/xprt.h +++ linux-2.6/include/linux/sunrpc/xprt.h @@ -143,7 +143,9 @@ struct rpc_xprt { unsigned intmax_reqs; /* total slots */ unsigned long state; /* transport state */ unsigned char shutdown : 1, /* being shut down */ - resvport : 1; /* use a reserved port */ + resvport : 1, /* use a reserved port */ + swapper: 1; /* we're swapping over this + transport */ unsigned intbind_index; /* bind function index */ /* @@ -246,6 +248,7 @@ struct rpc_rqst * xprt_lookup_rqst(struc void xprt_complete_rqst(struct rpc_task *task, int copied); void xprt_release_rqst_cong(struct rpc_task *task); void xprt_disconnect(struct rpc_xprt *xprt); +intxs_swapper(struct rpc_xprt *xprt, int enable); /* * Reserved bit positions in xprt-state Index: linux-2.6/net/sunrpc/sched.c === --- linux-2.6.orig/net/sunrpc/sched.c +++ linux-2.6/net/sunrpc/sched.c @@ -761,7 +761,10 @@ struct rpc_buffer { void *rpc_malloc(struct rpc_task *task, size_t size) { struct rpc_buffer *buf; - gfp_t gfp = RPC_IS_SWAPPER(task) ? GFP_ATOMIC : GFP_NOWAIT; + gfp_t gfp = GFP_NOWAIT; + + if (RPC_IS_SWAPPER(task)) + gfp |= __GFP_MEMALLOC; size += sizeof(struct rpc_buffer); if (size = RPC_BUFFER_MAXSIZE) @@ -817,6 +820,8 @@ void rpc_init_task(struct rpc_task *task atomic_set(task-tk_count, 1); task-tk_client = clnt; task-tk_flags = flags; + if (clnt-cl_xprt-swapper) + task-tk_flags |= RPC_TASK_SWAPPER; task-tk_ops = tk_ops; if (tk_ops-rpc_call_prepare != NULL) task-tk_action = rpc_prepare_task; @@ -853,7 +858,7 @@ void rpc_init_task(struct rpc_task *task static struct rpc_task * rpc_alloc_task(void) { - return (struct rpc_task *)mempool_alloc(rpc_task_mempool, GFP_NOFS); + return (struct rpc_task *)mempool_alloc(rpc_task_mempool, GFP_NOIO); } static void rpc_free_task(struct rcu_head *rcu) Index: linux-2.6/net/sunrpc/xprtsock.c === --- linux-2.6.orig/net/sunrpc/xprtsock.c +++ linux-2.6/net/sunrpc/xprtsock.c @@ -1397,6 +1397,9 @@ static void xs_udp_finish_connecting(str transport-sock = sock; transport-inet = sk; + if (xprt-swapper) + sk_set_memalloc(sk); + write_unlock_bh(sk-sk_callback_lock); } xs_udp_do_set_buffer_size(xprt); @@ -1414,11 +1417,15 @@ static void xs_udp_connect_worker4(struc container_of(work, struct sock_xprt, connect_worker.work); struct rpc_xprt *xprt = transport-xprt; struct socket *sock = transport-sock; + unsigned long pflags =