2 * Common NFS I/O operations for the pnfs file based
5 * Copyright (c) 2014, Primary Data, Inc. All rights reserved.
7 * Tom Haynes <loghyr@primarydata.com>
10 #include <linux/nfs_fs.h>
11 #include <linux/nfs_page.h>
12 #include <linux/sunrpc/addr.h>
13 #include <linux/module.h>
15 #include "nfs4session.h"
19 #define NFSDBG_FACILITY NFSDBG_PNFS
21 void pnfs_generic_rw_release(void *data
)
23 struct nfs_pgio_header
*hdr
= data
;
25 nfs_put_client(hdr
->ds_clp
);
26 hdr
->mds_ops
->rpc_release(data
);
28 EXPORT_SYMBOL_GPL(pnfs_generic_rw_release
);
30 /* Fake up some data that will cause nfs_commit_release to retry the writes. */
31 void pnfs_generic_prepare_to_resend_writes(struct nfs_commit_data
*data
)
33 struct nfs_page
*first
= nfs_list_entry(data
->pages
.next
);
35 data
->task
.tk_status
= 0;
36 memcpy(&data
->verf
.verifier
, &first
->wb_verf
,
37 sizeof(data
->verf
.verifier
));
38 data
->verf
.verifier
.data
[0]++; /* ensure verifier mismatch */
40 EXPORT_SYMBOL_GPL(pnfs_generic_prepare_to_resend_writes
);
42 void pnfs_generic_write_commit_done(struct rpc_task
*task
, void *data
)
44 struct nfs_commit_data
*wdata
= data
;
46 /* Note this may cause RPC to be resent */
47 wdata
->mds_ops
->rpc_call_done(task
, data
);
49 EXPORT_SYMBOL_GPL(pnfs_generic_write_commit_done
);
51 void pnfs_generic_commit_release(void *calldata
)
53 struct nfs_commit_data
*data
= calldata
;
55 data
->completion_ops
->completion(data
);
56 pnfs_put_lseg(data
->lseg
);
57 nfs_put_client(data
->ds_clp
);
58 nfs_commitdata_release(data
);
60 EXPORT_SYMBOL_GPL(pnfs_generic_commit_release
);
62 /* The generic layer is about to remove the req from the commit list.
63 * If this will make the bucket empty, it will need to put the lseg reference.
64 * Note this must be called holding i_lock
67 pnfs_generic_clear_request_commit(struct nfs_page
*req
,
68 struct nfs_commit_info
*cinfo
)
70 struct pnfs_layout_segment
*freeme
= NULL
;
72 if (!test_and_clear_bit(PG_COMMIT_TO_DS
, &req
->wb_flags
))
74 cinfo
->ds
->nwritten
--;
75 if (list_is_singular(&req
->wb_list
)) {
76 struct pnfs_commit_bucket
*bucket
;
78 bucket
= list_first_entry(&req
->wb_list
,
79 struct pnfs_commit_bucket
,
81 freeme
= bucket
->wlseg
;
85 nfs_request_remove_commit_list(req
, cinfo
);
86 pnfs_put_lseg_locked(freeme
);
88 EXPORT_SYMBOL_GPL(pnfs_generic_clear_request_commit
);
91 pnfs_generic_transfer_commit_list(struct list_head
*src
, struct list_head
*dst
,
92 struct nfs_commit_info
*cinfo
, int max
)
94 struct nfs_page
*req
, *tmp
;
97 list_for_each_entry_safe(req
, tmp
, src
, wb_list
) {
98 if (!nfs_lock_request(req
))
100 kref_get(&req
->wb_kref
);
101 if (cond_resched_lock(&cinfo
->inode
->i_lock
))
102 list_safe_reset_next(req
, tmp
, wb_list
);
103 nfs_request_remove_commit_list(req
, cinfo
);
104 clear_bit(PG_COMMIT_TO_DS
, &req
->wb_flags
);
105 nfs_list_add_request(req
, dst
);
107 if ((ret
== max
) && !cinfo
->dreq
)
114 pnfs_generic_scan_ds_commit_list(struct pnfs_commit_bucket
*bucket
,
115 struct nfs_commit_info
*cinfo
,
118 struct list_head
*src
= &bucket
->written
;
119 struct list_head
*dst
= &bucket
->committing
;
122 lockdep_assert_held(&cinfo
->inode
->i_lock
);
123 ret
= pnfs_generic_transfer_commit_list(src
, dst
, cinfo
, max
);
125 cinfo
->ds
->nwritten
-= ret
;
126 cinfo
->ds
->ncommitting
+= ret
;
127 if (bucket
->clseg
== NULL
)
128 bucket
->clseg
= pnfs_get_lseg(bucket
->wlseg
);
129 if (list_empty(src
)) {
130 pnfs_put_lseg_locked(bucket
->wlseg
);
131 bucket
->wlseg
= NULL
;
137 /* Move reqs from written to committing lists, returning count
140 int pnfs_generic_scan_commit_lists(struct nfs_commit_info
*cinfo
,
145 lockdep_assert_held(&cinfo
->inode
->i_lock
);
146 for (i
= 0; i
< cinfo
->ds
->nbuckets
&& max
!= 0; i
++) {
147 cnt
= pnfs_generic_scan_ds_commit_list(&cinfo
->ds
->buckets
[i
],
154 EXPORT_SYMBOL_GPL(pnfs_generic_scan_commit_lists
);
156 /* Pull everything off the committing lists and dump into @dst. */
157 void pnfs_generic_recover_commit_reqs(struct list_head
*dst
,
158 struct nfs_commit_info
*cinfo
)
160 struct pnfs_commit_bucket
*b
;
161 struct pnfs_layout_segment
*freeme
;
164 lockdep_assert_held(&cinfo
->inode
->i_lock
);
166 for (i
= 0, b
= cinfo
->ds
->buckets
; i
< cinfo
->ds
->nbuckets
; i
++, b
++) {
167 if (pnfs_generic_transfer_commit_list(&b
->written
, dst
,
171 spin_unlock(&cinfo
->inode
->i_lock
);
172 pnfs_put_lseg(freeme
);
173 spin_lock(&cinfo
->inode
->i_lock
);
177 cinfo
->ds
->nwritten
= 0;
179 EXPORT_SYMBOL_GPL(pnfs_generic_recover_commit_reqs
);
181 static void pnfs_generic_retry_commit(struct nfs_commit_info
*cinfo
, int idx
)
183 struct pnfs_ds_commit_info
*fl_cinfo
= cinfo
->ds
;
184 struct pnfs_commit_bucket
*bucket
;
185 struct pnfs_layout_segment
*freeme
;
189 spin_lock(&cinfo
->inode
->i_lock
);
190 for (i
= idx
; i
< fl_cinfo
->nbuckets
; i
++) {
191 bucket
= &fl_cinfo
->buckets
[i
];
192 if (list_empty(&bucket
->committing
))
194 freeme
= bucket
->clseg
;
195 bucket
->clseg
= NULL
;
196 list_splice_init(&bucket
->committing
, &pages
);
197 spin_unlock(&cinfo
->inode
->i_lock
);
198 nfs_retry_commit(&pages
, freeme
, cinfo
, i
);
199 pnfs_put_lseg(freeme
);
200 spin_lock(&cinfo
->inode
->i_lock
);
202 spin_unlock(&cinfo
->inode
->i_lock
);
206 pnfs_generic_alloc_ds_commits(struct nfs_commit_info
*cinfo
,
207 struct list_head
*list
)
209 struct pnfs_ds_commit_info
*fl_cinfo
;
210 struct pnfs_commit_bucket
*bucket
;
211 struct nfs_commit_data
*data
;
213 unsigned int nreq
= 0;
215 fl_cinfo
= cinfo
->ds
;
216 bucket
= fl_cinfo
->buckets
;
217 for (i
= 0; i
< fl_cinfo
->nbuckets
; i
++, bucket
++) {
218 if (list_empty(&bucket
->committing
))
221 * If the layout segment is invalid, then let
222 * pnfs_generic_retry_commit() clean up the bucket.
224 if (bucket
->clseg
&& !pnfs_is_valid_lseg(bucket
->clseg
) &&
225 !test_bit(NFS_LSEG_LAYOUTRETURN
, &bucket
->clseg
->pls_flags
))
227 data
= nfs_commitdata_alloc(false);
230 data
->ds_commit_index
= i
;
231 list_add(&data
->pages
, list
);
235 /* Clean up on error */
236 pnfs_generic_retry_commit(cinfo
, i
);
241 void pnfs_fetch_commit_bucket_list(struct list_head
*pages
,
242 struct nfs_commit_data
*data
,
243 struct nfs_commit_info
*cinfo
)
245 struct pnfs_commit_bucket
*bucket
;
247 bucket
= &cinfo
->ds
->buckets
[data
->ds_commit_index
];
248 spin_lock(&cinfo
->inode
->i_lock
);
249 list_splice_init(&bucket
->committing
, pages
);
250 data
->lseg
= bucket
->clseg
;
251 bucket
->clseg
= NULL
;
252 spin_unlock(&cinfo
->inode
->i_lock
);
256 /* Helper function for pnfs_generic_commit_pagelist to catch an empty
257 * page list. This can happen when two commits race.
259 * This must be called instead of nfs_init_commit - call one or the other, but
263 pnfs_generic_commit_cancel_empty_pagelist(struct list_head
*pages
,
264 struct nfs_commit_data
*data
,
265 struct nfs_commit_info
*cinfo
)
267 if (list_empty(pages
)) {
268 if (atomic_dec_and_test(&cinfo
->mds
->rpcs_out
))
269 wake_up_atomic_t(&cinfo
->mds
->rpcs_out
);
270 /* don't call nfs_commitdata_release - it tries to put
271 * the open_context which is not acquired until nfs_init_commit
272 * which has not been called on @data */
273 WARN_ON_ONCE(data
->context
);
274 nfs_commit_free(data
);
281 /* This follows nfs_commit_list pretty closely */
283 pnfs_generic_commit_pagelist(struct inode
*inode
, struct list_head
*mds_pages
,
284 int how
, struct nfs_commit_info
*cinfo
,
285 int (*initiate_commit
)(struct nfs_commit_data
*data
,
288 struct nfs_commit_data
*data
, *tmp
;
290 unsigned int nreq
= 0;
292 if (!list_empty(mds_pages
)) {
293 data
= nfs_commitdata_alloc(true);
294 data
->ds_commit_index
= -1;
295 list_add(&data
->pages
, &list
);
299 nreq
+= pnfs_generic_alloc_ds_commits(cinfo
, &list
);
304 atomic_add(nreq
, &cinfo
->mds
->rpcs_out
);
306 list_for_each_entry_safe(data
, tmp
, &list
, pages
) {
307 list_del_init(&data
->pages
);
308 if (data
->ds_commit_index
< 0) {
309 /* another commit raced with us */
310 if (pnfs_generic_commit_cancel_empty_pagelist(mds_pages
,
314 nfs_init_commit(data
, mds_pages
, NULL
, cinfo
);
315 nfs_initiate_commit(NFS_CLIENT(inode
), data
,
316 NFS_PROTO(data
->inode
),
317 data
->mds_ops
, how
, 0);
321 pnfs_fetch_commit_bucket_list(&pages
, data
, cinfo
);
323 /* another commit raced with us */
324 if (pnfs_generic_commit_cancel_empty_pagelist(&pages
,
328 nfs_init_commit(data
, &pages
, data
->lseg
, cinfo
);
329 initiate_commit(data
, how
);
333 cinfo
->ds
->ncommitting
= 0;
334 return PNFS_ATTEMPTED
;
336 EXPORT_SYMBOL_GPL(pnfs_generic_commit_pagelist
);
341 * Data servers can be mapped to different device ids.
342 * nfs4_pnfs_ds reference counting
343 * - set to 1 on allocation
344 * - incremented when a device id maps a data server already in the cache.
345 * - decremented when deviceid is removed from the cache.
347 static DEFINE_SPINLOCK(nfs4_ds_cache_lock
);
348 static LIST_HEAD(nfs4_data_server_cache
);
352 print_ds(struct nfs4_pnfs_ds
*ds
)
355 printk(KERN_WARNING
"%s NULL device\n", __func__
);
358 printk(KERN_WARNING
" ds %s\n"
361 " cl_exchange_flags %x\n",
363 atomic_read(&ds
->ds_count
), ds
->ds_clp
,
364 ds
->ds_clp
? ds
->ds_clp
->cl_exchange_flags
: 0);
368 same_sockaddr(struct sockaddr
*addr1
, struct sockaddr
*addr2
)
370 struct sockaddr_in
*a
, *b
;
371 struct sockaddr_in6
*a6
, *b6
;
373 if (addr1
->sa_family
!= addr2
->sa_family
)
376 switch (addr1
->sa_family
) {
378 a
= (struct sockaddr_in
*)addr1
;
379 b
= (struct sockaddr_in
*)addr2
;
381 if (a
->sin_addr
.s_addr
== b
->sin_addr
.s_addr
&&
382 a
->sin_port
== b
->sin_port
)
387 a6
= (struct sockaddr_in6
*)addr1
;
388 b6
= (struct sockaddr_in6
*)addr2
;
390 /* LINKLOCAL addresses must have matching scope_id */
391 if (ipv6_addr_src_scope(&a6
->sin6_addr
) ==
392 IPV6_ADDR_SCOPE_LINKLOCAL
&&
393 a6
->sin6_scope_id
!= b6
->sin6_scope_id
)
396 if (ipv6_addr_equal(&a6
->sin6_addr
, &b6
->sin6_addr
) &&
397 a6
->sin6_port
== b6
->sin6_port
)
402 dprintk("%s: unhandled address family: %u\n",
403 __func__
, addr1
->sa_family
);
411 * Checks if 'dsaddrs1' contains a subset of 'dsaddrs2'. If it does,
415 _same_data_server_addrs_locked(const struct list_head
*dsaddrs1
,
416 const struct list_head
*dsaddrs2
)
418 struct nfs4_pnfs_ds_addr
*da1
, *da2
;
419 struct sockaddr
*sa1
, *sa2
;
422 list_for_each_entry(da1
, dsaddrs1
, da_node
) {
423 sa1
= (struct sockaddr
*)&da1
->da_addr
;
425 list_for_each_entry(da2
, dsaddrs2
, da_node
) {
426 sa2
= (struct sockaddr
*)&da2
->da_addr
;
427 match
= same_sockaddr(sa1
, sa2
);
438 * Lookup DS by addresses. nfs4_ds_cache_lock is held
440 static struct nfs4_pnfs_ds
*
441 _data_server_lookup_locked(const struct list_head
*dsaddrs
)
443 struct nfs4_pnfs_ds
*ds
;
445 list_for_each_entry(ds
, &nfs4_data_server_cache
, ds_node
)
446 if (_same_data_server_addrs_locked(&ds
->ds_addrs
, dsaddrs
))
451 static void destroy_ds(struct nfs4_pnfs_ds
*ds
)
453 struct nfs4_pnfs_ds_addr
*da
;
455 dprintk("--> %s\n", __func__
);
459 nfs_put_client(ds
->ds_clp
);
461 while (!list_empty(&ds
->ds_addrs
)) {
462 da
= list_first_entry(&ds
->ds_addrs
,
463 struct nfs4_pnfs_ds_addr
,
465 list_del_init(&da
->da_node
);
466 kfree(da
->da_remotestr
);
470 kfree(ds
->ds_remotestr
);
474 void nfs4_pnfs_ds_put(struct nfs4_pnfs_ds
*ds
)
476 if (atomic_dec_and_lock(&ds
->ds_count
,
477 &nfs4_ds_cache_lock
)) {
478 list_del_init(&ds
->ds_node
);
479 spin_unlock(&nfs4_ds_cache_lock
);
483 EXPORT_SYMBOL_GPL(nfs4_pnfs_ds_put
);
486 * Create a string with a human readable address and port to avoid
487 * complicated setup around many dprintks.
490 nfs4_pnfs_remotestr(struct list_head
*dsaddrs
, gfp_t gfp_flags
)
492 struct nfs4_pnfs_ds_addr
*da
;
497 len
= 3; /* '{', '}' and eol */
498 list_for_each_entry(da
, dsaddrs
, da_node
) {
499 len
+= strlen(da
->da_remotestr
) + 1; /* string plus comma */
502 remotestr
= kzalloc(len
, gfp_flags
);
509 list_for_each_entry(da
, dsaddrs
, da_node
) {
510 size_t ll
= strlen(da
->da_remotestr
);
515 memcpy(p
, da
->da_remotestr
, ll
);
535 * Given a list of multipath struct nfs4_pnfs_ds_addr, add it to ds cache if
536 * uncached and return cached struct nfs4_pnfs_ds.
538 struct nfs4_pnfs_ds
*
539 nfs4_pnfs_ds_add(struct list_head
*dsaddrs
, gfp_t gfp_flags
)
541 struct nfs4_pnfs_ds
*tmp_ds
, *ds
= NULL
;
544 if (list_empty(dsaddrs
)) {
545 dprintk("%s: no addresses defined\n", __func__
);
549 ds
= kzalloc(sizeof(*ds
), gfp_flags
);
553 /* this is only used for debugging, so it's ok if its NULL */
554 remotestr
= nfs4_pnfs_remotestr(dsaddrs
, gfp_flags
);
556 spin_lock(&nfs4_ds_cache_lock
);
557 tmp_ds
= _data_server_lookup_locked(dsaddrs
);
558 if (tmp_ds
== NULL
) {
559 INIT_LIST_HEAD(&ds
->ds_addrs
);
560 list_splice_init(dsaddrs
, &ds
->ds_addrs
);
561 ds
->ds_remotestr
= remotestr
;
562 atomic_set(&ds
->ds_count
, 1);
563 INIT_LIST_HEAD(&ds
->ds_node
);
565 list_add(&ds
->ds_node
, &nfs4_data_server_cache
);
566 dprintk("%s add new data server %s\n", __func__
,
571 atomic_inc(&tmp_ds
->ds_count
);
572 dprintk("%s data server %s found, inc'ed ds_count to %d\n",
573 __func__
, tmp_ds
->ds_remotestr
,
574 atomic_read(&tmp_ds
->ds_count
));
577 spin_unlock(&nfs4_ds_cache_lock
);
581 EXPORT_SYMBOL_GPL(nfs4_pnfs_ds_add
);
583 static void nfs4_wait_ds_connect(struct nfs4_pnfs_ds
*ds
)
586 wait_on_bit(&ds
->ds_state
, NFS4DS_CONNECTING
,
590 static void nfs4_clear_ds_conn_bit(struct nfs4_pnfs_ds
*ds
)
592 smp_mb__before_atomic();
593 clear_bit(NFS4DS_CONNECTING
, &ds
->ds_state
);
594 smp_mb__after_atomic();
595 wake_up_bit(&ds
->ds_state
, NFS4DS_CONNECTING
);
598 static struct nfs_client
*(*get_v3_ds_connect
)(
599 struct nfs_server
*mds_srv
,
600 const struct sockaddr
*ds_addr
,
603 unsigned int ds_timeo
,
604 unsigned int ds_retrans
);
606 static bool load_v3_ds_connect(void)
608 if (!get_v3_ds_connect
) {
609 get_v3_ds_connect
= symbol_request(nfs3_set_ds_client
);
610 WARN_ON_ONCE(!get_v3_ds_connect
);
613 return(get_v3_ds_connect
!= NULL
);
616 void nfs4_pnfs_v3_ds_connect_unload(void)
618 if (get_v3_ds_connect
) {
619 symbol_put(nfs3_set_ds_client
);
620 get_v3_ds_connect
= NULL
;
624 static int _nfs4_pnfs_v3_ds_connect(struct nfs_server
*mds_srv
,
625 struct nfs4_pnfs_ds
*ds
,
627 unsigned int retrans
)
629 struct nfs_client
*clp
= ERR_PTR(-EIO
);
630 struct nfs4_pnfs_ds_addr
*da
;
633 dprintk("--> %s DS %s\n", __func__
, ds
->ds_remotestr
);
635 if (!load_v3_ds_connect())
638 list_for_each_entry(da
, &ds
->ds_addrs
, da_node
) {
639 dprintk("%s: DS %s: trying address %s\n",
640 __func__
, ds
->ds_remotestr
, da
->da_remotestr
);
643 struct xprt_create xprt_args
= {
644 .ident
= XPRT_TRANSPORT_TCP
,
646 .dstaddr
= (struct sockaddr
*)&da
->da_addr
,
647 .addrlen
= da
->da_addrlen
,
648 .servername
= clp
->cl_hostname
,
650 /* Add this address as an alias */
651 rpc_clnt_add_xprt(clp
->cl_rpcclient
, &xprt_args
,
652 rpc_clnt_test_and_add_xprt
, NULL
);
654 clp
= get_v3_ds_connect(mds_srv
,
655 (struct sockaddr
*)&da
->da_addr
,
656 da
->da_addrlen
, IPPROTO_TCP
,
661 status
= PTR_ERR(clp
);
667 dprintk("%s [new] addr: %s\n", __func__
, ds
->ds_remotestr
);
672 static int _nfs4_pnfs_v4_ds_connect(struct nfs_server
*mds_srv
,
673 struct nfs4_pnfs_ds
*ds
,
675 unsigned int retrans
,
678 struct nfs_client
*clp
= ERR_PTR(-EIO
);
679 struct nfs4_pnfs_ds_addr
*da
;
682 dprintk("--> %s DS %s\n", __func__
, ds
->ds_remotestr
);
684 list_for_each_entry(da
, &ds
->ds_addrs
, da_node
) {
685 dprintk("%s: DS %s: trying address %s\n",
686 __func__
, ds
->ds_remotestr
, da
->da_remotestr
);
688 if (!IS_ERR(clp
) && clp
->cl_mvops
->session_trunk
) {
689 struct xprt_create xprt_args
= {
690 .ident
= XPRT_TRANSPORT_TCP
,
692 .dstaddr
= (struct sockaddr
*)&da
->da_addr
,
693 .addrlen
= da
->da_addrlen
,
694 .servername
= clp
->cl_hostname
,
696 struct nfs4_add_xprt_data xprtdata
= {
698 .cred
= nfs4_get_clid_cred(clp
),
700 struct rpc_add_xprt_test rpcdata
= {
701 .add_xprt_test
= clp
->cl_mvops
->session_trunk
,
706 * Test this address for session trunking and
709 rpc_clnt_add_xprt(clp
->cl_rpcclient
, &xprt_args
,
710 rpc_clnt_setup_test_and_add_xprt
,
713 put_rpccred(xprtdata
.cred
);
715 clp
= nfs4_set_ds_client(mds_srv
,
716 (struct sockaddr
*)&da
->da_addr
,
717 da
->da_addrlen
, IPPROTO_TCP
,
718 timeo
, retrans
, minor_version
);
722 status
= nfs4_init_ds_session(clp
,
723 mds_srv
->nfs_client
->cl_lease_time
);
734 status
= PTR_ERR(clp
);
740 dprintk("%s [new] addr: %s\n", __func__
, ds
->ds_remotestr
);
746 * Create an rpc connection to the nfs4_pnfs_ds data server.
747 * Currently only supports IPv4 and IPv6 addresses.
748 * If connection fails, make devid unavailable and return a -errno.
750 int nfs4_pnfs_ds_connect(struct nfs_server
*mds_srv
, struct nfs4_pnfs_ds
*ds
,
751 struct nfs4_deviceid_node
*devid
, unsigned int timeo
,
752 unsigned int retrans
, u32 version
, u32 minor_version
)
758 if (test_and_set_bit(NFS4DS_CONNECTING
, &ds
->ds_state
) == 0) {
760 err
= _nfs4_pnfs_v3_ds_connect(mds_srv
, ds
, timeo
,
762 } else if (version
== 4) {
763 err
= _nfs4_pnfs_v4_ds_connect(mds_srv
, ds
, timeo
,
764 retrans
, minor_version
);
766 dprintk("%s: unsupported DS version %d\n", __func__
,
768 err
= -EPROTONOSUPPORT
;
771 nfs4_clear_ds_conn_bit(ds
);
773 nfs4_wait_ds_connect(ds
);
775 /* what was waited on didn't connect AND didn't mark unavail */
776 if (!ds
->ds_clp
&& !nfs4_test_deviceid_unavailable(devid
))
781 * At this point the ds->ds_clp should be ready, but it might have
785 if (!ds
->ds_clp
|| !nfs_client_init_is_complete(ds
->ds_clp
)) {
786 WARN_ON_ONCE(ds
->ds_clp
||
787 !nfs4_test_deviceid_unavailable(devid
));
790 err
= nfs_client_init_status(ds
->ds_clp
);
795 EXPORT_SYMBOL_GPL(nfs4_pnfs_ds_connect
);
798 * Currently only supports ipv4, ipv6 and one multi-path address.
800 struct nfs4_pnfs_ds_addr
*
801 nfs4_decode_mp_ds_addr(struct net
*net
, struct xdr_stream
*xdr
, gfp_t gfp_flags
)
803 struct nfs4_pnfs_ds_addr
*da
= NULL
;
809 char *netid
, *match_netid
;
810 size_t len
, match_netid_len
;
816 p
= xdr_inline_decode(xdr
, 4);
819 nlen
= be32_to_cpup(p
++);
821 p
= xdr_inline_decode(xdr
, nlen
);
825 netid
= kmalloc(nlen
+1, gfp_flags
);
826 if (unlikely(!netid
))
830 memcpy(netid
, p
, nlen
);
832 /* r_addr: ip/ip6addr with port in dec octets - see RFC 5665 */
833 p
= xdr_inline_decode(xdr
, 4);
836 rlen
= be32_to_cpup(p
);
838 p
= xdr_inline_decode(xdr
, rlen
);
842 /* port is ".ABC.DEF", 8 chars max */
843 if (rlen
> INET6_ADDRSTRLEN
+ IPV6_SCOPE_ID_LEN
+ 8) {
844 dprintk("%s: Invalid address, length %d\n", __func__
,
848 buf
= kmalloc(rlen
+ 1, gfp_flags
);
850 dprintk("%s: Not enough memory\n", __func__
);
854 memcpy(buf
, p
, rlen
);
856 /* replace port '.' with '-' */
857 portstr
= strrchr(buf
, '.');
859 dprintk("%s: Failed finding expected dot in port\n",
865 /* find '.' between address and port */
866 portstr
= strrchr(buf
, '.');
868 dprintk("%s: Failed finding expected dot between address and "
874 da
= kzalloc(sizeof(*da
), gfp_flags
);
878 INIT_LIST_HEAD(&da
->da_node
);
880 if (!rpc_pton(net
, buf
, portstr
-buf
, (struct sockaddr
*)&da
->da_addr
,
881 sizeof(da
->da_addr
))) {
882 dprintk("%s: error parsing address %s\n", __func__
, buf
);
887 sscanf(portstr
, "%d-%d", &tmp
[0], &tmp
[1]);
888 port
= htons((tmp
[0] << 8) | (tmp
[1]));
890 switch (da
->da_addr
.ss_family
) {
892 ((struct sockaddr_in
*)&da
->da_addr
)->sin_port
= port
;
893 da
->da_addrlen
= sizeof(struct sockaddr_in
);
899 ((struct sockaddr_in6
*)&da
->da_addr
)->sin6_port
= port
;
900 da
->da_addrlen
= sizeof(struct sockaddr_in6
);
901 match_netid
= "tcp6";
908 dprintk("%s: unsupported address family: %u\n",
909 __func__
, da
->da_addr
.ss_family
);
913 if (nlen
!= match_netid_len
|| strncmp(netid
, match_netid
, nlen
)) {
914 dprintk("%s: ERROR: r_netid \"%s\" != \"%s\"\n",
915 __func__
, netid
, match_netid
);
919 /* save human readable address */
920 len
= strlen(startsep
) + strlen(buf
) + strlen(endsep
) + 7;
921 da
->da_remotestr
= kzalloc(len
, gfp_flags
);
923 /* NULL is ok, only used for dprintk */
924 if (da
->da_remotestr
)
925 snprintf(da
->da_remotestr
, len
, "%s%s%s:%u", startsep
,
926 buf
, endsep
, ntohs(port
));
928 dprintk("%s: Parsed DS addr %s\n", __func__
, da
->da_remotestr
);
936 dprintk("%s: Error parsing DS addr: %s\n", __func__
, buf
);
943 EXPORT_SYMBOL_GPL(nfs4_decode_mp_ds_addr
);
946 pnfs_layout_mark_request_commit(struct nfs_page
*req
,
947 struct pnfs_layout_segment
*lseg
,
948 struct nfs_commit_info
*cinfo
,
951 struct list_head
*list
;
952 struct pnfs_commit_bucket
*buckets
;
954 spin_lock(&cinfo
->inode
->i_lock
);
955 buckets
= cinfo
->ds
->buckets
;
956 list
= &buckets
[ds_commit_idx
].written
;
957 if (list_empty(list
)) {
958 if (!pnfs_is_valid_lseg(lseg
)) {
959 spin_unlock(&cinfo
->inode
->i_lock
);
960 cinfo
->completion_ops
->resched_write(cinfo
, req
);
963 /* Non-empty buckets hold a reference on the lseg. That ref
964 * is normally transferred to the COMMIT call and released
965 * there. It could also be released if the last req is pulled
966 * off due to a rewrite, in which case it will be done in
967 * pnfs_common_clear_request_commit
969 WARN_ON_ONCE(buckets
[ds_commit_idx
].wlseg
!= NULL
);
970 buckets
[ds_commit_idx
].wlseg
= pnfs_get_lseg(lseg
);
972 set_bit(PG_COMMIT_TO_DS
, &req
->wb_flags
);
973 cinfo
->ds
->nwritten
++;
975 nfs_request_add_commit_list_locked(req
, list
, cinfo
);
976 spin_unlock(&cinfo
->inode
->i_lock
);
977 nfs_mark_page_unstable(req
->wb_page
, cinfo
);
979 EXPORT_SYMBOL_GPL(pnfs_layout_mark_request_commit
);
982 pnfs_nfs_generic_sync(struct inode
*inode
, bool datasync
)
986 if (!pnfs_layoutcommit_outstanding(inode
))
988 ret
= nfs_commit_inode(inode
, FLUSH_SYNC
);
993 return pnfs_layoutcommit_inode(inode
, true);
995 EXPORT_SYMBOL_GPL(pnfs_nfs_generic_sync
);