flexfilelayoutdev.c 18 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417418419420421422423424425426427428429430431432433434435436437438439440441442443444445446447448449450451452453454455456457458459460461462463464465466467468469470471472473474475476477478479480481482483484485486487488489490491492493494495496497498499500501502503504505506507508509510511512513514515516517518519520521522523524525526527528529530531532533534535536537538539540541542543544545546547548549550551552553554555556557558559560561562563564565566567568569570571572573574575576577578579580581582583584585586587588589590591592593594595596597598599600601602603604605606607608609610611612613614615616617618619620621622623624625626627628629630631632633634635636637638639640641642643644645646647648649650651652653654655656657658659660661662663664665666
  1. // SPDX-License-Identifier: GPL-2.0
  2. /*
  3. * Device operations for the pnfs nfs4 file layout driver.
  4. *
  5. * Copyright (c) 2014, Primary Data, Inc. All rights reserved.
  6. *
  7. * Tao Peng <bergwolf@primarydata.com>
  8. */
  9. #include <linux/nfs_fs.h>
  10. #include <linux/vmalloc.h>
  11. #include <linux/module.h>
  12. #include <linux/sunrpc/addr.h>
  13. #include "../internal.h"
  14. #include "../nfs4session.h"
  15. #include "flexfilelayout.h"
  16. #define NFSDBG_FACILITY NFSDBG_PNFS_LD
  17. static unsigned int dataserver_timeo = NFS_DEF_TCP_TIMEO;
  18. static unsigned int dataserver_retrans;
  19. static bool ff_layout_has_available_ds(struct pnfs_layout_segment *lseg);
  20. void nfs4_ff_layout_put_deviceid(struct nfs4_ff_layout_ds *mirror_ds)
  21. {
  22. if (!IS_ERR_OR_NULL(mirror_ds))
  23. nfs4_put_deviceid_node(&mirror_ds->id_node);
  24. }
  25. void nfs4_ff_layout_free_deviceid(struct nfs4_ff_layout_ds *mirror_ds)
  26. {
  27. nfs4_print_deviceid(&mirror_ds->id_node.deviceid);
  28. nfs4_pnfs_ds_put(mirror_ds->ds);
  29. kfree(mirror_ds->ds_versions);
  30. kfree_rcu(mirror_ds, id_node.rcu);
  31. }
  32. /* Decode opaque device data and construct new_ds using it */
  33. struct nfs4_ff_layout_ds *
  34. nfs4_ff_alloc_deviceid_node(struct nfs_server *server, struct pnfs_device *pdev,
  35. gfp_t gfp_flags)
  36. {
  37. struct xdr_stream stream;
  38. struct xdr_buf buf;
  39. struct page *scratch;
  40. struct list_head dsaddrs;
  41. struct nfs4_pnfs_ds_addr *da;
  42. struct nfs4_ff_layout_ds *new_ds = NULL;
  43. struct nfs4_ff_ds_version *ds_versions = NULL;
  44. u32 mp_count;
  45. u32 version_count;
  46. __be32 *p;
  47. int i, ret = -ENOMEM;
  48. /* set up xdr stream */
  49. scratch = alloc_page(gfp_flags);
  50. if (!scratch)
  51. goto out_err;
  52. new_ds = kzalloc(sizeof(struct nfs4_ff_layout_ds), gfp_flags);
  53. if (!new_ds)
  54. goto out_scratch;
  55. nfs4_init_deviceid_node(&new_ds->id_node,
  56. server,
  57. &pdev->dev_id);
  58. INIT_LIST_HEAD(&dsaddrs);
  59. xdr_init_decode_pages(&stream, &buf, pdev->pages, pdev->pglen);
  60. xdr_set_scratch_buffer(&stream, page_address(scratch), PAGE_SIZE);
  61. /* multipath count */
  62. p = xdr_inline_decode(&stream, 4);
  63. if (unlikely(!p))
  64. goto out_err_drain_dsaddrs;
  65. mp_count = be32_to_cpup(p);
  66. dprintk("%s: multipath ds count %d\n", __func__, mp_count);
  67. for (i = 0; i < mp_count; i++) {
  68. /* multipath ds */
  69. da = nfs4_decode_mp_ds_addr(server->nfs_client->cl_net,
  70. &stream, gfp_flags);
  71. if (da)
  72. list_add_tail(&da->da_node, &dsaddrs);
  73. }
  74. if (list_empty(&dsaddrs)) {
  75. dprintk("%s: no suitable DS addresses found\n",
  76. __func__);
  77. ret = -ENOMEDIUM;
  78. goto out_err_drain_dsaddrs;
  79. }
  80. /* version count */
  81. p = xdr_inline_decode(&stream, 4);
  82. if (unlikely(!p))
  83. goto out_err_drain_dsaddrs;
  84. version_count = be32_to_cpup(p);
  85. dprintk("%s: version count %d\n", __func__, version_count);
  86. ds_versions = kcalloc(version_count,
  87. sizeof(struct nfs4_ff_ds_version),
  88. gfp_flags);
  89. if (!ds_versions)
  90. goto out_scratch;
  91. for (i = 0; i < version_count; i++) {
  92. /* 20 = version(4) + minor_version(4) + rsize(4) + wsize(4) +
  93. * tightly_coupled(4) */
  94. p = xdr_inline_decode(&stream, 20);
  95. if (unlikely(!p))
  96. goto out_err_drain_dsaddrs;
  97. ds_versions[i].version = be32_to_cpup(p++);
  98. ds_versions[i].minor_version = be32_to_cpup(p++);
  99. ds_versions[i].rsize = nfs_block_size(be32_to_cpup(p++), NULL);
  100. ds_versions[i].wsize = nfs_block_size(be32_to_cpup(p++), NULL);
  101. ds_versions[i].tightly_coupled = be32_to_cpup(p);
  102. if (ds_versions[i].rsize > NFS_MAX_FILE_IO_SIZE)
  103. ds_versions[i].rsize = NFS_MAX_FILE_IO_SIZE;
  104. if (ds_versions[i].wsize > NFS_MAX_FILE_IO_SIZE)
  105. ds_versions[i].wsize = NFS_MAX_FILE_IO_SIZE;
  106. /*
  107. * check for valid major/minor combination.
  108. * currently we support dataserver which talk:
  109. * v3, v4.0, v4.1, v4.2
  110. */
  111. if (!((ds_versions[i].version == 3 && ds_versions[i].minor_version == 0) ||
  112. (ds_versions[i].version == 4 && ds_versions[i].minor_version < 3))) {
  113. dprintk("%s: [%d] unsupported ds version %d-%d\n", __func__,
  114. i, ds_versions[i].version,
  115. ds_versions[i].minor_version);
  116. ret = -EPROTONOSUPPORT;
  117. goto out_err_drain_dsaddrs;
  118. }
  119. dprintk("%s: [%d] vers %u minor_ver %u rsize %u wsize %u coupled %d\n",
  120. __func__, i, ds_versions[i].version,
  121. ds_versions[i].minor_version,
  122. ds_versions[i].rsize,
  123. ds_versions[i].wsize,
  124. ds_versions[i].tightly_coupled);
  125. }
  126. new_ds->ds_versions = ds_versions;
  127. new_ds->ds_versions_cnt = version_count;
  128. new_ds->ds = nfs4_pnfs_ds_add(&dsaddrs, gfp_flags);
  129. if (!new_ds->ds)
  130. goto out_err_drain_dsaddrs;
  131. /* If DS was already in cache, free ds addrs */
  132. while (!list_empty(&dsaddrs)) {
  133. da = list_first_entry(&dsaddrs,
  134. struct nfs4_pnfs_ds_addr,
  135. da_node);
  136. list_del_init(&da->da_node);
  137. kfree(da->da_remotestr);
  138. kfree(da);
  139. }
  140. __free_page(scratch);
  141. return new_ds;
  142. out_err_drain_dsaddrs:
  143. while (!list_empty(&dsaddrs)) {
  144. da = list_first_entry(&dsaddrs, struct nfs4_pnfs_ds_addr,
  145. da_node);
  146. list_del_init(&da->da_node);
  147. kfree(da->da_remotestr);
  148. kfree(da);
  149. }
  150. kfree(ds_versions);
  151. out_scratch:
  152. __free_page(scratch);
  153. out_err:
  154. kfree(new_ds);
  155. dprintk("%s ERROR: returning %d\n", __func__, ret);
  156. return NULL;
  157. }
  158. static void ff_layout_mark_devid_invalid(struct pnfs_layout_segment *lseg,
  159. struct nfs4_deviceid_node *devid)
  160. {
  161. nfs4_delete_deviceid(devid->ld, devid->nfs_client, &devid->deviceid);
  162. if (!ff_layout_has_available_ds(lseg))
  163. pnfs_error_mark_layout_for_return(lseg->pls_layout->plh_inode,
  164. lseg);
  165. }
  166. static bool ff_layout_mirror_valid(struct pnfs_layout_segment *lseg,
  167. struct nfs4_ff_layout_mirror *mirror,
  168. bool create)
  169. {
  170. if (mirror == NULL || IS_ERR(mirror->mirror_ds))
  171. goto outerr;
  172. if (mirror->mirror_ds == NULL) {
  173. if (create) {
  174. struct nfs4_deviceid_node *node;
  175. struct pnfs_layout_hdr *lh = lseg->pls_layout;
  176. struct nfs4_ff_layout_ds *mirror_ds = ERR_PTR(-ENODEV);
  177. node = nfs4_find_get_deviceid(NFS_SERVER(lh->plh_inode),
  178. &mirror->devid, lh->plh_lc_cred,
  179. GFP_KERNEL);
  180. if (node)
  181. mirror_ds = FF_LAYOUT_MIRROR_DS(node);
  182. /* check for race with another call to this function */
  183. if (cmpxchg(&mirror->mirror_ds, NULL, mirror_ds) &&
  184. mirror_ds != ERR_PTR(-ENODEV))
  185. nfs4_put_deviceid_node(node);
  186. } else
  187. goto outerr;
  188. }
  189. if (IS_ERR(mirror->mirror_ds))
  190. goto outerr;
  191. if (mirror->mirror_ds->ds == NULL) {
  192. struct nfs4_deviceid_node *devid;
  193. devid = &mirror->mirror_ds->id_node;
  194. ff_layout_mark_devid_invalid(lseg, devid);
  195. return false;
  196. }
  197. return true;
  198. outerr:
  199. pnfs_error_mark_layout_for_return(lseg->pls_layout->plh_inode, lseg);
  200. return false;
  201. }
  202. static void extend_ds_error(struct nfs4_ff_layout_ds_err *err,
  203. u64 offset, u64 length)
  204. {
  205. u64 end;
  206. end = max_t(u64, pnfs_end_offset(err->offset, err->length),
  207. pnfs_end_offset(offset, length));
  208. err->offset = min_t(u64, err->offset, offset);
  209. err->length = end - err->offset;
  210. }
  211. static int
  212. ff_ds_error_match(const struct nfs4_ff_layout_ds_err *e1,
  213. const struct nfs4_ff_layout_ds_err *e2)
  214. {
  215. int ret;
  216. if (e1->opnum != e2->opnum)
  217. return e1->opnum < e2->opnum ? -1 : 1;
  218. if (e1->status != e2->status)
  219. return e1->status < e2->status ? -1 : 1;
  220. ret = memcmp(e1->stateid.data, e2->stateid.data,
  221. sizeof(e1->stateid.data));
  222. if (ret != 0)
  223. return ret;
  224. ret = memcmp(&e1->deviceid, &e2->deviceid, sizeof(e1->deviceid));
  225. if (ret != 0)
  226. return ret;
  227. if (pnfs_end_offset(e1->offset, e1->length) < e2->offset)
  228. return -1;
  229. if (e1->offset > pnfs_end_offset(e2->offset, e2->length))
  230. return 1;
  231. /* If ranges overlap or are contiguous, they are the same */
  232. return 0;
  233. }
  234. static void
  235. ff_layout_add_ds_error_locked(struct nfs4_flexfile_layout *flo,
  236. struct nfs4_ff_layout_ds_err *dserr)
  237. {
  238. struct nfs4_ff_layout_ds_err *err, *tmp;
  239. struct list_head *head = &flo->error_list;
  240. int match;
  241. /* Do insertion sort w/ merges */
  242. list_for_each_entry_safe(err, tmp, &flo->error_list, list) {
  243. match = ff_ds_error_match(err, dserr);
  244. if (match < 0)
  245. continue;
  246. if (match > 0) {
  247. /* Add entry "dserr" _before_ entry "err" */
  248. head = &err->list;
  249. break;
  250. }
  251. /* Entries match, so merge "err" into "dserr" */
  252. extend_ds_error(dserr, err->offset, err->length);
  253. list_replace(&err->list, &dserr->list);
  254. kfree(err);
  255. return;
  256. }
  257. list_add_tail(&dserr->list, head);
  258. }
  259. int ff_layout_track_ds_error(struct nfs4_flexfile_layout *flo,
  260. struct nfs4_ff_layout_mirror *mirror, u64 offset,
  261. u64 length, int status, enum nfs_opnum4 opnum,
  262. gfp_t gfp_flags)
  263. {
  264. struct nfs4_ff_layout_ds_err *dserr;
  265. if (status == 0)
  266. return 0;
  267. if (IS_ERR_OR_NULL(mirror->mirror_ds))
  268. return -EINVAL;
  269. dserr = kmalloc(sizeof(*dserr), gfp_flags);
  270. if (!dserr)
  271. return -ENOMEM;
  272. INIT_LIST_HEAD(&dserr->list);
  273. dserr->offset = offset;
  274. dserr->length = length;
  275. dserr->status = status;
  276. dserr->opnum = opnum;
  277. nfs4_stateid_copy(&dserr->stateid, &mirror->stateid);
  278. memcpy(&dserr->deviceid, &mirror->mirror_ds->id_node.deviceid,
  279. NFS4_DEVICEID4_SIZE);
  280. spin_lock(&flo->generic_hdr.plh_inode->i_lock);
  281. ff_layout_add_ds_error_locked(flo, dserr);
  282. spin_unlock(&flo->generic_hdr.plh_inode->i_lock);
  283. return 0;
  284. }
  285. static struct rpc_cred *
  286. ff_layout_get_mirror_cred(struct nfs4_ff_layout_mirror *mirror, u32 iomode)
  287. {
  288. struct rpc_cred *cred, __rcu **pcred;
  289. if (iomode == IOMODE_READ)
  290. pcred = &mirror->ro_cred;
  291. else
  292. pcred = &mirror->rw_cred;
  293. rcu_read_lock();
  294. do {
  295. cred = rcu_dereference(*pcred);
  296. if (!cred)
  297. break;
  298. cred = get_rpccred_rcu(cred);
  299. } while(!cred);
  300. rcu_read_unlock();
  301. return cred;
  302. }
  303. struct nfs_fh *
  304. nfs4_ff_layout_select_ds_fh(struct pnfs_layout_segment *lseg, u32 mirror_idx)
  305. {
  306. struct nfs4_ff_layout_mirror *mirror = FF_LAYOUT_COMP(lseg, mirror_idx);
  307. struct nfs_fh *fh = NULL;
  308. if (!ff_layout_mirror_valid(lseg, mirror, false)) {
  309. pr_err_ratelimited("NFS: %s: No data server for mirror offset index %d\n",
  310. __func__, mirror_idx);
  311. goto out;
  312. }
  313. /* FIXME: For now assume there is only 1 version available for the DS */
  314. fh = &mirror->fh_versions[0];
  315. out:
  316. return fh;
  317. }
  318. int
  319. nfs4_ff_layout_select_ds_stateid(struct pnfs_layout_segment *lseg,
  320. u32 mirror_idx,
  321. nfs4_stateid *stateid)
  322. {
  323. struct nfs4_ff_layout_mirror *mirror = FF_LAYOUT_COMP(lseg, mirror_idx);
  324. if (!ff_layout_mirror_valid(lseg, mirror, false)) {
  325. pr_err_ratelimited("NFS: %s: No data server for mirror offset index %d\n",
  326. __func__, mirror_idx);
  327. goto out;
  328. }
  329. nfs4_stateid_copy(stateid, &mirror->stateid);
  330. return 1;
  331. out:
  332. return 0;
  333. }
  334. /**
  335. * nfs4_ff_layout_prepare_ds - prepare a DS connection for an RPC call
  336. * @lseg: the layout segment we're operating on
  337. * @ds_idx: index of the DS to use
  338. * @fail_return: return layout on connect failure?
  339. *
  340. * Try to prepare a DS connection to accept an RPC call. This involves
  341. * selecting a mirror to use and connecting the client to it if it's not
  342. * already connected.
  343. *
  344. * Since we only need a single functioning mirror to satisfy a read, we don't
  345. * want to return the layout if there is one. For writes though, any down
  346. * mirror should result in a LAYOUTRETURN. @fail_return is how we distinguish
  347. * between the two cases.
  348. *
  349. * Returns a pointer to a connected DS object on success or NULL on failure.
  350. */
  351. struct nfs4_pnfs_ds *
  352. nfs4_ff_layout_prepare_ds(struct pnfs_layout_segment *lseg, u32 ds_idx,
  353. bool fail_return)
  354. {
  355. struct nfs4_ff_layout_mirror *mirror = FF_LAYOUT_COMP(lseg, ds_idx);
  356. struct nfs4_pnfs_ds *ds = NULL;
  357. struct nfs4_deviceid_node *devid;
  358. struct inode *ino = lseg->pls_layout->plh_inode;
  359. struct nfs_server *s = NFS_SERVER(ino);
  360. unsigned int max_payload;
  361. int status;
  362. if (!ff_layout_mirror_valid(lseg, mirror, true)) {
  363. pr_err_ratelimited("NFS: %s: No data server for offset index %d\n",
  364. __func__, ds_idx);
  365. goto out;
  366. }
  367. devid = &mirror->mirror_ds->id_node;
  368. if (ff_layout_test_devid_unavailable(devid))
  369. goto out_fail;
  370. ds = mirror->mirror_ds->ds;
  371. /* matching smp_wmb() in _nfs4_pnfs_v3/4_ds_connect */
  372. smp_rmb();
  373. if (ds->ds_clp)
  374. goto out;
  375. /* FIXME: For now we assume the server sent only one version of NFS
  376. * to use for the DS.
  377. */
  378. status = nfs4_pnfs_ds_connect(s, ds, devid, dataserver_timeo,
  379. dataserver_retrans,
  380. mirror->mirror_ds->ds_versions[0].version,
  381. mirror->mirror_ds->ds_versions[0].minor_version);
  382. /* connect success, check rsize/wsize limit */
  383. if (!status) {
  384. max_payload =
  385. nfs_block_size(rpc_max_payload(ds->ds_clp->cl_rpcclient),
  386. NULL);
  387. if (mirror->mirror_ds->ds_versions[0].rsize > max_payload)
  388. mirror->mirror_ds->ds_versions[0].rsize = max_payload;
  389. if (mirror->mirror_ds->ds_versions[0].wsize > max_payload)
  390. mirror->mirror_ds->ds_versions[0].wsize = max_payload;
  391. goto out;
  392. }
  393. out_fail:
  394. ff_layout_track_ds_error(FF_LAYOUT_FROM_HDR(lseg->pls_layout),
  395. mirror, lseg->pls_range.offset,
  396. lseg->pls_range.length, NFS4ERR_NXIO,
  397. OP_ILLEGAL, GFP_NOIO);
  398. if (fail_return || !ff_layout_has_available_ds(lseg))
  399. pnfs_error_mark_layout_for_return(ino, lseg);
  400. ds = NULL;
  401. out:
  402. return ds;
  403. }
  404. struct rpc_cred *
  405. ff_layout_get_ds_cred(struct pnfs_layout_segment *lseg, u32 ds_idx,
  406. struct rpc_cred *mdscred)
  407. {
  408. struct nfs4_ff_layout_mirror *mirror = FF_LAYOUT_COMP(lseg, ds_idx);
  409. struct rpc_cred *cred;
  410. if (mirror) {
  411. cred = ff_layout_get_mirror_cred(mirror, lseg->pls_range.iomode);
  412. if (!cred)
  413. cred = get_rpccred(mdscred);
  414. } else {
  415. cred = get_rpccred(mdscred);
  416. }
  417. return cred;
  418. }
  419. /**
  420. * Find or create a DS rpc client with th MDS server rpc client auth flavor
  421. * in the nfs_client cl_ds_clients list.
  422. */
  423. struct rpc_clnt *
  424. nfs4_ff_find_or_create_ds_client(struct pnfs_layout_segment *lseg, u32 ds_idx,
  425. struct nfs_client *ds_clp, struct inode *inode)
  426. {
  427. struct nfs4_ff_layout_mirror *mirror = FF_LAYOUT_COMP(lseg, ds_idx);
  428. switch (mirror->mirror_ds->ds_versions[0].version) {
  429. case 3:
  430. /* For NFSv3 DS, flavor is set when creating DS connections */
  431. return ds_clp->cl_rpcclient;
  432. case 4:
  433. return nfs4_find_or_create_ds_client(ds_clp, inode);
  434. default:
  435. BUG();
  436. }
  437. }
  438. void ff_layout_free_ds_ioerr(struct list_head *head)
  439. {
  440. struct nfs4_ff_layout_ds_err *err;
  441. while (!list_empty(head)) {
  442. err = list_first_entry(head,
  443. struct nfs4_ff_layout_ds_err,
  444. list);
  445. list_del(&err->list);
  446. kfree(err);
  447. }
  448. }
  449. /* called with inode i_lock held */
  450. int ff_layout_encode_ds_ioerr(struct xdr_stream *xdr, const struct list_head *head)
  451. {
  452. struct nfs4_ff_layout_ds_err *err;
  453. __be32 *p;
  454. list_for_each_entry(err, head, list) {
  455. /* offset(8) + length(8) + stateid(NFS4_STATEID_SIZE)
  456. * + array length + deviceid(NFS4_DEVICEID4_SIZE)
  457. * + status(4) + opnum(4)
  458. */
  459. p = xdr_reserve_space(xdr,
  460. 28 + NFS4_STATEID_SIZE + NFS4_DEVICEID4_SIZE);
  461. if (unlikely(!p))
  462. return -ENOBUFS;
  463. p = xdr_encode_hyper(p, err->offset);
  464. p = xdr_encode_hyper(p, err->length);
  465. p = xdr_encode_opaque_fixed(p, &err->stateid,
  466. NFS4_STATEID_SIZE);
  467. /* Encode 1 error */
  468. *p++ = cpu_to_be32(1);
  469. p = xdr_encode_opaque_fixed(p, &err->deviceid,
  470. NFS4_DEVICEID4_SIZE);
  471. *p++ = cpu_to_be32(err->status);
  472. *p++ = cpu_to_be32(err->opnum);
  473. dprintk("%s: offset %llu length %llu status %d op %d\n",
  474. __func__, err->offset, err->length, err->status,
  475. err->opnum);
  476. }
  477. return 0;
  478. }
  479. static
  480. unsigned int do_layout_fetch_ds_ioerr(struct pnfs_layout_hdr *lo,
  481. const struct pnfs_layout_range *range,
  482. struct list_head *head,
  483. unsigned int maxnum)
  484. {
  485. struct nfs4_flexfile_layout *flo = FF_LAYOUT_FROM_HDR(lo);
  486. struct inode *inode = lo->plh_inode;
  487. struct nfs4_ff_layout_ds_err *err, *n;
  488. unsigned int ret = 0;
  489. spin_lock(&inode->i_lock);
  490. list_for_each_entry_safe(err, n, &flo->error_list, list) {
  491. if (!pnfs_is_range_intersecting(err->offset,
  492. pnfs_end_offset(err->offset, err->length),
  493. range->offset,
  494. pnfs_end_offset(range->offset, range->length)))
  495. continue;
  496. if (!maxnum)
  497. break;
  498. list_move(&err->list, head);
  499. maxnum--;
  500. ret++;
  501. }
  502. spin_unlock(&inode->i_lock);
  503. return ret;
  504. }
  505. unsigned int ff_layout_fetch_ds_ioerr(struct pnfs_layout_hdr *lo,
  506. const struct pnfs_layout_range *range,
  507. struct list_head *head,
  508. unsigned int maxnum)
  509. {
  510. unsigned int ret;
  511. ret = do_layout_fetch_ds_ioerr(lo, range, head, maxnum);
  512. /* If we're over the max, discard all remaining entries */
  513. if (ret == maxnum) {
  514. LIST_HEAD(discard);
  515. do_layout_fetch_ds_ioerr(lo, range, &discard, -1);
  516. ff_layout_free_ds_ioerr(&discard);
  517. }
  518. return ret;
  519. }
  520. static bool ff_read_layout_has_available_ds(struct pnfs_layout_segment *lseg)
  521. {
  522. struct nfs4_ff_layout_mirror *mirror;
  523. struct nfs4_deviceid_node *devid;
  524. u32 idx;
  525. for (idx = 0; idx < FF_LAYOUT_MIRROR_COUNT(lseg); idx++) {
  526. mirror = FF_LAYOUT_COMP(lseg, idx);
  527. if (mirror) {
  528. if (!mirror->mirror_ds)
  529. return true;
  530. if (IS_ERR(mirror->mirror_ds))
  531. continue;
  532. devid = &mirror->mirror_ds->id_node;
  533. if (!ff_layout_test_devid_unavailable(devid))
  534. return true;
  535. }
  536. }
  537. return false;
  538. }
  539. static bool ff_rw_layout_has_available_ds(struct pnfs_layout_segment *lseg)
  540. {
  541. struct nfs4_ff_layout_mirror *mirror;
  542. struct nfs4_deviceid_node *devid;
  543. u32 idx;
  544. for (idx = 0; idx < FF_LAYOUT_MIRROR_COUNT(lseg); idx++) {
  545. mirror = FF_LAYOUT_COMP(lseg, idx);
  546. if (!mirror || IS_ERR(mirror->mirror_ds))
  547. return false;
  548. if (!mirror->mirror_ds)
  549. continue;
  550. devid = &mirror->mirror_ds->id_node;
  551. if (ff_layout_test_devid_unavailable(devid))
  552. return false;
  553. }
  554. return FF_LAYOUT_MIRROR_COUNT(lseg) != 0;
  555. }
  556. static bool ff_layout_has_available_ds(struct pnfs_layout_segment *lseg)
  557. {
  558. if (lseg->pls_range.iomode == IOMODE_READ)
  559. return ff_read_layout_has_available_ds(lseg);
  560. /* Note: RW layout needs all mirrors available */
  561. return ff_rw_layout_has_available_ds(lseg);
  562. }
  563. bool ff_layout_avoid_mds_available_ds(struct pnfs_layout_segment *lseg)
  564. {
  565. return ff_layout_no_fallback_to_mds(lseg) ||
  566. ff_layout_has_available_ds(lseg);
  567. }
  568. bool ff_layout_avoid_read_on_rw(struct pnfs_layout_segment *lseg)
  569. {
  570. return lseg->pls_range.iomode == IOMODE_RW &&
  571. ff_layout_no_read_on_rw(lseg);
  572. }
  573. module_param(dataserver_retrans, uint, 0644);
  574. MODULE_PARM_DESC(dataserver_retrans, "The number of times the NFSv4.1 client "
  575. "retries a request before it attempts further "
  576. " recovery action.");
  577. module_param(dataserver_timeo, uint, 0644);
  578. MODULE_PARM_DESC(dataserver_timeo, "The time (in tenths of a second) the "
  579. "NFSv4.1 client waits for a response from a "
  580. " data server before it retries an NFS request.");