nfssvc.c 21 KB

12345678910111213141516171819202122232425262728293031323334353637383940414243444546474849505152535455565758596061626364656667686970717273747576777879808182838485868788899091929394959697989910010110210310410510610710810911011111211311411511611711811912012112212312412512612712812913013113213313413513613713813914014114214314414514614714814915015115215315415515615715815916016116216316416516616716816917017117217317417517617717817918018118218318418518618718818919019119219319419519619719819920020120220320420520620720820921021121221321421521621721821922022122222322422522622722822923023123223323423523623723823924024124224324424524624724824925025125225325425525625725825926026126226326426526626726826927027127227327427527627727827928028128228328428528628728828929029129229329429529629729829930030130230330430530630730830931031131231331431531631731831932032132232332432532632732832933033133233333433533633733833934034134234334434534634734834935035135235335435535635735835936036136236336436536636736836937037137237337437537637737837938038138238338438538638738838939039139239339439539639739839940040140240340440540640740840941041141241341441541641741841942042142242342442542642742842943043143243343443543643743843944044144244344444544644744844945045145245345445545645745845946046146246346446546646746846947047147247347447547647747847948048148248348448548648748848949049149249349449549649749849950050150250350450550650750850951051151251351451551651751851952052152252352452552652752852953053153253353453553653753853954054154254354454554654754854955055155255355455555655755855956056156256356456556656756856957057157257357457557657757857958058158258358458558658758858959059159259359459559659759859960060160260360460560660760860961061161261361461561661761861962062162262362462562662762862963063163263363463563663763863964064164264364464564664764864965065165265365465565665765865966066166266366466566666766866967067167267367467567667767867968068168268368468568668768868969069169269369469569669769869970070170270
3704705706707708709710711712713714715716717718719720721722723724725726727728729730731732733734735736737738739740741742743744745746747748749750751752753754755756757758759760761762763764765766767768769770771772773774775776777778779780781782783784785786787788789790791792793794795796797798799800801802803804805806807808809810811812813814815816817818819820821822823824825826827828829830831832833834835836837838839840841842843844845846847848849850851852853854855856857858859860861862863864865866867868869870871872
  1. /*
  2. * Central processing for nfsd.
  3. *
  4. * Authors: Olaf Kirch ([email protected])
  5. *
  6. * Copyright (C) 1995, 1996, 1997 Olaf Kirch <[email protected]>
  7. */
  8. #include <linux/sched.h>
  9. #include <linux/freezer.h>
  10. #include <linux/module.h>
  11. #include <linux/fs_struct.h>
  12. #include <linux/swap.h>
  13. #include <linux/sunrpc/stats.h>
  14. #include <linux/sunrpc/svcsock.h>
  15. #include <linux/sunrpc/svc_xprt.h>
  16. #include <linux/lockd/bind.h>
  17. #include <linux/nfsacl.h>
  18. #include <linux/seq_file.h>
  19. #include <linux/inetdevice.h>
  20. #include <net/addrconf.h>
  21. #include <net/ipv6.h>
  22. #include <net/net_namespace.h>
  23. #include "nfsd.h"
  24. #include "cache.h"
  25. #include "vfs.h"
  26. #include "netns.h"
  27. #define NFSDDBG_FACILITY NFSDDBG_SVC
  28. extern struct svc_program nfsd_program;
  29. static int nfsd(void *vrqstp);
  30. /*
  31. * nfsd_mutex protects nn->nfsd_serv -- both the pointer itself and the members
  32. * of the svc_serv struct. In particular, ->sv_nrthreads but also to some
  33. * extent ->sv_temp_socks and ->sv_permsocks. It also protects nfsdstats.th_cnt.
  34. *
  35. * If (outside the lock) nn->nfsd_serv is non-NULL, then it must point to a
  36. * properly initialised 'struct svc_serv' with ->sv_nrthreads > 0. That number
  37. * of nfsd threads must exist and each must be listed in ->sp_all_threads in
  38. * each entry of ->sv_pools[].
  39. *
  40. * Transitions of the thread count between zero and non-zero are of particular
  41. * interest since the svc_serv needs to be created and initialized at that
  42. * point, or freed.
  43. *
  44. * Finally, the nfsd_mutex also protects some of the global variables that are
  45. * accessed when nfsd starts and that are settable via the write_* routines in
  46. * nfsctl.c. In particular:
  47. *
  48. * user_recovery_dirname
  49. * user_lease_time
  50. * nfsd_versions
  51. */
  52. DEFINE_MUTEX(nfsd_mutex);
  53. /*
  54. * nfsd_drc_lock protects nfsd_drc_max_mem and nfsd_drc_mem_used.
  55. * nfsd_drc_max_mem limits the total amount of memory available for
  56. * version 4.1 DRC caches.
  57. * nfsd_drc_mem_used tracks the current version 4.1 DRC memory usage.
  58. */
  59. spinlock_t nfsd_drc_lock;
  60. unsigned long nfsd_drc_max_mem;
  61. unsigned long nfsd_drc_mem_used;
  /*
   * NFSACL program description, built only when v2 or v3 ACL support is
   * configured.
   *
   * nfsd_acl_version[] is the compiled-in table, indexed by version
   * number; nfsd_acl_versions[] is the table actually published through
   * nfsd_acl_program and is filled in / cleared by nfsd_vers().
   *
   * nfsd_acl_svcstats is tentatively defined first because the program
   * and its statistics structure point at each other.
   */
  62. #if defined(CONFIG_NFSD_V2_ACL) || defined(CONFIG_NFSD_V3_ACL)
  63. static struct svc_stat nfsd_acl_svcstats;
  64. static struct svc_version * nfsd_acl_version[] = {
  65. [2] = &nfsd_acl_version2,
  66. [3] = &nfsd_acl_version3,
  67. };
  68. #define NFSD_ACL_MINVERS 2
  69. #define NFSD_ACL_NRVERS ARRAY_SIZE(nfsd_acl_version)
  70. static struct svc_version *nfsd_acl_versions[NFSD_ACL_NRVERS];
  71. static struct svc_program nfsd_acl_program = {
  72. .pg_prog = NFS_ACL_PROGRAM,
  73. .pg_nvers = NFSD_ACL_NRVERS,
  74. .pg_vers = nfsd_acl_versions,
  75. .pg_name = "nfsacl",
  76. .pg_class = "nfsd",
  77. .pg_stats = &nfsd_acl_svcstats,
  78. .pg_authenticate = &svc_set_client,
  79. };
  80. static struct svc_stat nfsd_acl_svcstats = {
  81. .program = &nfsd_acl_program,
  82. };
  83. #endif /* defined(CONFIG_NFSD_V2_ACL) || defined(CONFIG_NFSD_V3_ACL) */
  /*
   * nfsd_version[] lists every NFS version compiled into this build,
   * indexed by major version number (v3 and v4 depend on their config
   * options).  nfsd_versions[] has the same size and holds the versions
   * that are currently enabled; nfsd_vers() copies entries into it or
   * resets them to NULL.
   */
  84. static struct svc_version * nfsd_version[] = {
  85. [2] = &nfsd_version2,
  86. #if defined(CONFIG_NFSD_V3)
  87. [3] = &nfsd_version3,
  88. #endif
  89. #if defined(CONFIG_NFSD_V4)
  90. [4] = &nfsd_version4,
  91. #endif
  92. };
  93. #define NFSD_MINVERS 2
  94. #define NFSD_NRVERS ARRAY_SIZE(nfsd_version)
  95. static struct svc_version *nfsd_versions[NFSD_NRVERS];
  /*
   * The NFS program itself.  When ACL support is configured the NFSACL
   * program is chained behind it through pg_next.
   */
  96. struct svc_program nfsd_program = {
  97. #if defined(CONFIG_NFSD_V2_ACL) || defined(CONFIG_NFSD_V3_ACL)
  98. .pg_next = &nfsd_acl_program,
  99. #endif
  100. .pg_prog = NFS_PROGRAM, /* program number */
  101. .pg_nvers = NFSD_NRVERS, /* nr of entries in nfsd_version */
  102. .pg_vers = nfsd_versions, /* version table */
  103. .pg_name = "nfsd", /* program name */
  104. .pg_class = "nfsd", /* authentication class */
  105. .pg_stats = &nfsd_svcstats, /* RPC statistics */
  106. .pg_authenticate = &svc_set_client, /* export authentication */
  107. };
  /*
   * Per-minor-version enable flags, indexed by minor version number and
   * read/written through nfsd_minorversion().  Minor versions 0, 1 and 2
   * start out enabled.
   */
  108. static bool nfsd_supported_minorversions[NFSD_SUPPORTED_MINOR_VERSION + 1] = {
  109. [0] = 1,
  110. [1] = 1,
  111. [2] = 1,
  112. };
  113. int nfsd_vers(int vers, enum vers_op change)
  114. {
  115. if (vers < NFSD_MINVERS || vers >= NFSD_NRVERS)
  116. return 0;
  117. switch(change) {
  118. case NFSD_SET:
  119. nfsd_versions[vers] = nfsd_version[vers];
  120. #if defined(CONFIG_NFSD_V2_ACL) || defined(CONFIG_NFSD_V3_ACL)
  121. if (vers < NFSD_ACL_NRVERS)
  122. nfsd_acl_versions[vers] = nfsd_acl_version[vers];
  123. #endif
  124. break;
  125. case NFSD_CLEAR:
  126. nfsd_versions[vers] = NULL;
  127. #if defined(CONFIG_NFSD_V2_ACL) || defined(CONFIG_NFSD_V3_ACL)
  128. if (vers < NFSD_ACL_NRVERS)
  129. nfsd_acl_versions[vers] = NULL;
  130. #endif
  131. break;
  132. case NFSD_TEST:
  133. return nfsd_versions[vers] != NULL;
  134. case NFSD_AVAIL:
  135. return nfsd_version[vers] != NULL;
  136. }
  137. return 0;
  138. }
  139. int nfsd_minorversion(u32 minorversion, enum vers_op change)
  140. {
  141. if (minorversion > NFSD_SUPPORTED_MINOR_VERSION &&
  142. change != NFSD_AVAIL)
  143. return -1;
  144. switch(change) {
  145. case NFSD_SET:
  146. nfsd_supported_minorversions[minorversion] = true;
  147. break;
  148. case NFSD_CLEAR:
  149. nfsd_supported_minorversions[minorversion] = false;
  150. break;
  151. case NFSD_TEST:
  152. return nfsd_supported_minorversions[minorversion];
  153. case NFSD_AVAIL:
  154. return minorversion <= NFSD_SUPPORTED_MINOR_VERSION;
  155. }
  156. return 0;
  157. }
  158. /*
  159. * Maximum number of nfsd processes
  * (nfsd_svc() and nfsd_set_nrthreads() clamp requested counts to this).
  160. */
  161. #define NFSD_MAXSERVS 8192
  162. int nfsd_nrthreads(struct net *net)
  163. {
  164. int rv = 0;
  165. struct nfsd_net *nn = net_generic(net, nfsd_net_id);
  166. mutex_lock(&nfsd_mutex);
  167. if (nn->nfsd_serv)
  168. rv = nn->nfsd_serv->sv_nrthreads;
  169. mutex_unlock(&nfsd_mutex);
  170. return rv;
  171. }
  172. static int nfsd_init_socks(struct net *net)
  173. {
  174. int error;
  175. struct nfsd_net *nn = net_generic(net, nfsd_net_id);
  176. if (!list_empty(&nn->nfsd_serv->sv_permsocks))
  177. return 0;
  178. error = svc_create_xprt(nn->nfsd_serv, "udp", net, PF_INET, NFS_PORT,
  179. SVC_SOCK_DEFAULTS);
  180. if (error < 0)
  181. return error;
  182. error = svc_create_xprt(nn->nfsd_serv, "tcp", net, PF_INET, NFS_PORT,
  183. SVC_SOCK_DEFAULTS);
  184. if (error < 0)
  185. return error;
  186. return 0;
  187. }
  /* Number of users of the state set up by nfsd_startup_generic(). */
  static int nfsd_users = 0;

  /*
   * Take a user reference on the shared (not per-net) nfsd state and,
   * for the first user only, initialise it: the readahead parameter
   * cache (sized 2 * @nrservs) followed by nfs4_state_start().
   *
   * Note that the readahead cache init is a no-op if the cache already
   * exists, so its size is not adjusted when the thread count changes
   * after nfsd has started.
   *
   * Returns 0 on success.  On failure the partial setup is undone, the
   * user count is dropped again and the failing call's result returned.
   */
  static int nfsd_startup_generic(int nrservs)
  {
  	int err;

  	if (nfsd_users++ != 0)
  		return 0;

  	err = nfsd_racache_init(2 * nrservs);
  	if (err == 0) {
  		err = nfs4_state_start();
  		if (err == 0)
  			return 0;
  		nfsd_racache_shutdown();
  	}

  	nfsd_users--;
  	return err;
  }
  212. static void nfsd_shutdown_generic(void)
  213. {
  214. if (--nfsd_users)
  215. return;
  216. nfs4_state_shutdown();
  217. nfsd_racache_shutdown();
  218. }
  219. static bool nfsd_needs_lockd(void)
  220. {
  221. #if defined(CONFIG_NFSD_V3)
  222. return (nfsd_versions[2] != NULL) || (nfsd_versions[3] != NULL);
  223. #else
  224. return (nfsd_versions[2] != NULL);
  225. #endif
  226. }
  227. static int nfsd_startup_net(int nrservs, struct net *net)
  228. {
  229. struct nfsd_net *nn = net_generic(net, nfsd_net_id);
  230. int ret;
  231. if (nn->nfsd_net_up)
  232. return 0;
  233. ret = nfsd_startup_generic(nrservs);
  234. if (ret)
  235. return ret;
  236. ret = nfsd_init_socks(net);
  237. if (ret)
  238. goto out_socks;
  239. if (nfsd_needs_lockd() && !nn->lockd_up) {
  240. ret = lockd_up(net);
  241. if (ret)
  242. goto out_socks;
  243. nn->lockd_up = 1;
  244. }
  245. ret = nfs4_state_start_net(net);
  246. if (ret)
  247. goto out_lockd;
  248. nn->nfsd_net_up = true;
  249. return 0;
  250. out_lockd:
  251. if (nn->lockd_up) {
  252. lockd_down(net);
  253. nn->lockd_up = 0;
  254. }
  255. out_socks:
  256. nfsd_shutdown_generic();
  257. return ret;
  258. }
  /*
   * Undo nfsd_startup_net() for @net: stop the per-net NFSv4 state, bring
   * lockd down if this namespace had brought it up, mark the namespace as
   * no longer up and finally drop the shared-state user reference.
   */
  259. static void nfsd_shutdown_net(struct net *net)
  260. {
  261. struct nfsd_net *nn = net_generic(net, nfsd_net_id);
  262. nfs4_state_shutdown_net(net);
  263. if (nn->lockd_up) {
  264. lockd_down(net);
  265. nn->lockd_up = 0;
  266. }
  267. nn->nfsd_net_up = false;
  268. nfsd_shutdown_generic();
  269. }
  270. static int nfsd_inetaddr_event(struct notifier_block *this, unsigned long event,
  271. void *ptr)
  272. {
  273. struct in_ifaddr *ifa = (struct in_ifaddr *)ptr;
  274. struct net_device *dev = ifa->ifa_dev->dev;
  275. struct net *net = dev_net(dev);
  276. struct nfsd_net *nn = net_generic(net, nfsd_net_id);
  277. struct sockaddr_in sin;
  278. if (event != NETDEV_DOWN)
  279. goto out;
  280. if (nn->nfsd_serv) {
  281. dprintk("nfsd_inetaddr_event: removed %pI4\n", &ifa->ifa_local);
  282. sin.sin_family = AF_INET;
  283. sin.sin_addr.s_addr = ifa->ifa_local;
  284. svc_age_temp_xprts_now(nn->nfsd_serv, (struct sockaddr *)&sin);
  285. }
  286. out:
  287. return NOTIFY_DONE;
  288. }
  289. static struct notifier_block nfsd_inetaddr_notifier = {
  290. .notifier_call = nfsd_inetaddr_event,
  291. };
  292. #if IS_ENABLED(CONFIG_IPV6)
  293. static int nfsd_inet6addr_event(struct notifier_block *this,
  294. unsigned long event, void *ptr)
  295. {
  296. struct inet6_ifaddr *ifa = (struct inet6_ifaddr *)ptr;
  297. struct net_device *dev = ifa->idev->dev;
  298. struct net *net = dev_net(dev);
  299. struct nfsd_net *nn = net_generic(net, nfsd_net_id);
  300. struct sockaddr_in6 sin6;
  301. if (event != NETDEV_DOWN)
  302. goto out;
  303. if (nn->nfsd_serv) {
  304. dprintk("nfsd_inet6addr_event: removed %pI6\n", &ifa->addr);
  305. sin6.sin6_family = AF_INET6;
  306. sin6.sin6_addr = ifa->addr;
  307. svc_age_temp_xprts_now(nn->nfsd_serv, (struct sockaddr *)&sin6);
  308. }
  309. out:
  310. return NOTIFY_DONE;
  311. }
  312. static struct notifier_block nfsd_inet6addr_notifier = {
  313. .notifier_call = nfsd_inet6addr_event,
  314. };
  315. #endif
  316. /* Only used under nfsd_mutex, so this atomic may be overkill: */
  317. static atomic_t nfsd_notifier_refcount = ATOMIC_INIT(0);
  318. static void nfsd_last_thread(struct svc_serv *serv, struct net *net)
  319. {
  320. struct nfsd_net *nn = net_generic(net, nfsd_net_id);
  321. /* check if the notifier still has clients */
  322. if (atomic_dec_return(&nfsd_notifier_refcount) == 0) {
  323. unregister_inetaddr_notifier(&nfsd_inetaddr_notifier);
  324. #if IS_ENABLED(CONFIG_IPV6)
  325. unregister_inet6addr_notifier(&nfsd_inet6addr_notifier);
  326. #endif
  327. }
  328. /*
  329. * write_ports can create the server without actually starting
  330. * any threads--if we get shut down before any threads are
  331. * started, then nfsd_last_thread will be run before any of this
  332. * other initialization has been done except the rpcb information.
  333. */
  334. svc_rpcb_cleanup(serv, net);
  335. if (!nn->nfsd_net_up)
  336. return;
  337. nfsd_shutdown_net(net);
  338. printk(KERN_WARNING "nfsd: last server has exited, flushing export "
  339. "cache\n");
  340. nfsd_export_flush(net);
  341. }
  342. void nfsd_reset_versions(void)
  343. {
  344. int i;
  345. for (i = 0; i < NFSD_NRVERS; i++)
  346. if (nfsd_vers(i, NFSD_TEST))
  347. return;
  348. for (i = 0; i < NFSD_NRVERS; i++)
  349. if (i != 4)
  350. nfsd_vers(i, NFSD_SET);
  351. else {
  352. int minor = 0;
  353. while (nfsd_minorversion(minor, NFSD_SET) >= 0)
  354. minor++;
  355. }
  356. }
  357. /*
  358. * Each session guarantees a negotiated per slot memory cache for replies
  359. * which in turn consumes memory beyond the v2/v3/v4.0 server. A dedicated
  360. * NFSv4.1 server might want to use more memory for a DRC than a machine
  361. * with mutiple services.
  362. *
  363. * Impose a hard limit on the number of pages for the DRC which varies
  364. * according to the machines free pages. This is of course only a default.
  365. *
  366. * For now this is a #defined shift which could be under admin control
  367. * in the future.
  368. */
  369. static void set_max_drc(void)
  370. {
  371. #define NFSD_DRC_SIZE_SHIFT 7
  372. nfsd_drc_max_mem = (nr_free_buffer_pages()
  373. >> NFSD_DRC_SIZE_SHIFT) * PAGE_SIZE;
  374. nfsd_drc_mem_used = 0;
  375. spin_lock_init(&nfsd_drc_lock);
  376. dprintk("%s nfsd_drc_max_mem %lu \n", __func__, nfsd_drc_max_mem);
  377. }
  378. static int nfsd_get_default_max_blksize(void)
  379. {
  380. struct sysinfo i;
  381. unsigned long long target;
  382. unsigned long ret;
  383. si_meminfo(&i);
  384. target = (i.totalram - i.totalhigh) << PAGE_SHIFT;
  385. /*
  386. * Aim for 1/4096 of memory per thread This gives 1MB on 4Gig
  387. * machines, but only uses 32K on 128M machines. Bottom out at
  388. * 8K on 32M and smaller. Of course, this is only a default.
  389. */
  390. target >>= 12;
  391. ret = NFSSVC_MAXBLKSIZE;
  392. while (ret > target && ret >= 8*1024*2)
  393. ret /= 2;
  394. return ret;
  395. }
  /*
   * Operations passed to svc_create_pooled() by nfsd_create_serv().
   * nfsd() is the thread function and nfsd_last_thread() the shutdown
   * hook; ->svo_setup is what nfsd_svc() and nfsd_set_nrthreads() call to
   * change the number of threads.
   */
  396. static struct svc_serv_ops nfsd_thread_sv_ops = {
  397. .svo_shutdown = nfsd_last_thread,
  398. .svo_function = nfsd,
  399. .svo_enqueue_xprt = svc_xprt_do_enqueue,
  400. .svo_setup = svc_set_num_threads,
  401. .svo_module = THIS_MODULE,
  402. };
  403. int nfsd_create_serv(struct net *net)
  404. {
  405. int error;
  406. struct nfsd_net *nn = net_generic(net, nfsd_net_id);
  407. WARN_ON(!mutex_is_locked(&nfsd_mutex));
  408. if (nn->nfsd_serv) {
  409. svc_get(nn->nfsd_serv);
  410. return 0;
  411. }
  412. if (nfsd_max_blksize == 0)
  413. nfsd_max_blksize = nfsd_get_default_max_blksize();
  414. nfsd_reset_versions();
  415. nn->nfsd_serv = svc_create_pooled(&nfsd_program, nfsd_max_blksize,
  416. &nfsd_thread_sv_ops);
  417. if (nn->nfsd_serv == NULL)
  418. return -ENOMEM;
  419. nn->nfsd_serv->sv_maxconn = nn->max_connections;
  420. error = svc_bind(nn->nfsd_serv, net);
  421. if (error < 0) {
  422. svc_destroy(nn->nfsd_serv);
  423. return error;
  424. }
  425. set_max_drc();
  426. /* check if the notifier is already set */
  427. if (atomic_inc_return(&nfsd_notifier_refcount) == 1) {
  428. register_inetaddr_notifier(&nfsd_inetaddr_notifier);
  429. #if IS_ENABLED(CONFIG_IPV6)
  430. register_inet6addr_notifier(&nfsd_inet6addr_notifier);
  431. #endif
  432. }
  433. do_gettimeofday(&nn->nfssvc_boot); /* record boot time */
  434. return 0;
  435. }
  436. int nfsd_nrpools(struct net *net)
  437. {
  438. struct nfsd_net *nn = net_generic(net, nfsd_net_id);
  439. if (nn->nfsd_serv == NULL)
  440. return 0;
  441. else
  442. return nn->nfsd_serv->sv_nrpools;
  443. }
  444. int nfsd_get_nrthreads(int n, int *nthreads, struct net *net)
  445. {
  446. int i = 0;
  447. struct nfsd_net *nn = net_generic(net, nfsd_net_id);
  448. if (nn->nfsd_serv != NULL) {
  449. for (i = 0; i < nn->nfsd_serv->sv_nrpools && i < n; i++)
  450. nthreads[i] = nn->nfsd_serv->sv_pools[i].sp_nrthreads;
  451. }
  452. return 0;
  453. }
  454. void nfsd_destroy(struct net *net)
  455. {
  456. struct nfsd_net *nn = net_generic(net, nfsd_net_id);
  457. int destroy = (nn->nfsd_serv->sv_nrthreads == 1);
  458. if (destroy)
  459. svc_shutdown_net(nn->nfsd_serv, net);
  460. svc_destroy(nn->nfsd_serv);
  461. if (destroy)
  462. nn->nfsd_serv = NULL;
  463. }
  /*
   * Set the number of threads in each pool of the nfsd server in @net.
   *
   * @n:        number of entries in @nthreads; clamped to the number of pools
   * @nthreads: requested thread count per pool; MODIFIED IN PLACE to the
   *            values that are actually applied
   *
   * Must be called with nfsd_mutex held (a warning is emitted otherwise).
   *
   * Each entry is capped at NFSD_MAXSERVS; if the sum still exceeds
   * NFSD_MAXSERVS the entries are scaled down.  Pool 0 is never left at
   * zero threads.  A temporary server reference is held while the new
   * counts are applied.
   *
   * Returns 0 when there is no server or @n <= 0; otherwise 0 on success
   * or the first non-zero result of ->svo_setup (later pools are then not
   * touched).
   *
   * NOTE(review): only the upper bound of each entry is clamped here;
   * negative requests are passed through -- confirm callers reject them.
   */
  464. int nfsd_set_nrthreads(int n, int *nthreads, struct net *net)
  465. {
  466. int i = 0;
  467. int tot = 0;
  468. int err = 0;
  469. struct nfsd_net *nn = net_generic(net, nfsd_net_id);
  470. WARN_ON(!mutex_is_locked(&nfsd_mutex));
  471. if (nn->nfsd_serv == NULL || n <= 0)
  472. return 0;
  473. if (n > nn->nfsd_serv->sv_nrpools)
  474. n = nn->nfsd_serv->sv_nrpools;
  475. /* enforce a global maximum number of threads */
  476. tot = 0;
  477. for (i = 0; i < n; i++) {
  478. nthreads[i] = min(nthreads[i], NFSD_MAXSERVS);
  479. tot += nthreads[i];
  480. }
  481. if (tot > NFSD_MAXSERVS) {
  482. /* total too large: scale down requested numbers */
  483. for (i = 0; i < n && tot > 0; i++) {
  484. int new = nthreads[i] * NFSD_MAXSERVS / tot;
  485. tot -= (nthreads[i] - new);
  486. nthreads[i] = new;
  487. }
  488. for (i = 0; i < n && tot > 0; i++) {
  489. nthreads[i]--;
  490. tot--;
  491. }
  492. }
  493. /*
  494. * There must always be a thread in pool 0; the admin
  495. * can't shut down NFS completely using pool_threads.
  496. */
  497. if (nthreads[0] == 0)
  498. nthreads[0] = 1;
  499. /* apply the new numbers */
  /* hold a reference across the updates; nfsd_destroy() below drops it */
  500. svc_get(nn->nfsd_serv);
  501. for (i = 0; i < n; i++) {
  502. err = nn->nfsd_serv->sv_ops->svo_setup(nn->nfsd_serv,
  503. &nn->nfsd_serv->sv_pools[i], nthreads[i]);
  504. if (err)
  505. break;
  506. }
  507. nfsd_destroy(net);
  508. return err;
  509. }
  510. /*
  511. * Adjust the number of threads and return the new number of threads.
  512. * This is also the function that starts the server if necessary, if
  513. * this is the first time nrservs is nonzero.
  *
  * nrservs is clamped to [0, NFSD_MAXSERVS].  Takes and releases nfsd_mutex.
  * Returns 0 without doing anything when nrservs is 0 and no server exists,
  * a negative value if creating/starting the server or changing the thread
  * count fails, and otherwise the resulting thread count.
  *
  * Note that the success path also falls through the out_shutdown and
  * out_destroy labels: the per-net shutdown is skipped because error is
  * non-negative, and nfsd_destroy() drops the reference taken by
  * nfsd_create_serv().
  514. */
  515. int
  516. nfsd_svc(int nrservs, struct net *net)
  517. {
  518. int error;
  519. bool nfsd_up_before;
  520. struct nfsd_net *nn = net_generic(net, nfsd_net_id);
  521. mutex_lock(&nfsd_mutex);
  522. dprintk("nfsd: creating service\n");
  523. nrservs = max(nrservs, 0);
  524. nrservs = min(nrservs, NFSD_MAXSERVS);
  525. error = 0;
  526. if (nrservs == 0 && nn->nfsd_serv == NULL)
  527. goto out;
  528. error = nfsd_create_serv(net);
  529. if (error)
  530. goto out;
  /* remember whether this call is the one that brings the net up */
  531. nfsd_up_before = nn->nfsd_net_up;
  532. error = nfsd_startup_net(nrservs, net);
  533. if (error)
  534. goto out_destroy;
  535. error = nn->nfsd_serv->sv_ops->svo_setup(nn->nfsd_serv,
  536. NULL, nrservs);
  537. if (error)
  538. goto out_shutdown;
  539. /* We are holding a reference to nn->nfsd_serv which
  540. * we don't want to count in the return value,
  541. * so subtract 1
  542. */
  543. error = nn->nfsd_serv->sv_nrthreads - 1;
  544. out_shutdown:
  545. if (error < 0 && !nfsd_up_before)
  546. nfsd_shutdown_net(net);
  547. out_destroy:
  548. nfsd_destroy(net); /* Release server */
  549. out:
  550. mutex_unlock(&nfsd_mutex);
  551. return error;
  552. }
  553. /*
  554. * This is the NFS server kernel thread
  *
  * vrqstp is the thread's struct svc_rqst.  The network namespace is taken
  * from the first entry on the server's ->sv_permsocks list.
  *
  * Setup runs under nfsd_mutex.  If unshare_fs_struct() fails the thread
  * jumps to "out" with the mutex still held, which is what the exit path
  * expects.  After the request loop ends the mutex is re-taken so that both
  * paths reach "out" holding it.
  555. */
  556. static int
  557. nfsd(void *vrqstp)
  558. {
  559. struct svc_rqst *rqstp = (struct svc_rqst *) vrqstp;
  560. struct svc_xprt *perm_sock = list_entry(rqstp->rq_server->sv_permsocks.next, typeof(struct svc_xprt), xpt_list);
  561. struct net *net = perm_sock->xpt_net;
  562. struct nfsd_net *nn = net_generic(net, nfsd_net_id);
  563. int err;
  564. /* Lock module and set up kernel thread */
  565. mutex_lock(&nfsd_mutex);
  566. /* At this point, the thread shares current->fs
  567. * with the init process. We need to create files with a
  568. * umask of 0 instead of init's umask. */
  569. if (unshare_fs_struct() < 0) {
  570. printk("Unable to start nfsd thread: out of memory\n");
  571. goto out;
  572. }
  573. current->fs->umask = 0;
  574. /*
  575. * thread is spawned with all signals set to SIG_IGN, re-enable
  576. * the ones that will bring down the thread
  577. */
  578. allow_signal(SIGKILL);
  579. allow_signal(SIGHUP);
  580. allow_signal(SIGINT);
  581. allow_signal(SIGQUIT);
  582. nfsdstats.th_cnt++;
  583. mutex_unlock(&nfsd_mutex);
  584. set_freezable();
  585. /*
  586. * The main request loop
  587. */
  588. for (;;) {
  589. /* Update sv_maxconn if it has changed */
  590. rqstp->rq_server->sv_maxconn = nn->max_connections;
  591. /*
  592. * Find a socket with data available and call its
  593. * recvfrom routine.
  594. */
  /* keep waiting on -EAGAIN; -EINTR ends the thread */
  595. while ((err = svc_recv(rqstp, 60*60*HZ)) == -EAGAIN)
  596. ;
  597. if (err == -EINTR)
  598. break;
  599. validate_process_creds();
  600. svc_process(rqstp);
  601. validate_process_creds();
  602. }
  603. /* Clear signals before calling svc_exit_thread() */
  604. flush_signals(current);
  605. mutex_lock(&nfsd_mutex);
  606. nfsdstats.th_cnt --;
  607. out:
  608. rqstp->rq_server = NULL;
  609. /* Release the thread */
  610. svc_exit_thread(rqstp);
  /* drop this thread's hold on the server for this net */
  611. nfsd_destroy(net);
  612. /* Release module */
  613. mutex_unlock(&nfsd_mutex);
  614. module_put_and_exit(0);
  615. return 0;
  616. }
  617. static __be32 map_new_errors(u32 vers, __be32 nfserr)
  618. {
  619. if (nfserr == nfserr_jukebox && vers == 2)
  620. return nfserr_dropit;
  621. if (nfserr == nfserr_wrongsec && vers < 4)
  622. return nfserr_acces;
  623. return nfserr;
  624. }
  625. /*
  626. * A write procedure can have a large argument, and a read procedure can
  627. * have a large reply, but no NFSv2 or NFSv3 procedure has argument and
  628. * reply that can both be larger than a page. The xdr code has taken
  629. * advantage of this assumption to be a sloppy about bounds checking in
  630. * some cases. Pending a rewrite of the NFSv2/v3 xdr code to fix that
  631. * problem, we enforce these assumptions here:
  632. */
  633. static bool nfs_request_too_big(struct svc_rqst *rqstp,
  634. struct svc_procedure *proc)
  635. {
  636. /*
  637. * The ACL code has more careful bounds-checking and is not
  638. * susceptible to this problem:
  639. */
  640. if (rqstp->rq_prog != NFS_PROGRAM)
  641. return false;
  642. /*
  643. * Ditto NFSv4 (which can in theory have argument and reply both
  644. * more than a page):
  645. */
  646. if (rqstp->rq_vers >= 4)
  647. return false;
  648. /* The reply will be small, we're OK: */
  649. if (proc->pc_xdrressize > 0 &&
  650. proc->pc_xdrressize < XDR_QUADLEN(PAGE_SIZE))
  651. return false;
  652. return rqstp->rq_arg.len > PAGE_SIZE;
  653. }
  /*
   * Run one decoded RPC request through its NFS procedure.
   *
   * Decodes the arguments, consults the reply cache, calls the procedure
   * handler, stores the NFS status word in the reply (except for procedure
   * 0) and encodes the result.
   *
   * Returns 0 when the request is to be dropped (reply-cache RC_DROPIT,
   * nfserr_dropit from the handler, or RQ_DROPME set) and 1 otherwise.
   * *statp is set to rpc_garbage_args when the argument is too large or
   * cannot be decoded, and to rpc_system_err when the result cannot be
   * encoded.
   */
  654. int
  655. nfsd_dispatch(struct svc_rqst *rqstp, __be32 *statp)
  656. {
  657. struct svc_procedure *proc;
  658. kxdrproc_t xdr;
  659. __be32 nfserr;
  660. __be32 *nfserrp;
  661. dprintk("nfsd_dispatch: vers %d proc %d\n",
  662. rqstp->rq_vers, rqstp->rq_proc);
  663. proc = rqstp->rq_procinfo;
  664. if (nfs_request_too_big(rqstp, proc)) {
  665. dprintk("nfsd: NFSv%d argument too large\n", rqstp->rq_vers);
  666. *statp = rpc_garbage_args;
  667. return 1;
  668. }
  669. /*
  670. * Give the xdr decoder a chance to change this if it wants
  671. * (necessary in the NFSv4.0 compound case)
  672. */
  673. rqstp->rq_cachetype = proc->pc_cachetype;
  674. /* Decode arguments */
  675. xdr = proc->pc_decode;
  676. if (xdr && !xdr(rqstp, (__be32*)rqstp->rq_arg.head[0].iov_base,
  677. rqstp->rq_argp)) {
  678. dprintk("nfsd: failed to decode arguments!\n");
  679. *statp = rpc_garbage_args;
  680. return 1;
  681. }
  682. /* Check whether we have this call in the cache. */
  683. switch (nfsd_cache_lookup(rqstp)) {
  684. case RC_DROPIT:
  685. return 0;
  686. case RC_REPLY:
  687. return 1;
  688. case RC_DOIT:;
  689. /* do it */
  690. }
  691. /* need to grab the location to store the status, as
  692. * nfsv4 does some encoding while processing
  693. */
  694. nfserrp = rqstp->rq_res.head[0].iov_base
  695. + rqstp->rq_res.head[0].iov_len;
  696. rqstp->rq_res.head[0].iov_len += sizeof(__be32);
  697. /* Now call the procedure handler, and encode NFS status. */
  698. nfserr = proc->pc_func(rqstp, rqstp->rq_argp, rqstp->rq_resp);
  699. nfserr = map_new_errors(rqstp->rq_vers, nfserr);
  700. if (nfserr == nfserr_dropit || test_bit(RQ_DROPME, &rqstp->rq_flags)) {
  701. dprintk("nfsd: Dropping request; may be revisited later\n");
  702. nfsd_cache_update(rqstp, RC_NOCACHE, NULL);
  703. return 0;
  704. }
  /* procedure 0 gets no status word in its reply */
  705. if (rqstp->rq_proc != 0)
  706. *nfserrp++ = nfserr;
  707. /* Encode result.
  708. * For NFSv2, additional info is never returned in case of an error.
  709. */
  710. if (!(nfserr && rqstp->rq_vers == 2)) {
  711. xdr = proc->pc_encode;
  712. if (xdr && !xdr(rqstp, nfserrp,
  713. rqstp->rq_resp)) {
  714. /* Failed to encode result. Release cache entry */
  715. dprintk("nfsd: failed to encode result!\n");
  716. nfsd_cache_update(rqstp, RC_NOCACHE, NULL);
  717. *statp = rpc_system_err;
  718. return 1;
  719. }
  720. }
  721. /* Store reply in cache. */
  722. nfsd_cache_update(rqstp, rqstp->rq_cachetype, statp + 1);
  723. return 1;
  724. }
  725. int nfsd_pool_stats_open(struct inode *inode, struct file *file)
  726. {
  727. int ret;
  728. struct nfsd_net *nn = net_generic(inode->i_sb->s_fs_info, nfsd_net_id);
  729. mutex_lock(&nfsd_mutex);
  730. if (nn->nfsd_serv == NULL) {
  731. mutex_unlock(&nfsd_mutex);
  732. return -ENODEV;
  733. }
  734. /* bump up the psudo refcount while traversing */
  735. svc_get(nn->nfsd_serv);
  736. ret = svc_pool_stats_open(nn->nfsd_serv, file);
  737. mutex_unlock(&nfsd_mutex);
  738. return ret;
  739. }
  740. int nfsd_pool_stats_release(struct inode *inode, struct file *file)
  741. {
  742. int ret = seq_release(inode, file);
  743. struct net *net = inode->i_sb->s_fs_info;
  744. mutex_lock(&nfsd_mutex);
  745. /* this function really, really should have been called svc_put() */
  746. nfsd_destroy(net);
  747. mutex_unlock(&nfsd_mutex);
  748. return ret;
  749. }