page.c 31 KB

12345678910111213141516171819202122232425262728293031323334353637383940414243444546474849505152535455565758596061626364656667686970717273747576777879808182838485868788899091929394959697989910010110210310410510610710810911011111211311411511611711811912012112212312412512612712812913013113213313413513613713813914014114214314414514614714814915015115215315415515615715815916016116216316416516616716816917017117217317417517617717817918018118218318418518618718818919019119219319419519619719819920020120220320420520620720820921021121221321421521621721821922022122222322422522622722822923023123223323423523623723823924024124224324424524624724824925025125225325425525625725825926026126226326426526626726826927027127227327427527627727827928028128228328428528628728828929029129229329429529629729829930030130230330430530630730830931031131231331431531631731831932032132232332432532632732832933033133233333433533633733833934034134234334434534634734834935035135235335435535635735835936036136236336436536636736836937037137237337437537637737837938038138238338438538638738838939039139239339439539639739839940040140240340440540640740840941041141241341441541641741841942042142242342442542642742842943043143243343443543643743843944044144244344444544644744844945045145245345445545645745845946046146246346446546646746846947047147247347447547647747847948048148248348448548648748848949049149249349449549649749849950050150250350450550650750850951051151251351451551651751851952052152252352452552652752852953053153253353453553653753853954054154254354454554654754854955055155255355455555655755855956056156256356456556656756856957057157257357457557657757857958058158258358458558658758858959059159259359459559659759859960060160260360460560660760860961061161261361461561661761861962062162262362462562662762862963063163263363463563663763863964064164264364464564664764864965065165265365465565665765865966066166266366466566666766866967067167267367467567667767867968068168268368468568668768868969069169269369469569669769869970070170270
370470570670770870971071171271371471571671771871972072172272372472572672772872973073173273373473573673773873974074174274374474574674774874975075175275375475575675775875976076176276376476576676776876977077177277377477577677777877978078178278378478578678778878979079179279379479579679779879980080180280380480580680780880981081181281381481581681781881982082182282382482582682782882983083183283383483583683783883984084184284384484584684784884985085185285385485585685785885986086186286386486586686786886987087187287387487587687787887988088188288388488588688788888989089189289389489589689789889990090190290390490590690790890991091191291391491591691791891992092192292392492592692792892993093193293393493593693793893994094194294394494594694794894995095195295395495595695795895996096196296396496596696796896997097197297397497597697797897998098198298398498598698798898999099199299399499599699799899910001001100210031004100510061007100810091010101110121013101410151016101710181019102010211022102310241025102610271028102910301031103210331034103510361037103810391040104110421043104410451046104710481049105010511052105310541055105610571058105910601061106210631064106510661067106810691070107110721073107410751076107710781079108010811082108310841085108610871088108910901091109210931094109510961097109810991100110111021103110411051106110711081109111011111112111311141115111611171118111911201121112211231124112511261127112811291130113111321133113411351136113711381139114011411142114311441145114611471148114911501151115211531154115511561157115811591160116111621163116411651166116711681169117011711172117311741175117611771178117911801181118211831184118511861187118811891190119111921193119411951196119711981199120012011202
  1. /* Cache page management and data I/O routines
  2. *
  3. * Copyright (C) 2004-2008 Red Hat, Inc. All Rights Reserved.
  4. * Written by David Howells (dhowells@redhat.com)
  5. *
  6. * This program is free software; you can redistribute it and/or
  7. * modify it under the terms of the GNU General Public License
  8. * as published by the Free Software Foundation; either version
  9. * 2 of the License, or (at your option) any later version.
  10. */
  11. #define FSCACHE_DEBUG_LEVEL PAGE
  12. #include <linux/module.h>
  13. #include <linux/fscache-cache.h>
  14. #include <linux/buffer_head.h>
  15. #include <linux/pagevec.h>
  16. #include <linux/slab.h>
  17. #include "internal.h"
  18. /*
  19. * check to see if a page is being written to the cache
  20. */
  21. bool __fscache_check_page_write(struct fscache_cookie *cookie, struct page *page)
  22. {
  23. void *val;
  24. rcu_read_lock();
  25. val = radix_tree_lookup(&cookie->stores, page->index);
  26. rcu_read_unlock();
  27. return val != NULL;
  28. }
  29. EXPORT_SYMBOL(__fscache_check_page_write);
  30. /*
  31. * wait for a page to finish being written to the cache
  32. */
  33. void __fscache_wait_on_page_write(struct fscache_cookie *cookie, struct page *page)
  34. {
  35. wait_queue_head_t *wq = bit_waitqueue(&cookie->flags, 0);
  36. wait_event(*wq, !__fscache_check_page_write(cookie, page));
  37. }
  38. EXPORT_SYMBOL(__fscache_wait_on_page_write);
  39. /*
  40. * wait for a page to finish being written to the cache. Put a timeout here
  41. * since we might be called recursively via parent fs.
  42. */
  43. static
  44. bool release_page_wait_timeout(struct fscache_cookie *cookie, struct page *page)
  45. {
  46. wait_queue_head_t *wq = bit_waitqueue(&cookie->flags, 0);
  47. return wait_event_timeout(*wq, !__fscache_check_page_write(cookie, page),
  48. HZ);
  49. }
  50. /*
  51. * decide whether a page can be released, possibly by cancelling a store to it
  52. * - we're allowed to sleep if __GFP_DIRECT_RECLAIM is flagged
  53. */
  54. bool __fscache_maybe_release_page(struct fscache_cookie *cookie,
  55. struct page *page,
  56. gfp_t gfp)
  57. {
  58. struct page *xpage;
  59. void *val;
  60. _enter("%p,%p,%x", cookie, page, gfp);
  61. try_again:
  62. rcu_read_lock();
  63. val = radix_tree_lookup(&cookie->stores, page->index);
  64. if (!val) {
  65. rcu_read_unlock();
  66. fscache_stat(&fscache_n_store_vmscan_not_storing);
  67. __fscache_uncache_page(cookie, page);
  68. return true;
  69. }
  70. /* see if the page is actually undergoing storage - if so we can't get
  71. * rid of it till the cache has finished with it */
  72. if (radix_tree_tag_get(&cookie->stores, page->index,
  73. FSCACHE_COOKIE_STORING_TAG)) {
  74. rcu_read_unlock();
  75. goto page_busy;
  76. }
  77. /* the page is pending storage, so we attempt to cancel the store and
  78. * discard the store request so that the page can be reclaimed */
  79. spin_lock(&cookie->stores_lock);
  80. rcu_read_unlock();
  81. if (radix_tree_tag_get(&cookie->stores, page->index,
  82. FSCACHE_COOKIE_STORING_TAG)) {
  83. /* the page started to undergo storage whilst we were looking,
  84. * so now we can only wait or return */
  85. spin_unlock(&cookie->stores_lock);
  86. goto page_busy;
  87. }
  88. xpage = radix_tree_delete(&cookie->stores, page->index);
  89. spin_unlock(&cookie->stores_lock);
  90. if (xpage) {
  91. fscache_stat(&fscache_n_store_vmscan_cancelled);
  92. fscache_stat(&fscache_n_store_radix_deletes);
  93. ASSERTCMP(xpage, ==, page);
  94. } else {
  95. fscache_stat(&fscache_n_store_vmscan_gone);
  96. }
  97. wake_up_bit(&cookie->flags, 0);
  98. if (xpage)
  99. put_page(xpage);
  100. __fscache_uncache_page(cookie, page);
  101. return true;
  102. page_busy:
  103. /* We will wait here if we're allowed to, but that could deadlock the
  104. * allocator as the work threads writing to the cache may all end up
  105. * sleeping on memory allocation, so we may need to impose a timeout
  106. * too. */
  107. if (!(gfp & __GFP_DIRECT_RECLAIM) || !(gfp & __GFP_FS)) {
  108. fscache_stat(&fscache_n_store_vmscan_busy);
  109. return false;
  110. }
  111. fscache_stat(&fscache_n_store_vmscan_wait);
  112. if (!release_page_wait_timeout(cookie, page))
  113. _debug("fscache writeout timeout page: %p{%lx}",
  114. page, page->index);
  115. gfp &= ~__GFP_DIRECT_RECLAIM;
  116. goto try_again;
  117. }
  118. EXPORT_SYMBOL(__fscache_maybe_release_page);
  119. /*
  120. * note that a page has finished being written to the cache
  121. */
  122. static void fscache_end_page_write(struct fscache_object *object,
  123. struct page *page)
  124. {
  125. struct fscache_cookie *cookie;
  126. struct page *xpage = NULL;
  127. spin_lock(&object->lock);
  128. cookie = object->cookie;
  129. if (cookie) {
  130. /* delete the page from the tree if it is now no longer
  131. * pending */
  132. spin_lock(&cookie->stores_lock);
  133. radix_tree_tag_clear(&cookie->stores, page->index,
  134. FSCACHE_COOKIE_STORING_TAG);
  135. if (!radix_tree_tag_get(&cookie->stores, page->index,
  136. FSCACHE_COOKIE_PENDING_TAG)) {
  137. fscache_stat(&fscache_n_store_radix_deletes);
  138. xpage = radix_tree_delete(&cookie->stores, page->index);
  139. }
  140. spin_unlock(&cookie->stores_lock);
  141. wake_up_bit(&cookie->flags, 0);
  142. }
  143. spin_unlock(&object->lock);
  144. if (xpage)
  145. put_page(xpage);
  146. }
  147. /*
  148. * actually apply the changed attributes to a cache object
  149. */
  150. static void fscache_attr_changed_op(struct fscache_operation *op)
  151. {
  152. struct fscache_object *object = op->object;
  153. int ret;
  154. _enter("{OBJ%x OP%x}", object->debug_id, op->debug_id);
  155. fscache_stat(&fscache_n_attr_changed_calls);
  156. if (fscache_object_is_active(object)) {
  157. fscache_stat(&fscache_n_cop_attr_changed);
  158. ret = object->cache->ops->attr_changed(object);
  159. fscache_stat_d(&fscache_n_cop_attr_changed);
  160. if (ret < 0)
  161. fscache_abort_object(object);
  162. }
  163. fscache_op_complete(op, true);
  164. _leave("");
  165. }
  166. /*
  167. * notification that the attributes on an object have changed
  168. */
  169. int __fscache_attr_changed(struct fscache_cookie *cookie)
  170. {
  171. struct fscache_operation *op;
  172. struct fscache_object *object;
  173. bool wake_cookie = false;
  174. _enter("%p", cookie);
  175. ASSERTCMP(cookie->def->type, !=, FSCACHE_COOKIE_TYPE_INDEX);
  176. fscache_stat(&fscache_n_attr_changed);
  177. op = kzalloc(sizeof(*op), GFP_KERNEL);
  178. if (!op) {
  179. fscache_stat(&fscache_n_attr_changed_nomem);
  180. _leave(" = -ENOMEM");
  181. return -ENOMEM;
  182. }
  183. fscache_operation_init(op, fscache_attr_changed_op, NULL, NULL);
  184. op->flags = FSCACHE_OP_ASYNC |
  185. (1 << FSCACHE_OP_EXCLUSIVE) |
  186. (1 << FSCACHE_OP_UNUSE_COOKIE);
  187. spin_lock(&cookie->lock);
  188. if (!fscache_cookie_enabled(cookie) ||
  189. hlist_empty(&cookie->backing_objects))
  190. goto nobufs;
  191. object = hlist_entry(cookie->backing_objects.first,
  192. struct fscache_object, cookie_link);
  193. __fscache_use_cookie(cookie);
  194. if (fscache_submit_exclusive_op(object, op) < 0)
  195. goto nobufs_dec;
  196. spin_unlock(&cookie->lock);
  197. fscache_stat(&fscache_n_attr_changed_ok);
  198. fscache_put_operation(op);
  199. _leave(" = 0");
  200. return 0;
  201. nobufs_dec:
  202. wake_cookie = __fscache_unuse_cookie(cookie);
  203. nobufs:
  204. spin_unlock(&cookie->lock);
  205. fscache_put_operation(op);
  206. if (wake_cookie)
  207. __fscache_wake_unused_cookie(cookie);
  208. fscache_stat(&fscache_n_attr_changed_nobufs);
  209. _leave(" = %d", -ENOBUFS);
  210. return -ENOBUFS;
  211. }
  212. EXPORT_SYMBOL(__fscache_attr_changed);
  213. /*
  214. * Handle cancellation of a pending retrieval op
  215. */
  216. static void fscache_do_cancel_retrieval(struct fscache_operation *_op)
  217. {
  218. struct fscache_retrieval *op =
  219. container_of(_op, struct fscache_retrieval, op);
  220. atomic_set(&op->n_pages, 0);
  221. }
  222. /*
  223. * release a retrieval op reference
  224. */
  225. static void fscache_release_retrieval_op(struct fscache_operation *_op)
  226. {
  227. struct fscache_retrieval *op =
  228. container_of(_op, struct fscache_retrieval, op);
  229. _enter("{OP%x}", op->op.debug_id);
  230. ASSERTIFCMP(op->op.state != FSCACHE_OP_ST_INITIALISED,
  231. atomic_read(&op->n_pages), ==, 0);
  232. fscache_hist(fscache_retrieval_histogram, op->start_time);
  233. if (op->context)
  234. fscache_put_context(op->cookie, op->context);
  235. _leave("");
  236. }
  237. /*
  238. * allocate a retrieval op
  239. */
  240. static struct fscache_retrieval *fscache_alloc_retrieval(
  241. struct fscache_cookie *cookie,
  242. struct address_space *mapping,
  243. fscache_rw_complete_t end_io_func,
  244. void *context)
  245. {
  246. struct fscache_retrieval *op;
  247. /* allocate a retrieval operation and attempt to submit it */
  248. op = kzalloc(sizeof(*op), GFP_NOIO);
  249. if (!op) {
  250. fscache_stat(&fscache_n_retrievals_nomem);
  251. return NULL;
  252. }
  253. fscache_operation_init(&op->op, NULL,
  254. fscache_do_cancel_retrieval,
  255. fscache_release_retrieval_op);
  256. op->op.flags = FSCACHE_OP_MYTHREAD |
  257. (1UL << FSCACHE_OP_WAITING) |
  258. (1UL << FSCACHE_OP_UNUSE_COOKIE);
  259. op->cookie = cookie;
  260. op->mapping = mapping;
  261. op->end_io_func = end_io_func;
  262. op->context = context;
  263. op->start_time = jiffies;
  264. INIT_LIST_HEAD(&op->to_do);
  265. /* Pin the netfs read context in case we need to do the actual netfs
  266. * read because we've encountered a cache read failure.
  267. */
  268. if (context)
  269. fscache_get_context(op->cookie, context);
  270. return op;
  271. }
  272. /*
  273. * wait for a deferred lookup to complete
  274. */
  275. int fscache_wait_for_deferred_lookup(struct fscache_cookie *cookie)
  276. {
  277. unsigned long jif;
  278. _enter("");
  279. if (!test_bit(FSCACHE_COOKIE_LOOKING_UP, &cookie->flags)) {
  280. _leave(" = 0 [imm]");
  281. return 0;
  282. }
  283. fscache_stat(&fscache_n_retrievals_wait);
  284. jif = jiffies;
  285. if (wait_on_bit(&cookie->flags, FSCACHE_COOKIE_LOOKING_UP,
  286. TASK_INTERRUPTIBLE) != 0) {
  287. fscache_stat(&fscache_n_retrievals_intr);
  288. _leave(" = -ERESTARTSYS");
  289. return -ERESTARTSYS;
  290. }
  291. ASSERT(!test_bit(FSCACHE_COOKIE_LOOKING_UP, &cookie->flags));
  292. smp_rmb();
  293. fscache_hist(fscache_retrieval_delay_histogram, jif);
  294. _leave(" = 0 [dly]");
  295. return 0;
  296. }
  297. /*
  298. * wait for an object to become active (or dead)
  299. */
  300. int fscache_wait_for_operation_activation(struct fscache_object *object,
  301. struct fscache_operation *op,
  302. atomic_t *stat_op_waits,
  303. atomic_t *stat_object_dead)
  304. {
  305. int ret;
  306. if (!test_bit(FSCACHE_OP_WAITING, &op->flags))
  307. goto check_if_dead;
  308. _debug(">>> WT");
  309. if (stat_op_waits)
  310. fscache_stat(stat_op_waits);
  311. if (wait_on_bit(&op->flags, FSCACHE_OP_WAITING,
  312. TASK_INTERRUPTIBLE) != 0) {
  313. ret = fscache_cancel_op(op, false);
  314. if (ret == 0)
  315. return -ERESTARTSYS;
  316. /* it's been removed from the pending queue by another party,
  317. * so we should get to run shortly */
  318. wait_on_bit(&op->flags, FSCACHE_OP_WAITING,
  319. TASK_UNINTERRUPTIBLE);
  320. }
  321. _debug("<<< GO");
  322. check_if_dead:
  323. if (op->state == FSCACHE_OP_ST_CANCELLED) {
  324. if (stat_object_dead)
  325. fscache_stat(stat_object_dead);
  326. _leave(" = -ENOBUFS [cancelled]");
  327. return -ENOBUFS;
  328. }
  329. if (unlikely(fscache_object_is_dying(object) ||
  330. fscache_cache_is_broken(object))) {
  331. enum fscache_operation_state state = op->state;
  332. fscache_cancel_op(op, true);
  333. if (stat_object_dead)
  334. fscache_stat(stat_object_dead);
  335. _leave(" = -ENOBUFS [obj dead %d]", state);
  336. return -ENOBUFS;
  337. }
  338. return 0;
  339. }
  340. /*
  341. * read a page from the cache or allocate a block in which to store it
  342. * - we return:
  343. * -ENOMEM - out of memory, nothing done
  344. * -ERESTARTSYS - interrupted
  345. * -ENOBUFS - no backing object available in which to cache the block
  346. * -ENODATA - no data available in the backing object for this block
  347. * 0 - dispatched a read - it'll call end_io_func() when finished
  348. */
  349. int __fscache_read_or_alloc_page(struct fscache_cookie *cookie,
  350. struct page *page,
  351. fscache_rw_complete_t end_io_func,
  352. void *context,
  353. gfp_t gfp)
  354. {
  355. struct fscache_retrieval *op;
  356. struct fscache_object *object;
  357. bool wake_cookie = false;
  358. int ret;
  359. _enter("%p,%p,,,", cookie, page);
  360. fscache_stat(&fscache_n_retrievals);
  361. if (hlist_empty(&cookie->backing_objects))
  362. goto nobufs;
  363. if (test_bit(FSCACHE_COOKIE_INVALIDATING, &cookie->flags)) {
  364. _leave(" = -ENOBUFS [invalidating]");
  365. return -ENOBUFS;
  366. }
  367. ASSERTCMP(cookie->def->type, !=, FSCACHE_COOKIE_TYPE_INDEX);
  368. ASSERTCMP(page, !=, NULL);
  369. if (fscache_wait_for_deferred_lookup(cookie) < 0)
  370. return -ERESTARTSYS;
  371. op = fscache_alloc_retrieval(cookie, page->mapping,
  372. end_io_func, context);
  373. if (!op) {
  374. _leave(" = -ENOMEM");
  375. return -ENOMEM;
  376. }
  377. atomic_set(&op->n_pages, 1);
  378. spin_lock(&cookie->lock);
  379. if (!fscache_cookie_enabled(cookie) ||
  380. hlist_empty(&cookie->backing_objects))
  381. goto nobufs_unlock;
  382. object = hlist_entry(cookie->backing_objects.first,
  383. struct fscache_object, cookie_link);
  384. ASSERT(test_bit(FSCACHE_OBJECT_IS_LOOKED_UP, &object->flags));
  385. __fscache_use_cookie(cookie);
  386. atomic_inc(&object->n_reads);
  387. __set_bit(FSCACHE_OP_DEC_READ_CNT, &op->op.flags);
  388. if (fscache_submit_op(object, &op->op) < 0)
  389. goto nobufs_unlock_dec;
  390. spin_unlock(&cookie->lock);
  391. fscache_stat(&fscache_n_retrieval_ops);
  392. /* we wait for the operation to become active, and then process it
  393. * *here*, in this thread, and not in the thread pool */
  394. ret = fscache_wait_for_operation_activation(
  395. object, &op->op,
  396. __fscache_stat(&fscache_n_retrieval_op_waits),
  397. __fscache_stat(&fscache_n_retrievals_object_dead));
  398. if (ret < 0)
  399. goto error;
  400. /* ask the cache to honour the operation */
  401. if (test_bit(FSCACHE_COOKIE_NO_DATA_YET, &object->cookie->flags)) {
  402. fscache_stat(&fscache_n_cop_allocate_page);
  403. ret = object->cache->ops->allocate_page(op, page, gfp);
  404. fscache_stat_d(&fscache_n_cop_allocate_page);
  405. if (ret == 0)
  406. ret = -ENODATA;
  407. } else {
  408. fscache_stat(&fscache_n_cop_read_or_alloc_page);
  409. ret = object->cache->ops->read_or_alloc_page(op, page, gfp);
  410. fscache_stat_d(&fscache_n_cop_read_or_alloc_page);
  411. }
  412. error:
  413. if (ret == -ENOMEM)
  414. fscache_stat(&fscache_n_retrievals_nomem);
  415. else if (ret == -ERESTARTSYS)
  416. fscache_stat(&fscache_n_retrievals_intr);
  417. else if (ret == -ENODATA)
  418. fscache_stat(&fscache_n_retrievals_nodata);
  419. else if (ret < 0)
  420. fscache_stat(&fscache_n_retrievals_nobufs);
  421. else
  422. fscache_stat(&fscache_n_retrievals_ok);
  423. fscache_put_retrieval(op);
  424. _leave(" = %d", ret);
  425. return ret;
  426. nobufs_unlock_dec:
  427. atomic_dec(&object->n_reads);
  428. wake_cookie = __fscache_unuse_cookie(cookie);
  429. nobufs_unlock:
  430. spin_unlock(&cookie->lock);
  431. if (wake_cookie)
  432. __fscache_wake_unused_cookie(cookie);
  433. fscache_put_retrieval(op);
  434. nobufs:
  435. fscache_stat(&fscache_n_retrievals_nobufs);
  436. _leave(" = -ENOBUFS");
  437. return -ENOBUFS;
  438. }
  439. EXPORT_SYMBOL(__fscache_read_or_alloc_page);
  440. /*
  441. * read a list of page from the cache or allocate a block in which to store
  442. * them
  443. * - we return:
  444. * -ENOMEM - out of memory, some pages may be being read
  445. * -ERESTARTSYS - interrupted, some pages may be being read
  446. * -ENOBUFS - no backing object or space available in which to cache any
  447. * pages not being read
  448. * -ENODATA - no data available in the backing object for some or all of
  449. * the pages
  450. * 0 - dispatched a read on all pages
  451. *
  452. * end_io_func() will be called for each page read from the cache as it is
  453. * finishes being read
  454. *
  455. * any pages for which a read is dispatched will be removed from pages and
  456. * nr_pages
  457. */
  458. int __fscache_read_or_alloc_pages(struct fscache_cookie *cookie,
  459. struct address_space *mapping,
  460. struct list_head *pages,
  461. unsigned *nr_pages,
  462. fscache_rw_complete_t end_io_func,
  463. void *context,
  464. gfp_t gfp)
  465. {
  466. struct fscache_retrieval *op;
  467. struct fscache_object *object;
  468. bool wake_cookie = false;
  469. int ret;
  470. _enter("%p,,%d,,,", cookie, *nr_pages);
  471. fscache_stat(&fscache_n_retrievals);
  472. if (hlist_empty(&cookie->backing_objects))
  473. goto nobufs;
  474. if (test_bit(FSCACHE_COOKIE_INVALIDATING, &cookie->flags)) {
  475. _leave(" = -ENOBUFS [invalidating]");
  476. return -ENOBUFS;
  477. }
  478. ASSERTCMP(cookie->def->type, !=, FSCACHE_COOKIE_TYPE_INDEX);
  479. ASSERTCMP(*nr_pages, >, 0);
  480. ASSERT(!list_empty(pages));
  481. if (fscache_wait_for_deferred_lookup(cookie) < 0)
  482. return -ERESTARTSYS;
  483. op = fscache_alloc_retrieval(cookie, mapping, end_io_func, context);
  484. if (!op)
  485. return -ENOMEM;
  486. atomic_set(&op->n_pages, *nr_pages);
  487. spin_lock(&cookie->lock);
  488. if (!fscache_cookie_enabled(cookie) ||
  489. hlist_empty(&cookie->backing_objects))
  490. goto nobufs_unlock;
  491. object = hlist_entry(cookie->backing_objects.first,
  492. struct fscache_object, cookie_link);
  493. __fscache_use_cookie(cookie);
  494. atomic_inc(&object->n_reads);
  495. __set_bit(FSCACHE_OP_DEC_READ_CNT, &op->op.flags);
  496. if (fscache_submit_op(object, &op->op) < 0)
  497. goto nobufs_unlock_dec;
  498. spin_unlock(&cookie->lock);
  499. fscache_stat(&fscache_n_retrieval_ops);
  500. /* we wait for the operation to become active, and then process it
  501. * *here*, in this thread, and not in the thread pool */
  502. ret = fscache_wait_for_operation_activation(
  503. object, &op->op,
  504. __fscache_stat(&fscache_n_retrieval_op_waits),
  505. __fscache_stat(&fscache_n_retrievals_object_dead));
  506. if (ret < 0)
  507. goto error;
  508. /* ask the cache to honour the operation */
  509. if (test_bit(FSCACHE_COOKIE_NO_DATA_YET, &object->cookie->flags)) {
  510. fscache_stat(&fscache_n_cop_allocate_pages);
  511. ret = object->cache->ops->allocate_pages(
  512. op, pages, nr_pages, gfp);
  513. fscache_stat_d(&fscache_n_cop_allocate_pages);
  514. } else {
  515. fscache_stat(&fscache_n_cop_read_or_alloc_pages);
  516. ret = object->cache->ops->read_or_alloc_pages(
  517. op, pages, nr_pages, gfp);
  518. fscache_stat_d(&fscache_n_cop_read_or_alloc_pages);
  519. }
  520. error:
  521. if (ret == -ENOMEM)
  522. fscache_stat(&fscache_n_retrievals_nomem);
  523. else if (ret == -ERESTARTSYS)
  524. fscache_stat(&fscache_n_retrievals_intr);
  525. else if (ret == -ENODATA)
  526. fscache_stat(&fscache_n_retrievals_nodata);
  527. else if (ret < 0)
  528. fscache_stat(&fscache_n_retrievals_nobufs);
  529. else
  530. fscache_stat(&fscache_n_retrievals_ok);
  531. fscache_put_retrieval(op);
  532. _leave(" = %d", ret);
  533. return ret;
  534. nobufs_unlock_dec:
  535. atomic_dec(&object->n_reads);
  536. wake_cookie = __fscache_unuse_cookie(cookie);
  537. nobufs_unlock:
  538. spin_unlock(&cookie->lock);
  539. fscache_put_retrieval(op);
  540. if (wake_cookie)
  541. __fscache_wake_unused_cookie(cookie);
  542. nobufs:
  543. fscache_stat(&fscache_n_retrievals_nobufs);
  544. _leave(" = -ENOBUFS");
  545. return -ENOBUFS;
  546. }
  547. EXPORT_SYMBOL(__fscache_read_or_alloc_pages);
  548. /*
  549. * allocate a block in the cache on which to store a page
  550. * - we return:
  551. * -ENOMEM - out of memory, nothing done
  552. * -ERESTARTSYS - interrupted
  553. * -ENOBUFS - no backing object available in which to cache the block
  554. * 0 - block allocated
  555. */
  556. int __fscache_alloc_page(struct fscache_cookie *cookie,
  557. struct page *page,
  558. gfp_t gfp)
  559. {
  560. struct fscache_retrieval *op;
  561. struct fscache_object *object;
  562. bool wake_cookie = false;
  563. int ret;
  564. _enter("%p,%p,,,", cookie, page);
  565. fscache_stat(&fscache_n_allocs);
  566. if (hlist_empty(&cookie->backing_objects))
  567. goto nobufs;
  568. ASSERTCMP(cookie->def->type, !=, FSCACHE_COOKIE_TYPE_INDEX);
  569. ASSERTCMP(page, !=, NULL);
  570. if (test_bit(FSCACHE_COOKIE_INVALIDATING, &cookie->flags)) {
  571. _leave(" = -ENOBUFS [invalidating]");
  572. return -ENOBUFS;
  573. }
  574. if (fscache_wait_for_deferred_lookup(cookie) < 0)
  575. return -ERESTARTSYS;
  576. op = fscache_alloc_retrieval(cookie, page->mapping, NULL, NULL);
  577. if (!op)
  578. return -ENOMEM;
  579. atomic_set(&op->n_pages, 1);
  580. spin_lock(&cookie->lock);
  581. if (!fscache_cookie_enabled(cookie) ||
  582. hlist_empty(&cookie->backing_objects))
  583. goto nobufs_unlock;
  584. object = hlist_entry(cookie->backing_objects.first,
  585. struct fscache_object, cookie_link);
  586. __fscache_use_cookie(cookie);
  587. if (fscache_submit_op(object, &op->op) < 0)
  588. goto nobufs_unlock_dec;
  589. spin_unlock(&cookie->lock);
  590. fscache_stat(&fscache_n_alloc_ops);
  591. ret = fscache_wait_for_operation_activation(
  592. object, &op->op,
  593. __fscache_stat(&fscache_n_alloc_op_waits),
  594. __fscache_stat(&fscache_n_allocs_object_dead));
  595. if (ret < 0)
  596. goto error;
  597. /* ask the cache to honour the operation */
  598. fscache_stat(&fscache_n_cop_allocate_page);
  599. ret = object->cache->ops->allocate_page(op, page, gfp);
  600. fscache_stat_d(&fscache_n_cop_allocate_page);
  601. error:
  602. if (ret == -ERESTARTSYS)
  603. fscache_stat(&fscache_n_allocs_intr);
  604. else if (ret < 0)
  605. fscache_stat(&fscache_n_allocs_nobufs);
  606. else
  607. fscache_stat(&fscache_n_allocs_ok);
  608. fscache_put_retrieval(op);
  609. _leave(" = %d", ret);
  610. return ret;
  611. nobufs_unlock_dec:
  612. wake_cookie = __fscache_unuse_cookie(cookie);
  613. nobufs_unlock:
  614. spin_unlock(&cookie->lock);
  615. fscache_put_retrieval(op);
  616. if (wake_cookie)
  617. __fscache_wake_unused_cookie(cookie);
  618. nobufs:
  619. fscache_stat(&fscache_n_allocs_nobufs);
  620. _leave(" = -ENOBUFS");
  621. return -ENOBUFS;
  622. }
  623. EXPORT_SYMBOL(__fscache_alloc_page);
  624. /*
  625. * Unmark pages allocate in the readahead code path (via:
  626. * fscache_readpages_or_alloc) after delegating to the base filesystem
  627. */
  628. void __fscache_readpages_cancel(struct fscache_cookie *cookie,
  629. struct list_head *pages)
  630. {
  631. struct page *page;
  632. list_for_each_entry(page, pages, lru) {
  633. if (PageFsCache(page))
  634. __fscache_uncache_page(cookie, page);
  635. }
  636. }
  637. EXPORT_SYMBOL(__fscache_readpages_cancel);
  638. /*
  639. * release a write op reference
  640. */
  641. static void fscache_release_write_op(struct fscache_operation *_op)
  642. {
  643. _enter("{OP%x}", _op->debug_id);
  644. }
  645. /*
  646. * perform the background storage of a page into the cache
  647. */
  648. static void fscache_write_op(struct fscache_operation *_op)
  649. {
  650. struct fscache_storage *op =
  651. container_of(_op, struct fscache_storage, op);
  652. struct fscache_object *object = op->op.object;
  653. struct fscache_cookie *cookie;
  654. struct page *page;
  655. unsigned n;
  656. void *results[1];
  657. int ret;
  658. _enter("{OP%x,%d}", op->op.debug_id, atomic_read(&op->op.usage));
  659. again:
  660. spin_lock(&object->lock);
  661. cookie = object->cookie;
  662. if (!fscache_object_is_active(object)) {
  663. /* If we get here, then the on-disk cache object likely longer
  664. * exists, so we should just cancel this write operation.
  665. */
  666. spin_unlock(&object->lock);
  667. fscache_op_complete(&op->op, false);
  668. _leave(" [inactive]");
  669. return;
  670. }
  671. if (!cookie) {
  672. /* If we get here, then the cookie belonging to the object was
  673. * detached, probably by the cookie being withdrawn due to
  674. * memory pressure, which means that the pages we might write
  675. * to the cache from no longer exist - therefore, we can just
  676. * cancel this write operation.
  677. */
  678. spin_unlock(&object->lock);
  679. fscache_op_complete(&op->op, false);
  680. _leave(" [cancel] op{f=%lx s=%u} obj{s=%s f=%lx}",
  681. _op->flags, _op->state, object->state->short_name,
  682. object->flags);
  683. return;
  684. }
  685. spin_lock(&cookie->stores_lock);
  686. fscache_stat(&fscache_n_store_calls);
  687. /* find a page to store */
  688. page = NULL;
  689. n = radix_tree_gang_lookup_tag(&cookie->stores, results, 0, 1,
  690. FSCACHE_COOKIE_PENDING_TAG);
  691. if (n != 1)
  692. goto superseded;
  693. page = results[0];
  694. _debug("gang %d [%lx]", n, page->index);
  695. radix_tree_tag_set(&cookie->stores, page->index,
  696. FSCACHE_COOKIE_STORING_TAG);
  697. radix_tree_tag_clear(&cookie->stores, page->index,
  698. FSCACHE_COOKIE_PENDING_TAG);
  699. spin_unlock(&cookie->stores_lock);
  700. spin_unlock(&object->lock);
  701. if (page->index >= op->store_limit)
  702. goto discard_page;
  703. fscache_stat(&fscache_n_store_pages);
  704. fscache_stat(&fscache_n_cop_write_page);
  705. ret = object->cache->ops->write_page(op, page);
  706. fscache_stat_d(&fscache_n_cop_write_page);
  707. fscache_end_page_write(object, page);
  708. if (ret < 0) {
  709. fscache_abort_object(object);
  710. fscache_op_complete(&op->op, true);
  711. } else {
  712. fscache_enqueue_operation(&op->op);
  713. }
  714. _leave("");
  715. return;
  716. discard_page:
  717. fscache_stat(&fscache_n_store_pages_over_limit);
  718. fscache_end_page_write(object, page);
  719. goto again;
  720. superseded:
  721. /* this writer is going away and there aren't any more things to
  722. * write */
  723. _debug("cease");
  724. spin_unlock(&cookie->stores_lock);
  725. clear_bit(FSCACHE_OBJECT_PENDING_WRITE, &object->flags);
  726. spin_unlock(&object->lock);
  727. fscache_op_complete(&op->op, true);
  728. _leave("");
  729. }
  730. /*
  731. * Clear the pages pending writing for invalidation
  732. */
  733. void fscache_invalidate_writes(struct fscache_cookie *cookie)
  734. {
  735. struct page *page;
  736. void *results[16];
  737. int n, i;
  738. _enter("");
  739. for (;;) {
  740. spin_lock(&cookie->stores_lock);
  741. n = radix_tree_gang_lookup_tag(&cookie->stores, results, 0,
  742. ARRAY_SIZE(results),
  743. FSCACHE_COOKIE_PENDING_TAG);
  744. if (n == 0) {
  745. spin_unlock(&cookie->stores_lock);
  746. break;
  747. }
  748. for (i = n - 1; i >= 0; i--) {
  749. page = results[i];
  750. radix_tree_delete(&cookie->stores, page->index);
  751. }
  752. spin_unlock(&cookie->stores_lock);
  753. for (i = n - 1; i >= 0; i--)
  754. put_page(results[i]);
  755. }
  756. wake_up_bit(&cookie->flags, 0);
  757. _leave("");
  758. }
  759. /*
  760. * request a page be stored in the cache
  761. * - returns:
  762. * -ENOMEM - out of memory, nothing done
  763. * -ENOBUFS - no backing object available in which to cache the page
  764. * 0 - dispatched a write - it'll call end_io_func() when finished
  765. *
  766. * if the cookie still has a backing object at this point, that object can be
  767. * in one of a few states with respect to storage processing:
  768. *
  769. * (1) negative lookup, object not yet created (FSCACHE_COOKIE_CREATING is
  770. * set)
  771. *
  772. * (a) no writes yet
  773. *
  774. * (b) writes deferred till post-creation (mark page for writing and
  775. * return immediately)
  776. *
  777. * (2) negative lookup, object created, initial fill being made from netfs
  778. *
  779. * (a) fill point not yet reached this page (mark page for writing and
  780. * return)
  781. *
  782. * (b) fill point passed this page (queue op to store this page)
  783. *
  784. * (3) object extant (queue op to store this page)
  785. *
  786. * any other state is invalid
  787. */
  788. int __fscache_write_page(struct fscache_cookie *cookie,
  789. struct page *page,
  790. gfp_t gfp)
  791. {
  792. struct fscache_storage *op;
  793. struct fscache_object *object;
  794. bool wake_cookie = false;
  795. int ret;
  796. _enter("%p,%x,", cookie, (u32) page->flags);
  797. ASSERTCMP(cookie->def->type, !=, FSCACHE_COOKIE_TYPE_INDEX);
  798. ASSERT(PageFsCache(page));
  799. fscache_stat(&fscache_n_stores);
  800. if (test_bit(FSCACHE_COOKIE_INVALIDATING, &cookie->flags)) {
  801. _leave(" = -ENOBUFS [invalidating]");
  802. return -ENOBUFS;
  803. }
  804. op = kzalloc(sizeof(*op), GFP_NOIO | __GFP_NOMEMALLOC | __GFP_NORETRY);
  805. if (!op)
  806. goto nomem;
  807. fscache_operation_init(&op->op, fscache_write_op, NULL,
  808. fscache_release_write_op);
  809. op->op.flags = FSCACHE_OP_ASYNC |
  810. (1 << FSCACHE_OP_WAITING) |
  811. (1 << FSCACHE_OP_UNUSE_COOKIE);
  812. ret = radix_tree_maybe_preload(gfp & ~__GFP_HIGHMEM);
  813. if (ret < 0)
  814. goto nomem_free;
  815. ret = -ENOBUFS;
  816. spin_lock(&cookie->lock);
  817. if (!fscache_cookie_enabled(cookie) ||
  818. hlist_empty(&cookie->backing_objects))
  819. goto nobufs;
  820. object = hlist_entry(cookie->backing_objects.first,
  821. struct fscache_object, cookie_link);
  822. if (test_bit(FSCACHE_IOERROR, &object->cache->flags))
  823. goto nobufs;
  824. /* add the page to the pending-storage radix tree on the backing
  825. * object */
  826. spin_lock(&object->lock);
  827. spin_lock(&cookie->stores_lock);
  828. _debug("store limit %llx", (unsigned long long) object->store_limit);
  829. ret = radix_tree_insert(&cookie->stores, page->index, page);
  830. if (ret < 0) {
  831. if (ret == -EEXIST)
  832. goto already_queued;
  833. _debug("insert failed %d", ret);
  834. goto nobufs_unlock_obj;
  835. }
  836. radix_tree_tag_set(&cookie->stores, page->index,
  837. FSCACHE_COOKIE_PENDING_TAG);
  838. get_page(page);
  839. /* we only want one writer at a time, but we do need to queue new
  840. * writers after exclusive ops */
  841. if (test_and_set_bit(FSCACHE_OBJECT_PENDING_WRITE, &object->flags))
  842. goto already_pending;
  843. spin_unlock(&cookie->stores_lock);
  844. spin_unlock(&object->lock);
  845. op->op.debug_id = atomic_inc_return(&fscache_op_debug_id);
  846. op->store_limit = object->store_limit;
  847. __fscache_use_cookie(cookie);
  848. if (fscache_submit_op(object, &op->op) < 0)
  849. goto submit_failed;
  850. spin_unlock(&cookie->lock);
  851. radix_tree_preload_end();
  852. fscache_stat(&fscache_n_store_ops);
  853. fscache_stat(&fscache_n_stores_ok);
  854. /* the work queue now carries its own ref on the object */
  855. fscache_put_operation(&op->op);
  856. _leave(" = 0");
  857. return 0;
  858. already_queued:
  859. fscache_stat(&fscache_n_stores_again);
  860. already_pending:
  861. spin_unlock(&cookie->stores_lock);
  862. spin_unlock(&object->lock);
  863. spin_unlock(&cookie->lock);
  864. radix_tree_preload_end();
  865. fscache_put_operation(&op->op);
  866. fscache_stat(&fscache_n_stores_ok);
  867. _leave(" = 0");
  868. return 0;
  869. submit_failed:
  870. spin_lock(&cookie->stores_lock);
  871. radix_tree_delete(&cookie->stores, page->index);
  872. spin_unlock(&cookie->stores_lock);
  873. wake_cookie = __fscache_unuse_cookie(cookie);
  874. put_page(page);
  875. ret = -ENOBUFS;
  876. goto nobufs;
  877. nobufs_unlock_obj:
  878. spin_unlock(&cookie->stores_lock);
  879. spin_unlock(&object->lock);
  880. nobufs:
  881. spin_unlock(&cookie->lock);
  882. radix_tree_preload_end();
  883. fscache_put_operation(&op->op);
  884. if (wake_cookie)
  885. __fscache_wake_unused_cookie(cookie);
  886. fscache_stat(&fscache_n_stores_nobufs);
  887. _leave(" = -ENOBUFS");
  888. return -ENOBUFS;
  889. nomem_free:
  890. fscache_put_operation(&op->op);
  891. nomem:
  892. fscache_stat(&fscache_n_stores_oom);
  893. _leave(" = -ENOMEM");
  894. return -ENOMEM;
  895. }
  896. EXPORT_SYMBOL(__fscache_write_page);
  897. /*
  898. * remove a page from the cache
  899. */
  900. void __fscache_uncache_page(struct fscache_cookie *cookie, struct page *page)
  901. {
  902. struct fscache_object *object;
  903. _enter(",%p", page);
  904. ASSERTCMP(cookie->def->type, !=, FSCACHE_COOKIE_TYPE_INDEX);
  905. ASSERTCMP(page, !=, NULL);
  906. fscache_stat(&fscache_n_uncaches);
  907. /* cache withdrawal may beat us to it */
  908. if (!PageFsCache(page))
  909. goto done;
  910. /* get the object */
  911. spin_lock(&cookie->lock);
  912. if (hlist_empty(&cookie->backing_objects)) {
  913. ClearPageFsCache(page);
  914. goto done_unlock;
  915. }
  916. object = hlist_entry(cookie->backing_objects.first,
  917. struct fscache_object, cookie_link);
  918. /* there might now be stuff on disk we could read */
  919. clear_bit(FSCACHE_COOKIE_NO_DATA_YET, &cookie->flags);
  920. /* only invoke the cache backend if we managed to mark the page
  921. * uncached here; this deals with synchronisation vs withdrawal */
  922. if (TestClearPageFsCache(page) &&
  923. object->cache->ops->uncache_page) {
  924. /* the cache backend releases the cookie lock */
  925. fscache_stat(&fscache_n_cop_uncache_page);
  926. object->cache->ops->uncache_page(object, page);
  927. fscache_stat_d(&fscache_n_cop_uncache_page);
  928. goto done;
  929. }
  930. done_unlock:
  931. spin_unlock(&cookie->lock);
  932. done:
  933. _leave("");
  934. }
  935. EXPORT_SYMBOL(__fscache_uncache_page);
  936. /**
  937. * fscache_mark_page_cached - Mark a page as being cached
  938. * @op: The retrieval op pages are being marked for
  939. * @page: The page to be marked
  940. *
  941. * Mark a netfs page as being cached. After this is called, the netfs
  942. * must call fscache_uncache_page() to remove the mark.
  943. */
  944. void fscache_mark_page_cached(struct fscache_retrieval *op, struct page *page)
  945. {
  946. struct fscache_cookie *cookie = op->op.object->cookie;
  947. #ifdef CONFIG_FSCACHE_STATS
  948. atomic_inc(&fscache_n_marks);
  949. #endif
  950. _debug("- mark %p{%lx}", page, page->index);
  951. if (TestSetPageFsCache(page)) {
  952. static bool once_only;
  953. if (!once_only) {
  954. once_only = true;
  955. pr_warn("Cookie type %s marked page %lx multiple times\n",
  956. cookie->def->name, page->index);
  957. }
  958. }
  959. if (cookie->def->mark_page_cached)
  960. cookie->def->mark_page_cached(cookie->netfs_data,
  961. op->mapping, page);
  962. }
  963. EXPORT_SYMBOL(fscache_mark_page_cached);
  964. /**
  965. * fscache_mark_pages_cached - Mark pages as being cached
  966. * @op: The retrieval op pages are being marked for
  967. * @pagevec: The pages to be marked
  968. *
  969. * Mark a bunch of netfs pages as being cached. After this is called,
  970. * the netfs must call fscache_uncache_page() to remove the mark.
  971. */
  972. void fscache_mark_pages_cached(struct fscache_retrieval *op,
  973. struct pagevec *pagevec)
  974. {
  975. unsigned long loop;
  976. for (loop = 0; loop < pagevec->nr; loop++)
  977. fscache_mark_page_cached(op, pagevec->pages[loop]);
  978. pagevec_reinit(pagevec);
  979. }
  980. EXPORT_SYMBOL(fscache_mark_pages_cached);
  981. /*
  982. * Uncache all the pages in an inode that are marked PG_fscache, assuming them
  983. * to be associated with the given cookie.
  984. */
  985. void __fscache_uncache_all_inode_pages(struct fscache_cookie *cookie,
  986. struct inode *inode)
  987. {
  988. struct address_space *mapping = inode->i_mapping;
  989. struct pagevec pvec;
  990. pgoff_t next;
  991. int i;
  992. _enter("%p,%p", cookie, inode);
  993. if (!mapping || mapping->nrpages == 0) {
  994. _leave(" [no pages]");
  995. return;
  996. }
  997. pagevec_init(&pvec, 0);
  998. next = 0;
  999. do {
  1000. if (!pagevec_lookup(&pvec, mapping, next, PAGEVEC_SIZE))
  1001. break;
  1002. for (i = 0; i < pagevec_count(&pvec); i++) {
  1003. struct page *page = pvec.pages[i];
  1004. next = page->index;
  1005. if (PageFsCache(page)) {
  1006. __fscache_wait_on_page_write(cookie, page);
  1007. __fscache_uncache_page(cookie, page);
  1008. }
  1009. }
  1010. pagevec_release(&pvec);
  1011. cond_resched();
  1012. } while (++next);
  1013. _leave("");
  1014. }
  1015. EXPORT_SYMBOL(__fscache_uncache_all_inode_pages);