delayed-inode.c 52 KB

12345678910111213141516171819202122232425262728293031323334353637383940414243444546474849505152535455565758596061626364656667686970717273747576777879808182838485868788899091929394959697989910010110210310410510610710810911011111211311411511611711811912012112212312412512612712812913013113213313413513613713813914014114214314414514614714814915015115215315415515615715815916016116216316416516616716816917017117217317417517617717817918018118218318418518618718818919019119219319419519619719819920020120220320420520620720820921021121221321421521621721821922022122222322422522622722822923023123223323423523623723823924024124224324424524624724824925025125225325425525625725825926026126226326426526626726826927027127227327427527627727827928028128228328428528628728828929029129229329429529629729829930030130230330430530630730830931031131231331431531631731831932032132232332432532632732832933033133233333433533633733833934034134234334434534634734834935035135235335435535635735835936036136236336436536636736836937037137237337437537637737837938038138238338438538638738838939039139239339439539639739839940040140240340440540640740840941041141241341441541641741841942042142242342442542642742842943043143243343443543643743843944044144244344444544644744844945045145245345445545645745845946046146246346446546646746846947047147247347447547647747847948048148248348448548648748848949049149249349449549649749849950050150250350450550650750850951051151251351451551651751851952052152252352452552652752852953053153253353453553653753853954054154254354454554654754854955055155255355455555655755855956056156256356456556656756856957057157257357457557657757857958058158258358458558658758858959059159259359459559659759859960060160260360460560660760860961061161261361461561661761861962062162262362462562662762862963063163263363463563663763863964064164264364464564664764864965065165265365465565665765865966066166266366466566666766866967067167267367467567667767867968068168268368468568668768868969069169269369469569669769869970070170270
37047057067077087097107117127137147157167177187197207217227237247257267277287297307317327337347357367377387397407417427437447457467477487497507517527537547557567577587597607617627637647657667677687697707717727737747757767777787797807817827837847857867877887897907917927937947957967977987998008018028038048058068078088098108118128138148158168178188198208218228238248258268278288298308318328338348358368378388398408418428438448458468478488498508518528538548558568578588598608618628638648658668678688698708718728738748758768778788798808818828838848858868878888898908918928938948958968978988999009019029039049059069079089099109119129139149159169179189199209219229239249259269279289299309319329339349359369379389399409419429439449459469479489499509519529539549559569579589599609619629639649659669679689699709719729739749759769779789799809819829839849859869879889899909919929939949959969979989991000100110021003100410051006100710081009101010111012101310141015101610171018101910201021102210231024102510261027102810291030103110321033103410351036103710381039104010411042104310441045104610471048104910501051105210531054105510561057105810591060106110621063106410651066106710681069107010711072107310741075107610771078107910801081108210831084108510861087108810891090109110921093109410951096109710981099110011011102110311041105110611071108110911101111111211131114111511161117111811191120112111221123112411251126112711281129113011311132113311341135113611371138113911401141114211431144114511461147114811491150115111521153115411551156115711581159116011611162116311641165116611671168116911701171117211731174117511761177117811791180118111821183118411851186118711881189119011911192119311941195119611971198119912001201120212031204120512061207120812091210121112121213121412151216121712181219122012211222122312241225122612271228122912301231123212331234123512361237123812391240124112421243124412451246124712481249125012511252125312541255125612571258125912601261126212631264126512661267126812691270127112721273127412751276127
71278127912801281128212831284128512861287128812891290129112921293129412951296129712981299130013011302130313041305130613071308130913101311131213131314131513161317131813191320132113221323132413251326132713281329133013311332133313341335133613371338133913401341134213431344134513461347134813491350135113521353135413551356135713581359136013611362136313641365136613671368136913701371137213731374137513761377137813791380138113821383138413851386138713881389139013911392139313941395139613971398139914001401140214031404140514061407140814091410141114121413141414151416141714181419142014211422142314241425142614271428142914301431143214331434143514361437143814391440144114421443144414451446144714481449145014511452145314541455145614571458145914601461146214631464146514661467146814691470147114721473147414751476147714781479148014811482148314841485148614871488148914901491149214931494149514961497149814991500150115021503150415051506150715081509151015111512151315141515151615171518151915201521152215231524152515261527152815291530153115321533153415351536153715381539154015411542154315441545154615471548154915501551155215531554155515561557155815591560156115621563156415651566156715681569157015711572157315741575157615771578157915801581158215831584158515861587158815891590159115921593159415951596159715981599160016011602160316041605160616071608160916101611161216131614161516161617161816191620162116221623162416251626162716281629163016311632163316341635163616371638163916401641164216431644164516461647164816491650165116521653165416551656165716581659166016611662166316641665166616671668166916701671167216731674167516761677167816791680168116821683168416851686168716881689169016911692169316941695169616971698169917001701170217031704170517061707170817091710171117121713171417151716171717181719172017211722172317241725172617271728172917301731173217331734173517361737173817391740174117421743174417451746174717481749175017511752175317541755175617571758175917601761176217631764176517661767176817691770177117721773177417751776177
717781779178017811782178317841785178617871788178917901791179217931794179517961797179817991800180118021803180418051806180718081809181018111812181318141815181618171818181918201821182218231824182518261827182818291830183118321833183418351836183718381839184018411842184318441845184618471848184918501851185218531854185518561857185818591860186118621863186418651866186718681869187018711872187318741875187618771878187918801881188218831884188518861887188818891890189118921893189418951896189718981899190019011902190319041905190619071908190919101911191219131914191519161917191819191920192119221923192419251926192719281929193019311932193319341935193619371938193919401941194219431944194519461947194819491950195119521953195419551956195719581959196019611962196319641965196619671968196919701971197219731974197519761977197819791980198119821983198419851986198719881989199019911992199319941995199619971998199920002001200220032004
  1. /*
  2. * Copyright (C) 2011 Fujitsu. All rights reserved.
  3. * Written by Miao Xie <miaox@cn.fujitsu.com>
  4. *
  5. * This program is free software; you can redistribute it and/or
  6. * modify it under the terms of the GNU General Public
  7. * License v2 as published by the Free Software Foundation.
  8. *
  9. * This program is distributed in the hope that it will be useful,
  10. * but WITHOUT ANY WARRANTY; without even the implied warranty of
  11. * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
  12. * General Public License for more details.
  13. *
  14. * You should have received a copy of the GNU General Public
  15. * License along with this program; if not, write to the
  16. * Free Software Foundation, Inc., 59 Temple Place - Suite 330,
  17. * Boston, MA 02111-1307, USA.
  18. */
  19. #include <linux/slab.h>
  20. #include "delayed-inode.h"
  21. #include "disk-io.h"
  22. #include "transaction.h"
  23. #include "ctree.h"
  /*
   * Tunables for delayed-item throttling.  BTRFS_DELAYED_BACKGROUND and
   * BTRFS_DELAYED_BATCH are consulted by finish_one_item() when deciding
   * whether to wake waiters on the delayed root.
   */
  #define BTRFS_DELAYED_WRITEBACK 512
  #define BTRFS_DELAYED_BACKGROUND 128
  #define BTRFS_DELAYED_BATCH 16

  /* Slab cache from which every struct btrfs_delayed_node is allocated. */
  static struct kmem_cache *delayed_node_cache;
  28. int __init btrfs_delayed_inode_init(void)
  29. {
  30. delayed_node_cache = kmem_cache_create("btrfs_delayed_node",
  31. sizeof(struct btrfs_delayed_node),
  32. 0,
  33. SLAB_RECLAIM_ACCOUNT | SLAB_MEM_SPREAD,
  34. NULL);
  35. if (!delayed_node_cache)
  36. return -ENOMEM;
  37. return 0;
  38. }
  39. void btrfs_delayed_inode_exit(void)
  40. {
  41. if (delayed_node_cache)
  42. kmem_cache_destroy(delayed_node_cache);
  43. }
  44. static inline void btrfs_init_delayed_node(
  45. struct btrfs_delayed_node *delayed_node,
  46. struct btrfs_root *root, u64 inode_id)
  47. {
  48. delayed_node->root = root;
  49. delayed_node->inode_id = inode_id;
  50. atomic_set(&delayed_node->refs, 0);
  51. delayed_node->count = 0;
  52. delayed_node->flags = 0;
  53. delayed_node->ins_root = RB_ROOT;
  54. delayed_node->del_root = RB_ROOT;
  55. mutex_init(&delayed_node->mutex);
  56. delayed_node->index_cnt = 0;
  57. INIT_LIST_HEAD(&delayed_node->n_list);
  58. INIT_LIST_HEAD(&delayed_node->p_list);
  59. delayed_node->bytes_reserved = 0;
  60. memset(&delayed_node->inode_item, 0, sizeof(delayed_node->inode_item));
  61. }
  62. static inline int btrfs_is_continuous_delayed_item(
  63. struct btrfs_delayed_item *item1,
  64. struct btrfs_delayed_item *item2)
  65. {
  66. if (item1->key.type == BTRFS_DIR_INDEX_KEY &&
  67. item1->key.objectid == item2->key.objectid &&
  68. item1->key.type == item2->key.type &&
  69. item1->key.offset + 1 == item2->key.offset)
  70. return 1;
  71. return 0;
  72. }
  73. static inline struct btrfs_delayed_root *btrfs_get_delayed_root(
  74. struct btrfs_root *root)
  75. {
  76. return root->fs_info->delayed_root;
  77. }
  78. static struct btrfs_delayed_node *btrfs_get_delayed_node(struct inode *inode)
  79. {
  80. struct btrfs_inode *btrfs_inode = BTRFS_I(inode);
  81. struct btrfs_root *root = btrfs_inode->root;
  82. u64 ino = btrfs_ino(inode);
  83. struct btrfs_delayed_node *node;
  84. node = ACCESS_ONCE(btrfs_inode->delayed_node);
  85. if (node) {
  86. atomic_inc(&node->refs);
  87. return node;
  88. }
  89. spin_lock(&root->inode_lock);
  90. node = radix_tree_lookup(&root->delayed_nodes_tree, ino);
  91. if (node) {
  92. if (btrfs_inode->delayed_node) {
  93. atomic_inc(&node->refs); /* can be accessed */
  94. BUG_ON(btrfs_inode->delayed_node != node);
  95. spin_unlock(&root->inode_lock);
  96. return node;
  97. }
  98. btrfs_inode->delayed_node = node;
  99. /* can be accessed and cached in the inode */
  100. atomic_add(2, &node->refs);
  101. spin_unlock(&root->inode_lock);
  102. return node;
  103. }
  104. spin_unlock(&root->inode_lock);
  105. return NULL;
  106. }
  107. /* Will return either the node or PTR_ERR(-ENOMEM) */
  108. static struct btrfs_delayed_node *btrfs_get_or_create_delayed_node(
  109. struct inode *inode)
  110. {
  111. struct btrfs_delayed_node *node;
  112. struct btrfs_inode *btrfs_inode = BTRFS_I(inode);
  113. struct btrfs_root *root = btrfs_inode->root;
  114. u64 ino = btrfs_ino(inode);
  115. int ret;
  116. again:
  117. node = btrfs_get_delayed_node(inode);
  118. if (node)
  119. return node;
  120. node = kmem_cache_alloc(delayed_node_cache, GFP_NOFS);
  121. if (!node)
  122. return ERR_PTR(-ENOMEM);
  123. btrfs_init_delayed_node(node, root, ino);
  124. /* cached in the btrfs inode and can be accessed */
  125. atomic_add(2, &node->refs);
  126. ret = radix_tree_preload(GFP_NOFS & ~__GFP_HIGHMEM);
  127. if (ret) {
  128. kmem_cache_free(delayed_node_cache, node);
  129. return ERR_PTR(ret);
  130. }
  131. spin_lock(&root->inode_lock);
  132. ret = radix_tree_insert(&root->delayed_nodes_tree, ino, node);
  133. if (ret == -EEXIST) {
  134. spin_unlock(&root->inode_lock);
  135. kmem_cache_free(delayed_node_cache, node);
  136. radix_tree_preload_end();
  137. goto again;
  138. }
  139. btrfs_inode->delayed_node = node;
  140. spin_unlock(&root->inode_lock);
  141. radix_tree_preload_end();
  142. return node;
  143. }
  144. /*
  145. * Call it when holding delayed_node->mutex
  146. *
  147. * If mod = 1, add this node into the prepared list.
  148. */
  149. static void btrfs_queue_delayed_node(struct btrfs_delayed_root *root,
  150. struct btrfs_delayed_node *node,
  151. int mod)
  152. {
  153. spin_lock(&root->lock);
  154. if (test_bit(BTRFS_DELAYED_NODE_IN_LIST, &node->flags)) {
  155. if (!list_empty(&node->p_list))
  156. list_move_tail(&node->p_list, &root->prepare_list);
  157. else if (mod)
  158. list_add_tail(&node->p_list, &root->prepare_list);
  159. } else {
  160. list_add_tail(&node->n_list, &root->node_list);
  161. list_add_tail(&node->p_list, &root->prepare_list);
  162. atomic_inc(&node->refs); /* inserted into list */
  163. root->nodes++;
  164. set_bit(BTRFS_DELAYED_NODE_IN_LIST, &node->flags);
  165. }
  166. spin_unlock(&root->lock);
  167. }
  168. /* Call it when holding delayed_node->mutex */
  169. static void btrfs_dequeue_delayed_node(struct btrfs_delayed_root *root,
  170. struct btrfs_delayed_node *node)
  171. {
  172. spin_lock(&root->lock);
  173. if (test_bit(BTRFS_DELAYED_NODE_IN_LIST, &node->flags)) {
  174. root->nodes--;
  175. atomic_dec(&node->refs); /* not in the list */
  176. list_del_init(&node->n_list);
  177. if (!list_empty(&node->p_list))
  178. list_del_init(&node->p_list);
  179. clear_bit(BTRFS_DELAYED_NODE_IN_LIST, &node->flags);
  180. }
  181. spin_unlock(&root->lock);
  182. }
  183. static struct btrfs_delayed_node *btrfs_first_delayed_node(
  184. struct btrfs_delayed_root *delayed_root)
  185. {
  186. struct list_head *p;
  187. struct btrfs_delayed_node *node = NULL;
  188. spin_lock(&delayed_root->lock);
  189. if (list_empty(&delayed_root->node_list))
  190. goto out;
  191. p = delayed_root->node_list.next;
  192. node = list_entry(p, struct btrfs_delayed_node, n_list);
  193. atomic_inc(&node->refs);
  194. out:
  195. spin_unlock(&delayed_root->lock);
  196. return node;
  197. }
  198. static struct btrfs_delayed_node *btrfs_next_delayed_node(
  199. struct btrfs_delayed_node *node)
  200. {
  201. struct btrfs_delayed_root *delayed_root;
  202. struct list_head *p;
  203. struct btrfs_delayed_node *next = NULL;
  204. delayed_root = node->root->fs_info->delayed_root;
  205. spin_lock(&delayed_root->lock);
  206. if (!test_bit(BTRFS_DELAYED_NODE_IN_LIST, &node->flags)) {
  207. /* not in the list */
  208. if (list_empty(&delayed_root->node_list))
  209. goto out;
  210. p = delayed_root->node_list.next;
  211. } else if (list_is_last(&node->n_list, &delayed_root->node_list))
  212. goto out;
  213. else
  214. p = node->n_list.next;
  215. next = list_entry(p, struct btrfs_delayed_node, n_list);
  216. atomic_inc(&next->refs);
  217. out:
  218. spin_unlock(&delayed_root->lock);
  219. return next;
  220. }
  221. static void __btrfs_release_delayed_node(
  222. struct btrfs_delayed_node *delayed_node,
  223. int mod)
  224. {
  225. struct btrfs_delayed_root *delayed_root;
  226. if (!delayed_node)
  227. return;
  228. delayed_root = delayed_node->root->fs_info->delayed_root;
  229. mutex_lock(&delayed_node->mutex);
  230. if (delayed_node->count)
  231. btrfs_queue_delayed_node(delayed_root, delayed_node, mod);
  232. else
  233. btrfs_dequeue_delayed_node(delayed_root, delayed_node);
  234. mutex_unlock(&delayed_node->mutex);
  235. if (atomic_dec_and_test(&delayed_node->refs)) {
  236. bool free = false;
  237. struct btrfs_root *root = delayed_node->root;
  238. spin_lock(&root->inode_lock);
  239. if (atomic_read(&delayed_node->refs) == 0) {
  240. radix_tree_delete(&root->delayed_nodes_tree,
  241. delayed_node->inode_id);
  242. free = true;
  243. }
  244. spin_unlock(&root->inode_lock);
  245. if (free)
  246. kmem_cache_free(delayed_node_cache, delayed_node);
  247. }
  248. }
  /* Drop a reference on @node, releasing it with mod == 0. */
  static inline void btrfs_release_delayed_node(struct btrfs_delayed_node *node)
  {
      __btrfs_release_delayed_node(node, 0);
  }
  253. static struct btrfs_delayed_node *btrfs_first_prepared_delayed_node(
  254. struct btrfs_delayed_root *delayed_root)
  255. {
  256. struct list_head *p;
  257. struct btrfs_delayed_node *node = NULL;
  258. spin_lock(&delayed_root->lock);
  259. if (list_empty(&delayed_root->prepare_list))
  260. goto out;
  261. p = delayed_root->prepare_list.next;
  262. list_del_init(p);
  263. node = list_entry(p, struct btrfs_delayed_node, p_list);
  264. atomic_inc(&node->refs);
  265. out:
  266. spin_unlock(&delayed_root->lock);
  267. return node;
  268. }
  /* Drop a reference on @node, releasing it with mod == 1. */
  static inline void btrfs_release_prepared_delayed_node(
                  struct btrfs_delayed_node *node)
  {
      __btrfs_release_delayed_node(node, 1);
  }
  274. static struct btrfs_delayed_item *btrfs_alloc_delayed_item(u32 data_len)
  275. {
  276. struct btrfs_delayed_item *item;
  277. item = kmalloc(sizeof(*item) + data_len, GFP_NOFS);
  278. if (item) {
  279. item->data_len = data_len;
  280. item->ins_or_del = 0;
  281. item->bytes_reserved = 0;
  282. item->delayed_node = NULL;
  283. atomic_set(&item->refs, 1);
  284. }
  285. return item;
  286. }
  287. /*
  288. * __btrfs_lookup_delayed_item - look up the delayed item by key
  289. * @delayed_node: pointer to the delayed node
  290. * @key: the key to look up
  291. * @prev: used to store the prev item if the right item isn't found
  292. * @next: used to store the next item if the right item isn't found
  293. *
  294. * Note: if we don't find the right item, we will return the prev item and
  295. * the next item.
  296. */
  297. static struct btrfs_delayed_item *__btrfs_lookup_delayed_item(
  298. struct rb_root *root,
  299. struct btrfs_key *key,
  300. struct btrfs_delayed_item **prev,
  301. struct btrfs_delayed_item **next)
  302. {
  303. struct rb_node *node, *prev_node = NULL;
  304. struct btrfs_delayed_item *delayed_item = NULL;
  305. int ret = 0;
  306. node = root->rb_node;
  307. while (node) {
  308. delayed_item = rb_entry(node, struct btrfs_delayed_item,
  309. rb_node);
  310. prev_node = node;
  311. ret = btrfs_comp_cpu_keys(&delayed_item->key, key);
  312. if (ret < 0)
  313. node = node->rb_right;
  314. else if (ret > 0)
  315. node = node->rb_left;
  316. else
  317. return delayed_item;
  318. }
  319. if (prev) {
  320. if (!prev_node)
  321. *prev = NULL;
  322. else if (ret < 0)
  323. *prev = delayed_item;
  324. else if ((node = rb_prev(prev_node)) != NULL) {
  325. *prev = rb_entry(node, struct btrfs_delayed_item,
  326. rb_node);
  327. } else
  328. *prev = NULL;
  329. }
  330. if (next) {
  331. if (!prev_node)
  332. *next = NULL;
  333. else if (ret > 0)
  334. *next = delayed_item;
  335. else if ((node = rb_next(prev_node)) != NULL) {
  336. *next = rb_entry(node, struct btrfs_delayed_item,
  337. rb_node);
  338. } else
  339. *next = NULL;
  340. }
  341. return NULL;
  342. }
  343. static struct btrfs_delayed_item *__btrfs_lookup_delayed_insertion_item(
  344. struct btrfs_delayed_node *delayed_node,
  345. struct btrfs_key *key)
  346. {
  347. struct btrfs_delayed_item *item;
  348. item = __btrfs_lookup_delayed_item(&delayed_node->ins_root, key,
  349. NULL, NULL);
  350. return item;
  351. }
  352. static int __btrfs_add_delayed_item(struct btrfs_delayed_node *delayed_node,
  353. struct btrfs_delayed_item *ins,
  354. int action)
  355. {
  356. struct rb_node **p, *node;
  357. struct rb_node *parent_node = NULL;
  358. struct rb_root *root;
  359. struct btrfs_delayed_item *item;
  360. int cmp;
  361. if (action == BTRFS_DELAYED_INSERTION_ITEM)
  362. root = &delayed_node->ins_root;
  363. else if (action == BTRFS_DELAYED_DELETION_ITEM)
  364. root = &delayed_node->del_root;
  365. else
  366. BUG();
  367. p = &root->rb_node;
  368. node = &ins->rb_node;
  369. while (*p) {
  370. parent_node = *p;
  371. item = rb_entry(parent_node, struct btrfs_delayed_item,
  372. rb_node);
  373. cmp = btrfs_comp_cpu_keys(&item->key, &ins->key);
  374. if (cmp < 0)
  375. p = &(*p)->rb_right;
  376. else if (cmp > 0)
  377. p = &(*p)->rb_left;
  378. else
  379. return -EEXIST;
  380. }
  381. rb_link_node(node, parent_node, p);
  382. rb_insert_color(node, root);
  383. ins->delayed_node = delayed_node;
  384. ins->ins_or_del = action;
  385. if (ins->key.type == BTRFS_DIR_INDEX_KEY &&
  386. action == BTRFS_DELAYED_INSERTION_ITEM &&
  387. ins->key.offset >= delayed_node->index_cnt)
  388. delayed_node->index_cnt = ins->key.offset + 1;
  389. delayed_node->count++;
  390. atomic_inc(&delayed_node->root->fs_info->delayed_root->items);
  391. return 0;
  392. }
  393. static int __btrfs_add_delayed_insertion_item(struct btrfs_delayed_node *node,
  394. struct btrfs_delayed_item *item)
  395. {
  396. return __btrfs_add_delayed_item(node, item,
  397. BTRFS_DELAYED_INSERTION_ITEM);
  398. }
  399. static int __btrfs_add_delayed_deletion_item(struct btrfs_delayed_node *node,
  400. struct btrfs_delayed_item *item)
  401. {
  402. return __btrfs_add_delayed_item(node, item,
  403. BTRFS_DELAYED_DELETION_ITEM);
  404. }
  405. static void finish_one_item(struct btrfs_delayed_root *delayed_root)
  406. {
  407. int seq = atomic_inc_return(&delayed_root->items_seq);
  408. /*
  409. * atomic_dec_return implies a barrier for waitqueue_active
  410. */
  411. if ((atomic_dec_return(&delayed_root->items) <
  412. BTRFS_DELAYED_BACKGROUND || seq % BTRFS_DELAYED_BATCH == 0) &&
  413. waitqueue_active(&delayed_root->wait))
  414. wake_up(&delayed_root->wait);
  415. }
  416. static void __btrfs_remove_delayed_item(struct btrfs_delayed_item *delayed_item)
  417. {
  418. struct rb_root *root;
  419. struct btrfs_delayed_root *delayed_root;
  420. delayed_root = delayed_item->delayed_node->root->fs_info->delayed_root;
  421. BUG_ON(!delayed_root);
  422. BUG_ON(delayed_item->ins_or_del != BTRFS_DELAYED_DELETION_ITEM &&
  423. delayed_item->ins_or_del != BTRFS_DELAYED_INSERTION_ITEM);
  424. if (delayed_item->ins_or_del == BTRFS_DELAYED_INSERTION_ITEM)
  425. root = &delayed_item->delayed_node->ins_root;
  426. else
  427. root = &delayed_item->delayed_node->del_root;
  428. rb_erase(&delayed_item->rb_node, root);
  429. delayed_item->delayed_node->count--;
  430. finish_one_item(delayed_root);
  431. }
  432. static void btrfs_release_delayed_item(struct btrfs_delayed_item *item)
  433. {
  434. if (item) {
  435. __btrfs_remove_delayed_item(item);
  436. if (atomic_dec_and_test(&item->refs))
  437. kfree(item);
  438. }
  439. }
  440. static struct btrfs_delayed_item *__btrfs_first_delayed_insertion_item(
  441. struct btrfs_delayed_node *delayed_node)
  442. {
  443. struct rb_node *p;
  444. struct btrfs_delayed_item *item = NULL;
  445. p = rb_first(&delayed_node->ins_root);
  446. if (p)
  447. item = rb_entry(p, struct btrfs_delayed_item, rb_node);
  448. return item;
  449. }
  450. static struct btrfs_delayed_item *__btrfs_first_delayed_deletion_item(
  451. struct btrfs_delayed_node *delayed_node)
  452. {
  453. struct rb_node *p;
  454. struct btrfs_delayed_item *item = NULL;
  455. p = rb_first(&delayed_node->del_root);
  456. if (p)
  457. item = rb_entry(p, struct btrfs_delayed_item, rb_node);
  458. return item;
  459. }
  460. static struct btrfs_delayed_item *__btrfs_next_delayed_item(
  461. struct btrfs_delayed_item *item)
  462. {
  463. struct rb_node *p;
  464. struct btrfs_delayed_item *next = NULL;
  465. p = rb_next(&item->rb_node);
  466. if (p)
  467. next = rb_entry(p, struct btrfs_delayed_item, rb_node);
  468. return next;
  469. }
  470. static int btrfs_delayed_item_reserve_metadata(struct btrfs_trans_handle *trans,
  471. struct btrfs_root *root,
  472. struct btrfs_delayed_item *item)
  473. {
  474. struct btrfs_block_rsv *src_rsv;
  475. struct btrfs_block_rsv *dst_rsv;
  476. u64 num_bytes;
  477. int ret;
  478. if (!trans->bytes_reserved)
  479. return 0;
  480. src_rsv = trans->block_rsv;
  481. dst_rsv = &root->fs_info->delayed_block_rsv;
  482. num_bytes = btrfs_calc_trans_metadata_size(root, 1);
  483. ret = btrfs_block_rsv_migrate(src_rsv, dst_rsv, num_bytes);
  484. if (!ret) {
  485. trace_btrfs_space_reservation(root->fs_info, "delayed_item",
  486. item->key.objectid,
  487. num_bytes, 1);
  488. item->bytes_reserved = num_bytes;
  489. }
  490. return ret;
  491. }
  492. static void btrfs_delayed_item_release_metadata(struct btrfs_root *root,
  493. struct btrfs_delayed_item *item)
  494. {
  495. struct btrfs_block_rsv *rsv;
  496. if (!item->bytes_reserved)
  497. return;
  498. rsv = &root->fs_info->delayed_block_rsv;
  499. trace_btrfs_space_reservation(root->fs_info, "delayed_item",
  500. item->key.objectid, item->bytes_reserved,
  501. 0);
  502. btrfs_block_rsv_release(root, rsv,
  503. item->bytes_reserved);
  504. }
  505. static int btrfs_delayed_inode_reserve_metadata(
  506. struct btrfs_trans_handle *trans,
  507. struct btrfs_root *root,
  508. struct inode *inode,
  509. struct btrfs_delayed_node *node)
  510. {
  511. struct btrfs_block_rsv *src_rsv;
  512. struct btrfs_block_rsv *dst_rsv;
  513. u64 num_bytes;
  514. int ret;
  515. bool release = false;
  516. src_rsv = trans->block_rsv;
  517. dst_rsv = &root->fs_info->delayed_block_rsv;
  518. num_bytes = btrfs_calc_trans_metadata_size(root, 1);
  519. /*
  520. * btrfs_dirty_inode will update the inode under btrfs_join_transaction
  521. * which doesn't reserve space for speed. This is a problem since we
  522. * still need to reserve space for this update, so try to reserve the
  523. * space.
  524. *
  525. * Now if src_rsv == delalloc_block_rsv we'll let it just steal since
  526. * we're accounted for.
  527. */
  528. if (!src_rsv || (!trans->bytes_reserved &&
  529. src_rsv->type != BTRFS_BLOCK_RSV_DELALLOC)) {
  530. ret = btrfs_block_rsv_add(root, dst_rsv, num_bytes,
  531. BTRFS_RESERVE_NO_FLUSH);
  532. /*
  533. * Since we're under a transaction reserve_metadata_bytes could
  534. * try to commit the transaction which will make it return
  535. * EAGAIN to make us stop the transaction we have, so return
  536. * ENOSPC instead so that btrfs_dirty_inode knows what to do.
  537. */
  538. if (ret == -EAGAIN)
  539. ret = -ENOSPC;
  540. if (!ret) {
  541. node->bytes_reserved = num_bytes;
  542. trace_btrfs_space_reservation(root->fs_info,
  543. "delayed_inode",
  544. btrfs_ino(inode),
  545. num_bytes, 1);
  546. }
  547. return ret;
  548. } else if (src_rsv->type == BTRFS_BLOCK_RSV_DELALLOC) {
  549. spin_lock(&BTRFS_I(inode)->lock);
  550. if (test_and_clear_bit(BTRFS_INODE_DELALLOC_META_RESERVED,
  551. &BTRFS_I(inode)->runtime_flags)) {
  552. spin_unlock(&BTRFS_I(inode)->lock);
  553. release = true;
  554. goto migrate;
  555. }
  556. spin_unlock(&BTRFS_I(inode)->lock);
  557. /* Ok we didn't have space pre-reserved. This shouldn't happen
  558. * too often but it can happen if we do delalloc to an existing
  559. * inode which gets dirtied because of the time update, and then
  560. * isn't touched again until after the transaction commits and
  561. * then we try to write out the data. First try to be nice and
  562. * reserve something strictly for us. If not be a pain and try
  563. * to steal from the delalloc block rsv.
  564. */
  565. ret = btrfs_block_rsv_add(root, dst_rsv, num_bytes,
  566. BTRFS_RESERVE_NO_FLUSH);
  567. if (!ret)
  568. goto out;
  569. ret = btrfs_block_rsv_migrate(src_rsv, dst_rsv, num_bytes);
  570. if (!WARN_ON(ret))
  571. goto out;
  572. /*
  573. * Ok this is a problem, let's just steal from the global rsv
  574. * since this really shouldn't happen that often.
  575. */
  576. ret = btrfs_block_rsv_migrate(&root->fs_info->global_block_rsv,
  577. dst_rsv, num_bytes);
  578. goto out;
  579. }
  580. migrate:
  581. ret = btrfs_block_rsv_migrate(src_rsv, dst_rsv, num_bytes);
  582. out:
  583. /*
  584. * Migrate only takes a reservation, it doesn't touch the size of the
  585. * block_rsv. This is to simplify people who don't normally have things
  586. * migrated from their block rsv. If they go to release their
  587. * reservation, that will decrease the size as well, so if migrate
  588. * reduced size we'd end up with a negative size. But for the
  589. * delalloc_meta_reserved stuff we will only know to drop 1 reservation,
  590. * but we could in fact do this reserve/migrate dance several times
  591. * between the time we did the original reservation and we'd clean it
  592. * up. So to take care of this, release the space for the meta
  593. * reservation here. I think it may be time for a documentation page on
  594. * how block rsvs. work.
  595. */
  596. if (!ret) {
  597. trace_btrfs_space_reservation(root->fs_info, "delayed_inode",
  598. btrfs_ino(inode), num_bytes, 1);
  599. node->bytes_reserved = num_bytes;
  600. }
  601. if (release) {
  602. trace_btrfs_space_reservation(root->fs_info, "delalloc",
  603. btrfs_ino(inode), num_bytes, 0);
  604. btrfs_block_rsv_release(root, src_rsv, num_bytes);
  605. }
  606. return ret;
  607. }
  608. static void btrfs_delayed_inode_release_metadata(struct btrfs_root *root,
  609. struct btrfs_delayed_node *node)
  610. {
  611. struct btrfs_block_rsv *rsv;
  612. if (!node->bytes_reserved)
  613. return;
  614. rsv = &root->fs_info->delayed_block_rsv;
  615. trace_btrfs_space_reservation(root->fs_info, "delayed_inode",
  616. node->inode_id, node->bytes_reserved, 0);
  617. btrfs_block_rsv_release(root, rsv,
  618. node->bytes_reserved);
  619. node->bytes_reserved = 0;
  620. }
  621. /*
  622. * This helper will insert some continuous items into the same leaf according
  623. * to the free space of the leaf.
  624. */
  625. static int btrfs_batch_insert_items(struct btrfs_root *root,
  626. struct btrfs_path *path,
  627. struct btrfs_delayed_item *item)
  628. {
  629. struct btrfs_delayed_item *curr, *next;
  630. int free_space;
  631. int total_data_size = 0, total_size = 0;
  632. struct extent_buffer *leaf;
  633. char *data_ptr;
  634. struct btrfs_key *keys;
  635. u32 *data_size;
  636. struct list_head head;
  637. int slot;
  638. int nitems;
  639. int i;
  640. int ret = 0;
  641. BUG_ON(!path->nodes[0]);
  642. leaf = path->nodes[0];
  643. free_space = btrfs_leaf_free_space(root, leaf);
  644. INIT_LIST_HEAD(&head);
  645. next = item;
  646. nitems = 0;
  647. /*
  648. * count the number of the continuous items that we can insert in batch
  649. */
  650. while (total_size + next->data_len + sizeof(struct btrfs_item) <=
  651. free_space) {
  652. total_data_size += next->data_len;
  653. total_size += next->data_len + sizeof(struct btrfs_item);
  654. list_add_tail(&next->tree_list, &head);
  655. nitems++;
  656. curr = next;
  657. next = __btrfs_next_delayed_item(curr);
  658. if (!next)
  659. break;
  660. if (!btrfs_is_continuous_delayed_item(curr, next))
  661. break;
  662. }
  663. if (!nitems) {
  664. ret = 0;
  665. goto out;
  666. }
  667. /*
  668. * we need allocate some memory space, but it might cause the task
  669. * to sleep, so we set all locked nodes in the path to blocking locks
  670. * first.
  671. */
  672. btrfs_set_path_blocking(path);
  673. keys = kmalloc_array(nitems, sizeof(struct btrfs_key), GFP_NOFS);
  674. if (!keys) {
  675. ret = -ENOMEM;
  676. goto out;
  677. }
  678. data_size = kmalloc_array(nitems, sizeof(u32), GFP_NOFS);
  679. if (!data_size) {
  680. ret = -ENOMEM;
  681. goto error;
  682. }
  683. /* get keys of all the delayed items */
  684. i = 0;
  685. list_for_each_entry(next, &head, tree_list) {
  686. keys[i] = next->key;
  687. data_size[i] = next->data_len;
  688. i++;
  689. }
  690. /* reset all the locked nodes in the patch to spinning locks. */
  691. btrfs_clear_path_blocking(path, NULL, 0);
  692. /* insert the keys of the items */
  693. setup_items_for_insert(root, path, keys, data_size,
  694. total_data_size, total_size, nitems);
  695. /* insert the dir index items */
  696. slot = path->slots[0];
  697. list_for_each_entry_safe(curr, next, &head, tree_list) {
  698. data_ptr = btrfs_item_ptr(leaf, slot, char);
  699. write_extent_buffer(leaf, &curr->data,
  700. (unsigned long)data_ptr,
  701. curr->data_len);
  702. slot++;
  703. btrfs_delayed_item_release_metadata(root, curr);
  704. list_del(&curr->tree_list);
  705. btrfs_release_delayed_item(curr);
  706. }
  707. error:
  708. kfree(data_size);
  709. kfree(keys);
  710. out:
  711. return ret;
  712. }
  713. /*
  714. * This helper can just do simple insertion that needn't extend item for new
  715. * data, such as directory name index insertion, inode insertion.
  716. */
  717. static int btrfs_insert_delayed_item(struct btrfs_trans_handle *trans,
  718. struct btrfs_root *root,
  719. struct btrfs_path *path,
  720. struct btrfs_delayed_item *delayed_item)
  721. {
  722. struct extent_buffer *leaf;
  723. char *ptr;
  724. int ret;
  725. ret = btrfs_insert_empty_item(trans, root, path, &delayed_item->key,
  726. delayed_item->data_len);
  727. if (ret < 0 && ret != -EEXIST)
  728. return ret;
  729. leaf = path->nodes[0];
  730. ptr = btrfs_item_ptr(leaf, path->slots[0], char);
  731. write_extent_buffer(leaf, delayed_item->data, (unsigned long)ptr,
  732. delayed_item->data_len);
  733. btrfs_mark_buffer_dirty(leaf);
  734. btrfs_delayed_item_release_metadata(root, delayed_item);
  735. return 0;
  736. }
  737. /*
  738. * we insert an item first, then if there are some continuous items, we try
  739. * to insert those items into the same leaf.
  740. */
  741. static int btrfs_insert_delayed_items(struct btrfs_trans_handle *trans,
  742. struct btrfs_path *path,
  743. struct btrfs_root *root,
  744. struct btrfs_delayed_node *node)
  745. {
  746. struct btrfs_delayed_item *curr, *prev;
  747. int ret = 0;
  748. do_again:
  749. mutex_lock(&node->mutex);
  750. curr = __btrfs_first_delayed_insertion_item(node);
  751. if (!curr)
  752. goto insert_end;
  753. ret = btrfs_insert_delayed_item(trans, root, path, curr);
  754. if (ret < 0) {
  755. btrfs_release_path(path);
  756. goto insert_end;
  757. }
  758. prev = curr;
  759. curr = __btrfs_next_delayed_item(prev);
  760. if (curr && btrfs_is_continuous_delayed_item(prev, curr)) {
  761. /* insert the continuous items into the same leaf */
  762. path->slots[0]++;
  763. btrfs_batch_insert_items(root, path, curr);
  764. }
  765. btrfs_release_delayed_item(prev);
  766. btrfs_mark_buffer_dirty(path->nodes[0]);
  767. btrfs_release_path(path);
  768. mutex_unlock(&node->mutex);
  769. goto do_again;
  770. insert_end:
  771. mutex_unlock(&node->mutex);
  772. return ret;
  773. }
  774. static int btrfs_batch_delete_items(struct btrfs_trans_handle *trans,
  775. struct btrfs_root *root,
  776. struct btrfs_path *path,
  777. struct btrfs_delayed_item *item)
  778. {
  779. struct btrfs_delayed_item *curr, *next;
  780. struct extent_buffer *leaf;
  781. struct btrfs_key key;
  782. struct list_head head;
  783. int nitems, i, last_item;
  784. int ret = 0;
  785. BUG_ON(!path->nodes[0]);
  786. leaf = path->nodes[0];
  787. i = path->slots[0];
  788. last_item = btrfs_header_nritems(leaf) - 1;
  789. if (i > last_item)
  790. return -ENOENT; /* FIXME: Is errno suitable? */
  791. next = item;
  792. INIT_LIST_HEAD(&head);
  793. btrfs_item_key_to_cpu(leaf, &key, i);
  794. nitems = 0;
  795. /*
  796. * count the number of the dir index items that we can delete in batch
  797. */
  798. while (btrfs_comp_cpu_keys(&next->key, &key) == 0) {
  799. list_add_tail(&next->tree_list, &head);
  800. nitems++;
  801. curr = next;
  802. next = __btrfs_next_delayed_item(curr);
  803. if (!next)
  804. break;
  805. if (!btrfs_is_continuous_delayed_item(curr, next))
  806. break;
  807. i++;
  808. if (i > last_item)
  809. break;
  810. btrfs_item_key_to_cpu(leaf, &key, i);
  811. }
  812. if (!nitems)
  813. return 0;
  814. ret = btrfs_del_items(trans, root, path, path->slots[0], nitems);
  815. if (ret)
  816. goto out;
  817. list_for_each_entry_safe(curr, next, &head, tree_list) {
  818. btrfs_delayed_item_release_metadata(root, curr);
  819. list_del(&curr->tree_list);
  820. btrfs_release_delayed_item(curr);
  821. }
  822. out:
  823. return ret;
  824. }
  825. static int btrfs_delete_delayed_items(struct btrfs_trans_handle *trans,
  826. struct btrfs_path *path,
  827. struct btrfs_root *root,
  828. struct btrfs_delayed_node *node)
  829. {
  830. struct btrfs_delayed_item *curr, *prev;
  831. int ret = 0;
  832. do_again:
  833. mutex_lock(&node->mutex);
  834. curr = __btrfs_first_delayed_deletion_item(node);
  835. if (!curr)
  836. goto delete_fail;
  837. ret = btrfs_search_slot(trans, root, &curr->key, path, -1, 1);
  838. if (ret < 0)
  839. goto delete_fail;
  840. else if (ret > 0) {
  841. /*
  842. * can't find the item which the node points to, so this node
  843. * is invalid, just drop it.
  844. */
  845. prev = curr;
  846. curr = __btrfs_next_delayed_item(prev);
  847. btrfs_release_delayed_item(prev);
  848. ret = 0;
  849. btrfs_release_path(path);
  850. if (curr) {
  851. mutex_unlock(&node->mutex);
  852. goto do_again;
  853. } else
  854. goto delete_fail;
  855. }
  856. btrfs_batch_delete_items(trans, root, path, curr);
  857. btrfs_release_path(path);
  858. mutex_unlock(&node->mutex);
  859. goto do_again;
  860. delete_fail:
  861. btrfs_release_path(path);
  862. mutex_unlock(&node->mutex);
  863. return ret;
  864. }
  865. static void btrfs_release_delayed_inode(struct btrfs_delayed_node *delayed_node)
  866. {
  867. struct btrfs_delayed_root *delayed_root;
  868. if (delayed_node &&
  869. test_bit(BTRFS_DELAYED_NODE_INODE_DIRTY, &delayed_node->flags)) {
  870. BUG_ON(!delayed_node->root);
  871. clear_bit(BTRFS_DELAYED_NODE_INODE_DIRTY, &delayed_node->flags);
  872. delayed_node->count--;
  873. delayed_root = delayed_node->root->fs_info->delayed_root;
  874. finish_one_item(delayed_root);
  875. }
  876. }
  877. static void btrfs_release_delayed_iref(struct btrfs_delayed_node *delayed_node)
  878. {
  879. struct btrfs_delayed_root *delayed_root;
  880. ASSERT(delayed_node->root);
  881. clear_bit(BTRFS_DELAYED_NODE_DEL_IREF, &delayed_node->flags);
  882. delayed_node->count--;
  883. delayed_root = delayed_node->root->fs_info->delayed_root;
  884. finish_one_item(delayed_root);
  885. }
  886. static int __btrfs_update_delayed_inode(struct btrfs_trans_handle *trans,
  887. struct btrfs_root *root,
  888. struct btrfs_path *path,
  889. struct btrfs_delayed_node *node)
  890. {
  891. struct btrfs_key key;
  892. struct btrfs_inode_item *inode_item;
  893. struct extent_buffer *leaf;
  894. int mod;
  895. int ret;
  896. key.objectid = node->inode_id;
  897. key.type = BTRFS_INODE_ITEM_KEY;
  898. key.offset = 0;
  899. if (test_bit(BTRFS_DELAYED_NODE_DEL_IREF, &node->flags))
  900. mod = -1;
  901. else
  902. mod = 1;
  903. ret = btrfs_lookup_inode(trans, root, path, &key, mod);
  904. if (ret > 0) {
  905. btrfs_release_path(path);
  906. return -ENOENT;
  907. } else if (ret < 0) {
  908. return ret;
  909. }
  910. leaf = path->nodes[0];
  911. inode_item = btrfs_item_ptr(leaf, path->slots[0],
  912. struct btrfs_inode_item);
  913. write_extent_buffer(leaf, &node->inode_item, (unsigned long)inode_item,
  914. sizeof(struct btrfs_inode_item));
  915. btrfs_mark_buffer_dirty(leaf);
  916. if (!test_bit(BTRFS_DELAYED_NODE_DEL_IREF, &node->flags))
  917. goto no_iref;
  918. path->slots[0]++;
  919. if (path->slots[0] >= btrfs_header_nritems(leaf))
  920. goto search;
  921. again:
  922. btrfs_item_key_to_cpu(leaf, &key, path->slots[0]);
  923. if (key.objectid != node->inode_id)
  924. goto out;
  925. if (key.type != BTRFS_INODE_REF_KEY &&
  926. key.type != BTRFS_INODE_EXTREF_KEY)
  927. goto out;
  928. /*
  929. * Delayed iref deletion is for the inode who has only one link,
  930. * so there is only one iref. The case that several irefs are
  931. * in the same item doesn't exist.
  932. */
  933. btrfs_del_item(trans, root, path);
  934. out:
  935. btrfs_release_delayed_iref(node);
  936. no_iref:
  937. btrfs_release_path(path);
  938. err_out:
  939. btrfs_delayed_inode_release_metadata(root, node);
  940. btrfs_release_delayed_inode(node);
  941. return ret;
  942. search:
  943. btrfs_release_path(path);
  944. key.type = BTRFS_INODE_EXTREF_KEY;
  945. key.offset = -1;
  946. ret = btrfs_search_slot(trans, root, &key, path, -1, 1);
  947. if (ret < 0)
  948. goto err_out;
  949. ASSERT(ret);
  950. ret = 0;
  951. leaf = path->nodes[0];
  952. path->slots[0]--;
  953. goto again;
  954. }
  955. static inline int btrfs_update_delayed_inode(struct btrfs_trans_handle *trans,
  956. struct btrfs_root *root,
  957. struct btrfs_path *path,
  958. struct btrfs_delayed_node *node)
  959. {
  960. int ret;
  961. mutex_lock(&node->mutex);
  962. if (!test_bit(BTRFS_DELAYED_NODE_INODE_DIRTY, &node->flags)) {
  963. mutex_unlock(&node->mutex);
  964. return 0;
  965. }
  966. ret = __btrfs_update_delayed_inode(trans, root, path, node);
  967. mutex_unlock(&node->mutex);
  968. return ret;
  969. }
  970. static inline int
  971. __btrfs_commit_inode_delayed_items(struct btrfs_trans_handle *trans,
  972. struct btrfs_path *path,
  973. struct btrfs_delayed_node *node)
  974. {
  975. int ret;
  976. ret = btrfs_insert_delayed_items(trans, path, node->root, node);
  977. if (ret)
  978. return ret;
  979. ret = btrfs_delete_delayed_items(trans, path, node->root, node);
  980. if (ret)
  981. return ret;
  982. ret = btrfs_update_delayed_inode(trans, node->root, path, node);
  983. return ret;
  984. }
  985. /*
  986. * Called when committing the transaction.
  987. * Returns 0 on success.
  988. * Returns < 0 on error and returns with an aborted transaction with any
  989. * outstanding delayed items cleaned up.
  990. */
  991. static int __btrfs_run_delayed_items(struct btrfs_trans_handle *trans,
  992. struct btrfs_root *root, int nr)
  993. {
  994. struct btrfs_delayed_root *delayed_root;
  995. struct btrfs_delayed_node *curr_node, *prev_node;
  996. struct btrfs_path *path;
  997. struct btrfs_block_rsv *block_rsv;
  998. int ret = 0;
  999. bool count = (nr > 0);
  1000. if (trans->aborted)
  1001. return -EIO;
  1002. path = btrfs_alloc_path();
  1003. if (!path)
  1004. return -ENOMEM;
  1005. path->leave_spinning = 1;
  1006. block_rsv = trans->block_rsv;
  1007. trans->block_rsv = &root->fs_info->delayed_block_rsv;
  1008. delayed_root = btrfs_get_delayed_root(root);
  1009. curr_node = btrfs_first_delayed_node(delayed_root);
  1010. while (curr_node && (!count || (count && nr--))) {
  1011. ret = __btrfs_commit_inode_delayed_items(trans, path,
  1012. curr_node);
  1013. if (ret) {
  1014. btrfs_release_delayed_node(curr_node);
  1015. curr_node = NULL;
  1016. btrfs_abort_transaction(trans, root, ret);
  1017. break;
  1018. }
  1019. prev_node = curr_node;
  1020. curr_node = btrfs_next_delayed_node(curr_node);
  1021. btrfs_release_delayed_node(prev_node);
  1022. }
  1023. if (curr_node)
  1024. btrfs_release_delayed_node(curr_node);
  1025. btrfs_free_path(path);
  1026. trans->block_rsv = block_rsv;
  1027. return ret;
  1028. }
  /*
   * Run the delayed items of every queued delayed node.  The count of -1 is
   * not positive, so __btrfs_run_delayed_items() applies no limit.
   */
  int btrfs_run_delayed_items(struct btrfs_trans_handle *trans,
  			    struct btrfs_root *root)
  {
  	const int no_limit = -1;

  	return __btrfs_run_delayed_items(trans, root, no_limit);
  }
  /*
   * Run the delayed items of queued delayed nodes, passing @nr straight through
   * to __btrfs_run_delayed_items() as the node limit.
   */
  int btrfs_run_delayed_items_nr(struct btrfs_trans_handle *trans,
  			       struct btrfs_root *root, int nr)
  {
  	int ret;

  	ret = __btrfs_run_delayed_items(trans, root, nr);
  	return ret;
  }
  1039. int btrfs_commit_inode_delayed_items(struct btrfs_trans_handle *trans,
  1040. struct inode *inode)
  1041. {
  1042. struct btrfs_delayed_node *delayed_node = btrfs_get_delayed_node(inode);
  1043. struct btrfs_path *path;
  1044. struct btrfs_block_rsv *block_rsv;
  1045. int ret;
  1046. if (!delayed_node)
  1047. return 0;
  1048. mutex_lock(&delayed_node->mutex);
  1049. if (!delayed_node->count) {
  1050. mutex_unlock(&delayed_node->mutex);
  1051. btrfs_release_delayed_node(delayed_node);
  1052. return 0;
  1053. }
  1054. mutex_unlock(&delayed_node->mutex);
  1055. path = btrfs_alloc_path();
  1056. if (!path) {
  1057. btrfs_release_delayed_node(delayed_node);
  1058. return -ENOMEM;
  1059. }
  1060. path->leave_spinning = 1;
  1061. block_rsv = trans->block_rsv;
  1062. trans->block_rsv = &delayed_node->root->fs_info->delayed_block_rsv;
  1063. ret = __btrfs_commit_inode_delayed_items(trans, path, delayed_node);
  1064. btrfs_release_delayed_node(delayed_node);
  1065. btrfs_free_path(path);
  1066. trans->block_rsv = block_rsv;
  1067. return ret;
  1068. }
  1069. int btrfs_commit_inode_delayed_inode(struct inode *inode)
  1070. {
  1071. struct btrfs_trans_handle *trans;
  1072. struct btrfs_delayed_node *delayed_node = btrfs_get_delayed_node(inode);
  1073. struct btrfs_path *path;
  1074. struct btrfs_block_rsv *block_rsv;
  1075. int ret;
  1076. if (!delayed_node)
  1077. return 0;
  1078. mutex_lock(&delayed_node->mutex);
  1079. if (!test_bit(BTRFS_DELAYED_NODE_INODE_DIRTY, &delayed_node->flags)) {
  1080. mutex_unlock(&delayed_node->mutex);
  1081. btrfs_release_delayed_node(delayed_node);
  1082. return 0;
  1083. }
  1084. mutex_unlock(&delayed_node->mutex);
  1085. trans = btrfs_join_transaction(delayed_node->root);
  1086. if (IS_ERR(trans)) {
  1087. ret = PTR_ERR(trans);
  1088. goto out;
  1089. }
  1090. path = btrfs_alloc_path();
  1091. if (!path) {
  1092. ret = -ENOMEM;
  1093. goto trans_out;
  1094. }
  1095. path->leave_spinning = 1;
  1096. block_rsv = trans->block_rsv;
  1097. trans->block_rsv = &delayed_node->root->fs_info->delayed_block_rsv;
  1098. mutex_lock(&delayed_node->mutex);
  1099. if (test_bit(BTRFS_DELAYED_NODE_INODE_DIRTY, &delayed_node->flags))
  1100. ret = __btrfs_update_delayed_inode(trans, delayed_node->root,
  1101. path, delayed_node);
  1102. else
  1103. ret = 0;
  1104. mutex_unlock(&delayed_node->mutex);
  1105. btrfs_free_path(path);
  1106. trans->block_rsv = block_rsv;
  1107. trans_out:
  1108. btrfs_end_transaction(trans, delayed_node->root);
  1109. btrfs_btree_balance_dirty(delayed_node->root);
  1110. out:
  1111. btrfs_release_delayed_node(delayed_node);
  1112. return ret;
  1113. }
  1114. void btrfs_remove_delayed_node(struct inode *inode)
  1115. {
  1116. struct btrfs_delayed_node *delayed_node;
  1117. delayed_node = ACCESS_ONCE(BTRFS_I(inode)->delayed_node);
  1118. if (!delayed_node)
  1119. return;
  1120. BTRFS_I(inode)->delayed_node = NULL;
  1121. btrfs_release_delayed_node(delayed_node);
  1122. }
  1123. struct btrfs_async_delayed_work {
  1124. struct btrfs_delayed_root *delayed_root;
  1125. int nr;
  1126. struct btrfs_work work;
  1127. };
  1128. static void btrfs_async_run_delayed_root(struct btrfs_work *work)
  1129. {
  1130. struct btrfs_async_delayed_work *async_work;
  1131. struct btrfs_delayed_root *delayed_root;
  1132. struct btrfs_trans_handle *trans;
  1133. struct btrfs_path *path;
  1134. struct btrfs_delayed_node *delayed_node = NULL;
  1135. struct btrfs_root *root;
  1136. struct btrfs_block_rsv *block_rsv;
  1137. int total_done = 0;
  1138. async_work = container_of(work, struct btrfs_async_delayed_work, work);
  1139. delayed_root = async_work->delayed_root;
  1140. path = btrfs_alloc_path();
  1141. if (!path)
  1142. goto out;
  1143. again:
  1144. if (atomic_read(&delayed_root->items) < BTRFS_DELAYED_BACKGROUND / 2)
  1145. goto free_path;
  1146. delayed_node = btrfs_first_prepared_delayed_node(delayed_root);
  1147. if (!delayed_node)
  1148. goto free_path;
  1149. path->leave_spinning = 1;
  1150. root = delayed_node->root;
  1151. trans = btrfs_join_transaction(root);
  1152. if (IS_ERR(trans))
  1153. goto release_path;
  1154. block_rsv = trans->block_rsv;
  1155. trans->block_rsv = &root->fs_info->delayed_block_rsv;
  1156. __btrfs_commit_inode_delayed_items(trans, path, delayed_node);
  1157. trans->block_rsv = block_rsv;
  1158. btrfs_end_transaction(trans, root);
  1159. btrfs_btree_balance_dirty_nodelay(root);
  1160. release_path:
  1161. btrfs_release_path(path);
  1162. total_done++;
  1163. btrfs_release_prepared_delayed_node(delayed_node);
  1164. if ((async_work->nr == 0 && total_done < BTRFS_DELAYED_WRITEBACK) ||
  1165. total_done < async_work->nr)
  1166. goto again;
  1167. free_path:
  1168. btrfs_free_path(path);
  1169. out:
  1170. wake_up(&delayed_root->wait);
  1171. kfree(async_work);
  1172. }
  1173. static int btrfs_wq_run_delayed_node(struct btrfs_delayed_root *delayed_root,
  1174. struct btrfs_fs_info *fs_info, int nr)
  1175. {
  1176. struct btrfs_async_delayed_work *async_work;
  1177. if (atomic_read(&delayed_root->items) < BTRFS_DELAYED_BACKGROUND ||
  1178. btrfs_workqueue_normal_congested(fs_info->delayed_workers))
  1179. return 0;
  1180. async_work = kmalloc(sizeof(*async_work), GFP_NOFS);
  1181. if (!async_work)
  1182. return -ENOMEM;
  1183. async_work->delayed_root = delayed_root;
  1184. btrfs_init_work(&async_work->work, btrfs_delayed_meta_helper,
  1185. btrfs_async_run_delayed_root, NULL, NULL);
  1186. async_work->nr = nr;
  1187. btrfs_queue_work(fs_info->delayed_workers, &async_work->work);
  1188. return 0;
  1189. }
  /*
   * Emit a kernel warning if the delayed root of @root still has a delayed
   * node queued.
   */
  void btrfs_assert_delayed_root_empty(struct btrfs_root *root)
  {
  	struct btrfs_delayed_root *delayed_root = btrfs_get_delayed_root(root);

  	WARN_ON(btrfs_first_delayed_node(delayed_root));
  }
  1196. static int could_end_wait(struct btrfs_delayed_root *delayed_root, int seq)
  1197. {
  1198. int val = atomic_read(&delayed_root->items_seq);
  1199. if (val < seq || val >= seq + BTRFS_DELAYED_BATCH)
  1200. return 1;
  1201. if (atomic_read(&delayed_root->items) < BTRFS_DELAYED_BACKGROUND)
  1202. return 1;
  1203. return 0;
  1204. }
  1205. void btrfs_balance_delayed_items(struct btrfs_root *root)
  1206. {
  1207. struct btrfs_delayed_root *delayed_root;
  1208. struct btrfs_fs_info *fs_info = root->fs_info;
  1209. delayed_root = btrfs_get_delayed_root(root);
  1210. if (atomic_read(&delayed_root->items) < BTRFS_DELAYED_BACKGROUND)
  1211. return;
  1212. if (atomic_read(&delayed_root->items) >= BTRFS_DELAYED_WRITEBACK) {
  1213. int seq;
  1214. int ret;
  1215. seq = atomic_read(&delayed_root->items_seq);
  1216. ret = btrfs_wq_run_delayed_node(delayed_root, fs_info, 0);
  1217. if (ret)
  1218. return;
  1219. wait_event_interruptible(delayed_root->wait,
  1220. could_end_wait(delayed_root, seq));
  1221. return;
  1222. }
  1223. btrfs_wq_run_delayed_node(delayed_root, fs_info, BTRFS_DELAYED_BATCH);
  1224. }
  1225. /* Will return 0 or -ENOMEM */
  1226. int btrfs_insert_delayed_dir_index(struct btrfs_trans_handle *trans,
  1227. struct btrfs_root *root, const char *name,
  1228. int name_len, struct inode *dir,
  1229. struct btrfs_disk_key *disk_key, u8 type,
  1230. u64 index)
  1231. {
  1232. struct btrfs_delayed_node *delayed_node;
  1233. struct btrfs_delayed_item *delayed_item;
  1234. struct btrfs_dir_item *dir_item;
  1235. int ret;
  1236. delayed_node = btrfs_get_or_create_delayed_node(dir);
  1237. if (IS_ERR(delayed_node))
  1238. return PTR_ERR(delayed_node);
  1239. delayed_item = btrfs_alloc_delayed_item(sizeof(*dir_item) + name_len);
  1240. if (!delayed_item) {
  1241. ret = -ENOMEM;
  1242. goto release_node;
  1243. }
  1244. delayed_item->key.objectid = btrfs_ino(dir);
  1245. delayed_item->key.type = BTRFS_DIR_INDEX_KEY;
  1246. delayed_item->key.offset = index;
  1247. dir_item = (struct btrfs_dir_item *)delayed_item->data;
  1248. dir_item->location = *disk_key;
  1249. btrfs_set_stack_dir_transid(dir_item, trans->transid);
  1250. btrfs_set_stack_dir_data_len(dir_item, 0);
  1251. btrfs_set_stack_dir_name_len(dir_item, name_len);
  1252. btrfs_set_stack_dir_type(dir_item, type);
  1253. memcpy((char *)(dir_item + 1), name, name_len);
  1254. ret = btrfs_delayed_item_reserve_metadata(trans, root, delayed_item);
  1255. /*
  1256. * we have reserved enough space when we start a new transaction,
  1257. * so reserving metadata failure is impossible
  1258. */
  1259. BUG_ON(ret);
  1260. mutex_lock(&delayed_node->mutex);
  1261. ret = __btrfs_add_delayed_insertion_item(delayed_node, delayed_item);
  1262. if (unlikely(ret)) {
  1263. btrfs_err(root->fs_info, "err add delayed dir index item(name: %.*s) "
  1264. "into the insertion tree of the delayed node"
  1265. "(root id: %llu, inode id: %llu, errno: %d)",
  1266. name_len, name, delayed_node->root->objectid,
  1267. delayed_node->inode_id, ret);
  1268. BUG();
  1269. }
  1270. mutex_unlock(&delayed_node->mutex);
  1271. release_node:
  1272. btrfs_release_delayed_node(delayed_node);
  1273. return ret;
  1274. }
  1275. static int btrfs_delete_delayed_insertion_item(struct btrfs_root *root,
  1276. struct btrfs_delayed_node *node,
  1277. struct btrfs_key *key)
  1278. {
  1279. struct btrfs_delayed_item *item;
  1280. mutex_lock(&node->mutex);
  1281. item = __btrfs_lookup_delayed_insertion_item(node, key);
  1282. if (!item) {
  1283. mutex_unlock(&node->mutex);
  1284. return 1;
  1285. }
  1286. btrfs_delayed_item_release_metadata(root, item);
  1287. btrfs_release_delayed_item(item);
  1288. mutex_unlock(&node->mutex);
  1289. return 0;
  1290. }
  1291. int btrfs_delete_delayed_dir_index(struct btrfs_trans_handle *trans,
  1292. struct btrfs_root *root, struct inode *dir,
  1293. u64 index)
  1294. {
  1295. struct btrfs_delayed_node *node;
  1296. struct btrfs_delayed_item *item;
  1297. struct btrfs_key item_key;
  1298. int ret;
  1299. node = btrfs_get_or_create_delayed_node(dir);
  1300. if (IS_ERR(node))
  1301. return PTR_ERR(node);
  1302. item_key.objectid = btrfs_ino(dir);
  1303. item_key.type = BTRFS_DIR_INDEX_KEY;
  1304. item_key.offset = index;
  1305. ret = btrfs_delete_delayed_insertion_item(root, node, &item_key);
  1306. if (!ret)
  1307. goto end;
  1308. item = btrfs_alloc_delayed_item(0);
  1309. if (!item) {
  1310. ret = -ENOMEM;
  1311. goto end;
  1312. }
  1313. item->key = item_key;
  1314. ret = btrfs_delayed_item_reserve_metadata(trans, root, item);
  1315. /*
  1316. * we have reserved enough space when we start a new transaction,
  1317. * so reserving metadata failure is impossible.
  1318. */
  1319. BUG_ON(ret);
  1320. mutex_lock(&node->mutex);
  1321. ret = __btrfs_add_delayed_deletion_item(node, item);
  1322. if (unlikely(ret)) {
  1323. btrfs_err(root->fs_info, "err add delayed dir index item(index: %llu) "
  1324. "into the deletion tree of the delayed node"
  1325. "(root id: %llu, inode id: %llu, errno: %d)",
  1326. index, node->root->objectid, node->inode_id,
  1327. ret);
  1328. BUG();
  1329. }
  1330. mutex_unlock(&node->mutex);
  1331. end:
  1332. btrfs_release_delayed_node(node);
  1333. return ret;
  1334. }
  1335. int btrfs_inode_delayed_dir_index_count(struct inode *inode)
  1336. {
  1337. struct btrfs_delayed_node *delayed_node = btrfs_get_delayed_node(inode);
  1338. if (!delayed_node)
  1339. return -ENOENT;
  1340. /*
  1341. * Since we have held i_mutex of this directory, it is impossible that
  1342. * a new directory index is added into the delayed node and index_cnt
  1343. * is updated now. So we needn't lock the delayed node.
  1344. */
  1345. if (!delayed_node->index_cnt) {
  1346. btrfs_release_delayed_node(delayed_node);
  1347. return -EINVAL;
  1348. }
  1349. BTRFS_I(inode)->index_cnt = delayed_node->index_cnt;
  1350. btrfs_release_delayed_node(delayed_node);
  1351. return 0;
  1352. }
  1353. void btrfs_get_delayed_items(struct inode *inode, struct list_head *ins_list,
  1354. struct list_head *del_list)
  1355. {
  1356. struct btrfs_delayed_node *delayed_node;
  1357. struct btrfs_delayed_item *item;
  1358. delayed_node = btrfs_get_delayed_node(inode);
  1359. if (!delayed_node)
  1360. return;
  1361. mutex_lock(&delayed_node->mutex);
  1362. item = __btrfs_first_delayed_insertion_item(delayed_node);
  1363. while (item) {
  1364. atomic_inc(&item->refs);
  1365. list_add_tail(&item->readdir_list, ins_list);
  1366. item = __btrfs_next_delayed_item(item);
  1367. }
  1368. item = __btrfs_first_delayed_deletion_item(delayed_node);
  1369. while (item) {
  1370. atomic_inc(&item->refs);
  1371. list_add_tail(&item->readdir_list, del_list);
  1372. item = __btrfs_next_delayed_item(item);
  1373. }
  1374. mutex_unlock(&delayed_node->mutex);
  1375. /*
  1376. * This delayed node is still cached in the btrfs inode, so refs
  1377. * must be > 1 now, and we needn't check it is going to be freed
  1378. * or not.
  1379. *
  1380. * Besides that, this function is used to read dir, we do not
  1381. * insert/delete delayed items in this period. So we also needn't
  1382. * requeue or dequeue this delayed node.
  1383. */
  1384. atomic_dec(&delayed_node->refs);
  1385. }
  1386. void btrfs_put_delayed_items(struct list_head *ins_list,
  1387. struct list_head *del_list)
  1388. {
  1389. struct btrfs_delayed_item *curr, *next;
  1390. list_for_each_entry_safe(curr, next, ins_list, readdir_list) {
  1391. list_del(&curr->readdir_list);
  1392. if (atomic_dec_and_test(&curr->refs))
  1393. kfree(curr);
  1394. }
  1395. list_for_each_entry_safe(curr, next, del_list, readdir_list) {
  1396. list_del(&curr->readdir_list);
  1397. if (atomic_dec_and_test(&curr->refs))
  1398. kfree(curr);
  1399. }
  1400. }
  1401. int btrfs_should_delete_dir_index(struct list_head *del_list,
  1402. u64 index)
  1403. {
  1404. struct btrfs_delayed_item *curr, *next;
  1405. int ret;
  1406. if (list_empty(del_list))
  1407. return 0;
  1408. list_for_each_entry_safe(curr, next, del_list, readdir_list) {
  1409. if (curr->key.offset > index)
  1410. break;
  1411. list_del(&curr->readdir_list);
  1412. ret = (curr->key.offset == index);
  1413. if (atomic_dec_and_test(&curr->refs))
  1414. kfree(curr);
  1415. if (ret)
  1416. return 1;
  1417. else
  1418. continue;
  1419. }
  1420. return 0;
  1421. }
  1422. /*
  1423. * btrfs_readdir_delayed_dir_index - read dir info stored in the delayed tree
  1424. *
  1425. */
  1426. int btrfs_readdir_delayed_dir_index(struct dir_context *ctx,
  1427. struct list_head *ins_list, bool *emitted)
  1428. {
  1429. struct btrfs_dir_item *di;
  1430. struct btrfs_delayed_item *curr, *next;
  1431. struct btrfs_key location;
  1432. char *name;
  1433. int name_len;
  1434. int over = 0;
  1435. unsigned char d_type;
  1436. if (list_empty(ins_list))
  1437. return 0;
  1438. /*
  1439. * Changing the data of the delayed item is impossible. So
  1440. * we needn't lock them. And we have held i_mutex of the
  1441. * directory, nobody can delete any directory indexes now.
  1442. */
  1443. list_for_each_entry_safe(curr, next, ins_list, readdir_list) {
  1444. list_del(&curr->readdir_list);
  1445. if (curr->key.offset < ctx->pos) {
  1446. if (atomic_dec_and_test(&curr->refs))
  1447. kfree(curr);
  1448. continue;
  1449. }
  1450. ctx->pos = curr->key.offset;
  1451. di = (struct btrfs_dir_item *)curr->data;
  1452. name = (char *)(di + 1);
  1453. name_len = btrfs_stack_dir_name_len(di);
  1454. d_type = btrfs_filetype_table[di->type];
  1455. btrfs_disk_key_to_cpu(&location, &di->location);
  1456. over = !dir_emit(ctx, name, name_len,
  1457. location.objectid, d_type);
  1458. if (atomic_dec_and_test(&curr->refs))
  1459. kfree(curr);
  1460. if (over)
  1461. return 1;
  1462. *emitted = true;
  1463. }
  1464. return 0;
  1465. }
  1466. static void fill_stack_inode_item(struct btrfs_trans_handle *trans,
  1467. struct btrfs_inode_item *inode_item,
  1468. struct inode *inode)
  1469. {
  1470. btrfs_set_stack_inode_uid(inode_item, i_uid_read(inode));
  1471. btrfs_set_stack_inode_gid(inode_item, i_gid_read(inode));
  1472. btrfs_set_stack_inode_size(inode_item, BTRFS_I(inode)->disk_i_size);
  1473. btrfs_set_stack_inode_mode(inode_item, inode->i_mode);
  1474. btrfs_set_stack_inode_nlink(inode_item, inode->i_nlink);
  1475. btrfs_set_stack_inode_nbytes(inode_item, inode_get_bytes(inode));
  1476. btrfs_set_stack_inode_generation(inode_item,
  1477. BTRFS_I(inode)->generation);
  1478. btrfs_set_stack_inode_sequence(inode_item, inode->i_version);
  1479. btrfs_set_stack_inode_transid(inode_item, trans->transid);
  1480. btrfs_set_stack_inode_rdev(inode_item, inode->i_rdev);
  1481. btrfs_set_stack_inode_flags(inode_item, BTRFS_I(inode)->flags);
  1482. btrfs_set_stack_inode_block_group(inode_item, 0);
  1483. btrfs_set_stack_timespec_sec(&inode_item->atime,
  1484. inode->i_atime.tv_sec);
  1485. btrfs_set_stack_timespec_nsec(&inode_item->atime,
  1486. inode->i_atime.tv_nsec);
  1487. btrfs_set_stack_timespec_sec(&inode_item->mtime,
  1488. inode->i_mtime.tv_sec);
  1489. btrfs_set_stack_timespec_nsec(&inode_item->mtime,
  1490. inode->i_mtime.tv_nsec);
  1491. btrfs_set_stack_timespec_sec(&inode_item->ctime,
  1492. inode->i_ctime.tv_sec);
  1493. btrfs_set_stack_timespec_nsec(&inode_item->ctime,
  1494. inode->i_ctime.tv_nsec);
  1495. btrfs_set_stack_timespec_sec(&inode_item->otime,
  1496. BTRFS_I(inode)->i_otime.tv_sec);
  1497. btrfs_set_stack_timespec_nsec(&inode_item->otime,
  1498. BTRFS_I(inode)->i_otime.tv_nsec);
  1499. }
  1500. int btrfs_fill_inode(struct inode *inode, u32 *rdev)
  1501. {
  1502. struct btrfs_delayed_node *delayed_node;
  1503. struct btrfs_inode_item *inode_item;
  1504. delayed_node = btrfs_get_delayed_node(inode);
  1505. if (!delayed_node)
  1506. return -ENOENT;
  1507. mutex_lock(&delayed_node->mutex);
  1508. if (!test_bit(BTRFS_DELAYED_NODE_INODE_DIRTY, &delayed_node->flags)) {
  1509. mutex_unlock(&delayed_node->mutex);
  1510. btrfs_release_delayed_node(delayed_node);
  1511. return -ENOENT;
  1512. }
  1513. inode_item = &delayed_node->inode_item;
  1514. i_uid_write(inode, btrfs_stack_inode_uid(inode_item));
  1515. i_gid_write(inode, btrfs_stack_inode_gid(inode_item));
  1516. btrfs_i_size_write(inode, btrfs_stack_inode_size(inode_item));
  1517. inode->i_mode = btrfs_stack_inode_mode(inode_item);
  1518. set_nlink(inode, btrfs_stack_inode_nlink(inode_item));
  1519. inode_set_bytes(inode, btrfs_stack_inode_nbytes(inode_item));
  1520. BTRFS_I(inode)->generation = btrfs_stack_inode_generation(inode_item);
  1521. BTRFS_I(inode)->last_trans = btrfs_stack_inode_transid(inode_item);
  1522. inode->i_version = btrfs_stack_inode_sequence(inode_item);
  1523. inode->i_rdev = 0;
  1524. *rdev = btrfs_stack_inode_rdev(inode_item);
  1525. BTRFS_I(inode)->flags = btrfs_stack_inode_flags(inode_item);
  1526. inode->i_atime.tv_sec = btrfs_stack_timespec_sec(&inode_item->atime);
  1527. inode->i_atime.tv_nsec = btrfs_stack_timespec_nsec(&inode_item->atime);
  1528. inode->i_mtime.tv_sec = btrfs_stack_timespec_sec(&inode_item->mtime);
  1529. inode->i_mtime.tv_nsec = btrfs_stack_timespec_nsec(&inode_item->mtime);
  1530. inode->i_ctime.tv_sec = btrfs_stack_timespec_sec(&inode_item->ctime);
  1531. inode->i_ctime.tv_nsec = btrfs_stack_timespec_nsec(&inode_item->ctime);
  1532. BTRFS_I(inode)->i_otime.tv_sec =
  1533. btrfs_stack_timespec_sec(&inode_item->otime);
  1534. BTRFS_I(inode)->i_otime.tv_nsec =
  1535. btrfs_stack_timespec_nsec(&inode_item->otime);
  1536. inode->i_generation = BTRFS_I(inode)->generation;
  1537. BTRFS_I(inode)->index_cnt = (u64)-1;
  1538. mutex_unlock(&delayed_node->mutex);
  1539. btrfs_release_delayed_node(delayed_node);
  1540. return 0;
  1541. }
  1542. int btrfs_delayed_update_inode(struct btrfs_trans_handle *trans,
  1543. struct btrfs_root *root, struct inode *inode)
  1544. {
  1545. struct btrfs_delayed_node *delayed_node;
  1546. int ret = 0;
  1547. delayed_node = btrfs_get_or_create_delayed_node(inode);
  1548. if (IS_ERR(delayed_node))
  1549. return PTR_ERR(delayed_node);
  1550. mutex_lock(&delayed_node->mutex);
  1551. if (test_bit(BTRFS_DELAYED_NODE_INODE_DIRTY, &delayed_node->flags)) {
  1552. fill_stack_inode_item(trans, &delayed_node->inode_item, inode);
  1553. goto release_node;
  1554. }
  1555. ret = btrfs_delayed_inode_reserve_metadata(trans, root, inode,
  1556. delayed_node);
  1557. if (ret)
  1558. goto release_node;
  1559. fill_stack_inode_item(trans, &delayed_node->inode_item, inode);
  1560. set_bit(BTRFS_DELAYED_NODE_INODE_DIRTY, &delayed_node->flags);
  1561. delayed_node->count++;
  1562. atomic_inc(&root->fs_info->delayed_root->items);
  1563. release_node:
  1564. mutex_unlock(&delayed_node->mutex);
  1565. btrfs_release_delayed_node(delayed_node);
  1566. return ret;
  1567. }
  1568. int btrfs_delayed_delete_inode_ref(struct inode *inode)
  1569. {
  1570. struct btrfs_delayed_node *delayed_node;
  1571. /*
  1572. * we don't do delayed inode updates during log recovery because it
  1573. * leads to enospc problems. This means we also can't do
  1574. * delayed inode refs
  1575. */
  1576. if (BTRFS_I(inode)->root->fs_info->log_root_recovering)
  1577. return -EAGAIN;
  1578. delayed_node = btrfs_get_or_create_delayed_node(inode);
  1579. if (IS_ERR(delayed_node))
  1580. return PTR_ERR(delayed_node);
  1581. /*
  1582. * We don't reserve space for inode ref deletion is because:
  1583. * - We ONLY do async inode ref deletion for the inode who has only
  1584. * one link(i_nlink == 1), it means there is only one inode ref.
  1585. * And in most case, the inode ref and the inode item are in the
  1586. * same leaf, and we will deal with them at the same time.
  1587. * Since we are sure we will reserve the space for the inode item,
  1588. * it is unnecessary to reserve space for inode ref deletion.
  1589. * - If the inode ref and the inode item are not in the same leaf,
  1590. * We also needn't worry about enospc problem, because we reserve
  1591. * much more space for the inode update than it needs.
  1592. * - At the worst, we can steal some space from the global reservation.
  1593. * It is very rare.
  1594. */
  1595. mutex_lock(&delayed_node->mutex);
  1596. if (test_bit(BTRFS_DELAYED_NODE_DEL_IREF, &delayed_node->flags))
  1597. goto release_node;
  1598. set_bit(BTRFS_DELAYED_NODE_DEL_IREF, &delayed_node->flags);
  1599. delayed_node->count++;
  1600. atomic_inc(&BTRFS_I(inode)->root->fs_info->delayed_root->items);
  1601. release_node:
  1602. mutex_unlock(&delayed_node->mutex);
  1603. btrfs_release_delayed_node(delayed_node);
  1604. return 0;
  1605. }
  1606. static void __btrfs_kill_delayed_node(struct btrfs_delayed_node *delayed_node)
  1607. {
  1608. struct btrfs_root *root = delayed_node->root;
  1609. struct btrfs_delayed_item *curr_item, *prev_item;
  1610. mutex_lock(&delayed_node->mutex);
  1611. curr_item = __btrfs_first_delayed_insertion_item(delayed_node);
  1612. while (curr_item) {
  1613. btrfs_delayed_item_release_metadata(root, curr_item);
  1614. prev_item = curr_item;
  1615. curr_item = __btrfs_next_delayed_item(prev_item);
  1616. btrfs_release_delayed_item(prev_item);
  1617. }
  1618. curr_item = __btrfs_first_delayed_deletion_item(delayed_node);
  1619. while (curr_item) {
  1620. btrfs_delayed_item_release_metadata(root, curr_item);
  1621. prev_item = curr_item;
  1622. curr_item = __btrfs_next_delayed_item(prev_item);
  1623. btrfs_release_delayed_item(prev_item);
  1624. }
  1625. if (test_bit(BTRFS_DELAYED_NODE_DEL_IREF, &delayed_node->flags))
  1626. btrfs_release_delayed_iref(delayed_node);
  1627. if (test_bit(BTRFS_DELAYED_NODE_INODE_DIRTY, &delayed_node->flags)) {
  1628. btrfs_delayed_inode_release_metadata(root, delayed_node);
  1629. btrfs_release_delayed_inode(delayed_node);
  1630. }
  1631. mutex_unlock(&delayed_node->mutex);
  1632. }
  /*
   * Discard all delayed work queued for @inode.
   *
   * Does nothing when btrfs_get_delayed_node() returns no node for the
   * inode; otherwise the node is killed and then released.
   */
  void btrfs_kill_delayed_inode_items(struct inode *inode)
  {
          struct btrfs_delayed_node *node = btrfs_get_delayed_node(inode);

          if (node) {
                  __btrfs_kill_delayed_node(node);
                  btrfs_release_delayed_node(node);
          }
  }
  1642. void btrfs_kill_all_delayed_nodes(struct btrfs_root *root)
  1643. {
  1644. u64 inode_id = 0;
  1645. struct btrfs_delayed_node *delayed_nodes[8];
  1646. int i, n;
  1647. while (1) {
  1648. spin_lock(&root->inode_lock);
  1649. n = radix_tree_gang_lookup(&root->delayed_nodes_tree,
  1650. (void **)delayed_nodes, inode_id,
  1651. ARRAY_SIZE(delayed_nodes));
  1652. if (!n) {
  1653. spin_unlock(&root->inode_lock);
  1654. break;
  1655. }
  1656. inode_id = delayed_nodes[n - 1]->inode_id + 1;
  1657. for (i = 0; i < n; i++)
  1658. atomic_inc(&delayed_nodes[i]->refs);
  1659. spin_unlock(&root->inode_lock);
  1660. for (i = 0; i < n; i++) {
  1661. __btrfs_kill_delayed_node(delayed_nodes[i]);
  1662. btrfs_release_delayed_node(delayed_nodes[i]);
  1663. }
  1664. }
  1665. }
  /*
   * Kill and release every delayed node reachable from the delayed root
   * obtained for @root via btrfs_get_delayed_root().
   *
   * Nodes are visited with btrfs_first_delayed_node() /
   * btrfs_next_delayed_node(); the successor is fetched before the current
   * node is released.
   */
  void btrfs_destroy_delayed_inodes(struct btrfs_root *root)
  {
          struct btrfs_delayed_root *delayed_root = btrfs_get_delayed_root(root);
          struct btrfs_delayed_node *node, *next;

          for (node = btrfs_first_delayed_node(delayed_root); node;
               node = next) {
                  __btrfs_kill_delayed_node(node);
                  next = btrfs_next_delayed_node(node);
                  btrfs_release_delayed_node(node);
          }
  }