]> git.proxmox.com Git - mirror_ubuntu-jammy-kernel.git/blame - fs/notify/inode_mark.c
fs: move i_sb_list out from under inode_lock
[mirror_ubuntu-jammy-kernel.git] / fs / notify / inode_mark.c
CommitLineData
3be25f49
EP
1/*
2 * Copyright (C) 2008 Red Hat, Inc., Eric Paris <eparis@redhat.com>
3 *
4 * This program is free software; you can redistribute it and/or modify
5 * it under the terms of the GNU General Public License as published by
6 * the Free Software Foundation; either version 2, or (at your option)
7 * any later version.
8 *
9 * This program is distributed in the hope that it will be useful,
10 * but WITHOUT ANY WARRANTY; without even the implied warranty of
11 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
12 * GNU General Public License for more details.
13 *
14 * You should have received a copy of the GNU General Public License
15 * along with this program; see the file COPYING. If not, write to
16 * the Free Software Foundation, 675 Mass Ave, Cambridge, MA 02139, USA.
17 */
18
3be25f49
EP
19#include <linux/fs.h>
20#include <linux/init.h>
21#include <linux/kernel.h>
22#include <linux/module.h>
23#include <linux/mutex.h>
3be25f49 24#include <linux/spinlock.h>
164bc619 25#include <linux/writeback.h> /* for inode_lock */
3be25f49
EP
26
27#include <asm/atomic.h>
28
29#include <linux/fsnotify_backend.h>
30#include "fsnotify.h"
31
55fa6091
DC
32#include "../internal.h"
33
3be25f49
EP
34/*
35 * Recalculate the mask of events relevant to a given inode locked.
36 */
37static void fsnotify_recalc_inode_mask_locked(struct inode *inode)
38{
841bdc10 39 struct fsnotify_mark *mark;
3be25f49
EP
40 struct hlist_node *pos;
41 __u32 new_mask = 0;
42
43 assert_spin_locked(&inode->i_lock);
44
841bdc10
EP
45 hlist_for_each_entry(mark, pos, &inode->i_fsnotify_marks, i.i_list)
46 new_mask |= mark->mask;
3be25f49
EP
47 inode->i_fsnotify_mask = new_mask;
48}
49
50/*
51 * Recalculate the inode->i_fsnotify_mask, or the mask of all FS_* event types
52 * any notifier is interested in hearing for this inode.
53 */
54void fsnotify_recalc_inode_mask(struct inode *inode)
55{
56 spin_lock(&inode->i_lock);
57 fsnotify_recalc_inode_mask_locked(inode);
58 spin_unlock(&inode->i_lock);
c28f7e56
EP
59
60 __fsnotify_update_child_dentry_flags(inode);
3be25f49
EP
61}
62
5444e298 63void fsnotify_destroy_inode_mark(struct fsnotify_mark *mark)
3be25f49 64{
5444e298 65 struct inode *inode = mark->i.inode;
3be25f49 66
5444e298
EP
67 assert_spin_locked(&mark->lock);
68 assert_spin_locked(&mark->group->mark_lock);
3be25f49 69
3be25f49
EP
70 spin_lock(&inode->i_lock);
71
a4c6e996 72 hlist_del_init_rcu(&mark->i.i_list);
841bdc10 73 mark->i.inode = NULL;
3be25f49
EP
74
75 /*
e61ce867 76 * this mark is now off the inode->i_fsnotify_marks list and we
3be25f49
EP
77 * hold the inode->i_lock, so this is the perfect time to update the
78 * inode->i_fsnotify_mask
79 */
80 fsnotify_recalc_inode_mask_locked(inode);
81
82 spin_unlock(&inode->i_lock);
3be25f49
EP
83}
84
85/*
86 * Given an inode, destroy all of the marks associated with that inode.
87 */
88void fsnotify_clear_marks_by_inode(struct inode *inode)
89{
841bdc10 90 struct fsnotify_mark *mark, *lmark;
3be25f49
EP
91 struct hlist_node *pos, *n;
92 LIST_HEAD(free_list);
93
94 spin_lock(&inode->i_lock);
841bdc10
EP
95 hlist_for_each_entry_safe(mark, pos, n, &inode->i_fsnotify_marks, i.i_list) {
96 list_add(&mark->i.free_i_list, &free_list);
a4c6e996 97 hlist_del_init_rcu(&mark->i.i_list);
841bdc10 98 fsnotify_get_mark(mark);
3be25f49
EP
99 }
100 spin_unlock(&inode->i_lock);
101
841bdc10
EP
102 list_for_each_entry_safe(mark, lmark, &free_list, i.free_i_list) {
103 fsnotify_destroy_mark(mark);
104 fsnotify_put_mark(mark);
3be25f49
EP
105 }
106}
107
4d92604c
EP
108/*
109 * Given a group clear all of the inode marks associated with that group.
110 */
111void fsnotify_clear_inode_marks_by_group(struct fsnotify_group *group)
112{
113 fsnotify_clear_marks_by_group_flags(group, FSNOTIFY_MARK_FLAG_INODE);
114}
115
3be25f49
EP
116/*
117 * given a group and inode, find the mark associated with that combination.
118 * if found take a reference to that mark and return it, else return NULL
119 */
5444e298
EP
120struct fsnotify_mark *fsnotify_find_inode_mark_locked(struct fsnotify_group *group,
121 struct inode *inode)
3be25f49 122{
841bdc10 123 struct fsnotify_mark *mark;
3be25f49
EP
124 struct hlist_node *pos;
125
126 assert_spin_locked(&inode->i_lock);
127
841bdc10
EP
128 hlist_for_each_entry(mark, pos, &inode->i_fsnotify_marks, i.i_list) {
129 if (mark->group == group) {
130 fsnotify_get_mark(mark);
131 return mark;
3be25f49
EP
132 }
133 }
134 return NULL;
135}
136
137/*
35566087
AG
138 * given a group and inode, find the mark associated with that combination.
139 * if found take a reference to that mark and return it, else return NULL
3be25f49 140 */
5444e298
EP
141struct fsnotify_mark *fsnotify_find_inode_mark(struct fsnotify_group *group,
142 struct inode *inode)
35566087
AG
143{
144 struct fsnotify_mark *mark;
145
146 spin_lock(&inode->i_lock);
5444e298 147 mark = fsnotify_find_inode_mark_locked(group, inode);
35566087
AG
148 spin_unlock(&inode->i_lock);
149
150 return mark;
151}
3be25f49 152
3be25f49 153/*
90b1e7a5
EP
154 * If we are setting a mark mask on an inode mark we should pin the inode
155 * in memory.
156 */
157void fsnotify_set_inode_mark_mask_locked(struct fsnotify_mark *mark,
158 __u32 mask)
3be25f49 159{
90b1e7a5
EP
160 struct inode *inode;
161
162 assert_spin_locked(&mark->lock);
163
164 if (mask &&
165 mark->i.inode &&
166 !(mark->flags & FSNOTIFY_MARK_FLAG_OBJECT_PINNED)) {
167 mark->flags |= FSNOTIFY_MARK_FLAG_OBJECT_PINNED;
168 inode = igrab(mark->i.inode);
169 /*
170 * we shouldn't be able to get here if the inode wasn't
171 * already safely held in memory. But bug in case it
172 * ever is wrong.
173 */
174 BUG_ON(!inode);
175 }
3be25f49
EP
176}
177
178/*
0c6532e4 179 * Attach an initialized mark to a given inode.
3be25f49 180 * These marks may be used for the fsnotify backend to determine which
0c6532e4 181 * event types should be delivered to which group and for which inodes. These
6ad2d4e3
EP
182 * marks are ordered according to priority, highest number first, and then by
183 * the group's location in memory.
3be25f49 184 */
5444e298
EP
185int fsnotify_add_inode_mark(struct fsnotify_mark *mark,
186 struct fsnotify_group *group, struct inode *inode,
187 int allow_dups)
3be25f49 188{
0c6532e4
EP
189 struct fsnotify_mark *lmark;
190 struct hlist_node *node, *last = NULL;
3be25f49
EP
191 int ret = 0;
192
700307a2 193 mark->flags |= FSNOTIFY_MARK_FLAG_INODE;
098cf2fc 194
5444e298
EP
195 assert_spin_locked(&mark->lock);
196 assert_spin_locked(&group->mark_lock);
1ef5f13c 197
3be25f49
EP
198 spin_lock(&inode->i_lock);
199
0c6532e4 200 mark->i.inode = inode;
9f0d793b 201
0c6532e4
EP
202 /* is mark the first mark? */
203 if (hlist_empty(&inode->i_fsnotify_marks)) {
a4c6e996 204 hlist_add_head_rcu(&mark->i.i_list, &inode->i_fsnotify_marks);
0c6532e4
EP
205 goto out;
206 }
3be25f49 207
0c6532e4
EP
208 /* should mark be in the middle of the current list? */
209 hlist_for_each_entry(lmark, node, &inode->i_fsnotify_marks, i.i_list) {
210 last = node;
3be25f49 211
0c6532e4
EP
212 if ((lmark->group == group) && !allow_dups) {
213 ret = -EEXIST;
214 goto out;
215 }
3be25f49 216
6ad2d4e3
EP
217 if (mark->group->priority < lmark->group->priority)
218 continue;
219
220 if ((mark->group->priority == lmark->group->priority) &&
221 (mark->group < lmark->group))
0c6532e4 222 continue;
3be25f49 223
a4c6e996 224 hlist_add_before_rcu(&mark->i.i_list, &lmark->i.i_list);
0c6532e4 225 goto out;
3be25f49
EP
226 }
227
0c6532e4
EP
228 BUG_ON(last == NULL);
229 /* mark should be the last entry. last is the current last entry */
a4c6e996 230 hlist_add_after_rcu(last, &mark->i.i_list);
0c6532e4
EP
231out:
232 fsnotify_recalc_inode_mask_locked(inode);
3be25f49 233 spin_unlock(&inode->i_lock);
3be25f49
EP
234
235 return ret;
236}
164bc619
EP
237
238/**
239 * fsnotify_unmount_inodes - an sb is unmounting. handle any watched inodes.
240 * @list: list of inodes being unmounted (sb->s_inodes)
241 *
55fa6091
DC
242 * Called during unmount with no locks held, so needs to be safe against
243 * concurrent modifiers. We temporarily drop inode_sb_list_lock and CAN block.
164bc619
EP
244 */
245void fsnotify_unmount_inodes(struct list_head *list)
246{
247 struct inode *inode, *next_i, *need_iput = NULL;
248
55fa6091 249 spin_lock(&inode_sb_list_lock);
164bc619
EP
250 list_for_each_entry_safe(inode, next_i, list, i_sb_list) {
251 struct inode *need_iput_tmp;
252
253 /*
a4ffdde6 254 * We cannot __iget() an inode in state I_FREEING,
164bc619
EP
255 * I_WILL_FREE, or I_NEW which is fine because by that point
256 * the inode cannot have any associated watches.
257 */
250df6ed
DC
258 spin_lock(&inode->i_lock);
259 if (inode->i_state & (I_FREEING|I_WILL_FREE|I_NEW)) {
260 spin_unlock(&inode->i_lock);
164bc619 261 continue;
250df6ed 262 }
164bc619
EP
263
264 /*
265 * If i_count is zero, the inode cannot have any watches and
266 * doing an __iget/iput with MS_ACTIVE clear would actually
267 * evict all inodes with zero i_count from icache which is
268 * unnecessarily violent and may in fact be illegal to do.
269 */
250df6ed
DC
270 if (!atomic_read(&inode->i_count)) {
271 spin_unlock(&inode->i_lock);
164bc619 272 continue;
250df6ed 273 }
164bc619
EP
274
275 need_iput_tmp = need_iput;
276 need_iput = NULL;
277
278 /* In case fsnotify_inode_delete() drops a reference. */
279 if (inode != need_iput_tmp)
280 __iget(inode);
281 else
282 need_iput_tmp = NULL;
250df6ed 283 spin_unlock(&inode->i_lock);
164bc619
EP
284
285 /* In case the dropping of a reference would nuke next_i. */
286 if ((&next_i->i_sb_list != list) &&
250df6ed
DC
287 atomic_read(&next_i->i_count)) {
288 spin_lock(&next_i->i_lock);
289 if (!(next_i->i_state & (I_FREEING | I_WILL_FREE))) {
290 __iget(next_i);
291 need_iput = next_i;
292 }
293 spin_unlock(&next_i->i_lock);
164bc619
EP
294 }
295
296 /*
55fa6091 297 * We can safely drop inode_sb_list_lock here because we hold
164bc619 298 * references on both inode and next_i. Also no new inodes
55fa6091 299 * will be added since the umount has begun.
164bc619 300 */
55fa6091 301 spin_unlock(&inode_sb_list_lock);
164bc619
EP
302
303 if (need_iput_tmp)
304 iput(need_iput_tmp);
305
306 /* for each watch, send FS_UNMOUNT and then remove it */
307 fsnotify(inode, FS_UNMOUNT, inode, FSNOTIFY_EVENT_INODE, NULL, 0);
308
309 fsnotify_inode_delete(inode);
310
311 iput(inode);
312
55fa6091 313 spin_lock(&inode_sb_list_lock);
164bc619 314 }
55fa6091 315 spin_unlock(&inode_sb_list_lock);
164bc619 316}