blob: a18b8d7a30759b468f0afb33322cdd97703ff63c [file] [log] [blame]
// SPDX-License-Identifier: GPL-2.0
2#include <linux/fanotify.h>
3#include <linux/fdtable.h>
4#include <linux/fsnotify_backend.h>
5#include <linux/init.h>
6#include <linux/jiffies.h>
7#include <linux/kernel.h> /* UINT_MAX */
8#include <linux/mount.h>
9#include <linux/sched.h>
10#include <linux/sched/user.h>
11#include <linux/sched/signal.h>
12#include <linux/types.h>
13#include <linux/wait.h>
14#include <linux/audit.h>
15#include <linux/sched/mm.h>
16
17#include "fanotify.h"
18
19static bool should_merge(struct fsnotify_event *old_fsn,
20 struct fsnotify_event *new_fsn)
21{
22 struct fanotify_event_info *old, *new;
23
24 pr_debug("%s: old=%p new=%p\n", __func__, old_fsn, new_fsn);
25 old = FANOTIFY_E(old_fsn);
26 new = FANOTIFY_E(new_fsn);
27
28 if (old_fsn->inode == new_fsn->inode && old->tgid == new->tgid &&
29 old->path.mnt == new->path.mnt &&
30 old->path.dentry == new->path.dentry)
31 return true;
32 return false;
33}
34
35/* and the list better be locked by something too! */
36static int fanotify_merge(struct list_head *list, struct fsnotify_event *event)
37{
38 struct fsnotify_event *test_event;
39
40 pr_debug("%s: list=%p event=%p\n", __func__, list, event);
41
42 /*
43 * Don't merge a permission event with any other event so that we know
44 * the event structure we have created in fanotify_handle_event() is the
45 * one we should check for permission response.
46 */
47 if (fanotify_is_perm_event(event->mask))
48 return 0;
49
50 list_for_each_entry_reverse(test_event, list, list) {
51 if (should_merge(test_event, event)) {
52 test_event->mask |= event->mask;
53 return 1;
54 }
55 }
56
57 return 0;
58}
59
60static int fanotify_get_response(struct fsnotify_group *group,
61 struct fanotify_perm_event_info *event,
62 struct fsnotify_iter_info *iter_info)
63{
64 int ret;
65
66 pr_debug("%s: group=%p event=%p\n", __func__, group, event);
67
68 wait_event(group->fanotify_data.access_waitq, event->response);
69
70 /* userspace responded, convert to something usable */
71 switch (event->response & ~FAN_AUDIT) {
72 case FAN_ALLOW:
73 ret = 0;
74 break;
75 case FAN_DENY:
76 default:
77 ret = -EPERM;
78 }
79
80 /* Check if the response should be audited */
81 if (event->response & FAN_AUDIT)
82 audit_fanotify(event->response & ~FAN_AUDIT);
83
84 event->response = 0;
85
86 pr_debug("%s: group=%p event=%p about to return ret=%d\n", __func__,
87 group, event, ret);
88
89 return ret;
90}
91
92static bool fanotify_should_send_event(struct fsnotify_iter_info *iter_info,
93 u32 event_mask, const void *data,
94 int data_type)
95{
96 __u32 marks_mask = 0, marks_ignored_mask = 0;
97 const struct path *path = data;
98 struct fsnotify_mark *mark;
99 int type;
100
101 pr_debug("%s: report_mask=%x mask=%x data=%p data_type=%d\n",
102 __func__, iter_info->report_mask, event_mask, data, data_type);
103
104 /* if we don't have enough info to send an event to userspace say no */
105 if (data_type != FSNOTIFY_EVENT_PATH)
106 return false;
107
108 /* sorry, fanotify only gives a damn about files and dirs */
109 if (!d_is_reg(path->dentry) &&
110 !d_can_lookup(path->dentry))
111 return false;
112
113 fsnotify_foreach_obj_type(type) {
114 if (!fsnotify_iter_should_report_type(iter_info, type))
115 continue;
116 mark = iter_info->marks[type];
117 /*
118 * If the event is for a child and this mark doesn't care about
119 * events on a child, don't send it!
120 */
121 if (event_mask & FS_EVENT_ON_CHILD &&
122 (type != FSNOTIFY_OBJ_TYPE_INODE ||
123 !(mark->mask & FS_EVENT_ON_CHILD)))
124 continue;
125
126 marks_mask |= mark->mask;
127 marks_ignored_mask |= mark->ignored_mask;
128 }
129
130 if (d_is_dir(path->dentry) &&
131 !(marks_mask & FS_ISDIR & ~marks_ignored_mask))
132 return false;
133
134 if (event_mask & FAN_ALL_OUTGOING_EVENTS & marks_mask &
135 ~marks_ignored_mask)
136 return true;
137
138 return false;
139}
140
141struct fanotify_event_info *fanotify_alloc_event(struct fsnotify_group *group,
142 struct inode *inode, u32 mask,
143 const struct path *path)
144{
145 struct fanotify_event_info *event = NULL;
146 gfp_t gfp = GFP_KERNEL_ACCOUNT;
147
148 /*
149 * For queues with unlimited length lost events are not expected and
150 * can possibly have security implications. Avoid losing events when
151 * memory is short. For the limited size queues, avoid OOM killer in the
152 * target monitoring memcg as it may have security repercussion.
153 */
154 if (group->max_events == UINT_MAX)
155 gfp |= __GFP_NOFAIL;
156 else
157 gfp |= __GFP_RETRY_MAYFAIL;
158
159 /* Whoever is interested in the event, pays for the allocation. */
160 memalloc_use_memcg(group->memcg);
161
162 if (fanotify_is_perm_event(mask)) {
163 struct fanotify_perm_event_info *pevent;
164
165 pevent = kmem_cache_alloc(fanotify_perm_event_cachep, gfp);
166 if (!pevent)
167 goto out;
168 event = &pevent->fae;
169 pevent->response = 0;
170 goto init;
171 }
172 event = kmem_cache_alloc(fanotify_event_cachep, gfp);
173 if (!event)
174 goto out;
175init: __maybe_unused
176 fsnotify_init_event(&event->fse, inode, mask);
177 event->tgid = get_pid(task_tgid(current));
178 if (path) {
179 event->path = *path;
180 path_get(&event->path);
181 } else {
182 event->path.mnt = NULL;
183 event->path.dentry = NULL;
184 }
185out:
186 memalloc_unuse_memcg();
187 return event;
188}
189
190static int fanotify_handle_event(struct fsnotify_group *group,
191 struct inode *inode,
192 u32 mask, const void *data, int data_type,
193 const unsigned char *file_name, u32 cookie,
194 struct fsnotify_iter_info *iter_info)
195{
196 int ret = 0;
197 struct fanotify_event_info *event;
198 struct fsnotify_event *fsn_event;
199
200 BUILD_BUG_ON(FAN_ACCESS != FS_ACCESS);
201 BUILD_BUG_ON(FAN_MODIFY != FS_MODIFY);
202 BUILD_BUG_ON(FAN_CLOSE_NOWRITE != FS_CLOSE_NOWRITE);
203 BUILD_BUG_ON(FAN_CLOSE_WRITE != FS_CLOSE_WRITE);
204 BUILD_BUG_ON(FAN_OPEN != FS_OPEN);
205 BUILD_BUG_ON(FAN_EVENT_ON_CHILD != FS_EVENT_ON_CHILD);
206 BUILD_BUG_ON(FAN_Q_OVERFLOW != FS_Q_OVERFLOW);
207 BUILD_BUG_ON(FAN_OPEN_PERM != FS_OPEN_PERM);
208 BUILD_BUG_ON(FAN_ACCESS_PERM != FS_ACCESS_PERM);
209 BUILD_BUG_ON(FAN_ONDIR != FS_ISDIR);
210
211 if (!fanotify_should_send_event(iter_info, mask, data, data_type))
212 return 0;
213
214 pr_debug("%s: group=%p inode=%p mask=%x\n", __func__, group, inode,
215 mask);
216
217 if (fanotify_is_perm_event(mask)) {
218 /*
219 * fsnotify_prepare_user_wait() fails if we race with mark
220 * deletion. Just let the operation pass in that case.
221 */
222 if (!fsnotify_prepare_user_wait(iter_info))
223 return 0;
224 }
225
226 event = fanotify_alloc_event(group, inode, mask, data);
227 ret = -ENOMEM;
228 if (unlikely(!event)) {
229 /*
230 * We don't queue overflow events for permission events as
231 * there the access is denied and so no event is in fact lost.
232 */
233 if (!fanotify_is_perm_event(mask))
234 fsnotify_queue_overflow(group);
235 goto finish;
236 }
237
238 fsn_event = &event->fse;
239 ret = fsnotify_add_event(group, fsn_event, fanotify_merge);
240 if (ret) {
241 /* Permission events shouldn't be merged */
242 BUG_ON(ret == 1 && mask & FAN_ALL_PERM_EVENTS);
243 /* Our event wasn't used in the end. Free it. */
244 fsnotify_destroy_event(group, fsn_event);
245
246 ret = 0;
247 } else if (fanotify_is_perm_event(mask)) {
248 ret = fanotify_get_response(group, FANOTIFY_PE(fsn_event),
249 iter_info);
250 fsnotify_destroy_event(group, fsn_event);
251 }
252finish:
253 if (fanotify_is_perm_event(mask))
254 fsnotify_finish_user_wait(iter_info);
255
256 return ret;
257}
258
259static void fanotify_free_group_priv(struct fsnotify_group *group)
260{
261 struct user_struct *user;
262
263 user = group->fanotify_data.user;
264 atomic_dec(&user->fanotify_listeners);
265 free_uid(user);
266}
267
268static void fanotify_free_event(struct fsnotify_event *fsn_event)
269{
270 struct fanotify_event_info *event;
271
272 event = FANOTIFY_E(fsn_event);
273 path_put(&event->path);
274 put_pid(event->tgid);
275 if (fanotify_is_perm_event(fsn_event->mask)) {
276 kmem_cache_free(fanotify_perm_event_cachep,
277 FANOTIFY_PE(fsn_event));
278 return;
279 }
280 kmem_cache_free(fanotify_event_cachep, event);
281}
282
283static void fanotify_free_mark(struct fsnotify_mark *fsn_mark)
284{
285 kmem_cache_free(fanotify_mark_cache, fsn_mark);
286}
287
288const struct fsnotify_ops fanotify_fsnotify_ops = {
289 .handle_event = fanotify_handle_event,
290 .free_group_priv = fanotify_free_group_priv,
291 .free_event = fanotify_free_event,
292 .free_mark = fanotify_free_mark,
293};