perf/core: Fix lock inversion between perf,trace,cpuhp

Lockdep gifted us by noticing the following 4-way lockup scenario:

        perf_trace_init()
 #0       mutex_lock(&event_mutex)
          perf_trace_event_init()
            perf_trace_event_reg()
              tp_event->class->reg() := tracepoint_probe_register
 #1             mutex_lock(&tracepoints_mutex)
                trace_point_add_func()
 #2               static_key_enable()

 #2     do_cpu_up()
          perf_event_init_cpu()
 #3         mutex_lock(&pmus_lock)
 #4         mutex_lock(&ctx->mutex)

        perf_event_task_disable()
          mutex_lock(&current->perf_event_mutex)
 #4       ctx = perf_event_ctx_lock()
 #5       perf_event_for_each_child()

        do_exit()
          task_work_run()
            __fput()
              perf_release()
                perf_event_release_kernel()
 #4               mutex_lock(&ctx->mutex)
 #5               mutex_lock(&event->child_mutex)
                  free_event()
                    _free_event()
                      event->destroy() := perf_trace_destroy
 #0                     mutex_lock(&event_mutex);

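Fix that by moving the free_event() out from under the locks: the child
events are moved onto a local free_list while the locks are held, and
free_event() is only called on them after event->child_mutex has been
released.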

Signed-off-by: Peter Zijlstra (Intel) <peterz@infradead.org>
Cc: Alexander Shishkin <alexander.shishkin@linux.intel.com>
Cc: Arnaldo Carvalho de Melo <acme@redhat.com>
Cc: Jiri Olsa <jolsa@redhat.com>
Cc: Linus Torvalds <torvalds@linux-foundation.org>
Cc: Peter Zijlstra <peterz@infradead.org>
Cc: Stephane Eranian <eranian@google.com>
Cc: Steven Rostedt (VMware) <rostedt@goodmis.org>
Cc: Thomas Gleixner <tglx@linutronix.de>
Cc: Vince Weaver <vincent.weaver@maine.edu>
Cc: linux-kernel@vger.kernel.org
Signed-off-by: Ingo Molnar <mingo@kernel.org>

authored by Peter Zijlstra and committed by Ingo Molnar 82d94856 1f07476e

Changed files
+11 -2
kernel
events
+11 -2
kernel/events/core.c
 old  new
···
1231 1231    *	      perf_event_context::lock
1232 1232    *	    perf_event::mmap_mutex
1233 1233    *	    mmap_sem
     1234 +  *
     1235 +  *    cpu_hotplug_lock
     1236 +  *      pmus_lock
     1237 +  *	  cpuctx->mutex / perf_event_context::mutex
1234 1238    */
1235 1239   static struct perf_event_context *
1236 1240   perf_event_ctx_lock_nested(struct perf_event *event, int nesting)
···
4200 4196   {
4201 4197   	struct perf_event_context *ctx = event->ctx;
4202 4198   	struct perf_event *child, *tmp;
     4199 + 	LIST_HEAD(free_list);
4203 4200
4204 4201   	/*
4205 4202   	 * If we got here through err_file: fput(event_file); we will not have
···
4273 4268   					       struct perf_event, child_list);
4274 4269   		if (tmp == child) {
4275 4270   			perf_remove_from_context(child, DETACH_GROUP);
4276      - 			list_del(&child->child_list);
4277      - 			free_event(child);
     4271 + 			list_move(&child->child_list, &free_list);
4278 4272   			/*
4279 4273   			 * This matches the refcount bump in inherit_event();
4280 4274   			 * this can't be the last reference.
···
4287 4283   		goto again;
4288 4284   	}
4289 4285   	mutex_unlock(&event->child_mutex);
     4286 +
     4287 + 	list_for_each_entry_safe(child, tmp, &free_list, child_list) {
     4288 + 		list_del(&child->child_list);
     4289 + 		free_event(child);
     4290 + 	}
4290 4291
4291 4292   no_ctx:
4292 4293   	put_event(event); /* Must be the 'last' reference */