1// SPDX-License-Identifier: GPL-2.0
2/*
3 * ring buffer based function tracer
4 *
5 * Copyright (C) 2007-2012 Steven Rostedt <srostedt@redhat.com>
6 * Copyright (C) 2008 Ingo Molnar <mingo@redhat.com>
7 *
8 * Originally taken from the RT patch by:
9 * Arnaldo Carvalho de Melo <acme@redhat.com>
10 *
11 * Based on code from the latency_tracer, that is:
12 * Copyright (C) 2004-2006 Ingo Molnar
13 * Copyright (C) 2004 Nadia Yvette Chambers
14 */
15#include <linux/ring_buffer.h>
16#include <generated/utsrelease.h>
17#include <linux/stacktrace.h>
18#include <linux/writeback.h>
19#include <linux/kallsyms.h>
20#include <linux/seq_file.h>
21#include <linux/notifier.h>
22#include <linux/irqflags.h>
23#include <linux/debugfs.h>
24#include <linux/tracefs.h>
25#include <linux/pagemap.h>
26#include <linux/hardirq.h>
27#include <linux/linkage.h>
28#include <linux/uaccess.h>
29#include <linux/vmalloc.h>
30#include <linux/ftrace.h>
31#include <linux/module.h>
32#include <linux/percpu.h>
33#include <linux/splice.h>
34#include <linux/kdebug.h>
35#include <linux/string.h>
36#include <linux/mount.h>
37#include <linux/rwsem.h>
38#include <linux/slab.h>
39#include <linux/ctype.h>
40#include <linux/init.h>
41#include <linux/poll.h>
42#include <linux/nmi.h>
43#include <linux/fs.h>
44#include <linux/trace.h>
45#include <linux/sched/clock.h>
46#include <linux/sched/rt.h>
47
48#include "trace.h"
49#include "trace_output.h"
50
51/*
52 * On boot up, the ring buffer is set to the minimum size, so that
53 * we do not waste memory on systems that are not using tracing.
54 */
55bool ring_buffer_expanded;
56
57/*
58 * We need to change this state when a selftest is running.
 * A selftest will look into the ring buffer to count the entries
 * inserted during the selftest, although concurrent insertions into
 * the ring buffer, such as trace_printk(), could occur at the same
 * time, giving false positive or negative results.
63 */
64static bool __read_mostly tracing_selftest_running;
65
66/*
67 * If a tracer is running, we do not want to run SELFTEST.
68 */
69bool __read_mostly tracing_selftest_disabled;
70
71/* Pipe tracepoints to printk */
72struct trace_iterator *tracepoint_print_iter;
73int tracepoint_printk;
74static DEFINE_STATIC_KEY_FALSE(tracepoint_printk_key);
75
76/* For tracers that don't implement custom flags */
77static struct tracer_opt dummy_tracer_opt[] = {
78 { }
79};
80
81static int
82dummy_set_flag(struct trace_array *tr, u32 old_flags, u32 bit, int set)
83{
84 return 0;
85}
86
87/*
 * To prevent the comm cache from being overwritten when no
 * tracing is active, only save the comm when a trace event
 * occurs.
91 */
92static DEFINE_PER_CPU(bool, trace_taskinfo_save);
93
94/*
95 * Kill all tracing for good (never come back).
 * It is initialized to 1, and is set back to zero only when the
 * initialization of the tracer is successful; that is the only
 * place that clears it.
99 */
100static int tracing_disabled = 1;
101
102cpumask_var_t __read_mostly tracing_buffer_mask;
103
104/*
105 * ftrace_dump_on_oops - variable to dump ftrace buffer on oops
106 *
 * If there is an oops (or kernel panic) and ftrace_dump_on_oops
 * is set, then ftrace_dump() is called. This will output the contents
 * of the ftrace buffers to the console. This is very useful for
 * capturing traces that lead to crashes and outputting them to a
 * serial console.
 *
 * It is off by default, but you can enable it either by specifying
 * "ftrace_dump_on_oops" on the kernel command line, or by setting
 * /proc/sys/kernel/ftrace_dump_on_oops.
 * Set it to 1 to dump the buffers of all CPUs.
 * Set it to 2 to dump only the buffer of the CPU that triggered the oops.
118 */
119
120enum ftrace_dump_mode ftrace_dump_on_oops;
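
/*
 * Example (illustrative): booting with "ftrace_dump_on_oops=orig_cpu" dumps
 * only the buffer of the CPU that triggered the oops, while
 * "echo 1 > /proc/sys/kernel/ftrace_dump_on_oops" at run time enables
 * dumping the buffers of all CPUs.
 */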
121
122/* When set, tracing will stop when a WARN*() is hit */
123int __disable_trace_on_warning;
124
125#ifdef CONFIG_TRACE_EVAL_MAP_FILE
126/* Map of enums to their values, for "eval_map" file */
127struct trace_eval_map_head {
128 struct module *mod;
129 unsigned long length;
130};
131
132union trace_eval_map_item;
133
134struct trace_eval_map_tail {
135 /*
136 * "end" is first and points to NULL as it must be different
137 * than "mod" or "eval_string"
138 */
139 union trace_eval_map_item *next;
140 const char *end; /* points to NULL */
141};
142
143static DEFINE_MUTEX(trace_eval_mutex);
144
145/*
146 * The trace_eval_maps are saved in an array with two extra elements,
147 * one at the beginning, and one at the end. The beginning item contains
148 * the count of the saved maps (head.length), and the module they
149 * belong to if not built in (head.mod). The ending item contains a
150 * pointer to the next array of saved eval_map items.
151 */
152union trace_eval_map_item {
153 struct trace_eval_map map;
154 struct trace_eval_map_head head;
155 struct trace_eval_map_tail tail;
156};
157
158static union trace_eval_map_item *trace_eval_maps;
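
/*
 * Illustrative layout of one saved array (a sketch of the scheme described
 * in the comment above):
 *
 *	[0]     head: .mod = owning module (or NULL), .length = N
 *	[1..N]  the N saved trace_eval_map entries
 *	[N+1]   tail: .next = pointer to the next saved array (or NULL)
 */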
159#endif /* CONFIG_TRACE_EVAL_MAP_FILE */
160
161static int tracing_set_tracer(struct trace_array *tr, const char *buf);
162
163#define MAX_TRACER_SIZE 100
164static char bootup_tracer_buf[MAX_TRACER_SIZE] __initdata;
165static char *default_bootup_tracer;
166
167static bool allocate_snapshot;
168
169static int __init set_cmdline_ftrace(char *str)
170{
171 strlcpy(bootup_tracer_buf, str, MAX_TRACER_SIZE);
172 default_bootup_tracer = bootup_tracer_buf;
173 /* We are using ftrace early, expand it */
174 ring_buffer_expanded = true;
175 return 1;
176}
177__setup("ftrace=", set_cmdline_ftrace);
178
179static int __init set_ftrace_dump_on_oops(char *str)
180{
181 if (*str++ != '=' || !*str) {
182 ftrace_dump_on_oops = DUMP_ALL;
183 return 1;
184 }
185
186 if (!strcmp("orig_cpu", str)) {
187 ftrace_dump_on_oops = DUMP_ORIG;
188 return 1;
189 }
190
191 return 0;
192}
193__setup("ftrace_dump_on_oops", set_ftrace_dump_on_oops);
194
195static int __init stop_trace_on_warning(char *str)
196{
197 if ((strcmp(str, "=0") != 0 && strcmp(str, "=off") != 0))
198 __disable_trace_on_warning = 1;
199 return 1;
200}
201__setup("traceoff_on_warning", stop_trace_on_warning);
202
203static int __init boot_alloc_snapshot(char *str)
204{
205 allocate_snapshot = true;
206 /* We also need the main ring buffer expanded */
207 ring_buffer_expanded = true;
208 return 1;
209}
210__setup("alloc_snapshot", boot_alloc_snapshot);
211
212
213static char trace_boot_options_buf[MAX_TRACER_SIZE] __initdata;
214
215static int __init set_trace_boot_options(char *str)
216{
217 strlcpy(trace_boot_options_buf, str, MAX_TRACER_SIZE);
218 return 0;
219}
220__setup("trace_options=", set_trace_boot_options);
221
222static char trace_boot_clock_buf[MAX_TRACER_SIZE] __initdata;
223static char *trace_boot_clock __initdata;
224
225static int __init set_trace_boot_clock(char *str)
226{
227 strlcpy(trace_boot_clock_buf, str, MAX_TRACER_SIZE);
228 trace_boot_clock = trace_boot_clock_buf;
229 return 0;
230}
231__setup("trace_clock=", set_trace_boot_clock);
232
233static int __init set_tracepoint_printk(char *str)
234{
235 if ((strcmp(str, "=0") != 0 && strcmp(str, "=off") != 0))
236 tracepoint_printk = 1;
237 return 1;
238}
239__setup("tp_printk", set_tracepoint_printk);
240
241unsigned long long ns2usecs(u64 nsec)
242{
243 nsec += 500;
244 do_div(nsec, 1000);
245 return nsec;
246}
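
/*
 * For example, ns2usecs(1499) returns 1 and ns2usecs(1500) returns 2:
 * the +500 rounds to the nearest microsecond before dividing by 1000.
 */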
247
248/* trace_flags holds trace_options default values */
249#define TRACE_DEFAULT_FLAGS \
250 (FUNCTION_DEFAULT_FLAGS | \
251 TRACE_ITER_PRINT_PARENT | TRACE_ITER_PRINTK | \
252 TRACE_ITER_ANNOTATE | TRACE_ITER_CONTEXT_INFO | \
253 TRACE_ITER_RECORD_CMD | TRACE_ITER_OVERWRITE | \
254 TRACE_ITER_IRQ_INFO | TRACE_ITER_MARKERS)
255
256/* trace_options that are only supported by global_trace */
257#define TOP_LEVEL_TRACE_FLAGS (TRACE_ITER_PRINTK | \
258 TRACE_ITER_PRINTK_MSGONLY | TRACE_ITER_RECORD_CMD)
259
260/* trace_flags that are default zero for instances */
261#define ZEROED_TRACE_FLAGS \
262 (TRACE_ITER_EVENT_FORK | TRACE_ITER_FUNC_FORK)
263
264/*
265 * The global_trace is the descriptor that holds the top-level tracing
266 * buffers for the live tracing.
267 */
268static struct trace_array global_trace = {
269 .trace_flags = TRACE_DEFAULT_FLAGS,
270};
271
272LIST_HEAD(ftrace_trace_arrays);
273
274int trace_array_get(struct trace_array *this_tr)
275{
276 struct trace_array *tr;
277 int ret = -ENODEV;
278
279 mutex_lock(&trace_types_lock);
280 list_for_each_entry(tr, &ftrace_trace_arrays, list) {
281 if (tr == this_tr) {
282 tr->ref++;
283 ret = 0;
284 break;
285 }
286 }
287 mutex_unlock(&trace_types_lock);
288
289 return ret;
290}
291
292static void __trace_array_put(struct trace_array *this_tr)
293{
294 WARN_ON(!this_tr->ref);
295 this_tr->ref--;
296}
297
298void trace_array_put(struct trace_array *this_tr)
299{
300 mutex_lock(&trace_types_lock);
301 __trace_array_put(this_tr);
302 mutex_unlock(&trace_types_lock);
303}
304
305int call_filter_check_discard(struct trace_event_call *call, void *rec,
306 struct ring_buffer *buffer,
307 struct ring_buffer_event *event)
308{
309 if (unlikely(call->flags & TRACE_EVENT_FL_FILTERED) &&
310 !filter_match_preds(call->filter, rec)) {
311 __trace_event_discard_commit(buffer, event);
312 return 1;
313 }
314
315 return 0;
316}
317
318void trace_free_pid_list(struct trace_pid_list *pid_list)
319{
320 vfree(pid_list->pids);
321 kfree(pid_list);
322}
323
324/**
325 * trace_find_filtered_pid - check if a pid exists in a filtered_pid list
326 * @filtered_pids: The list of pids to check
327 * @search_pid: The PID to find in @filtered_pids
328 *
 * Returns true if @search_pid is found in @filtered_pids, and false otherwise.
330 */
331bool
332trace_find_filtered_pid(struct trace_pid_list *filtered_pids, pid_t search_pid)
333{
334 /*
335 * If pid_max changed after filtered_pids was created, we
336 * by default ignore all pids greater than the previous pid_max.
337 */
338 if (search_pid >= filtered_pids->pid_max)
339 return false;
340
341 return test_bit(search_pid, filtered_pids->pids);
342}
343
344/**
345 * trace_ignore_this_task - should a task be ignored for tracing
346 * @filtered_pids: The list of pids to check
347 * @task: The task that should be ignored if not filtered
348 *
349 * Checks if @task should be traced or not from @filtered_pids.
350 * Returns true if @task should *NOT* be traced.
351 * Returns false if @task should be traced.
352 */
353bool
354trace_ignore_this_task(struct trace_pid_list *filtered_pids, struct task_struct *task)
355{
356 /*
357 * Return false, because if filtered_pids does not exist,
358 * all pids are good to trace.
359 */
360 if (!filtered_pids)
361 return false;
362
363 return !trace_find_filtered_pid(filtered_pids, task->pid);
364}
365
366/**
367 * trace_pid_filter_add_remove_task - Add or remove a task from a pid_list
368 * @pid_list: The list to modify
369 * @self: The current task for fork or NULL for exit
370 * @task: The task to add or remove
371 *
 * When adding a task, and if @self is defined, the task is only added if
 * @self is also included in @pid_list. This happens on fork, and tasks
 * should only be added when the parent is listed. If @self is NULL, then
 * the @task pid will be removed from the list, which would happen on exit
 * of a task.
377 */
378void trace_filter_add_remove_task(struct trace_pid_list *pid_list,
379 struct task_struct *self,
380 struct task_struct *task)
381{
382 if (!pid_list)
383 return;
384
385 /* For forks, we only add if the forking task is listed */
386 if (self) {
387 if (!trace_find_filtered_pid(pid_list, self->pid))
388 return;
389 }
390
391 /* Sorry, but we don't support pid_max changing after setting */
392 if (task->pid >= pid_list->pid_max)
393 return;
394
395 /* "self" is set for forks, and NULL for exits */
396 if (self)
397 set_bit(task->pid, pid_list->pids);
398 else
399 clear_bit(task->pid, pid_list->pids);
400}
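
/*
 * For example (illustrative): on fork, @self is the parent, so the child's
 * pid bit is set only when the parent's pid is already in @pid_list. On
 * exit, @self is NULL and the exiting task's pid bit is simply cleared.
 */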
401
402/**
403 * trace_pid_next - Used for seq_file to get to the next pid of a pid_list
404 * @pid_list: The pid list to show
 * @v: The last pid that was shown (+1 of the actual pid to let zero be displayed)
406 * @pos: The position of the file
407 *
408 * This is used by the seq_file "next" operation to iterate the pids
409 * listed in a trace_pid_list structure.
410 *
411 * Returns the pid+1 as we want to display pid of zero, but NULL would
412 * stop the iteration.
413 */
414void *trace_pid_next(struct trace_pid_list *pid_list, void *v, loff_t *pos)
415{
416 unsigned long pid = (unsigned long)v;
417
418 (*pos)++;
419
	/* pid already is +1 of the actual previous bit */
421 pid = find_next_bit(pid_list->pids, pid_list->pid_max, pid);
422
423 /* Return pid + 1 to allow zero to be represented */
424 if (pid < pid_list->pid_max)
425 return (void *)(pid + 1);
426
427 return NULL;
428}
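
/*
 * Illustrative: because pids are stored off by one, a return value of
 * (void *)1 means pid 0 is in the list, while a NULL return ends the
 * seq_file iteration.
 */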
429
430/**
431 * trace_pid_start - Used for seq_file to start reading pid lists
432 * @pid_list: The pid list to show
433 * @pos: The position of the file
434 *
435 * This is used by seq_file "start" operation to start the iteration
436 * of listing pids.
437 *
438 * Returns the pid+1 as we want to display pid of zero, but NULL would
439 * stop the iteration.
440 */
441void *trace_pid_start(struct trace_pid_list *pid_list, loff_t *pos)
442{
443 unsigned long pid;
444 loff_t l = 0;
445
446 pid = find_first_bit(pid_list->pids, pid_list->pid_max);
447 if (pid >= pid_list->pid_max)
448 return NULL;
449
450 /* Return pid + 1 so that zero can be the exit value */
451 for (pid++; pid && l < *pos;
452 pid = (unsigned long)trace_pid_next(pid_list, (void *)pid, &l))
453 ;
454 return (void *)pid;
455}
456
457/**
458 * trace_pid_show - show the current pid in seq_file processing
459 * @m: The seq_file structure to write into
460 * @v: A void pointer of the pid (+1) value to display
461 *
462 * Can be directly used by seq_file operations to display the current
463 * pid value.
464 */
465int trace_pid_show(struct seq_file *m, void *v)
466{
467 unsigned long pid = (unsigned long)v - 1;
468
469 seq_printf(m, "%lu\n", pid);
470 return 0;
471}
472
473/* 128 should be much more than enough */
474#define PID_BUF_SIZE 127
475
476int trace_pid_write(struct trace_pid_list *filtered_pids,
477 struct trace_pid_list **new_pid_list,
478 const char __user *ubuf, size_t cnt)
479{
480 struct trace_pid_list *pid_list;
481 struct trace_parser parser;
482 unsigned long val;
483 int nr_pids = 0;
484 ssize_t read = 0;
485 ssize_t ret = 0;
486 loff_t pos;
487 pid_t pid;
488
489 if (trace_parser_get_init(&parser, PID_BUF_SIZE + 1))
490 return -ENOMEM;
491
492 /*
	 * Always create a new array when the user adds new pids; the
	 * write is an all-or-nothing operation. If the operation fails,
	 * then the current list is not modified.
497 */
498 pid_list = kmalloc(sizeof(*pid_list), GFP_KERNEL);
499 if (!pid_list)
500 return -ENOMEM;
501
502 pid_list->pid_max = READ_ONCE(pid_max);
503
504 /* Only truncating will shrink pid_max */
505 if (filtered_pids && filtered_pids->pid_max > pid_list->pid_max)
506 pid_list->pid_max = filtered_pids->pid_max;
507
508 pid_list->pids = vzalloc((pid_list->pid_max + 7) >> 3);
509 if (!pid_list->pids) {
510 kfree(pid_list);
511 return -ENOMEM;
512 }
513
514 if (filtered_pids) {
515 /* copy the current bits to the new max */
516 for_each_set_bit(pid, filtered_pids->pids,
517 filtered_pids->pid_max) {
518 set_bit(pid, pid_list->pids);
519 nr_pids++;
520 }
521 }
522
523 while (cnt > 0) {
524
525 pos = 0;
526
527 ret = trace_get_user(&parser, ubuf, cnt, &pos);
528 if (ret < 0 || !trace_parser_loaded(&parser))
529 break;
530
531 read += ret;
532 ubuf += ret;
533 cnt -= ret;
534
535 ret = -EINVAL;
536 if (kstrtoul(parser.buffer, 0, &val))
537 break;
538 if (val >= pid_list->pid_max)
539 break;
540
541 pid = (pid_t)val;
542
543 set_bit(pid, pid_list->pids);
544 nr_pids++;
545
546 trace_parser_clear(&parser);
547 ret = 0;
548 }
549 trace_parser_put(&parser);
550
551 if (ret < 0) {
552 trace_free_pid_list(pid_list);
553 return ret;
554 }
555
556 if (!nr_pids) {
557 /* Cleared the list of pids */
558 trace_free_pid_list(pid_list);
559 read = ret;
560 pid_list = NULL;
561 }
562
563 *new_pid_list = pid_list;
564
565 return read;
566}
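
/*
 * Illustrative example: writing "123 456" builds a fresh bitmap with bits
 * 123 and 456 set, in addition to any bits copied over from @filtered_pids.
 * If no pids end up set at all, a NULL list is installed, which clears the
 * filter entirely.
 */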
567
568static u64 buffer_ftrace_now(struct trace_buffer *buf, int cpu)
569{
570 u64 ts;
571
572 /* Early boot up does not have a buffer yet */
573 if (!buf->buffer)
574 return trace_clock_local();
575
576 ts = ring_buffer_time_stamp(buf->buffer, cpu);
577 ring_buffer_normalize_time_stamp(buf->buffer, cpu, &ts);
578
579 return ts;
580}
581
582u64 ftrace_now(int cpu)
583{
584 return buffer_ftrace_now(&global_trace.trace_buffer, cpu);
585}
586
587/**
588 * tracing_is_enabled - Show if global_trace has been disabled
589 *
 * Shows if the global trace has been enabled or not. It uses the
 * mirror flag "buffer_disabled" so it can be used in fast paths, such
 * as by the irqsoff tracer. But it may be inaccurate due to races. If
 * you need to know the accurate state, use tracing_is_on(), which is a
 * little slower but accurate.
595 */
596int tracing_is_enabled(void)
597{
598 /*
599 * For quick access (irqsoff uses this in fast path), just
600 * return the mirror variable of the state of the ring buffer.
601 * It's a little racy, but we don't really care.
602 */
603 smp_rmb();
604 return !global_trace.buffer_disabled;
605}
606
607/*
608 * trace_buf_size is the size in bytes that is allocated
609 * for a buffer. Note, the number of bytes is always rounded
610 * to page size.
611 *
 * This number is purposely set to a low value of 16384.
 * If a dump on oops happens, not having to wait for a huge
 * amount of output is much appreciated. In any case, this is
 * configurable at both boot time and run time.
616 */
617#define TRACE_BUF_SIZE_DEFAULT 1441792UL /* 16384 * 88 (sizeof(entry)) */
618
619static unsigned long trace_buf_size = TRACE_BUF_SIZE_DEFAULT;
620
621/* trace_types holds a link list of available tracers. */
622static struct tracer *trace_types __read_mostly;
623
624/*
625 * trace_types_lock is used to protect the trace_types list.
626 */
627DEFINE_MUTEX(trace_types_lock);
628
629/*
630 * serialize the access of the ring buffer
631 *
 * The ring buffer serializes readers, but that is only low level protection.
 * The validity of the events (returned by ring_buffer_peek() etc.)
 * is not protected by the ring buffer.
 *
 * The content of events may become garbage if we allow other processes
 * to consume these events concurrently:
 *   A) the page of the consumed events may become a normal page
 *      (not a reader page) in the ring buffer, and this page will be
 *      rewritten by the event producer.
 *   B) the page of the consumed events may become a page for splice_read,
 *      and this page will be returned to the system.
 *
 * These primitives allow multiple processes to access different per-cpu
 * ring buffers concurrently.
 *
 * These primitives don't distinguish read-only and read-consume access.
 * Multiple read-only accesses are also serialized.
649 */
650
651#ifdef CONFIG_SMP
652static DECLARE_RWSEM(all_cpu_access_lock);
653static DEFINE_PER_CPU(struct mutex, cpu_access_lock);
654
655static inline void trace_access_lock(int cpu)
656{
657 if (cpu == RING_BUFFER_ALL_CPUS) {
658 /* gain it for accessing the whole ring buffer. */
659 down_write(&all_cpu_access_lock);
660 } else {
661 /* gain it for accessing a cpu ring buffer. */
662
663 /* Firstly block other trace_access_lock(RING_BUFFER_ALL_CPUS). */
664 down_read(&all_cpu_access_lock);
665
666 /* Secondly block other access to this @cpu ring buffer. */
667 mutex_lock(&per_cpu(cpu_access_lock, cpu));
668 }
669}
670
671static inline void trace_access_unlock(int cpu)
672{
673 if (cpu == RING_BUFFER_ALL_CPUS) {
674 up_write(&all_cpu_access_lock);
675 } else {
676 mutex_unlock(&per_cpu(cpu_access_lock, cpu));
677 up_read(&all_cpu_access_lock);
678 }
679}
680
681static inline void trace_access_lock_init(void)
682{
683 int cpu;
684
685 for_each_possible_cpu(cpu)
686 mutex_init(&per_cpu(cpu_access_lock, cpu));
687}
688
689#else
690
691static DEFINE_MUTEX(access_lock);
692
693static inline void trace_access_lock(int cpu)
694{
695 (void)cpu;
696 mutex_lock(&access_lock);
697}
698
699static inline void trace_access_unlock(int cpu)
700{
701 (void)cpu;
702 mutex_unlock(&access_lock);
703}
704
705static inline void trace_access_lock_init(void)
706{
707}
708
709#endif
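
/*
 * Typical (illustrative) pairing of the primitives above when reading
 * events from a single CPU's buffer:
 *
 *	trace_access_lock(cpu);
 *	event = ring_buffer_peek(buffer, cpu, &ts, &lost_events);
 *	...
 *	trace_access_unlock(cpu);
 */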
710
711#ifdef CONFIG_STACKTRACE
712static void __ftrace_trace_stack(struct ring_buffer *buffer,
713 unsigned long flags,
714 int skip, int pc, struct pt_regs *regs);
715static inline void ftrace_trace_stack(struct trace_array *tr,
716 struct ring_buffer *buffer,
717 unsigned long flags,
718 int skip, int pc, struct pt_regs *regs);
719
720#else
721static inline void __ftrace_trace_stack(struct ring_buffer *buffer,
722 unsigned long flags,
723 int skip, int pc, struct pt_regs *regs)
724{
725}
726static inline void ftrace_trace_stack(struct trace_array *tr,
727 struct ring_buffer *buffer,
728 unsigned long flags,
729 int skip, int pc, struct pt_regs *regs)
730{
731}
732
733#endif
734
735static __always_inline void
736trace_event_setup(struct ring_buffer_event *event,
737 int type, unsigned long flags, int pc)
738{
739 struct trace_entry *ent = ring_buffer_event_data(event);
740
741 tracing_generic_entry_update(ent, flags, pc);
742 ent->type = type;
743}
744
745static __always_inline struct ring_buffer_event *
746__trace_buffer_lock_reserve(struct ring_buffer *buffer,
747 int type,
748 unsigned long len,
749 unsigned long flags, int pc)
750{
751 struct ring_buffer_event *event;
752
753 event = ring_buffer_lock_reserve(buffer, len);
754 if (event != NULL)
755 trace_event_setup(event, type, flags, pc);
756
757 return event;
758}
759
760void tracer_tracing_on(struct trace_array *tr)
761{
762 if (tr->trace_buffer.buffer)
763 ring_buffer_record_on(tr->trace_buffer.buffer);
764 /*
765 * This flag is looked at when buffers haven't been allocated
766 * yet, or by some tracers (like irqsoff), that just want to
767 * know if the ring buffer has been disabled, but it can handle
	 * races where it gets disabled while we still do a record.
769 * As the check is in the fast path of the tracers, it is more
770 * important to be fast than accurate.
771 */
772 tr->buffer_disabled = 0;
773 /* Make the flag seen by readers */
774 smp_wmb();
775}
776
777/**
778 * tracing_on - enable tracing buffers
779 *
780 * This function enables tracing buffers that may have been
781 * disabled with tracing_off.
782 */
783void tracing_on(void)
784{
785 tracer_tracing_on(&global_trace);
786}
787EXPORT_SYMBOL_GPL(tracing_on);
788
789
790static __always_inline void
791__buffer_unlock_commit(struct ring_buffer *buffer, struct ring_buffer_event *event)
792{
793 __this_cpu_write(trace_taskinfo_save, true);
794
795 /* If this is the temp buffer, we need to commit fully */
796 if (this_cpu_read(trace_buffered_event) == event) {
797 /* Length is in event->array[0] */
798 ring_buffer_write(buffer, event->array[0], &event->array[1]);
799 /* Release the temp buffer */
800 this_cpu_dec(trace_buffered_event_cnt);
801 } else
802 ring_buffer_unlock_commit(buffer, event);
803}
804
805/**
806 * __trace_puts - write a constant string into the trace buffer.
807 * @ip: The address of the caller
808 * @str: The constant string to write
809 * @size: The size of the string.
810 */
811int __trace_puts(unsigned long ip, const char *str, int size)
812{
813 struct ring_buffer_event *event;
814 struct ring_buffer *buffer;
815 struct print_entry *entry;
816 unsigned long irq_flags;
817 int alloc;
818 int pc;
819
820 if (!(global_trace.trace_flags & TRACE_ITER_PRINTK))
821 return 0;
822
823 pc = preempt_count();
824
825 if (unlikely(tracing_selftest_running || tracing_disabled))
826 return 0;
827
828 alloc = sizeof(*entry) + size + 2; /* possible \n added */
829
830 local_save_flags(irq_flags);
831 buffer = global_trace.trace_buffer.buffer;
832 event = __trace_buffer_lock_reserve(buffer, TRACE_PRINT, alloc,
833 irq_flags, pc);
834 if (!event)
835 return 0;
836
837 entry = ring_buffer_event_data(event);
838 entry->ip = ip;
839
840 memcpy(&entry->buf, str, size);
841
842 /* Add a newline if necessary */
843 if (entry->buf[size - 1] != '\n') {
844 entry->buf[size] = '\n';
845 entry->buf[size + 1] = '\0';
846 } else
847 entry->buf[size] = '\0';
848
849 __buffer_unlock_commit(buffer, event);
850 ftrace_trace_stack(&global_trace, buffer, irq_flags, 4, pc, NULL);
851
852 return size;
853}
854EXPORT_SYMBOL_GPL(__trace_puts);
855
856/**
857 * __trace_bputs - write the pointer to a constant string into trace buffer
858 * @ip: The address of the caller
859 * @str: The constant string to write to the buffer to
860 */
861int __trace_bputs(unsigned long ip, const char *str)
862{
863 struct ring_buffer_event *event;
864 struct ring_buffer *buffer;
865 struct bputs_entry *entry;
866 unsigned long irq_flags;
867 int size = sizeof(struct bputs_entry);
868 int pc;
869
870 if (!(global_trace.trace_flags & TRACE_ITER_PRINTK))
871 return 0;
872
873 pc = preempt_count();
874
875 if (unlikely(tracing_selftest_running || tracing_disabled))
876 return 0;
877
878 local_save_flags(irq_flags);
879 buffer = global_trace.trace_buffer.buffer;
880 event = __trace_buffer_lock_reserve(buffer, TRACE_BPUTS, size,
881 irq_flags, pc);
882 if (!event)
883 return 0;
884
885 entry = ring_buffer_event_data(event);
886 entry->ip = ip;
887 entry->str = str;
888
889 __buffer_unlock_commit(buffer, event);
890 ftrace_trace_stack(&global_trace, buffer, irq_flags, 4, pc, NULL);
891
892 return 1;
893}
894EXPORT_SYMBOL_GPL(__trace_bputs);
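
/*
 * Note: both of the above are normally reached through the trace_puts()
 * helper, which (roughly) selects __trace_bputs() when the string is a
 * compile-time constant and falls back to __trace_puts() otherwise.
 */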
895
896#ifdef CONFIG_TRACER_SNAPSHOT
897void tracing_snapshot_instance_cond(struct trace_array *tr, void *cond_data)
898{
899 struct tracer *tracer = tr->current_trace;
900 unsigned long flags;
901
902 if (in_nmi()) {
903 internal_trace_puts("*** SNAPSHOT CALLED FROM NMI CONTEXT ***\n");
904 internal_trace_puts("*** snapshot is being ignored ***\n");
905 return;
906 }
907
908 if (!tr->allocated_snapshot) {
909 internal_trace_puts("*** SNAPSHOT NOT ALLOCATED ***\n");
910 internal_trace_puts("*** stopping trace here! ***\n");
911 tracing_off();
912 return;
913 }
914
	/* Note, the snapshot cannot be used while the current tracer uses it */
916 if (tracer->use_max_tr) {
917 internal_trace_puts("*** LATENCY TRACER ACTIVE ***\n");
918 internal_trace_puts("*** Can not use snapshot (sorry) ***\n");
919 return;
920 }
921
922 local_irq_save(flags);
923 update_max_tr(tr, current, smp_processor_id(), cond_data);
924 local_irq_restore(flags);
925}
926
927void tracing_snapshot_instance(struct trace_array *tr)
928{
929 tracing_snapshot_instance_cond(tr, NULL);
930}
931
932/**
933 * tracing_snapshot - take a snapshot of the current buffer.
934 *
935 * This causes a swap between the snapshot buffer and the current live
936 * tracing buffer. You can use this to take snapshots of the live
937 * trace when some condition is triggered, but continue to trace.
938 *
 * Note, make sure to allocate the snapshot either with
 * tracing_snapshot_alloc(), or manually with:
 * echo 1 > /sys/kernel/debug/tracing/snapshot
942 *
943 * If the snapshot buffer is not allocated, it will stop tracing.
944 * Basically making a permanent snapshot.
945 */
946void tracing_snapshot(void)
947{
948 struct trace_array *tr = &global_trace;
949
950 tracing_snapshot_instance(tr);
951}
952EXPORT_SYMBOL_GPL(tracing_snapshot);
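
/*
 * Illustrative usage: make sure the spare buffer exists (e.g. by calling
 * tracing_snapshot_alloc() from a context that may sleep), then call
 * tracing_snapshot() at the point of interest to preserve the trace leading
 * up to it while tracing continues in the live buffer.
 */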
953
954/**
955 * tracing_snapshot_cond - conditionally take a snapshot of the current buffer.
956 * @tr: The tracing instance to snapshot
957 * @cond_data: The data to be tested conditionally, and possibly saved
958 *
959 * This is the same as tracing_snapshot() except that the snapshot is
960 * conditional - the snapshot will only happen if the
961 * cond_snapshot.update() implementation receiving the cond_data
962 * returns true, which means that the trace array's cond_snapshot
963 * update() operation used the cond_data to determine whether the
964 * snapshot should be taken, and if it was, presumably saved it along
965 * with the snapshot.
966 */
967void tracing_snapshot_cond(struct trace_array *tr, void *cond_data)
968{
969 tracing_snapshot_instance_cond(tr, cond_data);
970}
971EXPORT_SYMBOL_GPL(tracing_snapshot_cond);
972
973/**
974 * tracing_snapshot_cond_data - get the user data associated with a snapshot
975 * @tr: The tracing instance
976 *
977 * When the user enables a conditional snapshot using
978 * tracing_snapshot_cond_enable(), the user-defined cond_data is saved
979 * with the snapshot. This accessor is used to retrieve it.
980 *
 * Should not be called from cond_snapshot.update(), since it takes
 * the tr->max_lock lock, which the code calling
 * cond_snapshot.update() has already taken.
984 *
985 * Returns the cond_data associated with the trace array's snapshot.
986 */
987void *tracing_cond_snapshot_data(struct trace_array *tr)
988{
989 void *cond_data = NULL;
990
991 arch_spin_lock(&tr->max_lock);
992
993 if (tr->cond_snapshot)
994 cond_data = tr->cond_snapshot->cond_data;
995
996 arch_spin_unlock(&tr->max_lock);
997
998 return cond_data;
999}
1000EXPORT_SYMBOL_GPL(tracing_cond_snapshot_data);
1001
1002static int resize_buffer_duplicate_size(struct trace_buffer *trace_buf,
1003 struct trace_buffer *size_buf, int cpu_id);
1004static void set_buffer_entries(struct trace_buffer *buf, unsigned long val);
1005
1006int tracing_alloc_snapshot_instance(struct trace_array *tr)
1007{
1008 int ret;
1009
1010 if (!tr->allocated_snapshot) {
1011
1012 /* allocate spare buffer */
1013 ret = resize_buffer_duplicate_size(&tr->max_buffer,
1014 &tr->trace_buffer, RING_BUFFER_ALL_CPUS);
1015 if (ret < 0)
1016 return ret;
1017
1018 tr->allocated_snapshot = true;
1019 }
1020
1021 return 0;
1022}
1023
1024static void free_snapshot(struct trace_array *tr)
1025{
1026 /*
	 * We don't free the ring buffer; instead, we resize it because
	 * the max_tr ring buffer has some state (e.g. ring->clock) and
	 * we want to preserve it.
1030 */
1031 ring_buffer_resize(tr->max_buffer.buffer, 1, RING_BUFFER_ALL_CPUS);
1032 set_buffer_entries(&tr->max_buffer, 1);
1033 tracing_reset_online_cpus(&tr->max_buffer);
1034 tr->allocated_snapshot = false;
1035}
1036
1037/**
1038 * tracing_alloc_snapshot - allocate snapshot buffer.
1039 *
1040 * This only allocates the snapshot buffer if it isn't already
1041 * allocated - it doesn't also take a snapshot.
1042 *
1043 * This is meant to be used in cases where the snapshot buffer needs
1044 * to be set up for events that can't sleep but need to be able to
1045 * trigger a snapshot.
1046 */
1047int tracing_alloc_snapshot(void)
1048{
1049 struct trace_array *tr = &global_trace;
1050 int ret;
1051
1052 ret = tracing_alloc_snapshot_instance(tr);
1053 WARN_ON(ret < 0);
1054
1055 return ret;
1056}
1057EXPORT_SYMBOL_GPL(tracing_alloc_snapshot);
1058
1059/**
1060 * tracing_snapshot_alloc - allocate and take a snapshot of the current buffer.
1061 *
1062 * This is similar to tracing_snapshot(), but it will allocate the
1063 * snapshot buffer if it isn't already allocated. Use this only
1064 * where it is safe to sleep, as the allocation may sleep.
1065 *
1066 * This causes a swap between the snapshot buffer and the current live
1067 * tracing buffer. You can use this to take snapshots of the live
1068 * trace when some condition is triggered, but continue to trace.
1069 */
1070void tracing_snapshot_alloc(void)
1071{
1072 int ret;
1073
1074 ret = tracing_alloc_snapshot();
1075 if (ret < 0)
1076 return;
1077
1078 tracing_snapshot();
1079}
1080EXPORT_SYMBOL_GPL(tracing_snapshot_alloc);
1081
1082/**
1083 * tracing_snapshot_cond_enable - enable conditional snapshot for an instance
1084 * @tr: The tracing instance
1085 * @cond_data: User data to associate with the snapshot
1086 * @update: Implementation of the cond_snapshot update function
1087 *
1088 * Check whether the conditional snapshot for the given instance has
1089 * already been enabled, or if the current tracer is already using a
1090 * snapshot; if so, return -EBUSY, else create a cond_snapshot and
1091 * save the cond_data and update function inside.
1092 *
1093 * Returns 0 if successful, error otherwise.
1094 */
1095int tracing_snapshot_cond_enable(struct trace_array *tr, void *cond_data,
1096 cond_update_fn_t update)
1097{
1098 struct cond_snapshot *cond_snapshot;
1099 int ret = 0;
1100
1101 cond_snapshot = kzalloc(sizeof(*cond_snapshot), GFP_KERNEL);
1102 if (!cond_snapshot)
1103 return -ENOMEM;
1104
1105 cond_snapshot->cond_data = cond_data;
1106 cond_snapshot->update = update;
1107
1108 mutex_lock(&trace_types_lock);
1109
1110 ret = tracing_alloc_snapshot_instance(tr);
1111 if (ret)
1112 goto fail_unlock;
1113
1114 if (tr->current_trace->use_max_tr) {
1115 ret = -EBUSY;
1116 goto fail_unlock;
1117 }
1118
1119 /*
1120 * The cond_snapshot can only change to NULL without the
1121 * trace_types_lock. We don't care if we race with it going
1122 * to NULL, but we want to make sure that it's not set to
1123 * something other than NULL when we get here, which we can
1124 * do safely with only holding the trace_types_lock and not
1125 * having to take the max_lock.
1126 */
1127 if (tr->cond_snapshot) {
1128 ret = -EBUSY;
1129 goto fail_unlock;
1130 }
1131
1132 arch_spin_lock(&tr->max_lock);
1133 tr->cond_snapshot = cond_snapshot;
1134 arch_spin_unlock(&tr->max_lock);
1135
1136 mutex_unlock(&trace_types_lock);
1137
1138 return ret;
1139
1140 fail_unlock:
1141 mutex_unlock(&trace_types_lock);
1142 kfree(cond_snapshot);
1143 return ret;
1144}
1145EXPORT_SYMBOL_GPL(tracing_snapshot_cond_enable);
1146
1147/**
1148 * tracing_snapshot_cond_disable - disable conditional snapshot for an instance
1149 * @tr: The tracing instance
1150 *
1151 * Check whether the conditional snapshot for the given instance is
1152 * enabled; if so, free the cond_snapshot associated with it,
1153 * otherwise return -EINVAL.
1154 *
1155 * Returns 0 if successful, error otherwise.
1156 */
1157int tracing_snapshot_cond_disable(struct trace_array *tr)
1158{
1159 int ret = 0;
1160
1161 arch_spin_lock(&tr->max_lock);
1162
1163 if (!tr->cond_snapshot)
1164 ret = -EINVAL;
1165 else {
1166 kfree(tr->cond_snapshot);
1167 tr->cond_snapshot = NULL;
1168 }
1169
1170 arch_spin_unlock(&tr->max_lock);
1171
1172 return ret;
1173}
1174EXPORT_SYMBOL_GPL(tracing_snapshot_cond_disable);
1175#else
1176void tracing_snapshot(void)
1177{
1178 WARN_ONCE(1, "Snapshot feature not enabled, but internal snapshot used");
1179}
1180EXPORT_SYMBOL_GPL(tracing_snapshot);
1181void tracing_snapshot_cond(struct trace_array *tr, void *cond_data)
1182{
1183 WARN_ONCE(1, "Snapshot feature not enabled, but internal conditional snapshot used");
1184}
1185EXPORT_SYMBOL_GPL(tracing_snapshot_cond);
1186int tracing_alloc_snapshot(void)
1187{
1188 WARN_ONCE(1, "Snapshot feature not enabled, but snapshot allocation used");
1189 return -ENODEV;
1190}
1191EXPORT_SYMBOL_GPL(tracing_alloc_snapshot);
1192void tracing_snapshot_alloc(void)
1193{
1194 /* Give warning */
1195 tracing_snapshot();
1196}
1197EXPORT_SYMBOL_GPL(tracing_snapshot_alloc);
1198void *tracing_cond_snapshot_data(struct trace_array *tr)
1199{
1200 return NULL;
1201}
1202EXPORT_SYMBOL_GPL(tracing_cond_snapshot_data);
1203int tracing_snapshot_cond_enable(struct trace_array *tr, void *cond_data, cond_update_fn_t update)
1204{
1205 return -ENODEV;
1206}
1207EXPORT_SYMBOL_GPL(tracing_snapshot_cond_enable);
1208int tracing_snapshot_cond_disable(struct trace_array *tr)
1209{
1210 return false;
1211}
1212EXPORT_SYMBOL_GPL(tracing_snapshot_cond_disable);
1213#endif /* CONFIG_TRACER_SNAPSHOT */
1214
1215void tracer_tracing_off(struct trace_array *tr)
1216{
1217 if (tr->trace_buffer.buffer)
1218 ring_buffer_record_off(tr->trace_buffer.buffer);
1219 /*
1220 * This flag is looked at when buffers haven't been allocated
1221 * yet, or by some tracers (like irqsoff), that just want to
1222 * know if the ring buffer has been disabled, but it can handle
	 * races where it gets disabled while we still do a record.
1224 * As the check is in the fast path of the tracers, it is more
1225 * important to be fast than accurate.
1226 */
1227 tr->buffer_disabled = 1;
1228 /* Make the flag seen by readers */
1229 smp_wmb();
1230}
1231
1232/**
1233 * tracing_off - turn off tracing buffers
1234 *
1235 * This function stops the tracing buffers from recording data.
1236 * It does not disable any overhead the tracers themselves may
1237 * be causing. This function simply causes all recording to
1238 * the ring buffers to fail.
1239 */
1240void tracing_off(void)
1241{
1242 tracer_tracing_off(&global_trace);
1243}
1244EXPORT_SYMBOL_GPL(tracing_off);
1245
1246void disable_trace_on_warning(void)
1247{
1248 if (__disable_trace_on_warning)
1249 tracing_off();
1250}
1251
1252/**
 * tracer_tracing_is_on - show the real state of the ring buffer
 * @tr: the trace array to check
 *
 * Shows the real state of the ring buffer, whether it is enabled or not.
1257 */
1258bool tracer_tracing_is_on(struct trace_array *tr)
1259{
1260 if (tr->trace_buffer.buffer)
1261 return ring_buffer_record_is_on(tr->trace_buffer.buffer);
1262 return !tr->buffer_disabled;
1263}
1264
1265/**
1266 * tracing_is_on - show state of ring buffers enabled
1267 */
1268int tracing_is_on(void)
1269{
1270 return tracer_tracing_is_on(&global_trace);
1271}
1272EXPORT_SYMBOL_GPL(tracing_is_on);
1273
1274static int __init set_buf_size(char *str)
1275{
1276 unsigned long buf_size;
1277
1278 if (!str)
1279 return 0;
1280 buf_size = memparse(str, &str);
1281 /* nr_entries can not be zero */
1282 if (buf_size == 0)
1283 return 0;
1284 trace_buf_size = buf_size;
1285 return 1;
1286}
1287__setup("trace_buf_size=", set_buf_size);
1288
1289static int __init set_tracing_thresh(char *str)
1290{
1291 unsigned long threshold;
1292 int ret;
1293
1294 if (!str)
1295 return 0;
1296 ret = kstrtoul(str, 0, &threshold);
1297 if (ret < 0)
1298 return 0;
1299 tracing_thresh = threshold * 1000;
1300 return 1;
1301}
1302__setup("tracing_thresh=", set_tracing_thresh);
1303
1304unsigned long nsecs_to_usecs(unsigned long nsecs)
1305{
1306 return nsecs / 1000;
1307}
1308
1309/*
1310 * TRACE_FLAGS is defined as a tuple matching bit masks with strings.
1311 * It uses C(a, b) where 'a' is the eval (enum) name and 'b' is the string that
1312 * matches it. By defining "C(a, b) b", TRACE_FLAGS becomes a list
1313 * of strings in the order that the evals (enum) were defined.
1314 */
1315#undef C
1316#define C(a, b) b
1317
/* These must match the bit positions in trace_iterator_flags */
1319static const char *trace_options[] = {
1320 TRACE_FLAGS
1321 NULL
1322};
1323
1324static struct {
1325 u64 (*func)(void);
1326 const char *name;
1327 int in_ns; /* is this clock in nanoseconds? */
1328} trace_clocks[] = {
1329 { trace_clock_local, "local", 1 },
1330 { trace_clock_global, "global", 1 },
1331 { trace_clock_counter, "counter", 0 },
1332 { trace_clock_jiffies, "uptime", 0 },
1333 { trace_clock, "perf", 1 },
1334 { ktime_get_mono_fast_ns, "mono", 1 },
1335 { ktime_get_raw_fast_ns, "mono_raw", 1 },
1336 { ktime_get_boot_fast_ns, "boot", 1 },
1337 ARCH_TRACE_CLOCKS
1338};
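
/*
 * Example (illustrative): booting with "trace_clock=mono" selects the
 * ktime_get_mono_fast_ns() based clock from the table above; the name is
 * stashed by set_trace_boot_clock() and applied later during tracing init.
 */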
1339
1340bool trace_clock_in_ns(struct trace_array *tr)
1341{
1342 if (trace_clocks[tr->clock_id].in_ns)
1343 return true;
1344
1345 return false;
1346}
1347
1348/*
1349 * trace_parser_get_init - gets the buffer for trace parser
1350 */
1351int trace_parser_get_init(struct trace_parser *parser, int size)
1352{
1353 memset(parser, 0, sizeof(*parser));
1354
1355 parser->buffer = kmalloc(size, GFP_KERNEL);
1356 if (!parser->buffer)
1357 return 1;
1358
1359 parser->size = size;
1360 return 0;
1361}
1362
1363/*
1364 * trace_parser_put - frees the buffer for trace parser
1365 */
1366void trace_parser_put(struct trace_parser *parser)
1367{
1368 kfree(parser->buffer);
1369 parser->buffer = NULL;
1370}
1371
1372/*
1373 * trace_get_user - reads the user input string separated by space
1374 * (matched by isspace(ch))
1375 *
1376 * For each string found the 'struct trace_parser' is updated,
1377 * and the function returns.
1378 *
1379 * Returns number of bytes read.
1380 *
1381 * See kernel/trace/trace.h for 'struct trace_parser' details.
1382 */
1383int trace_get_user(struct trace_parser *parser, const char __user *ubuf,
1384 size_t cnt, loff_t *ppos)
1385{
1386 char ch;
1387 size_t read = 0;
1388 ssize_t ret;
1389
1390 if (!*ppos)
1391 trace_parser_clear(parser);
1392
1393 ret = get_user(ch, ubuf++);
1394 if (ret)
1395 goto out;
1396
1397 read++;
1398 cnt--;
1399
1400 /*
	 * If the parser is not finished with the last write,
	 * continue reading the user input without skipping spaces.
1403 */
1404 if (!parser->cont) {
1405 /* skip white space */
1406 while (cnt && isspace(ch)) {
1407 ret = get_user(ch, ubuf++);
1408 if (ret)
1409 goto out;
1410 read++;
1411 cnt--;
1412 }
1413
1414 parser->idx = 0;
1415
1416 /* only spaces were written */
1417 if (isspace(ch) || !ch) {
1418 *ppos += read;
1419 ret = read;
1420 goto out;
1421 }
1422 }
1423
1424 /* read the non-space input */
1425 while (cnt && !isspace(ch) && ch) {
1426 if (parser->idx < parser->size - 1)
1427 parser->buffer[parser->idx++] = ch;
1428 else {
1429 ret = -EINVAL;
1430 goto out;
1431 }
1432 ret = get_user(ch, ubuf++);
1433 if (ret)
1434 goto out;
1435 read++;
1436 cnt--;
1437 }
1438
1439 /* We either got finished input or we have to wait for another call. */
1440 if (isspace(ch) || !ch) {
1441 parser->buffer[parser->idx] = 0;
1442 parser->cont = false;
1443 } else if (parser->idx < parser->size - 1) {
1444 parser->cont = true;
1445 parser->buffer[parser->idx++] = ch;
1446 /* Make sure the parsed string always terminates with '\0'. */
1447 parser->buffer[parser->idx] = 0;
1448 } else {
1449 ret = -EINVAL;
1450 goto out;
1451 }
1452
1453 *ppos += read;
1454 ret = read;
1455
1456out:
1457 return ret;
1458}
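
/*
 * Illustrative behaviour: if userspace writes "foo bar", the first call
 * fills parser->buffer with "foo" and a subsequent call returns "bar".
 * A write that ends mid-word sets parser->cont so the next call appends
 * to the same token instead of starting a new one.
 */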
1459
1460/* TODO add a seq_buf_to_buffer() */
1461static ssize_t trace_seq_to_buffer(struct trace_seq *s, void *buf, size_t cnt)
1462{
1463 int len;
1464
1465 if (trace_seq_used(s) <= s->seq.readpos)
1466 return -EBUSY;
1467
1468 len = trace_seq_used(s) - s->seq.readpos;
1469 if (cnt > len)
1470 cnt = len;
1471 memcpy(buf, s->buffer + s->seq.readpos, cnt);
1472
1473 s->seq.readpos += cnt;
1474 return cnt;
1475}
1476
1477unsigned long __read_mostly tracing_thresh;
1478
1479#ifdef CONFIG_TRACER_MAX_TRACE
1480/*
1481 * Copy the new maximum trace into the separate maximum-trace
1482 * structure. (this way the maximum trace is permanently saved,
1483 * for later retrieval via /sys/kernel/tracing/tracing_max_latency)
1484 */
1485static void
1486__update_max_tr(struct trace_array *tr, struct task_struct *tsk, int cpu)
1487{
1488 struct trace_buffer *trace_buf = &tr->trace_buffer;
1489 struct trace_buffer *max_buf = &tr->max_buffer;
1490 struct trace_array_cpu *data = per_cpu_ptr(trace_buf->data, cpu);
1491 struct trace_array_cpu *max_data = per_cpu_ptr(max_buf->data, cpu);
1492
1493 max_buf->cpu = cpu;
1494 max_buf->time_start = data->preempt_timestamp;
1495
1496 max_data->saved_latency = tr->max_latency;
1497 max_data->critical_start = data->critical_start;
1498 max_data->critical_end = data->critical_end;
1499
1500 strncpy(max_data->comm, tsk->comm, TASK_COMM_LEN);
1501 max_data->pid = tsk->pid;
1502 /*
1503 * If tsk == current, then use current_uid(), as that does not use
1504 * RCU. The irq tracer can be called out of RCU scope.
1505 */
1506 if (tsk == current)
1507 max_data->uid = current_uid();
1508 else
1509 max_data->uid = task_uid(tsk);
1510
1511 max_data->nice = tsk->static_prio - 20 - MAX_RT_PRIO;
1512 max_data->policy = tsk->policy;
1513 max_data->rt_priority = tsk->rt_priority;
1514
1515 /* record this tasks comm */
1516 tracing_record_cmdline(tsk);
1517}
1518
1519/**
1520 * update_max_tr - snapshot all trace buffers from global_trace to max_tr
1521 * @tr: tracer
1522 * @tsk: the task with the latency
1523 * @cpu: The cpu that initiated the trace.
1524 * @cond_data: User data associated with a conditional snapshot
1525 *
1526 * Flip the buffers between the @tr and the max_tr and record information
1527 * about which task was the cause of this latency.
1528 */
1529void
1530update_max_tr(struct trace_array *tr, struct task_struct *tsk, int cpu,
1531 void *cond_data)
1532{
1533 if (tr->stop_count)
1534 return;
1535
1536 WARN_ON_ONCE(!irqs_disabled());
1537
1538 if (!tr->allocated_snapshot) {
1539 /* Only the nop tracer should hit this when disabling */
1540 WARN_ON_ONCE(tr->current_trace != &nop_trace);
1541 return;
1542 }
1543
1544 arch_spin_lock(&tr->max_lock);
1545
1546 /* Inherit the recordable setting from trace_buffer */
1547 if (ring_buffer_record_is_set_on(tr->trace_buffer.buffer))
1548 ring_buffer_record_on(tr->max_buffer.buffer);
1549 else
1550 ring_buffer_record_off(tr->max_buffer.buffer);
1551
1552#ifdef CONFIG_TRACER_SNAPSHOT
1553 if (tr->cond_snapshot && !tr->cond_snapshot->update(tr, cond_data))
1554 goto out_unlock;
1555#endif
1556 swap(tr->trace_buffer.buffer, tr->max_buffer.buffer);
1557
1558 __update_max_tr(tr, tsk, cpu);
1559
1560 out_unlock:
1561 arch_spin_unlock(&tr->max_lock);
1562}
1563
1564/**
1565 * update_max_tr_single - only copy one trace over, and reset the rest
 * @tr: tracer
 * @tsk: task with the latency
 * @cpu: the cpu of the buffer to copy.
1569 *
1570 * Flip the trace of a single CPU buffer between the @tr and the max_tr.
1571 */
1572void
1573update_max_tr_single(struct trace_array *tr, struct task_struct *tsk, int cpu)
1574{
1575 int ret;
1576
1577 if (tr->stop_count)
1578 return;
1579
1580 WARN_ON_ONCE(!irqs_disabled());
1581 if (!tr->allocated_snapshot) {
1582 /* Only the nop tracer should hit this when disabling */
1583 WARN_ON_ONCE(tr->current_trace != &nop_trace);
1584 return;
1585 }
1586
1587 arch_spin_lock(&tr->max_lock);
1588
1589 ret = ring_buffer_swap_cpu(tr->max_buffer.buffer, tr->trace_buffer.buffer, cpu);
1590
1591 if (ret == -EBUSY) {
1592 /*
1593 * We failed to swap the buffer due to a commit taking
1594 * place on this CPU. We fail to record, but we reset
1595 * the max trace buffer (no one writes directly to it)
1596 * and flag that it failed.
1597 */
1598 trace_array_printk_buf(tr->max_buffer.buffer, _THIS_IP_,
1599 "Failed to swap buffers due to commit in progress\n");
1600 }
1601
1602 WARN_ON_ONCE(ret && ret != -EAGAIN && ret != -EBUSY);
1603
1604 __update_max_tr(tr, tsk, cpu);
1605 arch_spin_unlock(&tr->max_lock);
1606}
1607#endif /* CONFIG_TRACER_MAX_TRACE */
1608
1609static int wait_on_pipe(struct trace_iterator *iter, int full)
1610{
1611 /* Iterators are static, they should be filled or empty */
1612 if (trace_buffer_iter(iter, iter->cpu_file))
1613 return 0;
1614
1615 return ring_buffer_wait(iter->trace_buffer->buffer, iter->cpu_file,
1616 full);
1617}
1618
1619#ifdef CONFIG_FTRACE_STARTUP_TEST
1620static bool selftests_can_run;
1621
1622struct trace_selftests {
1623 struct list_head list;
1624 struct tracer *type;
1625};
1626
1627static LIST_HEAD(postponed_selftests);
1628
1629static int save_selftest(struct tracer *type)
1630{
1631 struct trace_selftests *selftest;
1632
1633 selftest = kmalloc(sizeof(*selftest), GFP_KERNEL);
1634 if (!selftest)
1635 return -ENOMEM;
1636
1637 selftest->type = type;
1638 list_add(&selftest->list, &postponed_selftests);
1639 return 0;
1640}
1641
1642static int run_tracer_selftest(struct tracer *type)
1643{
1644 struct trace_array *tr = &global_trace;
1645 struct tracer *saved_tracer = tr->current_trace;
1646 int ret;
1647
1648 if (!type->selftest || tracing_selftest_disabled)
1649 return 0;
1650
1651 /*
1652 * If a tracer registers early in boot up (before scheduling is
1653 * initialized and such), then do not run its selftests yet.
1654 * Instead, run it a little later in the boot process.
1655 */
1656 if (!selftests_can_run)
1657 return save_selftest(type);
1658
1659 /*
1660 * Run a selftest on this tracer.
1661 * Here we reset the trace buffer, and set the current
1662 * tracer to be this tracer. The tracer can then run some
1663 * internal tracing to verify that everything is in order.
1664 * If we fail, we do not register this tracer.
1665 */
1666 tracing_reset_online_cpus(&tr->trace_buffer);
1667
1668 tr->current_trace = type;
1669
1670#ifdef CONFIG_TRACER_MAX_TRACE
1671 if (type->use_max_tr) {
1672 /* If we expanded the buffers, make sure the max is expanded too */
1673 if (ring_buffer_expanded)
1674 ring_buffer_resize(tr->max_buffer.buffer, trace_buf_size,
1675 RING_BUFFER_ALL_CPUS);
1676 tr->allocated_snapshot = true;
1677 }
1678#endif
1679
1680 /* the test is responsible for initializing and enabling */
1681 pr_info("Testing tracer %s: ", type->name);
1682 ret = type->selftest(type, tr);
1683 /* the test is responsible for resetting too */
1684 tr->current_trace = saved_tracer;
1685 if (ret) {
1686 printk(KERN_CONT "FAILED!\n");
1687 /* Add the warning after printing 'FAILED' */
1688 WARN_ON(1);
1689 return -1;
1690 }
1691 /* Only reset on passing, to avoid touching corrupted buffers */
1692 tracing_reset_online_cpus(&tr->trace_buffer);
1693
1694#ifdef CONFIG_TRACER_MAX_TRACE
1695 if (type->use_max_tr) {
1696 tr->allocated_snapshot = false;
1697
1698 /* Shrink the max buffer again */
1699 if (ring_buffer_expanded)
1700 ring_buffer_resize(tr->max_buffer.buffer, 1,
1701 RING_BUFFER_ALL_CPUS);
1702 }
1703#endif
1704
1705 printk(KERN_CONT "PASSED\n");
1706 return 0;
1707}
1708
1709static __init int init_trace_selftests(void)
1710{
1711 struct trace_selftests *p, *n;
1712 struct tracer *t, **last;
1713 int ret;
1714
1715 selftests_can_run = true;
1716
1717 mutex_lock(&trace_types_lock);
1718
1719 if (list_empty(&postponed_selftests))
1720 goto out;
1721
1722 pr_info("Running postponed tracer tests:\n");
1723
1724 list_for_each_entry_safe(p, n, &postponed_selftests, list) {
1725 ret = run_tracer_selftest(p->type);
1726 /* If the test fails, then warn and remove from available_tracers */
1727 if (ret < 0) {
1728 WARN(1, "tracer: %s failed selftest, disabling\n",
1729 p->type->name);
1730 last = &trace_types;
1731 for (t = trace_types; t; t = t->next) {
1732 if (t == p->type) {
1733 *last = t->next;
1734 break;
1735 }
1736 last = &t->next;
1737 }
1738 }
1739 list_del(&p->list);
1740 kfree(p);
1741 }
1742
1743 out:
1744 mutex_unlock(&trace_types_lock);
1745
1746 return 0;
1747}
1748core_initcall(init_trace_selftests);
1749#else
1750static inline int run_tracer_selftest(struct tracer *type)
1751{
1752 return 0;
1753}
1754#endif /* CONFIG_FTRACE_STARTUP_TEST */
1755
1756static void add_tracer_options(struct trace_array *tr, struct tracer *t);
1757
1758static void __init apply_trace_boot_options(void);
1759
1760/**
1761 * register_tracer - register a tracer with the ftrace system.
 * @type: the plugin for the tracer
1763 *
1764 * Register a new plugin tracer.
1765 */
1766int __init register_tracer(struct tracer *type)
1767{
1768 struct tracer *t;
1769 int ret = 0;
1770
1771 if (!type->name) {
1772 pr_info("Tracer must have a name\n");
1773 return -1;
1774 }
1775
1776 if (strlen(type->name) >= MAX_TRACER_SIZE) {
1777 pr_info("Tracer has a name longer than %d\n", MAX_TRACER_SIZE);
1778 return -1;
1779 }
1780
1781 mutex_lock(&trace_types_lock);
1782
1783 tracing_selftest_running = true;
1784
1785 for (t = trace_types; t; t = t->next) {
1786 if (strcmp(type->name, t->name) == 0) {
1787 /* already found */
1788 pr_info("Tracer %s already registered\n",
1789 type->name);
1790 ret = -1;
1791 goto out;
1792 }
1793 }
1794
1795 if (!type->set_flag)
1796 type->set_flag = &dummy_set_flag;
1797 if (!type->flags) {
		/* allocate a dummy tracer_flags */
1799 type->flags = kmalloc(sizeof(*type->flags), GFP_KERNEL);
1800 if (!type->flags) {
1801 ret = -ENOMEM;
1802 goto out;
1803 }
1804 type->flags->val = 0;
1805 type->flags->opts = dummy_tracer_opt;
1806 } else
1807 if (!type->flags->opts)
1808 type->flags->opts = dummy_tracer_opt;
1809
1810 /* store the tracer for __set_tracer_option */
1811 type->flags->trace = type;
1812
1813 ret = run_tracer_selftest(type);
1814 if (ret < 0)
1815 goto out;
1816
1817 type->next = trace_types;
1818 trace_types = type;
1819 add_tracer_options(&global_trace, type);
1820
1821 out:
1822 tracing_selftest_running = false;
1823 mutex_unlock(&trace_types_lock);
1824
1825 if (ret || !default_bootup_tracer)
1826 goto out_unlock;
1827
1828 if (strncmp(default_bootup_tracer, type->name, MAX_TRACER_SIZE))
1829 goto out_unlock;
1830
1831 printk(KERN_INFO "Starting tracer '%s'\n", type->name);
1832 /* Do we want this tracer to start on bootup? */
1833 tracing_set_tracer(&global_trace, type->name);
1834 default_bootup_tracer = NULL;
1835
1836 apply_trace_boot_options();
1837
	/* disable other selftests, since this will break them. */
1839 tracing_selftest_disabled = true;
1840#ifdef CONFIG_FTRACE_STARTUP_TEST
1841 printk(KERN_INFO "Disabling FTRACE selftests due to running tracer '%s'\n",
1842 type->name);
1843#endif
1844
1845 out_unlock:
1846 return ret;
1847}
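
/*
 * Illustrative registration by a built-in tracer (a sketch, not taken from
 * any particular tracer):
 *
 *	static struct tracer foo_tracer __read_mostly = {
 *		.name	= "foo",
 *		.init	= foo_trace_init,
 *		.reset	= foo_trace_reset,
 *	};
 *
 *	static __init int init_foo_trace(void)
 *	{
 *		return register_tracer(&foo_tracer);
 *	}
 *	core_initcall(init_foo_trace);
 */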
1848
1849void tracing_reset(struct trace_buffer *buf, int cpu)
1850{
1851 struct ring_buffer *buffer = buf->buffer;
1852
1853 if (!buffer)
1854 return;
1855
1856 ring_buffer_record_disable(buffer);
1857
1858 /* Make sure all commits have finished */
1859 synchronize_rcu();
1860 ring_buffer_reset_cpu(buffer, cpu);
1861
1862 ring_buffer_record_enable(buffer);
1863}
1864
1865void tracing_reset_online_cpus(struct trace_buffer *buf)
1866{
1867 struct ring_buffer *buffer = buf->buffer;
1868 int cpu;
1869
1870 if (!buffer)
1871 return;
1872
1873 ring_buffer_record_disable(buffer);
1874
1875 /* Make sure all commits have finished */
1876 synchronize_rcu();
1877
1878 buf->time_start = buffer_ftrace_now(buf, buf->cpu);
1879
1880 for_each_online_cpu(cpu)
1881 ring_buffer_reset_cpu(buffer, cpu);
1882
1883 ring_buffer_record_enable(buffer);
1884}
1885
1886/* Must have trace_types_lock held */
1887void tracing_reset_all_online_cpus(void)
1888{
1889 struct trace_array *tr;
1890
1891 list_for_each_entry(tr, &ftrace_trace_arrays, list) {
1892 if (!tr->clear_trace)
1893 continue;
1894 tr->clear_trace = false;
1895 tracing_reset_online_cpus(&tr->trace_buffer);
1896#ifdef CONFIG_TRACER_MAX_TRACE
1897 tracing_reset_online_cpus(&tr->max_buffer);
1898#endif
1899 }
1900}
1901
1902static int *tgid_map;
1903
1904#define SAVED_CMDLINES_DEFAULT 128
1905#define NO_CMDLINE_MAP UINT_MAX
1906static arch_spinlock_t trace_cmdline_lock = __ARCH_SPIN_LOCK_UNLOCKED;
1907struct saved_cmdlines_buffer {
1908 unsigned map_pid_to_cmdline[PID_MAX_DEFAULT+1];
1909 unsigned *map_cmdline_to_pid;
1910 unsigned cmdline_num;
1911 int cmdline_idx;
1912 char *saved_cmdlines;
1913};
1914static struct saved_cmdlines_buffer *savedcmd;
1915
/* temporarily disable recording */
1917static atomic_t trace_record_taskinfo_disabled __read_mostly;
1918
1919static inline char *get_saved_cmdlines(int idx)
1920{
1921 return &savedcmd->saved_cmdlines[idx * TASK_COMM_LEN];
1922}
1923
1924static inline void set_cmdline(int idx, const char *cmdline)
1925{
1926 strncpy(get_saved_cmdlines(idx), cmdline, TASK_COMM_LEN);
1927}
1928
1929static int allocate_cmdlines_buffer(unsigned int val,
1930 struct saved_cmdlines_buffer *s)
1931{
1932 s->map_cmdline_to_pid = kmalloc_array(val,
1933 sizeof(*s->map_cmdline_to_pid),
1934 GFP_KERNEL);
1935 if (!s->map_cmdline_to_pid)
1936 return -ENOMEM;
1937
1938 s->saved_cmdlines = kmalloc_array(TASK_COMM_LEN, val, GFP_KERNEL);
1939 if (!s->saved_cmdlines) {
1940 kfree(s->map_cmdline_to_pid);
1941 return -ENOMEM;
1942 }
1943
1944 s->cmdline_idx = 0;
1945 s->cmdline_num = val;
1946 memset(&s->map_pid_to_cmdline, NO_CMDLINE_MAP,
1947 sizeof(s->map_pid_to_cmdline));
1948 memset(s->map_cmdline_to_pid, NO_CMDLINE_MAP,
1949 val * sizeof(*s->map_cmdline_to_pid));
1950
1951 return 0;
1952}
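
/*
 * Note: the memset() calls above work byte-wise, which is fine here because
 * NO_CMDLINE_MAP is UINT_MAX: every byte is 0xff, so each entry still ends
 * up as the intended all-ones value.
 */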
1953
1954static int trace_create_savedcmd(void)
1955{
1956 int ret;
1957
1958 savedcmd = kmalloc(sizeof(*savedcmd), GFP_KERNEL);
1959 if (!savedcmd)
1960 return -ENOMEM;
1961
1962 ret = allocate_cmdlines_buffer(SAVED_CMDLINES_DEFAULT, savedcmd);
1963 if (ret < 0) {
1964 kfree(savedcmd);
1965 savedcmd = NULL;
1966 return -ENOMEM;
1967 }
1968
1969 return 0;
1970}
1971
1972int is_tracing_stopped(void)
1973{
1974 return global_trace.stop_count;
1975}
1976
1977/**
1978 * tracing_start - quick start of the tracer
1979 *
1980 * If tracing is enabled but was stopped by tracing_stop,
1981 * this will start the tracer back up.
1982 */
1983void tracing_start(void)
1984{
1985 struct ring_buffer *buffer;
1986 unsigned long flags;
1987
1988 if (tracing_disabled)
1989 return;
1990
1991 raw_spin_lock_irqsave(&global_trace.start_lock, flags);
1992 if (--global_trace.stop_count) {
1993 if (global_trace.stop_count < 0) {
1994 /* Someone screwed up their debugging */
1995 WARN_ON_ONCE(1);
1996 global_trace.stop_count = 0;
1997 }
1998 goto out;
1999 }
2000
2001 /* Prevent the buffers from switching */
2002 arch_spin_lock(&global_trace.max_lock);
2003
2004 buffer = global_trace.trace_buffer.buffer;
2005 if (buffer)
2006 ring_buffer_record_enable(buffer);
2007
2008#ifdef CONFIG_TRACER_MAX_TRACE
2009 buffer = global_trace.max_buffer.buffer;
2010 if (buffer)
2011 ring_buffer_record_enable(buffer);
2012#endif
2013
2014 arch_spin_unlock(&global_trace.max_lock);
2015
2016 out:
2017 raw_spin_unlock_irqrestore(&global_trace.start_lock, flags);
2018}
2019
2020static void tracing_start_tr(struct trace_array *tr)
2021{
2022 struct ring_buffer *buffer;
2023 unsigned long flags;
2024
2025 if (tracing_disabled)
2026 return;
2027
2028 /* If global, we need to also start the max tracer */
2029 if (tr->flags & TRACE_ARRAY_FL_GLOBAL)
2030 return tracing_start();
2031
2032 raw_spin_lock_irqsave(&tr->start_lock, flags);
2033
2034 if (--tr->stop_count) {
2035 if (tr->stop_count < 0) {
2036 /* Someone screwed up their debugging */
2037 WARN_ON_ONCE(1);
2038 tr->stop_count = 0;
2039 }
2040 goto out;
2041 }
2042
2043 buffer = tr->trace_buffer.buffer;
2044 if (buffer)
2045 ring_buffer_record_enable(buffer);
2046
2047 out:
2048 raw_spin_unlock_irqrestore(&tr->start_lock, flags);
2049}
2050
2051/**
2052 * tracing_stop - quick stop of the tracer
2053 *
2054 * Lightweight way to stop tracing. Use in conjunction with
2055 * tracing_start.
2056 */
2057void tracing_stop(void)
2058{
2059 struct ring_buffer *buffer;
2060 unsigned long flags;
2061
2062 raw_spin_lock_irqsave(&global_trace.start_lock, flags);
2063 if (global_trace.stop_count++)
2064 goto out;
2065
2066 /* Prevent the buffers from switching */
2067 arch_spin_lock(&global_trace.max_lock);
2068
2069 buffer = global_trace.trace_buffer.buffer;
2070 if (buffer)
2071 ring_buffer_record_disable(buffer);
2072
2073#ifdef CONFIG_TRACER_MAX_TRACE
2074 buffer = global_trace.max_buffer.buffer;
2075 if (buffer)
2076 ring_buffer_record_disable(buffer);
2077#endif
2078
2079 arch_spin_unlock(&global_trace.max_lock);
2080
2081 out:
2082 raw_spin_unlock_irqrestore(&global_trace.start_lock, flags);
2083}
2084
2085static void tracing_stop_tr(struct trace_array *tr)
2086{
2087 struct ring_buffer *buffer;
2088 unsigned long flags;
2089
2090 /* If global, we need to also stop the max tracer */
2091 if (tr->flags & TRACE_ARRAY_FL_GLOBAL)
2092 return tracing_stop();
2093
2094 raw_spin_lock_irqsave(&tr->start_lock, flags);
2095 if (tr->stop_count++)
2096 goto out;
2097
2098 buffer = tr->trace_buffer.buffer;
2099 if (buffer)
2100 ring_buffer_record_disable(buffer);
2101
2102 out:
2103 raw_spin_unlock_irqrestore(&tr->start_lock, flags);
2104}
2105
2106static int trace_save_cmdline(struct task_struct *tsk)
2107{
2108 unsigned pid, idx;
2109
2110 /* treat recording of idle task as a success */
2111 if (!tsk->pid)
2112 return 1;
2113
2114 if (unlikely(tsk->pid > PID_MAX_DEFAULT))
2115 return 0;
2116
2117 /*
2118 * It's not the end of the world if we don't get
2119 * the lock, but we also don't want to spin
2120 * nor do we want to disable interrupts,
2121 * so if we miss here, then better luck next time.
2122 */
2123 if (!arch_spin_trylock(&trace_cmdline_lock))
2124 return 0;
2125
2126 idx = savedcmd->map_pid_to_cmdline[tsk->pid];
2127 if (idx == NO_CMDLINE_MAP) {
2128 idx = (savedcmd->cmdline_idx + 1) % savedcmd->cmdline_num;
2129
2130 /*
2131 * Check whether the cmdline buffer at idx has a pid
2132 * mapped. We are going to overwrite that entry so we
2133 * need to clear the map_pid_to_cmdline. Otherwise we
2134 * would read the new comm for the old pid.
2135 */
2136 pid = savedcmd->map_cmdline_to_pid[idx];
2137 if (pid != NO_CMDLINE_MAP)
2138 savedcmd->map_pid_to_cmdline[pid] = NO_CMDLINE_MAP;
2139
2140 savedcmd->map_cmdline_to_pid[idx] = tsk->pid;
2141 savedcmd->map_pid_to_cmdline[tsk->pid] = idx;
2142
2143 savedcmd->cmdline_idx = idx;
2144 }
2145
2146 set_cmdline(idx, tsk->comm);
2147
2148 arch_spin_unlock(&trace_cmdline_lock);
2149
2150 return 1;
2151}
2152
2153static void __trace_find_cmdline(int pid, char comm[])
2154{
2155 unsigned map;
2156
2157 if (!pid) {
2158 strcpy(comm, "<idle>");
2159 return;
2160 }
2161
2162 if (WARN_ON_ONCE(pid < 0)) {
2163 strcpy(comm, "<XXX>");
2164 return;
2165 }
2166
2167 if (pid > PID_MAX_DEFAULT) {
2168 strcpy(comm, "<...>");
2169 return;
2170 }
2171
2172 map = savedcmd->map_pid_to_cmdline[pid];
2173 if (map != NO_CMDLINE_MAP)
2174 strlcpy(comm, get_saved_cmdlines(map), TASK_COMM_LEN);
2175 else
2176 strcpy(comm, "<...>");
2177}
2178
2179void trace_find_cmdline(int pid, char comm[])
2180{
2181 preempt_disable();
2182 arch_spin_lock(&trace_cmdline_lock);
2183
2184 __trace_find_cmdline(pid, comm);
2185
2186 arch_spin_unlock(&trace_cmdline_lock);
2187 preempt_enable();
2188}
2189
2190int trace_find_tgid(int pid)
2191{
2192 if (unlikely(!tgid_map || !pid || pid > PID_MAX_DEFAULT))
2193 return 0;
2194
2195 return tgid_map[pid];
2196}
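
/*
 * Illustrative sketch (not part of the original file, kept out of the
 * build with #if 0; the function name is hypothetical): how the two
 * lookup helpers above are typically used together when rendering an
 * event.  trace_find_cmdline() fills in the cached comm (or "<...>" if
 * the pid was never recorded) and trace_find_tgid() returns 0 when no
 * tgid was saved.
 */
#if 0
static void example_print_task(struct trace_seq *s, int pid)
{
	char comm[TASK_COMM_LEN];
	int tgid = trace_find_tgid(pid);

	trace_find_cmdline(pid, comm);
	trace_seq_printf(s, "%16s-%-5d (%5d)", comm, pid, tgid ? tgid : pid);
}
#endif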
2197
2198static int trace_save_tgid(struct task_struct *tsk)
2199{
2200 /* treat recording of idle task as a success */
2201 if (!tsk->pid)
2202 return 1;
2203
2204 if (unlikely(!tgid_map || tsk->pid > PID_MAX_DEFAULT))
2205 return 0;
2206
2207 tgid_map[tsk->pid] = tsk->tgid;
2208 return 1;
2209}
2210
2211static bool tracing_record_taskinfo_skip(int flags)
2212{
2213 if (unlikely(!(flags & (TRACE_RECORD_CMDLINE | TRACE_RECORD_TGID))))
2214 return true;
2215 if (atomic_read(&trace_record_taskinfo_disabled) || !tracing_is_on())
2216 return true;
2217 if (!__this_cpu_read(trace_taskinfo_save))
2218 return true;
2219 return false;
2220}
2221
2222/**
2223 * tracing_record_taskinfo - record the task info of a task
2224 *
2225 * @task: task to record
2226 * @flags: TRACE_RECORD_CMDLINE for recording comm
2227 *         TRACE_RECORD_TGID for recording tgid
2228 */
2229void tracing_record_taskinfo(struct task_struct *task, int flags)
2230{
2231 bool done;
2232
2233 if (tracing_record_taskinfo_skip(flags))
2234 return;
2235
2236 /*
2237 * Record as much task information as possible. If some fail, continue
2238 * to try to record the others.
2239 */
2240 done = !(flags & TRACE_RECORD_CMDLINE) || trace_save_cmdline(task);
2241 done &= !(flags & TRACE_RECORD_TGID) || trace_save_tgid(task);
2242
2243 /* If recording any information failed, retry again soon. */
2244 if (!done)
2245 return;
2246
2247 __this_cpu_write(trace_taskinfo_save, false);
2248}
2249
2250/**
2251 * tracing_record_taskinfo_sched_switch - record task info for sched_switch
2252 *
2253 * @prev: previous task during sched_switch
2254 * @next: next task during sched_switch
2255 * @flags: TRACE_RECORD_CMDLINE for recording comm
2256 *         TRACE_RECORD_TGID for recording tgid
2257 */
2258void tracing_record_taskinfo_sched_switch(struct task_struct *prev,
2259 struct task_struct *next, int flags)
2260{
2261 bool done;
2262
2263 if (tracing_record_taskinfo_skip(flags))
2264 return;
2265
2266 /*
2267 * Record as much task information as possible. If some fail, continue
2268 * to try to record the others.
2269 */
2270 done = !(flags & TRACE_RECORD_CMDLINE) || trace_save_cmdline(prev);
2271 done &= !(flags & TRACE_RECORD_CMDLINE) || trace_save_cmdline(next);
2272 done &= !(flags & TRACE_RECORD_TGID) || trace_save_tgid(prev);
2273 done &= !(flags & TRACE_RECORD_TGID) || trace_save_tgid(next);
2274
2275 /* If recording any information failed, retry again soon. */
2276 if (!done)
2277 return;
2278
2279 __this_cpu_write(trace_taskinfo_save, false);
2280}
2281
2282/* Helpers to record a specific task information */
2283void tracing_record_cmdline(struct task_struct *task)
2284{
2285 tracing_record_taskinfo(task, TRACE_RECORD_CMDLINE);
2286}
2287
2288void tracing_record_tgid(struct task_struct *task)
2289{
2290 tracing_record_taskinfo(task, TRACE_RECORD_TGID);
2291}
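
/*
 * Illustrative sketch (hypothetical probe, kept out of the build with
 * #if 0): recording both pieces of task info in one call, so that later
 * trace output can resolve the pid again via trace_find_cmdline() and
 * trace_find_tgid().
 */
#if 0
static void example_record_task(struct task_struct *p)
{
	tracing_record_taskinfo(p, TRACE_RECORD_CMDLINE | TRACE_RECORD_TGID);
}
#endif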
2292
2293/*
2294 * Several functions return TRACE_TYPE_PARTIAL_LINE if the trace_seq
2295 * overflowed, and TRACE_TYPE_HANDLED otherwise. This helper function
2296 * simplifies those functions and keeps them in sync.
2297 */
2298enum print_line_t trace_handle_return(struct trace_seq *s)
2299{
2300 return trace_seq_has_overflowed(s) ?
2301 TRACE_TYPE_PARTIAL_LINE : TRACE_TYPE_HANDLED;
2302}
2303EXPORT_SYMBOL_GPL(trace_handle_return);
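
/*
 * Illustrative sketch (hypothetical output callback, kept out of the
 * build with #if 0): the usual way trace_handle_return() is used at the
 * end of a trace_event output function, folding the trace_seq overflow
 * check into the return value.
 */
#if 0
static enum print_line_t example_event_output(struct trace_iterator *iter,
					      int flags,
					      struct trace_event *event)
{
	struct trace_seq *s = &iter->seq;

	trace_seq_printf(s, "example event on cpu %d\n", iter->cpu);

	return trace_handle_return(s);
}
#endif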
2304
2305void
2306tracing_generic_entry_update(struct trace_entry *entry, unsigned long flags,
2307 int pc)
2308{
2309 struct task_struct *tsk = current;
2310
2311 entry->preempt_count = pc & 0xff;
2312 entry->pid = (tsk) ? tsk->pid : 0;
2313 entry->flags =
2314#ifdef CONFIG_TRACE_IRQFLAGS_SUPPORT
2315 (irqs_disabled_flags(flags) ? TRACE_FLAG_IRQS_OFF : 0) |
2316#else
2317 TRACE_FLAG_IRQS_NOSUPPORT |
2318#endif
2319 ((pc & NMI_MASK ) ? TRACE_FLAG_NMI : 0) |
2320 ((pc & HARDIRQ_MASK) ? TRACE_FLAG_HARDIRQ : 0) |
2321 ((pc & SOFTIRQ_OFFSET) ? TRACE_FLAG_SOFTIRQ : 0) |
2322 (tif_need_resched() ? TRACE_FLAG_NEED_RESCHED : 0) |
2323 (test_preempt_need_resched() ? TRACE_FLAG_PREEMPT_RESCHED : 0);
2324}
2325EXPORT_SYMBOL_GPL(tracing_generic_entry_update);
2326
2327struct ring_buffer_event *
2328trace_buffer_lock_reserve(struct ring_buffer *buffer,
2329 int type,
2330 unsigned long len,
2331 unsigned long flags, int pc)
2332{
2333 return __trace_buffer_lock_reserve(buffer, type, len, flags, pc);
2334}
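
/*
 * Illustrative sketch (hypothetical function, kept out of the build with
 * #if 0): the reserve / fill / commit pattern that
 * trace_buffer_lock_reserve() is part of.  trace_function() further down
 * does the same thing, with filter checking and ftrace_exports() added.
 */
#if 0
static void example_write_fn_entry(struct trace_array *tr, unsigned long ip,
				   unsigned long parent_ip,
				   unsigned long flags, int pc)
{
	struct ring_buffer *buffer = tr->trace_buffer.buffer;
	struct ring_buffer_event *event;
	struct ftrace_entry *entry;

	event = trace_buffer_lock_reserve(buffer, TRACE_FN, sizeof(*entry),
					  flags, pc);
	if (!event)
		return;

	entry = ring_buffer_event_data(event);
	entry->ip = ip;
	entry->parent_ip = parent_ip;

	/* trace_buffer_unlock_commit_nostack() is defined further down */
	trace_buffer_unlock_commit_nostack(buffer, event);
}
#endif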
2335
2336DEFINE_PER_CPU(struct ring_buffer_event *, trace_buffered_event);
2337DEFINE_PER_CPU(int, trace_buffered_event_cnt);
2338static int trace_buffered_event_ref;
2339
2340/**
2341 * trace_buffered_event_enable - enable buffering events
2342 *
2343 * When events are being filtered, it is quicker to use a temporary
2344 * buffer to write the event data into if there's a likely chance
2345 * that it will not be committed. Discarding an already reserved
2346 * event from the ring buffer is not as fast as committing it, and
2347 * is much slower than copying the data and committing in one shot.
2348 *
2349 * When an event is to be filtered, per-CPU buffers are allocated to
2350 * write the event data into. If the event is then filtered and
2351 * discarded, it is simply dropped; otherwise, the entire data is
2352 * committed to the ring buffer in one shot.
2353 */
2354void trace_buffered_event_enable(void)
2355{
2356 struct ring_buffer_event *event;
2357 struct page *page;
2358 int cpu;
2359
2360 WARN_ON_ONCE(!mutex_is_locked(&event_mutex));
2361
2362 if (trace_buffered_event_ref++)
2363 return;
2364
2365 for_each_tracing_cpu(cpu) {
2366 page = alloc_pages_node(cpu_to_node(cpu),
2367 GFP_KERNEL | __GFP_NORETRY, 0);
2368 if (!page)
2369 goto failed;
2370
2371 event = page_address(page);
2372 memset(event, 0, sizeof(*event));
2373
2374 per_cpu(trace_buffered_event, cpu) = event;
2375
2376 preempt_disable();
2377 if (cpu == smp_processor_id() &&
2378 this_cpu_read(trace_buffered_event) !=
2379 per_cpu(trace_buffered_event, cpu))
2380 WARN_ON_ONCE(1);
2381 preempt_enable();
2382 }
2383
2384 return;
2385 failed:
2386 trace_buffered_event_disable();
2387}
2388
2389static void enable_trace_buffered_event(void *data)
2390{
2391 /* Probably not needed, but do it anyway */
2392 smp_rmb();
2393 this_cpu_dec(trace_buffered_event_cnt);
2394}
2395
2396static void disable_trace_buffered_event(void *data)
2397{
2398 this_cpu_inc(trace_buffered_event_cnt);
2399}
2400
2401/**
2402 * trace_buffered_event_disable - disable buffering events
2403 *
2404 * When a filter is removed, it is faster to not use the buffered
2405 * events, and to commit directly into the ring buffer. Free up
2406 * the temp buffers when there are no more users. This requires
2407 * special synchronization with current events.
2408 */
2409void trace_buffered_event_disable(void)
2410{
2411 int cpu;
2412
2413 WARN_ON_ONCE(!mutex_is_locked(&event_mutex));
2414
2415 if (WARN_ON_ONCE(!trace_buffered_event_ref))
2416 return;
2417
2418 if (--trace_buffered_event_ref)
2419 return;
2420
2421 preempt_disable();
2422 /* For each CPU, set the buffer as used. */
2423 smp_call_function_many(tracing_buffer_mask,
2424 disable_trace_buffered_event, NULL, 1);
2425 preempt_enable();
2426
2427 /* Wait for all current users to finish */
2428 synchronize_rcu();
2429
2430 for_each_tracing_cpu(cpu) {
2431 free_page((unsigned long)per_cpu(trace_buffered_event, cpu));
2432 per_cpu(trace_buffered_event, cpu) = NULL;
2433 }
2434 /*
2435 * Make sure trace_buffered_event is NULL before clearing
2436 * trace_buffered_event_cnt.
2437 */
2438 smp_wmb();
2439
2440 preempt_disable();
2441 /* Do the work on each cpu */
2442 smp_call_function_many(tracing_buffer_mask,
2443 enable_trace_buffered_event, NULL, 1);
2444 preempt_enable();
2445}
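
/*
 * Illustrative sketch (hypothetical helpers, kept out of the build with
 * #if 0) of the calling convention expected by the two functions above:
 * both are ref-counted and must be called with event_mutex held,
 * typically when an event filter is added or removed.
 */
#if 0
static void example_filter_added(void)
{
	mutex_lock(&event_mutex);
	trace_buffered_event_enable();	/* allocates per-CPU pages on first user */
	mutex_unlock(&event_mutex);
}

static void example_filter_removed(void)
{
	mutex_lock(&event_mutex);
	trace_buffered_event_disable();	/* frees the pages on the last user */
	mutex_unlock(&event_mutex);
}
#endif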
2446
2447static struct ring_buffer *temp_buffer;
2448
2449struct ring_buffer_event *
2450trace_event_buffer_lock_reserve(struct ring_buffer **current_rb,
2451 struct trace_event_file *trace_file,
2452 int type, unsigned long len,
2453 unsigned long flags, int pc)
2454{
2455 struct ring_buffer_event *entry;
2456 int val;
2457
2458 *current_rb = trace_file->tr->trace_buffer.buffer;
2459
2460 if (!ring_buffer_time_stamp_abs(*current_rb) && (trace_file->flags &
2461 (EVENT_FILE_FL_SOFT_DISABLED | EVENT_FILE_FL_FILTERED)) &&
2462 (entry = this_cpu_read(trace_buffered_event))) {
2463 /* Try to use the per cpu buffer first */
2464 val = this_cpu_inc_return(trace_buffered_event_cnt);
2465 if (val == 1) {
2466 trace_event_setup(entry, type, flags, pc);
2467 entry->array[0] = len;
2468 return entry;
2469 }
2470 this_cpu_dec(trace_buffered_event_cnt);
2471 }
2472
2473 entry = __trace_buffer_lock_reserve(*current_rb,
2474 type, len, flags, pc);
2475 /*
2476	 * If tracing is off, but we have triggers enabled,
2477	 * we still need to look at the event data. Use the temp_buffer
2478	 * to store the trace event for the trigger to use. It is recursion
2479	 * safe and will not be recorded anywhere.
2480 */
2481 if (!entry && trace_file->flags & EVENT_FILE_FL_TRIGGER_COND) {
2482 *current_rb = temp_buffer;
2483 entry = __trace_buffer_lock_reserve(*current_rb,
2484 type, len, flags, pc);
2485 }
2486 return entry;
2487}
2488EXPORT_SYMBOL_GPL(trace_event_buffer_lock_reserve);
2489
2490static DEFINE_SPINLOCK(tracepoint_iter_lock);
2491static DEFINE_MUTEX(tracepoint_printk_mutex);
2492
2493static void output_printk(struct trace_event_buffer *fbuffer)
2494{
2495 struct trace_event_call *event_call;
2496 struct trace_event *event;
2497 unsigned long flags;
2498 struct trace_iterator *iter = tracepoint_print_iter;
2499
2500 /* We should never get here if iter is NULL */
2501 if (WARN_ON_ONCE(!iter))
2502 return;
2503
2504 event_call = fbuffer->trace_file->event_call;
2505 if (!event_call || !event_call->event.funcs ||
2506 !event_call->event.funcs->trace)
2507 return;
2508
2509 event = &fbuffer->trace_file->event_call->event;
2510
2511 spin_lock_irqsave(&tracepoint_iter_lock, flags);
2512 trace_seq_init(&iter->seq);
2513 iter->ent = fbuffer->entry;
2514 event_call->event.funcs->trace(iter, 0, event);
2515 trace_seq_putc(&iter->seq, 0);
2516 printk("%s", iter->seq.buffer);
2517
2518 spin_unlock_irqrestore(&tracepoint_iter_lock, flags);
2519}
2520
2521int tracepoint_printk_sysctl(struct ctl_table *table, int write,
2522 void __user *buffer, size_t *lenp,
2523 loff_t *ppos)
2524{
2525 int save_tracepoint_printk;
2526 int ret;
2527
2528 mutex_lock(&tracepoint_printk_mutex);
2529 save_tracepoint_printk = tracepoint_printk;
2530
2531 ret = proc_dointvec(table, write, buffer, lenp, ppos);
2532
2533 /*
2534	 * This will force an early exit, as tracepoint_printk
2535	 * is always zero when tracepoint_print_iter is not allocated.
2536 */
2537 if (!tracepoint_print_iter)
2538 tracepoint_printk = 0;
2539
2540 if (save_tracepoint_printk == tracepoint_printk)
2541 goto out;
2542
2543 if (tracepoint_printk)
2544 static_key_enable(&tracepoint_printk_key.key);
2545 else
2546 static_key_disable(&tracepoint_printk_key.key);
2547
2548 out:
2549 mutex_unlock(&tracepoint_printk_mutex);
2550
2551 return ret;
2552}
2553
2554void trace_event_buffer_commit(struct trace_event_buffer *fbuffer)
2555{
2556 if (static_key_false(&tracepoint_printk_key.key))
2557 output_printk(fbuffer);
2558
2559 event_trigger_unlock_commit(fbuffer->trace_file, fbuffer->buffer,
2560 fbuffer->event, fbuffer->entry,
2561 fbuffer->flags, fbuffer->pc);
2562}
2563EXPORT_SYMBOL_GPL(trace_event_buffer_commit);
2564
2565/*
2566 * Skip 3:
2567 *
2568 * trace_buffer_unlock_commit_regs()
2569 * trace_event_buffer_commit()
2570 * trace_event_raw_event_xxx()
2571 */
2572# define STACK_SKIP 3
2573
2574void trace_buffer_unlock_commit_regs(struct trace_array *tr,
2575 struct ring_buffer *buffer,
2576 struct ring_buffer_event *event,
2577 unsigned long flags, int pc,
2578 struct pt_regs *regs)
2579{
2580 __buffer_unlock_commit(buffer, event);
2581
2582 /*
2583 * If regs is not set, then skip the necessary functions.
2584 * Note, we can still get here via blktrace, wakeup tracer
2585 * and mmiotrace, but that's ok if they lose a function or
2586 * two. They are not that meaningful.
2587 */
2588 ftrace_trace_stack(tr, buffer, flags, regs ? 0 : STACK_SKIP, pc, regs);
2589 ftrace_trace_userstack(buffer, flags, pc);
2590}
2591
2592/*
2593 * Similar to trace_buffer_unlock_commit_regs() but do not dump stack.
2594 */
2595void
2596trace_buffer_unlock_commit_nostack(struct ring_buffer *buffer,
2597 struct ring_buffer_event *event)
2598{
2599 __buffer_unlock_commit(buffer, event);
2600}
2601
2602static void
2603trace_process_export(struct trace_export *export,
2604 struct ring_buffer_event *event)
2605{
2606 struct trace_entry *entry;
2607 unsigned int size = 0;
2608
2609 entry = ring_buffer_event_data(event);
2610 size = ring_buffer_event_length(event);
2611 export->write(export, entry, size);
2612}
2613
2614static DEFINE_MUTEX(ftrace_export_lock);
2615
2616static struct trace_export __rcu *ftrace_exports_list __read_mostly;
2617
2618static DEFINE_STATIC_KEY_FALSE(ftrace_exports_enabled);
2619
2620static inline void ftrace_exports_enable(void)
2621{
2622 static_branch_enable(&ftrace_exports_enabled);
2623}
2624
2625static inline void ftrace_exports_disable(void)
2626{
2627 static_branch_disable(&ftrace_exports_enabled);
2628}
2629
2630static void ftrace_exports(struct ring_buffer_event *event)
2631{
2632 struct trace_export *export;
2633
2634 preempt_disable_notrace();
2635
2636 export = rcu_dereference_raw_notrace(ftrace_exports_list);
2637 while (export) {
2638 trace_process_export(export, event);
2639 export = rcu_dereference_raw_notrace(export->next);
2640 }
2641
2642 preempt_enable_notrace();
2643}
2644
2645static inline void
2646add_trace_export(struct trace_export **list, struct trace_export *export)
2647{
2648 rcu_assign_pointer(export->next, *list);
2649 /*
2650	 * We are adding export to the list, but another
2651	 * CPU might be walking that list. We need to make sure
2652	 * the export->next pointer is valid before another CPU sees
2653	 * the export pointer included in the list.
2654 */
2655 rcu_assign_pointer(*list, export);
2656}
2657
2658static inline int
2659rm_trace_export(struct trace_export **list, struct trace_export *export)
2660{
2661 struct trace_export **p;
2662
2663 for (p = list; *p != NULL; p = &(*p)->next)
2664 if (*p == export)
2665 break;
2666
2667 if (*p != export)
2668 return -1;
2669
2670 rcu_assign_pointer(*p, (*p)->next);
2671
2672 return 0;
2673}
2674
2675static inline void
2676add_ftrace_export(struct trace_export **list, struct trace_export *export)
2677{
2678 if (*list == NULL)
2679 ftrace_exports_enable();
2680
2681 add_trace_export(list, export);
2682}
2683
2684static inline int
2685rm_ftrace_export(struct trace_export **list, struct trace_export *export)
2686{
2687 int ret;
2688
2689 ret = rm_trace_export(list, export);
2690 if (*list == NULL)
2691 ftrace_exports_disable();
2692
2693 return ret;
2694}
2695
2696int register_ftrace_export(struct trace_export *export)
2697{
2698 if (WARN_ON_ONCE(!export->write))
2699 return -1;
2700
2701 mutex_lock(&ftrace_export_lock);
2702
2703 add_ftrace_export(&ftrace_exports_list, export);
2704
2705 mutex_unlock(&ftrace_export_lock);
2706
2707 return 0;
2708}
2709EXPORT_SYMBOL_GPL(register_ftrace_export);
2710
2711int unregister_ftrace_export(struct trace_export *export)
2712{
2713 int ret;
2714
2715 mutex_lock(&ftrace_export_lock);
2716
2717 ret = rm_ftrace_export(&ftrace_exports_list, export);
2718
2719 mutex_unlock(&ftrace_export_lock);
2720
2721 return ret;
2722}
2723EXPORT_SYMBOL_GPL(unregister_ftrace_export);
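
/*
 * Illustrative sketch (hypothetical module code, kept out of the build
 * with #if 0): a minimal trace_export client.  The ->write() callback
 * receives the raw binary trace entry and its length, exactly as passed
 * by trace_process_export() above; see include/linux/trace.h for the
 * authoritative prototype.
 */
#if 0
static void example_export_write(struct trace_export *export,
				 const void *entry, unsigned int size)
{
	pr_debug("exporting a trace entry of %u bytes\n", size);
}

static struct trace_export example_export = {
	.write	= example_export_write,
};

static int __init example_export_init(void)
{
	return register_ftrace_export(&example_export);
}

static void __exit example_export_exit(void)
{
	unregister_ftrace_export(&example_export);
}
#endif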
2724
2725void
2726trace_function(struct trace_array *tr,
2727 unsigned long ip, unsigned long parent_ip, unsigned long flags,
2728 int pc)
2729{
2730 struct trace_event_call *call = &event_function;
2731 struct ring_buffer *buffer = tr->trace_buffer.buffer;
2732 struct ring_buffer_event *event;
2733 struct ftrace_entry *entry;
2734
2735 event = __trace_buffer_lock_reserve(buffer, TRACE_FN, sizeof(*entry),
2736 flags, pc);
2737 if (!event)
2738 return;
2739 entry = ring_buffer_event_data(event);
2740 entry->ip = ip;
2741 entry->parent_ip = parent_ip;
2742
2743 if (!call_filter_check_discard(call, entry, buffer, event)) {
2744 if (static_branch_unlikely(&ftrace_exports_enabled))
2745 ftrace_exports(event);
2746 __buffer_unlock_commit(buffer, event);
2747 }
2748}
2749
2750#ifdef CONFIG_STACKTRACE
2751
2752#define FTRACE_STACK_MAX_ENTRIES (PAGE_SIZE / sizeof(unsigned long))
2753struct ftrace_stack {
2754 unsigned long calls[FTRACE_STACK_MAX_ENTRIES];
2755};
2756
2757static DEFINE_PER_CPU(struct ftrace_stack, ftrace_stack);
2758static DEFINE_PER_CPU(int, ftrace_stack_reserve);
2759
2760static void __ftrace_trace_stack(struct ring_buffer *buffer,
2761 unsigned long flags,
2762 int skip, int pc, struct pt_regs *regs)
2763{
2764 struct trace_event_call *call = &event_kernel_stack;
2765 struct ring_buffer_event *event;
2766 struct stack_entry *entry;
2767 struct stack_trace trace;
2768 int use_stack;
2769 int size = FTRACE_STACK_ENTRIES;
2770
2771 trace.nr_entries = 0;
2772 trace.skip = skip;
2773
2774 /*
2775 * Add one, for this function and the call to save_stack_trace()
2776 * If regs is set, then these functions will not be in the way.
2777 */
2778#ifndef CONFIG_UNWINDER_ORC
2779 if (!regs)
2780 trace.skip++;
2781#endif
2782
2783 /*
2784	 * Since events can happen in NMIs there's no safe way to
2785	 * use the per-CPU ftrace_stack. We reserve it and if an interrupt
2786	 * or NMI comes in, it will just have to use the default of
2787	 * FTRACE_STACK_ENTRIES entries, written directly into the trace event.
2788 */
2789 preempt_disable_notrace();
2790
2791 use_stack = __this_cpu_inc_return(ftrace_stack_reserve);
2792 /*
2793 * We don't need any atomic variables, just a barrier.
2794 * If an interrupt comes in, we don't care, because it would
2795 * have exited and put the counter back to what we want.
2796 * We just need a barrier to keep gcc from moving things
2797 * around.
2798 */
2799 barrier();
2800 if (use_stack == 1) {
2801 trace.entries = this_cpu_ptr(ftrace_stack.calls);
2802 trace.max_entries = FTRACE_STACK_MAX_ENTRIES;
2803
2804 if (regs)
2805 save_stack_trace_regs(regs, &trace);
2806 else
2807 save_stack_trace(&trace);
2808
2809 if (trace.nr_entries > size)
2810 size = trace.nr_entries;
2811 } else
2812 /* From now on, use_stack is a boolean */
2813 use_stack = 0;
2814
2815 size *= sizeof(unsigned long);
2816
2817 event = __trace_buffer_lock_reserve(buffer, TRACE_STACK,
2818 sizeof(*entry) + size, flags, pc);
2819 if (!event)
2820 goto out;
2821 entry = ring_buffer_event_data(event);
2822
2823 memset(&entry->caller, 0, size);
2824
2825 if (use_stack)
2826 memcpy(&entry->caller, trace.entries,
2827 trace.nr_entries * sizeof(unsigned long));
2828 else {
2829 trace.max_entries = FTRACE_STACK_ENTRIES;
2830 trace.entries = entry->caller;
2831 if (regs)
2832 save_stack_trace_regs(regs, &trace);
2833 else
2834 save_stack_trace(&trace);
2835 }
2836
2837 entry->size = trace.nr_entries;
2838
2839 if (!call_filter_check_discard(call, entry, buffer, event))
2840 __buffer_unlock_commit(buffer, event);
2841
2842 out:
2843 /* Again, don't let gcc optimize things here */
2844 barrier();
2845 __this_cpu_dec(ftrace_stack_reserve);
2846 preempt_enable_notrace();
2847
2848}
2849
2850static inline void ftrace_trace_stack(struct trace_array *tr,
2851 struct ring_buffer *buffer,
2852 unsigned long flags,
2853 int skip, int pc, struct pt_regs *regs)
2854{
2855 if (!(tr->trace_flags & TRACE_ITER_STACKTRACE))
2856 return;
2857
2858 __ftrace_trace_stack(buffer, flags, skip, pc, regs);
2859}
2860
2861void __trace_stack(struct trace_array *tr, unsigned long flags, int skip,
2862 int pc)
2863{
2864 struct ring_buffer *buffer = tr->trace_buffer.buffer;
2865
2866 if (rcu_is_watching()) {
2867 __ftrace_trace_stack(buffer, flags, skip, pc, NULL);
2868 return;
2869 }
2870
2871 /*
2872 * When an NMI triggers, RCU is enabled via rcu_nmi_enter(),
2873 * but if the above rcu_is_watching() failed, then the NMI
2874 * triggered someplace critical, and rcu_irq_enter() should
2875 * not be called from NMI.
2876 */
2877 if (unlikely(in_nmi()))
2878 return;
2879
2880 rcu_irq_enter_irqson();
2881 __ftrace_trace_stack(buffer, flags, skip, pc, NULL);
2882 rcu_irq_exit_irqson();
2883}
2884
2885/**
2886 * trace_dump_stack - record a stack back trace in the trace buffer
2887 * @skip: Number of functions to skip (helper handlers)
2888 */
2889void trace_dump_stack(int skip)
2890{
2891 unsigned long flags;
2892
2893 if (tracing_disabled || tracing_selftest_running)
2894 return;
2895
2896 local_save_flags(flags);
2897
2898#ifndef CONFIG_UNWINDER_ORC
2899 /* Skip 1 to skip this function. */
2900 skip++;
2901#endif
2902 __ftrace_trace_stack(global_trace.trace_buffer.buffer,
2903 flags, skip, preempt_count(), NULL);
2904}
2905EXPORT_SYMBOL_GPL(trace_dump_stack);
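
/*
 * Illustrative sketch (hypothetical caller, kept out of the build with
 * #if 0): recording the current kernel stack into the global trace
 * buffer from a point of interest.  With @skip == 0 the dump starts at
 * the immediate caller of trace_dump_stack().
 */
#if 0
static void example_report_odd_state(void)
{
	trace_dump_stack(0);
}
#endif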
2906
2907static DEFINE_PER_CPU(int, user_stack_count);
2908
2909void
2910ftrace_trace_userstack(struct ring_buffer *buffer, unsigned long flags, int pc)
2911{
2912 struct trace_event_call *call = &event_user_stack;
2913 struct ring_buffer_event *event;
2914 struct userstack_entry *entry;
2915 struct stack_trace trace;
2916
2917 if (!(global_trace.trace_flags & TRACE_ITER_USERSTACKTRACE))
2918 return;
2919
2920 /*
2921	 * NMIs cannot handle page faults, even with fixups.
2922	 * Saving the user stack can (and often does) fault.
2923 */
2924 if (unlikely(in_nmi()))
2925 return;
2926
2927 /*
2928 * prevent recursion, since the user stack tracing may
2929 * trigger other kernel events.
2930 */
2931 preempt_disable();
2932 if (__this_cpu_read(user_stack_count))
2933 goto out;
2934
2935 __this_cpu_inc(user_stack_count);
2936
2937 event = __trace_buffer_lock_reserve(buffer, TRACE_USER_STACK,
2938 sizeof(*entry), flags, pc);
2939 if (!event)
2940 goto out_drop_count;
2941 entry = ring_buffer_event_data(event);
2942
2943 entry->tgid = current->tgid;
2944 memset(&entry->caller, 0, sizeof(entry->caller));
2945
2946 trace.nr_entries = 0;
2947 trace.max_entries = FTRACE_STACK_ENTRIES;
2948 trace.skip = 0;
2949 trace.entries = entry->caller;
2950
2951 save_stack_trace_user(&trace);
2952 if (!call_filter_check_discard(call, entry, buffer, event))
2953 __buffer_unlock_commit(buffer, event);
2954
2955 out_drop_count:
2956 __this_cpu_dec(user_stack_count);
2957 out:
2958 preempt_enable();
2959}
2960
2961#ifdef UNUSED
2962static void __trace_userstack(struct trace_array *tr, unsigned long flags)
2963{
2964	ftrace_trace_userstack(tr->trace_buffer.buffer, flags, preempt_count());
2965}
2966#endif /* UNUSED */
2967
2968#endif /* CONFIG_STACKTRACE */
2969
2970/* created for use with alloc_percpu */
2971struct trace_buffer_struct {
2972 int nesting;
2973 char buffer[4][TRACE_BUF_SIZE];
2974};
2975
2976static struct trace_buffer_struct *trace_percpu_buffer;
2977
2978/*
2979 * This allows for lockless recording, with one buffer per nesting level
2980 * (normal, softirq, irq, NMI). If we're nested too deeply, this returns NULL.
2981 */
2982static char *get_trace_buf(void)
2983{
2984 struct trace_buffer_struct *buffer = this_cpu_ptr(trace_percpu_buffer);
2985
2986 if (!buffer || buffer->nesting >= 4)
2987 return NULL;
2988
2989 buffer->nesting++;
2990
2991 /* Interrupts must see nesting incremented before we use the buffer */
2992 barrier();
2993 return &buffer->buffer[buffer->nesting][0];
2994}
2995
2996static void put_trace_buf(void)
2997{
2998 /* Don't let the decrement of nesting leak before this */
2999 barrier();
3000 this_cpu_dec(trace_percpu_buffer->nesting);
3001}
3002
3003static int alloc_percpu_trace_buffer(void)
3004{
3005 struct trace_buffer_struct *buffers;
3006
3007 buffers = alloc_percpu(struct trace_buffer_struct);
3008 if (WARN(!buffers, "Could not allocate percpu trace_printk buffer"))
3009 return -ENOMEM;
3010
3011 trace_percpu_buffer = buffers;
3012 return 0;
3013}
3014
3015static int buffers_allocated;
3016
3017void trace_printk_init_buffers(void)
3018{
3019 if (buffers_allocated)
3020 return;
3021
3022 if (alloc_percpu_trace_buffer())
3023 return;
3024
3025 /* trace_printk() is for debug use only. Don't use it in production. */
3026
3027 pr_warn("\n");
3028 pr_warn("**********************************************************\n");
3029 pr_warn("** NOTICE NOTICE NOTICE NOTICE NOTICE NOTICE NOTICE **\n");
3030 pr_warn("** **\n");
3031 pr_warn("** trace_printk() being used. Allocating extra memory. **\n");
3032 pr_warn("** **\n");
3033 pr_warn("** This means that this is a DEBUG kernel and it is **\n");
3034 pr_warn("** unsafe for production use. **\n");
3035 pr_warn("** **\n");
3036 pr_warn("** If you see this message and you are not debugging **\n");
3037 pr_warn("** the kernel, report this immediately to your vendor! **\n");
3038 pr_warn("** **\n");
3039 pr_warn("** NOTICE NOTICE NOTICE NOTICE NOTICE NOTICE NOTICE **\n");
3040 pr_warn("**********************************************************\n");
3041
3042 /* Expand the buffers to set size */
3043 tracing_update_buffers();
3044
3045 buffers_allocated = 1;
3046
3047 /*
3048 * trace_printk_init_buffers() can be called by modules.
3049 * If that happens, then we need to start cmdline recording
3050 * directly here. If the global_trace.buffer is already
3051 * allocated here, then this was called by module code.
3052 */
3053 if (global_trace.trace_buffer.buffer)
3054 tracing_start_cmdline_record();
3055}
3056
3057void trace_printk_start_comm(void)
3058{
3059 /* Start tracing comms if trace printk is set */
3060 if (!buffers_allocated)
3061 return;
3062 tracing_start_cmdline_record();
3063}
3064
3065static void trace_printk_start_stop_comm(int enabled)
3066{
3067 if (!buffers_allocated)
3068 return;
3069
3070 if (enabled)
3071 tracing_start_cmdline_record();
3072 else
3073 tracing_stop_cmdline_record();
3074}
3075
3076/**
3077 * trace_vbprintk - write binary msg to tracing buffer
3078 * @ip: The address of the caller
 * @fmt: The format string to write to the buffer
 * @args: Arguments for @fmt
3079 */
3080int trace_vbprintk(unsigned long ip, const char *fmt, va_list args)
3081{
3082 struct trace_event_call *call = &event_bprint;
3083 struct ring_buffer_event *event;
3084 struct ring_buffer *buffer;
3085 struct trace_array *tr = &global_trace;
3086 struct bprint_entry *entry;
3087 unsigned long flags;
3088 char *tbuffer;
3089 int len = 0, size, pc;
3090
3091 if (unlikely(tracing_selftest_running || tracing_disabled))
3092 return 0;
3093
3094 /* Don't pollute graph traces with trace_vprintk internals */
3095 pause_graph_tracing();
3096
3097 pc = preempt_count();
3098 preempt_disable_notrace();
3099
3100 tbuffer = get_trace_buf();
3101 if (!tbuffer) {
3102 len = 0;
3103 goto out_nobuffer;
3104 }
3105
3106 len = vbin_printf((u32 *)tbuffer, TRACE_BUF_SIZE/sizeof(int), fmt, args);
3107
3108 if (len > TRACE_BUF_SIZE/sizeof(int) || len < 0)
3109 goto out;
3110
3111 local_save_flags(flags);
3112 size = sizeof(*entry) + sizeof(u32) * len;
3113 buffer = tr->trace_buffer.buffer;
3114 event = __trace_buffer_lock_reserve(buffer, TRACE_BPRINT, size,
3115 flags, pc);
3116 if (!event)
3117 goto out;
3118 entry = ring_buffer_event_data(event);
3119 entry->ip = ip;
3120 entry->fmt = fmt;
3121
3122 memcpy(entry->buf, tbuffer, sizeof(u32) * len);
3123 if (!call_filter_check_discard(call, entry, buffer, event)) {
3124 __buffer_unlock_commit(buffer, event);
3125 ftrace_trace_stack(tr, buffer, flags, 6, pc, NULL);
3126 }
3127
3128out:
3129 put_trace_buf();
3130
3131out_nobuffer:
3132 preempt_enable_notrace();
3133 unpause_graph_tracing();
3134
3135 return len;
3136}
3137EXPORT_SYMBOL_GPL(trace_vbprintk);
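
/*
 * Illustrative sketch (hypothetical debug hook, kept out of the build
 * with #if 0): trace_vbprintk() is normally reached through the
 * trace_printk() macro, which takes the binary (bprintk) path when the
 * format string is a compile-time constant.
 */
#if 0
static void example_debug_hook(int cpu, u64 delta)
{
	trace_printk("cpu %d saw a delta of %llu ns\n",
		     cpu, (unsigned long long)delta);
}
#endif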
3138
3139__printf(3, 0)
3140static int
3141__trace_array_vprintk(struct ring_buffer *buffer,
3142 unsigned long ip, const char *fmt, va_list args)
3143{
3144 struct trace_event_call *call = &event_print;
3145 struct ring_buffer_event *event;
3146 int len = 0, size, pc;
3147 struct print_entry *entry;
3148 unsigned long flags;
3149 char *tbuffer;
3150
3151 if (tracing_disabled || tracing_selftest_running)
3152 return 0;
3153
3154 /* Don't pollute graph traces with trace_vprintk internals */
3155 pause_graph_tracing();
3156
3157 pc = preempt_count();
3158 preempt_disable_notrace();
3159
3160
3161 tbuffer = get_trace_buf();
3162 if (!tbuffer) {
3163 len = 0;
3164 goto out_nobuffer;
3165 }
3166
3167 len = vscnprintf(tbuffer, TRACE_BUF_SIZE, fmt, args);
3168
3169 local_save_flags(flags);
3170 size = sizeof(*entry) + len + 1;
3171 event = __trace_buffer_lock_reserve(buffer, TRACE_PRINT, size,
3172 flags, pc);
3173 if (!event)
3174 goto out;
3175 entry = ring_buffer_event_data(event);
3176 entry->ip = ip;
3177
3178 memcpy(&entry->buf, tbuffer, len + 1);
3179 if (!call_filter_check_discard(call, entry, buffer, event)) {
3180 __buffer_unlock_commit(buffer, event);
3181 ftrace_trace_stack(&global_trace, buffer, flags, 6, pc, NULL);
3182 }
3183
3184out:
3185 put_trace_buf();
3186
3187out_nobuffer:
3188 preempt_enable_notrace();
3189 unpause_graph_tracing();
3190
3191 return len;
3192}
3193
3194__printf(3, 0)
3195int trace_array_vprintk(struct trace_array *tr,
3196 unsigned long ip, const char *fmt, va_list args)
3197{
3198 return __trace_array_vprintk(tr->trace_buffer.buffer, ip, fmt, args);
3199}
3200
3201__printf(3, 0)
3202int trace_array_printk(struct trace_array *tr,
3203 unsigned long ip, const char *fmt, ...)
3204{
3205 int ret;
3206 va_list ap;
3207
3208 if (!(global_trace.trace_flags & TRACE_ITER_PRINTK))
3209 return 0;
3210
3211 va_start(ap, fmt);
3212 ret = trace_array_vprintk(tr, ip, fmt, ap);
3213 va_end(ap);
3214 return ret;
3215}
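
/*
 * Illustrative sketch (hypothetical caller, kept out of the build with
 * #if 0): writing a printk-style message into a specific trace instance
 * rather than into the global buffer.
 */
#if 0
static void example_instance_note(struct trace_array *tr, int value)
{
	trace_array_printk(tr, _THIS_IP_, "example value: %d\n", value);
}
#endif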
3216
3217__printf(3, 4)
3218int trace_array_printk_buf(struct ring_buffer *buffer,
3219 unsigned long ip, const char *fmt, ...)
3220{
3221 int ret;
3222 va_list ap;
3223
3224 if (!(global_trace.trace_flags & TRACE_ITER_PRINTK))
3225 return 0;
3226
3227 va_start(ap, fmt);
3228 ret = __trace_array_vprintk(buffer, ip, fmt, ap);
3229 va_end(ap);
3230 return ret;
3231}
3232
3233__printf(2, 0)
3234int trace_vprintk(unsigned long ip, const char *fmt, va_list args)
3235{
3236 return trace_array_vprintk(&global_trace, ip, fmt, args);
3237}
3238EXPORT_SYMBOL_GPL(trace_vprintk);
3239
3240static void trace_iterator_increment(struct trace_iterator *iter)
3241{
3242 struct ring_buffer_iter *buf_iter = trace_buffer_iter(iter, iter->cpu);
3243
3244 iter->idx++;
3245 if (buf_iter)
3246 ring_buffer_read(buf_iter, NULL);
3247}
3248
3249static struct trace_entry *
3250peek_next_entry(struct trace_iterator *iter, int cpu, u64 *ts,
3251 unsigned long *lost_events)
3252{
3253 struct ring_buffer_event *event;
3254 struct ring_buffer_iter *buf_iter = trace_buffer_iter(iter, cpu);
3255
3256 if (buf_iter)
3257 event = ring_buffer_iter_peek(buf_iter, ts);
3258 else
3259 event = ring_buffer_peek(iter->trace_buffer->buffer, cpu, ts,
3260 lost_events);
3261
3262 if (event) {
3263 iter->ent_size = ring_buffer_event_length(event);
3264 return ring_buffer_event_data(event);
3265 }
3266 iter->ent_size = 0;
3267 return NULL;
3268}
3269
3270static struct trace_entry *
3271__find_next_entry(struct trace_iterator *iter, int *ent_cpu,
3272 unsigned long *missing_events, u64 *ent_ts)
3273{
3274 struct ring_buffer *buffer = iter->trace_buffer->buffer;
3275 struct trace_entry *ent, *next = NULL;
3276 unsigned long lost_events = 0, next_lost = 0;
3277 int cpu_file = iter->cpu_file;
3278 u64 next_ts = 0, ts;
3279 int next_cpu = -1;
3280 int next_size = 0;
3281 int cpu;
3282
3283 /*
3284	 * If we are in a per-CPU trace file, don't bother iterating over
3285	 * all CPUs; peek at that CPU directly.
3286 */
3287 if (cpu_file > RING_BUFFER_ALL_CPUS) {
3288 if (ring_buffer_empty_cpu(buffer, cpu_file))
3289 return NULL;
3290 ent = peek_next_entry(iter, cpu_file, ent_ts, missing_events);
3291 if (ent_cpu)
3292 *ent_cpu = cpu_file;
3293
3294 return ent;
3295 }
3296
3297 for_each_tracing_cpu(cpu) {
3298
3299 if (ring_buffer_empty_cpu(buffer, cpu))
3300 continue;
3301
3302 ent = peek_next_entry(iter, cpu, &ts, &lost_events);
3303
3304 /*
3305 * Pick the entry with the smallest timestamp:
3306 */
3307 if (ent && (!next || ts < next_ts)) {
3308 next = ent;
3309 next_cpu = cpu;
3310 next_ts = ts;
3311 next_lost = lost_events;
3312 next_size = iter->ent_size;
3313 }
3314 }
3315
3316 iter->ent_size = next_size;
3317
3318 if (ent_cpu)
3319 *ent_cpu = next_cpu;
3320
3321 if (ent_ts)
3322 *ent_ts = next_ts;
3323
3324 if (missing_events)
3325 *missing_events = next_lost;
3326
3327 return next;
3328}
3329
3330/* Find the next real entry, without updating the iterator itself */
3331struct trace_entry *trace_find_next_entry(struct trace_iterator *iter,
3332 int *ent_cpu, u64 *ent_ts)
3333{
3334 return __find_next_entry(iter, ent_cpu, NULL, ent_ts);
3335}
3336
3337/* Find the next real entry, and increment the iterator to the next entry */
3338void *trace_find_next_entry_inc(struct trace_iterator *iter)
3339{
3340 iter->ent = __find_next_entry(iter, &iter->cpu,
3341 &iter->lost_events, &iter->ts);
3342
3343 if (iter->ent)
3344 trace_iterator_increment(iter);
3345
3346 return iter->ent ? iter : NULL;
3347}
3348
3349static void trace_consume(struct trace_iterator *iter)
3350{
3351 ring_buffer_consume(iter->trace_buffer->buffer, iter->cpu, &iter->ts,
3352 &iter->lost_events);
3353}
3354
3355static void *s_next(struct seq_file *m, void *v, loff_t *pos)
3356{
3357 struct trace_iterator *iter = m->private;
3358 int i = (int)*pos;
3359 void *ent;
3360
3361 WARN_ON_ONCE(iter->leftover);
3362
3363 (*pos)++;
3364
3365 /* can't go backwards */
3366 if (iter->idx > i)
3367 return NULL;
3368
3369 if (iter->idx < 0)
3370 ent = trace_find_next_entry_inc(iter);
3371 else
3372 ent = iter;
3373
3374 while (ent && iter->idx < i)
3375 ent = trace_find_next_entry_inc(iter);
3376
3377 iter->pos = *pos;
3378
3379 return ent;
3380}
3381
3382void tracing_iter_reset(struct trace_iterator *iter, int cpu)
3383{
3384 struct ring_buffer_event *event;
3385 struct ring_buffer_iter *buf_iter;
3386 unsigned long entries = 0;
3387 u64 ts;
3388
3389 per_cpu_ptr(iter->trace_buffer->data, cpu)->skipped_entries = 0;
3390
3391 buf_iter = trace_buffer_iter(iter, cpu);
3392 if (!buf_iter)
3393 return;
3394
3395 ring_buffer_iter_reset(buf_iter);
3396
3397 /*
3398	 * With the max latency tracers it is possible that a reset
3399	 * never took place on a CPU. This shows up as entries whose
3400	 * timestamp is before the start of the buffer.
3401 */
3402 while ((event = ring_buffer_iter_peek(buf_iter, &ts))) {
3403 if (ts >= iter->trace_buffer->time_start)
3404 break;
3405 entries++;
3406 ring_buffer_read(buf_iter, NULL);
3407 }
3408
3409 per_cpu_ptr(iter->trace_buffer->data, cpu)->skipped_entries = entries;
3410}
3411
3412/*
3413 * The current tracer is copied to avoid holding a global lock
3414 * all around.
3415 */
3416static void *s_start(struct seq_file *m, loff_t *pos)
3417{
3418 struct trace_iterator *iter = m->private;
3419 struct trace_array *tr = iter->tr;
3420 int cpu_file = iter->cpu_file;
3421 void *p = NULL;
3422 loff_t l = 0;
3423 int cpu;
3424
3425 /*
3426 * copy the tracer to avoid using a global lock all around.
3427	 * iter->trace is a copy of current_trace; the pointer to the
3428 * name may be used instead of a strcmp(), as iter->trace->name
3429 * will point to the same string as current_trace->name.
3430 */
3431 mutex_lock(&trace_types_lock);
3432 if (unlikely(tr->current_trace && iter->trace->name != tr->current_trace->name))
3433 *iter->trace = *tr->current_trace;
3434 mutex_unlock(&trace_types_lock);
3435
3436#ifdef CONFIG_TRACER_MAX_TRACE
3437 if (iter->snapshot && iter->trace->use_max_tr)
3438 return ERR_PTR(-EBUSY);
3439#endif
3440
3441 if (!iter->snapshot)
3442 atomic_inc(&trace_record_taskinfo_disabled);
3443
3444 if (*pos != iter->pos) {
3445 iter->ent = NULL;
3446 iter->cpu = 0;
3447 iter->idx = -1;
3448
3449 if (cpu_file == RING_BUFFER_ALL_CPUS) {
3450 for_each_tracing_cpu(cpu)
3451 tracing_iter_reset(iter, cpu);
3452 } else
3453 tracing_iter_reset(iter, cpu_file);
3454
3455 iter->leftover = 0;
3456 for (p = iter; p && l < *pos; p = s_next(m, p, &l))
3457 ;
3458
3459 } else {
3460 /*
3461 * If we overflowed the seq_file before, then we want
3462 * to just reuse the trace_seq buffer again.
3463 */
3464 if (iter->leftover)
3465 p = iter;
3466 else {
3467 l = *pos - 1;
3468 p = s_next(m, p, &l);
3469 }
3470 }
3471
3472 trace_event_read_lock();
3473 trace_access_lock(cpu_file);
3474 return p;
3475}
3476
3477static void s_stop(struct seq_file *m, void *p)
3478{
3479 struct trace_iterator *iter = m->private;
3480
3481#ifdef CONFIG_TRACER_MAX_TRACE
3482 if (iter->snapshot && iter->trace->use_max_tr)
3483 return;
3484#endif
3485
3486 if (!iter->snapshot)
3487 atomic_dec(&trace_record_taskinfo_disabled);
3488
3489 trace_access_unlock(iter->cpu_file);
3490 trace_event_read_unlock();
3491}
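
/*
 * Illustrative sketch (kept out of the build with #if 0): s_start(),
 * s_next() and s_stop() above, together with the s_show() callback
 * defined later in this file, are wired into a seq_operations table
 * along these lines.
 */
#if 0
static const struct seq_operations example_trace_seq_ops = {
	.start	= s_start,
	.next	= s_next,
	.stop	= s_stop,
	.show	= s_show,
};
#endif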
3492
3493static void
3494get_total_entries(struct trace_buffer *buf,
3495 unsigned long *total, unsigned long *entries)
3496{
3497 unsigned long count;
3498 int cpu;
3499
3500 *total = 0;
3501 *entries = 0;
3502
3503 for_each_tracing_cpu(cpu) {
3504 count = ring_buffer_entries_cpu(buf->buffer, cpu);
3505 /*
3506 * If this buffer has skipped entries, then we hold all
3507 * entries for the trace and we need to ignore the
3508 * ones before the time stamp.
3509 */
3510 if (per_cpu_ptr(buf->data, cpu)->skipped_entries) {
3511 count -= per_cpu_ptr(buf->data, cpu)->skipped_entries;
3512 /* total is the same as the entries */
3513 *total += count;
3514 } else
3515 *total += count +
3516 ring_buffer_overrun_cpu(buf->buffer, cpu);
3517 *entries += count;
3518 }
3519}
3520
3521static void print_lat_help_header(struct seq_file *m)
3522{
3523 seq_puts(m, "# _------=> CPU# \n"
3524 "# / _-----=> irqs-off \n"
3525 "# | / _----=> need-resched \n"
3526 "# || / _---=> hardirq/softirq \n"
3527 "# ||| / _--=> preempt-depth \n"
3528 "# |||| / delay \n"
3529 "# cmd pid ||||| time | caller \n"
3530 "# \\ / ||||| \\ | / \n");
3531}
3532
3533static void print_event_info(struct