ipa-inline.cc source code [gcc/ipa-inline.cc]

/* Inlining decision heuristics.
   Copyright (C) 2003-2024 Free Software Foundation, Inc.
   Contributed by Jan Hubicka

This file is part of GCC.

GCC is free software; you can redistribute it and/or modify it under
the terms of the GNU General Public License as published by the Free
Software Foundation; either version 3, or (at your option) any later
version.

GCC is distributed in the hope that it will be useful, but WITHOUT ANY
WARRANTY; without even the implied warranty of MERCHANTABILITY or
FITNESS FOR A PARTICULAR PURPOSE.  See the GNU General Public License
for more details.

You should have received a copy of the GNU General Public License
along with GCC; see the file COPYING3.  If not see
<http://www.gnu.org/licenses/>.  */
20
/*  Inlining decision heuristics

    The implementation of the inliner is organized as follows:

    inlining heuristics limits

      can_inline_edge_p checks that a particular inlining is allowed
      by the limits specified by the user (allowed function growth, unit
      growth and so on).

      Functions are inlined when it is obvious the result is profitable (such
      as functions called once or when inlining reduces code size).
      In addition to that we perform inlining of small functions and recursive
      inlining.

    inlining heuristics

       The inliner itself is split into two passes:

       pass_early_inlining

	 Simple local inlining pass inlining callees into the current function.
	 This pass makes no use of whole unit analysis and thus it can make only
	 very simple decisions based on local properties.

	 The strength of the pass is that it is run in topological order
	 (reverse postorder) on the callgraph.  Functions are converted into SSA
	 form just before this pass and optimized subsequently.  As a result, the
	 callees of the function seen by the early inliner were already optimized
	 and the results of early inlining add a lot of optimization
	 opportunities for the local optimization.

	 The pass handles the obvious inlining decisions within the compilation
	 unit - inlining auto inline functions, inlining for size and
	 flattening.

	 The main strength of the pass is the ability to eliminate abstraction
	 penalty in C++ code (via combination of inlining and early
	 optimization) and thus improve the quality of analysis done by real IPA
	 optimizers.

	 Because of the lack of whole unit knowledge, the pass cannot really make
	 good code size/performance tradeoffs.  It however does very simple
	 speculative inlining allowing code size to grow by
	 EARLY_INLINING_INSNS when the callee is a leaf function.  In this case
	 the optimizations performed later are very likely to eliminate the cost.

       pass_ipa_inline

	 This is the real inliner able to handle inlining with whole program
	 knowledge.  It performs the following steps:

	 1) inlining of small functions.  This is implemented by a greedy
	 algorithm ordering all inlinable cgraph edges by their badness and
	 inlining them in this order as long as inline limits allow doing so.

	 This heuristic is not very good at inlining recursive calls.  Recursive
	 calls can be inlined with results similar to loop unrolling.  To do so,
	 a special purpose recursive inliner is executed on a function when
	 a recursive edge is met as a viable candidate.

	 2) Unreachable functions are removed from the callgraph.  Inlining leads
	 to devirtualization and other modification of the callgraph so functions
	 may become unreachable during the process.  Also functions declared as
	 extern inline or virtual functions are removed, since after inlining
	 we no longer need the offline bodies.

	 3) Functions called once and not exported from the unit are inlined.
	 This should almost always lead to reduction of code size by eliminating
	 the need for an offline copy of the function.  */
91
92	#include "config.h"
93	#include "system.h"
94	#include "coretypes.h"
95	#include "backend.h"
96	#include "target.h"
97	#include "rtl.h"
98	#include "tree.h"
99	#include "gimple.h"
100	#include "alloc-pool.h"
101	#include "tree-pass.h"
102	#include "gimple-ssa.h"
103	#include "cgraph.h"
104	#include "lto-streamer.h"
105	#include "trans-mem.h"
106	#include "calls.h"
107	#include "tree-inline.h"
108	#include "profile.h"
109	#include "symbol-summary.h"
110	#include "tree-vrp.h"
111	#include "sreal.h"
112	#include "ipa-cp.h"
113	#include "ipa-prop.h"
114	#include "ipa-fnsummary.h"
115	#include "ipa-inline.h"
116	#include "ipa-utils.h"
117	#include "auto-profile.h"
118	#include "builtins.h"
119	#include "fibonacci_heap.h"
120	#include "stringpool.h"
121	#include "attribs.h"
122	#include "asan.h"
123	#include "ipa-strub.h"
124
125	/ Inliner uses greedy algorithm to inline calls in a priority order.*
126	Badness is used as the key in a Fibonacci heap which roughly corresponds
127	to negation of benefit to cost ratios.
128	In case multiple calls has same priority we want to stabilize the outcomes
129	for which we use ids. /*
130	class inline_badness
131	{
132	public:
133	sreal badness;
134	int uid;
135	inline_badness ()
136	: badness (sreal::min ()), uid (`0`)
137	{
138	}
139	inline_badness (cgraph_edge *e, sreal b)
140	: badness (b), uid (e->get_uid ())
141	{
142	}
143	bool operator<= (const inline_badness &other)
144	{
145	if (badness != other.badness)
146	return badness <= other.badness;
147	return uid <= other.uid;
148	}
149	bool operator== (const inline_badness &other)
150	{
151	return badness == other.badness && uid == other.uid;
152	}
153	bool operator!= (const inline_badness &other)
154	{
155	return badness != other.badness \|\| uid != other.uid;
156	}
157	bool operator< (const inline_badness &other)
158	{
159	if (badness != other.badness)
160	return badness < other.badness;
161	return uid < other.uid;
162	}
163	bool operator> (const inline_badness &other)
164	{
165	if (badness != other.badness)
166	return badness > other.badness;
167	return uid > other.uid;
168	}
169	};
170
171	typedef fibonacci_heap <inline_badness, cgraph_edge> edge_heap_t;
172	typedef fibonacci_node <inline_badness, cgraph_edge> edge_heap_node_t;
173
174	/ Statistics we collect about inlining algorithm. /
175	static int overall_size;
176	static profile_count max_count;
177	static profile_count spec_rem;
178
179	/ Return false when inlining edge E would lead to violating*
180	limits on function unit growth or stack usage growth.
181
182	The relative function body growth limit is present generally
183	to avoid problems with non-linear behavior of the compiler.
184	To allow inlining huge functions into tiny wrapper, the limit
185	is always based on the bigger of the two functions considered.
186
187	For stack growth limits we always base the growth in stack usage
188	of the callers. We want to prevent applications from segfaulting
189	on stack overflow when functions with huge stack frames gets
190	inlined. /*
191
192	static bool
193	caller_growth_limits (struct cgraph_edge *e)
194	{
195	struct cgraph_node *to = e->caller;
196	struct cgraph_node *what = e->callee->ultimate_alias_target ();
197	int newsize;
198	int limit = `0`;
199	HOST_WIDE_INT stack_size_limit = `0`, inlined_stack;
200	ipa_size_summary *outer_info = ipa_size_summaries->get (node: to);
201
202	/ Look for function e->caller is inlined to. While doing*
203	so work out the largest function body on the way. As
204	described above, we want to base our function growth
205	limits based on that. Not on the self size of the
206	outer function, not on the self size of inline code
207	we immediately inline to. This is the most relaxed
208	interpretation of the rule "do not grow large functions
209	too much in order to prevent compiler from exploding". /*
210	while (true)
211	{
212	ipa_size_summary *size_info = ipa_size_summaries->get (node: to);
213	if (limit < size_info->self_size)
214	limit = size_info->self_size;
215	if (stack_size_limit < size_info->estimated_self_stack_size)
216	stack_size_limit = size_info->estimated_self_stack_size;
217	if (to->inlined_to)
218	to = to->callers->caller;
219	else
220	break;
221	}
222
223	ipa_fn_summary *what_info = ipa_fn_summaries->get (node: what);
224	ipa_size_summary *what_size_info = ipa_size_summaries->get (node: what);
225
226	if (limit < what_size_info->self_size)
227	limit = what_size_info->self_size;
228
229	limit += limit * opt_for_fn (to->decl, param_large_function_growth) / `100`;
230
231	/ Check the size after inlining against the function limits. But allow*
232	the function to shrink if it went over the limits by forced inlining. /*
233	newsize = estimate_size_after_inlining (to, e);
234	if (newsize >= ipa_size_summaries->get (node: what)->size
235	&& newsize > opt_for_fn (to->decl, param_large_function_insns)
236	&& newsize > limit)
237	{
238	e->inline_failed = CIF_LARGE_FUNCTION_GROWTH_LIMIT;
239	return false;
240	}
241
242	if (!what_info->estimated_stack_size)
243	return true;
244
245	/ FIXME: Stack size limit often prevents inlining in Fortran programs*
246	due to large i/o datastructures used by the Fortran front-end.
247	We ought to ignore this limit when we know that the edge is executed
248	on every invocation of the caller (i.e. its call statement dominates
249	exit block). We do not track this information, yet. /*
250	stack_size_limit += ((gcov_type)stack_size_limit
251	* opt_for_fn (to->decl, param_stack_frame_growth)
252	/ `100`);
253
254	inlined_stack = (ipa_get_stack_frame_offset (node: to)
255	+ outer_info->estimated_self_stack_size
256	+ what_info->estimated_stack_size);
257	/ Check new stack consumption with stack consumption at the place*
258	stack is used. /*
259	if (inlined_stack > stack_size_limit
260	/ If function already has large stack usage from sibling*
261	inline call, we can inline, too.
262	This bit overoptimistically assume that we are good at stack
263	packing. /*
264	&& inlined_stack > ipa_fn_summaries->get (node: to)->estimated_stack_size
265	&& inlined_stack > opt_for_fn (to->decl, param_large_stack_frame))
266	{
267	e->inline_failed = CIF_LARGE_STACK_FRAME_GROWTH_LIMIT;
268	return false;
269	}
270	return true;
271	}
272
273	/ Dump info about why inlining has failed. /
274
275	static void
276	report_inline_failed_reason (struct cgraph_edge *e)
277	{
278	if (dump_enabled_p ())
279	{
280	dump_printf_loc (MSG_MISSED_OPTIMIZATION, e->call_stmt,
281	" not inlinable: %C -> %C, %s\n",
282	e->caller, e->callee,
283	cgraph_inline_failed_string (e->inline_failed));
284	if ((e->inline_failed == CIF_TARGET_OPTION_MISMATCH
285	\|\| e->inline_failed == CIF_OPTIMIZATION_MISMATCH)
286	&& e->caller->lto_file_data
287	&& e->callee->ultimate_alias_target ()->lto_file_data)
288	{
289	dump_printf_loc (MSG_MISSED_OPTIMIZATION, e->call_stmt,
290	" LTO objects: %s, %s\n",
291	e->caller->lto_file_data->file_name,
292	e->callee->ultimate_alias_target ()->lto_file_data->file_name);
293	}
294	if (e->inline_failed == CIF_TARGET_OPTION_MISMATCH)
295	if (dump_file)
296	cl_target_option_print_diff
297	(dump_file, `2`, ptr1: target_opts_for_fn (fndecl: e->caller->decl),
298	ptr2: target_opts_for_fn (fndecl: e->callee->ultimate_alias_target ()->decl));
299	if (e->inline_failed == CIF_OPTIMIZATION_MISMATCH)
300	if (dump_file)
301	cl_optimization_print_diff
302	(dump_file, `2`, ptr1: opts_for_fn (fndecl: e->caller->decl),
303	ptr2: opts_for_fn (fndecl: e->callee->ultimate_alias_target ()->decl));
304	}
305	}
306
307	/ Decide whether sanitizer-related attributes allow inlining. /
308
309	static bool
310	sanitize_attrs_match_for_inline_p (const_tree caller, const_tree callee)
311	{
312	if (!caller \|\| !callee)
313	return true;
314
315	/ Follow clang and allow inlining for always_inline functions. /
316	if (lookup_attribute (attr_name: "always_inline", DECL_ATTRIBUTES (callee)))
317	return true;
318
319	const sanitize_code codes[] =
320	{
321	SANITIZE_ADDRESS,
322	SANITIZE_THREAD,
323	SANITIZE_UNDEFINED,
324	SANITIZE_UNDEFINED_NONDEFAULT,
325	SANITIZE_POINTER_COMPARE,
326	SANITIZE_POINTER_SUBTRACT
327	};
328
329	for (unsigned i = `0`; i < ARRAY_SIZE (codes); i++)
330	if (sanitize_flags_p (flag: codes[i], fn: caller)
331	!= sanitize_flags_p (flag: codes[i], fn: callee))
332	return false;
333
334	if (sanitize_coverage_p (fn: caller) != sanitize_coverage_p (fn: callee))
335	return false;
336
337	return true;
338	}
339
/* The three macros below compare option FLAG between the optimization
   settings of the two functions.  They expand to true when the settings
   are NOT compatible, and expect variables `caller', `callee' and (for
   the first two) `always_inline' to be in scope at the point of use.  */

/* Used for flags where it is safe to inline when caller's value is
   greater than callee's.  */
#define check_maybe_up(flag) \
      (opts_for_fn (caller->decl)->x_##flag		\
       != opts_for_fn (callee->decl)->x_##flag		\
       && (!always_inline 				\
	   || opts_for_fn (caller->decl)->x_##flag	\
	      < opts_for_fn (callee->decl)->x_##flag))
/* Used for flags where it is safe to inline when caller's value is
   smaller than callee's.  */
#define check_maybe_down(flag) \
      (opts_for_fn (caller->decl)->x_##flag		\
       != opts_for_fn (callee->decl)->x_##flag		\
       && (!always_inline 				\
	   || opts_for_fn (caller->decl)->x_##flag	\
	      > opts_for_fn (callee->decl)->x_##flag))
/* Used for flags where exact match is needed for correctness.  */
#define check_match(flag) \
      (opts_for_fn (caller->decl)->x_##flag		\
       != opts_for_fn (callee->decl)->x_##flag)
360
361	/ Decide if we can inline the edge and possibly update*
362	inline_failed reason.
363	We check whether inlining is possible at all and whether
364	caller growth limits allow doing so.
365
366	if REPORT is true, output reason to the dump file. /*
367
368	static bool
369	can_inline_edge_p (struct cgraph_edge e, bool* report,
370	bool early = false)
371	{
372	gcc_checking_assert (e->inline_failed);
373
374	if (cgraph_inline_failed_type (e->inline_failed) == CIF_FINAL_ERROR)
375	{
376	if (report)
377	report_inline_failed_reason (e);
378	return false;
379	}
380
381	bool inlinable = true;
382	enum availability avail;
383	cgraph_node *caller = (e->caller->inlined_to
384	? e->caller->inlined_to : e->caller);
385	cgraph_node *callee = e->callee->ultimate_alias_target (availability: &avail, ref: caller);
386
387	if (!callee->definition)
388	{
389	e->inline_failed = CIF_BODY_NOT_AVAILABLE;
390	inlinable = false;
391	}
392	if (!early && (!opt_for_fn (callee->decl, optimize)
393	\|\| !opt_for_fn (caller->decl, optimize)))
394	{
395	e->inline_failed = CIF_FUNCTION_NOT_OPTIMIZED;
396	inlinable = false;
397	}
398	else if (callee->calls_comdat_local)
399	{
400	e->inline_failed = CIF_USES_COMDAT_LOCAL;
401	inlinable = false;
402	}
403	else if (avail <= AVAIL_INTERPOSABLE)
404	{
405	e->inline_failed = CIF_OVERWRITABLE;
406	inlinable = false;
407	}
408	/ All edges with call_stmt_cannot_inline_p should have inline_failed*
409	initialized to one of FINAL_ERROR reasons. /*
410	else if (e->call_stmt_cannot_inline_p)
411	gcc_unreachable ();
412	/ Don't inline if the functions have different EH personalities. /
413	else if (DECL_FUNCTION_PERSONALITY (caller->decl)
414	&& DECL_FUNCTION_PERSONALITY (callee->decl)
415	&& (DECL_FUNCTION_PERSONALITY (caller->decl)
416	!= DECL_FUNCTION_PERSONALITY (callee->decl)))
417	{
418	e->inline_failed = CIF_EH_PERSONALITY;
419	inlinable = false;
420	}
421	/ TM pure functions should not be inlined into non-TM_pure*
422	functions. /*
423	else if (is_tm_pure (callee->decl) && !is_tm_pure (caller->decl))
424	{
425	e->inline_failed = CIF_UNSPECIFIED;
426	inlinable = false;
427	}
428	/ Check compatibility of target optimization options. /
429	else if (!targetm.target_option.can_inline_p (caller->decl,
430	callee->decl))
431	{
432	e->inline_failed = CIF_TARGET_OPTION_MISMATCH;
433	inlinable = false;
434	}
435	else if (ipa_fn_summaries->get (node: callee) == NULL
436	\|\| !ipa_fn_summaries->get (node: callee)->inlinable)
437	{
438	e->inline_failed = CIF_FUNCTION_NOT_INLINABLE;
439	inlinable = false;
440	}
441	/ Don't inline a function with mismatched sanitization attributes. /
442	else if (!sanitize_attrs_match_for_inline_p (caller: caller->decl, callee: callee->decl))
443	{
444	e->inline_failed = CIF_SANITIZE_ATTRIBUTE_MISMATCH;
445	inlinable = false;
446	}
447
448	if (inlinable && !strub_inlinable_to_p (callee, caller))
449	{
450	e->inline_failed = CIF_UNSPECIFIED;
451	inlinable = false;
452	}
453	if (!inlinable && report)
454	report_inline_failed_reason (e);
455	return inlinable;
456	}
457
458	/ Return inlining_insns_single limit for function N. If HINT or HINT2 is true*
459	scale up the bound. /*
460
461	static int
462	inline_insns_single (cgraph_node n, bool* hint, bool hint2)
463	{
464	if (hint && hint2)
465	{
466	int64_t spd = opt_for_fn (n->decl, param_inline_heuristics_hint_percent);
467	spd = spd * spd;
468	if (spd > `1000000`)
469	spd = `1000000`;
470	return opt_for_fn (n->decl, param_max_inline_insns_single) * spd / `100`;
471	}
472	if (hint \|\| hint2)
473	return opt_for_fn (n->decl, param_max_inline_insns_single)
474	* opt_for_fn (n->decl, param_inline_heuristics_hint_percent) / `100`;
475	return opt_for_fn (n->decl, param_max_inline_insns_single);
476	}
477
478	/ Return inlining_insns_auto limit for function N. If HINT or HINT2 is true*
479	scale up the bound. /*
480
481	static int
482	inline_insns_auto (cgraph_node n, bool* hint, bool hint2)
483	{
484	int max_inline_insns_auto = opt_for_fn (n->decl, param_max_inline_insns_auto);
485	if (hint && hint2)
486	{
487	int64_t spd = opt_for_fn (n->decl, param_inline_heuristics_hint_percent);
488	spd = spd * spd;
489	if (spd > `1000000`)
490	spd = `1000000`;
491	return max_inline_insns_auto * spd / `100`;
492	}
493	if (hint \|\| hint2)
494	return max_inline_insns_auto
495	* opt_for_fn (n->decl, param_inline_heuristics_hint_percent) / `100`;
496	return max_inline_insns_auto;
497	}
498
499	/ Decide if we can inline the edge and possibly update*
500	inline_failed reason.
501	We check whether inlining is possible at all and whether
502	caller growth limits allow doing so.
503
504	if REPORT is true, output reason to the dump file.
505
506	if DISREGARD_LIMITS is true, ignore size limits. /*
507
508	static bool
509	can_inline_edge_by_limits_p (struct cgraph_edge e, bool* report,
510	bool disregard_limits = false, bool early = false)
511	{
512	gcc_checking_assert (e->inline_failed);
513
514	if (cgraph_inline_failed_type (e->inline_failed) == CIF_FINAL_ERROR)
515	{
516	if (report)
517	report_inline_failed_reason (e);
518	return false;
519	}
520
521	bool inlinable = true;
522	enum availability avail;
523	cgraph_node *caller = (e->caller->inlined_to
524	? e->caller->inlined_to : e->caller);
525	cgraph_node *callee = e->callee->ultimate_alias_target (availability: &avail, ref: caller);
526	tree caller_tree = DECL_FUNCTION_SPECIFIC_OPTIMIZATION (caller->decl);
527	tree callee_tree
528	= callee ? DECL_FUNCTION_SPECIFIC_OPTIMIZATION (callee->decl) : NULL;
529	/ Check if caller growth allows the inlining. /
530	if (!DECL_DISREGARD_INLINE_LIMITS (callee->decl)
531	&& !disregard_limits
532	&& !lookup_attribute (attr_name: "flatten",
533	DECL_ATTRIBUTES (caller->decl))
534	&& !caller_growth_limits (e))
535	inlinable = false;
536	else if (callee->externally_visible
537	&& !DECL_DISREGARD_INLINE_LIMITS (callee->decl)
538	&& flag_live_patching == LIVE_PATCHING_INLINE_ONLY_STATIC)
539	{
540	e->inline_failed = CIF_EXTERN_LIVE_ONLY_STATIC;
541	inlinable = false;
542	}
543	/ Don't inline a function with a higher optimization level than the*
544	caller. FIXME: this is really just tip of iceberg of handling
545	optimization attribute. /*
546	else if (caller_tree != callee_tree)
547	{
548	bool always_inline =
549	(DECL_DISREGARD_INLINE_LIMITS (callee->decl)
550	&& lookup_attribute (attr_name: "always_inline",
551	DECL_ATTRIBUTES (callee->decl)));
552	ipa_fn_summary *caller_info = ipa_fn_summaries->get (node: caller);
553	ipa_fn_summary *callee_info = ipa_fn_summaries->get (node: callee);
554
555	/ Until GCC 4.9 we did not check the semantics-altering flags*
556	below and inlined across optimization boundaries.
557	Enabling checks below breaks several packages by refusing
558	to inline library always_inline functions. See PR65873.
559	Disable the check for early inlining for now until better solution
560	is found. /*
561	if (always_inline && early)
562	;
563	/ There are some options that change IL semantics which means*
564	we cannot inline in these cases for correctness reason.
565	Not even for always_inline declared functions. /*
566	else if (check_match (flag_wrapv)
567	\|\| check_match (flag_trapv)
568	\|\| check_match (flag_pcc_struct_return)
569	\|\| check_maybe_down (optimize_debug)
570	/ When caller or callee does FP math, be sure FP codegen flags*
571	compatible. /*
572	\|\| ((caller_info->fp_expressions && callee_info->fp_expressions)
573	&& (check_maybe_up (flag_rounding_math)
574	\|\| check_maybe_up (flag_trapping_math)
575	\|\| check_maybe_down (flag_unsafe_math_optimizations)
576	\|\| check_maybe_down (flag_finite_math_only)
577	\|\| check_maybe_up (flag_signaling_nans)
578	\|\| check_maybe_down (flag_cx_limited_range)
579	\|\| check_maybe_up (flag_signed_zeros)
580	\|\| check_maybe_down (flag_associative_math)
581	\|\| check_maybe_down (flag_reciprocal_math)
582	\|\| check_maybe_down (flag_fp_int_builtin_inexact)
583	/ Strictly speaking only when the callee contains function*
584	calls that may end up setting errno. /*
585	\|\| check_maybe_up (flag_errno_math)))
586	/ We do not want to make code compiled with exceptions to be*
587	brought into a non-EH function unless we know that the callee
588	does not throw.
589	This is tracked by DECL_FUNCTION_PERSONALITY. /*
590	\|\| (check_maybe_up (flag_non_call_exceptions)
591	&& DECL_FUNCTION_PERSONALITY (callee->decl))
592	\|\| (check_maybe_up (flag_exceptions)
593	&& DECL_FUNCTION_PERSONALITY (callee->decl))
594	/ When devirtualization is disabled for callee, it is not safe*
595	to inline it as we possibly mangled the type info.
596	Allow early inlining of always inlines. /*
597	\|\| (!early && check_maybe_down (flag_devirtualize)))
598	{
599	e->inline_failed = CIF_OPTIMIZATION_MISMATCH;
600	inlinable = false;
601	}
602	/ gcc.dg/pr43564.c. Apply user-forced inline even at -O0. /
603	else if (always_inline)
604	;
605	/ When user added an attribute to the callee honor it. /
606	else if (lookup_attribute (attr_name: "optimize", DECL_ATTRIBUTES (callee->decl))
607	&& opts_for_fn (fndecl: caller->decl) != opts_for_fn (fndecl: callee->decl))
608	{
609	e->inline_failed = CIF_OPTIMIZATION_MISMATCH;
610	inlinable = false;
611	}
612	/ If explicit optimize attribute are not used, the mismatch is caused*
613	by different command line options used to build different units.
614	Do not care about COMDAT functions - those are intended to be
615	optimized with the optimization flags of module they are used in.
616	Also do not care about mixing up size/speed optimization when
617	DECL_DISREGARD_INLINE_LIMITS is set. /*
618	else if ((callee->merged_comdat
619	&& !lookup_attribute (attr_name: "optimize",
620	DECL_ATTRIBUTES (caller->decl)))
621	\|\| DECL_DISREGARD_INLINE_LIMITS (callee->decl))
622	;
623	/ If mismatch is caused by merging two LTO units with different*
624	optimization flags we want to be bit nicer. However never inline
625	if one of functions is not optimized at all. /*
626	else if (!opt_for_fn (callee->decl, optimize)
627	\|\| !opt_for_fn (caller->decl, optimize))
628	{
629	e->inline_failed = CIF_OPTIMIZATION_MISMATCH;
630	inlinable = false;
631	}
632	/ If callee is optimized for size and caller is not, allow inlining if*
633	code shrinks or we are in param_max_inline_insns_single limit and
634	callee is inline (and thus likely an unified comdat).
635	This will allow caller to run faster. /*
636	else if (opt_for_fn (callee->decl, optimize_size)
637	> opt_for_fn (caller->decl, optimize_size))
638	{
639	int growth = estimate_edge_growth (edge: e);
640	if (growth > opt_for_fn (caller->decl, param_max_inline_insns_size)
641	&& (!DECL_DECLARED_INLINE_P (callee->decl)
642	&& growth >= MAX (inline_insns_single (caller, false, false),
643	inline_insns_auto (caller, false, false))))
644	{
645	e->inline_failed = CIF_OPTIMIZATION_MISMATCH;
646	inlinable = false;
647	}
648	}
649	/ If callee is more aggressively optimized for performance than caller,*
650	we generally want to inline only cheap (runtime wise) functions. /*
651	else if (opt_for_fn (callee->decl, optimize_size)
652	< opt_for_fn (caller->decl, optimize_size)
653	\|\| (opt_for_fn (callee->decl, optimize)
654	> opt_for_fn (caller->decl, optimize)))
655	{
656	if (estimate_edge_time (edge: e)
657	>= `20` + ipa_call_summaries->get (edge: e)->call_stmt_time)
658	{
659	e->inline_failed = CIF_OPTIMIZATION_MISMATCH;
660	inlinable = false;
661	}
662	}
663
664	}
665
666	if (!inlinable && report)
667	report_inline_failed_reason (e);
668	return inlinable;
669	}
670
671
672	/ Return true if the edge E is inlinable during early inlining. /
673
674	static bool
675	can_early_inline_edge_p (struct cgraph_edge *e)
676	{
677	cgraph_node *caller = (e->caller->inlined_to
678	? e->caller->inlined_to : e->caller);
679	struct cgraph_node *callee = e->callee->ultimate_alias_target ();
680	/ Early inliner might get called at WPA stage when IPA pass adds new*
681	function. In this case we cannot really do any of early inlining
682	because function bodies are missing. /*
683	if (cgraph_inline_failed_type (e->inline_failed) == CIF_FINAL_ERROR)
684	return false;
685	if (!gimple_has_body_p (callee->decl))
686	{
687	e->inline_failed = CIF_BODY_NOT_AVAILABLE;
688	return false;
689	}
690	gcc_assert (gimple_in_ssa_p (DECL_STRUCT_FUNCTION (e->caller->decl))
691	&& gimple_in_ssa_p (DECL_STRUCT_FUNCTION (callee->decl)));
692	if ((profile_arc_flag \|\| condition_coverage_flag)
693	&& ((lookup_attribute (attr_name: "no_profile_instrument_function",
694	DECL_ATTRIBUTES (caller->decl)) == NULL_TREE)
695	!= (lookup_attribute (attr_name: "no_profile_instrument_function",
696	DECL_ATTRIBUTES (callee->decl)) == NULL_TREE)))
697	return false;
698
699	if (!can_inline_edge_p (e, report: true, early: true)
700	\|\| !can_inline_edge_by_limits_p (e, report: true, disregard_limits: false, early: true))
701	return false;
702	/ When inlining regular functions into always-inline functions*
703	during early inlining watch for possible inline cycles. /*
704	if (DECL_DISREGARD_INLINE_LIMITS (caller->decl)
705	&& lookup_attribute (attr_name: "always_inline", DECL_ATTRIBUTES (caller->decl))
706	&& (!DECL_DISREGARD_INLINE_LIMITS (callee->decl)
707	\|\| !lookup_attribute (attr_name: "always_inline", DECL_ATTRIBUTES (callee->decl))))
708	{
709	/ If there are indirect calls, inlining may produce direct call.*
710	TODO: We may lift this restriction if we avoid errors on formely
711	indirect calls to always_inline functions. Taking address
712	of always_inline function is generally bad idea and should
713	have been declared as undefined, but sadly we allow this. /*
714	if (caller->indirect_calls \|\| e->callee->indirect_calls)
715	return false;
716	ipa_fn_summary *callee_info = ipa_fn_summaries->get (node: callee);
717	if (callee_info->safe_to_inline_to_always_inline)
718	return callee_info->safe_to_inline_to_always_inline - `1`;
719	for (cgraph_edge *e2 = callee->callees; e2; e2 = e2->next_callee)
720	{
721	struct cgraph_node *callee2 = e2->callee->ultimate_alias_target ();
722	/ As early inliner runs in RPO order, we will see uninlined*
723	always_inline calls only in the case of cyclic graphs. /*
724	if (DECL_DISREGARD_INLINE_LIMITS (callee2->decl)
725	\|\| lookup_attribute (attr_name: "always_inline", DECL_ATTRIBUTES (callee2->decl)))
726	{
727	callee_info->safe_to_inline_to_always_inline = `1`;
728	return false;
729	}
730	/ With LTO watch for case where function is later replaced*
731	by always_inline definition.
732	TODO: We may either stop treating noninlined cross-module always
733	inlines as errors, or we can extend decl merging to produce
734	syntacic alias and honor always inline only in units it has
735	been declared as such. /*
736	if (flag_lto && callee2->externally_visible)
737	{
738	callee_info->safe_to_inline_to_always_inline = `1`;
739	return false;
740	}
741	}
742	callee_info->safe_to_inline_to_always_inline = `2`;
743	}
744	return true;
745	}
746
747
748	/ Return number of calls in N. Ignore cheap builtins. /
749
750	static int
751	num_calls (struct cgraph_node *n)
752	{
753	struct cgraph_edge *e;
754	int num = `0`;
755
756	for (e = n->callees; e; e = e->next_callee)
757	if (!is_inexpensive_builtin (e->callee->decl))
758	num++;
759	return num;
760	}
761
762
763	/ Return true if we are interested in inlining small function. /
764
765	static bool
766	want_early_inline_function_p (struct cgraph_edge *e)
767	{
768	bool want_inline = true;
769	struct cgraph_node *callee = e->callee->ultimate_alias_target ();
770
771	if (DECL_DISREGARD_INLINE_LIMITS (callee->decl))
772	;
773	/ For AutoFDO, we need to make sure that before profile summary, all*
774	hot paths' IR look exactly the same as profiled binary. As a result,
775	in einliner, we will disregard size limit and inline those callsites
776	that are:
777	* inlined in the profiled binary, and
778	* the cloned callee has enough samples to be considered "hot". */
779	else if (flag_auto_profile && afdo_callsite_hot_enough_for_early_inline (e))
780	;
781	else if (!DECL_DECLARED_INLINE_P (callee->decl)
782	&& !opt_for_fn (e->caller->decl, flag_inline_small_functions))
783	{
784	e->inline_failed = CIF_FUNCTION_NOT_INLINE_CANDIDATE;
785	report_inline_failed_reason (e);
786	want_inline = false;
787	}
788	else
789	{
790	/ First take care of very large functions. /
791	int min_growth = estimate_min_edge_growth (edge: e), growth = `0`;
792	int n;
793	int early_inlining_insns = param_early_inlining_insns;
794
795	if (min_growth > early_inlining_insns)
796	{
797	if (dump_enabled_p ())
798	dump_printf_loc (MSG_MISSED_OPTIMIZATION, e->call_stmt,
799	" will not early inline: %C->%C, "
800	"call is cold and code would grow "
801	"at least by %i\n",
802	e->caller, callee,
803	min_growth);
804	want_inline = false;
805	}
806	else
807	growth = estimate_edge_growth (edge: e);
808
809
810	if (!want_inline \|\| growth <= param_max_inline_insns_size)
811	;
812	else if (!e->maybe_hot_p ())
813	{
814	if (dump_enabled_p ())
815	dump_printf_loc (MSG_MISSED_OPTIMIZATION, e->call_stmt,
816	" will not early inline: %C->%C, "
817	"call is cold and code would grow by %i\n",
818	e->caller, callee,
819	growth);
820	want_inline = false;
821	}
822	else if (growth > early_inlining_insns)
823	{
824	if (dump_enabled_p ())
825	dump_printf_loc (MSG_MISSED_OPTIMIZATION, e->call_stmt,
826	" will not early inline: %C->%C, "
827	"growth %i exceeds --param early-inlining-insns\n",
828	e->caller, callee, growth);
829	want_inline = false;
830	}
831	else if ((n = num_calls (n: callee)) != `0`
832	&& growth * (n + `1`) > early_inlining_insns)
833	{
834	if (dump_enabled_p ())
835	dump_printf_loc (MSG_MISSED_OPTIMIZATION, e->call_stmt,
836	" will not early inline: %C->%C, "
837	"growth %i exceeds --param early-inlining-insns "
838	"divided by number of calls\n",
839	e->caller, callee, growth);
840	want_inline = false;
841	}
842	}
843	return want_inline;
844	}
845
846	/ Compute time of the edge->caller + edge->callee execution when inlining*
847	does not happen. /*
848
849	inline sreal
850	compute_uninlined_call_time (struct cgraph_edge *edge,
851	sreal uninlined_call_time,
852	sreal freq)
853	{
854	cgraph_node *caller = (edge->caller->inlined_to
855	? edge->caller->inlined_to
856	: edge->caller);
857
858	if (freq > `0`)
859	uninlined_call_time *= freq;
860	else
861	uninlined_call_time = uninlined_call_time >> `11`;
862
863	sreal caller_time = ipa_fn_summaries->get (node: caller)->time;
864	return uninlined_call_time + caller_time;
865	}
866
867	/ Same as compute_uinlined_call_time but compute time when inlining*
868	does happen. /*
869
870	inline sreal
871	compute_inlined_call_time (struct cgraph_edge *edge,
872	sreal time,
873	sreal freq)
874	{
875	cgraph_node *caller = (edge->caller->inlined_to
876	? edge->caller->inlined_to
877	: edge->caller);
878	sreal caller_time = ipa_fn_summaries->get (node: caller)->time;
879
880	if (freq > `0`)
881	time *= freq;
882	else
883	time = time >> `11`;
884
885	/ This calculation should match one in ipa-inline-analysis.cc*
886	(estimate_edge_size_and_time). /*
887	time -= (sreal)ipa_call_summaries->get (edge)->call_stmt_time * freq;
888	time += caller_time;
889	if (time <= `0`)
890	time = ((sreal) `1`) >> `8`;
891	gcc_checking_assert (time >= `0`);
892	return time;
893	}
894
895	/ Determine time saved by inlining EDGE of frequency FREQ*
896	where callee's runtime w/o inlining is UNINLINED_TYPE
897	and with inlined is INLINED_TYPE. /*
898
899	inline sreal
900	inlining_speedup (struct cgraph_edge *edge,
901	sreal freq,
902	sreal uninlined_time,
903	sreal inlined_time)
904	{
905	sreal speedup = uninlined_time - inlined_time;
906	/ Handling of call_time should match one in ipa-inline-fnsummary.c*
907	(estimate_edge_size_and_time). /*
908	sreal call_time = ipa_call_summaries->get (edge)->call_stmt_time;
909
910	if (freq > `0`)
911	{
912	speedup = (speedup + call_time);
913	if (freq != `1`)
914	speedup = speedup * freq;
915	}
916	else if (freq == `0`)
917	speedup = speedup >> `11`;
918	gcc_checking_assert (speedup >= `0`);
919	return speedup;
920	}
921
922	/ Return true if the speedup for inlining E is bigger than*
923	param_inline_min_speedup. /*
924
925	static bool
926	big_speedup_p (struct cgraph_edge *e)
927	{
928	sreal unspec_time;
929	sreal spec_time = estimate_edge_time (edge: e, nonspec_time: &unspec_time);
930	sreal freq = e->sreal_frequency ();
931	sreal time = compute_uninlined_call_time (edge: e, uninlined_call_time: unspec_time, freq);
932	sreal inlined_time = compute_inlined_call_time (edge: e, time: spec_time, freq);
933	cgraph_node *caller = (e->caller->inlined_to
934	? e->caller->inlined_to
935	: e->caller);
936	int limit = opt_for_fn (caller->decl, param_inline_min_speedup);
937
938	if ((time - inlined_time) * `100` > time * limit)
939	return true;
940	return false;
941	}
942
943	/ Return true if we are interested in inlining small function.*
944	When REPORT is true, report reason to dump file. /*
945
946	static bool
947	want_inline_small_function_p (struct cgraph_edge e, bool* report)
948	{
949	bool want_inline = true;
950	struct cgraph_node *callee = e->callee->ultimate_alias_target ();
951	cgraph_node *to = (e->caller->inlined_to
952	? e->caller->inlined_to : e->caller);
953
954	/ Allow this function to be called before can_inline_edge_p,*
955	since it's usually cheaper. /*
956	if (cgraph_inline_failed_type (e->inline_failed) == CIF_FINAL_ERROR)
957	want_inline = false;
958	else if (DECL_DISREGARD_INLINE_LIMITS (callee->decl))
959	;
960	else if (!DECL_DECLARED_INLINE_P (callee->decl)
961	&& !opt_for_fn (e->caller->decl, flag_inline_small_functions))
962	{
963	e->inline_failed = CIF_FUNCTION_NOT_INLINE_CANDIDATE;
964	want_inline = false;
965	}
966	/ Do fast and conservative check if the function can be good*
967	inline candidate. /*
968	else if ((!DECL_DECLARED_INLINE_P (callee->decl)
969	&& (!e->count.ipa ().initialized_p () \|\| !e->maybe_hot_p ()))
970	&& ipa_fn_summaries->get (node: callee)->min_size
971	- ipa_call_summaries->get (edge: e)->call_stmt_size
972	> inline_insns_auto (n: e->caller, hint: true, hint2: true))
973	{
974	e->inline_failed = CIF_MAX_INLINE_INSNS_AUTO_LIMIT;
975	want_inline = false;
976	}
977	else if ((DECL_DECLARED_INLINE_P (callee->decl)
978	\|\| e->count.ipa ().nonzero_p ())
979	&& ipa_fn_summaries->get (node: callee)->min_size
980	- ipa_call_summaries->get (edge: e)->call_stmt_size
981	> inline_insns_single (n: e->caller, hint: true, hint2: true))
982	{
983	e->inline_failed = (DECL_DECLARED_INLINE_P (callee->decl)
984	? CIF_MAX_INLINE_INSNS_SINGLE_LIMIT
985	: CIF_MAX_INLINE_INSNS_AUTO_LIMIT);
986	want_inline = false;
987	}
988	else
989	{
990	int growth = estimate_edge_growth (edge: e);
991	ipa_hints hints = estimate_edge_hints (edge: e);
992	/ We have two independent groups of hints. If one matches in each*
993	of groups the limits are inreased. If both groups matches, limit
994	is increased even more. /*
995	bool apply_hints = (hints & (INLINE_HINT_indirect_call
996	\| INLINE_HINT_known_hot
997	\| INLINE_HINT_loop_iterations
998	\| INLINE_HINT_loop_stride));
999	bool apply_hints2 = (hints & INLINE_HINT_builtin_constant_p);
1000
1001	if (growth <= opt_for_fn (to->decl,
1002	param_max_inline_insns_size))
1003	;
1004	/ Apply param_max_inline_insns_single limit. Do not do so when*
1005	hints suggests that inlining given function is very profitable.
1006	Avoid computation of big_speedup_p when not necessary to change
1007	outcome of decision. /*
1008	else if (DECL_DECLARED_INLINE_P (callee->decl)
1009	&& growth >= inline_insns_single (n: e->caller, hint: apply_hints,
1010	hint2: apply_hints2)
1011	&& (apply_hints \|\| apply_hints2
1012	\|\| growth >= inline_insns_single (n: e->caller, hint: true,
1013	hint2: apply_hints2)
1014	\|\| !big_speedup_p (e)))
1015	{
1016	e->inline_failed = CIF_MAX_INLINE_INSNS_SINGLE_LIMIT;
1017	want_inline = false;
1018	}
1019	else if (!DECL_DECLARED_INLINE_P (callee->decl)
1020	&& !opt_for_fn (e->caller->decl, flag_inline_functions)
1021	&& growth >= opt_for_fn (to->decl,
1022	param_max_inline_insns_small))
1023	{
1024	/ growth_positive_p is expensive, always test it last. /
1025	if (growth >= inline_insns_single (n: e->caller, hint: false, hint2: false)
1026	\|\| growth_positive_p (callee, e, growth))
1027	{
1028	e->inline_failed = CIF_NOT_DECLARED_INLINED;
1029	want_inline = false;
1030	}
1031	}
1032	/ Apply param_max_inline_insns_auto limit for functions not declared*
1033	inline. Bypass the limit when speedup seems big. /*
1034	else if (!DECL_DECLARED_INLINE_P (callee->decl)
1035	&& growth >= inline_insns_auto (n: e->caller, hint: apply_hints,
1036	hint2: apply_hints2)
1037	&& (apply_hints \|\| apply_hints2
1038	\|\| growth >= inline_insns_auto (n: e->caller, hint: true,
1039	hint2: apply_hints2)
1040	\|\| !big_speedup_p (e)))
1041	{
1042	/ growth_positive_p is expensive, always test it last. /
1043	if (growth >= inline_insns_single (n: e->caller, hint: false, hint2: false)
1044	\|\| growth_positive_p (callee, e, growth))
1045	{
1046	e->inline_failed = CIF_MAX_INLINE_INSNS_AUTO_LIMIT;
1047	want_inline = false;
1048	}
1049	}
1050	/ If call is cold, do not inline when function body would grow. /
1051	else if (!e->maybe_hot_p ()
1052	&& (growth >= inline_insns_single (n: e->caller, hint: false, hint2: false)
1053	\|\| growth_positive_p (callee, e, growth)))
1054	{
1055	e->inline_failed = CIF_UNLIKELY_CALL;
1056	want_inline = false;
1057	}
1058	}
1059	if (!want_inline && report)
1060	report_inline_failed_reason (e);
1061	return want_inline;
1062	}
1063
1064	/ EDGE is self recursive edge.*
1065	We handle two cases - when function A is inlining into itself
1066	or when function A is being inlined into another inliner copy of function
1067	A within function B.
1068
1069	In first case OUTER_NODE points to the toplevel copy of A, while
1070	in the second case OUTER_NODE points to the outermost copy of A in B.
1071
1072	In both cases we want to be extra selective since
1073	inlining the call will just introduce new recursive calls to appear. /*
1074
1075	static bool
1076	want_inline_self_recursive_call_p (struct cgraph_edge *edge,
1077	struct cgraph_node *outer_node,
1078	bool peeling,
1079	int depth)
1080	{
1081	char const *reason = NULL;
1082	bool want_inline = true;
1083	sreal caller_freq = `1`;
1084	int max_depth = opt_for_fn (outer_node->decl,
1085	param_max_inline_recursive_depth_auto);
1086
1087	if (DECL_DECLARED_INLINE_P (edge->caller->decl))
1088	max_depth = opt_for_fn (outer_node->decl,
1089	param_max_inline_recursive_depth);
1090
1091	if (!edge->maybe_hot_p ())
1092	{
1093	reason = "recursive call is cold";
1094	want_inline = false;
1095	}
1096	else if (depth > max_depth)
1097	{
1098	reason = "--param max-inline-recursive-depth exceeded.";
1099	want_inline = false;
1100	}
1101	else if (outer_node->inlined_to
1102	&& (caller_freq = outer_node->callers->sreal_frequency ()) == `0`)
1103	{
1104	reason = "caller frequency is 0";
1105	want_inline = false;
1106	}
1107
1108	if (!want_inline)
1109	;
1110	/ Inlining of self recursive function into copy of itself within other*
1111	function is transformation similar to loop peeling.
1112
1113	Peeling is profitable if we can inline enough copies to make probability
1114	of actual call to the self recursive function very small. Be sure that
1115	the probability of recursion is small.
1116
1117	We ensure that the frequency of recursing is at most 1 - (1/max_depth).
1118	This way the expected number of recursion is at most max_depth. /*
1119	else if (peeling)
1120	{
1121	sreal max_prob = (sreal)`1` - ((sreal)`1` / (sreal)max_depth);
1122	int i;
1123	for (i = `1`; i < depth; i++)
1124	max_prob = max_prob * max_prob;
1125	if (edge->sreal_frequency () >= max_prob * caller_freq)
1126	{
1127	reason = "frequency of recursive call is too large";
1128	want_inline = false;
1129	}
1130	}
1131	/ Recursive inlining, i.e. equivalent of unrolling, is profitable if*
1132	recursion depth is large. We reduce function call overhead and increase
1133	chances that things fit in hardware return predictor.
1134
1135	Recursive inlining might however increase cost of stack frame setup
1136	actually slowing down functions whose recursion tree is wide rather than
1137	deep.
1138
1139	Deciding reliably on when to do recursive inlining without profile feedback
1140	is tricky. For now we disable recursive inlining when probability of self
1141	recursion is low.
1142
1143	Recursive inlining of self recursive call within loop also results in
1144	large loop depths that generally optimize badly. We may want to throttle
1145	down inlining in those cases. In particular this seems to happen in one
1146	of libstdc++ rb tree methods. /*
1147	else
1148	{
1149	if (edge->sreal_frequency () * `100`
1150	<= caller_freq
1151	* opt_for_fn (outer_node->decl,
1152	param_min_inline_recursive_probability))
1153	{
1154	reason = "frequency of recursive call is too small";
1155	want_inline = false;
1156	}
1157	}
1158	if (!want_inline && dump_enabled_p ())
1159	dump_printf_loc (MSG_MISSED_OPTIMIZATION, edge->call_stmt,
1160	" not inlining recursively: %s\n", reason);
1161	return want_inline;
1162	}
1163
1164	/ Return true when NODE has uninlinable caller;*
1165	set HAS_HOT_CALL if it has hot call.
1166	Worker for cgraph_for_node_and_aliases. /*
1167
1168	static bool
1169	check_callers (struct cgraph_node node, void* *has_hot_call)
1170	{
1171	struct cgraph_edge *e;
1172	for (e = node->callers; e; e = e->next_caller)
1173	{
1174	if (!opt_for_fn (e->caller->decl, flag_inline_functions_called_once)
1175	\|\| !opt_for_fn (e->caller->decl, optimize))
1176	return true;
1177	if (!can_inline_edge_p (e, report: true))
1178	return true;
1179	if (e->recursive_p ())
1180	return true;
1181	if (!can_inline_edge_by_limits_p (e, report: true))
1182	return true;
1183	/ Inlining large functions to large loop depth is often harmful because*
1184	of register pressure it implies. /*
1185	if ((int)ipa_call_summaries->get (edge: e)->loop_depth
1186	> param_inline_functions_called_once_loop_depth)
1187	return true;
1188	/ Do not produce gigantic functions. /
1189	if (estimate_size_after_inlining (e->caller->inlined_to ?
1190	e->caller->inlined_to : e->caller, e)
1191	> param_inline_functions_called_once_insns)
1192	return true;
1193	if (!((bool* *)has_hot_call) && e->maybe_hot_p ())
1194	(bool* )has_hot_call = true*;
1195	}
1196	return false;
1197	}
1198
1199	/ If NODE has a caller, return true. /
1200
1201	static bool
1202	has_caller_p (struct cgraph_node node, void* *data ATTRIBUTE_UNUSED)
1203	{
1204	if (node->callers)
1205	return true;
1206	return false;
1207	}
1208
1209	/ Decide if inlining NODE would reduce unit size by eliminating*
1210	the offline copy of function.
1211	When COLD is true the cold calls are considered, too. /*
1212
1213	static bool
1214	want_inline_function_to_all_callers_p (struct cgraph_node node, bool* cold)
1215	{
1216	bool has_hot_call = false;
1217
1218	/ Aliases gets inlined along with the function they alias. /
1219	if (node->alias)
1220	return false;
1221	/ Already inlined? /
1222	if (node->inlined_to)
1223	return false;
1224	/ Does it have callers? /
1225	if (!node->call_for_symbol_and_aliases (callback: has_caller_p, NULL, include_overwritable: true))
1226	return false;
1227	/ Inlining into all callers would increase size? /
1228	if (growth_positive_p (node, NULL, INT_MIN) > `0`)
1229	return false;
1230	/ All inlines must be possible. /
1231	if (node->call_for_symbol_and_aliases (callback: check_callers, data: &has_hot_call,
1232	include_overwritable: true))
1233	return false;
1234	if (!cold && !has_hot_call)
1235	return false;
1236	return true;
1237	}
1238
1239	/ Return true if WHERE of SIZE is a possible candidate for wrapper heuristics*
1240	in estimate_edge_badness. /*
1241
1242	static bool
1243	wrapper_heuristics_may_apply (struct cgraph_node where, int* size)
1244	{
1245	return size < (DECL_DECLARED_INLINE_P (where->decl)
1246	? inline_insns_single (n: where, hint: false, hint2: false)
1247	: inline_insns_auto (n: where, hint: false, hint2: false));
1248	}
1249
1250	/ A cost model driving the inlining heuristics in a way so the edges with*
1251	smallest badness are inlined first. After each inlining is performed
1252	the costs of all caller edges of nodes affected are recomputed so the
1253	metrics may accurately depend on values such as number of inlinable callers
1254	of the function or function body size. /*
1255
1256	static sreal
1257	edge_badness (struct cgraph_edge edge, bool* dump)
1258	{
1259	sreal badness;
1260	int growth;
1261	sreal edge_time, unspec_edge_time;
1262	struct cgraph_node *callee = edge->callee->ultimate_alias_target ();
1263	class ipa_fn_summary *callee_info = ipa_fn_summaries->get (node: callee);
1264	ipa_hints hints;
1265	cgraph_node *caller = (edge->caller->inlined_to
1266	? edge->caller->inlined_to
1267	: edge->caller);
1268
1269	growth = estimate_edge_growth (edge);
1270	edge_time = estimate_edge_time (edge, nonspec_time: &unspec_edge_time);
1271	hints = estimate_edge_hints (edge);
1272	gcc_checking_assert (edge_time >= `0`);
1273	/ Check that inlined time is better, but tolerate some roundoff issues.*
1274	FIXME: When callee profile drops to 0 we account calls more. This
1275	should be fixed by never doing that. /*
1276	gcc_checking_assert ((edge_time * `100`
1277	- callee_info->time * `101`).to_int () <= `0`
1278	\|\| callee->count.ipa ().initialized_p ());
1279	gcc_checking_assert (growth <= ipa_size_summaries->get (callee)->size);
1280
1281	if (dump)
1282	{
1283	fprintf (stream: dump_file, format: " Badness calculation for %s -> %s\n",
1284	edge->caller->dump_name (),
1285	edge->callee->dump_name ());
1286	fprintf (stream: dump_file, format: " size growth %i, time %f unspec %f ",
1287	growth,
1288	edge_time.to_double (),
1289	unspec_edge_time.to_double ());
1290	ipa_dump_hints (f: dump_file, hints);
1291	if (big_speedup_p (e: edge))
1292	fprintf (stream: dump_file, format: " big_speedup");
1293	fprintf (stream: dump_file, format: "\n");
1294	}
1295
1296	/ Always prefer inlining saving code size. /
1297	if (growth <= `0`)
1298	{
1299	badness = (sreal) (-SREAL_MIN_SIG + growth) << (SREAL_MAX_EXP / `256`);
1300	if (dump)
1301	fprintf (stream: dump_file, format: " %f: Growth %d <= 0\n", badness.to_double (),
1302	growth);
1303	}
1304	/ Inlining into EXTERNAL functions is not going to change anything unless*
1305	they are themselves inlined. /*
1306	else if (DECL_EXTERNAL (caller->decl))
1307	{
1308	if (dump)
1309	fprintf (stream: dump_file, format: " max: function is external\n");
1310	return sreal::max ();
1311	}
1312	/ When profile is available. Compute badness as:*
1313
1314	time_saved caller_count*
1315	goodness = -------------------------------------------------
1316	growth_of_caller overall_growth * combined_size*
1317
1318	badness = - goodness
1319
1320	Again use negative value to make calls with profile appear hotter
1321	then calls without.
1322	*/
1323	else if (opt_for_fn (caller->decl, flag_guess_branch_prob)
1324	\|\| caller->count.ipa ().nonzero_p ())
1325	{
1326	sreal numerator, denominator;
1327	int overall_growth;
1328	sreal freq = edge->sreal_frequency ();
1329
1330	numerator = inlining_speedup (edge, freq, uninlined_time: unspec_edge_time, inlined_time: edge_time);
1331	if (numerator <= `0`)
1332	numerator = ((sreal) `1` >> `8`);
1333	if (caller->count.ipa ().nonzero_p ())
1334	numerator *= caller->count.ipa ().to_gcov_type ();
1335	else if (caller->count.ipa ().initialized_p ())
1336	numerator = numerator >> `11`;
1337	denominator = growth;
1338
1339	overall_growth = callee_info->growth;
1340
1341	/ Look for inliner wrappers of the form:*
1342
1343	inline_caller ()
1344	{
1345	do_fast_job...
1346	if (need_more_work)
1347	noninline_callee ();
1348	}
1349	Without penalizing this case, we usually inline noninline_callee
1350	into the inline_caller because overall_growth is small preventing
1351	further inlining of inline_caller.
1352
1353	Penalize only callgraph edges to functions with small overall
1354	growth ...
1355	*/
1356	if (growth > overall_growth
1357	/ ... and having only one caller which is not inlined ... /
1358	&& callee_info->single_caller
1359	&& !edge->caller->inlined_to
1360	/ ... and edges executed only conditionally ... /
1361	&& freq < `1`
1362	/ ... consider case where callee is not inline but caller is ... /
1363	&& ((!DECL_DECLARED_INLINE_P (edge->callee->decl)
1364	&& DECL_DECLARED_INLINE_P (caller->decl))
1365	/ ... or when early optimizers decided to split and edge*
1366	frequency still indicates splitting is a win ... /*
1367	\|\| (callee->split_part && !caller->split_part
1368	&& freq * `100`
1369	< opt_for_fn (caller->decl,
1370	param_partial_inlining_entry_probability)
1371	/ ... and do not overwrite user specified hints. /
1372	&& (!DECL_DECLARED_INLINE_P (edge->callee->decl)
1373	\|\| DECL_DECLARED_INLINE_P (caller->decl)))))
1374	{
1375	ipa_fn_summary *caller_info = ipa_fn_summaries->get (node: caller);
1376	int caller_growth = caller_info->growth;
1377
1378	/ Only apply the penalty when caller looks like inline candidate,*
1379	and it is not called once. /*
1380	if (!caller_info->single_caller && overall_growth < caller_growth
1381	&& caller_info->inlinable
1382	&& wrapper_heuristics_may_apply
1383	(where: caller, size: ipa_size_summaries->get (node: caller)->size))
1384	{
1385	if (dump)
1386	fprintf (stream: dump_file,
1387	format: " Wrapper penalty. Increasing growth %i to %i\n",
1388	overall_growth, caller_growth);
1389	overall_growth = caller_growth;
1390	}
1391	}
1392	if (overall_growth > `0`)
1393	{
1394	/ Strongly prefer functions with few callers that can be inlined*
1395	fully. The square root here leads to smaller binaries at average.
1396	Watch however for extreme cases and return to linear function
1397	when growth is large. /*
1398	if (overall_growth < `256`)
1399	overall_growth *= overall_growth;
1400	else
1401	overall_growth += `256` * `256` - `256`;
1402	denominator *= overall_growth;
1403	}
1404	denominator *= ipa_size_summaries->get (node: caller)->size + growth;
1405
1406	badness = - numerator / denominator;
1407
1408	if (dump)
1409	{
1410	fprintf (stream: dump_file,
1411	format: " %f: guessed profile. frequency %f, count %" PRId64
1412	" caller count %" PRId64
1413	" time saved %f"
1414	" overall growth %i (current) %i (original)"
1415	" %i (compensated)\n",
1416	badness.to_double (),
1417	freq.to_double (),
1418	edge->count.ipa ().initialized_p ()
1419	? edge->count.ipa ().to_gcov_type () : -`1`,
1420	caller->count.ipa ().initialized_p ()
1421	? caller->count.ipa ().to_gcov_type () : -`1`,
1422	inlining_speedup (edge, freq, uninlined_time: unspec_edge_time,
1423	inlined_time: edge_time).to_double (),
1424	estimate_growth (callee),
1425	callee_info->growth, overall_growth);
1426	}
1427	}
1428	/ When function local profile is not available or it does not give*
1429	useful information (i.e. frequency is zero), base the cost on
1430	loop nest and overall size growth, so we optimize for overall number
1431	of functions fully inlined in program. /*
1432	else
1433	{
1434	int nest = MIN (ipa_call_summaries->get (edge)->loop_depth, `8`);
1435	badness = growth;
1436
1437	/ Decrease badness if call is nested. /
1438	if (badness > `0`)
1439	badness = badness >> nest;
1440	else
1441	badness = badness << nest;
1442	if (dump)
1443	fprintf (stream: dump_file, format: " %f: no profile. nest %i\n",
1444	badness.to_double (), nest);
1445	}
1446	gcc_checking_assert (badness != `0`);
1447
1448	if (edge->recursive_p ())
1449	badness = badness.shift (s: badness > `0` ? `4` : -`4`);
1450	if ((hints & (INLINE_HINT_indirect_call
1451	\| INLINE_HINT_loop_iterations
1452	\| INLINE_HINT_loop_stride))
1453	\|\| callee_info->growth <= `0`)
1454	badness = badness.shift (s: badness > `0` ? -`2` : `2`);
1455	if (hints & INLINE_HINT_builtin_constant_p)
1456	badness = badness.shift (s: badness > `0` ? -`4` : `4`);
1457	if (hints & (INLINE_HINT_same_scc))
1458	badness = badness.shift (s: badness > `0` ? `3` : -`3`);
1459	else if (hints & (INLINE_HINT_in_scc))
1460	badness = badness.shift (s: badness > `0` ? `2` : -`2`);
1461	else if (hints & (INLINE_HINT_cross_module))
1462	badness = badness.shift (s: badness > `0` ? `1` : -`1`);
1463	if (DECL_DISREGARD_INLINE_LIMITS (callee->decl))
1464	badness = badness.shift (s: badness > `0` ? -`4` : `4`);
1465	else if ((hints & INLINE_HINT_declared_inline))
1466	badness = badness.shift (s: badness > `0` ? -`3` : `3`);
1467	if (dump)
1468	fprintf (stream: dump_file, format: " Adjusted by hints %f\n", badness.to_double ());
1469	return badness;
1470	}
1471
1472	/ Recompute badness of EDGE and update its key in HEAP if needed. /
1473	static inline void
1474	update_edge_key (edge_heap_t heap, struct* cgraph_edge *edge)
1475	{
1476	sreal badness = edge_badness (edge, dump: false);
1477	if (edge->aux)
1478	{
1479	edge_heap_node_t n = (edge_heap_node_t ) edge->aux;
1480	gcc_checking_assert (n->get_data () == edge);
1481
1482	/ fibonacci_heap::replace_key does busy updating of the*
1483	heap that is unnecessarily expensive.
1484	We do lazy increases: after extracting minimum if the key
1485	turns out to be out of date, it is re-inserted into heap
1486	with correct value. /*
1487	if (badness < n->get_key ().badness)
1488	{
1489	if (dump_file && (dump_flags & TDF_DETAILS))
1490	{
1491	fprintf (stream: dump_file,
1492	format: " decreasing badness %s -> %s, %f to %f\n",
1493	edge->caller->dump_name (),
1494	edge->callee->dump_name (),
1495	n->get_key ().badness.to_double (),
1496	badness.to_double ());
1497	}
1498	inline_badness b (edge, badness);
1499	heap->decrease_key (node: n, key: b);
1500	}
1501	}
1502	else
1503	{
1504	if (dump_file && (dump_flags & TDF_DETAILS))
1505	{
1506	fprintf (stream: dump_file,
1507	format: " enqueuing call %s -> %s, badness %f\n",
1508	edge->caller->dump_name (),
1509	edge->callee->dump_name (),
1510	badness.to_double ());
1511	}
1512	inline_badness b (edge, badness);
1513	edge->aux = heap->insert (key: b, data: edge);
1514	}
1515	}
1516
1517
1518	/ NODE was inlined.*
1519	All caller edges needs to be reset because
1520	size estimates change. Similarly callees needs reset
1521	because better context may be known. /*
1522
1523	static void
1524	reset_edge_caches (struct cgraph_node *node)
1525	{
1526	struct cgraph_edge *edge;
1527	struct cgraph_edge *e = node->callees;
1528	struct cgraph_node *where = node;
1529	struct ipa_ref *ref;
1530
1531	if (where->inlined_to)
1532	where = where->inlined_to;
1533
1534	reset_node_cache (node: where);
1535
1536	if (edge_growth_cache != NULL)
1537	for (edge = where->callers; edge; edge = edge->next_caller)
1538	if (edge->inline_failed)
1539	edge_growth_cache->remove (edge);
1540
1541	FOR_EACH_ALIAS (where, ref)
1542	reset_edge_caches (node: dyn_cast <cgraph_node *> (p: ref->referring));
1543
1544	if (!e)
1545	return;
1546
1547	while (true)
1548	if (!e->inline_failed && e->callee->callees)
1549	e = e->callee->callees;
1550	else
1551	{
1552	if (edge_growth_cache != NULL && e->inline_failed)
1553	edge_growth_cache->remove (edge: e);
1554	if (e->next_callee)
1555	e = e->next_callee;
1556	else
1557	{
1558	do
1559	{
1560	if (e->caller == node)
1561	return;
1562	e = e->caller->callers;
1563	}
1564	while (!e->next_callee);
1565	e = e->next_callee;
1566	}
1567	}
1568	}
1569
1570	/ Recompute HEAP nodes for each of caller of NODE.*
1571	UPDATED_NODES track nodes we already visited, to avoid redundant work.
1572	When CHECK_INLINABLITY_FOR is set, re-check for specified edge that
1573	it is inlinable. Otherwise check all edges. /*
1574
1575	static void
1576	update_caller_keys (edge_heap_t heap, struct* cgraph_node *node,
1577	bitmap updated_nodes,
1578	struct cgraph_edge *check_inlinablity_for)
1579	{
1580	struct cgraph_edge *edge;
1581	struct ipa_ref *ref;
1582
1583	if ((!node->alias && !ipa_fn_summaries->get (node)->inlinable)
1584	\|\| node->inlined_to)
1585	return;
1586	if (!bitmap_set_bit (updated_nodes, node->get_uid ()))
1587	return;
1588
1589	FOR_EACH_ALIAS (node, ref)
1590	{
1591	struct cgraph_node alias = dyn_cast <cgraph_node > (p: ref->referring);
1592	update_caller_keys (heap, node: alias, updated_nodes, check_inlinablity_for);
1593	}
1594
1595	for (edge = node->callers; edge; edge = edge->next_caller)
1596	if (edge->inline_failed)
1597	{
1598	if (!check_inlinablity_for
1599	\|\| check_inlinablity_for == edge)
1600	{
1601	if (can_inline_edge_p (e: edge, report: false)
1602	&& want_inline_small_function_p (e: edge, report: false)
1603	&& can_inline_edge_by_limits_p (e: edge, report: false))
1604	update_edge_key (heap, edge);
1605	else if (edge->aux)
1606	{
1607	report_inline_failed_reason (e: edge);
1608	heap->delete_node (node: (edge_heap_node_t *) edge->aux);
1609	edge->aux = NULL;
1610	}
1611	}
1612	else if (edge->aux)
1613	update_edge_key (heap, edge);
1614	}
1615	}
1616
1617	/ Recompute HEAP nodes for each uninlined call in NODE*
1618	If UPDATE_SINCE is non-NULL check if edges called within that function
1619	are inlinable (typically UPDATE_SINCE is the inline clone we introduced
1620	where all edges have new context).
1621
1622	This is used when we know that edge badnesses are going only to increase
1623	(we introduced new call site) and thus all we need is to insert newly
1624	created edges into heap. /*
1625
1626	static void
1627	update_callee_keys (edge_heap_t heap, struct* cgraph_node *node,
1628	struct cgraph_node *update_since,
1629	bitmap updated_nodes)
1630	{
1631	struct cgraph_edge *e = node->callees;
1632	bool check_inlinability = update_since == node;
1633
1634	if (!e)
1635	return;
1636	while (true)
1637	if (!e->inline_failed && e->callee->callees)
1638	{
1639	if (e->callee == update_since)
1640	check_inlinability = true;
1641	e = e->callee->callees;
1642	}
1643	else
1644	{
1645	enum availability avail;
1646	struct cgraph_node *callee;
1647	if (!check_inlinability)
1648	{
1649	if (e->aux
1650	&& !bitmap_bit_p (updated_nodes,
1651	e->callee->ultimate_alias_target
1652	(availability: &avail, ref: e->caller)->get_uid ()))
1653	update_edge_key (heap, edge: e);
1654	}
1655	/ We do not reset callee growth cache here. Since we added a new call,*
1656	growth should have just increased and consequently badness metric
1657	don't need updating. /*
1658	else if (e->inline_failed
1659	&& (callee = e->callee->ultimate_alias_target (availability: &avail,
1660	ref: e->caller))
1661	&& avail >= AVAIL_AVAILABLE
1662	&& ipa_fn_summaries->get (node: callee) != NULL
1663	&& ipa_fn_summaries->get (node: callee)->inlinable
1664	&& !bitmap_bit_p (updated_nodes, callee->get_uid ()))
1665	{
1666	if (can_inline_edge_p (e, report: false)
1667	&& want_inline_small_function_p (e, report: false)
1668	&& can_inline_edge_by_limits_p (e, report: false))
1669	{
1670	gcc_checking_assert (check_inlinability \|\| can_inline_edge_p (e, false));
1671	gcc_checking_assert (check_inlinability \|\| e->aux);
1672	update_edge_key (heap, edge: e);
1673	}
1674	else if (e->aux)
1675	{
1676	report_inline_failed_reason (e);
1677	heap->delete_node (node: (edge_heap_node_t *) e->aux);
1678	e->aux = NULL;
1679	}
1680	}
1681	/ In case we redirected to unreachable node we only need to remove the*
1682	fibheap entry. /*
1683	else if (e->aux)
1684	{
1685	heap->delete_node (node: (edge_heap_node_t *) e->aux);
1686	e->aux = NULL;
1687	}
1688	if (e->next_callee)
1689	e = e->next_callee;
1690	else
1691	{
1692	do
1693	{
1694	if (e->caller == node)
1695	return;
1696	if (e->caller == update_since)
1697	check_inlinability = false;
1698	e = e->caller->callers;
1699	}
1700	while (!e->next_callee);
1701	e = e->next_callee;
1702	}
1703	}
1704	}
1705
1706	/ Enqueue all recursive calls from NODE into priority queue depending on*
1707	how likely we want to recursively inline the call. /*
1708
1709	static void
1710	lookup_recursive_calls (struct cgraph_node node, struct* cgraph_node *where,
1711	edge_heap_t *heap)
1712	{
1713	struct cgraph_edge *e;
1714	enum availability avail;
1715
1716	for (e = where->callees; e; e = e->next_callee)
1717	if (e->callee == node
1718	\|\| (e->callee->ultimate_alias_target (availability: &avail, ref: e->caller) == node
1719	&& avail > AVAIL_INTERPOSABLE))
1720	{
1721	inline_badness b (e, -e->sreal_frequency ());
1722	heap->insert (key: b, data: e);
1723	}
1724	for (e = where->callees; e; e = e->next_callee)
1725	if (!e->inline_failed)
1726	lookup_recursive_calls (node, where: e->callee, heap);
1727	}
1728
/* Decide on recursive inlining: in the case the function has recursive
   calls, inline until the body size reaches the given limit.  If any new
   indirect edges are discovered in the process, add them to *NEW_EDGES,
   unless NEW_EDGES is NULL.  */
1733
1734	static bool
1735	recursive_inlining (struct cgraph_edge *edge,
1736	vec<cgraph_edge > new_edges)
1737	{
1738	cgraph_node *to = (edge->caller->inlined_to
1739	? edge->caller->inlined_to : edge->caller);
1740	int limit = opt_for_fn (to->decl,
1741	param_max_inline_insns_recursive_auto);
1742	inline_badness b (edge, sreal::min ());
1743	edge_heap_t heap (b);
1744	struct cgraph_node *node;
1745	struct cgraph_edge *e;
1746	struct cgraph_node master_clone = NULL, next;
1747	int depth = `0`;
1748	int n = `0`;
1749
1750	node = edge->caller;
1751	if (node->inlined_to)
1752	node = node->inlined_to;
1753
1754	if (DECL_DECLARED_INLINE_P (node->decl))
1755	limit = opt_for_fn (to->decl, param_max_inline_insns_recursive);
1756
1757	/ Make sure that function is small enough to be considered for inlining. /
1758	if (estimate_size_after_inlining (node, edge) >= limit)
1759	return false;
1760	lookup_recursive_calls (node, where: node, heap: &heap);
1761	if (heap.empty ())
1762	return false;
1763
1764	if (dump_file)
1765	fprintf (stream: dump_file,
1766	format: " Performing recursive inlining on %s\n", node->dump_name ());
1767
1768	/ Do the inlining and update list of recursive call during process. /
1769	while (!heap.empty ())
1770	{
1771	struct cgraph_edge *curr = heap.extract_min ();
1772	struct cgraph_node cnode, dest = curr->callee;
1773
1774	if (!can_inline_edge_p (e: curr, report: true)
1775	\|\| !can_inline_edge_by_limits_p (e: curr, report: true))
1776	continue;
1777
1778	/ MASTER_CLONE is produced in the case we already started modified*
1779	the function. Be sure to redirect edge to the original body before
1780	estimating growths otherwise we will be seeing growths after inlining
1781	the already modified body. /*
1782	if (master_clone)
1783	{
1784	curr->redirect_callee (n: master_clone);
1785	if (edge_growth_cache != NULL)
1786	edge_growth_cache->remove (edge: curr);
1787	}
1788
1789	if (estimate_size_after_inlining (node, curr) > limit)
1790	{
1791	curr->redirect_callee (n: dest);
1792	if (edge_growth_cache != NULL)
1793	edge_growth_cache->remove (edge: curr);
1794	break;
1795	}
1796
1797	depth = `1`;
1798	for (cnode = curr->caller;
1799	cnode->inlined_to; cnode = cnode->callers->caller)
1800	if (node->decl
1801	== curr->callee->ultimate_alias_target ()->decl)
1802	depth++;
1803
1804	if (!want_inline_self_recursive_call_p (edge: curr, outer_node: node, peeling: false, depth))
1805	{
1806	curr->redirect_callee (n: dest);
1807	if (edge_growth_cache != NULL)
1808	edge_growth_cache->remove (edge: curr);
1809	continue;
1810	}
1811
1812	if (dump_file)
1813	{
1814	fprintf (stream: dump_file,
1815	format: " Inlining call of depth %i", depth);
1816	if (node->count.nonzero_p () && curr->count.initialized_p ())
1817	{
1818	fprintf (stream: dump_file, format: " called approx. %.2f times per call",
1819	(double)curr->count.to_gcov_type ()
1820	/ node->count.to_gcov_type ());
1821	}
1822	fprintf (stream: dump_file, format: "\n");
1823	}
1824	if (!master_clone)
1825	{
1826	/ We need original clone to copy around. /
1827	master_clone = node->create_clone (decl: node->decl, count: node->count,
1828	update_original: false, redirect_callers: vNULL, call_duplication_hook: true, NULL, NULL);
1829	for (e = master_clone->callees; e; e = e->next_callee)
1830	if (!e->inline_failed)
1831	clone_inlined_nodes (e, true, false, NULL);
1832	curr->redirect_callee (n: master_clone);
1833	if (edge_growth_cache != NULL)
1834	edge_growth_cache->remove (edge: curr);
1835	}
1836
1837	inline_call (curr, false, new_edges, &overall_size, true);
1838	reset_node_cache (node);
1839	lookup_recursive_calls (node, where: curr->callee, heap: &heap);
1840	n++;
1841	}
1842
1843	if (!heap.empty () && dump_file)
1844	fprintf (stream: dump_file, format: " Recursive inlining growth limit met.\n");
1845
1846	if (!master_clone)
1847	return false;
1848
1849	if (dump_enabled_p ())
1850	dump_printf_loc (MSG_NOTE, edge->call_stmt,
1851	"\n Inlined %i times, "
1852	"body grown from size %i to %i, time %f to %f\n", n,
1853	ipa_size_summaries->get (node: master_clone)->size,
1854	ipa_size_summaries->get (node)->size,
1855	ipa_fn_summaries->get (node: master_clone)->time.to_double (),
1856	ipa_fn_summaries->get (node)->time.to_double ());
1857
1858	/ Remove master clone we used for inlining. We rely that clones inlined*
1859	into master clone gets queued just before master clone so we don't
1860	need recursion. /*
1861	for (node = symtab->first_function (); node != master_clone;
1862	node = next)
1863	{
1864	next = symtab->next_function (node);
1865	if (node->inlined_to == master_clone)
1866	node->remove ();
1867	}
1868	master_clone->remove ();
1869	return true;
1870	}
1871
1872
1873	/ Given whole compilation unit estimate of INSNS, compute how large we can*
1874	allow the unit to grow. /*
1875
1876	static int64_t
1877	compute_max_insns (cgraph_node node, int* insns)
1878	{
1879	int max_insns = insns;
1880	if (max_insns < opt_for_fn (node->decl, param_large_unit_insns))
1881	max_insns = opt_for_fn (node->decl, param_large_unit_insns);
1882
1883	return ((int64_t) max_insns
1884	* (`100` + opt_for_fn (node->decl, param_inline_unit_growth)) / `100`);
1885	}
1886
1887
1888	/ Compute badness of all edges in NEW_EDGES and add them to the HEAP. /
1889
1890	static void
1891	add_new_edges_to_heap (edge_heap_t heap, vec<cgraph_edge > &new_edges)
1892	{
1893	while (new_edges.length () > `0`)
1894	{
1895	struct cgraph_edge *edge = new_edges.pop ();
1896
1897	gcc_assert (!edge->aux);
1898	gcc_assert (edge->callee);
1899	if (edge->inline_failed
1900	&& can_inline_edge_p (e: edge, report: true)
1901	&& want_inline_small_function_p (e: edge, report: true)
1902	&& can_inline_edge_by_limits_p (e: edge, report: true))
1903	{
1904	inline_badness b (edge, edge_badness (edge, dump: false));
1905	edge->aux = heap->insert (key: b, data: edge);
1906	}
1907	}
1908	}
1909
1910	/ Remove EDGE from the fibheap. /
1911
1912	static void
1913	heap_edge_removal_hook (struct cgraph_edge e, void* *data)
1914	{
1915	if (e->aux)
1916	{
1917	((edge_heap_t )data)->delete_node (node: (edge_heap_node_t )e->aux);
1918	e->aux = NULL;
1919	}
1920	}
1921
1922	/ Return true if speculation of edge E seems useful.*
1923	If ANTICIPATE_INLINING is true, be conservative and hope that E
1924	may get inlined. /*
1925
1926	bool
1927	speculation_useful_p (struct cgraph_edge e, bool* anticipate_inlining)
1928	{
1929	/ If we have already decided to inline the edge, it seems useful. /
1930	if (!e->inline_failed)
1931	return true;
1932
1933	enum availability avail;
1934	struct cgraph_node *target = e->callee->ultimate_alias_target (availability: &avail,
1935	ref: e->caller);
1936
1937	gcc_assert (e->speculative && !e->indirect_unknown_callee);
1938
1939	if (!e->maybe_hot_p ())
1940	return false;
1941
1942	/ See if IP optimizations found something potentially useful about the*
1943	function. For now we look only for CONST/PURE flags. Almost everything
1944	else we propagate is useless. /*
1945	if (avail >= AVAIL_AVAILABLE)
1946	{
1947	int ecf_flags = flags_from_decl_or_type (target->decl);
1948	if (ecf_flags & ECF_CONST)
1949	{
1950	if (!(e->speculative_call_indirect_edge ()->indirect_info
1951	->ecf_flags & ECF_CONST))
1952	return true;
1953	}
1954	else if (ecf_flags & ECF_PURE)
1955	{
1956	if (!(e->speculative_call_indirect_edge ()->indirect_info
1957	->ecf_flags & ECF_PURE))
1958	return true;
1959	}
1960	}
1961	/ If we did not managed to inline the function nor redirect*
1962	to an ipa-cp clone (that are seen by having local flag set),
1963	it is probably pointless to inline it unless hardware is missing
1964	indirect call predictor. /*
1965	if (!anticipate_inlining && !target->local)
1966	return false;
1967	/ For overwritable targets there is not much to do. /
1968	if (!can_inline_edge_p (e, report: false)
1969	\|\| !can_inline_edge_by_limits_p (e, report: false, disregard_limits: true))
1970	return false;
1971	/ OK, speculation seems interesting. /
1972	return true;
1973	}
1974
1975	/ We know that EDGE is not going to be inlined.*
1976	See if we can remove speculation. /*
1977
1978	static void
1979	resolve_noninline_speculation (edge_heap_t edge_heap, struct* cgraph_edge *edge)
1980	{
1981	if (edge->speculative && !speculation_useful_p (e: edge, anticipate_inlining: false))
1982	{
1983	struct cgraph_node *node = edge->caller;
1984	struct cgraph_node *where = node->inlined_to
1985	? node->inlined_to : node;
1986	auto_bitmap updated_nodes;
1987
1988	if (edge->count.ipa ().initialized_p ())
1989	spec_rem += edge->count.ipa ();
1990	cgraph_edge::resolve_speculation (edge);
1991	reset_edge_caches (node: where);
1992	ipa_update_overall_fn_summary (node: where);
1993	update_caller_keys (heap: edge_heap, node: where,
1994	updated_nodes, NULL);
1995	update_callee_keys (heap: edge_heap, node: where, NULL,
1996	updated_nodes);
1997	}
1998	}
1999
2000	/ Return true if NODE should be accounted for overall size estimate.*
2001	Skip all nodes optimized for size so we can measure the growth of hot
2002	part of program no matter of the padding. /*
2003
2004	bool
2005	inline_account_function_p (struct cgraph_node *node)
2006	{
2007	return (!DECL_EXTERNAL (node->decl)
2008	&& !opt_for_fn (node->decl, optimize_size)
2009	&& node->frequency != NODE_FREQUENCY_UNLIKELY_EXECUTED);
2010	}
2011
2012	/ Count number of callers of NODE and store it into DATA (that*
2013	points to int. Worker for cgraph_for_node_and_aliases. /*
2014
2015	static bool
2016	sum_callers (struct cgraph_node node, void* *data)
2017	{
2018	struct cgraph_edge *e;
2019	int num_calls = (int* *)data;
2020
2021	for (e = node->callers; e; e = e->next_caller)
2022	(*num_calls)++;
2023	return false;
2024	}
2025
2026	/ We only propagate across edges with non-interposable callee. /
2027
2028	inline bool
2029	ignore_edge_p (struct cgraph_edge *e)
2030	{
2031	enum availability avail;
2032	e->callee->function_or_virtual_thunk_symbol (avail: &avail, ref: e->caller);
2033	return (avail <= AVAIL_INTERPOSABLE);
2034	}
2035
2036	/ We use greedy algorithm for inlining of small functions:*
2037	All inline candidates are put into prioritized heap ordered in
2038	increasing badness.
2039
2040	The inlining of small functions is bounded by unit growth parameters. /*
2041
2042	static void
2043	inline_small_functions (void)
2044	{
2045	struct cgraph_node *node;
2046	struct cgraph_edge *edge;
2047	inline_badness b;
2048	edge_heap_t edge_heap (b);
2049	auto_bitmap updated_nodes;
2050	int min_size;
2051	auto_vec<cgraph_edge *> new_indirect_edges;
2052	int initial_size = `0`;
2053	struct cgraph_node *order = XCNEWVEC (cgraph_node , symtab->cgraph_count);
2054	struct cgraph_edge_hook_list *edge_removal_hook_holder;
2055	new_indirect_edges.create (nelems: `8`);
2056
2057	edge_removal_hook_holder
2058	= symtab->add_edge_removal_hook (hook: &heap_edge_removal_hook, data: &edge_heap);
2059
2060	/ Compute overall unit size and other global parameters used by badness*
2061	metrics. /*
2062
2063	max_count = profile_count::uninitialized ();
2064	ipa_reduced_postorder (order, true, ignore_edge: ignore_edge_p);
2065	free (ptr: order);
2066
2067	FOR_EACH_DEFINED_FUNCTION (node)
2068	if (!node->inlined_to)
2069	{
2070	if (!node->alias && node->analyzed
2071	&& (node->has_gimple_body_p () \|\| node->thunk)
2072	&& opt_for_fn (node->decl, optimize))
2073	{
2074	class ipa_fn_summary *info = ipa_fn_summaries->get (node);
2075	struct ipa_dfs_info dfs = (struct* ipa_dfs_info *) node->aux;
2076
2077	/ Do not account external functions, they will be optimized out*
2078	if not inlined. Also only count the non-cold portion of program. /*
2079	if (inline_account_function_p (node))
2080	initial_size += ipa_size_summaries->get (node)->size;
2081	info->growth = estimate_growth (node);
2082
2083	int num_calls = `0`;
2084	node->call_for_symbol_and_aliases (callback: sum_callers, data: &num_calls,
2085	include_overwritable: true);
2086	if (num_calls == `1`)
2087	info->single_caller = true;
2088	if (dfs && dfs->next_cycle)
2089	{
2090	struct cgraph_node *n2;
2091	int id = dfs->scc_no + `1`;
2092	for (n2 = node; n2;
2093	n2 = ((struct ipa_dfs_info *) n2->aux)->next_cycle)
2094	if (opt_for_fn (n2->decl, optimize))
2095	{
2096	ipa_fn_summary *info2 = ipa_fn_summaries->get
2097	(node: n2->inlined_to ? n2->inlined_to : n2);
2098	if (info2->scc_no)
2099	break;
2100	info2->scc_no = id;
2101	}
2102	}
2103	}
2104
2105	for (edge = node->callers; edge; edge = edge->next_caller)
2106	max_count = max_count.max (other: edge->count.ipa ());
2107	}
2108	ipa_free_postorder_info ();
2109	initialize_growth_caches ();
2110
2111	if (dump_file)
2112	fprintf (stream: dump_file,
2113	format: "\nDeciding on inlining of small functions. Starting with size %i.\n",
2114	initial_size);
2115
2116	overall_size = initial_size;
2117	min_size = overall_size;
2118
2119	/ Populate the heap with all edges we might inline. /
2120
2121	FOR_EACH_DEFINED_FUNCTION (node)
2122	{
2123	bool update = false;
2124	struct cgraph_edge *next = NULL;
2125	bool has_speculative = false;
2126
2127	if (!opt_for_fn (node->decl, optimize)
2128	/ With -Og we do not want to perform IPA inlining of small*
2129	functions since there are no scalar cleanups after it
2130	that would realize the anticipated win. All abstraction
2131	is removed during early inlining. /*
2132	\|\| opt_for_fn (node->decl, optimize_debug))
2133	continue;
2134
2135	if (dump_file)
2136	fprintf (stream: dump_file, format: "Enqueueing calls in %s.\n", node->dump_name ());
2137
2138	for (edge = node->callees; edge; edge = edge->next_callee)
2139	{
2140	if (edge->inline_failed
2141	&& !edge->aux
2142	&& can_inline_edge_p (e: edge, report: true)
2143	&& want_inline_small_function_p (e: edge, report: true)
2144	&& can_inline_edge_by_limits_p (e: edge, report: true)
2145	&& edge->inline_failed)
2146	{
2147	gcc_assert (!edge->aux);
2148	update_edge_key (heap: &edge_heap, edge);
2149	}
2150	if (edge->speculative)
2151	has_speculative = true;
2152	}
2153	if (has_speculative)
2154	for (edge = node->callees; edge; edge = next)
2155	{
2156	next = edge->next_callee;
2157	if (edge->speculative
2158	&& !speculation_useful_p (e: edge, anticipate_inlining: edge->aux != NULL))
2159	{
2160	cgraph_edge::resolve_speculation (edge);
2161	update = true;
2162	}
2163	}
2164	if (update)
2165	{
2166	struct cgraph_node *where = node->inlined_to
2167	? node->inlined_to : node;
2168	ipa_update_overall_fn_summary (node: where);
2169	reset_edge_caches (node: where);
2170	update_caller_keys (heap: &edge_heap, node: where,
2171	updated_nodes, NULL);
2172	update_callee_keys (heap: &edge_heap, node: where, NULL,
2173	updated_nodes);
2174	bitmap_clear (updated_nodes);
2175	}
2176	}
2177
2178	gcc_assert (in_lto_p
2179	\|\| !(max_count > `0`)
2180	\|\| (profile_info && flag_branch_probabilities));
2181
2182	while (!edge_heap.empty ())
2183	{
2184	int old_size = overall_size;
2185	struct cgraph_node where, callee;
2186	sreal badness = edge_heap.min_key ().badness;
2187	sreal current_badness;
2188	int growth;
2189
2190	edge = edge_heap.extract_min ();
2191	gcc_assert (edge->aux);
2192	edge->aux = NULL;
2193	if (!edge->inline_failed \|\| !edge->callee->analyzed)
2194	continue;
2195
2196	/ Be sure that caches are maintained consistent.*
2197	This check is affected by scaling roundoff errors when compiling for
2198	IPA this we skip it in that case. /*
2199	if (flag_checking && !edge->callee->count.ipa_p ()
2200	&& (!max_count.initialized_p () \|\| !max_count.nonzero_p ()))
2201	{
2202	sreal cached_badness = edge_badness (edge, dump: false);
2203
2204	int old_size_est = estimate_edge_size (edge);
2205	sreal old_time_est = estimate_edge_time (edge);
2206	int old_hints_est = estimate_edge_hints (edge);
2207
2208	if (edge_growth_cache != NULL)
2209	edge_growth_cache->remove (edge);
2210	reset_node_cache (node: edge->caller->inlined_to
2211	? edge->caller->inlined_to
2212	: edge->caller);
2213	gcc_assert (old_size_est == estimate_edge_size (edge));
2214	gcc_assert (old_time_est == estimate_edge_time (edge));
2215	/ FIXME:*
2216
2217	gcc_assert (old_hints_est == estimate_edge_hints (edge));
2218
2219	fails with profile feedback because some hints depends on
2220	maybe_hot_edge_p predicate and because callee gets inlined to other
2221	calls, the edge may become cold.
2222	This ought to be fixed by computing relative probabilities
2223	for given invocation but that will be better done once whole
2224	code is converted to sreals. Disable for now and revert to "wrong"
2225	value so enable/disable checking paths agree. /*
2226	edge_growth_cache->get (edge)->hints = old_hints_est + `1`;
2227
2228	/ When updating the edge costs, we only decrease badness in the keys.*
2229	Increases of badness are handled lazily; when we see key with out
2230	of date value on it, we re-insert it now. /*
2231	current_badness = edge_badness (edge, dump: false);
2232	gcc_assert (cached_badness == current_badness);
2233	gcc_assert (current_badness >= badness);
2234	}
2235	else
2236	current_badness = edge_badness (edge, dump: false);
2237	if (current_badness != badness)
2238	{
2239	if (edge_heap.min () && current_badness > edge_heap.min_key ().badness)
2240	{
2241	inline_badness b (edge, current_badness);
2242	edge->aux = edge_heap.insert (key: b, data: edge);
2243	continue;
2244	}
2245	else
2246	badness = current_badness;
2247	}
2248
2249	if (!can_inline_edge_p (e: edge, report: true)
2250	\|\| !can_inline_edge_by_limits_p (e: edge, report: true))
2251	{
2252	resolve_noninline_speculation (edge_heap: &edge_heap, edge);
2253	continue;
2254	}
2255
2256	callee = edge->callee->ultimate_alias_target ();
2257	growth = estimate_edge_growth (edge);
2258	if (dump_file)
2259	{
2260	fprintf (stream: dump_file,
2261	format: "\nConsidering %s with %i size\n",
2262	callee->dump_name (),
2263	ipa_size_summaries->get (node: callee)->size);
2264	fprintf (stream: dump_file,
2265	format: " to be inlined into %s in %s:%i\n"
2266	" Estimated badness is %f, frequency %.2f.\n",
2267	edge->caller->dump_name (),
2268	edge->call_stmt
2269	&& (LOCATION_LOCUS (gimple_location ((const gimple *)
2270	edge->call_stmt))
2271	> BUILTINS_LOCATION)
2272	? gimple_filename (stmt: (const gimple *) edge->call_stmt)
2273	: "unknown",
2274	edge->call_stmt
2275	? gimple_lineno (stmt: (const gimple *) edge->call_stmt)
2276	: -`1`,
2277	badness.to_double (),
2278	edge->sreal_frequency ().to_double ());
2279	if (edge->count.ipa ().initialized_p ())
2280	{
2281	fprintf (stream: dump_file, format: " Called ");
2282	edge->count.ipa ().dump (f: dump_file);
2283	fprintf (stream: dump_file, format: " times\n");
2284	}
2285	if (dump_flags & TDF_DETAILS)
2286	edge_badness (edge, dump: true);
2287	}
2288
2289	where = edge->caller;
2290
2291	if (overall_size + growth > compute_max_insns (node: where, insns: min_size)
2292	&& !DECL_DISREGARD_INLINE_LIMITS (callee->decl))
2293	{
2294	edge->inline_failed = CIF_INLINE_UNIT_GROWTH_LIMIT;
2295	report_inline_failed_reason (e: edge);
2296	resolve_noninline_speculation (edge_heap: &edge_heap, edge);
2297	continue;
2298	}
2299
2300	if (!want_inline_small_function_p (e: edge, report: true))
2301	{
2302	resolve_noninline_speculation (edge_heap: &edge_heap, edge);
2303	continue;
2304	}
2305
2306	profile_count old_count = callee->count;
2307
2308	/ Heuristics for inlining small functions work poorly for*
2309	recursive calls where we do effects similar to loop unrolling.
2310	When inlining such edge seems profitable, leave decision on
2311	specific inliner. /*
2312	if (edge->recursive_p ())
2313	{
2314	if (where->inlined_to)
2315	where = where->inlined_to;
2316	if (!recursive_inlining (edge,
2317	opt_for_fn (edge->caller->decl,
2318	flag_indirect_inlining)
2319	? &new_indirect_edges : NULL))
2320	{
2321	edge->inline_failed = CIF_RECURSIVE_INLINING;
2322	resolve_noninline_speculation (edge_heap: &edge_heap, edge);
2323	continue;
2324	}
2325	reset_edge_caches (node: where);
2326	/ Recursive inliner inlines all recursive calls of the function*
2327	at once. Consequently we need to update all callee keys. /*
2328	if (opt_for_fn (edge->caller->decl, flag_indirect_inlining))
2329	add_new_edges_to_heap (heap: &edge_heap, new_edges&: new_indirect_edges);
2330	update_callee_keys (heap: &edge_heap, node: where, update_since: where, updated_nodes);
2331	bitmap_clear (updated_nodes);
2332	}
2333	else
2334	{
2335	struct cgraph_node *outer_node = NULL;
2336	int depth = `0`;
2337
2338	/ Consider the case where self recursive function A is inlined*
2339	into B. This is desired optimization in some cases, since it
2340	leads to effect similar of loop peeling and we might completely
2341	optimize out the recursive call. However we must be extra
2342	selective. /*
2343
2344	where = edge->caller;
2345	while (where->inlined_to)
2346	{
2347	if (where->decl == callee->decl)
2348	outer_node = where, depth++;
2349	where = where->callers->caller;
2350	}
2351	if (outer_node
2352	&& !want_inline_self_recursive_call_p (edge, outer_node,
2353	peeling: true, depth))
2354	{
2355	edge->inline_failed
2356	= (DECL_DISREGARD_INLINE_LIMITS (edge->callee->decl)
2357	? CIF_RECURSIVE_INLINING : CIF_UNSPECIFIED);
2358	resolve_noninline_speculation (edge_heap: &edge_heap, edge);
2359	continue;
2360	}
2361	else if (depth && dump_file)
2362	fprintf (stream: dump_file, format: " Peeling recursion with depth %i\n", depth);
2363
2364	gcc_checking_assert (!callee->inlined_to);
2365
2366	int old_size = ipa_size_summaries->get (node: where)->size;
2367	sreal old_time = ipa_fn_summaries->get (node: where)->time;
2368
2369	inline_call (edge, true, &new_indirect_edges, &overall_size, true);
2370	reset_edge_caches (node: edge->callee);
2371	add_new_edges_to_heap (heap: &edge_heap, new_edges&: new_indirect_edges);
2372
2373	/ If caller's size and time increased we do not need to update*
2374	all edges because badness is not going to decrease. /*
2375	if (old_size <= ipa_size_summaries->get (node: where)->size
2376	&& old_time <= ipa_fn_summaries->get (node: where)->time
2377	/ Wrapper penalty may be non-monotonous in this respect.*
2378	Fortunately it only affects small functions. /*
2379	&& !wrapper_heuristics_may_apply (where, size: old_size))
2380	update_callee_keys (heap: &edge_heap, node: edge->callee, update_since: edge->callee,
2381	updated_nodes);
2382	else
2383	update_callee_keys (heap: &edge_heap, node: where,
2384	update_since: edge->callee,
2385	updated_nodes);
2386	}
2387	where = edge->caller;
2388	if (where->inlined_to)
2389	where = where->inlined_to;
2390
2391	/ Our profitability metric can depend on local properties*
2392	such as number of inlinable calls and size of the function body.
2393	After inlining these properties might change for the function we
2394	inlined into (since it's body size changed) and for the functions
2395	called by function we inlined (since number of it inlinable callers
2396	might change). /*
2397	update_caller_keys (heap: &edge_heap, node: where, updated_nodes, NULL);
2398	/ Offline copy count has possibly changed, recompute if profile is*
2399	available. /*
2400	struct cgraph_node *n
2401	= cgraph_node::get (decl: edge->callee->decl)->ultimate_alias_target ();
2402	if (n != edge->callee && n->analyzed && !(n->count == old_count)
2403	&& n->count.ipa_p ())
2404	update_callee_keys (heap: &edge_heap, node: n, NULL, updated_nodes);
2405	bitmap_clear (updated_nodes);
2406
2407	if (dump_enabled_p ())
2408	{
2409	ipa_fn_summary *s = ipa_fn_summaries->get (node: where);
2410
2411	/ dump_printf can't handle %+i. /
2412	char buf_net_change[`100`];
2413	snprintf (s: buf_net_change, maxlen: sizeof buf_net_change, format: "%+i",
2414	overall_size - old_size);
2415
2416	dump_printf_loc (MSG_OPTIMIZED_LOCATIONS, edge->call_stmt,
2417	" Inlined %C into %C which now has time %f and "
2418	"size %i, net change of %s%s.\n",
2419	edge->callee, edge->caller,
2420	s->time.to_double (),
2421	ipa_size_summaries->get (node: edge->caller)->size,
2422	buf_net_change,
2423	cross_module_call_p (edge) ? " (cross module)":"");
2424	}
2425	if (min_size > overall_size)
2426	{
2427	min_size = overall_size;
2428
2429	if (dump_file)
2430	fprintf (stream: dump_file, format: "New minimal size reached: %i\n", min_size);
2431	}
2432	}
2433
2434	free_growth_caches ();
2435	if (dump_enabled_p ())
2436	dump_printf (MSG_NOTE,
2437	"Unit growth for small function inlining: %i->%i (%i%%)\n",
2438	initial_size, overall_size,
2439	initial_size ? overall_size * `100` / (initial_size) - `100`: `0`);
2440	symtab->remove_edge_removal_hook (entry: edge_removal_hook_holder);
2441	}
2442
2443	/ Flatten NODE. Performed both during early inlining and*
2444	at IPA inlining time. /*
2445
2446	static void
2447	flatten_function (struct cgraph_node node, bool* early, bool update)
2448	{
2449	struct cgraph_edge *e;
2450
2451	/ We shouldn't be called recursively when we are being processed. /
2452	gcc_assert (node->aux == NULL);
2453
2454	node->aux = (void *) node;
2455
2456	for (e = node->callees; e; e = e->next_callee)
2457	{
2458	struct cgraph_node *orig_callee;
2459	struct cgraph_node *callee = e->callee->ultimate_alias_target ();
2460
2461	/ We've hit cycle? It is time to give up. /
2462	if (callee->aux)
2463	{
2464	if (dump_enabled_p ())
2465	dump_printf_loc (MSG_MISSED_OPTIMIZATION, e->call_stmt,
2466	"Not inlining %C into %C to avoid cycle.\n",
2467	callee, e->caller);
2468	if (cgraph_inline_failed_type (e->inline_failed) != CIF_FINAL_ERROR)
2469	e->inline_failed = CIF_RECURSIVE_INLINING;
2470	continue;
2471	}
2472
2473	/ When the edge is already inlined, we just need to recurse into*
2474	it in order to fully flatten the leaves. /*
2475	if (!e->inline_failed)
2476	{
2477	flatten_function (node: callee, early, update: false);
2478	continue;
2479	}
2480
2481	/ Flatten attribute needs to be processed during late inlining. For*
2482	extra code quality we however do flattening during early optimization,
2483	too. /*
2484	if (!early
2485	? !can_inline_edge_p (e, report: true)
2486	&& !can_inline_edge_by_limits_p (e, report: true)
2487	: !can_early_inline_edge_p (e))
2488	continue;
2489
2490	if (e->recursive_p ())
2491	{
2492	if (dump_enabled_p ())
2493	dump_printf_loc (MSG_MISSED_OPTIMIZATION, e->call_stmt,
2494	"Not inlining: recursive call.\n");
2495	continue;
2496	}
2497
2498	if (gimple_in_ssa_p (DECL_STRUCT_FUNCTION (node->decl))
2499	!= gimple_in_ssa_p (DECL_STRUCT_FUNCTION (callee->decl)))
2500	{
2501	if (dump_enabled_p ())
2502	dump_printf_loc (MSG_MISSED_OPTIMIZATION, e->call_stmt,
2503	"Not inlining: SSA form does not match.\n");
2504	continue;
2505	}
2506
2507	/ Inline the edge and flatten the inline clone. Avoid*
2508	recursing through the original node if the node was cloned. /*
2509	if (dump_enabled_p ())
2510	dump_printf_loc (MSG_OPTIMIZED_LOCATIONS, e->call_stmt,
2511	" Inlining %C into %C.\n",
2512	callee, e->caller);
2513	orig_callee = callee;
2514	inline_call (e, true, NULL, NULL, false);
2515	if (e->callee != orig_callee)
2516	orig_callee->aux = (void *) node;
2517	flatten_function (node: e->callee, early, update: false);
2518	if (e->callee != orig_callee)
2519	orig_callee->aux = NULL;
2520	}
2521
2522	node->aux = NULL;
2523	cgraph_node *where = node->inlined_to ? node->inlined_to : node;
2524	if (update && opt_for_fn (where->decl, optimize))
2525	ipa_update_overall_fn_summary (node: where);
2526	}
2527
2528	/ Inline NODE to all callers. Worker for cgraph_for_node_and_aliases.*
2529	DATA points to number of calls originally found so we avoid infinite
2530	recursion. /*
2531
2532	static bool
2533	inline_to_all_callers_1 (struct cgraph_node node, void* *data,
2534	hash_set<cgraph_node > callers)
2535	{
2536	int num_calls = (int* *)data;
2537	bool callee_removed = false;
2538
2539	while (node->callers && !node->inlined_to)
2540	{
2541	struct cgraph_node *caller = node->callers->caller;
2542
2543	if (!can_inline_edge_p (e: node->callers, report: true)
2544	\|\| !can_inline_edge_by_limits_p (e: node->callers, report: true)
2545	\|\| node->callers->recursive_p ())
2546	{
2547	if (dump_file)
2548	fprintf (stream: dump_file, format: "Uninlinable call found; giving up.\n");
2549	*num_calls = `0`;
2550	return false;
2551	}
2552
2553	if (dump_file)
2554	{
2555	cgraph_node *ultimate = node->ultimate_alias_target ();
2556	fprintf (stream: dump_file,
2557	format: "\nInlining %s size %i.\n",
2558	ultimate->dump_name (),
2559	ipa_size_summaries->get (node: ultimate)->size);
2560	fprintf (stream: dump_file,
2561	format: " Called once from %s %i insns.\n",
2562	node->callers->caller->dump_name (),
2563	ipa_size_summaries->get (node: node->callers->caller)->size);
2564	}
2565
2566	/ Remember which callers we inlined to, delaying updating the*
2567	overall summary. /*
2568	callers->add (k: node->callers->caller);
2569	inline_call (node->callers, true, NULL, NULL, false, callee_removed: &callee_removed);
2570	if (dump_file)
2571	fprintf (stream: dump_file,
2572	format: " Inlined into %s which now has %i size\n",
2573	caller->dump_name (),
2574	ipa_size_summaries->get (node: caller)->size);
2575	if (!(*num_calls)--)
2576	{
2577	if (dump_file)
2578	fprintf (stream: dump_file, format: "New calls found; giving up.\n");
2579	return callee_removed;
2580	}
2581	if (callee_removed)
2582	return true;
2583	}
2584	return false;
2585	}
2586
2587	/ Wrapper around inline_to_all_callers_1 doing delayed overall summary*
2588	update. /*
2589
2590	static bool
2591	inline_to_all_callers (struct cgraph_node node, void* *data)
2592	{
2593	hash_set<cgraph_node *> callers;
2594	bool res = inline_to_all_callers_1 (node, data, callers: &callers);
2595	/ Perform the delayed update of the overall summary of all callers*
2596	processed. This avoids quadratic behavior in the cases where
2597	we have a lot of calls to the same function. /*
2598	for (hash_set<cgraph_node *>::iterator i = callers.begin ();
2599	i != callers.end (); ++i)
2600	ipa_update_overall_fn_summary (node: (i)->inlined_to ? (i)->inlined_to : *i);
2601	return res;
2602	}
2603
2604	/ Output overall time estimate. /
2605	static void
2606	dump_overall_stats (void)
2607	{
2608	sreal sum_weighted = `0`, sum = `0`;
2609	struct cgraph_node *node;
2610
2611	FOR_EACH_DEFINED_FUNCTION (node)
2612	if (!node->inlined_to
2613	&& !node->alias)
2614	{
2615	ipa_fn_summary *s = ipa_fn_summaries->get (node);
2616	if (s != NULL)
2617	{
2618	sum += s->time;
2619	if (node->count.ipa ().initialized_p ())
2620	sum_weighted += s->time * node->count.ipa ().to_gcov_type ();
2621	}
2622	}
2623	fprintf (stream: dump_file, format: "Overall time estimate: "
2624	"%f weighted by profile: "
2625	"%f\n", sum.to_double (), sum_weighted.to_double ());
2626	}
2627
2628	/ Output some useful stats about inlining. /
2629
2630	static void
2631	dump_inline_stats (void)
2632	{
2633	int64_t inlined_cnt = `0`, inlined_indir_cnt = `0`;
2634	int64_t inlined_virt_cnt = `0`, inlined_virt_indir_cnt = `0`;
2635	int64_t noninlined_cnt = `0`, noninlined_indir_cnt = `0`;
2636	int64_t noninlined_virt_cnt = `0`, noninlined_virt_indir_cnt = `0`;
2637	int64_t inlined_speculative = `0`, inlined_speculative_ply = `0`;
2638	int64_t indirect_poly_cnt = `0`, indirect_cnt = `0`;
2639	int64_t reason[CIF_N_REASONS][`2`];
2640	sreal reason_freq[CIF_N_REASONS];
2641	int i;
2642	struct cgraph_node *node;
2643
2644	memset (s: reason, c: `0`, n: sizeof (reason));
2645	for (i=`0`; i < CIF_N_REASONS; i++)
2646	reason_freq[i] = `0`;
2647	FOR_EACH_DEFINED_FUNCTION (node)
2648	{
2649	struct cgraph_edge *e;
2650	for (e = node->callees; e; e = e->next_callee)
2651	{
2652	if (e->inline_failed)
2653	{
2654	if (e->count.ipa ().initialized_p ())
2655	reason[(int) e->inline_failed][`0`] += e->count.ipa ().to_gcov_type ();
2656	reason_freq[(int) e->inline_failed] += e->sreal_frequency ();
2657	reason[(int) e->inline_failed][`1`] ++;
2658	if (DECL_VIRTUAL_P (e->callee->decl)
2659	&& e->count.ipa ().initialized_p ())
2660	{
2661	if (e->indirect_inlining_edge)
2662	noninlined_virt_indir_cnt += e->count.ipa ().to_gcov_type ();
2663	else
2664	noninlined_virt_cnt += e->count.ipa ().to_gcov_type ();
2665	}
2666	else if (e->count.ipa ().initialized_p ())
2667	{
2668	if (e->indirect_inlining_edge)
2669	noninlined_indir_cnt += e->count.ipa ().to_gcov_type ();
2670	else
2671	noninlined_cnt += e->count.ipa ().to_gcov_type ();
2672	}
2673	}
2674	else if (e->count.ipa ().initialized_p ())
2675	{
2676	if (e->speculative)
2677	{
2678	if (DECL_VIRTUAL_P (e->callee->decl))
2679	inlined_speculative_ply += e->count.ipa ().to_gcov_type ();
2680	else
2681	inlined_speculative += e->count.ipa ().to_gcov_type ();
2682	}
2683	else if (DECL_VIRTUAL_P (e->callee->decl))
2684	{
2685	if (e->indirect_inlining_edge)
2686	inlined_virt_indir_cnt += e->count.ipa ().to_gcov_type ();
2687	else
2688	inlined_virt_cnt += e->count.ipa ().to_gcov_type ();
2689	}
2690	else
2691	{
2692	if (e->indirect_inlining_edge)
2693	inlined_indir_cnt += e->count.ipa ().to_gcov_type ();
2694	else
2695	inlined_cnt += e->count.ipa ().to_gcov_type ();
2696	}
2697	}
2698	}
2699	for (e = node->indirect_calls; e; e = e->next_callee)
2700	if (e->indirect_info->polymorphic
2701	& e->count.ipa ().initialized_p ())
2702	indirect_poly_cnt += e->count.ipa ().to_gcov_type ();
2703	else if (e->count.ipa ().initialized_p ())
2704	indirect_cnt += e->count.ipa ().to_gcov_type ();
2705	}
2706	if (max_count.initialized_p ())
2707	{
2708	fprintf (stream: dump_file,
2709	format: "Inlined %" PRId64 " + speculative "
2710	"%" PRId64 " + speculative polymorphic "
2711	"%" PRId64 " + previously indirect "
2712	"%" PRId64 " + virtual "
2713	"%" PRId64 " + virtual and previously indirect "
2714	"%" PRId64 "\n" "Not inlined "
2715	"%" PRId64 " + previously indirect "
2716	"%" PRId64 " + virtual "
2717	"%" PRId64 " + virtual and previously indirect "
2718	"%" PRId64 " + still indirect "
2719	"%" PRId64 " + still indirect polymorphic "
2720	"%" PRId64 "\n", inlined_cnt,
2721	inlined_speculative, inlined_speculative_ply,
2722	inlined_indir_cnt, inlined_virt_cnt, inlined_virt_indir_cnt,
2723	noninlined_cnt, noninlined_indir_cnt, noninlined_virt_cnt,
2724	noninlined_virt_indir_cnt, indirect_cnt, indirect_poly_cnt);
2725	fprintf (stream: dump_file, format: "Removed speculations ");
2726	spec_rem.dump (f: dump_file);
2727	fprintf (stream: dump_file, format: "\n");
2728	}
2729	dump_overall_stats ();
2730	fprintf (stream: dump_file, format: "\nWhy inlining failed?\n");
2731	for (i = `0`; i < CIF_N_REASONS; i++)
2732	if (reason[i][`1`])
2733	fprintf (stream: dump_file, format: "%-50s: %8i calls, %8f freq, %" PRId64" count\n",
2734	cgraph_inline_failed_string ((cgraph_inline_failed_t) i),
2735	(int) reason[i][`1`], reason_freq[i].to_double (), reason[i][`0`]);
2736	}
2737
2738	/ Called when node is removed. /
2739
2740	static void
2741	flatten_remove_node_hook (struct cgraph_node node, void* *data)
2742	{
2743	if (lookup_attribute (attr_name: "flatten", DECL_ATTRIBUTES (node->decl)) == NULL)
2744	return;
2745
2746	hash_set<struct cgraph_node > removed
2747	= (hash_set<struct cgraph_node > ) data;
2748	removed->add (k: node);
2749	}
2750
2751	/ Decide on the inlining. We do so in the topological order to avoid*
2752	expenses on updating data structures. /*
2753
2754	static unsigned int
2755	ipa_inline (void)
2756	{
2757	struct cgraph_node *node;
2758	int nnodes;
2759	struct cgraph_node **order;
2760	int i, j;
2761	int cold;
2762	bool remove_functions = false;
2763
2764	order = XCNEWVEC (struct cgraph_node *, symtab->cgraph_count);
2765
2766	if (dump_file)
2767	ipa_dump_fn_summaries (f: dump_file);
2768
2769	nnodes = ipa_reverse_postorder (order);
2770	spec_rem = profile_count::zero ();
2771
2772	FOR_EACH_FUNCTION (node)
2773	{
2774	node->aux = `0`;
2775
2776	/ Recompute the default reasons for inlining because they may have*
2777	changed during merging. /*
2778	if (in_lto_p)
2779	{
2780	for (cgraph_edge *e = node->callees; e; e = e->next_callee)
2781	{
2782	gcc_assert (e->inline_failed);
2783	initialize_inline_failed (e);
2784	}
2785	for (cgraph_edge *e = node->indirect_calls; e; e = e->next_callee)
2786	initialize_inline_failed (e);
2787	}
2788	}
2789
2790	if (dump_file)
2791	fprintf (stream: dump_file, format: "\nFlattening functions:\n");
2792
2793	/ First shrink order array, so that it only contains nodes with*
2794	flatten attribute. /*
2795	for (i = nnodes - `1`, j = i; i >= `0`; i--)
2796	{
2797	node = order[i];
2798	if (node->definition
2799	/ Do not try to flatten aliases. These may happen for example when*
2800	creating local aliases. /*
2801	&& !node->alias
2802	&& lookup_attribute (attr_name: "flatten",
2803	DECL_ATTRIBUTES (node->decl)) != NULL)
2804	order[j--] = order[i];
2805	}
2806
2807	/ After the above loop, order[j + 1] ... order[nnodes - 1] contain*
2808	nodes with flatten attribute. If there is more than one such
2809	node, we need to register a node removal hook, as flatten_function
2810	could remove other nodes with flatten attribute. See PR82801. /*
2811	struct cgraph_node_hook_list *node_removal_hook_holder = NULL;
2812	hash_set<struct cgraph_node > flatten_removed_nodes = NULL;
2813	if (j < nnodes - `2`)
2814	{
2815	flatten_removed_nodes = new hash_set<struct cgraph_node *>;
2816	node_removal_hook_holder
2817	= symtab->add_cgraph_removal_hook (hook: &flatten_remove_node_hook,
2818	data: flatten_removed_nodes);
2819	}
2820
2821	/ In the first pass handle functions to be flattened. Do this with*
2822	a priority so none of our later choices will make this impossible. /*
2823	for (i = nnodes - `1`; i > j; i--)
2824	{
2825	node = order[i];
2826	if (flatten_removed_nodes
2827	&& flatten_removed_nodes->contains (k: node))
2828	continue;
2829
2830	/ Handle nodes to be flattened.*
2831	Ideally when processing callees we stop inlining at the
2832	entry of cycles, possibly cloning that entry point and
2833	try to flatten itself turning it into a self-recursive
2834	function. /*
2835	if (dump_file)
2836	fprintf (stream: dump_file, format: "Flattening %s\n", node->dump_name ());
2837	flatten_function (node, early: false, update: true);
2838	}
2839
2840	if (j < nnodes - `2`)
2841	{
2842	symtab->remove_cgraph_removal_hook (entry: node_removal_hook_holder);
2843	delete flatten_removed_nodes;
2844	}
2845	free (ptr: order);
2846
2847	if (dump_file)
2848	dump_overall_stats ();
2849
2850	inline_small_functions ();
2851
2852	gcc_assert (symtab->state == IPA_SSA);
2853	symtab->state = IPA_SSA_AFTER_INLINING;
2854	/ Do first after-inlining removal. We want to remove all "stale" extern*
2855	inline functions and virtual functions so we really know what is called
2856	once. /*
2857	symtab->remove_unreachable_nodes (file: dump_file);
2858
2859	/ Inline functions with a property that after inlining into all callers the*
2860	code size will shrink because the out-of-line copy is eliminated.
2861	We do this regardless on the callee size as long as function growth limits
2862	are met. /*
2863	if (dump_file)
2864	fprintf (stream: dump_file,
2865	format: "\nDeciding on functions to be inlined into all callers and "
2866	"removing useless speculations:\n");
2867
2868	/ Inlining one function called once has good chance of preventing*
2869	inlining other function into the same callee. Ideally we should
2870	work in priority order, but probably inlining hot functions first
2871	is good cut without the extra pain of maintaining the queue.
2872
2873	??? this is not really fitting the bill perfectly: inlining function
2874	into callee often leads to better optimization of callee due to
2875	increased context for optimization.
2876	For example if main() function calls a function that outputs help
2877	and then function that does the main optimization, we should inline
2878	the second with priority even if both calls are cold by themselves.
2879
2880	We probably want to implement new predicate replacing our use of
2881	maybe_hot_edge interpreted as maybe_hot_edge \|\| callee is known
2882	to be hot. /*
2883	for (cold = `0`; cold <= `1`; cold ++)
2884	{
2885	FOR_EACH_DEFINED_FUNCTION (node)
2886	{
2887	struct cgraph_edge edge, next;
2888	bool update=false;
2889
2890	if (!opt_for_fn (node->decl, optimize)
2891	\|\| !opt_for_fn (node->decl, flag_inline_functions_called_once))
2892	continue;
2893
2894	for (edge = node->callees; edge; edge = next)
2895	{
2896	next = edge->next_callee;
2897	if (edge->speculative && !speculation_useful_p (e: edge, anticipate_inlining: false))
2898	{
2899	if (edge->count.ipa ().initialized_p ())
2900	spec_rem += edge->count.ipa ();
2901	cgraph_edge::resolve_speculation (edge);
2902	update = true;
2903	remove_functions = true;
2904	}
2905	}
2906	if (update)
2907	{
2908	struct cgraph_node *where = node->inlined_to
2909	? node->inlined_to : node;
2910	reset_edge_caches (node: where);
2911	ipa_update_overall_fn_summary (node: where);
2912	}
2913	if (want_inline_function_to_all_callers_p (node, cold))
2914	{
2915	int num_calls = `0`;
2916	node->call_for_symbol_and_aliases (callback: sum_callers, data: &num_calls,
2917	include_overwritable: true);
2918	while (node->call_for_symbol_and_aliases
2919	(callback: inline_to_all_callers, data: &num_calls, include_overwritable: true))
2920	;
2921	remove_functions = true;
2922	}
2923	}
2924	}
2925
2926	if (dump_enabled_p ())
2927	dump_printf (MSG_NOTE,
2928	"\nInlined %i calls, eliminated %i functions\n\n",
2929	ncalls_inlined, nfunctions_inlined);
2930	if (dump_file)
2931	dump_inline_stats ();
2932
2933	if (dump_file)
2934	ipa_dump_fn_summaries (f: dump_file);
2935	return remove_functions ? TODO_remove_functions : `0`;
2936	}
2937
2938	/ Inline always-inline function calls in NODE*
2939	(which itself is possibly inline). /*
2940
2941	static bool
2942	inline_always_inline_functions (struct cgraph_node *node)
2943	{
2944	struct cgraph_edge *e;
2945	bool inlined = false;
2946
2947	for (e = node->callees; e; e = e->next_callee)
2948	{
2949	struct cgraph_node *callee = e->callee->ultimate_alias_target ();
2950	gcc_checking_assert (!callee->aux \|\| callee->aux == (void *)(size_t)`1`);
2951	if (!DECL_DISREGARD_INLINE_LIMITS (callee->decl)
2952	/ Watch for self-recursive cycles. /
2953	\|\| callee->aux)
2954	continue;
2955
2956	if (e->recursive_p ())
2957	{
2958	if (dump_enabled_p ())
2959	dump_printf_loc (MSG_MISSED_OPTIMIZATION, e->call_stmt,
2960	" Not inlining recursive call to %C.\n",
2961	e->callee);
2962	e->inline_failed = CIF_RECURSIVE_INLINING;
2963	continue;
2964	}
2965	if (callee->definition
2966	&& !ipa_fn_summaries->get (node: callee))
2967	compute_fn_summary (callee, true);
2968
2969	if (!can_early_inline_edge_p (e))
2970	{
2971	/ Set inlined to true if the callee is marked "always_inline" but*
2972	is not inlinable. This will allow flagging an error later in
2973	expand_call_inline in tree-inline.cc. /*
2974	if (lookup_attribute (attr_name: "always_inline",
2975	DECL_ATTRIBUTES (callee->decl)) != NULL)
2976	inlined = true;
2977	continue;
2978	}
2979
2980	if (dump_enabled_p ())
2981	dump_printf_loc (MSG_OPTIMIZED_LOCATIONS, e->call_stmt,
2982	" Inlining %C into %C (always_inline).\n",
2983	e->callee, e->caller);
2984	inline_call (e, true, NULL, NULL, false);
2985	callee->aux = (void *)(size_t)`1`;
2986	/ Inline recursively to handle the case where always_inline function was*
2987	not optimized yet since it is a part of a cycle in callgraph. /*
2988	inline_always_inline_functions (node: e->callee);
2989	callee->aux = NULL;
2990	inlined = true;
2991	}
2992	return inlined;
2993	}
2994
2995	/ Decide on the inlining. We do so in the topological order to avoid*
2996	expenses on updating data structures. /*
2997
2998	static bool
2999	early_inline_small_functions (struct cgraph_node *node)
3000	{
3001	struct cgraph_edge *e;
3002	bool inlined = false;
3003
3004	for (e = node->callees; e; e = e->next_callee)
3005	{
3006	struct cgraph_node *callee = e->callee->ultimate_alias_target ();
3007
3008	/ We can encounter not-yet-analyzed function during*
3009	early inlining on callgraphs with strongly
3010	connected components. /*
3011	ipa_fn_summary *s = ipa_fn_summaries->get (node: callee);
3012	if (s == NULL \|\| !s->inlinable \|\| !e->inline_failed)
3013	continue;
3014
3015	/ Do not consider functions not declared inline. /
3016	if (!DECL_DECLARED_INLINE_P (callee->decl)
3017	&& !opt_for_fn (node->decl, flag_inline_small_functions)
3018	&& !opt_for_fn (node->decl, flag_inline_functions))
3019	continue;
3020
3021	if (dump_enabled_p ())
3022	dump_printf_loc (MSG_NOTE, e->call_stmt,
3023	"Considering inline candidate %C.\n",
3024	callee);
3025
3026	if (!can_early_inline_edge_p (e))
3027	continue;
3028
3029	if (e->recursive_p ())
3030	{
3031	if (dump_enabled_p ())
3032	dump_printf_loc (MSG_MISSED_OPTIMIZATION, e->call_stmt,
3033	" Not inlining: recursive call.\n");
3034	continue;
3035	}
3036
3037	if (!want_early_inline_function_p (e))
3038	continue;
3039
3040	if (dump_enabled_p ())
3041	dump_printf_loc (MSG_OPTIMIZED_LOCATIONS, e->call_stmt,
3042	" Inlining %C into %C.\n",
3043	callee, e->caller);
3044	inline_call (e, true, NULL, NULL, false);
3045	inlined = true;
3046	}
3047
3048	if (inlined)
3049	ipa_update_overall_fn_summary (node);
3050
3051	return inlined;
3052	}
3053
3054	unsigned int
3055	early_inliner (function *fun)
3056	{
3057	struct cgraph_node *node = cgraph_node::get (decl: current_function_decl);
3058	struct cgraph_edge *edge;
3059	unsigned int todo = `0`;
3060	int iterations = `0`;
3061	bool inlined = false;
3062
3063	if (seen_error ())
3064	return `0`;
3065
3066	/ Do nothing if datastructures for ipa-inliner are already computed. This*
3067	happens when some pass decides to construct new function and
3068	cgraph_add_new_function calls lowering passes and early optimization on
3069	it. This may confuse ourself when early inliner decide to inline call to
3070	function clone, because function clones don't have parameter list in
3071	ipa-prop matching their signature. /*
3072	if (ipa_node_params_sum)
3073	return `0`;
3074
3075	if (flag_checking)
3076	node->verify ();
3077	node->remove_all_references ();
3078
3079	/ Even when not optimizing or not inlining inline always-inline*
3080	functions. /*
3081	inlined = inline_always_inline_functions (node);
3082
3083	if (!optimize
3084	\|\| flag_no_inline
3085	\|\| !flag_early_inlining)
3086	;
3087	else if (lookup_attribute (attr_name: "flatten",
3088	DECL_ATTRIBUTES (node->decl)) != NULL)
3089	{
3090	/ When the function is marked to be flattened, recursively inline*
3091	all calls in it. /*
3092	if (dump_enabled_p ())
3093	dump_printf (MSG_OPTIMIZED_LOCATIONS,
3094	"Flattening %C\n", node);
3095	flatten_function (node, early: true, update: true);
3096	inlined = true;
3097	}
3098	else
3099	{
3100	/ If some always_inline functions was inlined, apply the changes.*
3101	This way we will not account always inline into growth limits and
3102	moreover we will inline calls from always inlines that we skipped
3103	previously because of conditional in can_early_inline_edge_p
3104	which prevents some inlining to always_inline. /*
3105	if (inlined)
3106	{
3107	timevar_push (tv: TV_INTEGRATION);
3108	todo \|= optimize_inline_calls (current_function_decl);
3109	/ optimize_inline_calls call above might have introduced new*
3110	statements that don't have inline parameters computed. /*
3111	for (edge = node->callees; edge; edge = edge->next_callee)
3112	{
3113	/ We can enounter not-yet-analyzed function during*
3114	early inlining on callgraphs with strongly
3115	connected components. /*
3116	ipa_call_summary *es = ipa_call_summaries->get_create (edge);
3117	es->call_stmt_size
3118	= estimate_num_insns (edge->call_stmt, &eni_size_weights);
3119	es->call_stmt_time
3120	= estimate_num_insns (edge->call_stmt, &eni_time_weights);
3121	}
3122	ipa_update_overall_fn_summary (node);
3123	inlined = false;
3124	timevar_pop (tv: TV_INTEGRATION);
3125	}
3126	/ We iterate incremental inlining to get trivial cases of indirect*
3127	inlining. /*
3128	while (iterations < opt_for_fn (node->decl,
3129	param_early_inliner_max_iterations)
3130	&& early_inline_small_functions (node))
3131	{
3132	timevar_push (tv: TV_INTEGRATION);
3133	todo \|= optimize_inline_calls (current_function_decl);
3134
3135	/ Technically we ought to recompute inline parameters so the new*
3136	iteration of early inliner works as expected. We however have
3137	values approximately right and thus we only need to update edge
3138	info that might be cleared out for newly discovered edges. /*
3139	for (edge = node->callees; edge; edge = edge->next_callee)
3140	{
3141	/ We have no summary for new bound store calls yet. /
3142	ipa_call_summary *es = ipa_call_summaries->get_create (edge);
3143	es->call_stmt_size
3144	= estimate_num_insns (edge->call_stmt, &eni_size_weights);
3145	es->call_stmt_time
3146	= estimate_num_insns (edge->call_stmt, &eni_time_weights);
3147	}
3148	if (iterations < opt_for_fn (node->decl,
3149	param_early_inliner_max_iterations) - `1`)
3150	ipa_update_overall_fn_summary (node);
3151	timevar_pop (tv: TV_INTEGRATION);
3152	iterations++;
3153	inlined = false;
3154	}
3155	if (dump_file)
3156	fprintf (stream: dump_file, format: "Iterations: %i\n", iterations);
3157	}
3158
3159	if (inlined)
3160	{
3161	timevar_push (tv: TV_INTEGRATION);
3162	todo \|= optimize_inline_calls (current_function_decl);
3163	timevar_pop (tv: TV_INTEGRATION);
3164	}
3165
3166	fun->always_inline_functions_inlined = true;
3167
3168	return todo;
3169	}
3170
3171	/ Do inlining of small functions. Doing so early helps profiling and other*
3172	passes to be somewhat more effective and avoids some code duplication in
3173	later real inlining pass for testcases with very many function calls. /*
3174
3175	namespace {
3176
3177	const pass_data pass_data_early_inline =
3178	{
3179	.type: GIMPLE_PASS, / type /
3180	.name: "einline", / name /
3181	.optinfo_flags: OPTGROUP_INLINE, / optinfo_flags /
3182	.tv_id: TV_EARLY_INLINING, / tv_id /
3183	PROP_ssa, / properties_required /
3184	.properties_provided: `0`, / properties_provided /
3185	.properties_destroyed: `0`, / properties_destroyed /
3186	.todo_flags_start: `0`, / todo_flags_start /
3187	.todo_flags_finish: `0`, / todo_flags_finish /
3188	};
3189
3190	class pass_early_inline : public gimple_opt_pass
3191	{
3192	public:
3193	pass_early_inline (gcc::context *ctxt)
3194	: gimple_opt_pass (pass_data_early_inline, ctxt)
3195	{}
3196
3197	/ opt_pass methods: /
3198	unsigned int execute (function *) final override;
3199
3200	}; // class pass_early_inline
3201
3202	unsigned int
3203	pass_early_inline::execute (function *fun)
3204	{
3205	return early_inliner (fun);
3206	}
3207
3208	} // anon namespace
3209
3210	gimple_opt_pass *
3211	make_pass_early_inline (gcc::context *ctxt)
3212	{
3213	return new pass_early_inline (ctxt);
3214	}
3215
3216	namespace {
3217
3218	const pass_data pass_data_ipa_inline =
3219	{
3220	.type: IPA_PASS, / type /
3221	.name: "inline", / name /
3222	.optinfo_flags: OPTGROUP_INLINE, / optinfo_flags /
3223	.tv_id: TV_IPA_INLINING, / tv_id /
3224	.properties_required: `0`, / properties_required /
3225	.properties_provided: `0`, / properties_provided /
3226	.properties_destroyed: `0`, / properties_destroyed /
3227	.todo_flags_start: `0`, / todo_flags_start /
3228	.todo_flags_finish: ( TODO_dump_symtab ), / todo_flags_finish /
3229	};
3230
3231	class pass_ipa_inline : public ipa_opt_pass_d
3232	{
3233	public:
3234	pass_ipa_inline (gcc::context *ctxt)
3235	: ipa_opt_pass_d (pass_data_ipa_inline, ctxt,
3236	NULL, / generate_summary /
3237	NULL, / write_summary /
3238	NULL, / read_summary /
3239	NULL, / write_optimization_summary /
3240	NULL, / read_optimization_summary /
3241	NULL, / stmt_fixup /
3242	`0`, / function_transform_todo_flags_start /
3243	inline_transform, / function_transform /
3244	NULL) / variable_transform /
3245	{}
3246
3247	/ opt_pass methods: /
3248	unsigned int execute (function ) final override { return* ipa_inline (); }
3249
3250	}; // class pass_ipa_inline
3251
3252	} // anon namespace
3253
3254	ipa_opt_pass_d *
3255	make_pass_ipa_inline (gcc::context *ctxt)
3256	{
3257	return new pass_ipa_inline (ctxt);
3258	}
3259

source code of gcc/ipa-inline.cc