libFirm
|
Topics | |
Flags | |
Flags to customize the behavior of libfirm. | |
Graph Transformations | |
Local Optimizations | |
Macros | |
#define | osr_flag_default osr_flag_lftr_with_ov_check |
default setting | |
#define | DEFAULT_CLONE_THRESHOLD 20 |
A default threshold. | |
Typedefs | |
typedef int(* | check_alloc_entity_func) (ir_entity *ent) |
A callback that checks whether a entity is an allocation routine. | |
typedef int(* | arch_allow_ifconv_func) (ir_node const *sel, ir_node const *mux_false, ir_node const *mux_true) |
This function is called to evaluate, if a mux(sel , mux_false , mux_true ) should be built for the current architecture. | |
typedef void(* | opt_ptr) (ir_graph *irg) |
pointer to an optimization function | |
Enumerations | |
enum | osr_flags { osr_flag_none = 0 , osr_flag_lftr_with_ov_check = 1 , osr_flag_ignore_x86_shift = 2 , osr_flag_keep_reg_pressure = 4 } |
Possible flags for the Operator Scalar Replacement. More... | |
Functions | |
void | optimize_cf (ir_graph *irg) |
Control flow optimization. | |
void | opt_jumpthreading (ir_graph *irg) |
Perform path-sensitive jump threading on the given graph. | |
void | opt_bool (ir_graph *irg) |
Simplifies boolean expression in the given ir graph. | |
void | conv_opt (ir_graph *irg) |
Reduces the number of Conv nodes in the given ir graph. | |
void | optimize_funccalls (void) |
Optimize function calls by handling const functions. | |
void | do_gvn_pre (ir_graph *irg) |
Does Partial Redundancy Elimination combined with Global Value Numbering. | |
void | opt_if_conv (ir_graph *irg) |
Perform If conversion on a graph. | |
void | opt_if_conv_cb (ir_graph *irg, arch_allow_ifconv_func callback) |
Perform If conversion on a graph - callback version. | |
void | opt_parallelize_mem (ir_graph *irg) |
Tries to reduce dependencies for memory nodes where possible by parallelizing them and synchronizing with Sync nodes. | |
ir_node * | can_replace_load_by_const (const ir_node *load, ir_node *c) |
Check if we can replace the load by a given const from the const code irg. | |
void | optimize_load_store (ir_graph *irg) |
Load/Store optimization. | |
void | combine_memops (ir_graph *irg) |
Combine adjacent "small" load/store operations into bigger ones. | |
void | opt_ldst (ir_graph *irg) |
New experimental alternative to optimize_load_store. | |
void | opt_frame_irg (ir_graph *irg) |
Optimize the frame type of an irg by removing never touched entities. | |
void | opt_osr (ir_graph *irg, unsigned flags) |
Performs the Operator Scalar Replacement optimization and linear function test replacement for loop control. | |
void | remove_phi_cycles (ir_graph *irg) |
Removes useless Phi cycles, i.e cycles of Phi nodes with only one non-Phi node. | |
void | proc_cloning (float threshold) |
Performs procedure cloning. | |
void | optimize_reassociation (ir_graph *irg) |
Reassociation. | |
void | normalize_one_return (ir_graph *irg) |
Normalize the Returns of a graph by creating a new End block with One Return(Phi). | |
void | normalize_n_returns (ir_graph *irg) |
Normalize the Returns of a graph by moving the Returns upwards as much as possible. | |
void | scalar_replacement_opt (ir_graph *irg) |
Performs the scalar replacement optimization. | |
void | opt_tail_rec_irg (ir_graph *irg) |
Optimizes tail-recursion calls by converting them into loops. | |
void | combo (ir_graph *irg) |
CLiff Click's combo algorithm from "Combining Analyses, combining Optimizations". | |
void | inline_functions (unsigned maxsize, int inline_threshold, opt_ptr after_inline_opt) |
Heuristic inliner. | |
void | shape_blocks (ir_graph *irg) |
Combines congruent blocks into one. | |
void | do_loop_inversion (ir_graph *irg) |
Perform loop inversion on a given graph. | |
void | do_loop_unrolling (ir_graph *irg) |
Perform loop unrolling on a given graph. | |
void | unroll_loops (ir_graph *irg, unsigned factor, unsigned maxsize) |
Perform loop unrolling on a given graph. | |
void | do_loop_peeling (ir_graph *irg) |
Perform loop peeling on a given graph. | |
void | garbage_collect_entities (void) |
Removes all entities which are unused. | |
void | dead_node_elimination (ir_graph *irg) |
Performs dead node elimination by copying the ir graph to a new obstack. | |
void | place_code (ir_graph *irg) |
Code Placement. | |
void | occult_consts (ir_graph *) |
This optimization finds values where the bits are either constant or irrelevant and exchanges them for a corresponding constant. | |
int | value_not_null (const ir_node *n, const ir_node **confirm) |
Returns true if the value n is known not be zero/null. | |
ir_tarval * | computed_value_Cmp_Confirm (ir_node *left, ir_node *right, ir_relation relation) |
Returns the value of a Cmp if one or both predecessors are Confirm nodes. | |
ir_entity * | create_compilerlib_entity (char const *name, ir_type *mt) |
Constructs the entity for a given function using the current compilerlib entity creation callback. | |
#define DEFAULT_CLONE_THRESHOLD 20 |
A default threshold.
Definition at line 289 of file iroptimize.h.
#define osr_flag_default osr_flag_lftr_with_ov_check |
default setting
Definition at line 216 of file iroptimize.h.
typedef int(* arch_allow_ifconv_func) (ir_node const *sel, ir_node const *mux_false, ir_node const *mux_true) |
This function is called to evaluate, if a mux(sel
, mux_false
, mux_true
) should be built for the current architecture.
If it returns non-zero, a mux is created, else the code is not modified.
sel | A selector of a Cond. |
phi_list | phi node to be converted |
i | First data predecessor involved in if conversion |
j | Second data predecessor involved in if conversion |
Definition at line 109 of file iroptimize.h.
typedef int(* check_alloc_entity_func) (ir_entity *ent) |
A callback that checks whether a entity is an allocation routine.
Definition at line 61 of file iroptimize.h.
typedef void(* opt_ptr) (ir_graph *irg) |
pointer to an optimization function
Definition at line 401 of file iroptimize.h.
enum osr_flags |
Possible flags for the Operator Scalar Replacement.
Definition at line 206 of file iroptimize.h.
Check if we can replace the load by a given const from the const code irg.
load | the load to replace |
c | the constant |
void combine_memops | ( | ir_graph * | irg | ) |
Combine adjacent "small" load/store operations into bigger ones.
void combo | ( | ir_graph * | irg | ) |
CLiff Click's combo algorithm from "Combining Analyses, combining Optimizations".
Does conditional constant propagation, unreachable code elimination and optimistic global value numbering at once.
irg | the graph to run on |
ir_tarval * computed_value_Cmp_Confirm | ( | ir_node * | left, |
ir_node * | right, | ||
ir_relation | relation ) |
Returns the value of a Cmp if one or both predecessors are Confirm nodes.
left | the left operand of the Cmp |
right | the right operand of the Cmp |
relation | the compare relation |
void conv_opt | ( | ir_graph * | irg | ) |
Reduces the number of Conv nodes in the given ir graph.
irg | the graph |
Constructs the entity for a given function using the current compilerlib entity creation callback.
void dead_node_elimination | ( | ir_graph * | irg | ) |
Performs dead node elimination by copying the ir graph to a new obstack.
The major intention of this pass is to free memory occupied by dead nodes and outdated analyzes information. Further this function removes Bad predecessors from Blocks and the corresponding inputs to Phi nodes. This opens optimization potential for other optimizations. Further this phase reduces dead Block<->Jmp self-cycles to Bad nodes.
Dead_node_elimination is only performed if options ‘optimize’ and ‘opt_dead_node_elimination’ are set. The graph may not be in state phase_building. The outs data structure is freed, the outs state set to outs_none. Backedge information is conserved. Removes old attributes of nodes. Sets link field to NULL. Callee information must be freed (irg_callee_info_none).
irg | The graph to be optimized. |
void do_gvn_pre | ( | ir_graph * | irg | ) |
Does Partial Redundancy Elimination combined with Global Value Numbering.
Can be used to replace place_code() completely.
Based on VanDrunen and Hosking 2004.
irg | the graph |
void do_loop_inversion | ( | ir_graph * | irg | ) |
Perform loop inversion on a given graph.
Loop inversion transforms a head controlled loop (like while(...) {} and for(...) {}) into a foot controlled loop (do {} while(...)).
void do_loop_peeling | ( | ir_graph * | irg | ) |
Perform loop peeling on a given graph.
void do_loop_unrolling | ( | ir_graph * | irg | ) |
Perform loop unrolling on a given graph.
Loop unrolling multiplies the number loop completely by a number found through a heuristic.
void garbage_collect_entities | ( | void | ) |
Removes all entities which are unused.
Unused entities have ir_visibility_local and are not used directly or indirectly through entities/code visible outside the compilation unit. This is usually conservative than gc_irgs, but does not respect properties of object-oriented programs.
void inline_functions | ( | unsigned | maxsize, |
int | inline_threshold, | ||
opt_ptr | after_inline_opt ) |
Heuristic inliner.
Calculates a benefice value for every call and inlines those calls with a value higher than the threshold.
maxsize | Do not inline any calls if a method has more than maxsize firm nodes. It may reach this limit by inlining. |
inline_threshold | inlining threshold |
after_inline_opt | optimizations performed immediately after inlining some calls |
void normalize_n_returns | ( | ir_graph * | irg | ) |
Normalize the Returns of a graph by moving the Returns upwards as much as possible.
This might be preferred for code generation.
In pseudocode, it means:
if (a) res = b; else res = c; return res;
is transformed into
if (a) return b; else return c;
void normalize_one_return | ( | ir_graph * | irg | ) |
Normalize the Returns of a graph by creating a new End block with One Return(Phi).
This is the preferred input for the if-conversion.
In pseudocode, it means:
if (a) return b; else return c;
is transformed into
if (a) res = b; else res = c; return res;
void occult_consts | ( | ir_graph * | ) |
This optimization finds values where the bits are either constant or irrelevant and exchanges them for a corresponding constant.
void opt_bool | ( | ir_graph * | irg | ) |
Simplifies boolean expression in the given ir graph.
eg. x < 5 && x < 6 becomes x < 5
irg | the graph |
void opt_frame_irg | ( | ir_graph * | irg | ) |
Optimize the frame type of an irg by removing never touched entities.
irg | The graph whose frame type will be optimized |
This function did not change the graph, only its frame type. The layout state of the frame type will be set to layout_undefined if entities were removed.
void opt_if_conv | ( | ir_graph * | irg | ) |
Perform If conversion on a graph.
irg | The graph. |
Cannot handle blocks with Bad control predecessors, so call it after control flow optimization.
void opt_if_conv_cb | ( | ir_graph * | irg, |
arch_allow_ifconv_func | callback ) |
Perform If conversion on a graph - callback version.
irg | The graph. |
callback | The predicate. |
Like above, but let the caller decide about valid transformations by supplying a predicate function.
void opt_jumpthreading | ( | ir_graph * | irg | ) |
Perform path-sensitive jump threading on the given graph.
irg | the graph |
void opt_ldst | ( | ir_graph * | irg | ) |
New experimental alternative to optimize_load_store.
Based on a dataflow analysis, so load/stores are moved out of loops where possible
void opt_osr | ( | ir_graph * | irg, |
unsigned | flags ) |
Performs the Operator Scalar Replacement optimization and linear function test replacement for loop control.
irg | the graph which should be optimized |
flags | set of osr_flags |
The linear function replacement test is controlled by the flags. If the osr_flag_lftr_with_ov_check is set, the replacement is only done if do overflow can occur. Otherwise it is ALWAYS done which might be insecure.
For instance:
for (i = 0; i < 100; ++i)
might be replaced by
for (i = 0; i < 400; i += 4)
But
for (i = 0; i < 0x7FFFFFFF; ++i)
will not be replaced by
for (i = 0; i < 0xFFFFFFFC; i += 4)
because of overflow.
More bad cases:
for (i = 0; i <= 0xF; ++i)
will NOT be transformed into
for (i = 0xFFFFFFF0; i <= 0xFFFFFFFF; ++i)
although here is no direct overflow. The OV occurs when the ++i is executed (and would created an endless loop here!).
For the same reason, a loop
for (i = 0; i <= 9; i += x)
will NOT be transformed because we cannot estimate whether an overflow might happen adding x.
Note that i < a + 400 is also not possible with the current implementation although this might be allowed by other compilers...
Note further that tests for equality can be handled some simpler (but are not implemented yet).
This algorithm destroys the link field of nodes.
void opt_parallelize_mem | ( | ir_graph * | irg | ) |
Tries to reduce dependencies for memory nodes where possible by parallelizing them and synchronizing with Sync nodes.
irg | the graph where memory operations should be parallelized |
void opt_tail_rec_irg | ( | ir_graph * | irg | ) |
Optimizes tail-recursion calls by converting them into loops.
Depends on the flag opt_tail_recursion. Currently supports the following forms:
Does not work for Calls that use the exception stuff.
irg | the graph to be optimized |
void optimize_cf | ( | ir_graph * | irg | ) |
Control flow optimization.
Removes empty blocks doing if simplifications and loop simplifications. A block is empty if it contains only a Jmp node and Phi nodes. Merges single entry single exit blocks with their predecessor and propagates dead control flow by calling equivalent_node(). Independent of compiler flag it removes Tuples from cf edges, Bad predecessors from Blocks and Phis, and unnecessary predecessors of End. Destroys backedge information.
void optimize_funccalls | ( | void | ) |
Optimize function calls by handling const functions.
This optimization first detects all "const functions", i.e., IR graphs that neither read nor write memory (and hence did not create exceptions, as these use memory in Firm).
The result of calls to such functions depends only on its arguments, hence those calls are no more pinned.
This is a rather strong criteria, so do not expect that a lot of functions will be found. Moreover, all of them might already be inlined if inlining is activated. Anyway, it might be good for handling builtin's even if the later read/write memory (but we know how).
This optimization reads the irg_const_function property of entities, and sets the irg_const_function property of graphs.
If callee information is valid, we also optimize polymorphic Calls.
void optimize_load_store | ( | ir_graph * | irg | ) |
Load/Store optimization.
Removes redundant non-volatile Loads and Stores. May introduce Bad nodes if exceptional control flow is removed. The following cases are optimized:
Load without result: A Load which has only a memory use is removed.
Load after Store: A Load after a Store is removed, if the Load doesn't have an exception handler OR is in the same block as the Store.
Load after Load: A Load after a Load is removed, if the Load doesn't have an exception handler OR is in the same block as the previous Load.
Store before Store: A Store immediately before another Store in the same block is removed, if the Store doesn't have an exception handler.
Store after Load: A Store after a Load is removed, if the Store doesn't have an exception handler.
void optimize_reassociation | ( | ir_graph * | irg | ) |
Reassociation.
Applies Reassociation rules to integer expressions. Beware: Works only if integer overflow might be ignored, as for C, Java and for address expression. Works only if Constant folding is activated.
Uses loop information to detect loop-invariant (i.e. constant inside the loop) values.
See Muchnik 12.3.1 Algebraic Simplification and Reassociation of Addressing Expressions.
void place_code | ( | ir_graph * | irg | ) |
Code Placement.
Pins all floating nodes to a block where they will be executed only if needed. Depends on the flag opt_global_cse. Graph may not be in phase_building. Does not schedule control dead code. Uses dominator information which it computes if the irg is not in state dom_consistent. Destroys the out information as it moves nodes to other blocks. Optimizes Tuples in Control edges.
Call remove_critical_cf_edges() before place_code(). This normalizes the control flow graph so that for all operations a basic block exists where they can be optimally placed.
void proc_cloning | ( | float | threshold | ) |
Performs procedure cloning.
Evaluate a heuristic weight for every Call(..., Const, ...). If the weight is bigger than threshold, clone the entity and fix the calls.
threshold | the threshold for cloning |
The threshold is an estimation of how many instructions are saved when executing a cloned method. If threshold is 0.0, every possible call is cloned.
void remove_phi_cycles | ( | ir_graph * | irg | ) |
Removes useless Phi cycles, i.e cycles of Phi nodes with only one non-Phi node.
This is automatically done in opt_osr(), so there is no need to call it additionally.
irg | the graph which should be optimized |
This algorithm destroys the link field of nodes.
void scalar_replacement_opt | ( | ir_graph * | irg | ) |
Performs the scalar replacement optimization.
Replaces local compound entities (like structures and arrays) with atomic values if possible. Does not handle classes yet.
irg | the graph which should be optimized |
void shape_blocks | ( | ir_graph * | irg | ) |
Combines congruent blocks into one.
irg | The IR-graph to optimize. |
void unroll_loops | ( | ir_graph * | irg, |
unsigned | factor, | ||
unsigned | maxsize ) |
Perform loop unrolling on a given graph.
irg | the IR-graph to optimize |
factor | the unroll factor |
maxsize | the maximum number of nodes in a loop |