ira-int.h revision 1.13 1 /* Integrated Register Allocator (IRA) intercommunication header file.
2 Copyright (C) 2006-2022 Free Software Foundation, Inc.
3 Contributed by Vladimir Makarov <vmakarov (at) redhat.com>.
4
5 This file is part of GCC.
6
7 GCC is free software; you can redistribute it and/or modify it under
8 the terms of the GNU General Public License as published by the Free
9 Software Foundation; either version 3, or (at your option) any later
10 version.
11
12 GCC is distributed in the hope that it will be useful, but WITHOUT ANY
13 WARRANTY; without even the implied warranty of MERCHANTABILITY or
14 FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public License
15 for more details.
16
17 You should have received a copy of the GNU General Public License
18 along with GCC; see the file COPYING3. If not see
19 <http://www.gnu.org/licenses/>. */
20
21 #ifndef GCC_IRA_INT_H
22 #define GCC_IRA_INT_H
23
24 #include "recog.h"
25 #include "function-abi.h"
26
27 /* To provide consistency in naming, all IRA external variables,
28 functions, common typedefs start with prefix ira_. */
29
30 #if CHECKING_P
31 #define ENABLE_IRA_CHECKING
32 #endif
33
34 #ifdef ENABLE_IRA_CHECKING
35 #define ira_assert(c) gcc_assert (c)
36 #else
37 /* Always define and include C, so that warnings for empty body in an
38 'if' statement and unused variable do not occur. */
39 #define ira_assert(c) ((void)(0 && (c)))
40 #endif
41
42 /* Compute register frequency from edge frequency FREQ. It is
43 analogous to REG_FREQ_FROM_BB. When optimizing for size, or
44 profile driven feedback is available and the function is never
45 executed, frequency is always equivalent. Otherwise rescale the
46 edge frequency. */
47 #define REG_FREQ_FROM_EDGE_FREQ(freq) \
48 (optimize_function_for_size_p (cfun) \
49 ? REG_FREQ_MAX : (freq * REG_FREQ_MAX / BB_FREQ_MAX) \
50 ? (freq * REG_FREQ_MAX / BB_FREQ_MAX) : 1)
51
52 /* A modified value of flag `-fira-verbose' used internally. */
53 extern int internal_flag_ira_verbose;
54
55 /* Dump file of the allocator if it is not NULL. */
56 extern FILE *ira_dump_file;
57
58 /* Typedefs for pointers to allocno live range, allocno, and copy of
59 allocnos. */
60 typedef struct live_range *live_range_t;
61 typedef struct ira_allocno *ira_allocno_t;
62 typedef struct ira_allocno_pref *ira_pref_t;
63 typedef struct ira_allocno_copy *ira_copy_t;
64 typedef struct ira_object *ira_object_t;
65
66 /* Definition of vector of allocnos and copies. */
67
68 /* Typedef for pointer to the subsequent structure. */
69 typedef struct ira_loop_tree_node *ira_loop_tree_node_t;
70
71 typedef unsigned short move_table[N_REG_CLASSES];
72
73 /* In general case, IRA is a regional allocator. The regions are
74 nested and form a tree. Currently regions are natural loops. The
75 following structure describes loop tree node (representing basic
76 block or loop). We need such tree because the loop tree from
77 cfgloop.h is not convenient for the optimization: basic blocks are
78 not a part of the tree from cfgloop.h. We also use the nodes for
79 storing additional information about basic blocks/loops for the
80 register allocation purposes. */
81 struct ira_loop_tree_node
82 {
83 /* The node represents basic block if children == NULL. */
84 basic_block bb; /* NULL for loop. */
85 /* NULL for BB or for loop tree root if we did not build CFG loop tree. */
86 class loop *loop;
87 /* NEXT/SUBLOOP_NEXT is the next node/loop-node of the same parent.
88 SUBLOOP_NEXT is always NULL for BBs. */
89 ira_loop_tree_node_t subloop_next, next;
90 /* CHILDREN/SUBLOOPS is the first node/loop-node immediately inside
91 the node. They are NULL for BBs. */
92 ira_loop_tree_node_t subloops, children;
93 /* The node immediately containing given node. */
94 ira_loop_tree_node_t parent;
95
96 /* Loop level in range [0, ira_loop_tree_height). */
97 int level;
98
99 /* All the following members are defined only for nodes representing
100 loops. */
101
102 /* The loop number from CFG loop tree. The root number is 0. */
103 int loop_num;
104
105 /* True if the loop was marked for removal from the register
106 allocation. */
107 bool to_remove_p;
108
109 /* Allocnos in the loop corresponding to their regnos. If it is
110 NULL the loop does not form a separate register allocation region
111 (e.g. because it has abnormal enter/exit edges and we cannot put
112 code for register shuffling on the edges if a different
113 allocation is used for a pseudo-register on different sides of
114 the edges). Caps are not in the map (remember we can have more
115 one cap with the same regno in a region). */
116 ira_allocno_t *regno_allocno_map;
117
118 /* True if there is an entry to given loop not from its parent (or
119 grandparent) basic block. For example, it is possible for two
120 adjacent loops inside another loop. */
121 bool entered_from_non_parent_p;
122
123 /* Maximal register pressure inside loop for given register class
124 (defined only for the pressure classes). */
125 int reg_pressure[N_REG_CLASSES];
126
127 /* Numbers of allocnos referred or living in the loop node (except
128 for its subloops). */
129 bitmap all_allocnos;
130
131 /* Numbers of allocnos living at the loop borders. */
132 bitmap border_allocnos;
133
134 /* Regnos of pseudos modified in the loop node (including its
135 subloops). */
136 bitmap modified_regnos;
137
138 /* Numbers of copies referred in the corresponding loop. */
139 bitmap local_copies;
140 };
141
142 /* The root of the loop tree corresponding to the all function. */
143 extern ira_loop_tree_node_t ira_loop_tree_root;
144
145 /* Height of the loop tree. */
146 extern int ira_loop_tree_height;
147
148 /* All nodes representing basic blocks are referred through the
149 following array. We cannot use basic block member `aux' for this
150 because it is used for insertion of insns on edges. */
151 extern ira_loop_tree_node_t ira_bb_nodes;
152
153 /* Two access macros to the nodes representing basic blocks. */
154 #if defined ENABLE_IRA_CHECKING && (GCC_VERSION >= 2007)
155 #define IRA_BB_NODE_BY_INDEX(index) __extension__ \
156 (({ ira_loop_tree_node_t _node = (&ira_bb_nodes[index]); \
157 if (_node->children != NULL || _node->loop != NULL || _node->bb == NULL)\
158 { \
159 fprintf (stderr, \
160 "\n%s: %d: error in %s: it is not a block node\n", \
161 __FILE__, __LINE__, __FUNCTION__); \
162 gcc_unreachable (); \
163 } \
164 _node; }))
165 #else
166 #define IRA_BB_NODE_BY_INDEX(index) (&ira_bb_nodes[index])
167 #endif
168
169 #define IRA_BB_NODE(bb) IRA_BB_NODE_BY_INDEX ((bb)->index)
170
171 /* All nodes representing loops are referred through the following
172 array. */
173 extern ira_loop_tree_node_t ira_loop_nodes;
174
175 /* Two access macros to the nodes representing loops. */
176 #if defined ENABLE_IRA_CHECKING && (GCC_VERSION >= 2007)
177 #define IRA_LOOP_NODE_BY_INDEX(index) __extension__ \
178 (({ ira_loop_tree_node_t const _node = (&ira_loop_nodes[index]); \
179 if (_node->children == NULL || _node->bb != NULL \
180 || (_node->loop == NULL && current_loops != NULL)) \
181 { \
182 fprintf (stderr, \
183 "\n%s: %d: error in %s: it is not a loop node\n", \
184 __FILE__, __LINE__, __FUNCTION__); \
185 gcc_unreachable (); \
186 } \
187 _node; }))
188 #else
189 #define IRA_LOOP_NODE_BY_INDEX(index) (&ira_loop_nodes[index])
190 #endif
191
192 #define IRA_LOOP_NODE(loop) IRA_LOOP_NODE_BY_INDEX ((loop)->num)
193
194
195 /* The structure describes program points where a given allocno lives.
197 If the live ranges of two allocnos are intersected, the allocnos
198 are in conflict. */
199 struct live_range
200 {
201 /* Object whose live range is described by given structure. */
202 ira_object_t object;
203 /* Program point range. */
204 int start, finish;
205 /* Next structure describing program points where the allocno
206 lives. */
207 live_range_t next;
208 /* Pointer to structures with the same start/finish. */
209 live_range_t start_next, finish_next;
210 };
211
212 /* Program points are enumerated by numbers from range
213 0..IRA_MAX_POINT-1. There are approximately two times more program
214 points than insns. Program points are places in the program where
215 liveness info can be changed. In most general case (there are more
216 complicated cases too) some program points correspond to places
217 where input operand dies and other ones correspond to places where
218 output operands are born. */
219 extern int ira_max_point;
220
221 /* Arrays of size IRA_MAX_POINT mapping a program point to the allocno
222 live ranges with given start/finish point. */
223 extern live_range_t *ira_start_point_ranges, *ira_finish_point_ranges;
224
225 /* A structure representing conflict information for an allocno
226 (or one of its subwords). */
227 struct ira_object
228 {
229 /* The allocno associated with this record. */
230 ira_allocno_t allocno;
231 /* Vector of accumulated conflicting conflict_redords with NULL end
232 marker (if OBJECT_CONFLICT_VEC_P is true) or conflict bit vector
233 otherwise. */
234 void *conflicts_array;
235 /* Pointer to structures describing at what program point the
236 object lives. We always maintain the list in such way that *the
237 ranges in the list are not intersected and ordered by decreasing
238 their program points*. */
239 live_range_t live_ranges;
240 /* The subword within ALLOCNO which is represented by this object.
241 Zero means the lowest-order subword (or the entire allocno in case
242 it is not being tracked in subwords). */
243 int subword;
244 /* Allocated size of the conflicts array. */
245 unsigned int conflicts_array_size;
246 /* A unique number for every instance of this structure, which is used
247 to represent it in conflict bit vectors. */
248 int id;
249 /* Before building conflicts, MIN and MAX are initialized to
250 correspondingly minimal and maximal points of the accumulated
251 live ranges. Afterwards, they hold the minimal and maximal ids
252 of other ira_objects that this one can conflict with. */
253 int min, max;
254 /* Initial and accumulated hard registers conflicting with this
255 object and as a consequences cannot be assigned to the allocno.
256 All non-allocatable hard regs and hard regs of register classes
257 different from given allocno one are included in the sets. */
258 HARD_REG_SET conflict_hard_regs, total_conflict_hard_regs;
259 /* Number of accumulated conflicts in the vector of conflicting
260 objects. */
261 int num_accumulated_conflicts;
262 /* TRUE if conflicts are represented by a vector of pointers to
263 ira_object structures. Otherwise, we use a bit vector indexed
264 by conflict ID numbers. */
265 unsigned int conflict_vec_p : 1;
266 };
267
268 /* A structure representing an allocno (allocation entity). Allocno
269 represents a pseudo-register in an allocation region. If
270 pseudo-register does not live in a region but it lives in the
271 nested regions, it is represented in the region by special allocno
272 called *cap*. There may be more one cap representing the same
273 pseudo-register in region. It means that the corresponding
274 pseudo-register lives in more one non-intersected subregion. */
275 struct ira_allocno
276 {
277 /* The allocno order number starting with 0. Each allocno has an
278 unique number and the number is never changed for the
279 allocno. */
280 int num;
281 /* Regno for allocno or cap. */
282 int regno;
283 /* Mode of the allocno which is the mode of the corresponding
284 pseudo-register. */
285 ENUM_BITFIELD (machine_mode) mode : 8;
286 /* Widest mode of the allocno which in at least one case could be
287 for paradoxical subregs where wmode > mode. */
288 ENUM_BITFIELD (machine_mode) wmode : 8;
289 /* Register class which should be used for allocation for given
290 allocno. NO_REGS means that we should use memory. */
291 ENUM_BITFIELD (reg_class) aclass : 16;
292 /* A bitmask of the ABIs used by calls that occur while the allocno
293 is live. */
294 unsigned int crossed_calls_abis : NUM_ABI_IDS;
295 /* During the reload, value TRUE means that we should not reassign a
296 hard register to the allocno got memory earlier. It is set up
297 when we removed memory-memory move insn before each iteration of
298 the reload. */
299 unsigned int dont_reassign_p : 1;
300 #ifdef STACK_REGS
301 /* Set to TRUE if allocno can't be assigned to the stack hard
302 register correspondingly in this region and area including the
303 region and all its subregions recursively. */
304 unsigned int no_stack_reg_p : 1, total_no_stack_reg_p : 1;
305 #endif
306 /* TRUE value means that there is no sense to spill the allocno
307 during coloring because the spill will result in additional
308 reloads in reload pass. */
309 unsigned int bad_spill_p : 1;
310 /* TRUE if a hard register or memory has been assigned to the
311 allocno. */
312 unsigned int assigned_p : 1;
313 /* TRUE if conflicts for given allocno are represented by vector of
314 pointers to the conflicting allocnos. Otherwise, we use a bit
315 vector where a bit with given index represents allocno with the
316 same number. */
317 unsigned int conflict_vec_p : 1;
318 /* True if the parent loop has an allocno for the same register and
319 if the parent allocno's assignment might not be valid in this loop.
320 This means that we cannot merge this allocno and the parent allocno
321 together.
322
323 This is only ever true for non-cap allocnos. */
324 unsigned int might_conflict_with_parent_p : 1;
325 /* Hard register assigned to given allocno. Negative value means
326 that memory was allocated to the allocno. During the reload,
327 spilled allocno has value equal to the corresponding stack slot
328 number (0, ...) - 2. Value -1 is used for allocnos spilled by the
329 reload (at this point pseudo-register has only one allocno) which
330 did not get stack slot yet. */
331 signed int hard_regno : 16;
332 /* Allocnos with the same regno are linked by the following member.
333 Allocnos corresponding to inner loops are first in the list (it
334 corresponds to depth-first traverse of the loops). */
335 ira_allocno_t next_regno_allocno;
336 /* There may be different allocnos with the same regno in different
337 regions. Allocnos are bound to the corresponding loop tree node.
338 Pseudo-register may have only one regular allocno with given loop
339 tree node but more than one cap (see comments above). */
340 ira_loop_tree_node_t loop_tree_node;
341 /* Accumulated usage references of the allocno. Here and below,
342 word 'accumulated' means info for given region and all nested
343 subregions. In this case, 'accumulated' means sum of references
344 of the corresponding pseudo-register in this region and in all
345 nested subregions recursively. */
346 int nrefs;
347 /* Accumulated frequency of usage of the allocno. */
348 int freq;
349 /* Minimal accumulated and updated costs of usage register of the
350 allocno class. */
351 int class_cost, updated_class_cost;
352 /* Minimal accumulated, and updated costs of memory for the allocno.
353 At the allocation start, the original and updated costs are
354 equal. The updated cost may be changed after finishing
355 allocation in a region and starting allocation in a subregion.
356 The change reflects the cost of spill/restore code on the
357 subregion border if we assign memory to the pseudo in the
358 subregion. */
359 int memory_cost, updated_memory_cost;
360 /* Accumulated number of points where the allocno lives and there is
361 excess pressure for its class. Excess pressure for a register
362 class at some point means that there are more allocnos of given
363 register class living at the point than number of hard-registers
364 of the class available for the allocation. */
365 int excess_pressure_points_num;
366 /* Allocno hard reg preferences. */
367 ira_pref_t allocno_prefs;
368 /* Copies to other non-conflicting allocnos. The copies can
369 represent move insn or potential move insn usually because of two
370 operand insn constraints. */
371 ira_copy_t allocno_copies;
372 /* It is a allocno (cap) representing given allocno on upper loop tree
373 level. */
374 ira_allocno_t cap;
375 /* It is a link to allocno (cap) on lower loop level represented by
376 given cap. Null if given allocno is not a cap. */
377 ira_allocno_t cap_member;
378 /* The number of objects tracked in the following array. */
379 int num_objects;
380 /* An array of structures describing conflict information and live
381 ranges for each object associated with the allocno. There may be
382 more than one such object in cases where the allocno represents a
383 multi-word register. */
384 ira_object_t objects[2];
385 /* Accumulated frequency of calls which given allocno
386 intersects. */
387 int call_freq;
388 /* Accumulated number of the intersected calls. */
389 int calls_crossed_num;
390 /* The number of calls across which it is live, but which should not
391 affect register preferences. */
392 int cheap_calls_crossed_num;
393 /* Registers clobbered by intersected calls. */
394 HARD_REG_SET crossed_calls_clobbered_regs;
395 /* Array of usage costs (accumulated and the one updated during
396 coloring) for each hard register of the allocno class. The
397 member value can be NULL if all costs are the same and equal to
398 CLASS_COST. For example, the costs of two different hard
399 registers can be different if one hard register is callee-saved
400 and another one is callee-used and the allocno lives through
401 calls. Another example can be case when for some insn the
402 corresponding pseudo-register value should be put in specific
403 register class (e.g. AREG for x86) which is a strict subset of
404 the allocno class (GENERAL_REGS for x86). We have updated costs
405 to reflect the situation when the usage cost of a hard register
406 is decreased because the allocno is connected to another allocno
407 by a copy and the another allocno has been assigned to the hard
408 register. */
409 int *hard_reg_costs, *updated_hard_reg_costs;
410 /* Array of decreasing costs (accumulated and the one updated during
411 coloring) for allocnos conflicting with given allocno for hard
412 regno of the allocno class. The member value can be NULL if all
413 costs are the same. These costs are used to reflect preferences
414 of other allocnos not assigned yet during assigning to given
415 allocno. */
416 int *conflict_hard_reg_costs, *updated_conflict_hard_reg_costs;
417 /* Different additional data. It is used to decrease size of
418 allocno data footprint. */
419 void *add_data;
420 };
421
422
423 /* All members of the allocno structures should be accessed only
424 through the following macros. */
425 #define ALLOCNO_NUM(A) ((A)->num)
426 #define ALLOCNO_REGNO(A) ((A)->regno)
427 #define ALLOCNO_REG(A) ((A)->reg)
428 #define ALLOCNO_NEXT_REGNO_ALLOCNO(A) ((A)->next_regno_allocno)
429 #define ALLOCNO_LOOP_TREE_NODE(A) ((A)->loop_tree_node)
430 #define ALLOCNO_CAP(A) ((A)->cap)
431 #define ALLOCNO_CAP_MEMBER(A) ((A)->cap_member)
432 #define ALLOCNO_NREFS(A) ((A)->nrefs)
433 #define ALLOCNO_FREQ(A) ((A)->freq)
434 #define ALLOCNO_MIGHT_CONFLICT_WITH_PARENT_P(A) \
435 ((A)->might_conflict_with_parent_p)
436 #define ALLOCNO_HARD_REGNO(A) ((A)->hard_regno)
437 #define ALLOCNO_CALL_FREQ(A) ((A)->call_freq)
438 #define ALLOCNO_CALLS_CROSSED_NUM(A) ((A)->calls_crossed_num)
439 #define ALLOCNO_CHEAP_CALLS_CROSSED_NUM(A) ((A)->cheap_calls_crossed_num)
440 #define ALLOCNO_CROSSED_CALLS_ABIS(A) ((A)->crossed_calls_abis)
441 #define ALLOCNO_CROSSED_CALLS_CLOBBERED_REGS(A) \
442 ((A)->crossed_calls_clobbered_regs)
443 #define ALLOCNO_MEM_OPTIMIZED_DEST(A) ((A)->mem_optimized_dest)
444 #define ALLOCNO_MEM_OPTIMIZED_DEST_P(A) ((A)->mem_optimized_dest_p)
445 #define ALLOCNO_SOMEWHERE_RENAMED_P(A) ((A)->somewhere_renamed_p)
446 #define ALLOCNO_CHILD_RENAMED_P(A) ((A)->child_renamed_p)
447 #define ALLOCNO_DONT_REASSIGN_P(A) ((A)->dont_reassign_p)
448 #ifdef STACK_REGS
449 #define ALLOCNO_NO_STACK_REG_P(A) ((A)->no_stack_reg_p)
450 #define ALLOCNO_TOTAL_NO_STACK_REG_P(A) ((A)->total_no_stack_reg_p)
451 #endif
452 #define ALLOCNO_BAD_SPILL_P(A) ((A)->bad_spill_p)
453 #define ALLOCNO_ASSIGNED_P(A) ((A)->assigned_p)
454 #define ALLOCNO_MODE(A) ((A)->mode)
455 #define ALLOCNO_WMODE(A) ((A)->wmode)
456 #define ALLOCNO_PREFS(A) ((A)->allocno_prefs)
457 #define ALLOCNO_COPIES(A) ((A)->allocno_copies)
458 #define ALLOCNO_HARD_REG_COSTS(A) ((A)->hard_reg_costs)
459 #define ALLOCNO_UPDATED_HARD_REG_COSTS(A) ((A)->updated_hard_reg_costs)
460 #define ALLOCNO_CONFLICT_HARD_REG_COSTS(A) \
461 ((A)->conflict_hard_reg_costs)
462 #define ALLOCNO_UPDATED_CONFLICT_HARD_REG_COSTS(A) \
463 ((A)->updated_conflict_hard_reg_costs)
464 #define ALLOCNO_CLASS(A) ((A)->aclass)
465 #define ALLOCNO_CLASS_COST(A) ((A)->class_cost)
466 #define ALLOCNO_UPDATED_CLASS_COST(A) ((A)->updated_class_cost)
467 #define ALLOCNO_MEMORY_COST(A) ((A)->memory_cost)
468 #define ALLOCNO_UPDATED_MEMORY_COST(A) ((A)->updated_memory_cost)
469 #define ALLOCNO_EXCESS_PRESSURE_POINTS_NUM(A) \
470 ((A)->excess_pressure_points_num)
471 #define ALLOCNO_OBJECT(A,N) ((A)->objects[N])
472 #define ALLOCNO_NUM_OBJECTS(A) ((A)->num_objects)
473 #define ALLOCNO_ADD_DATA(A) ((A)->add_data)
474
475 /* Typedef for pointer to the subsequent structure. */
476 typedef struct ira_emit_data *ira_emit_data_t;
477
478 /* Allocno bound data used for emit pseudo live range split insns and
479 to flattening IR. */
480 struct ira_emit_data
481 {
482 /* TRUE if the allocno assigned to memory was a destination of
483 removed move (see ira-emit.cc) at loop exit because the value of
484 the corresponding pseudo-register is not changed inside the
485 loop. */
486 unsigned int mem_optimized_dest_p : 1;
487 /* TRUE if the corresponding pseudo-register has disjoint live
488 ranges and the other allocnos of the pseudo-register except this
489 one changed REG. */
490 unsigned int somewhere_renamed_p : 1;
491 /* TRUE if allocno with the same REGNO in a subregion has been
492 renamed, in other words, got a new pseudo-register. */
493 unsigned int child_renamed_p : 1;
494 /* Final rtx representation of the allocno. */
495 rtx reg;
496 /* Non NULL if we remove restoring value from given allocno to
497 MEM_OPTIMIZED_DEST at loop exit (see ira-emit.cc) because the
498 allocno value is not changed inside the loop. */
499 ira_allocno_t mem_optimized_dest;
500 };
501
502 #define ALLOCNO_EMIT_DATA(a) ((ira_emit_data_t) ALLOCNO_ADD_DATA (a))
503
504 /* Data used to emit live range split insns and to flattening IR. */
505 extern ira_emit_data_t ira_allocno_emit_data;
506
507 /* Abbreviation for frequent emit data access. */
508 static inline rtx
509 allocno_emit_reg (ira_allocno_t a)
510 {
511 return ALLOCNO_EMIT_DATA (a)->reg;
512 }
513
514 #define OBJECT_ALLOCNO(O) ((O)->allocno)
515 #define OBJECT_SUBWORD(O) ((O)->subword)
516 #define OBJECT_CONFLICT_ARRAY(O) ((O)->conflicts_array)
517 #define OBJECT_CONFLICT_VEC(O) ((ira_object_t *)(O)->conflicts_array)
518 #define OBJECT_CONFLICT_BITVEC(O) ((IRA_INT_TYPE *)(O)->conflicts_array)
519 #define OBJECT_CONFLICT_ARRAY_SIZE(O) ((O)->conflicts_array_size)
520 #define OBJECT_CONFLICT_VEC_P(O) ((O)->conflict_vec_p)
521 #define OBJECT_NUM_CONFLICTS(O) ((O)->num_accumulated_conflicts)
522 #define OBJECT_CONFLICT_HARD_REGS(O) ((O)->conflict_hard_regs)
523 #define OBJECT_TOTAL_CONFLICT_HARD_REGS(O) ((O)->total_conflict_hard_regs)
524 #define OBJECT_MIN(O) ((O)->min)
525 #define OBJECT_MAX(O) ((O)->max)
526 #define OBJECT_CONFLICT_ID(O) ((O)->id)
527 #define OBJECT_LIVE_RANGES(O) ((O)->live_ranges)
528
529 /* Map regno -> allocnos with given regno (see comments for
530 allocno member `next_regno_allocno'). */
531 extern ira_allocno_t *ira_regno_allocno_map;
532
533 /* Array of references to all allocnos. The order number of the
534 allocno corresponds to the index in the array. Removed allocnos
535 have NULL element value. */
536 extern ira_allocno_t *ira_allocnos;
537
538 /* The size of the previous array. */
539 extern int ira_allocnos_num;
540
541 /* Map a conflict id to its corresponding ira_object structure. */
542 extern ira_object_t *ira_object_id_map;
543
544 /* The size of the previous array. */
545 extern int ira_objects_num;
546
547 /* The following structure represents a hard register preference of
548 allocno. The preference represent move insns or potential move
549 insns usually because of two operand insn constraints. One move
550 operand is a hard register. */
551 struct ira_allocno_pref
552 {
553 /* The unique order number of the preference node starting with 0. */
554 int num;
555 /* Preferred hard register. */
556 int hard_regno;
557 /* Accumulated execution frequency of insns from which the
558 preference created. */
559 int freq;
560 /* Given allocno. */
561 ira_allocno_t allocno;
562 /* All preferences with the same allocno are linked by the following
563 member. */
564 ira_pref_t next_pref;
565 };
566
567 /* Array of references to all allocno preferences. The order number
568 of the preference corresponds to the index in the array. */
569 extern ira_pref_t *ira_prefs;
570
571 /* Size of the previous array. */
572 extern int ira_prefs_num;
573
574 /* The following structure represents a copy of two allocnos. The
575 copies represent move insns or potential move insns usually because
576 of two operand insn constraints. To remove register shuffle, we
577 also create copies between allocno which is output of an insn and
578 allocno becoming dead in the insn. */
579 struct ira_allocno_copy
580 {
581 /* The unique order number of the copy node starting with 0. */
582 int num;
583 /* Allocnos connected by the copy. The first allocno should have
584 smaller order number than the second one. */
585 ira_allocno_t first, second;
586 /* Execution frequency of the copy. */
587 int freq;
588 bool constraint_p;
589 /* It is a move insn which is an origin of the copy. The member
590 value for the copy representing two operand insn constraints or
591 for the copy created to remove register shuffle is NULL. In last
592 case the copy frequency is smaller than the corresponding insn
593 execution frequency. */
594 rtx_insn *insn;
595 /* All copies with the same allocno as FIRST are linked by the two
596 following members. */
597 ira_copy_t prev_first_allocno_copy, next_first_allocno_copy;
598 /* All copies with the same allocno as SECOND are linked by the two
599 following members. */
600 ira_copy_t prev_second_allocno_copy, next_second_allocno_copy;
601 /* Region from which given copy is originated. */
602 ira_loop_tree_node_t loop_tree_node;
603 };
604
605 /* Array of references to all copies. The order number of the copy
606 corresponds to the index in the array. Removed copies have NULL
607 element value. */
608 extern ira_copy_t *ira_copies;
609
610 /* Size of the previous array. */
611 extern int ira_copies_num;
612
613 /* The following structure describes a stack slot used for spilled
614 pseudo-registers. */
615 class ira_spilled_reg_stack_slot
616 {
617 public:
618 /* pseudo-registers assigned to the stack slot. */
619 bitmap_head spilled_regs;
620 /* RTL representation of the stack slot. */
621 rtx mem;
622 /* Size of the stack slot. */
623 poly_uint64_pod width;
624 };
625
626 /* The number of elements in the following array. */
627 extern int ira_spilled_reg_stack_slots_num;
628
629 /* The following array contains info about spilled pseudo-registers
630 stack slots used in current function so far. */
631 extern class ira_spilled_reg_stack_slot *ira_spilled_reg_stack_slots;
632
633 /* Correspondingly overall cost of the allocation, cost of the
634 allocnos assigned to hard-registers, cost of the allocnos assigned
635 to memory, cost of loads, stores and register move insns generated
636 for pseudo-register live range splitting (see ira-emit.cc). */
637 extern int64_t ira_overall_cost;
638 extern int64_t ira_reg_cost, ira_mem_cost;
639 extern int64_t ira_load_cost, ira_store_cost, ira_shuffle_cost;
640 extern int ira_move_loops_num, ira_additional_jumps_num;
641
642
643 /* This page contains a bitset implementation called 'min/max sets' used to
645 record conflicts in IRA.
646 They are named min/maxs set since we keep track of a minimum and a maximum
647 bit number for each set representing the bounds of valid elements. Otherwise,
648 the implementation resembles sbitmaps in that we store an array of integers
649 whose bits directly represent the members of the set. */
650
651 /* The type used as elements in the array, and the number of bits in
652 this type. */
653
654 #define IRA_INT_BITS HOST_BITS_PER_WIDE_INT
655 #define IRA_INT_TYPE HOST_WIDE_INT
656
657 /* Set, clear or test bit number I in R, a bit vector of elements with
658 minimal index and maximal index equal correspondingly to MIN and
659 MAX. */
660 #if defined ENABLE_IRA_CHECKING && (GCC_VERSION >= 2007)
661
662 #define SET_MINMAX_SET_BIT(R, I, MIN, MAX) __extension__ \
663 (({ int _min = (MIN), _max = (MAX), _i = (I); \
664 if (_i < _min || _i > _max) \
665 { \
666 fprintf (stderr, \
667 "\n%s: %d: error in %s: %d not in range [%d,%d]\n", \
668 __FILE__, __LINE__, __FUNCTION__, _i, _min, _max); \
669 gcc_unreachable (); \
670 } \
671 ((R)[(unsigned) (_i - _min) / IRA_INT_BITS] \
672 |= ((IRA_INT_TYPE) 1 << ((unsigned) (_i - _min) % IRA_INT_BITS))); }))
673
674
675 #define CLEAR_MINMAX_SET_BIT(R, I, MIN, MAX) __extension__ \
676 (({ int _min = (MIN), _max = (MAX), _i = (I); \
677 if (_i < _min || _i > _max) \
678 { \
679 fprintf (stderr, \
680 "\n%s: %d: error in %s: %d not in range [%d,%d]\n", \
681 __FILE__, __LINE__, __FUNCTION__, _i, _min, _max); \
682 gcc_unreachable (); \
683 } \
684 ((R)[(unsigned) (_i - _min) / IRA_INT_BITS] \
685 &= ~((IRA_INT_TYPE) 1 << ((unsigned) (_i - _min) % IRA_INT_BITS))); }))
686
687 #define TEST_MINMAX_SET_BIT(R, I, MIN, MAX) __extension__ \
688 (({ int _min = (MIN), _max = (MAX), _i = (I); \
689 if (_i < _min || _i > _max) \
690 { \
691 fprintf (stderr, \
692 "\n%s: %d: error in %s: %d not in range [%d,%d]\n", \
693 __FILE__, __LINE__, __FUNCTION__, _i, _min, _max); \
694 gcc_unreachable (); \
695 } \
696 ((R)[(unsigned) (_i - _min) / IRA_INT_BITS] \
697 & ((IRA_INT_TYPE) 1 << ((unsigned) (_i - _min) % IRA_INT_BITS))); }))
698
699 #else
700
701 #define SET_MINMAX_SET_BIT(R, I, MIN, MAX) \
702 ((R)[(unsigned) ((I) - (MIN)) / IRA_INT_BITS] \
703 |= ((IRA_INT_TYPE) 1 << ((unsigned) ((I) - (MIN)) % IRA_INT_BITS)))
704
705 #define CLEAR_MINMAX_SET_BIT(R, I, MIN, MAX) \
706 ((R)[(unsigned) ((I) - (MIN)) / IRA_INT_BITS] \
707 &= ~((IRA_INT_TYPE) 1 << ((unsigned) ((I) - (MIN)) % IRA_INT_BITS)))
708
709 #define TEST_MINMAX_SET_BIT(R, I, MIN, MAX) \
710 ((R)[(unsigned) ((I) - (MIN)) / IRA_INT_BITS] \
711 & ((IRA_INT_TYPE) 1 << ((unsigned) ((I) - (MIN)) % IRA_INT_BITS)))
712
713 #endif
714
715 /* The iterator for min/max sets. */
716 struct minmax_set_iterator {
717
718 /* Array containing the bit vector. */
719 IRA_INT_TYPE *vec;
720
721 /* The number of the current element in the vector. */
722 unsigned int word_num;
723
724 /* The number of bits in the bit vector. */
725 unsigned int nel;
726
727 /* The current bit index of the bit vector. */
728 unsigned int bit_num;
729
730 /* Index corresponding to the 1st bit of the bit vector. */
731 int start_val;
732
733 /* The word of the bit vector currently visited. */
734 unsigned IRA_INT_TYPE word;
735 };
736
737 /* Initialize the iterator I for bit vector VEC containing minimal and
738 maximal values MIN and MAX. */
739 static inline void
740 minmax_set_iter_init (minmax_set_iterator *i, IRA_INT_TYPE *vec, int min,
741 int max)
742 {
743 i->vec = vec;
744 i->word_num = 0;
745 i->nel = max < min ? 0 : max - min + 1;
746 i->start_val = min;
747 i->bit_num = 0;
748 i->word = i->nel == 0 ? 0 : vec[0];
749 }
750
751 /* Return TRUE if we have more allocnos to visit, in which case *N is
752 set to the number of the element to be visited. Otherwise, return
753 FALSE. */
754 static inline bool
755 minmax_set_iter_cond (minmax_set_iterator *i, int *n)
756 {
757 /* Skip words that are zeros. */
758 for (; i->word == 0; i->word = i->vec[i->word_num])
759 {
760 i->word_num++;
761 i->bit_num = i->word_num * IRA_INT_BITS;
762
763 /* If we have reached the end, break. */
764 if (i->bit_num >= i->nel)
765 return false;
766 }
767
768 /* Skip bits that are zero. */
769 int off = ctz_hwi (i->word);
770 i->bit_num += off;
771 i->word >>= off;
772
773 *n = (int) i->bit_num + i->start_val;
774
775 return true;
776 }
777
778 /* Advance to the next element in the set. */
779 static inline void
780 minmax_set_iter_next (minmax_set_iterator *i)
781 {
782 i->word >>= 1;
783 i->bit_num++;
784 }
785
786 /* Loop over all elements of a min/max set given by bit vector VEC and
787 their minimal and maximal values MIN and MAX. In each iteration, N
788 is set to the number of next allocno. ITER is an instance of
789 minmax_set_iterator used to iterate over the set. */
790 #define FOR_EACH_BIT_IN_MINMAX_SET(VEC, MIN, MAX, N, ITER) \
791 for (minmax_set_iter_init (&(ITER), (VEC), (MIN), (MAX)); \
792 minmax_set_iter_cond (&(ITER), &(N)); \
793 minmax_set_iter_next (&(ITER)))
794
795 class target_ira_int {
797 public:
798 ~target_ira_int ();
799
800 void free_ira_costs ();
801 void free_register_move_costs ();
802
803 /* Initialized once. It is a maximal possible size of the allocated
804 struct costs. */
805 size_t x_max_struct_costs_size;
806
807 /* Allocated and initialized once, and used to initialize cost values
808 for each insn. */
809 struct costs *x_init_cost;
810
811 /* Allocated once, and used for temporary purposes. */
812 struct costs *x_temp_costs;
813
814 /* Allocated once, and used for the cost calculation. */
815 struct costs *x_op_costs[MAX_RECOG_OPERANDS];
816 struct costs *x_this_op_costs[MAX_RECOG_OPERANDS];
817
818 /* Hard registers that cannot be used for the register allocator for
819 all functions of the current compilation unit. */
820 HARD_REG_SET x_no_unit_alloc_regs;
821
822 /* Map: hard regs X modes -> set of hard registers for storing value
823 of given mode starting with given hard register. */
824 HARD_REG_SET (x_ira_reg_mode_hard_regset
825 [FIRST_PSEUDO_REGISTER][NUM_MACHINE_MODES]);
826
827 /* Maximum cost of moving from a register in one class to a register
828 in another class. Based on TARGET_REGISTER_MOVE_COST. */
829 move_table *x_ira_register_move_cost[MAX_MACHINE_MODE];
830
831 /* Similar, but here we don't have to move if the first index is a
832 subset of the second so in that case the cost is zero. */
833 move_table *x_ira_may_move_in_cost[MAX_MACHINE_MODE];
834
835 /* Similar, but here we don't have to move if the first index is a
836 superset of the second so in that case the cost is zero. */
837 move_table *x_ira_may_move_out_cost[MAX_MACHINE_MODE];
838
839 /* Keep track of the last mode we initialized move costs for. */
840 int x_last_mode_for_init_move_cost;
841
842 /* Array analog of the macro MEMORY_MOVE_COST but they contain maximal
843 cost not minimal. */
844 short int x_ira_max_memory_move_cost[MAX_MACHINE_MODE][N_REG_CLASSES][2];
845
846 /* Map class->true if class is a possible allocno class, false
847 otherwise. */
848 bool x_ira_reg_allocno_class_p[N_REG_CLASSES];
849
850 /* Map class->true if class is a pressure class, false otherwise. */
851 bool x_ira_reg_pressure_class_p[N_REG_CLASSES];
852
853 /* Array of the number of hard registers of given class which are
854 available for allocation. The order is defined by the hard
855 register numbers. */
856 short x_ira_non_ordered_class_hard_regs[N_REG_CLASSES][FIRST_PSEUDO_REGISTER];
857
858 /* Index (in ira_class_hard_regs; for given register class and hard
859 register (in general case a hard register can belong to several
860 register classes;. The index is negative for hard registers
861 unavailable for the allocation. */
862 short x_ira_class_hard_reg_index[N_REG_CLASSES][FIRST_PSEUDO_REGISTER];
863
864 /* Index [CL][M] contains R if R appears somewhere in a register of the form:
865
866 (reg:M R'), R' not in x_ira_prohibited_class_mode_regs[CL][M]
867
868 For example, if:
869
870 - (reg:M 2) is valid and occupies two registers;
871 - register 2 belongs to CL; and
872 - register 3 belongs to the same pressure class as CL
873
874 then (reg:M 2) contributes to [CL][M] and registers 2 and 3 will be
875 in the set. */
876 HARD_REG_SET x_ira_useful_class_mode_regs[N_REG_CLASSES][NUM_MACHINE_MODES];
877
878 /* The value is number of elements in the subsequent array. */
879 int x_ira_important_classes_num;
880
881 /* The array containing all non-empty classes. Such classes is
882 important for calculation of the hard register usage costs. */
883 enum reg_class x_ira_important_classes[N_REG_CLASSES];
884
885 /* The array containing indexes of important classes in the previous
886 array. The array elements are defined only for important
887 classes. */
888 int x_ira_important_class_nums[N_REG_CLASSES];
889
890 /* Map class->true if class is an uniform class, false otherwise. */
891 bool x_ira_uniform_class_p[N_REG_CLASSES];
892
893 /* The biggest important class inside of intersection of the two
894 classes (that is calculated taking only hard registers available
895 for allocation into account;. If the both classes contain no hard
896 registers available for allocation, the value is calculated with
897 taking all hard-registers including fixed ones into account. */
898 enum reg_class x_ira_reg_class_intersect[N_REG_CLASSES][N_REG_CLASSES];
899
900 /* Classes with end marker LIM_REG_CLASSES which are intersected with
901 given class (the first index). That includes given class itself.
902 This is calculated taking only hard registers available for
903 allocation into account. */
904 enum reg_class x_ira_reg_class_super_classes[N_REG_CLASSES][N_REG_CLASSES];
905
906 /* The biggest (smallest) important class inside of (covering) union
907 of the two classes (that is calculated taking only hard registers
908 available for allocation into account). If the both classes
909 contain no hard registers available for allocation, the value is
910 calculated with taking all hard-registers including fixed ones
911 into account. In other words, the value is the corresponding
912 reg_class_subunion (reg_class_superunion) value. */
913 enum reg_class x_ira_reg_class_subunion[N_REG_CLASSES][N_REG_CLASSES];
914 enum reg_class x_ira_reg_class_superunion[N_REG_CLASSES][N_REG_CLASSES];
915
916 /* For each reg class, table listing all the classes contained in it
917 (excluding the class itself. Non-allocatable registers are
918 excluded from the consideration). */
919 enum reg_class x_alloc_reg_class_subclasses[N_REG_CLASSES][N_REG_CLASSES];
920
921 /* Array whose values are hard regset of hard registers for which
922 move of the hard register in given mode into itself is
923 prohibited. */
924 HARD_REG_SET x_ira_prohibited_mode_move_regs[NUM_MACHINE_MODES];
925
926 /* Flag of that the above array has been initialized. */
927 bool x_ira_prohibited_mode_move_regs_initialized_p;
928 };
929
930 extern class target_ira_int default_target_ira_int;
931 #if SWITCHABLE_TARGET
932 extern class target_ira_int *this_target_ira_int;
933 #else
934 #define this_target_ira_int (&default_target_ira_int)
935 #endif
936
937 #define ira_reg_mode_hard_regset \
938 (this_target_ira_int->x_ira_reg_mode_hard_regset)
939 #define ira_register_move_cost \
940 (this_target_ira_int->x_ira_register_move_cost)
941 #define ira_max_memory_move_cost \
942 (this_target_ira_int->x_ira_max_memory_move_cost)
943 #define ira_may_move_in_cost \
944 (this_target_ira_int->x_ira_may_move_in_cost)
945 #define ira_may_move_out_cost \
946 (this_target_ira_int->x_ira_may_move_out_cost)
947 #define ira_reg_allocno_class_p \
948 (this_target_ira_int->x_ira_reg_allocno_class_p)
949 #define ira_reg_pressure_class_p \
950 (this_target_ira_int->x_ira_reg_pressure_class_p)
951 #define ira_non_ordered_class_hard_regs \
952 (this_target_ira_int->x_ira_non_ordered_class_hard_regs)
953 #define ira_class_hard_reg_index \
954 (this_target_ira_int->x_ira_class_hard_reg_index)
955 #define ira_useful_class_mode_regs \
956 (this_target_ira_int->x_ira_useful_class_mode_regs)
957 #define ira_important_classes_num \
958 (this_target_ira_int->x_ira_important_classes_num)
959 #define ira_important_classes \
960 (this_target_ira_int->x_ira_important_classes)
961 #define ira_important_class_nums \
962 (this_target_ira_int->x_ira_important_class_nums)
963 #define ira_uniform_class_p \
964 (this_target_ira_int->x_ira_uniform_class_p)
965 #define ira_reg_class_intersect \
966 (this_target_ira_int->x_ira_reg_class_intersect)
967 #define ira_reg_class_super_classes \
968 (this_target_ira_int->x_ira_reg_class_super_classes)
969 #define ira_reg_class_subunion \
970 (this_target_ira_int->x_ira_reg_class_subunion)
971 #define ira_reg_class_superunion \
972 (this_target_ira_int->x_ira_reg_class_superunion)
973 #define ira_prohibited_mode_move_regs \
974 (this_target_ira_int->x_ira_prohibited_mode_move_regs)
975
976 /* ira.cc: */
978
979 extern void *ira_allocate (size_t);
980 extern void ira_free (void *addr);
981 extern bitmap ira_allocate_bitmap (void);
982 extern void ira_free_bitmap (bitmap);
983 extern void ira_print_disposition (FILE *);
984 extern void ira_debug_disposition (void);
985 extern void ira_debug_allocno_classes (void);
986 extern void ira_init_register_move_cost (machine_mode);
987 extern alternative_mask ira_setup_alts (rtx_insn *);
988 extern int ira_get_dup_out_num (int, alternative_mask, bool &);
989
990 /* ira-build.cc */
991
992 /* The current loop tree node and its regno allocno map. */
993 extern ira_loop_tree_node_t ira_curr_loop_tree_node;
994 extern ira_allocno_t *ira_curr_regno_allocno_map;
995
996 extern void ira_debug_pref (ira_pref_t);
997 extern void ira_debug_prefs (void);
998 extern void ira_debug_allocno_prefs (ira_allocno_t);
999
1000 extern void ira_debug_copy (ira_copy_t);
1001 extern void debug (ira_allocno_copy &ref);
1002 extern void debug (ira_allocno_copy *ptr);
1003
1004 extern void ira_debug_copies (void);
1005 extern void ira_debug_allocno_copies (ira_allocno_t);
1006 extern void debug (ira_allocno &ref);
1007 extern void debug (ira_allocno *ptr);
1008
1009 extern void ira_traverse_loop_tree (bool, ira_loop_tree_node_t,
1010 void (*) (ira_loop_tree_node_t),
1011 void (*) (ira_loop_tree_node_t));
1012 extern ira_allocno_t ira_parent_allocno (ira_allocno_t);
1013 extern ira_allocno_t ira_parent_or_cap_allocno (ira_allocno_t);
1014 extern ira_allocno_t ira_create_allocno (int, bool, ira_loop_tree_node_t);
1015 extern void ira_create_allocno_objects (ira_allocno_t);
1016 extern void ira_set_allocno_class (ira_allocno_t, enum reg_class);
1017 extern bool ira_conflict_vector_profitable_p (ira_object_t, int);
1018 extern void ira_allocate_conflict_vec (ira_object_t, int);
1019 extern void ira_allocate_object_conflicts (ira_object_t, int);
1020 extern void ior_hard_reg_conflicts (ira_allocno_t, const_hard_reg_set);
1021 extern void ira_print_expanded_allocno (ira_allocno_t);
1022 extern void ira_add_live_range_to_object (ira_object_t, int, int);
1023 extern live_range_t ira_create_live_range (ira_object_t, int, int,
1024 live_range_t);
1025 extern live_range_t ira_copy_live_range_list (live_range_t);
1026 extern live_range_t ira_merge_live_ranges (live_range_t, live_range_t);
1027 extern bool ira_live_ranges_intersect_p (live_range_t, live_range_t);
1028 extern void ira_finish_live_range (live_range_t);
1029 extern void ira_finish_live_range_list (live_range_t);
1030 extern void ira_free_allocno_updated_costs (ira_allocno_t);
1031 extern ira_pref_t ira_create_pref (ira_allocno_t, int, int);
1032 extern void ira_add_allocno_pref (ira_allocno_t, int, int);
1033 extern void ira_remove_pref (ira_pref_t);
1034 extern void ira_remove_allocno_prefs (ira_allocno_t);
1035 extern ira_copy_t ira_create_copy (ira_allocno_t, ira_allocno_t,
1036 int, bool, rtx_insn *,
1037 ira_loop_tree_node_t);
1038 extern ira_copy_t ira_add_allocno_copy (ira_allocno_t, ira_allocno_t, int,
1039 bool, rtx_insn *,
1040 ira_loop_tree_node_t);
1041
1042 extern int *ira_allocate_cost_vector (reg_class_t);
1043 extern void ira_free_cost_vector (int *, reg_class_t);
1044
1045 extern void ira_flattening (int, int);
1046 extern bool ira_build (void);
1047 extern void ira_destroy (void);
1048
1049 /* ira-costs.cc */
1050 extern void ira_init_costs_once (void);
1051 extern void ira_init_costs (void);
1052 extern void ira_costs (void);
1053 extern void ira_tune_allocno_costs (void);
1054
1055 /* ira-lives.cc */
1056
1057 extern void ira_rebuild_start_finish_chains (void);
1058 extern void ira_print_live_range_list (FILE *, live_range_t);
1059 extern void debug (live_range &ref);
1060 extern void debug (live_range *ptr);
1061 extern void ira_debug_live_range_list (live_range_t);
1062 extern void ira_debug_allocno_live_ranges (ira_allocno_t);
1063 extern void ira_debug_live_ranges (void);
1064 extern void ira_create_allocno_live_ranges (void);
1065 extern void ira_compress_allocno_live_ranges (void);
1066 extern void ira_finish_allocno_live_ranges (void);
1067 extern void ira_implicitly_set_insn_hard_regs (HARD_REG_SET *,
1068 alternative_mask);
1069
1070 /* ira-conflicts.cc */
1071 extern void ira_debug_conflicts (bool);
1072 extern void ira_build_conflicts (void);
1073
1074 /* ira-color.cc */
1075 extern ira_allocno_t ira_soft_conflict (ira_allocno_t, ira_allocno_t);
1076 extern void ira_debug_hard_regs_forest (void);
1077 extern int ira_loop_edge_freq (ira_loop_tree_node_t, int, bool);
1078 extern void ira_reassign_conflict_allocnos (int);
1079 extern void ira_initiate_assign (void);
1080 extern void ira_finish_assign (void);
1081 extern void ira_color (void);
1082
1083 /* ira-emit.cc */
1084 extern void ira_initiate_emit_data (void);
1085 extern void ira_finish_emit_data (void);
1086 extern void ira_emit (bool);
1087
1088
1089
1091 /* Return true if equivalence of pseudo REGNO is not a lvalue. */
1092 static inline bool
1093 ira_equiv_no_lvalue_p (int regno)
1094 {
1095 if (regno >= ira_reg_equiv_len)
1096 return false;
1097 return (ira_reg_equiv[regno].constant != NULL_RTX
1098 || ira_reg_equiv[regno].invariant != NULL_RTX
1099 || (ira_reg_equiv[regno].memory != NULL_RTX
1100 && MEM_READONLY_P (ira_reg_equiv[regno].memory)));
1101 }
1102
1103
1104
1106 /* Initialize register costs for MODE if necessary. */
1107 static inline void
1108 ira_init_register_move_cost_if_necessary (machine_mode mode)
1109 {
1110 if (ira_register_move_cost[mode] == NULL)
1111 ira_init_register_move_cost (mode);
1112 }
1113
1114
1115
1117 /* The iterator for all allocnos. */
1118 struct ira_allocno_iterator {
1119 /* The number of the current element in IRA_ALLOCNOS. */
1120 int n;
1121 };
1122
1123 /* Initialize the iterator I. */
1124 static inline void
1125 ira_allocno_iter_init (ira_allocno_iterator *i)
1126 {
1127 i->n = 0;
1128 }
1129
1130 /* Return TRUE if we have more allocnos to visit, in which case *A is
1131 set to the allocno to be visited. Otherwise, return FALSE. */
1132 static inline bool
1133 ira_allocno_iter_cond (ira_allocno_iterator *i, ira_allocno_t *a)
1134 {
1135 int n;
1136
1137 for (n = i->n; n < ira_allocnos_num; n++)
1138 if (ira_allocnos[n] != NULL)
1139 {
1140 *a = ira_allocnos[n];
1141 i->n = n + 1;
1142 return true;
1143 }
1144 return false;
1145 }
1146
1147 /* Loop over all allocnos. In each iteration, A is set to the next
1148 allocno. ITER is an instance of ira_allocno_iterator used to iterate
1149 the allocnos. */
1150 #define FOR_EACH_ALLOCNO(A, ITER) \
1151 for (ira_allocno_iter_init (&(ITER)); \
1152 ira_allocno_iter_cond (&(ITER), &(A));)
1153
1154 /* The iterator for all objects. */
1156 struct ira_object_iterator {
1157 /* The number of the current element in ira_object_id_map. */
1158 int n;
1159 };
1160
1161 /* Initialize the iterator I. */
1162 static inline void
1163 ira_object_iter_init (ira_object_iterator *i)
1164 {
1165 i->n = 0;
1166 }
1167
1168 /* Return TRUE if we have more objects to visit, in which case *OBJ is
1169 set to the object to be visited. Otherwise, return FALSE. */
1170 static inline bool
1171 ira_object_iter_cond (ira_object_iterator *i, ira_object_t *obj)
1172 {
1173 int n;
1174
1175 for (n = i->n; n < ira_objects_num; n++)
1176 if (ira_object_id_map[n] != NULL)
1177 {
1178 *obj = ira_object_id_map[n];
1179 i->n = n + 1;
1180 return true;
1181 }
1182 return false;
1183 }
1184
1185 /* Loop over all objects. In each iteration, OBJ is set to the next
1186 object. ITER is an instance of ira_object_iterator used to iterate
1187 the objects. */
1188 #define FOR_EACH_OBJECT(OBJ, ITER) \
1189 for (ira_object_iter_init (&(ITER)); \
1190 ira_object_iter_cond (&(ITER), &(OBJ));)
1191
1192 /* The iterator for objects associated with an allocno. */
1194 struct ira_allocno_object_iterator {
1195 /* The number of the element the allocno's object array. */
1196 int n;
1197 };
1198
1199 /* Initialize the iterator I. */
1200 static inline void
1201 ira_allocno_object_iter_init (ira_allocno_object_iterator *i)
1202 {
1203 i->n = 0;
1204 }
1205
1206 /* Return TRUE if we have more objects to visit in allocno A, in which
1207 case *O is set to the object to be visited. Otherwise, return
1208 FALSE. */
1209 static inline bool
1210 ira_allocno_object_iter_cond (ira_allocno_object_iterator *i, ira_allocno_t a,
1211 ira_object_t *o)
1212 {
1213 int n = i->n++;
1214 if (n < ALLOCNO_NUM_OBJECTS (a))
1215 {
1216 *o = ALLOCNO_OBJECT (a, n);
1217 return true;
1218 }
1219 return false;
1220 }
1221
1222 /* Loop over all objects associated with allocno A. In each
1223 iteration, O is set to the next object. ITER is an instance of
1224 ira_allocno_object_iterator used to iterate the conflicts. */
1225 #define FOR_EACH_ALLOCNO_OBJECT(A, O, ITER) \
1226 for (ira_allocno_object_iter_init (&(ITER)); \
1227 ira_allocno_object_iter_cond (&(ITER), (A), &(O));)
1228
1229
1231 /* The iterator for prefs. */
1232 struct ira_pref_iterator {
1233 /* The number of the current element in IRA_PREFS. */
1234 int n;
1235 };
1236
1237 /* Initialize the iterator I. */
1238 static inline void
1239 ira_pref_iter_init (ira_pref_iterator *i)
1240 {
1241 i->n = 0;
1242 }
1243
1244 /* Return TRUE if we have more prefs to visit, in which case *PREF is
1245 set to the pref to be visited. Otherwise, return FALSE. */
1246 static inline bool
1247 ira_pref_iter_cond (ira_pref_iterator *i, ira_pref_t *pref)
1248 {
1249 int n;
1250
1251 for (n = i->n; n < ira_prefs_num; n++)
1252 if (ira_prefs[n] != NULL)
1253 {
1254 *pref = ira_prefs[n];
1255 i->n = n + 1;
1256 return true;
1257 }
1258 return false;
1259 }
1260
1261 /* Loop over all prefs. In each iteration, P is set to the next
1262 pref. ITER is an instance of ira_pref_iterator used to iterate
1263 the prefs. */
1264 #define FOR_EACH_PREF(P, ITER) \
1265 for (ira_pref_iter_init (&(ITER)); \
1266 ira_pref_iter_cond (&(ITER), &(P));)
1267
1268
1270 /* The iterator for copies. */
1271 struct ira_copy_iterator {
1272 /* The number of the current element in IRA_COPIES. */
1273 int n;
1274 };
1275
1276 /* Initialize the iterator I. */
1277 static inline void
1278 ira_copy_iter_init (ira_copy_iterator *i)
1279 {
1280 i->n = 0;
1281 }
1282
1283 /* Return TRUE if we have more copies to visit, in which case *CP is
1284 set to the copy to be visited. Otherwise, return FALSE. */
1285 static inline bool
1286 ira_copy_iter_cond (ira_copy_iterator *i, ira_copy_t *cp)
1287 {
1288 int n;
1289
1290 for (n = i->n; n < ira_copies_num; n++)
1291 if (ira_copies[n] != NULL)
1292 {
1293 *cp = ira_copies[n];
1294 i->n = n + 1;
1295 return true;
1296 }
1297 return false;
1298 }
1299
1300 /* Loop over all copies. In each iteration, C is set to the next
1301 copy. ITER is an instance of ira_copy_iterator used to iterate
1302 the copies. */
1303 #define FOR_EACH_COPY(C, ITER) \
1304 for (ira_copy_iter_init (&(ITER)); \
1305 ira_copy_iter_cond (&(ITER), &(C));)
1306
1307 /* The iterator for object conflicts. */
1309 struct ira_object_conflict_iterator {
1310
1311 /* TRUE if the conflicts are represented by vector of allocnos. */
1312 bool conflict_vec_p;
1313
1314 /* The conflict vector or conflict bit vector. */
1315 void *vec;
1316
1317 /* The number of the current element in the vector (of type
1318 ira_object_t or IRA_INT_TYPE). */
1319 unsigned int word_num;
1320
1321 /* The bit vector size. It is defined only if
1322 OBJECT_CONFLICT_VEC_P is FALSE. */
1323 unsigned int size;
1324
1325 /* The current bit index of bit vector. It is defined only if
1326 OBJECT_CONFLICT_VEC_P is FALSE. */
1327 unsigned int bit_num;
1328
1329 /* The object id corresponding to the 1st bit of the bit vector. It
1330 is defined only if OBJECT_CONFLICT_VEC_P is FALSE. */
1331 int base_conflict_id;
1332
1333 /* The word of bit vector currently visited. It is defined only if
1334 OBJECT_CONFLICT_VEC_P is FALSE. */
1335 unsigned IRA_INT_TYPE word;
1336 };
1337
1338 /* Initialize the iterator I with ALLOCNO conflicts. */
1339 static inline void
1340 ira_object_conflict_iter_init (ira_object_conflict_iterator *i,
1341 ira_object_t obj)
1342 {
1343 i->conflict_vec_p = OBJECT_CONFLICT_VEC_P (obj);
1344 i->vec = OBJECT_CONFLICT_ARRAY (obj);
1345 i->word_num = 0;
1346 if (i->conflict_vec_p)
1347 i->size = i->bit_num = i->base_conflict_id = i->word = 0;
1348 else
1349 {
1350 if (OBJECT_MIN (obj) > OBJECT_MAX (obj))
1351 i->size = 0;
1352 else
1353 i->size = ((OBJECT_MAX (obj) - OBJECT_MIN (obj)
1354 + IRA_INT_BITS)
1355 / IRA_INT_BITS) * sizeof (IRA_INT_TYPE);
1356 i->bit_num = 0;
1357 i->base_conflict_id = OBJECT_MIN (obj);
1358 i->word = (i->size == 0 ? 0 : ((IRA_INT_TYPE *) i->vec)[0]);
1359 }
1360 }
1361
1362 /* Return TRUE if we have more conflicting allocnos to visit, in which
1363 case *A is set to the allocno to be visited. Otherwise, return
1364 FALSE. */
1365 static inline bool
1366 ira_object_conflict_iter_cond (ira_object_conflict_iterator *i,
1367 ira_object_t *pobj)
1368 {
1369 ira_object_t obj;
1370
1371 if (i->conflict_vec_p)
1372 {
1373 obj = ((ira_object_t *) i->vec)[i->word_num++];
1374 if (obj == NULL)
1375 return false;
1376 }
1377 else
1378 {
1379 unsigned IRA_INT_TYPE word = i->word;
1380 unsigned int bit_num = i->bit_num;
1381
1382 /* Skip words that are zeros. */
1383 for (; word == 0; word = ((IRA_INT_TYPE *) i->vec)[i->word_num])
1384 {
1385 i->word_num++;
1386
1387 /* If we have reached the end, break. */
1388 if (i->word_num * sizeof (IRA_INT_TYPE) >= i->size)
1389 return false;
1390
1391 bit_num = i->word_num * IRA_INT_BITS;
1392 }
1393
1394 /* Skip bits that are zero. */
1395 int off = ctz_hwi (word);
1396 bit_num += off;
1397 word >>= off;
1398
1399 obj = ira_object_id_map[bit_num + i->base_conflict_id];
1400 i->bit_num = bit_num + 1;
1401 i->word = word >> 1;
1402 }
1403
1404 *pobj = obj;
1405 return true;
1406 }
1407
1408 /* Loop over all objects conflicting with OBJ. In each iteration,
1409 CONF is set to the next conflicting object. ITER is an instance
1410 of ira_object_conflict_iterator used to iterate the conflicts. */
1411 #define FOR_EACH_OBJECT_CONFLICT(OBJ, CONF, ITER) \
1412 for (ira_object_conflict_iter_init (&(ITER), (OBJ)); \
1413 ira_object_conflict_iter_cond (&(ITER), &(CONF));)
1414
1415
1416
1418 /* The function returns TRUE if at least one hard register from ones
1419 starting with HARD_REGNO and containing value of MODE are in set
1420 HARD_REGSET. */
1421 static inline bool
1422 ira_hard_reg_set_intersection_p (int hard_regno, machine_mode mode,
1423 HARD_REG_SET hard_regset)
1424 {
1425 int i;
1426
1427 gcc_assert (hard_regno >= 0);
1428 for (i = hard_regno_nregs (hard_regno, mode) - 1; i >= 0; i--)
1429 if (TEST_HARD_REG_BIT (hard_regset, hard_regno + i))
1430 return true;
1431 return false;
1432 }
1433
1434 /* Return number of hard registers in hard register SET. */
1435 static inline int
1436 hard_reg_set_size (HARD_REG_SET set)
1437 {
1438 int i, size;
1439
1440 for (size = i = 0; i < FIRST_PSEUDO_REGISTER; i++)
1441 if (TEST_HARD_REG_BIT (set, i))
1442 size++;
1443 return size;
1444 }
1445
1446 /* The function returns TRUE if hard registers starting with
1447 HARD_REGNO and containing value of MODE are fully in set
1448 HARD_REGSET. */
1449 static inline bool
1450 ira_hard_reg_in_set_p (int hard_regno, machine_mode mode,
1451 HARD_REG_SET hard_regset)
1452 {
1453 int i;
1454
1455 ira_assert (hard_regno >= 0);
1456 for (i = hard_regno_nregs (hard_regno, mode) - 1; i >= 0; i--)
1457 if (!TEST_HARD_REG_BIT (hard_regset, hard_regno + i))
1458 return false;
1459 return true;
1460 }
1461
1462
1463
1465 /* To save memory we use a lazy approach for allocation and
1466 initialization of the cost vectors. We do this only when it is
1467 really necessary. */
1468
1469 /* Allocate cost vector *VEC for hard registers of ACLASS and
1470 initialize the elements by VAL if it is necessary */
1471 static inline void
1472 ira_allocate_and_set_costs (int **vec, reg_class_t aclass, int val)
1473 {
1474 int i, *reg_costs;
1475 int len;
1476
1477 if (*vec != NULL)
1478 return;
1479 *vec = reg_costs = ira_allocate_cost_vector (aclass);
1480 len = ira_class_hard_regs_num[(int) aclass];
1481 for (i = 0; i < len; i++)
1482 reg_costs[i] = val;
1483 }
1484
1485 /* Allocate cost vector *VEC for hard registers of ACLASS and copy
1486 values of vector SRC into the vector if it is necessary */
1487 static inline void
1488 ira_allocate_and_copy_costs (int **vec, enum reg_class aclass, int *src)
1489 {
1490 int len;
1491
1492 if (*vec != NULL || src == NULL)
1493 return;
1494 *vec = ira_allocate_cost_vector (aclass);
1495 len = ira_class_hard_regs_num[aclass];
1496 memcpy (*vec, src, sizeof (int) * len);
1497 }
1498
1499 /* Allocate cost vector *VEC for hard registers of ACLASS and add
1500 values of vector SRC into the vector if it is necessary */
1501 static inline void
1502 ira_allocate_and_accumulate_costs (int **vec, enum reg_class aclass, int *src)
1503 {
1504 int i, len;
1505
1506 if (src == NULL)
1507 return;
1508 len = ira_class_hard_regs_num[aclass];
1509 if (*vec == NULL)
1510 {
1511 *vec = ira_allocate_cost_vector (aclass);
1512 memset (*vec, 0, sizeof (int) * len);
1513 }
1514 for (i = 0; i < len; i++)
1515 (*vec)[i] += src[i];
1516 }
1517
1518 /* Allocate cost vector *VEC for hard registers of ACLASS and copy
1519 values of vector SRC into the vector or initialize it by VAL (if
1520 SRC is null). */
1521 static inline void
1522 ira_allocate_and_set_or_copy_costs (int **vec, enum reg_class aclass,
1523 int val, int *src)
1524 {
1525 int i, *reg_costs;
1526 int len;
1527
1528 if (*vec != NULL)
1529 return;
1530 *vec = reg_costs = ira_allocate_cost_vector (aclass);
1531 len = ira_class_hard_regs_num[aclass];
1532 if (src != NULL)
1533 memcpy (reg_costs, src, sizeof (int) * len);
1534 else
1535 {
1536 for (i = 0; i < len; i++)
1537 reg_costs[i] = val;
1538 }
1539 }
1540
1541 extern rtx ira_create_new_reg (rtx);
1542 extern int first_moveable_pseudo, last_moveable_pseudo;
1543
1544 /* Return the set of registers that would need a caller save if allocno A
1545 overlapped them. */
1546
1547 inline HARD_REG_SET
1548 ira_need_caller_save_regs (ira_allocno_t a)
1549 {
1550 return call_clobbers_in_region (ALLOCNO_CROSSED_CALLS_ABIS (a),
1551 ALLOCNO_CROSSED_CALLS_CLOBBERED_REGS (a),
1552 ALLOCNO_MODE (a));
1553 }
1554
1555 /* Return true if we would need to save allocno A around a call if we
1556 assigned hard register REGNO. */
1557
1558 inline bool
1559 ira_need_caller_save_p (ira_allocno_t a, unsigned int regno)
1560 {
1561 if (ALLOCNO_CALLS_CROSSED_NUM (a) == 0)
1562 return false;
1563 return call_clobbered_in_region_p (ALLOCNO_CROSSED_CALLS_ABIS (a),
1564 ALLOCNO_CROSSED_CALLS_CLOBBERED_REGS (a),
1565 ALLOCNO_MODE (a), regno);
1566 }
1567
1568 /* Represents the boundary between an allocno in one loop and its parent
1569 allocno in the enclosing loop. It is usually possible to change a
1570 register's allocation on this boundary; the class provides routines
1571 for calculating the cost of such changes. */
1572 class ira_loop_border_costs
1573 {
1574 public:
1575 ira_loop_border_costs (ira_allocno_t);
1576
1577 int move_between_loops_cost () const;
1578 int spill_outside_loop_cost () const;
1579 int spill_inside_loop_cost () const;
1580
1581 private:
1582 /* The mode and class of the child allocno. */
1583 machine_mode m_mode;
1584 reg_class m_class;
1585
1586 /* Sums the frequencies of the entry edges and the exit edges. */
1587 int m_entry_freq, m_exit_freq;
1588 };
1589
1590 /* Return the cost of storing the register on entry to the loop and
1591 loading it back on exit from the loop. This is the cost to use if
1592 the register is spilled within the loop but is successfully allocated
1593 in the parent loop. */
1594 inline int
1595 ira_loop_border_costs::spill_inside_loop_cost () const
1596 {
1597 return (m_entry_freq * ira_memory_move_cost[m_mode][m_class][0]
1598 + m_exit_freq * ira_memory_move_cost[m_mode][m_class][1]);
1599 }
1600
1601 /* Return the cost of loading the register on entry to the loop and
1602 storing it back on exit from the loop. This is the cost to use if
1603 the register is successfully allocated within the loop but is spilled
1604 in the parent loop. */
1605 inline int
1606 ira_loop_border_costs::spill_outside_loop_cost () const
1607 {
1608 return (m_entry_freq * ira_memory_move_cost[m_mode][m_class][1]
1609 + m_exit_freq * ira_memory_move_cost[m_mode][m_class][0]);
1610 }
1611
1612 /* Return the cost of moving the pseudo register between different hard
1613 registers on entry and exit from the loop. This is the cost to use
1614 if the register is successfully allocated within both this loop and
1615 the parent loop, but the allocations for the loops differ. */
1616 inline int
1617 ira_loop_border_costs::move_between_loops_cost () const
1618 {
1619 ira_init_register_move_cost_if_necessary (m_mode);
1620 auto move_cost = ira_register_move_cost[m_mode][m_class][m_class];
1621 return move_cost * (m_entry_freq + m_exit_freq);
1622 }
1623
1624 /* Return true if subloops that contain allocnos for A's register can
1625 use a different assignment from A. ALLOCATED_P is true for the case
1626 in which allocation succeeded for A. EXCLUDE_OLD_RELOAD is true if
1627 we should always return false for non-LRA targets. (This is a hack
1628 and should be removed along with old reload.) */
1629 inline bool
1630 ira_subloop_allocnos_can_differ_p (ira_allocno_t a, bool allocated_p = true,
1631 bool exclude_old_reload = true)
1632 {
1633 if (exclude_old_reload && !ira_use_lra_p)
1634 return false;
1635
1636 auto regno = ALLOCNO_REGNO (a);
1637
1638 if (pic_offset_table_rtx != NULL
1639 && regno == (int) REGNO (pic_offset_table_rtx))
1640 return false;
1641
1642 ira_assert (regno < ira_reg_equiv_len);
1643 if (ira_equiv_no_lvalue_p (regno))
1644 return false;
1645
1646 /* Avoid overlapping multi-registers. Moves between them might result
1647 in wrong code generation. */
1648 if (allocated_p)
1649 {
1650 auto pclass = ira_pressure_class_translate[ALLOCNO_CLASS (a)];
1651 if (ira_reg_class_max_nregs[pclass][ALLOCNO_MODE (a)] > 1)
1652 return false;
1653 }
1654
1655 return true;
1656 }
1657
1658 /* Return true if we should treat A and SUBLOOP_A as belonging to a
1659 single region. */
1660 inline bool
1661 ira_single_region_allocno_p (ira_allocno_t a, ira_allocno_t subloop_a)
1662 {
1663 if (flag_ira_region != IRA_REGION_MIXED)
1664 return false;
1665
1666 if (ALLOCNO_MIGHT_CONFLICT_WITH_PARENT_P (subloop_a))
1667 return false;
1668
1669 auto rclass = ALLOCNO_CLASS (a);
1670 auto pclass = ira_pressure_class_translate[rclass];
1671 auto loop_used_regs = ALLOCNO_LOOP_TREE_NODE (a)->reg_pressure[pclass];
1672 return loop_used_regs <= ira_class_hard_regs_num[pclass];
1673 }
1674
1675 /* Return the set of all hard registers that conflict with A. */
1676 inline HARD_REG_SET
1677 ira_total_conflict_hard_regs (ira_allocno_t a)
1678 {
1679 auto obj_0 = ALLOCNO_OBJECT (a, 0);
1680 HARD_REG_SET conflicts = OBJECT_TOTAL_CONFLICT_HARD_REGS (obj_0);
1681 for (int i = 1; i < ALLOCNO_NUM_OBJECTS (a); i++)
1682 conflicts |= OBJECT_TOTAL_CONFLICT_HARD_REGS (ALLOCNO_OBJECT (a, i));
1683 return conflicts;
1684 }
1685
1686 /* Return the cost of saving a caller-saved register before each call
1687 in A's live range and restoring the same register after each call. */
1688 inline int
1689 ira_caller_save_cost (ira_allocno_t a)
1690 {
1691 auto mode = ALLOCNO_MODE (a);
1692 auto rclass = ALLOCNO_CLASS (a);
1693 return (ALLOCNO_CALL_FREQ (a)
1694 * (ira_memory_move_cost[mode][rclass][0]
1695 + ira_memory_move_cost[mode][rclass][1]));
1696 }
1697
1698 /* A and SUBLOOP_A are allocnos for the same pseudo register, with A's
1699 loop immediately enclosing SUBLOOP_A's loop. If we allocate to A a
1700 hard register R that is clobbered by a call in SUBLOOP_A, decide
1701 which of the following approaches should be used for handling the
1702 conflict:
1703
1704 (1) Spill R on entry to SUBLOOP_A's loop, assign memory to SUBLOOP_A,
1705 and restore R on exit from SUBLOOP_A's loop.
1706
1707 (2) Spill R before each necessary call in SUBLOOP_A's live range and
1708 restore R after each such call.
1709
1710 Return true if (1) is better than (2). SPILL_COST is the cost of
1711 doing (1). */
1712 inline bool
1713 ira_caller_save_loop_spill_p (ira_allocno_t a, ira_allocno_t subloop_a,
1714 int spill_cost)
1715 {
1716 if (!ira_subloop_allocnos_can_differ_p (a))
1717 return false;
1718
1719 /* Calculate the cost of saving a call-clobbered register
1720 before each call and restoring it afterwards. */
1721 int call_cost = ira_caller_save_cost (subloop_a);
1722 return call_cost && call_cost >= spill_cost;
1723 }
1724
1725 #endif /* GCC_IRA_INT_H */
1726