ree.c 40.1 KB
Newer Older
1
/* Redundant Extension Elimination pass for the GNU compiler.
Jakub Jelinek committed
2
   Copyright (C) 2010-2015 Free Software Foundation, Inc.
3
   Contributed by Ilya Enkovich (ilya.enkovich@intel.com)
4

5 6
   Based on the Redundant Zero-extension elimination pass contributed by
   Sriraman Tallam (tmsriram@google.com) and Silvius Rus (rus@google.com).
7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24 25 26

This file is part of GCC.

GCC is free software; you can redistribute it and/or modify it under
the terms of the GNU General Public License as published by the Free
Software Foundation; either version 3, or (at your option) any later
version.

GCC is distributed in the hope that it will be useful, but WITHOUT ANY
WARRANTY; without even the implied warranty of MERCHANTABILITY or
FITNESS FOR A PARTICULAR PURPOSE.  See the GNU General Public License
for more details.

You should have received a copy of the GNU General Public License
along with GCC; see the file COPYING3.  If not see
<http://www.gnu.org/licenses/>.  */


/* Problem Description :
   --------------------
27 28 29 30 31 32 33 34
   This pass is intended to remove redundant extension instructions.
   Such instructions appear for different reasons.  We expect some of
   them due to implicit zero-extension in 64-bit registers after writing
   to their lower 32-bit half (e.g. for the x86-64 architecture).
   Another possible reason is a type cast which follows a load (for
   instance a register restore) and which can be combined into a single
   instruction, and for which earlier local passes, e.g. the combiner,
   weren't able to optimize.
35 36 37 38 39

   How does this pass work  ?
   --------------------------

   This pass is run after register allocation.  Hence, all registers that
40 41 42 43 44
   this pass deals with are hard registers.  This pass first looks for an
   extension instruction that could possibly be redundant.  Such extension
   instructions show up in RTL with the pattern  :
   (set (reg:<SWI248> x) (any_extend:<SWI248> (reg:<SWI124> x))),
   where x can be any hard register.
45
   Now, this pass tries to eliminate this instruction by merging the
46
   extension with the definitions of register x.  For instance, if
47 48
   one of the definitions of register x was  :
   (set (reg:SI x) (plus:SI (reg:SI z1) (reg:SI z2))),
49 50
   followed by extension  :
   (set (reg:DI x) (zero_extend:DI (reg:SI x)))
51 52 53
   then the combination converts this into :
   (set (reg:DI x) (zero_extend:DI (plus:SI (reg:SI z1) (reg:SI z2)))).
   If all the merged definitions are recognizable assembly instructions,
54 55 56 57 58 59 60
   the extension is effectively eliminated.

   For example, for the x86-64 architecture, implicit zero-extensions
   are captured with appropriate patterns in the i386.md file.  Hence,
   these merged definition can be matched to a single assembly instruction.
   The original extension instruction is then deleted if all the
   definitions can be merged.
61 62

   However, there are cases where the definition instruction cannot be
63 64
   merged with an extension.  Examples are CALL instructions.  In such
   cases, the original extension is not redundant and this pass does
65 66 67 68 69
   not delete it.

   Handling conditional moves :
   ----------------------------

70 71
   Architectures like x86-64 support conditional moves whose semantics for
   extension differ from the other instructions.  For instance, the
72 73
   instruction *cmov ebx, eax*
   zero-extends eax onto rax only when the move from ebx to eax happens.
74
   Otherwise, eax may not be zero-extended.  Consider conditional moves as
75 76
   RTL instructions of the form
   (set (reg:SI x) (if_then_else (cond) (reg:SI y) (reg:SI z))).
77
   This pass tries to merge an extension with a conditional move by
78
   actually merging the definitions of y and z with an extension and then
79 80
   converting the conditional move into :
   (set (reg:DI x) (if_then_else (cond) (reg:DI y) (reg:DI z))).
81 82 83
   Since registers y and z are extended, register x will also be extended
   after the conditional move.  Note that this step has to be done
   transitively since the definition of a conditional copy can be
84 85 86 87 88 89 90 91 92 93 94 95 96 97 98 99 100 101 102 103
   another conditional copy.

   Motivating Example I :
   ---------------------
   For this program :
   **********************************************
   bad_code.c

   int mask[1000];

   int foo(unsigned x)
   {
     if (x < 10)
       x = x * 45;
     else
       x = x * 78;
     return mask[x];
   }
   **********************************************

104
   $ gcc -O2 bad_code.c
105 106 107
     ........
     400315:       b8 4e 00 00 00          mov    $0x4e,%eax
     40031a:       0f af f8                imul   %eax,%edi
108
     40031d:       89 ff                   mov    %edi,%edi - useless extension
109 110 111 112 113
     40031f:       8b 04 bd 60 19 40 00    mov    0x401960(,%rdi,4),%eax
     400326:       c3                      retq
     ......
     400330:       ba 2d 00 00 00          mov    $0x2d,%edx
     400335:       0f af fa                imul   %edx,%edi
114
     400338:       89 ff                   mov    %edi,%edi - useless extension
115 116 117
     40033a:       8b 04 bd 60 19 40 00    mov    0x401960(,%rdi,4),%eax
     400341:       c3                      retq

118
   $ gcc -O2 -free bad_code.c
119 120 121 122 123 124 125 126 127 128 129 130 131 132 133 134 135 136 137 138 139 140 141 142 143 144
     ......
     400315:       6b ff 4e                imul   $0x4e,%edi,%edi
     400318:       8b 04 bd 40 19 40 00    mov    0x401940(,%rdi,4),%eax
     40031f:       c3                      retq
     400320:       6b ff 2d                imul   $0x2d,%edi,%edi
     400323:       8b 04 bd 40 19 40 00    mov    0x401940(,%rdi,4),%eax
     40032a:       c3                      retq

   Motivating Example II :
   ---------------------

   Here is an example with a conditional move.

   For this program :
   **********************************************

   unsigned long long foo(unsigned x , unsigned y)
   {
     unsigned z;
     if (x > 100)
       z = x + y;
     else
       z = x - y;
     return (unsigned long long)(z);
   }

145
   $ gcc -O2 bad_code.c
146 147 148 149 150 151
     ............
     400360:       8d 14 3e                lea    (%rsi,%rdi,1),%edx
     400363:       89 f8                   mov    %edi,%eax
     400365:       29 f0                   sub    %esi,%eax
     400367:       83 ff 65                cmp    $0x65,%edi
     40036a:       0f 43 c2                cmovae %edx,%eax
152
     40036d:       89 c0                   mov    %eax,%eax - useless extension
153 154
     40036f:       c3                      retq

155
   $ gcc -O2 -free bad_code.c
156 157 158 159 160 161 162 163 164
     .............
     400360:       89 fa                   mov    %edi,%edx
     400362:       8d 04 3e                lea    (%rsi,%rdi,1),%eax
     400365:       29 f2                   sub    %esi,%edx
     400367:       83 ff 65                cmp    $0x65,%edi
     40036a:       89 d6                   mov    %edx,%esi
     40036c:       48 0f 42 c6             cmovb  %rsi,%rax
     400370:       c3                      retq

165 166 167 168 169 170 171 172 173 174 175 176 177 178 179 180 181 182 183 184 185 186 187 188 189 190
  Motivating Example III :
  ---------------------

  Here is an example with a type cast.

  For this program :
  **********************************************

  void test(int size, unsigned char *in, unsigned char *out)
  {
    int i;
    unsigned char xr, xg, xy=0;

    for (i = 0; i < size; i++) {
      xr = *in++;
      xg = *in++;
      xy = (unsigned char) ((19595*xr + 38470*xg) >> 16);
      *out++ = xy;
    }
  }

  $ gcc -O2 bad_code.c
    ............
    10:   0f b6 0e                movzbl (%rsi),%ecx
    13:   0f b6 46 01             movzbl 0x1(%rsi),%eax
    17:   48 83 c6 02             add    $0x2,%rsi
191 192
    1b:   0f b6 c9                movzbl %cl,%ecx - useless extension
    1e:   0f b6 c0                movzbl %al,%eax - useless extension
193 194 195 196 197 198 199 200 201 202
    21:   69 c9 8b 4c 00 00       imul   $0x4c8b,%ecx,%ecx
    27:   69 c0 46 96 00 00       imul   $0x9646,%eax,%eax

   $ gcc -O2 -free bad_code.c
     .............
    10:   0f b6 0e                movzbl (%rsi),%ecx
    13:   0f b6 46 01             movzbl 0x1(%rsi),%eax
    17:   48 83 c6 02             add    $0x2,%rsi
    1b:   69 c9 8b 4c 00 00       imul   $0x4c8b,%ecx,%ecx
    21:   69 c0 46 96 00 00       imul   $0x9646,%eax,%eax
203 204 205 206

   Usefulness :
   ----------

207 208 209
   The original redundant zero-extension elimination pass reported reduction
   of the dynamic instruction count of a compression benchmark by 2.8% and
   improvement of its run time by about 1%.
210

211 212 213 214 215
   The additional performance gain with the enhanced pass is mostly expected
   on in-order architectures where redundancy cannot be compensated by out of
   order execution.  Measurements showed up to 10% performance gain (reduced
   run time) on EEMBC 2.0 benchmarks on Atom processor with geomean performance
   gain 1%.  */
216 217 218 219 220 221 222


#include "config.h"
#include "system.h"
#include "coretypes.h"
#include "tm.h"
#include "rtl.h"
223 224
#include "alias.h"
#include "symtab.h"
225 226 227 228 229
#include "tree.h"
#include "tm_p.h"
#include "flags.h"
#include "regs.h"
#include "hard-reg-set.h"
230
#include "predict.h"
231
#include "function.h"
232 233 234 235 236
#include "dominance.h"
#include "cfg.h"
#include "cfgrtl.h"
#include "basic-block.h"
#include "insn-config.h"
237 238 239 240 241 242 243
#include "expmed.h"
#include "dojump.h"
#include "explow.h"
#include "calls.h"
#include "emit-rtl.h"
#include "varasm.h"
#include "stmt.h"
244 245 246
#include "expr.h"
#include "insn-attr.h"
#include "recog.h"
247
#include "diagnostic-core.h"
248 249
#include "target.h"
#include "insn-codes.h"
250
#include "optabs.h"
251 252 253 254 255 256
#include "rtlhooks-def.h"
#include "params.h"
#include "tree-pass.h"
#include "df.h"
#include "cgraph.h"

257
/* This structure represents a candidate for elimination.  */
258

259
typedef struct ext_cand
260
{
261 262
  /* The expression.  */
  const_rtx expr;
263

264 265
  /* The kind of extension.  */
  enum rtx_code code;
266

267
  /* The destination mode.  */
268
  machine_mode mode;
269 270

  /* The instruction where it lives.  */
David Malcolm committed
271
  rtx_insn *insn;
272
} ext_cand;
273 274


275 276
static int max_insn_uid;

277 278 279 280 281 282 283 284 285 286 287 288 289 290 291 292 293 294 295 296 297 298 299 300 301 302 303 304 305 306 307 308 309 310 311 312 313 314 315 316 317 318 319 320
/* Update or remove REG_EQUAL or REG_EQUIV notes for INSN.  */

static bool
update_reg_equal_equiv_notes (rtx_insn *insn, machine_mode new_mode,
			      machine_mode old_mode, enum rtx_code code)
{
  rtx *loc = &REG_NOTES (insn);
  while (*loc)
    {
      enum reg_note kind = REG_NOTE_KIND (*loc);
      if (kind == REG_EQUAL || kind == REG_EQUIV)
	{
	  rtx orig_src = XEXP (*loc, 0);
	  /* Update equivalency constants.  Recall that RTL constants are
	     sign-extended.  */
	  if (GET_CODE (orig_src) == CONST_INT
	      && HOST_BITS_PER_WIDE_INT >= GET_MODE_BITSIZE (new_mode))
	    {
	      if (INTVAL (orig_src) >= 0 || code == SIGN_EXTEND)
		/* Nothing needed.  */;
	      else
		{
		  /* Zero-extend the negative constant by masking out the
		     bits outside the source mode.  */
		  rtx new_const_int
		    = gen_int_mode (INTVAL (orig_src)
				    & GET_MODE_MASK (old_mode),
				    new_mode);
		  if (!validate_change (insn, &XEXP (*loc, 0),
					new_const_int, true))
		    return false;
		}
	      loc = &XEXP (*loc, 1);
	    }
	  /* Drop all other notes, they assume a wrong mode.  */
	  else if (!validate_change (insn, loc, XEXP (*loc, 1), true))
	    return false;
	}
      else
	loc = &XEXP (*loc, 1);
    }
  return true;
}

321 322 323 324 325 326
/* Given a insn (CURR_INSN), an extension candidate for removal (CAND)
   and a pointer to the SET rtx (ORIG_SET) that needs to be modified,
   this code modifies the SET rtx to a new SET rtx that extends the
   right hand expression into a register on the left hand side.  Note
   that multiple assumptions are made about the nature of the set that
   needs to be true for this to work and is called from merge_def_and_ext.
327 328

   Original :
329
   (set (reg a) (expression))
330 331

   Transform :
332
   (set (reg a) (any_extend (expression)))
333 334

   Special Cases :
335
   If the expression is a constant or another extension, then directly
336
   assign it to the register.  */
337 338

static bool
David Malcolm committed
339
combine_set_extension (ext_cand *cand, rtx_insn *curr_insn, rtx *orig_set)
340
{
341
  rtx orig_src = SET_SRC (*orig_set);
342
  machine_mode orig_mode = GET_MODE (SET_DEST (*orig_set));
343
  rtx new_set;
344 345 346 347 348 349 350 351 352 353 354 355 356
  rtx cand_pat = PATTERN (cand->insn);

  /* If the extension's source/destination registers are not the same
     then we need to change the original load to reference the destination
     of the extension.  Then we need to emit a copy from that destination
     to the original destination of the load.  */
  rtx new_reg;
  bool copy_needed
    = (REGNO (SET_DEST (cand_pat)) != REGNO (XEXP (SET_SRC (cand_pat), 0)));
  if (copy_needed)
    new_reg = gen_rtx_REG (cand->mode, REGNO (SET_DEST (cand_pat)));
  else
    new_reg = gen_rtx_REG (cand->mode, REGNO (SET_DEST (*orig_set)));
357

358 359
#if 0
  /* Rethinking test.  Temporarily disabled.  */
360 361 362
  /* We're going to be widening the result of DEF_INSN, ensure that doing so
     doesn't change the number of hard registers needed for the result.  */
  if (HARD_REGNO_NREGS (REGNO (new_reg), cand->mode)
363 364
      != HARD_REGNO_NREGS (REGNO (SET_DEST (*orig_set)),
			   GET_MODE (SET_DEST (*orig_set))))
365
	return false;
366
#endif
367

368 369
  /* Merge constants by directly moving the constant into the register under
     some conditions.  Recall that RTL constants are sign-extended.  */
370
  if (GET_CODE (orig_src) == CONST_INT
371
      && HOST_BITS_PER_WIDE_INT >= GET_MODE_BITSIZE (cand->mode))
372
    {
373
      if (INTVAL (orig_src) >= 0 || cand->code == SIGN_EXTEND)
374
	new_set = gen_rtx_SET (new_reg, orig_src);
375
      else
376 377 378
	{
	  /* Zero-extend the negative constant by masking out the bits outside
	     the source mode.  */
379
	  rtx new_const_int
380
	    = gen_int_mode (INTVAL (orig_src) & GET_MODE_MASK (orig_mode),
381
			    GET_MODE (new_reg));
382
	  new_set = gen_rtx_SET (new_reg, new_const_int);
383 384 385 386
	}
    }
  else if (GET_MODE (orig_src) == VOIDmode)
    {
387
      /* This is mostly due to a call insn that should not be optimized.  */
388
      return false;
389
    }
390
  else if (GET_CODE (orig_src) == cand->code)
391
    {
392 393 394 395
      /* Here is a sequence of two extensions.  Try to merge them.  */
      rtx temp_extension
	= gen_rtx_fmt_e (cand->code, cand->mode, XEXP (orig_src, 0));
      rtx simplified_temp_extension = simplify_rtx (temp_extension);
396 397
      if (simplified_temp_extension)
        temp_extension = simplified_temp_extension;
398
      new_set = gen_rtx_SET (new_reg, temp_extension);
399 400 401
    }
  else if (GET_CODE (orig_src) == IF_THEN_ELSE)
    {
402
      /* Only IF_THEN_ELSE of phi-type copies are combined.  Otherwise,
403 404 405 406 407
         in general, IF_THEN_ELSE should not be combined.  */
      return false;
    }
  else
    {
408 409 410 411
      /* This is the normal case.  */
      rtx temp_extension
	= gen_rtx_fmt_e (cand->code, cand->mode, orig_src);
      rtx simplified_temp_extension = simplify_rtx (temp_extension);
412 413
      if (simplified_temp_extension)
        temp_extension = simplified_temp_extension;
414
      new_set = gen_rtx_SET (new_reg, temp_extension);
415 416
    }

417
  /* This change is a part of a group of changes.  Hence,
418
     validate_change will not try to commit the change.  */
419 420 421
  if (validate_change (curr_insn, orig_set, new_set, true)
      && update_reg_equal_equiv_notes (curr_insn, cand->mode, orig_mode,
				       cand->code))
422 423 424
    {
      if (dump_file)
        {
425
          fprintf (dump_file,
426 427
		   "Tentatively merged extension with definition %s:\n",
		   (copy_needed) ? "(copy needed)" : "");
428 429 430 431
          print_rtl_single (dump_file, curr_insn);
        }
      return true;
    }
432

433 434 435 436
  return false;
}

/* Treat if_then_else insns, where the operands of both branches
437
   are registers, as copies.  For instance,
438 439 440 441 442 443 444
   Original :
   (set (reg:SI a) (if_then_else (cond) (reg:SI b) (reg:SI c)))
   Transformed :
   (set (reg:DI a) (if_then_else (cond) (reg:DI b) (reg:DI c)))
   DEF_INSN is the if_then_else insn.  */

static bool
David Malcolm committed
445
transform_ifelse (ext_cand *cand, rtx_insn *def_insn)
446 447 448 449 450 451 452 453 454
{
  rtx set_insn = PATTERN (def_insn);
  rtx srcreg, dstreg, srcreg2;
  rtx map_srcreg, map_dstreg, map_srcreg2;
  rtx ifexpr;
  rtx cond;
  rtx new_set;

  gcc_assert (GET_CODE (set_insn) == SET);
455

456 457 458 459
  cond = XEXP (SET_SRC (set_insn), 0);
  dstreg = SET_DEST (set_insn);
  srcreg = XEXP (SET_SRC (set_insn), 1);
  srcreg2 = XEXP (SET_SRC (set_insn), 2);
460 461 462 463 464
  /* If the conditional move already has the right or wider mode,
     there is nothing to do.  */
  if (GET_MODE_SIZE (GET_MODE (dstreg)) >= GET_MODE_SIZE (cand->mode))
    return true;

465 466 467 468
  map_srcreg = gen_rtx_REG (cand->mode, REGNO (srcreg));
  map_srcreg2 = gen_rtx_REG (cand->mode, REGNO (srcreg2));
  map_dstreg = gen_rtx_REG (cand->mode, REGNO (dstreg));
  ifexpr = gen_rtx_IF_THEN_ELSE (cand->mode, cond, map_srcreg, map_srcreg2);
469
  new_set = gen_rtx_SET (map_dstreg, ifexpr);
470

471 472 473
  if (validate_change (def_insn, &PATTERN (def_insn), new_set, true)
      && update_reg_equal_equiv_notes (def_insn, cand->mode, GET_MODE (dstreg),
				       cand->code))
474 475 476
    {
      if (dump_file)
        {
477 478
          fprintf (dump_file,
		   "Mode of conditional move instruction extended:\n");
479 480 481 482
          print_rtl_single (dump_file, def_insn);
        }
      return true;
    }
483 484

  return false;
485 486
}

487 488 489 490
/* Get all the reaching definitions of an instruction.  The definitions are
   desired for REG used in INSN.  Return the definition list or NULL if a
   definition is missing.  If DEST is non-NULL, additionally push the INSN
   of the definitions onto DEST.  */
491

492
static struct df_link *
David Malcolm committed
493
get_defs (rtx_insn *insn, rtx reg, vec<rtx_insn *> *dest)
494
{
495
  df_ref use;
496
  struct df_link *ref_chain, *ref_link;
497

498
  FOR_EACH_INSN_USE (use, insn)
499
    {
500
      if (GET_CODE (DF_REF_REG (use)) == SUBREG)
501
        return NULL;
502 503
      if (REGNO (DF_REF_REG (use)) == REGNO (reg))
	break;
504 505
    }

506
  gcc_assert (use != NULL);
507

508
  ref_chain = DF_REF_CHAIN (use);
509 510

  for (ref_link = ref_chain; ref_link; ref_link = ref_link->next)
511 512
    {
      /* Problem getting some definition for this instruction.  */
513 514 515 516
      if (ref_link->ref == NULL)
        return NULL;
      if (DF_REF_INSN_INFO (ref_link->ref) == NULL)
        return NULL;
517 518
    }

519 520
  if (dest)
    for (ref_link = ref_chain; ref_link; ref_link = ref_link->next)
521
      dest->safe_push (DF_REF_INSN (ref_link->ref));
522

523
  return ref_chain;
524 525
}

526 527 528
/* Return true if INSN is
     (SET (reg REGNO (def_reg)) (if_then_else (cond) (REG x1) (REG x2)))
   and store x1 and x2 in REG_1 and REG_2.  */
529

530
static bool
David Malcolm committed
531
is_cond_copy_insn (rtx_insn *insn, rtx *reg1, rtx *reg2)
532
{
533
  rtx expr = single_set (insn);
534

535 536
  if (expr != NULL_RTX
      && GET_CODE (expr) == SET
537 538 539
      && GET_CODE (SET_DEST (expr)) == REG
      && GET_CODE (SET_SRC (expr))  == IF_THEN_ELSE
      && GET_CODE (XEXP (SET_SRC (expr), 1)) == REG
540
      && GET_CODE (XEXP (SET_SRC (expr), 2)) == REG)
541
    {
542 543 544
      *reg1 = XEXP (SET_SRC (expr), 1);
      *reg2 = XEXP (SET_SRC (expr), 2);
      return true;
545 546
    }

547
  return false;
548 549
}

550 551 552 553 554 555 556 557 558 559
enum ext_modified_kind
{
  /* The insn hasn't been modified by ree pass yet.  */
  EXT_MODIFIED_NONE,
  /* Changed into zero extension.  */
  EXT_MODIFIED_ZEXT,
  /* Changed into sign extension.  */
  EXT_MODIFIED_SEXT
};

560
struct ATTRIBUTE_PACKED ext_modified
561 562 563 564 565 566 567
{
  /* Mode from which ree has zero or sign extended the destination.  */
  ENUM_BITFIELD(machine_mode) mode : 8;

  /* Kind of modification of the insn.  */
  ENUM_BITFIELD(ext_modified_kind) kind : 2;

568 569
  unsigned int do_not_reextend : 1;

570 571 572 573 574 575 576
  /* True if the insn is scheduled to be deleted.  */
  unsigned int deleted : 1;
};

/* Vectors used by combine_reaching_defs and its helpers.  */
typedef struct ext_state
{
577
  /* In order to avoid constant alloc/free, we keep these
578
     4 vectors live through the entire find_and_remove_re and just
579
     truncate them each time.  */
David Malcolm committed
580 581 582 583
  vec<rtx_insn *> defs_list;
  vec<rtx_insn *> copies_list;
  vec<rtx_insn *> modified_list;
  vec<rtx_insn *> work_list;
584 585 586 587 588 589 590

  /* For instructions that have been successfully modified, this is
     the original mode from which the insn is extending and
     kind of extension.  */
  struct ext_modified *modified;
} ext_state;

591 592
/* Reaching Definitions of the extended register could be conditional copies
   or regular definitions.  This function separates the two types into two
593 594 595 596 597 598 599 600 601 602 603
   lists, STATE->DEFS_LIST and STATE->COPIES_LIST.  This is necessary because,
   if a reaching definition is a conditional copy, merging the extension with
   this definition is wrong.  Conditional copies are merged by transitively
   merging their definitions.  The defs_list is populated with all the reaching
   definitions of the extension instruction (EXTEND_INSN) which must be merged
   with an extension.  The copies_list contains all the conditional moves that
   will later be extended into a wider mode conditional move if all the merges
   are successful.  The function returns false upon failure, true upon
   success.  */

static bool
David Malcolm committed
604
make_defs_and_copies_lists (rtx_insn *extend_insn, const_rtx set_pat,
605
			    ext_state *state)
606
{
607
  rtx src_reg = XEXP (SET_SRC (set_pat), 0);
608
  bool *is_insn_visited;
609 610
  bool ret = true;

611
  state->work_list.truncate (0);
612

613
  /* Initialize the work list.  */
614 615
  if (!get_defs (extend_insn, src_reg, &state->work_list))
    gcc_unreachable ();
616

617
  is_insn_visited = XCNEWVEC (bool, max_insn_uid);
618 619

  /* Perform transitive closure for conditional copies.  */
620
  while (!state->work_list.is_empty ())
621
    {
David Malcolm committed
622
      rtx_insn *def_insn = state->work_list.pop ();
623 624
      rtx reg1, reg2;

625 626 627
      gcc_assert (INSN_UID (def_insn) < max_insn_uid);

      if (is_insn_visited[INSN_UID (def_insn)])
628
	continue;
629 630
      is_insn_visited[INSN_UID (def_insn)] = true;

631 632 633
      if (is_cond_copy_insn (def_insn, &reg1, &reg2))
	{
	  /* Push it onto the copy list first.  */
634
	  state->copies_list.safe_push (def_insn);
635 636

	  /* Now perform the transitive closure.  */
637 638
	  if (!get_defs (def_insn, reg1, &state->work_list)
	      || !get_defs (def_insn, reg2, &state->work_list))
639
	    {
640
	      ret = false;
641 642
	      break;
	    }
643 644
        }
      else
645
	state->defs_list.safe_push (def_insn);
646 647 648
    }

  XDELETEVEC (is_insn_visited);
649 650

  return ret;
651 652
}

653 654 655 656 657
/* If DEF_INSN has single SET expression, possibly buried inside
   a PARALLEL, return the address of the SET expression, else
   return NULL.  This is similar to single_set, except that
   single_set allows multiple SETs when all but one is dead.  */
static rtx *
David Malcolm committed
658
get_sub_rtx (rtx_insn *def_insn)
659
{
660 661
  enum rtx_code code = GET_CODE (PATTERN (def_insn));
  rtx *sub_rtx = NULL;
662 663 664

  if (code == PARALLEL)
    {
665
      for (int i = 0; i < XVECLEN (PATTERN (def_insn), 0); i++)
666
        {
667
          rtx s_expr = XVECEXP (PATTERN (def_insn), 0, i);
668 669 670 671 672 673 674 675
          if (GET_CODE (s_expr) != SET)
            continue;

          if (sub_rtx == NULL)
            sub_rtx = &XVECEXP (PATTERN (def_insn), 0, i);
          else
            {
              /* PARALLEL with multiple SETs.  */
676
              return NULL;
677 678 679 680 681 682 683 684
            }
        }
    }
  else if (code == SET)
    sub_rtx = &PATTERN (def_insn);
  else
    {
      /* It is not a PARALLEL or a SET, what could it be ? */
685
      return NULL;
686 687 688
    }

  gcc_assert (sub_rtx != NULL);
689 690 691 692 693 694 695
  return sub_rtx;
}

/* Merge the DEF_INSN with an extension.  Calls combine_set_extension
   on the SET pattern.  */

static bool
David Malcolm committed
696
merge_def_and_ext (ext_cand *cand, rtx_insn *def_insn, ext_state *state)
697
{
698
  machine_mode ext_src_mode;
699 700 701 702 703 704 705
  rtx *sub_rtx;

  ext_src_mode = GET_MODE (XEXP (SET_SRC (cand->expr), 0));
  sub_rtx = get_sub_rtx (def_insn);

  if (sub_rtx == NULL)
    return false;
706

707 708 709 710 711 712 713
  if (REG_P (SET_DEST (*sub_rtx))
      && (GET_MODE (SET_DEST (*sub_rtx)) == ext_src_mode
	  || ((state->modified[INSN_UID (def_insn)].kind
	       == (cand->code == ZERO_EXTEND
		   ? EXT_MODIFIED_ZEXT : EXT_MODIFIED_SEXT))
	      && state->modified[INSN_UID (def_insn)].mode
		 == ext_src_mode)))
714
    {
715 716 717 718 719 720 721 722 723 724 725 726 727
      if (GET_MODE_SIZE (GET_MODE (SET_DEST (*sub_rtx)))
	  >= GET_MODE_SIZE (cand->mode))
	return true;
      /* If def_insn is already scheduled to be deleted, don't attempt
	 to modify it.  */
      if (state->modified[INSN_UID (def_insn)].deleted)
	return false;
      if (combine_set_extension (cand, def_insn, sub_rtx))
	{
	  if (state->modified[INSN_UID (def_insn)].kind == EXT_MODIFIED_NONE)
	    state->modified[INSN_UID (def_insn)].mode = ext_src_mode;
	  return true;
	}
728
    }
729 730

  return false;
731 732
}

733 734 735 736 737 738 739 740 741 742 743 744
/* Given SRC, which should be one or more extensions of a REG, strip
   away the extensions and return the REG.  */

static inline rtx
get_extended_src_reg (rtx src)
{
  while (GET_CODE (src) == SIGN_EXTEND || GET_CODE (src) == ZERO_EXTEND)
    src = XEXP (src, 0);
  gcc_assert (REG_P (src));
  return src;
}

745
/* This function goes through all reaching defs of the source
746 747 748 749 750 751 752
   of the candidate for elimination (CAND) and tries to combine
   the extension with the definition instruction.  The changes
   are made as a group so that even if one definition cannot be
   merged, all reaching definitions end up not being merged.
   When a conditional copy is encountered, merging is attempted
   transitively on its definitions.  It returns true upon success
   and false upon failure.  */
753 754

static bool
755
combine_reaching_defs (ext_cand *cand, const_rtx set_pat, ext_state *state)
756
{
David Malcolm committed
757
  rtx_insn *def_insn;
758 759 760
  bool merge_successful = true;
  int i;
  int defs_ix;
761
  bool outcome;
762

763 764
  state->defs_list.truncate (0);
  state->copies_list.truncate (0);
765

766
  outcome = make_defs_and_copies_lists (cand->insn, set_pat, state);
767

768 769
  if (!outcome)
    return false;
770

771 772
  /* If the destination operand of the extension is a different
     register than the source operand, then additional restrictions
773 774
     are needed.  Note we have to handle cases where we have nested
     extensions in the source operand.  */
775 776 777 778
  bool copy_needed
    = (REGNO (SET_DEST (PATTERN (cand->insn)))
       != REGNO (get_extended_src_reg (SET_SRC (PATTERN (cand->insn)))));
  if (copy_needed)
779
    {
780 781 782 783 784 785 786 787 788 789 790
      /* Considering transformation of
	 (set (reg1) (expression))
	 ...
	 (set (reg2) (any_extend (reg1)))

	 into

	 (set (reg2) (any_extend (expression)))
	 (set (reg1) (reg2))
	 ...  */

791 792 793 794 795
      /* In theory we could handle more than one reaching def, it
	 just makes the code to update the insn stream more complex.  */
      if (state->defs_list.length () != 1)
	return false;

796 797
      /* We require the candidate not already be modified.  It may,
	 for example have been changed from a (sign_extend (reg))
798
	 into (zero_extend (sign_extend (reg))).
799 800 801 802

	 Handling that case shouldn't be terribly difficult, but the code
	 here and the code to emit copies would need auditing.  Until
	 we see a need, this is the safe thing to do.  */
803 804 805
      if (state->modified[INSN_UID (cand->insn)].kind != EXT_MODIFIED_NONE)
	return false;

806
      machine_mode dst_mode = GET_MODE (SET_DEST (PATTERN (cand->insn)));
807 808 809 810 811 812 813
      rtx src_reg = get_extended_src_reg (SET_SRC (PATTERN (cand->insn)));

      /* Ensure the number of hard registers of the copy match.  */
      if (HARD_REGNO_NREGS (REGNO (src_reg), dst_mode)
	  != HARD_REGNO_NREGS (REGNO (src_reg), GET_MODE (src_reg)))
	return false;

814
      /* There's only one reaching def.  */
David Malcolm committed
815
      rtx_insn *def_insn = state->defs_list[0];
816 817 818 819 820 821 822

      /* The defining statement must not have been modified either.  */
      if (state->modified[INSN_UID (def_insn)].kind != EXT_MODIFIED_NONE)
	return false;

      /* The defining statement and candidate insn must be in the same block.
	 This is merely to keep the test for safety and updating the insn
823 824
	 stream simple.  Also ensure that within the block the candidate
	 follows the defining insn.  */
825 826
      basic_block bb = BLOCK_FOR_INSN (cand->insn);
      if (bb != BLOCK_FOR_INSN (def_insn)
827
	  || DF_INSN_LUID (def_insn) > DF_INSN_LUID (cand->insn))
828 829 830 831 832
	return false;

      /* If there is an overlap between the destination of DEF_INSN and
	 CAND->insn, then this transformation is not safe.  Note we have
	 to test in the widened mode.  */
833 834 835 836 837
      rtx *dest_sub_rtx = get_sub_rtx (def_insn);
      if (dest_sub_rtx == NULL
	  || !REG_P (SET_DEST (*dest_sub_rtx)))
	return false;

838
      rtx tmp_reg = gen_rtx_REG (GET_MODE (SET_DEST (PATTERN (cand->insn))),
839
				 REGNO (SET_DEST (*dest_sub_rtx)));
840 841 842 843 844 845 846 847 848 849
      if (reg_overlap_mentioned_p (tmp_reg, SET_DEST (PATTERN (cand->insn))))
	return false;

      /* The destination register of the extension insn must not be
	 used or set between the def_insn and cand->insn exclusive.  */
      if (reg_used_between_p (SET_DEST (PATTERN (cand->insn)),
			      def_insn, cand->insn)
	  || reg_set_between_p (SET_DEST (PATTERN (cand->insn)),
				def_insn, cand->insn))
	return false;
850 851 852 853 854 855

      /* We must be able to copy between the two registers.   Generate,
	 recognize and verify constraints of the copy.  Also fail if this
	 generated more than one insn.

         This generates garbage since we throw away the insn when we're
Jeff Law committed
856 857 858 859 860
	 done, only to recreate it later if this test was successful. 

	 Make sure to get the mode from the extension (cand->insn).  This
	 is different than in the code to emit the copy as we have not
	 modified the defining insn yet.  */
861 862
      start_sequence ();
      rtx pat = PATTERN (cand->insn);
Jeff Law committed
863
      rtx new_dst = gen_rtx_REG (GET_MODE (SET_DEST (pat)),
864
                                 REGNO (get_extended_src_reg (SET_SRC (pat))));
Jeff Law committed
865
      rtx new_src = gen_rtx_REG (GET_MODE (SET_DEST (pat)),
866 867 868
                                 REGNO (SET_DEST (pat)));
      emit_move_insn (new_dst, new_src);

869
      rtx_insn *insn = get_insns();
870 871 872 873 874 875
      end_sequence ();
      if (NEXT_INSN (insn))
	return false;
      if (recog_memoized (insn) == -1)
	return false;
      extract_insn (insn);
876
      if (!constrain_operands (1, get_preferred_alternatives (insn, bb)))
877
	return false;
878 879 880
    }


881 882 883 884
  /* If cand->insn has been already modified, update cand->mode to a wider
     mode if possible, or punt.  */
  if (state->modified[INSN_UID (cand->insn)].kind != EXT_MODIFIED_NONE)
    {
885
      machine_mode mode;
886 887 888 889 890 891 892 893 894 895 896 897 898
      rtx set;

      if (state->modified[INSN_UID (cand->insn)].kind
	  != (cand->code == ZERO_EXTEND
	      ? EXT_MODIFIED_ZEXT : EXT_MODIFIED_SEXT)
	  || state->modified[INSN_UID (cand->insn)].mode != cand->mode
	  || (set = single_set (cand->insn)) == NULL_RTX)
	return false;
      mode = GET_MODE (SET_DEST (set));
      gcc_assert (GET_MODE_SIZE (mode) >= GET_MODE_SIZE (cand->mode));
      cand->mode = mode;
    }

899 900 901 902
  merge_successful = true;

  /* Go through the defs vector and try to merge all the definitions
     in this vector.  */
903 904
  state->modified_list.truncate (0);
  FOR_EACH_VEC_ELT (state->defs_list, defs_ix, def_insn)
905
    {
906
      if (merge_def_and_ext (cand, def_insn, state))
907
	state->modified_list.safe_push (def_insn);
908 909 910 911 912 913 914 915 916 917 918
      else
        {
          merge_successful = false;
          break;
        }
    }

  /* Now go through the conditional copies vector and try to merge all
     the copies in this vector.  */
  if (merge_successful)
    {
919
      FOR_EACH_VEC_ELT (state->copies_list, i, def_insn)
920
        {
921
          if (transform_ifelse (cand, def_insn))
922
	    state->modified_list.safe_push (def_insn);
923 924 925 926 927 928 929 930 931 932
          else
            {
              merge_successful = false;
              break;
            }
        }
    }

  if (merge_successful)
    {
933 934 935 936 937
      /* Commit the changes here if possible
	 FIXME: It's an all-or-nothing scenario.  Even if only one definition
	 cannot be merged, we entirely give up.  In the future, we should allow
	 extensions to be partially eliminated along those paths where the
	 definitions could be merged.  */
938 939 940
      if (apply_change_group ())
        {
          if (dump_file)
941
            fprintf (dump_file, "All merges were successful.\n");
942

943
	  FOR_EACH_VEC_ELT (state->modified_list, i, def_insn)
944 945 946 947 948
	    {
	      ext_modified *modified = &state->modified[INSN_UID (def_insn)];
	      if (modified->kind == EXT_MODIFIED_NONE)
		modified->kind = (cand->code == ZERO_EXTEND ? EXT_MODIFIED_ZEXT
						            : EXT_MODIFIED_SEXT);
949

950 951 952
	      if (copy_needed)
		modified->do_not_reextend = 1;
	    }
953 954 955 956
          return true;
        }
      else
        {
957 958
          /* Changes need not be cancelled explicitly as apply_change_group
             does it.  Print list of definitions in the dump_file for debug
959
             purposes.  This extension cannot be deleted.  */
960 961
          if (dump_file)
            {
962 963
	      fprintf (dump_file,
		       "Merge cancelled, non-mergeable definitions:\n");
964
	      FOR_EACH_VEC_ELT (state->modified_list, i, def_insn)
965
	        print_rtl_single (dump_file, def_insn);
966 967 968 969 970 971 972 973 974 975 976 977
            }
        }
    }
  else
    {
      /* Cancel any changes that have been made so far.  */
      cancel_changes (0);
    }

  return false;
}

978
/* Add an extension pattern that could be eliminated.  */
979 980

static void
David Malcolm committed
981
add_removable_extension (const_rtx expr, rtx_insn *insn,
982
			 vec<ext_cand> *insn_list,
983
			 unsigned *def_map)
984
{
985
  enum rtx_code code;
986
  machine_mode mode;
987
  unsigned int idx;
988 989
  rtx src, dest;

990
  /* We are looking for SET (REG N) (ANY_EXTEND (REG N)).  */
991 992 993 994
  if (GET_CODE (expr) != SET)
    return;

  src = SET_SRC (expr);
995
  code = GET_CODE (src);
996
  dest = SET_DEST (expr);
997
  mode = GET_MODE (dest);
998 999

  if (REG_P (dest)
1000
      && (code == SIGN_EXTEND || code == ZERO_EXTEND)
1001
      && REG_P (XEXP (src, 0)))
1002
    {
1003 1004 1005 1006
      struct df_link *defs, *def;
      ext_cand *cand;

      /* First, make sure we can get all the reaching definitions.  */
1007
      defs = get_defs (insn, XEXP (src, 0), NULL);
1008
      if (!defs)
1009
	{
1010 1011 1012
	  if (dump_file)
	    {
	      fprintf (dump_file, "Cannot eliminate extension:\n");
1013
	      print_rtl_single (dump_file, insn);
1014 1015 1016
	      fprintf (dump_file, " because of missing definition(s)\n");
	    }
	  return;
1017
	}
1018 1019 1020 1021

      /* Second, make sure the reaching definitions don't feed another and
	 different extension.  FIXME: this obviously can be improved.  */
      for (def = defs; def; def = def->next)
1022
	if ((idx = def_map[INSN_UID (DF_REF_INSN (def->ref))])
1023
	    && idx != -1U
1024
	    && (cand = &(*insn_list)[idx - 1])
1025
	    && cand->code != code)
1026 1027 1028 1029
	  {
	    if (dump_file)
	      {
	        fprintf (dump_file, "Cannot eliminate extension:\n");
1030
		print_rtl_single (dump_file, insn);
1031 1032 1033 1034
	        fprintf (dump_file, " because of other extension\n");
	      }
	    return;
	  }
1035 1036 1037 1038 1039 1040 1041 1042 1043 1044 1045 1046 1047 1048 1049 1050 1051 1052 1053 1054 1055 1056 1057 1058 1059 1060 1061 1062 1063 1064 1065 1066 1067 1068 1069 1070 1071 1072 1073 1074 1075 1076 1077 1078 1079 1080 1081 1082 1083 1084 1085
	/* For vector mode extensions, ensure that all uses of the
	   XEXP (src, 0) register are the same extension (both code
	   and to which mode), as unlike integral extensions lowpart
	   subreg of the sign/zero extended register are not equal
	   to the original register, so we have to change all uses or
	   none.  */
	else if (VECTOR_MODE_P (GET_MODE (XEXP (src, 0))))
	  {
	    if (idx == 0)
	      {
		struct df_link *ref_chain, *ref_link;

		ref_chain = DF_REF_CHAIN (def->ref);
		for (ref_link = ref_chain; ref_link; ref_link = ref_link->next)
		  {
		    if (ref_link->ref == NULL
			|| DF_REF_INSN_INFO (ref_link->ref) == NULL)
		      {
			idx = -1U;
			break;
		      }
		    rtx_insn *use_insn = DF_REF_INSN (ref_link->ref);
		    const_rtx use_set;
		    if (use_insn == insn || DEBUG_INSN_P (use_insn))
		      continue;
		    if (!(use_set = single_set (use_insn))
			|| !REG_P (SET_DEST (use_set))
			|| GET_MODE (SET_DEST (use_set)) != GET_MODE (dest)
			|| GET_CODE (SET_SRC (use_set)) != code
			|| !rtx_equal_p (XEXP (SET_SRC (use_set), 0),
					 XEXP (src, 0)))
		      {
			idx = -1U;
			break;
		      }
		  }
		if (idx == -1U)
		  def_map[INSN_UID (DF_REF_INSN (def->ref))] = idx;
	      }
	    if (idx == -1U)
	      {
		if (dump_file)
		  {
		    fprintf (dump_file, "Cannot eliminate extension:\n");
		    print_rtl_single (dump_file, insn);
		    fprintf (dump_file,
			     " because some vector uses aren't extension\n");
		  }
		return;
	      }
	  }
1086 1087 1088

      /* Then add the candidate to the list and insert the reaching definitions
         into the definition map.  */
1089
      ext_cand e = {expr, code, mode, insn};
1090 1091
      insn_list->safe_push (e);
      idx = insn_list->length ();
1092 1093

      for (def = defs; def; def = def->next)
1094
	def_map[INSN_UID (DF_REF_INSN (def->ref))] = idx;
1095 1096 1097
    }
}

1098
/* Traverse the instruction stream looking for extensions and return the
1099
   list of candidates.  */
1100

1101
static vec<ext_cand>
1102
find_removable_extensions (void)
1103
{
1104
  vec<ext_cand> insn_list = vNULL;
1105
  basic_block bb;
David Malcolm committed
1106 1107
  rtx_insn *insn;
  rtx set;
1108
  unsigned *def_map = XCNEWVEC (unsigned, max_insn_uid);
1109

1110
  FOR_EACH_BB_FN (bb, cfun)
1111 1112 1113 1114
    FOR_BB_INSNS (bb, insn)
      {
	if (!NONDEBUG_INSN_P (insn))
	  continue;
1115

1116 1117 1118 1119
	set = single_set (insn);
	if (set == NULL_RTX)
	  continue;
	add_removable_extension (set, insn, &insn_list, def_map);
1120 1121
      }

1122
  XDELETEVEC (def_map);
1123

1124
  return insn_list;
1125 1126 1127
}

/* This is the main function that checks the insn stream for redundant
1128
   extensions and tries to remove them if possible.  */
1129

1130
static void
1131
find_and_remove_re (void)
1132
{
1133
  ext_cand *curr_cand;
David Malcolm committed
1134
  rtx_insn *curr_insn = NULL;
1135
  int num_re_opportunities = 0, num_realized = 0, i;
1136
  vec<ext_cand> reinsn_list;
David Malcolm committed
1137 1138
  auto_vec<rtx_insn *> reinsn_del_list;
  auto_vec<rtx_insn *> reinsn_copy_list;
1139
  ext_state state;
1140 1141

  /* Construct DU chain to get all reaching definitions of each
1142
     extension instruction.  */
1143
  df_set_flags (DF_RD_PRUNE_DEAD_DEFS);
1144 1145
  df_chain_add_problem (DF_UD_CHAIN + DF_DU_CHAIN);
  df_analyze ();
1146
  df_set_flags (DF_DEFER_INSN_RESCAN);
1147 1148

  max_insn_uid = get_max_uid ();
1149
  reinsn_list = find_removable_extensions ();
1150 1151 1152 1153 1154
  state.defs_list.create (0);
  state.copies_list.create (0);
  state.modified_list.create (0);
  state.work_list.create (0);
  if (reinsn_list.is_empty ())
1155 1156 1157
    state.modified = NULL;
  else
    state.modified = XCNEWVEC (struct ext_modified, max_insn_uid);
1158

1159
  FOR_EACH_VEC_ELT (reinsn_list, i, curr_cand)
1160
    {
1161
      num_re_opportunities++;
1162

1163
      /* Try to combine the extension with the definition.  */
1164 1165
      if (dump_file)
        {
1166 1167
          fprintf (dump_file, "Trying to eliminate extension:\n");
          print_rtl_single (dump_file, curr_cand->insn);
1168 1169
        }

1170
      if (combine_reaching_defs (curr_cand, curr_cand->expr, &state))
1171 1172
        {
          if (dump_file)
1173
            fprintf (dump_file, "Eliminated the extension.\n");
1174
          num_realized++;
1175 1176 1177 1178 1179 1180 1181
	  /* If the RHS of the current candidate is not (extend (reg)), then
	     we do not allow the optimization of extensions where
	     the source and destination registers do not match.  Thus
	     checking REG_P here is correct.  */
	  if (REG_P (XEXP (SET_SRC (PATTERN (curr_cand->insn)), 0))
	      && (REGNO (SET_DEST (PATTERN (curr_cand->insn)))
		  != REGNO (XEXP (SET_SRC (PATTERN (curr_cand->insn)), 0))))
1182 1183 1184 1185 1186
	    {
              reinsn_copy_list.safe_push (curr_cand->insn);
              reinsn_copy_list.safe_push (state.defs_list[0]);
	    }
	  reinsn_del_list.safe_push (curr_cand->insn);
1187
	  state.modified[INSN_UID (curr_cand->insn)].deleted = 1;
1188 1189 1190
        }
    }

1191 1192 1193 1194 1195 1196 1197 1198 1199 1200 1201 1202 1203 1204 1205 1206
  /* The copy list contains pairs of insns which describe copies we
     need to insert into the INSN stream.

     The first insn in each pair is the extension insn, from which
     we derive the source and destination of the copy.

     The second insn in each pair is the memory reference where the
     extension will ultimately happen.  We emit the new copy
     immediately after this insn.

     It may first appear that the arguments for the copy are reversed.
     Remember that the memory reference will be changed to refer to the
     destination of the extention.  So we're actually emitting a copy
     from the new destination to the old destination.  */
  for (unsigned int i = 0; i < reinsn_copy_list.length (); i += 2)
    {
David Malcolm committed
1207 1208
      rtx_insn *curr_insn = reinsn_copy_list[i];
      rtx_insn *def_insn = reinsn_copy_list[i + 1];
1209 1210 1211 1212 1213 1214

      /* Use the mode of the destination of the defining insn
	 for the mode of the copy.  This is necessary if the
	 defining insn was used to eliminate a second extension
	 that was wider than the first.  */
      rtx sub_rtx = *get_sub_rtx (def_insn);
1215
      rtx pat = PATTERN (curr_insn);
1216
      rtx new_dst = gen_rtx_REG (GET_MODE (SET_DEST (sub_rtx)),
1217
				 REGNO (XEXP (SET_SRC (pat), 0)));
1218 1219
      rtx new_src = gen_rtx_REG (GET_MODE (SET_DEST (sub_rtx)),
				 REGNO (SET_DEST (pat)));
1220
      rtx set = gen_rtx_SET (new_dst, new_src);
1221
      emit_insn_after (set, def_insn);
1222 1223
    }

1224
  /* Delete all useless extensions here in one sweep.  */
1225
  FOR_EACH_VEC_ELT (reinsn_del_list, i, curr_insn)
1226
    delete_insn (curr_insn);
1227

1228 1229 1230 1231 1232
  reinsn_list.release ();
  state.defs_list.release ();
  state.copies_list.release ();
  state.modified_list.release ();
  state.work_list.release ();
1233
  XDELETEVEC (state.modified);
1234

1235
  if (dump_file && num_re_opportunities > 0)
1236 1237
    fprintf (dump_file, "Elimination opportunities = %d realized = %d\n",
	     num_re_opportunities, num_realized);
1238 1239
}

1240
/* Find and remove redundant extensions.  */
1241 1242

static unsigned int
1243
rest_of_handle_ree (void)
1244
{
1245 1246 1247
  timevar_push (TV_REE);
  find_and_remove_re ();
  timevar_pop (TV_REE);
1248 1249 1250
  return 0;
}

1251 1252 1253
namespace {

const pass_data pass_data_ree =
1254
{
1255 1256 1257 1258 1259 1260 1261 1262
  RTL_PASS, /* type */
  "ree", /* name */
  OPTGROUP_NONE, /* optinfo_flags */
  TV_REE, /* tv_id */
  0, /* properties_required */
  0, /* properties_provided */
  0, /* properties_destroyed */
  0, /* todo_flags_start */
1263
  TODO_df_finish, /* todo_flags_finish */
1264
};
1265 1266 1267 1268

class pass_ree : public rtl_opt_pass
{
public:
1269 1270
  pass_ree (gcc::context *ctxt)
    : rtl_opt_pass (pass_data_ree, ctxt)
1271 1272 1273
  {}

  /* opt_pass methods: */
1274
  virtual bool gate (function *) { return (optimize > 0 && flag_ree); }
1275
  virtual unsigned int execute (function *) { return rest_of_handle_ree (); }
1276 1277 1278 1279 1280 1281 1282 1283 1284 1285

}; // class pass_ree

} // anon namespace

rtl_opt_pass *
make_pass_ree (gcc::context *ctxt)
{
  return new pass_ree (ctxt);
}