blob: 3db0a264e29a63c8f59da8ce90b7745f23001d00 [file] [log] [blame]
/* Conditional compare related functions
Copyright (C) 2014-2022 Free Software Foundation, Inc.
This file is part of GCC.
GCC is free software; you can redistribute it and/or modify it under
the terms of the GNU General Public License as published by the Free
Software Foundation; either version 3, or (at your option) any later
GCC is distributed in the hope that it will be useful, but WITHOUT ANY
WARRANTY; without even the implied warranty of MERCHANTABILITY or
for more details.
You should have received a copy of the GNU General Public License
along with GCC; see the file COPYING3. If not see
<>. */
#include "config.h"
#include "system.h"
#include "coretypes.h"
#include "backend.h"
#include "target.h"
#include "rtl.h"
#include "tree.h"
#include "gimple.h"
#include "memmodel.h"
#include "tm_p.h"
#include "ssa.h"
#include "expmed.h"
#include "optabs.h"
#include "emit-rtl.h"
#include "stor-layout.h"
#include "tree-ssa-live.h"
#include "tree-outof-ssa.h"
#include "cfgexpand.h"
#include "ccmp.h"
#include "predict.h"
/* Check whether T is a simple boolean variable or a SSA name
set by a comparison operator in the same basic block. */
static bool
ccmp_tree_comparison_p (tree t, basic_block bb)
gimple *g = get_gimple_for_ssa_name (t);
tree_code tcode;
/* If we have a boolean variable allow it and generate a compare
to zero reg when expanding. */
if (!g)
/* Check to see if SSA name is set by a comparison operator in
the same basic block. */
if (!is_gimple_assign (g))
return false;
if (bb != gimple_bb (g))
return false;
tcode = gimple_assign_rhs_code (g);
return TREE_CODE_CLASS (tcode) == tcc_comparison;
/* The following functions expand conditional compare (CCMP) instructions.
Here is a short description about the over all algorithm:
* ccmp_candidate_p is used to identify the CCMP candidate
* expand_ccmp_expr is the main entry, which calls expand_ccmp_expr_1
to expand CCMP.
* expand_ccmp_expr_1 uses a recursive algorithm to expand CCMP.
It calls two target hooks gen_ccmp_first and gen_ccmp_next to generate
CCMP instructions.
- gen_ccmp_first expands the first compare in CCMP.
- gen_ccmp_next expands the following compares.
Both hooks return a comparison with the CC register that is equivalent
to the value of the gimple comparison. This is used by the next CCMP
and in the final conditional store.
* We use cstorecc4 pattern to convert the CCmode intermediate to
the integer mode result that expand_normal is expecting.
Since the operands of the later compares might clobber CC reg, we do not
emit the insns during expand. We keep the insn sequences in two seq
* prep_seq, which includes all the insns to prepare the operands.
* gen_seq, which includes all the compare and conditional compares.
If all checks OK in expand_ccmp_expr, it emits insns in prep_seq, then
insns in gen_seq. */
/* Check whether G is a potential conditional compare candidate. */
static bool
ccmp_candidate_p (gimple *g)
tree lhs, op0, op1;
gimple *gs0, *gs1;
tree_code tcode;
basic_block bb;
if (!g)
return false;
tcode = gimple_assign_rhs_code (g);
if (tcode != BIT_AND_EXPR && tcode != BIT_IOR_EXPR)
return false;
lhs = gimple_assign_lhs (g);
op0 = gimple_assign_rhs1 (g);
op1 = gimple_assign_rhs2 (g);
if ((TREE_CODE (op0) != SSA_NAME) || (TREE_CODE (op1) != SSA_NAME)
|| !has_single_use (lhs))
return false;
bb = gimple_bb (g);
gs0 = get_gimple_for_ssa_name (op0); /* gs0 may be NULL */
gs1 = get_gimple_for_ssa_name (op1); /* gs1 may be NULL */
if (ccmp_tree_comparison_p (op0, bb) && ccmp_tree_comparison_p (op1, bb))
return true;
if (ccmp_tree_comparison_p (op0, bb) && ccmp_candidate_p (gs1))
return true;
if (ccmp_tree_comparison_p (op1, bb) && ccmp_candidate_p (gs0))
return true;
/* We skip ccmp_candidate_p (gs1) && ccmp_candidate_p (gs0) since
there is no way to set and maintain the CC flag on both sides of
the logical operator at the same time. */
return false;
/* Extract the comparison we want to do from the tree. */
get_compare_parts (tree t, int *up, rtx_code *rcode,
tree *rhs1, tree *rhs2)
tree_code code;
gimple *g = get_gimple_for_ssa_name (t);
if (g)
*up = TYPE_UNSIGNED (TREE_TYPE (gimple_assign_rhs1 (g)));
code = gimple_assign_rhs_code (g);
*rcode = get_rtx_code (code, *up);
*rhs1 = gimple_assign_rhs1 (g);
*rhs2 = gimple_assign_rhs2 (g);
/* If g is not a comparison operator create a compare to zero. */
*up = 1;
*rcode = NE;
*rhs1 = t;
*rhs2 = build_zero_cst (TREE_TYPE (t));
/* PREV is a comparison with the CC register which represents the
result of the previous CMP or CCMP. The function expands the
next compare based on G which is ANDed/ORed with the previous
compare depending on CODE.
PREP_SEQ returns all insns to prepare opearands for compare.
GEN_SEQ returns all compare insns. */
static rtx
expand_ccmp_next (tree op, tree_code code, rtx prev,
rtx_insn **prep_seq, rtx_insn **gen_seq)
rtx_code rcode;
int unsignedp;
tree rhs1, rhs2;
get_compare_parts(op, &unsignedp, &rcode, &rhs1, &rhs2);
return targetm.gen_ccmp_next (prep_seq, gen_seq, prev, rcode,
rhs1, rhs2, get_rtx_code (code, 0));
/* Expand conditional compare gimple G. A typical CCMP sequence is like:
CC0 = CMP (a, b);
CC1 = CCMP (NE (CC0, 0), CMP (e, f));
CCn = CCMP (NE (CCn-1, 0), CMP (...));
hook gen_ccmp_first is used to expand the first compare.
hook gen_ccmp_next is used to expand the following CCMP.
PREP_SEQ returns all insns to prepare opearand.
GEN_SEQ returns all compare insns. */
static rtx
expand_ccmp_expr_1 (gimple *g, rtx_insn **prep_seq, rtx_insn **gen_seq)
tree_code code = gimple_assign_rhs_code (g);
basic_block bb = gimple_bb (g);
tree op0 = gimple_assign_rhs1 (g);
tree op1 = gimple_assign_rhs2 (g);
gimple *gs0 = get_gimple_for_ssa_name (op0);
gimple *gs1 = get_gimple_for_ssa_name (op1);
rtx tmp;
gcc_assert (code == BIT_AND_EXPR || code == BIT_IOR_EXPR);
if (ccmp_tree_comparison_p (op0, bb))
if (ccmp_tree_comparison_p (op1, bb))
int unsignedp0, unsignedp1;
rtx_code rcode0, rcode1;
tree logical_op0_rhs1, logical_op0_rhs2;
tree logical_op1_rhs1, logical_op1_rhs2;
int speed_p = optimize_insn_for_speed_p ();
rtx tmp2 = NULL_RTX, ret = NULL_RTX, ret2 = NULL_RTX;
unsigned cost1 = MAX_COST;
unsigned cost2 = MAX_COST;
get_compare_parts (op0, &unsignedp0, &rcode0,
&logical_op0_rhs1, &logical_op0_rhs2);
get_compare_parts (op1, &unsignedp1, &rcode1,
&logical_op1_rhs1, &logical_op1_rhs2);
rtx_insn *prep_seq_1, *gen_seq_1;
tmp = targetm.gen_ccmp_first (&prep_seq_1, &gen_seq_1, rcode0,
logical_op0_rhs1, logical_op0_rhs2);
if (tmp != NULL)
ret = expand_ccmp_next (op1, code, tmp, &prep_seq_1, &gen_seq_1);
cost1 = seq_cost (prep_seq_1, speed_p);
cost1 += seq_cost (gen_seq_1, speed_p);
/* FIXME: Temporary workaround for PR69619.
Avoid exponential compile time due to expanding gs0 and gs1 twice.
If gs0 and gs1 are complex, the cost will be high, so avoid
reevaluation if above an arbitrary threshold. */
rtx_insn *prep_seq_2, *gen_seq_2;
if (tmp == NULL || cost1 < COSTS_N_INSNS (25))
tmp2 = targetm.gen_ccmp_first (&prep_seq_2, &gen_seq_2, rcode1,
logical_op1_rhs1, logical_op1_rhs2);
if (!tmp && !tmp2)
return NULL_RTX;
if (tmp2 != NULL)
ret2 = expand_ccmp_next (op0, code, tmp2, &prep_seq_2,
cost2 = seq_cost (prep_seq_2, speed_p);
cost2 += seq_cost (gen_seq_2, speed_p);
if (cost2 < cost1)
*prep_seq = prep_seq_2;
*gen_seq = gen_seq_2;
return ret2;
*prep_seq = prep_seq_1;
*gen_seq = gen_seq_1;
return ret;
tmp = expand_ccmp_expr_1 (gs1, prep_seq, gen_seq);
if (!tmp)
return NULL_RTX;
return expand_ccmp_next (op0, code, tmp, prep_seq, gen_seq);
gcc_assert (gimple_assign_rhs_code (gs0) == BIT_AND_EXPR
|| gimple_assign_rhs_code (gs0) == BIT_IOR_EXPR);
gcc_assert (ccmp_tree_comparison_p (op1, bb));
tmp = expand_ccmp_expr_1 (gs0, prep_seq, gen_seq);
if (!tmp)
return NULL_RTX;
return expand_ccmp_next (op1, code, tmp, prep_seq, gen_seq);
/* Main entry to expand conditional compare statement G.
Return NULL_RTX if G is not a legal candidate or expand fail.
Otherwise return the target. */
expand_ccmp_expr (gimple *g, machine_mode mode)
rtx_insn *last;
rtx tmp;
if (!ccmp_candidate_p (g))
return NULL_RTX;
last = get_last_insn ();
rtx_insn *prep_seq = NULL, *gen_seq = NULL;
tmp = expand_ccmp_expr_1 (g, &prep_seq, &gen_seq);
if (tmp)
insn_code icode;
machine_mode cc_mode = CCmode;
rtx_code cmp_code = GET_CODE (tmp);
cc_mode = SELECT_CC_MODE (cmp_code, XEXP (tmp, 0), const0_rtx);
icode = optab_handler (cstore_optab, cc_mode);
if (icode != CODE_FOR_nothing)
rtx target = gen_reg_rtx (mode);
emit_insn (prep_seq);
emit_insn (gen_seq);
tmp = emit_cstore (target, icode, cmp_code, cc_mode, cc_mode,
0, XEXP (tmp, 0), const0_rtx, 1, mode);
if (tmp)
return tmp;
/* Clean up. */
delete_insns_since (last);
return NULL_RTX;