• Home
  • Line#
  • Scopes#
  • Navigate#
  • Raw
  • Download
1 /*
2  * Copyright © 2015 Connor Abbott
3  *
4  * Permission is hereby granted, free of charge, to any person obtaining a
5  * copy of this software and associated documentation files (the "Software"),
6  * to deal in the Software without restriction, including without limitation
7  * the rights to use, copy, modify, merge, publish, distribute, sublicense,
8  * and/or sell copies of the Software, and to permit persons to whom the
9  * Software is furnished to do so, subject to the following conditions:
10  *
11  * The above copyright notice and this permission notice (including the next
12  * paragraph) shall be included in all copies or substantial portions of the
13  * Software.
14  *
15  * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
16  * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
17  * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT.  IN NO EVENT SHALL
18  * THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
19  * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING
20  * FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS
21  * IN THE SOFTWARE.
22  *
23  * Authors:
24  *    Connor Abbott (cwabbott0@gmail.com)
25  *
26  */
27 
28 #include "nir.h"
29 #include "nir_builder.h"
30 
31 static bool
phi_srcs_equal(nir_def * a,nir_def * b)32 phi_srcs_equal(nir_def *a, nir_def *b)
33 {
34    if (a == b)
35       return true;
36 
37    if (a->parent_instr->type != b->parent_instr->type)
38       return false;
39 
40    if (a->parent_instr->type != nir_instr_type_alu &&
41        a->parent_instr->type != nir_instr_type_load_const)
42       return false;
43 
44    if (!nir_instrs_equal(a->parent_instr, b->parent_instr))
45       return false;
46 
47    /* nir_instrs_equal ignores exact/fast_math */
48    if (a->parent_instr->type == nir_instr_type_alu) {
49       nir_alu_instr *a_alu = nir_instr_as_alu(a->parent_instr);
50       nir_alu_instr *b_alu = nir_instr_as_alu(b->parent_instr);
51       if (a_alu->exact != b_alu->exact || a_alu->fp_fast_math != b_alu->fp_fast_math)
52          return false;
53    }
54 
55    return true;
56 }
57 
58 static bool
src_dominates_block(nir_src * src,void * state)59 src_dominates_block(nir_src *src, void *state)
60 {
61    nir_block *block = state;
62    return nir_block_dominates(src->ssa->parent_instr->block, block);
63 }
64 
65 static bool
can_rematerialize_phi_src(nir_block * imm_dom,nir_def * def)66 can_rematerialize_phi_src(nir_block *imm_dom, nir_def *def)
67 {
68    if (def->parent_instr->type == nir_instr_type_alu) {
69       return nir_foreach_src(def->parent_instr, src_dominates_block, imm_dom);
70    } else if (def->parent_instr->type == nir_instr_type_load_const) {
71       return true;
72    }
73    return false;
74 }
75 
/*
 * This is a pass for removing phi nodes that look like:
 * a = phi(b, b, b, ...)
 *
 * Note that we can't always ignore undef sources here, or else we may create a
 * situation where a use of b isn't dominated by the definition of b. When no
 * source is ignored, we're allowed to replace a with b since the definition
 * of b must dominate all of the phi node's predecessors, which means it must
 * dominate the phi node as well as all of the phi node's uses. In essence,
 * the phi node acts as a copy instruction. b can't be another phi node in the
 * same block, since the only time when phi nodes can source other phi nodes
 * defined in the same block is at the loop header, and in that case one of
 * the sources of the phi has to be from before the loop and that source can't
 * be b.
 */
90 
91 static bool
remove_phis_block(nir_block * block,nir_builder * b)92 remove_phis_block(nir_block *block, nir_builder *b)
93 {
94    bool progress = false;
95 
96    nir_foreach_phi_safe(phi, block) {
97       nir_def *def = NULL;
98       bool srcs_same = true;
99       bool needs_remat = false;
100 
101       nir_foreach_phi_src(src, phi) {
102          /* For phi nodes at the beginning of loops, we may encounter some
103           * sources from backedges that point back to the destination of the
104           * same phi, i.e. something like:
105           *
106           * a = phi(a, b, ...)
107           *
108           * We can safely ignore these sources, since if all of the normal
109           * sources point to the same definition, then that definition must
110           * still dominate the phi node, and the phi will still always take
111           * the value of that definition.
112           */
113          if (src->src.ssa == &phi->def)
114             continue;
115 
116          /* Ignore undef sources. */
117          if (nir_src_is_undef(src->src))
118             continue;
119 
120          if (def == NULL) {
121             def = src->src.ssa;
122             if (!nir_block_dominates(def->parent_instr->block, block->imm_dom)) {
123                if (!can_rematerialize_phi_src(block->imm_dom, def)) {
124                   srcs_same = false;
125                   break;
126                }
127                needs_remat = true;
128             }
129          } else if (!phi_srcs_equal(src->src.ssa, def)) {
130             srcs_same = false;
131             break;
132          }
133       }
134 
135       if (!srcs_same)
136          continue;
137 
138       if (!def) {
139          /* In this case, the phi had no non undef sources. So turn it into an undef. */
140          b->cursor = nir_after_phis(block);
141          def = nir_undef(b, phi->def.num_components, phi->def.bit_size);
142       } else if (needs_remat) {
143          b->cursor = nir_after_block_before_jump(block->imm_dom);
144          nir_instr *remat = nir_instr_clone(b->shader, def->parent_instr);
145          nir_builder_instr_insert(b, remat);
146          def = nir_instr_def(remat);
147       }
148 
149       nir_def_replace(&phi->def, def);
150 
151       progress = true;
152    }
153 
154    return progress;
155 }
156 
157 bool
nir_remove_single_src_phis_block(nir_block * block)158 nir_remove_single_src_phis_block(nir_block *block)
159 {
160    assert(block->predecessors->entries <= 1);
161    bool progress = false;
162    nir_foreach_phi_safe(phi, block) {
163       nir_def *def = NULL;
164       nir_foreach_phi_src(src, phi) {
165          def = src->src.ssa;
166          break;
167       }
168 
169       if (!def) {
170          nir_builder b = nir_builder_create(nir_cf_node_get_function(&block->cf_node));
171          b.cursor = nir_after_phis(block);
172          def = nir_undef(&b, phi->def.num_components, phi->def.bit_size);
173       }
174 
175       nir_def_replace(&phi->def, def);
176       progress = true;
177    }
178    return progress;
179 }
180 
181 static bool
nir_opt_remove_phis_impl(nir_function_impl * impl)182 nir_opt_remove_phis_impl(nir_function_impl *impl)
183 {
184    bool progress = false;
185    nir_builder bld = nir_builder_create(impl);
186 
187    nir_metadata_require(impl, nir_metadata_dominance);
188 
189    nir_foreach_block(block, impl) {
190       progress |= remove_phis_block(block, &bld);
191    }
192 
193    if (progress) {
194       nir_metadata_preserve(impl, nir_metadata_control_flow);
195    } else {
196       nir_metadata_preserve(impl, nir_metadata_all);
197    }
198 
199    return progress;
200 }
201 
202 bool
nir_opt_remove_phis(nir_shader * shader)203 nir_opt_remove_phis(nir_shader *shader)
204 {
205    bool progress = false;
206 
207    nir_foreach_function_impl(impl, shader)
208       progress = nir_opt_remove_phis_impl(impl) || progress;
209 
210    return progress;
211 }
212