Home | History | Annotate | Download | only in sb
      1 /*
      2  * Copyright 2013 Vadim Girlin <vadimgirlin (at) gmail.com>
      3  *
      4  * Permission is hereby granted, free of charge, to any person obtaining a
      5  * copy of this software and associated documentation files (the "Software"),
      6  * to deal in the Software without restriction, including without limitation
      7  * on the rights to use, copy, modify, merge, publish, distribute, sub
      8  * license, and/or sell copies of the Software, and to permit persons to whom
      9  * the Software is furnished to do so, subject to the following conditions:
     10  *
     11  * The above copyright notice and this permission notice (including the next
     12  * paragraph) shall be included in all copies or substantial portions of the
     13  * Software.
     14  *
     15  * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
     16  * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
     17  * FITNESS FOR A PARTICULAR PURPOSE AND NON-INFRINGEMENT. IN NO EVENT SHALL
     18  * THE AUTHOR(S) AND/OR THEIR SUPPLIERS BE LIABLE FOR ANY CLAIM,
     19  * DAMAGES OR OTHER LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR
     20  * OTHERWISE, ARISING FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE
     21  * USE OR OTHER DEALINGS IN THE SOFTWARE.
     22  *
     23  * Authors:
     24  *      Vadim Girlin
     25  */
     26 
     27 #include <stack>
     28 #include <map>
     29 
     30 #include "sb_shader.h"
     31 #include "sb_pass.h"
     32 
     33 namespace r600_sb {
     34 
     35 container_node* ssa_prepare::create_phi_nodes(int count) {
     36 	container_node *p = sh.create_container();
     37 	val_set &vars = cur_set();
     38 	node *nn;
     39 
     40 	for (val_set::iterator I = vars.begin(sh), E = vars.end(sh); I != E; ++I) {
     41 		nn = sh.create_node(NT_OP, NST_PHI);
     42 		nn->dst.assign(1, *I);
     43 		nn->src.assign(count, *I);
     44 		p->push_back(nn);
     45 	}
     46 	return p;
     47 }
     48 
     49 void ssa_prepare::add_defs(node &n) {
     50 	val_set &s = cur_set();
     51 	for (vvec::iterator I = n.dst.begin(), E = n.dst.end(); I != E; ++I) {
     52 		value *v = *I;
     53 		if (!v)
     54 			continue;
     55 
     56 		if (v->is_rel()) {
     57 			s.add_vec(v->mdef);
     58 		} else
     59 			s.add_val(v);
     60 	}
     61 }
     62 
     63 bool ssa_prepare::visit(cf_node& n, bool enter) {
     64 	if (enter) {
     65 		push_stk();
     66 	} else {
     67 		add_defs(n);
     68 		pop_stk();
     69 	}
     70 	return true;
     71 }
     72 
     73 bool ssa_prepare::visit(alu_node& n, bool enter) {
     74 	if (enter) {
     75 	} else {
     76 		add_defs(n);
     77 	}
     78 	return true;
     79 }
     80 
     81 bool ssa_prepare::visit(fetch_node& n, bool enter) {
     82 	if (enter) {
     83 	} else {
     84 		add_defs(n);
     85 	}
     86 	return true;
     87 }
     88 
     89 bool ssa_prepare::visit(region_node& n, bool enter) {
     90 	if (enter) {
     91 
     92 		push_stk();
     93 	} else {
     94 		cur_set().add_set(n.vars_defined);
     95 		if (n.dep_count() > 0)
     96 			n.phi = create_phi_nodes(n.dep_count());
     97 		if (n.rep_count() > 1) {
     98 			n.loop_phi = create_phi_nodes(n.rep_count());
     99 			n.loop_phi->subtype = NST_LOOP_PHI_CONTAINER;
    100 		}
    101 		n.vars_defined.clear();
    102 		pop_stk();
    103 	}
    104 	return true;
    105 }
    106 
    107 bool ssa_prepare::visit(repeat_node& n, bool enter) {
    108 	if (enter) {
    109 		push_stk();
    110 	} else {
    111 		assert(n.target);
    112 		n.target->vars_defined.add_set(cur_set());
    113 		cur_set().clear();
    114 		pop_stk();
    115 	}
    116 	return true;
    117 }
    118 
    119 bool ssa_prepare::visit(depart_node& n, bool enter) {
    120 	if (enter) {
    121 		push_stk();
    122 	} else {
    123 		assert(n.target);
    124 		n.target->vars_defined.add_set(cur_set());
    125 		cur_set().clear();
    126 		pop_stk();
    127 	}
    128 	return true;
    129 }
    130 
    131 // ===============================
    132 
    133 int ssa_rename::init() {
    134 	rename_stack.push(def_map());
    135 	rename_lds_oq_stack.push(def_map());
    136 	rename_lds_rw_stack.push(def_map());
    137 	return 0;
    138 }
    139 
    140 bool ssa_rename::visit(alu_group_node& n, bool enter) {
    141 	// taking into account parallel execution of the alu group
    142 	if (enter) {
    143 		for (node_iterator I = n.begin(), E = n.end(); I != E; ++I) {
    144 			I->accept(*this, true);
    145 		}
    146 	} else {
    147 		for (node_iterator I = n.begin(), E = n.end(); I != E; ++I) {
    148 			I->accept(*this, false);
    149 		}
    150 	}
    151 	return false;
    152 }
    153 
    154 bool ssa_rename::visit(cf_node& n, bool enter) {
    155 	if (enter) {
    156 		rename_src(&n);
    157 	} else {
    158 		rename_dst(&n);
    159 	}
    160 	return true;
    161 }
    162 
    163 bool ssa_rename::visit(alu_node& n, bool enter) {
    164 	if (enter) {
    165 		rename_src(&n);
    166 	} else {
    167 
    168 		node *psi = NULL;
    169 
    170 		if (n.pred && n.dst[0]) {
    171 
    172 			value *d = n.dst[0];
    173 			unsigned index = get_index(rename_stack.top(), d);
    174 			value *p = sh.get_value_version(d, index);
    175 
    176 			psi = sh.create_node(NT_OP, NST_PSI);
    177 
    178 			container_node *parent;
    179 			if (n.parent->subtype == NST_ALU_GROUP)
    180 				parent = n.parent;
    181 			else {
    182 				assert (n.parent->parent->subtype == NST_ALU_GROUP);
    183 				parent = n.parent->parent;
    184 			}
    185 			parent->insert_after(psi);
    186 
    187 			assert(n.bc.pred_sel);
    188 
    189 			psi->src.resize(6);
    190 			psi->src[2] = p;
    191 			psi->src[3] = n.pred;
    192 			psi->src[4] = sh.get_pred_sel(n.bc.pred_sel - PRED_SEL_0);
    193 			psi->src[5] = d;
    194 			psi->dst.push_back(d);
    195 		}
    196 
    197 		rename_dst(&n);
    198 
    199 		if (psi) {
    200 			rename_src(psi);
    201 			rename_dst(psi);
    202 		}
    203 
    204 		if (!n.dst.empty() && n.dst[0]) {
    205 			// FIXME probably use separate pass for such things
    206 			if ((n.bc.op_ptr->flags & AF_INTERP) || n.bc.op == ALU_OP2_CUBE)
    207 				n.dst[0]->flags |= VLF_PIN_CHAN;
    208 		}
    209 	}
    210 	return true;
    211 }
    212 
    213 bool ssa_rename::visit(alu_packed_node& n, bool enter) {
    214 	if (enter) {
    215 		for (node_iterator I = n.begin(), E = n.end(); I != E; ++I) {
    216 			I->accept(*this, true);
    217 		}
    218 	} else {
    219 		for (node_iterator I = n.begin(), E = n.end(); I != E; ++I) {
    220 			I->accept(*this, false);
    221 		}
    222 
    223 		bool repl = (n.op_ptr()->flags & AF_REPL) ||
    224 				(ctx.is_cayman() && (n.first->alu_op_slot_flags() & AF_S));
    225 
    226 		n.init_args(repl);
    227 	}
    228 	return false;
    229 }
    230 
    231 bool ssa_rename::visit(fetch_node& n, bool enter) {
    232 	if (enter) {
    233 		rename_src(&n);
    234 		rename_dst(&n);
    235 	} else {
    236 	}
    237 	return true;
    238 }
    239 
    240 bool ssa_rename::visit(region_node& n, bool enter) {
    241 	if (enter) {
    242 		if (n.loop_phi)
    243 			rename_phi_args(n.loop_phi, 0, true);
    244 	} else {
    245 		if (n.phi)
    246 			rename_phi_args(n.phi, ~0u, true);
    247 	}
    248 	return true;
    249 }
    250 
    251 bool ssa_rename::visit(repeat_node& n, bool enter) {
    252 	if (enter) {
    253 		push(n.target->loop_phi);
    254 	} else {
    255 		if (n.target->loop_phi)
    256 			rename_phi_args(n.target->loop_phi, n.rep_id, false);
    257 		pop();
    258 	}
    259 	return true;
    260 }
    261 
    262 bool ssa_rename::visit(depart_node& n, bool enter) {
    263 	if (enter) {
    264 		push(n.target->phi);
    265 	} else {
    266 		if (n.target->phi)
    267 			rename_phi_args(n.target->phi, n.dep_id, false);
    268 		pop();
    269 	}
    270 	return true;
    271 }
    272 
    273 bool ssa_rename::visit(if_node& n, bool enter) {
    274 	if (enter) {
    275 	} else {
    276 		n.cond = rename_use(&n, n.cond);
    277 	}
    278 	return true;
    279 }
    280 
    281 void ssa_rename::push(node* phi) {
    282 	rename_stack.push(rename_stack.top());
    283 }
    284 
    285 void ssa_rename::pop() {
    286 	rename_stack.pop();
    287 }
    288 
    289 value* ssa_rename::rename_use(node *n, value* v) {
    290 	if (v->version)
    291 		return v;
    292 	unsigned index;
    293 	if (v->is_lds_access()) {
    294 		index = get_index(rename_lds_rw_stack.top(), v);
    295 	} else if (v->is_lds_oq()) {
    296 		index = new_index(lds_oq_count, v);
    297 		set_index(rename_lds_oq_stack.top(), v, index);
    298 	} else {
    299 		index = get_index(rename_stack.top(), v);
    300 	}
    301 
    302 	v = sh.get_value_version(v, index);
    303 
    304 	// if (alu) instruction is predicated and source arg comes from psi node
    305 	// (that is, from another predicated instruction through its psi node),
    306 	// we can try to select the corresponding source value directly
    307 	if (n->pred && v->def && v->def->subtype == NST_PSI) {
    308 		assert(n->subtype == NST_ALU_INST);
    309 		alu_node *an = static_cast<alu_node*>(n);
    310 		node *pn = v->def;
    311 		// FIXME make it more generic ???
    312 		if (pn->src.size() == 6) {
    313 			if (pn->src[3] == n->pred) {
    314 				value* ps = sh.get_pred_sel(an->bc.pred_sel - PRED_SEL_0);
    315 				if (pn->src[4] == ps)
    316 					return pn->src[5];
    317 				else
    318 					return pn->src[2];
    319 			}
    320 		}
    321 	}
    322 	return v;
    323 }
    324 
    325 value* ssa_rename::rename_def(node *n, value* v) {
    326 	unsigned index;
    327 
    328 	if (v->is_lds_access()) {
    329 		index = new_index(lds_rw_count, v);
    330 		set_index(rename_lds_rw_stack.top(), v, index);
    331 	} else {
    332 		index = new_index(def_count, v);
    333 		set_index(rename_stack.top(), v, index);
    334 	}
    335 	value *r = sh.get_value_version(v, index);
    336 	return r;
    337 }
    338 
    339 void ssa_rename::rename_src_vec(node *n, vvec &vv, bool src) {
    340 	for(vvec::iterator I = vv.begin(), E = vv.end(); I != E; ++I) {
    341 		value* &v = *I;
    342 		if (!v || v->is_readonly())
    343 			continue;
    344 
    345 		if (v->is_rel()) {
    346 			if (!v->rel->is_readonly())
    347 				v->rel = rename_use(n, v->rel);
    348 			rename_src_vec(n, v->muse, true);
    349 		} else if (src)
    350 			v = rename_use(n, v);
    351 	}
    352 }
    353 
    354 void ssa_rename::rename_src(node* n) {
    355 	if (n->pred)
    356 		n->pred = rename_use(n, n->pred);
    357 
    358 	rename_src_vec(n, n->src, true);
    359 	rename_src_vec(n, n->dst, false);
    360 
    361 }
    362 
    363 void ssa_rename::rename_dst_vec(node *n, vvec &vv, bool set_def) {
    364 
    365 	for(vvec::iterator I = vv.begin(), E = vv.end(); I != E; ++I) {
    366 		value* &v = *I;
    367 		if (!v)
    368 			continue;
    369 
    370 		if (v->is_rel()) {
    371 			rename_dst_vec(n, v->mdef, false);
    372 		} else {
    373 			v = rename_def(n, v);
    374 			if (set_def)
    375 				v->def = n;
    376 		}
    377 	}
    378 }
    379 
    380 void ssa_rename::rename_dst(node* n) {
    381 	rename_dst_vec(n, n->dst, true);
    382 }
    383 
    384 unsigned ssa_rename::get_index(def_map& m, value* v) {
    385 	def_map::iterator I = m.find(v);
    386 	if (I != m.end())
    387 		return I->second;
    388 	return 0;
    389 }
    390 
    391 void ssa_rename::set_index(def_map& m, value* v, unsigned index) {
    392 	std::pair<def_map::iterator,bool>  r = m.insert(std::make_pair(v, index));
    393 	if (!r.second)
    394 		r.first->second = index;
    395 }
    396 
    397 unsigned ssa_rename::new_index(def_map& m, value* v) {
    398 	unsigned index = 1;
    399 	def_map::iterator I = m.find(v);
    400 	if (I != m.end())
    401 		index = ++I->second;
    402 	else
    403 		m.insert(std::make_pair(v, index));
    404 	return index;
    405 }
    406 
    407 bool ssa_rename::visit(node& n, bool enter) {
    408 	if (enter) {
    409 		assert(n.subtype == NST_PSI);
    410 		rename_src(&n);
    411 		rename_dst(&n);
    412 	}
    413 	return false;
    414 }
    415 
    416 bool ssa_rename::visit(container_node& n, bool enter) {
    417 	if (enter) {
    418 	} else {
    419 		// should be root container node
    420 		assert(n.parent == NULL);
    421 		rename_src_vec(&n, n.src, true);
    422 	}
    423 	return true;
    424 }
    425 
    426 void ssa_rename::rename_phi_args(container_node* phi, unsigned op, bool def) {
    427 	for (node_iterator I = phi->begin(), E = phi->end(); I != E; ++I) {
    428 		node *o = *I;
    429 		if (op != ~0u)
    430 			o->src[op] = rename_use(o, o->src[op]);
    431 		if (def) {
    432 			o->dst[0] = rename_def(o, o->dst[0]);
    433 			o->dst[0]->def = o;
    434 		}
    435 	}
    436 }
    437 
    438 } // namespace r600_sb
    439