Home | History | Annotate | Download | only in compiler
      1 /*
      2  * Copyright (C) 2008 Nicolai Haehnle.
      3  *
      4  * All Rights Reserved.
      5  *
      6  * Permission is hereby granted, free of charge, to any person obtaining
      7  * a copy of this software and associated documentation files (the
      8  * "Software"), to deal in the Software without restriction, including
      9  * without limitation the rights to use, copy, modify, merge, publish,
     10  * distribute, sublicense, and/or sell copies of the Software, and to
     11  * permit persons to whom the Software is furnished to do so, subject to
     12  * the following conditions:
     13  *
     14  * The above copyright notice and this permission notice (including the
     15  * next paragraph) shall be included in all copies or substantial
     16  * portions of the Software.
     17  *
     18  * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND,
     19  * EXPRESS OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF
     20  * MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT.
     21  * IN NO EVENT SHALL THE COPYRIGHT OWNER(S) AND/OR ITS SUPPLIERS BE
     22  * LIABLE FOR ANY CLAIM, DAMAGES OR OTHER LIABILITY, WHETHER IN AN ACTION
     23  * OF CONTRACT, TORT OR OTHERWISE, ARISING FROM, OUT OF OR IN CONNECTION
     24  * WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE SOFTWARE.
     25  *
     26  */
     27 
     28 #include "radeon_program.h"
     29 
     30 #include <stdio.h>
     31 
     32 #include "radeon_compiler.h"
     33 #include "radeon_dataflow.h"
     34 
     35 
     36 /**
     37  * Transform the given clause in the following way:
     38  *  1. Replace it with an empty clause
     39  *  2. For every instruction in the original clause, try the given
     40  *     transformations in order.
     41  *  3. If one of the transformations returns GL_TRUE, assume that it
     42  *     has emitted the appropriate instruction(s) into the new clause;
     43  *     otherwise, copy the instruction verbatim.
     44  *
     45  * \note The transformation is currently not recursive; in other words,
     46  * instructions emitted by transformations are not transformed.
     47  *
     48  * \note The transform is called 'local' because it can only look at
     49  * one instruction at a time.
     50  */
     51 void rc_local_transform(
     52 	struct radeon_compiler * c,
     53 	void *user)
     54 {
     55 	struct radeon_program_transformation *transformations =
     56 		(struct radeon_program_transformation*)user;
     57 	struct rc_instruction * inst = c->Program.Instructions.Next;
     58 
     59 	while(inst != &c->Program.Instructions) {
     60 		struct rc_instruction * current = inst;
     61 		int i;
     62 
     63 		inst = inst->Next;
     64 
     65 		for(i = 0; transformations[i].function; ++i) {
     66 			struct radeon_program_transformation* t = transformations + i;
     67 
     68 			if (t->function(c, current, t->userData))
     69 				break;
     70 		}
     71 	}
     72 }
     73 
/**
 * State handed to get_used_temporaries_cb through its userdata pointer.
 */
struct get_used_temporaries_data {
	/* One component mask per temporary, indexed by register index. */
	unsigned char * Used;
	/* Number of entries in Used; larger indices are ignored by the callback. */
	unsigned int UsedLength;
};
     78 
     79 static void get_used_temporaries_cb(
     80 	void * userdata,
     81 	struct rc_instruction * inst,
     82 	rc_register_file file,
     83 	unsigned int index,
     84 	unsigned int mask)
     85 {
     86 	struct get_used_temporaries_data * d = userdata;
     87 
     88 	if (file != RC_FILE_TEMPORARY)
     89 		return;
     90 
     91 	if (index >= d->UsedLength)
     92 		return;
     93 
     94 	d->Used[index] |= mask;
     95 }
     96 
     97 /**
     98  * This function fills in the parameter 'used' with a writemask that
     99  * represent which components of each temporary register are used by the
    100  * program.  This is meant to be combined with rc_find_free_temporary_list as a
    101  * more efficient version of rc_find_free_temporary.
    102  * @param used The function does not initialize this parameter.
    103  */
    104 void rc_get_used_temporaries(
    105 	struct radeon_compiler * c,
    106 	unsigned char * used,
    107 	unsigned int used_length)
    108 {
    109 	struct rc_instruction * inst;
    110 	struct get_used_temporaries_data d;
    111 	d.Used = used;
    112 	d.UsedLength = used_length;
    113 
    114 	for(inst = c->Program.Instructions.Next;
    115 			inst != &c->Program.Instructions; inst = inst->Next) {
    116 
    117 		rc_for_all_reads_mask(inst, get_used_temporaries_cb, &d);
    118 		rc_for_all_writes_mask(inst, get_used_temporaries_cb, &d);
    119 	}
    120 }
    121 
    122 /* Search a list of used temporaries for a free one
    123  * \sa rc_get_used_temporaries
    124  * @note If this functions finds a free temporary, it will mark it as used
    125  * in the used temporary list (param 'used')
    126  * @param used list of used temporaries
    127  * @param used_length number of items in param 'used'
    128  * @param mask which components must be free in the temporary index that is
    129  * returned.
    130  * @return -1 If there are no more free temporaries, otherwise the index of
    131  * a temporary register where the components specified in param 'mask' are
    132  * not being used.
    133  */
    134 int rc_find_free_temporary_list(
    135 	struct radeon_compiler * c,
    136 	unsigned char * used,
    137 	unsigned int used_length,
    138 	unsigned int mask)
    139 {
    140 	int i;
    141 	for(i = 0; i < used_length; i++) {
    142 		if ((~used[i] & mask) == mask) {
    143 			used[i] |= mask;
    144 			return i;
    145 		}
    146 	}
    147 	return -1;
    148 }
    149 
    150 unsigned int rc_find_free_temporary(struct radeon_compiler * c)
    151 {
    152 	unsigned char used[RC_REGISTER_MAX_INDEX];
    153 	int free;
    154 
    155 	memset(used, 0, sizeof(used));
    156 
    157 	rc_get_used_temporaries(c, used, RC_REGISTER_MAX_INDEX);
    158 
    159 	free = rc_find_free_temporary_list(c, used, RC_REGISTER_MAX_INDEX,
    160 								RC_MASK_XYZW);
    161 	if (free < 0) {
    162 		rc_error(c, "Ran out of temporary registers\n");
    163 		return 0;
    164 	}
    165 	return free;
    166 }
    167 
    168 
    169 struct rc_instruction *rc_alloc_instruction(struct radeon_compiler * c)
    170 {
    171 	struct rc_instruction * inst = memory_pool_malloc(&c->Pool, sizeof(struct rc_instruction));
    172 
    173 	memset(inst, 0, sizeof(struct rc_instruction));
    174 
    175 	inst->U.I.Opcode = RC_OPCODE_ILLEGAL_OPCODE;
    176 	inst->U.I.DstReg.WriteMask = RC_MASK_XYZW;
    177 	inst->U.I.SrcReg[0].Swizzle = RC_SWIZZLE_XYZW;
    178 	inst->U.I.SrcReg[1].Swizzle = RC_SWIZZLE_XYZW;
    179 	inst->U.I.SrcReg[2].Swizzle = RC_SWIZZLE_XYZW;
    180 
    181 	return inst;
    182 }
    183 
    184 void rc_insert_instruction(struct rc_instruction * after, struct rc_instruction * inst)
    185 {
    186 	inst->Prev = after;
    187 	inst->Next = after->Next;
    188 
    189 	inst->Prev->Next = inst;
    190 	inst->Next->Prev = inst;
    191 }
    192 
    193 struct rc_instruction *rc_insert_new_instruction(struct radeon_compiler * c, struct rc_instruction * after)
    194 {
    195 	struct rc_instruction * inst = rc_alloc_instruction(c);
    196 
    197 	rc_insert_instruction(after, inst);
    198 
    199 	return inst;
    200 }
    201 
    202 void rc_remove_instruction(struct rc_instruction * inst)
    203 {
    204 	inst->Prev->Next = inst->Next;
    205 	inst->Next->Prev = inst->Prev;
    206 }
    207 
    208 /**
    209  * Return the number of instructions in the program.
    210  */
    211 unsigned int rc_recompute_ips(struct radeon_compiler * c)
    212 {
    213 	unsigned int ip = 0;
    214 	struct rc_instruction * inst;
    215 
    216 	for(inst = c->Program.Instructions.Next;
    217 	    inst != &c->Program.Instructions;
    218 	    inst = inst->Next) {
    219 		inst->IP = ip++;
    220 	}
    221 
    222 	c->Program.Instructions.IP = 0xcafedead;
    223 
    224 	return ip;
    225 }
    226