1 /* 2 * Copyright 2009 Nicolai Hhnle <nhaehnle (at) gmail.com> 3 * 4 * Permission is hereby granted, free of charge, to any person obtaining a 5 * copy of this software and associated documentation files (the "Software"), 6 * to deal in the Software without restriction, including without limitation 7 * on the rights to use, copy, modify, merge, publish, distribute, sub 8 * license, and/or sell copies of the Software, and to permit persons to whom 9 * the Software is furnished to do so, subject to the following conditions: 10 * 11 * The above copyright notice and this permission notice (including the next 12 * paragraph) shall be included in all copies or substantial portions of the 13 * Software. 14 * 15 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR 16 * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY, 17 * FITNESS FOR A PARTICULAR PURPOSE AND NON-INFRINGEMENT. IN NO EVENT SHALL 18 * THE AUTHOR(S) AND/OR THEIR SUPPLIERS BE LIABLE FOR ANY CLAIM, 19 * DAMAGES OR OTHER LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR 20 * OTHERWISE, ARISING FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE 21 * USE OR OTHER DEALINGS IN THE SOFTWARE. */ 22 23 #include "radeon_compiler.h" 24 #include "radeon_code.h" 25 #include "../r300_reg.h" 26 27 #include <stdio.h> 28 29 static char* r300_vs_ve_ops[] = { 30 /* R300 vector ops */ 31 " VE_NO_OP", 32 " VE_DOT_PRODUCT", 33 " VE_MULTIPLY", 34 " VE_ADD", 35 " VE_MULTIPLY_ADD", 36 " VE_DISTANCE_FACTOR", 37 " VE_FRACTION", 38 " VE_MAXIMUM", 39 " VE_MINIMUM", 40 "VE_SET_GREATER_THAN_EQUAL", 41 " VE_SET_LESS_THAN", 42 " VE_MULTIPLYX2_ADD", 43 " VE_MULTIPLY_CLAMP", 44 " VE_FLT2FIX_DX", 45 " VE_FLT2FIX_DX_RND", 46 /* R500 vector ops */ 47 " VE_PRED_SET_EQ_PUSH", 48 " VE_PRED_SET_GT_PUSH", 49 " VE_PRED_SET_GTE_PUSH", 50 " VE_PRED_SET_NEQ_PUSH", 51 " VE_COND_WRITE_EQ", 52 " VE_COND_WRITE_GT", 53 " VE_COND_WRITE_GTE", 54 " VE_COND_WRITE_NEQ", 55 " VE_COND_MUX_EQ", 56 " VE_COND_MUX_GT", 57 " VE_COND_MUX_GTE", 58 " VE_SET_GREATER_THAN", 59 " VE_SET_EQUAL", 60 " VE_SET_NOT_EQUAL", 61 " (reserved)", 62 " (reserved)", 63 " (reserved)", 64 }; 65 66 static char* r300_vs_me_ops[] = { 67 /* R300 math ops */ 68 " ME_NO_OP", 69 " ME_EXP_BASE2_DX", 70 " ME_LOG_BASE2_DX", 71 " ME_EXP_BASEE_FF", 72 " ME_LIGHT_COEFF_DX", 73 " ME_POWER_FUNC_FF", 74 " ME_RECIP_DX", 75 " ME_RECIP_FF", 76 " ME_RECIP_SQRT_DX", 77 " ME_RECIP_SQRT_FF", 78 " ME_MULTIPLY", 79 " ME_EXP_BASE2_FULL_DX", 80 " ME_LOG_BASE2_FULL_DX", 81 " ME_POWER_FUNC_FF_CLAMP_B", 82 "ME_POWER_FUNC_FF_CLAMP_B1", 83 "ME_POWER_FUNC_FF_CLAMP_01", 84 " ME_SIN", 85 " ME_COS", 86 /* R500 math ops */ 87 " ME_LOG_BASE2_IEEE", 88 " ME_RECIP_IEEE", 89 " ME_RECIP_SQRT_IEEE", 90 " ME_PRED_SET_EQ", 91 " ME_PRED_SET_GT", 92 " ME_PRED_SET_GTE", 93 " ME_PRED_SET_NEQ", 94 " ME_PRED_SET_CLR", 95 " ME_PRED_SET_INV", 96 " ME_PRED_SET_POP", 97 " ME_PRED_SET_RESTORE", 98 " (reserved)", 99 " (reserved)", 100 " (reserved)", 101 }; 102 103 /* XXX refactor to avoid clashing symbols */ 104 static char* r300_vs_src_debug[] = { 105 "t", 106 "i", 107 "c", 108 "a", 109 }; 110 111 static char* r300_vs_dst_debug[] = { 112 "t", 113 "a0", 114 "o", 115 "ox", 116 "a", 117 "i", 118 "u", 119 "u", 120 }; 121 122 static char* r300_vs_swiz_debug[] = { 123 "X", 124 "Y", 125 "Z", 126 "W", 127 "0", 128 "1", 129 "U", 130 "U", 131 }; 132 133 134 static void r300_vs_op_dump(uint32_t op) 135 { 136 fprintf(stderr, " dst: %d%s op: ", 137 (op >> 13) & 0x7f, r300_vs_dst_debug[(op >> 8) & 0x7]); 138 if ((op >> PVS_DST_PRED_ENABLE_SHIFT) & 0x1) { 139 fprintf(stderr, "PRED %u", 140 (op >> PVS_DST_PRED_SENSE_SHIFT) & 0x1); 141 } 142 if (op & 0x80) { 143 if (op & 0x1) { 144 fprintf(stderr, "PVS_MACRO_OP_2CLK_M2X_ADD\n"); 145 } else { 146 fprintf(stderr, " PVS_MACRO_OP_2CLK_MADD\n"); 147 } 148 } else if (op & 0x40) { 149 fprintf(stderr, "%s\n", r300_vs_me_ops[op & 0x1f]); 150 } else { 151 fprintf(stderr, "%s\n", r300_vs_ve_ops[op & 0x1f]); 152 } 153 } 154 155 static void r300_vs_src_dump(uint32_t src) 156 { 157 fprintf(stderr, " reg: %d%s swiz: %s%s/%s%s/%s%s/%s%s\n", 158 (src >> 5) & 0xff, r300_vs_src_debug[src & 0x3], 159 src & (1 << 25) ? "-" : " ", 160 r300_vs_swiz_debug[(src >> 13) & 0x7], 161 src & (1 << 26) ? "-" : " ", 162 r300_vs_swiz_debug[(src >> 16) & 0x7], 163 src & (1 << 27) ? "-" : " ", 164 r300_vs_swiz_debug[(src >> 19) & 0x7], 165 src & (1 << 28) ? "-" : " ", 166 r300_vs_swiz_debug[(src >> 22) & 0x7]); 167 } 168 169 void r300_vertex_program_dump(struct radeon_compiler *compiler, void *user) 170 { 171 struct r300_vertex_program_compiler *c = (struct r300_vertex_program_compiler*)compiler; 172 struct r300_vertex_program_code * vs = c->code; 173 unsigned instrcount = vs->length / 4; 174 unsigned i; 175 176 fprintf(stderr, "Final vertex program code:\n"); 177 178 for(i = 0; i < instrcount; i++) { 179 unsigned offset = i*4; 180 unsigned src; 181 182 fprintf(stderr, "%d: op: 0x%08x", i, vs->body.d[offset]); 183 r300_vs_op_dump(vs->body.d[offset]); 184 185 for(src = 0; src < 3; ++src) { 186 fprintf(stderr, " src%i: 0x%08x", src, vs->body.d[offset+1+src]); 187 r300_vs_src_dump(vs->body.d[offset+1+src]); 188 } 189 } 190 191 fprintf(stderr, "Flow Control Ops: 0x%08x\n",vs->fc_ops); 192 for(i = 0; i < vs->num_fc_ops; i++) { 193 unsigned is_loop = 0; 194 switch((vs->fc_ops >> (i * 2)) & 0x3 ) { 195 case 0: fprintf(stderr, "NOP"); break; 196 case 1: fprintf(stderr, "JUMP"); break; 197 case 2: fprintf(stderr, "LOOP"); is_loop = 1; break; 198 case 3: fprintf(stderr, "JSR"); break; 199 } 200 if (c->Base.is_r500) { 201 fprintf(stderr,": uw-> 0x%08x lw-> 0x%08x " 202 "loop data->0x%08x\n", 203 vs->fc_op_addrs.r500[i].uw, 204 vs->fc_op_addrs.r500[i].lw, 205 vs->fc_loop_index[i]); 206 if (is_loop) { 207 fprintf(stderr, "Before = %u First = %u Last = %u\n", 208 vs->fc_op_addrs.r500[i].lw & 0xffff, 209 (vs->fc_op_addrs.r500[i].uw >> 16) & 0xffff, 210 vs->fc_op_addrs.r500[i].uw & 0xffff); 211 } 212 } else { 213 fprintf(stderr,": 0x%08x\n", vs->fc_op_addrs.r300[i]); 214 } 215 } 216 } 217