1 /* 2 * Mesa 3-D graphics library 3 * 4 * Copyright (C) 1999-2004 Brian Paul All Rights Reserved. 5 * 6 * Permission is hereby granted, free of charge, to any person obtaining a 7 * copy of this software and associated documentation files (the "Software"), 8 * to deal in the Software without restriction, including without limitation 9 * the rights to use, copy, modify, merge, publish, distribute, sublicense, 10 * and/or sell copies of the Software, and to permit persons to whom the 11 * Software is furnished to do so, subject to the following conditions: 12 * 13 * The above copyright notice and this permission notice shall be included 14 * in all copies or substantial portions of the Software. 15 * 16 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS 17 * OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY, 18 * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL 19 * THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR 20 * OTHER LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, 21 * ARISING FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR 22 * OTHER DEALINGS IN THE SOFTWARE. 23 */ 24 25 /* 26 * New (3.1) transformation code written by Keith Whitwell. 27 */ 28 29 30 /* KW: a clever asm implementation would nestle integer versions 31 * of the outcode calculation underneath the division. Gcc won't 32 * do this, strangely enough, so I only do the divide in 33 * the case where the cliptest passes. This isn't essential, 34 * and an asm implementation needn't replicate that behaviour. 35 * 36 * \param clip_vec vector of incoming clip-space coords 37 * \param proj_vec vector of resultant NDC-space projected coords 38 * \param clipMask resulting array of clip flags 39 * \param orMask bitwise-OR of clipMask values 40 * \param andMask bitwise-AND of clipMask values 41 * \return proj_vec pointer 42 */ 43 static GLvector4f * TAG(cliptest_points4)( GLvector4f *clip_vec, 44 GLvector4f *proj_vec, 45 GLubyte clipMask[], 46 GLubyte *orMask, 47 GLubyte *andMask, 48 GLboolean viewport_z_clip ) 49 { 50 const GLuint stride = clip_vec->stride; 51 const GLfloat *from = (GLfloat *)clip_vec->start; 52 const GLuint count = clip_vec->count; 53 GLuint c = 0; 54 GLfloat (*vProj)[4] = (GLfloat (*)[4])proj_vec->start; 55 GLubyte tmpAndMask = *andMask; 56 GLubyte tmpOrMask = *orMask; 57 GLuint i; 58 STRIDE_LOOP { 59 const GLfloat cx = from[0]; 60 const GLfloat cy = from[1]; 61 const GLfloat cz = from[2]; 62 const GLfloat cw = from[3]; 63 #if defined(__powerpc__) 64 /* on powerpc cliptest is 17% faster in this way. */ 65 GLuint mask; 66 mask = (((cw < cx) << CLIP_RIGHT_SHIFT)); 67 mask |= (((cw < -cx) << CLIP_LEFT_SHIFT)); 68 mask |= (((cw < cy) << CLIP_TOP_SHIFT)); 69 mask |= (((cw < -cy) << CLIP_BOTTOM_SHIFT)); 70 if (viewport_z_clip) { 71 mask |= (((cw < cz) << CLIP_FAR_SHIFT)); 72 mask |= (((cw < -cz) << CLIP_NEAR_SHIFT)); 73 } 74 #else 75 GLubyte mask = 0; 76 if (-cx + cw < 0) mask |= CLIP_RIGHT_BIT; 77 if ( cx + cw < 0) mask |= CLIP_LEFT_BIT; 78 if (-cy + cw < 0) mask |= CLIP_TOP_BIT; 79 if ( cy + cw < 0) mask |= CLIP_BOTTOM_BIT; 80 if (viewport_z_clip) { 81 if (-cz + cw < 0) mask |= CLIP_FAR_BIT; 82 if ( cz + cw < 0) mask |= CLIP_NEAR_BIT; 83 } 84 #endif 85 86 clipMask[i] = mask; 87 if (mask) { 88 c++; 89 tmpAndMask &= mask; 90 tmpOrMask |= mask; 91 vProj[i][0] = 0; 92 vProj[i][1] = 0; 93 vProj[i][2] = 0; 94 vProj[i][3] = 1; 95 } else { 96 GLfloat oow = 1.0F / cw; 97 vProj[i][0] = cx * oow; 98 vProj[i][1] = cy * oow; 99 vProj[i][2] = cz * oow; 100 vProj[i][3] = oow; 101 } 102 } 103 104 *orMask = tmpOrMask; 105 *andMask = (GLubyte) (c < count ? 0 : tmpAndMask); 106 107 proj_vec->flags |= VEC_SIZE_4; 108 proj_vec->size = 4; 109 proj_vec->count = clip_vec->count; 110 return proj_vec; 111 } 112 113 114 115 /* 116 * \param clip_vec vector of incoming clip-space coords 117 * \param proj_vec vector of resultant NDC-space projected coords 118 * \param clipMask resulting array of clip flags 119 * \param orMask bitwise-OR of clipMask values 120 * \param andMask bitwise-AND of clipMask values 121 * \return clip_vec pointer 122 */ 123 static GLvector4f * TAG(cliptest_np_points4)( GLvector4f *clip_vec, 124 GLvector4f *proj_vec, 125 GLubyte clipMask[], 126 GLubyte *orMask, 127 GLubyte *andMask, 128 GLboolean viewport_z_clip ) 129 { 130 const GLuint stride = clip_vec->stride; 131 const GLuint count = clip_vec->count; 132 const GLfloat *from = (GLfloat *)clip_vec->start; 133 GLuint c = 0; 134 GLubyte tmpAndMask = *andMask; 135 GLubyte tmpOrMask = *orMask; 136 GLuint i; 137 (void) proj_vec; 138 STRIDE_LOOP { 139 const GLfloat cx = from[0]; 140 const GLfloat cy = from[1]; 141 const GLfloat cz = from[2]; 142 const GLfloat cw = from[3]; 143 #if defined(__powerpc__) 144 /* on powerpc cliptest is 17% faster in this way. */ 145 GLuint mask; 146 mask = (((cw < cx) << CLIP_RIGHT_SHIFT)); 147 mask |= (((cw < -cx) << CLIP_LEFT_SHIFT)); 148 mask |= (((cw < cy) << CLIP_TOP_SHIFT)); 149 mask |= (((cw < -cy) << CLIP_BOTTOM_SHIFT)); 150 if (viewport_z_clip) { 151 mask |= (((cw < cz) << CLIP_FAR_SHIFT)); 152 mask |= (((cw < -cz) << CLIP_NEAR_SHIFT)); 153 } 154 #else 155 GLubyte mask = 0; 156 if (-cx + cw < 0) mask |= CLIP_RIGHT_BIT; 157 if ( cx + cw < 0) mask |= CLIP_LEFT_BIT; 158 if (-cy + cw < 0) mask |= CLIP_TOP_BIT; 159 if ( cy + cw < 0) mask |= CLIP_BOTTOM_BIT; 160 if (viewport_z_clip) { 161 if (-cz + cw < 0) mask |= CLIP_FAR_BIT; 162 if ( cz + cw < 0) mask |= CLIP_NEAR_BIT; 163 } 164 #endif 165 166 clipMask[i] = mask; 167 if (mask) { 168 c++; 169 tmpAndMask &= mask; 170 tmpOrMask |= mask; 171 } 172 } 173 174 *orMask = tmpOrMask; 175 *andMask = (GLubyte) (c < count ? 0 : tmpAndMask); 176 return clip_vec; 177 } 178 179 180 static GLvector4f * TAG(cliptest_points3)( GLvector4f *clip_vec, 181 GLvector4f *proj_vec, 182 GLubyte clipMask[], 183 GLubyte *orMask, 184 GLubyte *andMask, 185 GLboolean viewport_z_clip ) 186 { 187 const GLuint stride = clip_vec->stride; 188 const GLuint count = clip_vec->count; 189 const GLfloat *from = (GLfloat *)clip_vec->start; 190 GLubyte tmpOrMask = *orMask; 191 GLubyte tmpAndMask = *andMask; 192 GLuint i; 193 (void) proj_vec; 194 STRIDE_LOOP { 195 const GLfloat cx = from[0], cy = from[1], cz = from[2]; 196 GLubyte mask = 0; 197 if (cx > 1.0F) mask |= CLIP_RIGHT_BIT; 198 else if (cx < -1.0F) mask |= CLIP_LEFT_BIT; 199 if (cy > 1.0F) mask |= CLIP_TOP_BIT; 200 else if (cy < -1.0F) mask |= CLIP_BOTTOM_BIT; 201 if (viewport_z_clip) { 202 if (cz > 1.0F) mask |= CLIP_FAR_BIT; 203 else if (cz < -1.0F) mask |= CLIP_NEAR_BIT; 204 } 205 clipMask[i] = mask; 206 tmpOrMask |= mask; 207 tmpAndMask &= mask; 208 } 209 210 *orMask = tmpOrMask; 211 *andMask = tmpAndMask; 212 return clip_vec; 213 } 214 215 216 static GLvector4f * TAG(cliptest_points2)( GLvector4f *clip_vec, 217 GLvector4f *proj_vec, 218 GLubyte clipMask[], 219 GLubyte *orMask, 220 GLubyte *andMask, 221 GLboolean viewport_z_clip ) 222 { 223 const GLuint stride = clip_vec->stride; 224 const GLuint count = clip_vec->count; 225 const GLfloat *from = (GLfloat *)clip_vec->start; 226 GLubyte tmpOrMask = *orMask; 227 GLubyte tmpAndMask = *andMask; 228 GLuint i; 229 (void) proj_vec; 230 STRIDE_LOOP { 231 const GLfloat cx = from[0], cy = from[1]; 232 GLubyte mask = 0; 233 if (cx > 1.0F) mask |= CLIP_RIGHT_BIT; 234 else if (cx < -1.0F) mask |= CLIP_LEFT_BIT; 235 if (cy > 1.0F) mask |= CLIP_TOP_BIT; 236 else if (cy < -1.0F) mask |= CLIP_BOTTOM_BIT; 237 clipMask[i] = mask; 238 tmpOrMask |= mask; 239 tmpAndMask &= mask; 240 } 241 242 *orMask = tmpOrMask; 243 *andMask = tmpAndMask; 244 return clip_vec; 245 } 246 247 248 void TAG(init_c_cliptest)( void ) 249 { 250 _mesa_clip_tab[4] = TAG(cliptest_points4); 251 _mesa_clip_tab[3] = TAG(cliptest_points3); 252 _mesa_clip_tab[2] = TAG(cliptest_points2); 253 254 _mesa_clip_np_tab[4] = TAG(cliptest_np_points4); 255 _mesa_clip_np_tab[3] = TAG(cliptest_points3); 256 _mesa_clip_np_tab[2] = TAG(cliptest_points2); 257 } 258