mesa/math/m_clip_tmp.h

/*
 * Mesa 3-D graphics library
 *
 * Copyright (C) 1999-2004  Brian Paul   All Rights Reserved.
 *
 * Permission is hereby granted, free of charge, to any person obtaining a
 * copy of this software and associated documentation files (the "Software"),
 * to deal in the Software without restriction, including without limitation
 * the rights to use, copy, modify, merge, publish, distribute, sublicense,
 * and/or sell copies of the Software, and to permit persons to whom the
 * Software is furnished to do so, subject to the following conditions:
 *
 * The above copyright notice and this permission notice shall be included
 * in all copies or substantial portions of the Software.
 *
 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS
 * OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
 * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT.  IN NO EVENT SHALL
 * THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR
 * OTHER LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE,
 * ARISING FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR
 * OTHER DEALINGS IN THE SOFTWARE.
 */

/*
 * New (3.1) transformation code written by Keith Whitwell.
 */


7117f1b4Smrg/* KW: a clever asm implementation would nestle integer versions
7117f1b4Smrg * of the outcode calculation underneath the division.  Gcc won't
7117f1b4Smrg * do this, strangely enough, so I only do the divide in
7117f1b4Smrg * the case where the cliptest passes.  This isn't essential,
7117f1b4Smrg * and an asm implementation needn't replicate that behaviour.
7117f1b4Smrg *
7117f1b4Smrg * \param clip_vec vector of incoming clip-space coords
7117f1b4Smrg * \param proj_vec vector of resultant NDC-space projected coords
7117f1b4Smrg * \param clipMask resulting array of clip flags
7117f1b4Smrg * \param orMask bitwise-OR of clipMask values
7117f1b4Smrg * \param andMask bitwise-AND of clipMask values
7117f1b4Smrg * \return proj_vec pointer
7117f1b4Smrg */
01e04c3fSmrgstatic GLvector4f * TAG(cliptest_points4)( GLvector4f *clip_vec,
7117f1b4Smrg                                                     GLvector4f *proj_vec,
7117f1b4Smrg                                                     GLubyte clipMask[],
7117f1b4Smrg                                                     GLubyte *orMask,
4a49301eSmrg                                                     GLubyte *andMask,
4a49301eSmrg						     GLboolean viewport_z_clip )
7117f1b4Smrg{
7117f1b4Smrg   const GLuint stride = clip_vec->stride;
7117f1b4Smrg   const GLfloat *from = (GLfloat *)clip_vec->start;
7117f1b4Smrg   const GLuint count = clip_vec->count;
7117f1b4Smrg   GLuint c = 0;
7117f1b4Smrg   GLfloat (*vProj)[4] = (GLfloat (*)[4])proj_vec->start;
7117f1b4Smrg   GLubyte tmpAndMask = *andMask;
7117f1b4Smrg   GLubyte tmpOrMask = *orMask;
7117f1b4Smrg   GLuint i;
7117f1b4Smrg   STRIDE_LOOP {
7117f1b4Smrg      const GLfloat cx = from[0];
7117f1b4Smrg      const GLfloat cy = from[1];
7117f1b4Smrg      const GLfloat cz = from[2];
7117f1b4Smrg      const GLfloat cw = from[3];
af69d88dSmrg#if defined(__powerpc__)
7117f1b4Smrg      /* on powerpc cliptest is 17% faster in this way. */
7117f1b4Smrg      GLuint mask;
7117f1b4Smrg      mask = (((cw < cx) << CLIP_RIGHT_SHIFT));
7117f1b4Smrg      mask |= (((cw < -cx) << CLIP_LEFT_SHIFT));
7117f1b4Smrg      mask |= (((cw < cy) << CLIP_TOP_SHIFT));
7117f1b4Smrg      mask |= (((cw < -cy) << CLIP_BOTTOM_SHIFT));
4a49301eSmrg      if (viewport_z_clip) {
4a49301eSmrg	 mask |= (((cw < cz) << CLIP_FAR_SHIFT));
4a49301eSmrg	 mask |= (((cw < -cz) << CLIP_NEAR_SHIFT));
4a49301eSmrg      }
af69d88dSmrg#else
7117f1b4Smrg      GLubyte mask = 0;
7117f1b4Smrg      if (-cx + cw < 0) mask |= CLIP_RIGHT_BIT;
7117f1b4Smrg      if ( cx + cw < 0) mask |= CLIP_LEFT_BIT;
7117f1b4Smrg      if (-cy + cw < 0) mask |= CLIP_TOP_BIT;
7117f1b4Smrg      if ( cy + cw < 0) mask |= CLIP_BOTTOM_BIT;
4a49301eSmrg      if (viewport_z_clip) {
4a49301eSmrg	 if (-cz + cw < 0) mask |= CLIP_FAR_BIT;
4a49301eSmrg	 if ( cz + cw < 0) mask |= CLIP_NEAR_BIT;
4a49301eSmrg      }
af69d88dSmrg#endif
7117f1b4Smrg
7117f1b4Smrg      clipMask[i] = mask;
7117f1b4Smrg      if (mask) {
7117f1b4Smrg	 c++;
7117f1b4Smrg	 tmpAndMask &= mask;
7117f1b4Smrg	 tmpOrMask |= mask;
7117f1b4Smrg	 vProj[i][0] = 0;
7117f1b4Smrg	 vProj[i][1] = 0;
7117f1b4Smrg	 vProj[i][2] = 0;
7117f1b4Smrg	 vProj[i][3] = 1;
7117f1b4Smrg      } else {
7117f1b4Smrg	 GLfloat oow = 1.0F / cw;
7117f1b4Smrg	 vProj[i][0] = cx * oow;
7117f1b4Smrg	 vProj[i][1] = cy * oow;
7117f1b4Smrg	 vProj[i][2] = cz * oow;
7117f1b4Smrg	 vProj[i][3] = oow;
7117f1b4Smrg      }
7117f1b4Smrg   }
7117f1b4Smrg
7117f1b4Smrg   *orMask = tmpOrMask;
7117f1b4Smrg   *andMask = (GLubyte) (c < count ? 0 : tmpAndMask);
7117f1b4Smrg
7117f1b4Smrg   proj_vec->flags |= VEC_SIZE_4;
7117f1b4Smrg   proj_vec->size = 4;
7117f1b4Smrg   proj_vec->count = clip_vec->count;
7117f1b4Smrg   return proj_vec;
7117f1b4Smrg}
7117f1b4Smrg
7117f1b4Smrg
7117f1b4Smrg
7117f1b4Smrg/*
7117f1b4Smrg * \param clip_vec vector of incoming clip-space coords
7117f1b4Smrg * \param proj_vec vector of resultant NDC-space projected coords
7117f1b4Smrg * \param clipMask resulting array of clip flags
7117f1b4Smrg * \param orMask bitwise-OR of clipMask values
7117f1b4Smrg * \param andMask bitwise-AND of clipMask values
7117f1b4Smrg * \return clip_vec pointer
7117f1b4Smrg */
01e04c3fSmrgstatic GLvector4f * TAG(cliptest_np_points4)( GLvector4f *clip_vec,
7117f1b4Smrg							GLvector4f *proj_vec,
7117f1b4Smrg							GLubyte clipMask[],
7117f1b4Smrg							GLubyte *orMask,
4a49301eSmrg							GLubyte *andMask,
4a49301eSmrg							GLboolean viewport_z_clip )
7117f1b4Smrg{
7117f1b4Smrg   const GLuint stride = clip_vec->stride;
7117f1b4Smrg   const GLuint count = clip_vec->count;
7117f1b4Smrg   const GLfloat *from = (GLfloat *)clip_vec->start;
7117f1b4Smrg   GLuint c = 0;
7117f1b4Smrg   GLubyte tmpAndMask = *andMask;
7117f1b4Smrg   GLubyte tmpOrMask = *orMask;
7117f1b4Smrg   GLuint i;
7117f1b4Smrg   (void) proj_vec;
7117f1b4Smrg   STRIDE_LOOP {
7117f1b4Smrg      const GLfloat cx = from[0];
7117f1b4Smrg      const GLfloat cy = from[1];
7117f1b4Smrg      const GLfloat cz = from[2];
7117f1b4Smrg      const GLfloat cw = from[3];
af69d88dSmrg#if defined(__powerpc__)
7117f1b4Smrg      /* on powerpc cliptest is 17% faster in this way. */
7117f1b4Smrg      GLuint mask;
7117f1b4Smrg      mask = (((cw < cx) << CLIP_RIGHT_SHIFT));
7117f1b4Smrg      mask |= (((cw < -cx) << CLIP_LEFT_SHIFT));
7117f1b4Smrg      mask |= (((cw < cy) << CLIP_TOP_SHIFT));
7117f1b4Smrg      mask |= (((cw < -cy) << CLIP_BOTTOM_SHIFT));
4a49301eSmrg      if (viewport_z_clip) {
4a49301eSmrg	 mask |= (((cw < cz) << CLIP_FAR_SHIFT));
4a49301eSmrg	 mask |= (((cw < -cz) << CLIP_NEAR_SHIFT));
4a49301eSmrg      }
af69d88dSmrg#else
7117f1b4Smrg      GLubyte mask = 0;
7117f1b4Smrg      if (-cx + cw < 0) mask |= CLIP_RIGHT_BIT;
7117f1b4Smrg      if ( cx + cw < 0) mask |= CLIP_LEFT_BIT;
7117f1b4Smrg      if (-cy + cw < 0) mask |= CLIP_TOP_BIT;
7117f1b4Smrg      if ( cy + cw < 0) mask |= CLIP_BOTTOM_BIT;
4a49301eSmrg      if (viewport_z_clip) {
4a49301eSmrg	 if (-cz + cw < 0) mask |= CLIP_FAR_BIT;
4a49301eSmrg	 if ( cz + cw < 0) mask |= CLIP_NEAR_BIT;
4a49301eSmrg      }
af69d88dSmrg#endif
7117f1b4Smrg
7117f1b4Smrg      clipMask[i] = mask;
7117f1b4Smrg      if (mask) {
7117f1b4Smrg	 c++;
7117f1b4Smrg	 tmpAndMask &= mask;
7117f1b4Smrg	 tmpOrMask |= mask;
7117f1b4Smrg      }
7117f1b4Smrg   }
7117f1b4Smrg
7117f1b4Smrg   *orMask = tmpOrMask;
7117f1b4Smrg   *andMask = (GLubyte) (c < count ? 0 : tmpAndMask);
7117f1b4Smrg   return clip_vec;
7117f1b4Smrg}
7117f1b4Smrg
7117f1b4Smrg
01e04c3fSmrgstatic GLvector4f * TAG(cliptest_points3)( GLvector4f *clip_vec,
7117f1b4Smrg                                                     GLvector4f *proj_vec,
7117f1b4Smrg                                                     GLubyte clipMask[],
7117f1b4Smrg                                                     GLubyte *orMask,
4a49301eSmrg                                                     GLubyte *andMask,
4a49301eSmrg						     GLboolean viewport_z_clip )
7117f1b4Smrg{
7117f1b4Smrg   const GLuint stride = clip_vec->stride;
7117f1b4Smrg   const GLuint count = clip_vec->count;
7117f1b4Smrg   const GLfloat *from = (GLfloat *)clip_vec->start;
7117f1b4Smrg   GLubyte tmpOrMask = *orMask;
7117f1b4Smrg   GLubyte tmpAndMask = *andMask;
7117f1b4Smrg   GLuint i;
7117f1b4Smrg   (void) proj_vec;
7117f1b4Smrg   STRIDE_LOOP {
7117f1b4Smrg      const GLfloat cx = from[0], cy = from[1], cz = from[2];
7117f1b4Smrg      GLubyte mask = 0;
01e04c3fSmrg      if (cx >  1.0F)       mask |= CLIP_RIGHT_BIT;
01e04c3fSmrg      else if (cx < -1.0F)  mask |= CLIP_LEFT_BIT;
01e04c3fSmrg      if (cy >  1.0F)       mask |= CLIP_TOP_BIT;
01e04c3fSmrg      else if (cy < -1.0F)  mask |= CLIP_BOTTOM_BIT;
4a49301eSmrg      if (viewport_z_clip) {
01e04c3fSmrg	 if (cz >  1.0F)       mask |= CLIP_FAR_BIT;
01e04c3fSmrg	 else if (cz < -1.0F)  mask |= CLIP_NEAR_BIT;
4a49301eSmrg      }
7117f1b4Smrg      clipMask[i] = mask;
7117f1b4Smrg      tmpOrMask |= mask;
7117f1b4Smrg      tmpAndMask &= mask;
7117f1b4Smrg   }
7117f1b4Smrg
7117f1b4Smrg   *orMask = tmpOrMask;
7117f1b4Smrg   *andMask = tmpAndMask;
7117f1b4Smrg   return clip_vec;
7117f1b4Smrg}
7117f1b4Smrg
7117f1b4Smrg
01e04c3fSmrgstatic GLvector4f * TAG(cliptest_points2)( GLvector4f *clip_vec,
7117f1b4Smrg                                                     GLvector4f *proj_vec,
7117f1b4Smrg                                                     GLubyte clipMask[],
7117f1b4Smrg                                                     GLubyte *orMask,
4a49301eSmrg                                                     GLubyte *andMask,
4a49301eSmrg						     GLboolean viewport_z_clip )
7117f1b4Smrg{
7117f1b4Smrg   const GLuint stride = clip_vec->stride;
7117f1b4Smrg   const GLuint count = clip_vec->count;
7117f1b4Smrg   const GLfloat *from = (GLfloat *)clip_vec->start;
7117f1b4Smrg   GLubyte tmpOrMask = *orMask;
7117f1b4Smrg   GLubyte tmpAndMask = *andMask;
7117f1b4Smrg   GLuint i;
7117f1b4Smrg   (void) proj_vec;
7117f1b4Smrg   STRIDE_LOOP {
7117f1b4Smrg      const GLfloat cx = from[0], cy = from[1];
7117f1b4Smrg      GLubyte mask = 0;
01e04c3fSmrg      if (cx >  1.0F)       mask |= CLIP_RIGHT_BIT;
01e04c3fSmrg      else if (cx < -1.0F)  mask |= CLIP_LEFT_BIT;
01e04c3fSmrg      if (cy >  1.0F)       mask |= CLIP_TOP_BIT;
01e04c3fSmrg      else if (cy < -1.0F)  mask |= CLIP_BOTTOM_BIT;
7117f1b4Smrg      clipMask[i] = mask;
7117f1b4Smrg      tmpOrMask |= mask;
7117f1b4Smrg      tmpAndMask &= mask;
7117f1b4Smrg   }
7117f1b4Smrg
7117f1b4Smrg   *orMask = tmpOrMask;
7117f1b4Smrg   *andMask = tmpAndMask;
7117f1b4Smrg   return clip_vec;
7117f1b4Smrg}
7117f1b4Smrg
7117f1b4Smrg
4a49301eSmrgvoid TAG(init_c_cliptest)( void )
7117f1b4Smrg{
7117f1b4Smrg   _mesa_clip_tab[4] = TAG(cliptest_points4);
7117f1b4Smrg   _mesa_clip_tab[3] = TAG(cliptest_points3);
7117f1b4Smrg   _mesa_clip_tab[2] = TAG(cliptest_points2);
7117f1b4Smrg
7117f1b4Smrg   _mesa_clip_np_tab[4] = TAG(cliptest_np_points4);
7117f1b4Smrg   _mesa_clip_np_tab[3] = TAG(cliptest_points3);
7117f1b4Smrg   _mesa_clip_np_tab[2] = TAG(cliptest_points2);
7117f1b4Smrg}