1848b8605Smrg 2848b8605Smrg/* 3848b8605Smrg * Mesa 3-D graphics library 4848b8605Smrg * 5848b8605Smrg * Copyright (C) 1999-2003 Brian Paul All Rights Reserved. 6848b8605Smrg * 7848b8605Smrg * Permission is hereby granted, free of charge, to any person obtaining a 8848b8605Smrg * copy of this software and associated documentation files (the "Software"), 9848b8605Smrg * to deal in the Software without restriction, including without limitation 10848b8605Smrg * the rights to use, copy, modify, merge, publish, distribute, sublicense, 11848b8605Smrg * and/or sell copies of the Software, and to permit persons to whom the 12848b8605Smrg * Software is furnished to do so, subject to the following conditions: 13848b8605Smrg * 14848b8605Smrg * The above copyright notice and this permission notice shall be included 15848b8605Smrg * in all copies or substantial portions of the Software. 16848b8605Smrg * 17848b8605Smrg * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS 18848b8605Smrg * OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY, 19848b8605Smrg * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL 20848b8605Smrg * THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR 21848b8605Smrg * OTHER LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, 22848b8605Smrg * ARISING FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR 23848b8605Smrg * OTHER DEALINGS IN THE SOFTWARE. 24848b8605Smrg */ 25848b8605Smrg 26848b8605Smrg/* 27848b8605Smrg * x86-64 optimizations shamelessy converted from x86/sse/3dnow assembly by 28848b8605Smrg * Mikko Tiihonen 29848b8605Smrg */ 30848b8605Smrg 31848b8605Smrg#ifdef USE_X86_64_ASM 32848b8605Smrg 33848b8605Smrg#include "main/glheader.h" 34848b8605Smrg#include "main/context.h" 35848b8605Smrg#include "math/m_xform.h" 36848b8605Smrg#include "tnl/t_context.h" 37848b8605Smrg#include "x86-64.h" 38848b8605Smrg#include "../x86/x86_xform.h" 39848b8605Smrg 40848b8605Smrg#ifdef DEBUG 41848b8605Smrg#include "math/m_debug.h" 42848b8605Smrg#endif 43848b8605Smrg 44848b8605Smrgextern void _mesa_x86_64_cpuid(unsigned int *regs); 45848b8605Smrg 46848b8605SmrgDECLARE_XFORM_GROUP( x86_64, 4 ) 47848b8605SmrgDECLARE_XFORM_GROUP( 3dnow, 4 ) 48848b8605Smrg 49848b8605Smrg#else 50848b8605Smrg/* just to silence warning below */ 51848b8605Smrg#include "x86-64.h" 52848b8605Smrg#endif 53848b8605Smrg 54848b8605Smrg/* 55848b8605Smrgextern void _mesa_x86_64_transform_points4_general( XFORM_ARGS ); 56848b8605Smrgextern void _mesa_x86_64_transform_points4_identity( XFORM_ARGS ); 57848b8605Smrgextern void _mesa_x86_64_transform_points4_perspective( XFORM_ARGS ); 58848b8605Smrgextern void _mesa_x86_64_transform_points4_3d( XFORM_ARGS ); 59848b8605Smrgextern void _mesa_x86_64_transform_points4_3d_no_rot( XFORM_ARGS ); 60848b8605Smrgextern void _mesa_x86_64_transform_points4_2d_no_rot( XFORM_ARGS ); 61848b8605Smrgextern void _mesa_x86_64_transform_points4_2d( XFORM_ARGS ); 62848b8605Smrg*/ 63848b8605Smrg 64848b8605Smrg#ifdef USE_X86_64_ASM 65848b8605Smrgstatic void message( const char *msg ) 66848b8605Smrg{ 67b8e80941Smrg if (getenv("MESA_DEBUG")) { 68848b8605Smrg _mesa_debug( NULL, "%s", msg ); 69848b8605Smrg } 70848b8605Smrg} 71848b8605Smrg#endif 72848b8605Smrg 73848b8605Smrg 74848b8605Smrgvoid _mesa_init_all_x86_64_transform_asm(void) 75848b8605Smrg{ 76848b8605Smrg#ifdef USE_X86_64_ASM 77848b8605Smrg unsigned int regs[4]; 78848b8605Smrg 79b8e80941Smrg if ( getenv( "MESA_NO_ASM" ) ) { 80848b8605Smrg return; 81848b8605Smrg } 82848b8605Smrg 83848b8605Smrg message("Initializing x86-64 optimizations\n"); 84848b8605Smrg 85848b8605Smrg 86848b8605Smrg _mesa_transform_tab[4][MATRIX_GENERAL] = 87848b8605Smrg _mesa_x86_64_transform_points4_general; 88848b8605Smrg _mesa_transform_tab[4][MATRIX_IDENTITY] = 89848b8605Smrg _mesa_x86_64_transform_points4_identity; 90848b8605Smrg _mesa_transform_tab[4][MATRIX_3D] = 91848b8605Smrg _mesa_x86_64_transform_points4_3d; 92848b8605Smrg 93848b8605Smrg regs[0] = 0x80000001; 94848b8605Smrg regs[1] = 0x00000000; 95848b8605Smrg regs[2] = 0x00000000; 96848b8605Smrg regs[3] = 0x00000000; 97848b8605Smrg _mesa_x86_64_cpuid(regs); 98848b8605Smrg if (regs[3] & (1U << 31)) { 99848b8605Smrg message("3Dnow! detected\n"); 100848b8605Smrg _mesa_transform_tab[4][MATRIX_3D_NO_ROT] = 101848b8605Smrg _mesa_3dnow_transform_points4_3d_no_rot; 102848b8605Smrg _mesa_transform_tab[4][MATRIX_PERSPECTIVE] = 103848b8605Smrg _mesa_3dnow_transform_points4_perspective; 104848b8605Smrg _mesa_transform_tab[4][MATRIX_2D_NO_ROT] = 105848b8605Smrg _mesa_3dnow_transform_points4_2d_no_rot; 106848b8605Smrg _mesa_transform_tab[4][MATRIX_2D] = 107848b8605Smrg _mesa_3dnow_transform_points4_2d; 108848b8605Smrg 109848b8605Smrg } 110848b8605Smrg 111848b8605Smrg 112848b8605Smrg#ifdef DEBUG_MATH 113848b8605Smrg _math_test_all_transform_functions("x86_64"); 114848b8605Smrg _math_test_all_cliptest_functions("x86_64"); 115848b8605Smrg _math_test_all_normal_transform_functions("x86_64"); 116848b8605Smrg#endif 117848b8605Smrg 118848b8605Smrg#endif 119848b8605Smrg} 120