/*
 * Copyright © 2006 Intel Corporation
 *
 * Permission is hereby granted, free of charge, to any person obtaining a
 * copy of this software and associated documentation files (the "Software"),
 * to deal in the Software without restriction, including without limitation
 * the rights to use, copy, modify, merge, publish, distribute, sublicense,
 * and/or sell copies of the Software, and to permit persons to whom the
 * Software is furnished to do so, subject to the following conditions:
 *
 * The above copyright notice and this permission notice (including the next
 * paragraph) shall be included in all copies or substantial portions of the
 * Software.
 *
 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
 * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
 * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT.  IN NO EVENT SHALL
 * THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
 * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING
 * FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS
 * IN THE SOFTWARE.
 *
 * Authors:
 *    Wang Zhenyu <zhenyu.z.wang@intel.com>
 *    Keith Packard <keithp@keithp.com>
 */

/*
 * Straight-line fragment: three sections, each evaluating
 *
 *     temp_x = dst_x * d?_dx + dst_y * d?_dy + ?o        (? = w, u, v)
 *
 * with 16-wide compressed ("compr") instructions.
 *
 *   w : temp_x is handed to the math unit ("math inv") and the reply is
 *       written to w_0 / w_1.
 *   u : temp_x is multiplied by w and stored in u.
 *   v : temp_x is multiplied by w and stored in v.
 *
 * Reads:    dst_x, dst_y, dw_dx, dw_dy, wo, du_dx, du_dy, uo, dv_dx, dv_dy, vo
 * Writes:   w_0, w_1, u, v
 * Scratch:  temp_x, temp_y (overwritten in every section)
 *
 * None of these names is declared in this fragment; they must be provided
 * by whatever file includes it.
 * NOTE(review): presumably w_0/w_1 and temp_x_0/temp_x_1 alias the lower and
 * upper 8 channels of w and temp_x -- confirm against the declarations.
 * NOTE(review): presumably this maps destination coordinates to projective
 * source texture coordinates (u/w, v/w) -- confirm against the caller.
 */

/********** Compute w *************/

/* temp_x = dst_x * dw_dx + dst_y * dw_dy + wo */
mul (16)	temp_x<1>F	dst_x<8,8,1>F	dw_dx		{ compr align1 };
mul (16)	temp_y<1>F	dst_y<8,8,1>F	dw_dy		{ compr align1 };
add (16)	temp_x<1>F	temp_x<8,8,1>F	temp_y<8,8,1>F	{ compr align1 };
add (16)	temp_x<1>F	temp_x<8,8,1>F	wo		{ compr align1 };

/*
 * The math "inv" request is issued as two 8-wide sends, one per half of
 * temp_x; the second carries "sechalf".  Each send is a one-register
 * message (mlen 1) with a one-register reply (rlen 1).
 */
send (8)	0	w_0<1>F	temp_x_0<8,8,1>F	math inv mlen 1 rlen 1	{ align1 };
send (8)	0	w_1<1>F	temp_x_1<8,8,1>F	math inv mlen 1 rlen 1	{ sechalf align1 };

/********** Compute u *************/

/* temp_x = dst_x * du_dx + dst_y * du_dy + uo */
mul (16)	temp_x<1>F	dst_x<8,8,1>F	du_dx		{ compr align1 };
mul (16)	temp_y<1>F	dst_y<8,8,1>F	du_dy		{ compr align1 };
add (16)	temp_x<1>F	temp_x<8,8,1>F	temp_y<8,8,1>F	{ compr align1 };
add (16)	temp_x<1>F	temp_x<8,8,1>F	uo		{ compr align1 };
/* u = temp_x * w, where w is the math-unit result computed above */
mul (16)	u<1>F		temp_x<8,8,1>F	w<8,8,1>F	{ compr align1 };

/********** Compute v *************/

/* temp_x = dst_x * dv_dx + dst_y * dv_dy + vo */
mul (16)	temp_x<1>F	dst_x<8,8,1>F	dv_dx		{ compr align1 };
mul (16)	temp_y<1>F	dst_y<8,8,1>F	dv_dy		{ compr align1 };
add (16)	temp_x<1>F	temp_x<8,8,1>F	temp_y<8,8,1>F	{ compr align1 };
add (16)	temp_x<1>F	temp_x<8,8,1>F	vo		{ compr align1 };
/* v = temp_x * w, reusing the same w as the u section */
mul (16)	v<1>F		temp_x<8,8,1>F	w<8,8,1>F	{ compr align1 };