| |
| # |
| # (C) 2008-2009 Advanced Micro Devices, Inc. All Rights Reserved. |
| # |
| # This file is part of libacml_mv. |
| # |
| # libacml_mv is free software; you can redistribute it and/or |
| # modify it under the terms of the GNU Lesser General Public |
| # License as published by the Free Software Foundation; either |
| # version 2.1 of the License, or (at your option) any later version. |
| # |
| # libacml_mv is distributed in the hope that it will be useful, |
| # but WITHOUT ANY WARRANTY; without even the implied warranty of |
| # MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU |
| # Lesser General Public License for more details. |
| # |
| # You should have received a copy of the GNU Lesser General Public |
| # License along with libacml_mv. If not, see |
| # <http://www.gnu.org/licenses/>. |
| # |
| # |
| |
| |
| |
| |
| |
| # v4hlog10l.s |
| # |
| # Helper routines for testing the x4 double and x8 single vector |
| # math functions. |
| # |
| # Prototype: |
| # |
| # void v4log10(__m128d x1, __m128d x2, double * ya); |
| # |
| # Computes 4 log10 values simultaneously and stores them |
| # in the ya array. |
| # Assumes that ya is 16 byte aligned. |
| # |
| # |
| |
| #ifdef __ELF__ |
| .section .note.GNU-stack,"",@progbits |
| #endif |
| |
#-----------------------------------------------------------------------
# void v4log10(__m128d x1, __m128d x2, double *ya)
#
# Test shim around __vrd4_log10: passes the two packed-double inputs
# through unchanged, then stores the contents of xmm0 and xmm1 left by
# the callee into ya[0..1] and ya[2..3].
#
# ABI:   register usage matches System V AMD64 (xmm0/xmm1/rdi)
# In:    xmm0 = x1
#        xmm1 = x2
#        rdi  = ya, must be 16-byte aligned (aligned stores are used)
# Out:   32 bytes written at ya
# Stack: one 8-byte push; with the return address already on the stack
#        this leaves rsp 16-byte aligned at the call site.
#-----------------------------------------------------------------------
        .extern __vrd4_log10
        .text
        .p2align 4
        .globl  v4log10
        .type   v4log10,@function
v4log10:
        push    %rdi                    # rdi is caller-saved: keep ya across the call
        call    __vrd4_log10@PLT
        pop     %rdi                    # rdi = ya again
        movapd  %xmm0,(%rdi)            # ya[0..1] = xmm0
        movapd  %xmm1,16(%rdi)          # ya[2..3] = xmm1
        ret
        .size   v4log10,.-v4log10
| |
#-----------------------------------------------------------------------
# void v8log10f(__m128 x1, __m128 x2, float *ya)
#
# Test shim around __vrs8_log10f: passes the two packed-single inputs
# through unchanged, then stores the contents of xmm0 and xmm1 left by
# the callee into ya[0..3] and ya[4..7].
#
# ABI:   register usage matches System V AMD64 (xmm0/xmm1/rdi)
# In:    xmm0 = x1
#        xmm1 = x2
#        rdi  = ya, must be 16-byte aligned (aligned stores are used)
# Out:   32 bytes written at ya
# Stack: one 8-byte push; with the return address already on the stack
#        this leaves rsp 16-byte aligned at the call site.
#-----------------------------------------------------------------------
        .extern __vrs8_log10f
        .text
        .p2align 4
        .globl  v8log10f
        .type   v8log10f,@function
v8log10f:
        push    %rdi                    # rdi is caller-saved: keep ya across the call
        call    __vrs8_log10f@PLT
        pop     %rdi                    # rdi = ya again
        movaps  %xmm0,(%rdi)            # ya[0..3] = xmm0
        movaps  %xmm1,16(%rdi)          # ya[4..7] = xmm1
        ret
        .size   v8log10f,.-v8log10f