/* 
 * Copyright (c) 2016-2018, NVIDIA CORPORATION.  All rights reserved.
 *
 * Licensed under the Apache License, Version 2.0 (the "License");
 * you may not use this file except in compliance with the License.
 * You may obtain a copy of the License at
 *
 *     http://www.apache.org/licenses/LICENSE-2.0
 *
 * Unless required by applicable law or agreed to in writing, software
 * distributed under the License is distributed on an "AS IS" BASIS,
 * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
 * See the License for the specific language governing permissions and
 * limitations under the License.
 */


#include "directives.h"

        ALN_QUAD
.L_slog_zeromask:  .long 0xFFFFFFFF
                   .long 0xFFFFFFFF
                   .long 0xFFFFFFFF
                   .long 0xFFFFFFFF
                   .long 0xFFFFFFFF
                   .long 0xFFFFFFFF
                   .long 0xFFFFFFFF
                   .long 0xFFFFFFFF

.L_slog_one:       .long 0x3F800000
                   .long 0x3F800000
                   .long 0x3F800000
                   .long 0x3F800000
                   .long 0x3F800000
                   .long 0x3F800000
                   .long 0x3F800000
                   .long 0x3F800000


        .text
        ALN_FUNC
        .globl ENT(__fvs_log_fma3_mask)
ENT(__fvs_log_fma3_mask):

        subq $8, %rsp

        vptest  .L_slog_zeromask(%rip), %xmm1
        je      .L_fvs_log_fma3_done

        vmovups .L_slog_one(%rip), %xmm2

        vblendvps %xmm1,%xmm0,%xmm2,%xmm0

        CALL(ENT(__fvs_log_fma3))

.L_fvs_log_fma3_done:

        addq $8, %rsp
        ret

        ELF_FUNC(__fvs_log_fma3_mask)
        ELF_SIZE(__fvs_log_fma3_mask)


        .text
        ALN_FUNC
        .globl ENT(__fvs_log_fma3_256_mask)
ENT(__fvs_log_fma3_256_mask):

        subq $8, %rsp

        vptest  .L_slog_zeromask(%rip), %ymm1
        je      .L_fvs_log_fma3_256_done

        vmovups .L_slog_one(%rip), %ymm2

        vblendvps %ymm1,%ymm0,%ymm2,%ymm0
        
        CALL(ENT(__fvs_log_fma3_256))

.L_fvs_log_fma3_256_done:

        addq $8, %rsp
        ret

        ELF_FUNC(__fvs_log_fma3_256_mask)
        ELF_SIZE(__fvs_log_fma3_256_mask)

