| /************************************************************************** |
| * |
| * Copyright 2009 VMware, Inc. |
| * All Rights Reserved. |
| * |
| * Permission is hereby granted, free of charge, to any person obtaining a |
| * copy of this software and associated documentation files (the |
| * "Software"), to deal in the Software without restriction, including |
| * without limitation the rights to use, copy, modify, merge, publish, |
| * distribute, sub license, and/or sell copies of the Software, and to |
| * permit persons to whom the Software is furnished to do so, subject to |
| * the following conditions: |
| * |
| * The above copyright notice and this permission notice (including the |
| * next paragraph) shall be included in all copies or substantial portions |
| * of the Software. |
| * |
| * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS |
| * OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF |
| * MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND NON-INFRINGEMENT. |
| * IN NO EVENT SHALL VMWARE AND/OR ITS SUPPLIERS BE LIABLE FOR |
| * ANY CLAIM, DAMAGES OR OTHER LIABILITY, WHETHER IN AN ACTION OF CONTRACT, |
| * TORT OR OTHERWISE, ARISING FROM, OUT OF OR IN CONNECTION WITH THE |
| * SOFTWARE OR THE USE OR OTHER DEALINGS IN THE SOFTWARE. |
| * |
| **************************************************************************/ |
| |
| /** |
| * @file |
| * Helper arithmetic functions. |
| * |
| * @author Jose Fonseca <jfonseca@vmware.com> |
| */ |
| |
| |
| #ifndef LP_BLD_ARIT_H |
| #define LP_BLD_ARIT_H |
| |
| |
| #include "gallivm/lp_bld.h" |
| |
| |
| /* |
| * Forward declarations of the structure types named in the prototypes |
| * below. Note that struct lp_type is also taken by value by some of |
| * them (e.g. lp_build_mul_norm), so callers of those functions need its |
| * full definition. |
| */ |
| struct lp_type; |
| struct lp_build_context; |
| struct gallivm_state; |
| |
| |
| /** |
| * Complement, i.e., 1 - a. |
| * |
| * @param bld build context |
| * @param a operand value |
| * @return value representing the complement of a |
| */ |
| LLVMValueRef |
| lp_build_comp(struct lp_build_context *bld, |
| LLVMValueRef a); |
| |
| /* |
| * Addition and subtraction helpers. |
| * |
| * NOTE(review): only the prototypes are visible here; the per-function |
| * notes below are inferred from names and signatures -- confirm against |
| * the implementation. |
| */ |
| |
| /* Presumably a + b. */ |
| LLVMValueRef |
| lp_build_add(struct lp_build_context *bld, |
| LLVMValueRef a, |
| LLVMValueRef b); |
| |
| /* Takes a single value; presumably sums its elements -- TODO confirm. */ |
| LLVMValueRef |
| lp_build_horizontal_add(struct lp_build_context *bld, |
| LLVMValueRef a); |
| |
| /* |
| * Takes an array of values; num_vecs is presumably the number of entries |
| * in vectors. NOTE(review): the exact reduction performed is not visible |
| * here. |
| */ |
| LLVMValueRef |
| lp_build_hadd_partial4(struct lp_build_context *bld, |
| LLVMValueRef vectors[], |
| unsigned num_vecs); |
| |
| /* Presumably a - b. */ |
| LLVMValueRef |
| lp_build_sub(struct lp_build_context *bld, |
| LLVMValueRef a, |
| LLVMValueRef b); |
| |
| |
| /* |
| * Multiplication and division helpers. |
| * |
| * NOTE(review): only the prototypes are visible here; the per-function |
| * notes below are inferred from names and signatures -- confirm against |
| * the implementation. |
| */ |
| |
| /* |
| * Unlike most helpers in this header, this takes the gallivm state and an |
| * lp_type (wide_type, by value) instead of a build context. |
| * Presumably multiplies two normalized values -- TODO confirm how |
| * wide_type is used. |
| */ |
| LLVMValueRef |
| lp_build_mul_norm(struct gallivm_state *gallivm, |
| struct lp_type wide_type, |
| LLVMValueRef a, |
| LLVMValueRef b); |
| |
| /* Presumably a * b. */ |
| LLVMValueRef |
| lp_build_mul(struct lp_build_context *bld, |
| LLVMValueRef a, |
| LLVMValueRef b); |
| |
| /* |
| * Returns one value and takes a pointer (res_hi) for a second result. |
| * Presumably the low and high halves of a 32x32 multiply; how the _cpu |
| * variant differs from lp_build_mul_32_lohi is not visible here. |
| */ |
| LLVMValueRef |
| lp_build_mul_32_lohi_cpu(struct lp_build_context *bld, |
| LLVMValueRef a, |
| LLVMValueRef b, |
| LLVMValueRef *res_hi); |
| |
| /* |
| * Returns one value and takes a pointer (res_hi) for a second result. |
| * Presumably the low and high halves of a 32x32 multiply -- TODO confirm. |
| */ |
| LLVMValueRef |
| lp_build_mul_32_lohi(struct lp_build_context *bld, |
| LLVMValueRef a, |
| LLVMValueRef b, |
| LLVMValueRef *res_hi); |
| |
| /* |
| * Presumably a * b, where b is a plain C int rather than an |
| * LLVMValueRef. |
| */ |
| LLVMValueRef |
| lp_build_mul_imm(struct lp_build_context *bld, |
| LLVMValueRef a, |
| int b); |
| |
| /* Presumably a / b. */ |
| LLVMValueRef |
| lp_build_div(struct lp_build_context *bld, |
| LLVMValueRef a, |
| LLVMValueRef b); |
| |
| |
| /* |
| * llvm.fmuladd.* intrinsic |
| * |
| * Takes an LLVMBuilderRef directly rather than a build context. |
| * NOTE(review): the operand roles (presumably a * b + c) are inferred |
| * from the parameter order -- confirm against the implementation. |
| */ |
| LLVMValueRef |
| lp_build_fmuladd(LLVMBuilderRef builder, |
| LLVMValueRef a, |
| LLVMValueRef b, |
| LLVMValueRef c); |
| |
| /* |
| * a * b + c |
| * |
| * NOTE(review): whether this is fused or computed as a separate multiply |
| * and add is not visible here. |
| */ |
| LLVMValueRef |
| lp_build_mad(struct lp_build_context *bld, |
| LLVMValueRef a, |
| LLVMValueRef b, |
| LLVMValueRef c); |
| |
| |
| /** |
| * Set when the weights for normalized lerps are prescaled, that is, in |
| * range 0..2**n, as opposed to range 0..2**n - 1. |
| * |
| * NOTE(review): this previously read "0..2**(n-1)"; 0..2**n - 1 (the span |
| * of an n-bit normalized value) is presumably what was meant -- confirm |
| * against the lerp implementation. |
| * |
| * This is flag bit 0; presumably passed in the flags argument of the |
| * lp_build_lerp* functions. |
| */ |
| #define LP_BLD_LERP_PRESCALED_WEIGHTS (1 << 0) |
| |
| /** |
| * Used internally when using wide intermediates for normalized lerps. |
| * |
| * Do not use: this bit (flag bit 1) is reserved for internal use and |
| * should not be set by other callers. |
| */ |
| #define LP_BLD_LERP_WIDE_NORMALIZED (1 << 1) |
| |
| /* |
| * Linear interpolation helpers in one, two and three dimensions. |
| * |
| * Each takes an unsigned flags argument, presumably a bitmask of the |
| * LP_BLD_LERP_* values defined in this header. |
| * |
| * NOTE(review): only the prototypes are visible here; which weight |
| * applies to which axis and the exact formula are inferred from the |
| * parameter names -- confirm against the implementation. |
| */ |
| |
| /* One weight (x) and two endpoint values (v0, v1). */ |
| LLVMValueRef |
| lp_build_lerp(struct lp_build_context *bld, |
| LLVMValueRef x, |
| LLVMValueRef v0, |
| LLVMValueRef v1, |
| unsigned flags); |
| |
| /* Two weights (x, y) and four corner values (v00..v11). */ |
| LLVMValueRef |
| lp_build_lerp_2d(struct lp_build_context *bld, |
| LLVMValueRef x, |
| LLVMValueRef y, |
| LLVMValueRef v00, |
| LLVMValueRef v01, |
| LLVMValueRef v10, |
| LLVMValueRef v11, |
| unsigned flags); |
| |
| /* Three weights (x, y, z) and eight corner values (v000..v111). */ |
| LLVMValueRef |
| lp_build_lerp_3d(struct lp_build_context *bld, |
| LLVMValueRef x, |
| LLVMValueRef y, |
| LLVMValueRef z, |
| LLVMValueRef v000, |
| LLVMValueRef v001, |
| LLVMValueRef v010, |
| LLVMValueRef v011, |
| LLVMValueRef v100, |
| LLVMValueRef v101, |
| LLVMValueRef v110, |
| LLVMValueRef v111, |
| unsigned flags); |
| |
| /** |
| * Specifies floating point NaN behavior. |
| * |
| * Passed as the nan_behavior argument of lp_build_min_ext() and |
| * lp_build_max_ext(). The enumerators carry no explicit values, so they |
| * are numbered from 0 in declaration order. |
| */ |
| enum gallivm_nan_behavior { |
| /* Results are undefined with NaN. This gives the fastest code. */ |
| GALLIVM_NAN_BEHAVIOR_UNDEFINED, |
| /* If one of the inputs is NaN, NaN is returned */ |
| GALLIVM_NAN_RETURN_NAN, |
| /* If one of the inputs is NaN, the other operand is returned */ |
| GALLIVM_NAN_RETURN_OTHER, |
| /* If one of the inputs is NaN, the other operand is returned, |
| * but we guarantee the second operand is not a NaN. |
| * In min/max it will be as fast as undefined with sse opcodes, |
| * and archs having native return_other can benefit too. */ |
| GALLIVM_NAN_RETURN_OTHER_SECOND_NONNAN, |
| /* If one of the inputs is NaN, NaN is returned, |
| * but we guarantee the first operand is not a NaN. |
| * In min/max it will be as fast as undefined with sse opcodes, |
| * and archs having native return_nan can benefit too. */ |
| GALLIVM_NAN_RETURN_NAN_FIRST_NONNAN, |
| |
| }; |
| |
| /* |
| * Minimum / maximum helpers. |
| * |
| * The _ext variants take an explicit enum gallivm_nan_behavior selecting |
| * how NaN inputs are treated. |
| * NOTE(review): the NaN handling of the plain lp_build_min/lp_build_max |
| * variants is not visible from these prototypes -- confirm against the |
| * implementation. |
| */ |
| |
| /* Presumably the minimum of a and b. */ |
| LLVMValueRef |
| lp_build_min(struct lp_build_context *bld, |
| LLVMValueRef a, |
| LLVMValueRef b); |
| |
| /* As lp_build_min, with caller-selected NaN behavior. */ |
| LLVMValueRef |
| lp_build_min_ext(struct lp_build_context *bld, |
| LLVMValueRef a, |
| LLVMValueRef b, |
| enum gallivm_nan_behavior nan_behavior); |
| |
| /* Presumably the maximum of a and b. */ |
| LLVMValueRef |
| lp_build_max(struct lp_build_context *bld, |
| LLVMValueRef a, |
| LLVMValueRef b); |
| |
| /* As lp_build_max, with caller-selected NaN behavior. */ |
| LLVMValueRef |
| lp_build_max_ext(struct lp_build_context *bld, |
| LLVMValueRef a, |
| LLVMValueRef b, |
| enum gallivm_nan_behavior nan_behavior); |
| |
| /* |
| * Clamping helpers. |
| * |
| * NOTE(review): only the prototypes are visible here; the notes below are |
| * inferred from names and signatures -- confirm against the |
| * implementation. |
| */ |
| |
| /* Presumably clamps a to the range [min, max]. */ |
| LLVMValueRef |
| lp_build_clamp(struct lp_build_context *bld, |
| LLVMValueRef a, |
| LLVMValueRef min, |
| LLVMValueRef max); |
| |
| /* |
| * Presumably clamps a to [0, 1] and maps NaN to zero, going by the name |
| * -- TODO confirm. |
| */ |
| LLVMValueRef |
| lp_build_clamp_zero_one_nanzero(struct lp_build_context *bld, |
| LLVMValueRef a); |
| |
| /* |
| * Sign-related helpers and integer-to-float conversion. |
| * |
| * NOTE(review): only the prototypes are visible here; the notes below are |
| * inferred from names and signatures -- confirm against the |
| * implementation. |
| */ |
| |
| /* Presumably the absolute value of a. */ |
| LLVMValueRef |
| lp_build_abs(struct lp_build_context *bld, |
| LLVMValueRef a); |
| |
| /* Presumably -a. */ |
| LLVMValueRef |
| lp_build_negate(struct lp_build_context *bld, |
| LLVMValueRef a); |
| |
| /* Presumably the sign of a; the exact result encoding is not visible. */ |
| LLVMValueRef |
| lp_build_sgn(struct lp_build_context *bld, |
| LLVMValueRef a); |
| |
| /* |
| * Presumably a with its sign replaced according to the sign argument; |
| * how sign is encoded is not visible here. |
| */ |
| LLVMValueRef |
| lp_build_set_sign(struct lp_build_context *bld, |
| LLVMValueRef a, LLVMValueRef sign); |
| |
| /* Presumably converts an integer value to floating point. */ |
| LLVMValueRef |
| lp_build_int_to_float(struct lp_build_context *bld, |
| LLVMValueRef a); |
| |
| /* |
| * Rounding and fractional-part helpers. |
| * |
| * NOTE(review): only the prototypes are visible here; the notes below are |
| * inferred from names -- confirm the result types and rounding modes |
| * against the implementation. |
| */ |
| |
| /* Presumably rounds a to the nearest integral value. */ |
| LLVMValueRef |
| lp_build_round(struct lp_build_context *bld, |
| LLVMValueRef a); |
| |
| /* Presumably rounds a towards negative infinity. */ |
| LLVMValueRef |
| lp_build_floor(struct lp_build_context *bld, |
| LLVMValueRef a); |
| |
| /* Presumably rounds a towards positive infinity. */ |
| LLVMValueRef |
| lp_build_ceil(struct lp_build_context *bld, |
| LLVMValueRef a); |
| |
| /* Presumably rounds a towards zero. */ |
| LLVMValueRef |
| lp_build_trunc(struct lp_build_context *bld, |
| LLVMValueRef a); |
| |
| /* Presumably the fractional part of a. */ |
| LLVMValueRef |
| lp_build_fract(struct lp_build_context *bld, |
| LLVMValueRef a); |
| |
| /* |
| * Variant of lp_build_fract. |
| * NOTE(review): what the _safe variant guards against is not visible |
| * here. |
| */ |
| LLVMValueRef |
| lp_build_fract_safe(struct lp_build_context *bld, |
| LLVMValueRef a); |
| |
| /* |
| * "i"-prefixed rounding helpers, presumably returning integer results |
| * (as opposed to the unprefixed floor/ceil/round/trunc helpers). |
| * |
| * NOTE(review): only the prototypes are visible here; the notes below are |
| * inferred from names and signatures -- confirm against the |
| * implementation. |
| */ |
| |
| /* Presumably floor(a) as an integer. */ |
| LLVMValueRef |
| lp_build_ifloor(struct lp_build_context *bld, |
| LLVMValueRef a); |
| /* Presumably ceil(a) as an integer. */ |
| LLVMValueRef |
| lp_build_iceil(struct lp_build_context *bld, |
| LLVMValueRef a); |
| |
| /* Presumably round(a) as an integer. */ |
| LLVMValueRef |
| lp_build_iround(struct lp_build_context *bld, |
| LLVMValueRef a); |
| |
| /* Presumably trunc(a) as an integer. */ |
| LLVMValueRef |
| lp_build_itrunc(struct lp_build_context *bld, |
| LLVMValueRef a); |
| |
| /* |
| * Returns nothing; results are delivered through the out_ipart and |
| * out_fpart pointers (presumably the integer floor and the fractional |
| * part of a, respectively). |
| */ |
| void |
| lp_build_ifloor_fract(struct lp_build_context *bld, |
| LLVMValueRef a, |
| LLVMValueRef *out_ipart, |
| LLVMValueRef *out_fpart); |
| |
| /* |
| * Same signature as lp_build_ifloor_fract. |
| * NOTE(review): what the _safe variant guards against is not visible |
| * here. |
| */ |
| void |
| lp_build_ifloor_fract_safe(struct lp_build_context *bld, |
| LLVMValueRef a, |
| LLVMValueRef *out_ipart, |
| LLVMValueRef *out_fpart); |
| |
| /* |
| * Square root and reciprocal helpers. |
| * |
| * NOTE(review): only the prototypes are visible here; the notes below are |
| * inferred from names -- precision guarantees are not visible and should |
| * be confirmed against the implementation. |
| */ |
| |
| /* Presumably the square root of a. */ |
| LLVMValueRef |
| lp_build_sqrt(struct lp_build_context *bld, |
| LLVMValueRef a); |
| |
| /* Presumably the reciprocal 1 / a. */ |
| LLVMValueRef |
| lp_build_rcp(struct lp_build_context *bld, |
| LLVMValueRef a); |
| |
| /* Presumably the reciprocal square root of a. */ |
| LLVMValueRef |
| lp_build_rsqrt(struct lp_build_context *bld, |
| LLVMValueRef a); |
| |
| /* |
| * Takes an lp_type by value and returns a boolean; presumably reports |
| * whether lp_build_fast_rsqrt can be used for that type. |
| */ |
| boolean |
| lp_build_fast_rsqrt_available(struct lp_type type); |
| |
| /* |
| * Presumably a faster, possibly less precise, reciprocal square root; |
| * see lp_build_fast_rsqrt_available. |
| */ |
| LLVMValueRef |
| lp_build_fast_rsqrt(struct lp_build_context *bld, |
| LLVMValueRef a); |
| |
| /* |
| * Takes a value x plus a read-only array of double coefficients and a |
| * count (num_coeffs). |
| * Presumably evaluates the polynomial with those coefficients at x. |
| * NOTE(review): the coefficient order (lowest or highest degree first) is |
| * not visible here -- confirm against the implementation. |
| */ |
| LLVMValueRef |
| lp_build_polynomial(struct lp_build_context *bld, |
| LLVMValueRef x, |
| const double *coeffs, |
| unsigned num_coeffs); |
| |
| /* |
| * Trigonometric, power, exponential and logarithm helpers. |
| * |
| * NOTE(review): only the prototypes are visible here; the notes below are |
| * inferred from names -- accuracy and special-value handling are not |
| * visible and should be confirmed against the implementation. |
| */ |
| |
| /* Presumably the cosine of a. */ |
| LLVMValueRef |
| lp_build_cos(struct lp_build_context *bld, |
| LLVMValueRef a); |
| |
| /* Presumably the sine of a. */ |
| LLVMValueRef |
| lp_build_sin(struct lp_build_context *bld, |
| LLVMValueRef a); |
| |
| /* Presumably a raised to the power b. */ |
| LLVMValueRef |
| lp_build_pow(struct lp_build_context *bld, |
| LLVMValueRef a, |
| LLVMValueRef b); |
| |
| /* Presumably the natural exponential of a. */ |
| LLVMValueRef |
| lp_build_exp(struct lp_build_context *bld, |
| LLVMValueRef a); |
| |
| /* Presumably the natural logarithm of a. */ |
| LLVMValueRef |
| lp_build_log(struct lp_build_context *bld, |
| LLVMValueRef a); |
| |
| /* |
| * Variant of lp_build_log. |
| * NOTE(review): what the _safe variant guards against is not visible |
| * here. |
| */ |
| LLVMValueRef |
| lp_build_log_safe(struct lp_build_context *bld, |
| LLVMValueRef a); |
| |
| /* Presumably 2 raised to the power a. */ |
| LLVMValueRef |
| lp_build_exp2(struct lp_build_context *bld, |
| LLVMValueRef a); |
| |
| /* |
| * Floating point decomposition and base-2 logarithm helpers. |
| * |
| * NOTE(review): only the prototypes are visible here; the notes below are |
| * inferred from names and signatures -- confirm against the |
| * implementation. |
| */ |
| |
| /* |
| * Presumably extracts the exponent of x; bias is a plain C int whose |
| * exact use is not visible here. |
| */ |
| LLVMValueRef |
| lp_build_extract_exponent(struct lp_build_context *bld, |
| LLVMValueRef x, |
| int bias); |
| |
| /* Presumably extracts the mantissa of x. */ |
| LLVMValueRef |
| lp_build_extract_mantissa(struct lp_build_context *bld, |
| LLVMValueRef x); |
| |
| /* Presumably the base-2 logarithm of a. */ |
| LLVMValueRef |
| lp_build_log2(struct lp_build_context *bld, |
| LLVMValueRef a); |
| |
| /* |
| * Variant of lp_build_log2. |
| * NOTE(review): what the _safe variant guards against is not visible |
| * here. |
| */ |
| LLVMValueRef |
| lp_build_log2_safe(struct lp_build_context *bld, |
| LLVMValueRef a); |
| |
| /* Presumably a faster, possibly less precise, base-2 logarithm. */ |
| LLVMValueRef |
| lp_build_fast_log2(struct lp_build_context *bld, |
| LLVMValueRef a); |
| |
| /* Presumably an integer base-2 logarithm of x. */ |
| LLVMValueRef |
| lp_build_ilog2(struct lp_build_context *bld, |
| LLVMValueRef x); |
| |
| /* |
| * Returns nothing; results are delivered through the p_exp, |
| * p_floor_log2 and p_log2 pointers, and handle_nans is a boolean option. |
| * NOTE(review): whether any of the output pointers may be NULL, and what |
| * handle_nans changes, is not visible here. |
| */ |
| void |
| lp_build_log2_approx(struct lp_build_context *bld, |
| LLVMValueRef x, |
| LLVMValueRef *p_exp, |
| LLVMValueRef *p_floor_log2, |
| LLVMValueRef *p_log2, |
| boolean handle_nans); |
| |
| /* |
| * Modulo and floating point classification helpers. |
| * |
| * NOTE(review): only the prototypes are visible here; the notes below are |
| * inferred from names -- confirm against the implementation. |
| */ |
| |
| /* |
| * Presumably the remainder of x divided by y; sign conventions are not |
| * visible here. |
| */ |
| LLVMValueRef |
| lp_build_mod(struct lp_build_context *bld, |
| LLVMValueRef x, |
| LLVMValueRef y); |
| |
| /* Presumably a test for "x is NaN"; result encoding is not visible. */ |
| LLVMValueRef |
| lp_build_isnan(struct lp_build_context *bld, |
| LLVMValueRef x); |
| |
| /* Presumably a test for "x is finite"; result encoding is not visible. */ |
| LLVMValueRef |
| lp_build_isfinite(struct lp_build_context *bld, |
| LLVMValueRef x); |
| |
| |
| /* |
| * Takes the gallivm state and an lp_type directly instead of a build |
| * context. Presumably builds a test for "x is infinite or NaN" |
| * -- NOTE(review): inferred from the name; the result's representation |
| * is not visible here. |
| * |
| * The type parameter is declared without a top-level const, matching the |
| * other by-value struct lp_type parameters in this header; a top-level |
| * qualifier on a by-value parameter does not affect the function's type, |
| * so existing definitions and callers remain compatible. |
| */ |
| LLVMValueRef |
| lp_build_is_inf_or_nan(struct gallivm_state *gallivm, |
| struct lp_type type, |
| LLVMValueRef x); |
| |
| |
| /* |
| * Floating point state helpers. These take the gallivm state rather than |
| * a build context. |
| * |
| * NOTE(review): only the prototypes are visible here. The parameter name |
| * mxcsr suggests the x86 SSE control/status register, but which state is |
| * actually read or written is not visible -- confirm against the |
| * implementation. |
| */ |
| |
| /* |
| * Returns a value, presumably the current floating point state in a form |
| * that can later be passed to lp_build_fpstate_set. |
| */ |
| LLVMValueRef |
| lp_build_fpstate_get(struct gallivm_state *gallivm); |
| |
| /* |
| * Presumably enables (zero true) or disables (zero false) treating |
| * denormals as zero -- TODO confirm. |
| */ |
| void |
| lp_build_fpstate_set_denorms_zero(struct gallivm_state *gallivm, |
| boolean zero); |
| /* Presumably installs the floating point state given in mxcsr. */ |
| void |
| lp_build_fpstate_set(struct gallivm_state *gallivm, |
| LLVMValueRef mxcsr); |
| |
| #endif /* !LP_BLD_ARIT_H */ |