| /* ------------------------------------------------------------------ |
| * Copyright (C) 1998-2009 PacketVideo |
| * |
| * Licensed under the Apache License, Version 2.0 (the "License"); |
| * you may not use this file except in compliance with the License. |
| * You may obtain a copy of the License at |
| * |
| * http://www.apache.org/licenses/LICENSE-2.0 |
| * |
| * Unless required by applicable law or agreed to in writing, software |
| * distributed under the License is distributed on an "AS IS" BASIS, |
| * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either |
| * express or implied. |
| * See the License for the specific language governing permissions |
| * and limitations under the License. |
| * ------------------------------------------------------------------- |
| */ |
| /* Filename: dct_inline.h */ |
| /* Description: Implementation for in-line functions used in dct.cpp */ |
| /* Modified: */ |
| /*********************************************************************************/ |
| #ifndef _DCT_INLINE_H_ |
| #define _DCT_INLINE_H_ |
| |
| #if !defined(PV_ARM_GCC_V5) && !defined(PV_ARM_GCC_V4) |
| |
| __inline int32 mla724(int32 op1, int32 op2, int32 op3) |
| { |
| int32 out; |
| |
| OSCL_UNUSED_ARG(op1); |
| |
| out = op2 * 724 + op3; /* op1 is not used here */ |
| |
| return out; |
| } |
| |
| __inline int32 mla392(int32 k0, int32 k14, int32 round) |
| { |
| int32 k1; |
| |
| OSCL_UNUSED_ARG(k14); |
| |
| k1 = k0 * 392 + round; |
| |
| return k1; |
| } |
| |
| __inline int32 mla554(int32 k4, int32 k12, int32 k1) |
| { |
| int32 k0; |
| |
| OSCL_UNUSED_ARG(k12); |
| |
| k0 = k4 * 554 + k1; |
| |
| return k0; |
| } |
| |
| __inline int32 mla1338(int32 k6, int32 k14, int32 k1) |
| { |
| int32 out; |
| |
| OSCL_UNUSED_ARG(k14); |
| |
| out = k6 * 1338 + k1; |
| |
| return out; |
| } |
| |
| __inline int32 mla946(int32 k6, int32 k14, int32 k1) |
| { |
| int32 out; |
| |
| OSCL_UNUSED_ARG(k14); |
| |
| out = k6 * 946 + k1; |
| |
| return out; |
| } |
| |
| __inline int32 sum_abs(int32 k0, int32 k1, int32 k2, int32 k3, |
| int32 k4, int32 k5, int32 k6, int32 k7) |
| { |
| int32 carry, abs_sum; |
| |
| carry = k0 >> 31; |
| abs_sum = (k0 ^ carry); |
| carry = k1 >> 31; |
| abs_sum += (k1 ^ carry) - carry; |
| carry = k2 >> 31; |
| abs_sum += (k2 ^ carry) - carry; |
| carry = k3 >> 31; |
| abs_sum += (k3 ^ carry) - carry; |
| carry = k4 >> 31; |
| abs_sum += (k4 ^ carry) - carry; |
| carry = k5 >> 31; |
| abs_sum += (k5 ^ carry) - carry; |
| carry = k6 >> 31; |
| abs_sum += (k6 ^ carry) - carry; |
| carry = k7 >> 31; |
| abs_sum += (k7 ^ carry) - carry; |
| |
| return abs_sum; |
| } |
| |
| #elif defined(__CC_ARM) /* only work with arm v5 */ |
| |
| #if defined(__TARGET_ARCH_5TE) |
| |
| __inline int32 mla724(int32 op1, int32 op2, int32 op3) |
| { |
| int32 out; |
| |
| __asm |
| { |
| smlabb out, op1, op2, op3 |
| } |
| |
| return out; |
| } |
| |
| __inline int32 mla392(int32 k0, int32 k14, int32 round) |
| { |
| int32 k1; |
| |
| __asm |
| { |
| smlabt k1, k0, k14, round |
| } |
| |
| return k1; |
| } |
| |
| __inline int32 mla554(int32 k4, int32 k12, int32 k1) |
| { |
| int32 k0; |
| |
| __asm |
| { |
| smlabt k0, k4, k12, k1 |
| } |
| |
| return k0; |
| } |
| |
| __inline int32 mla1338(int32 k6, int32 k14, int32 k1) |
| { |
| int32 out; |
| |
| __asm |
| { |
| smlabb out, k6, k14, k1 |
| } |
| |
| return out; |
| } |
| |
| __inline int32 mla946(int32 k6, int32 k14, int32 k1) |
| { |
| int32 out; |
| |
| __asm |
| { |
| smlabb out, k6, k14, k1 |
| } |
| |
| return out; |
| } |
| |
| #else // not ARM5TE |
| |
| |
| __inline int32 mla724(int32 op1, int32 op2, int32 op3) |
| { |
| int32 out; |
| |
| __asm |
| { |
| and out, op2, #0xFFFF |
| mla out, op1, out, op3 |
| } |
| |
| return out; |
| } |
| |
| __inline int32 mla392(int32 k0, int32 k14, int32 round) |
| { |
| int32 k1; |
| |
| __asm |
| { |
| mov k1, k14, asr #16 |
| mla k1, k0, k1, round |
| } |
| |
| return k1; |
| } |
| |
| __inline int32 mla554(int32 k4, int32 k12, int32 k1) |
| { |
| int32 k0; |
| |
| __asm |
| { |
| mov k0, k12, asr #16 |
| mla k0, k4, k0, k1 |
| } |
| |
| return k0; |
| } |
| |
| __inline int32 mla1338(int32 k6, int32 k14, int32 k1) |
| { |
| int32 out; |
| |
| __asm |
| { |
| and out, k14, 0xFFFF |
| mla out, k6, out, k1 |
| } |
| |
| return out; |
| } |
| |
| __inline int32 mla946(int32 k6, int32 k14, int32 k1) |
| { |
| int32 out; |
| |
| __asm |
| { |
| and out, k14, 0xFFFF |
| mla out, k6, out, k1 |
| } |
| |
| return out; |
| } |
| |
| #endif |
| |
| __inline int32 sum_abs(int32 k0, int32 k1, int32 k2, int32 k3, |
| int32 k4, int32 k5, int32 k6, int32 k7) |
| { |
| int32 carry, abs_sum; |
| __asm |
| { |
| eor carry, k0, k0, asr #31 ; |
| eors abs_sum, k1, k1, asr #31 ; |
| adc abs_sum, abs_sum, carry ; |
| eors carry, k2, k2, asr #31 ; |
| adc abs_sum, abs_sum, carry ; |
| eors carry, k3, k3, asr #31 ; |
| adc abs_sum, abs_sum, carry ; |
| eors carry, k4, k4, asr #31 ; |
| adc abs_sum, abs_sum, carry ; |
| eors carry, k5, k5, asr #31 ; |
| adc abs_sum, abs_sum, carry ; |
| eors carry, k6, k6, asr #31 ; |
| adc abs_sum, abs_sum, carry ; |
| eors carry, k7, k7, asr #31 ; |
| adc abs_sum, abs_sum, carry ; |
| } |
| |
| return abs_sum; |
| } |
| |
| #elif ( defined(PV_ARM_GCC_V5) || defined(PV_ARM_GCC_V4) ) /* ARM GNU COMPILER */ |
| |
| __inline int32 mla724(int32 op1, int32 op2, int32 op3) |
| { |
| register int32 out; |
| register int32 aa = (int32)op1; |
| register int32 bb = (int32)op2; |
| register int32 cc = (int32)op3; |
| |
| asm volatile("smlabb %0, %1, %2, %3" |
| : "=&r"(out) |
| : "r"(aa), |
| "r"(bb), |
| "r"(cc)); |
| return out; |
| } |
| |
| |
| __inline int32 mla392(int32 k0, int32 k14, int32 round) |
| { |
| register int32 out; |
| register int32 aa = (int32)k0; |
| register int32 bb = (int32)k14; |
| register int32 cc = (int32)round; |
| |
| asm volatile("smlabt %0, %1, %2, %3" |
| : "=&r"(out) |
| : "r"(aa), |
| "r"(bb), |
| "r"(cc)); |
| |
| return out; |
| } |
| |
| __inline int32 mla554(int32 k4, int32 k12, int32 k1) |
| { |
| register int32 out; |
| register int32 aa = (int32)k4; |
| register int32 bb = (int32)k12; |
| register int32 cc = (int32)k1; |
| |
| asm volatile("smlabt %0, %1, %2, %3" |
| : "=&r"(out) |
| : "r"(aa), |
| "r"(bb), |
| "r"(cc)); |
| |
| return out; |
| } |
| |
| __inline int32 mla1338(int32 k6, int32 k14, int32 k1) |
| { |
| register int32 out; |
| register int32 aa = (int32)k6; |
| register int32 bb = (int32)k14; |
| register int32 cc = (int32)k1; |
| |
| asm volatile("smlabb %0, %1, %2, %3" |
| : "=&r"(out) |
| : "r"(aa), |
| "r"(bb), |
| "r"(cc)); |
| return out; |
| } |
| |
| __inline int32 mla946(int32 k6, int32 k14, int32 k1) |
| { |
| register int32 out; |
| register int32 aa = (int32)k6; |
| register int32 bb = (int32)k14; |
| register int32 cc = (int32)k1; |
| |
| asm volatile("smlabb %0, %1, %2, %3" |
| : "=&r"(out) |
| : "r"(aa), |
| "r"(bb), |
| "r"(cc)); |
| return out; |
| } |
| |
| __inline int32 sum_abs(int32 k0, int32 k1, int32 k2, int32 k3, |
| int32 k4, int32 k5, int32 k6, int32 k7) |
| { |
| register int32 carry; |
| register int32 abs_sum; |
| register int32 aa = (int32)k0; |
| register int32 bb = (int32)k1; |
| register int32 cc = (int32)k2; |
| register int32 dd = (int32)k3; |
| register int32 ee = (int32)k4; |
| register int32 ff = (int32)k5; |
| register int32 gg = (int32)k6; |
| register int32 hh = (int32)k7; |
| |
| asm volatile("eor %0, %2, %2, asr #31\n\t" |
| "eors %1, %3, %3, asr #31\n\t" |
| "adc %1, %1, %0\n\t" |
| "eors %0, %4, %4, asr #31\n\t" |
| "adc %1, %1, %0\n\t" |
| "eors %0, %5, %5, asr #31\n\t" |
| "adc %1, %1, %0\n\t" |
| "eors %0, %6, %6, asr #31\n\t" |
| "adc %1, %1, %0\n\t" |
| "eors %0, %7, %7, asr #31\n\t" |
| "adc %1, %1, %0\n\t" |
| "eors %0, %8, %8, asr #31\n\t" |
| "adc %1, %1, %0\n\t" |
| "eors %0, %9, %9, asr #31\n\t" |
| "adc %1, %1, %0\n\t" |
| |
| : "=&r"(carry), |
| "=&r"(abs_sum): |
| "r"(aa), |
| "r"(bb), |
| "r"(cc), |
| "r"(dd), |
| "r"(ee), |
| "r"(ff), |
| "r"(gg), |
| "r"(hh)); |
| |
| return abs_sum; |
| } |
| |
| #endif // Diff. OS |
| |
| #endif //_DCT_INLINE_H_ |
| |
| |