ref: b8549ed8895303019730da9e7ffa7945d3ac4d0d
dir: /vp9/common/ppc/vp9_idct_vsx.c/
/* * Copyright (c) 2018 The WebM project authors. All Rights Reserved. * * Use of this source code is governed by a BSD-style license * that can be found in the LICENSE file in the root of the source * tree. An additional intellectual property rights grant can be found * in the file PATENTS. All contributing project authors may * be found in the AUTHORS file in the root of the source tree. */ #include <assert.h> #include "./vp9_rtcd.h" #include "vpx_dsp/vpx_dsp_common.h" #include "vpx_dsp/ppc/inv_txfm_vsx.h" #include "vpx_dsp/ppc/bitdepth_conversion_vsx.h" #include "vp9/common/vp9_enums.h" void vp9_iht4x4_16_add_vsx(const tran_low_t *input, uint8_t *dest, int stride, int tx_type) { int16x8_t in[2], out[2]; in[0] = load_tran_low(0, input); in[1] = load_tran_low(8 * sizeof(*input), input); switch (tx_type) { case DCT_DCT: vpx_idct4_vsx(in, out); vpx_idct4_vsx(out, in); break; case ADST_DCT: vpx_idct4_vsx(in, out); vp9_iadst4_vsx(out, in); break; case DCT_ADST: vp9_iadst4_vsx(in, out); vpx_idct4_vsx(out, in); break; default: assert(tx_type == ADST_ADST); vp9_iadst4_vsx(in, out); vp9_iadst4_vsx(out, in); break; } vpx_round_store4x4_vsx(in, out, dest, stride); } void vp9_iht8x8_64_add_vsx(const tran_low_t *input, uint8_t *dest, int stride, int tx_type) { int16x8_t in[8], out[8]; // load input data in[0] = load_tran_low(0, input); in[1] = load_tran_low(8 * sizeof(*input), input); in[2] = load_tran_low(2 * 8 * sizeof(*input), input); in[3] = load_tran_low(3 * 8 * sizeof(*input), input); in[4] = load_tran_low(4 * 8 * sizeof(*input), input); in[5] = load_tran_low(5 * 8 * sizeof(*input), input); in[6] = load_tran_low(6 * 8 * sizeof(*input), input); in[7] = load_tran_low(7 * 8 * sizeof(*input), input); switch (tx_type) { case DCT_DCT: vpx_idct8_vsx(in, out); vpx_idct8_vsx(out, in); break; case ADST_DCT: vpx_idct8_vsx(in, out); vp9_iadst8_vsx(out, in); break; case DCT_ADST: vp9_iadst8_vsx(in, out); vpx_idct8_vsx(out, in); break; default: assert(tx_type == ADST_ADST); vp9_iadst8_vsx(in, out); vp9_iadst8_vsx(out, in); break; } vpx_round_store8x8_vsx(in, dest, stride); } void vp9_iht16x16_256_add_vsx(const tran_low_t *input, uint8_t *dest, int stride, int tx_type) { int16x8_t in0[16], in1[16]; LOAD_INPUT16(load_tran_low, input, 0, 8 * sizeof(*input), in0); LOAD_INPUT16(load_tran_low, input, 8 * 8 * 2 * sizeof(*input), 8 * sizeof(*input), in1); switch (tx_type) { case DCT_DCT: vpx_idct16_vsx(in0, in1); vpx_idct16_vsx(in0, in1); break; case ADST_DCT: vpx_idct16_vsx(in0, in1); vpx_iadst16_vsx(in0, in1); break; case DCT_ADST: vpx_iadst16_vsx(in0, in1); vpx_idct16_vsx(in0, in1); break; default: assert(tx_type == ADST_ADST); vpx_iadst16_vsx(in0, in1); vpx_iadst16_vsx(in0, in1); break; } vpx_round_store16x16_vsx(in0, in1, dest, stride); }