ref: baf658ec4cb9c6f32a7f15d76b104396fe851c69
dir: /vpx_dsp/ppc/bitdepth_conversion_vsx.h/
/*
 *  Copyright (c) 2017 The WebM project authors. All Rights Reserved.
 *
 *  Use of this source code is governed by a BSD-style license
 *  that can be found in the LICENSE file in the root of the source
 *  tree. An additional intellectual property rights grant can be found
 *  in the file PATENTS.  All contributing project authors may
 *  be found in the AUTHORS file in the root of the source tree.
 */
#ifndef VPX_DSP_PPC_BITDEPTH_CONVERSION_VSX_H_
#define VPX_DSP_PPC_BITDEPTH_CONVERSION_VSX_H_
#include "./vpx_config.h"
#include "vpx/vpx_integer.h"
#include "vpx_dsp/vpx_dsp_common.h"
#include "vpx_dsp/ppc/types_vsx.h"
// Load 8 16 bit values. If the source is 32 bits then pack down with
// saturation.
static INLINE int16x8_t load_tran_low(int32_t c, const tran_low_t *s) {
#if CONFIG_VP9_HIGHBITDEPTH
  int32x4_t u = vec_vsx_ld(c, s);
  int32x4_t v = vec_vsx_ld(c, s + 4);
  return vec_packs(u, v);
#else
  return vec_vsx_ld(c, s);
#endif
}
// Store 8 16 bit values. If the destination is 32 bits then sign extend the
// values by multiplying by 1.
static INLINE void store_tran_low(int16x8_t v, int32_t c, tran_low_t *s) {
#if CONFIG_VP9_HIGHBITDEPTH
  const int16x8_t one = vec_splat_s16(1);
  const int32x4_t even = vec_mule(v, one);
  const int32x4_t odd = vec_mulo(v, one);
  const int32x4_t high = vec_mergeh(even, odd);
  const int32x4_t low = vec_mergel(even, odd);
  vec_vsx_st(high, c, s);
  vec_vsx_st(low, c, s + 4);
#else
  vec_vsx_st(v, c, s);
#endif
}
#endif  // VPX_DSP_PPC_BITDEPTH_CONVERSION_VSX_H_