Blame view

ffmpeg-4.2.2/libavcodec/ppc/fmtconvert_altivec.c 2.01 KB
aac5773f   hucm   功能基本完成,接口待打磨
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
  /*
   * Copyright (c) 2006 Luca Barbato <lu_zero@gentoo.org>
   *
   * This file is part of FFmpeg.
   *
   * FFmpeg is free software; you can redistribute it and/or
   * modify it under the terms of the GNU Lesser General Public
   * License as published by the Free Software Foundation; either
   * version 2.1 of the License, or (at your option) any later version.
   *
   * FFmpeg is distributed in the hope that it will be useful,
   * but WITHOUT ANY WARRANTY; without even the implied warranty of
   * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the GNU
   * Lesser General Public License for more details.
   *
   * You should have received a copy of the GNU Lesser General Public
   * License along with FFmpeg; if not, write to the Free Software
   * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA
   */
  
  #include "config.h"
  #include "libavutil/attributes.h"
  #include "libavutil/cpu.h"
  #include "libavutil/mem.h"
  #include "libavutil/ppc/cpu.h"
  #include "libavutil/ppc/util_altivec.h"
  #include "libavcodec/fmtconvert.h"
  
  #if HAVE_ALTIVEC
  
  static void int32_to_float_fmul_scalar_altivec(float *dst, const int32_t *src,
                                                 float mul, int len)
  {
      union {
          vector float v;
          float s[4];
      } mul_u;
      int i;
      vector float src1, src2, dst1, dst2, mul_v, zero;
  
      zero = (vector float)vec_splat_u32(0);
      mul_u.s[0] = mul;
      mul_v = vec_splat(mul_u.v, 0);
  
      for (i = 0; i < len; i += 8) {
          src1 = vec_ctf(vec_ld(0,  src+i), 0);
          src2 = vec_ctf(vec_ld(16, src+i), 0);
          dst1 = vec_madd(src1, mul_v, zero);
          dst2 = vec_madd(src2, mul_v, zero);
          vec_st(dst1,  0, dst+i);
          vec_st(dst2, 16, dst+i);
      }
  }
  
  #endif /* HAVE_ALTIVEC */
  
  /**
   * PowerPC-specific initialization of a format conversion context.
   *
   * When built with HAVE_ALTIVEC and the PPC_ALTIVEC() check on the runtime
   * CPU flags succeeds, the int32_to_float_fmul_scalar callback of the context
   * is replaced with the AltiVec implementation. Otherwise the context is left
   * untouched.
   *
   * @param c      context whose function pointer may be overridden
   * @param avctx  not used by this function
   */
  av_cold void ff_fmt_convert_init_ppc(FmtConvertContext *c,
                                       AVCodecContext *avctx)
  {
  #if HAVE_ALTIVEC
      const int cpu_flags = av_get_cpu_flags();

      if (PPC_ALTIVEC(cpu_flags))
          c->int32_to_float_fmul_scalar = int32_to_float_fmul_scalar_altivec;
  #endif /* HAVE_ALTIVEC */
  }