aboutsummaryrefslogtreecommitdiff
path: root/peakval_av.c
blob: ae54c106fd401ff895eb9603006c28d2f9fe71ba (plain)
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
/* Return the largest absolute value of a vector of signed shorts

 * This is the Altivec SIMD version.

 * Copyright 2004 Phil Karn, KA9Q
 * May be used under the terms of the GNU Lesser General Public License (LGPL)
 */

#include "fec.h"

/* Return the largest absolute value found in an array of signed shorts,
 * computed with AltiVec vector instructions.
 *
 *   in   First sample. It need not be 16-byte aligned; the code derives the
 *        number of leading samples from pad/2, so it presumably expects at
 *        least 2-byte alignment -- confirm against callers.
 *   cnt  Number of samples. Zero or a negative count yields 0.
 *
 * Returns the peak magnitude. A sample of -32768 is reported as 32767,
 * because its true magnitude does not fit in a signed short.
 *
 * Data is fetched with vec_ld, which always loads a whole aligned 16-byte
 * block; elements outside [in, in+cnt) are shifted out or replaced by zeros
 * before they can influence the result.
 *
 * Shift encoding: vec_sro shifts the full 128-bit register right by a whole
 * number of bytes taken from bits 3..6 of the last byte of its control
 * vector, so a shift of k 16-bit elements is written as k<<4 in s.c[15].
 */
signed short peakval_av(signed short *in,int cnt){
  vector signed short x;
  int pad;
  union { vector signed char cv; vector signed short hv; signed short s[8]; signed char c[16];} s;
  vector signed short smallest,largest;

  /* Nothing to scan. Without this guard an unaligned pointer with cnt == 0
   * would encode a shift of 8 elements (128), which overflows the control
   * byte into a zero shift and lets out-of-range data into the result.
   */
  if(cnt <= 0)
    return 0;

  /* Only byte 15 is rewritten below; give the remaining bytes defined values */
  s.cv = (vector signed char)(0);

  smallest = (vector signed short)(0);
  largest = (vector signed short)(0);

  /* Byte offset of 'in' inside its 16-byte block. Only the low four bits are
   * needed; unsigned long avoids a truncating pointer-to-int cast.
   */
  pad = (int)((unsigned long)in & 15);
  if(pad != 0){
    /* Load unaligned leading word: the permute moves the samples that start
     * at 'in' to the front of the register and fills the rest with zeros.
     */
    x = vec_perm(vec_ld(0,in),(vector signed short)(0),vec_lvsl(0,in));
    if(cnt < 8){ /* Shift right to chop stuff beyond end of short block */
      s.c[15] = (8-cnt)<<4;
      x = vec_sro(x,s.cv);
    }
    smallest = vec_min(smallest,x);
    largest = vec_max(largest,x);
    /* Skip the samples just consumed; cnt may go negative for short blocks,
     * in which case both remaining stages are skipped.
     */
    in += 8-pad/2;
    cnt -= 8-pad/2;
  }
  /* Everything is now aligned, rip through most of the block */
  while(cnt >= 8){
    x = vec_ld(0,in);
    smallest = vec_min(smallest,x);
    largest = vec_max(largest,x);
    in += 8;
    cnt -= 8;
  }
  /* Handle trailing fragment, if any: shifting right pushes the elements
   * past the end of the data out of the register and shifts zeros in.
   */
  if(cnt > 0){
    x = vec_ld(0,in);
    s.c[15] = (8-cnt)<<4;
    x = vec_sro(x,s.cv);
    smallest = vec_min(smallest,x);
    largest = vec_max(largest,x);
  }
  /* Combine and extract result. The saturating vec_abss maps -32768 to
   * 32767; plain vec_abs would leave it at -32768 and the vec_max would
   * then discard the strongest negative sample.
   */
  largest = vec_max(largest,vec_abss(smallest));

  /* Horizontal maximum: fold the register onto itself in three halving
   * steps so that the last element ends up holding the overall maximum.
   */
  s.c[15] = 64; /* Shift right four 16-bit words */
  largest = vec_max(largest,vec_sro(largest,s.cv));

  s.c[15] = 32; /* Shift right two 16-bit words */
  largest = vec_max(largest,vec_sro(largest,s.cv));

  s.c[15] = 16; /* Shift right one 16-bit word */
  largest = vec_max(largest,vec_sro(largest,s.cv));

  s.hv = largest;
  return s.s[7];
}