/* Source: /aosp_15_r20/external/fec/sumsq_mmx.c (revision 638691a093b4f9473cd6ee8f3e0139deef159a86) */
/* Compute the sum of the squares of a vector of signed shorts

 *  MMX-assisted version (also used on SSE)

 * The SSE2 and MMX assist routines both operate on multiples of
 * 8 words; they differ only in their alignment requirements (8 bytes
 * for MMX, 16 bytes for SSE2)

 * Copyright 2004 Phil Karn, KA9Q
 * May be used under the terms of the GNU Lesser Public License (LGPL)
 */
#include <stdint.h>

/* Vector helper; declared here but not defined in this file.
 * It is called below with an 8-byte-aligned pointer and the remaining
 * element count, and its return value is added to the running sum.
 */
long long sumsq_mmx_assist(signed short *in,int cnt);

/* Return the sum of the squares of the cnt signed 16-bit samples at in.
 *
 *  in   first sample; any alignment is accepted
 *  cnt  number of samples; a count of zero or less yields 0
 *
 * Work is split three ways: a scalar loop walks up to the next 8-byte
 * boundary, sumsq_mmx_assist() takes the aligned bulk, and a scalar
 * loop finishes the remainder.
 */
long long sumsq_mmx(signed short *in,int cnt){
  long long sum = 0;

  /* An empty vector sums to zero.  A negative count is rejected here as
   * well: otherwise the loop below would count away from zero while
   * reading memory, and the helper would be handed a negative length.
   */
  if(cnt <= 0){
    return 0;
  }

  /* Handle stuff before the next 8-byte boundary.  The address is
   * inspected through uintptr_t; casting a pointer to int is
   * implementation-defined and truncates where pointers are wider
   * than int.
   */
  while(((uintptr_t)in & 7) != 0 && cnt != 0){
    sum += (long long)in[0] * in[0];
    in++;
    cnt--;
  }

  /* Aligned bulk.  The helper receives the full remaining count; the
   * pointer/count adjustment that follows assumes it consumed exactly
   * the leading (cnt & ~7) samples, i.e. a whole number of 8-word
   * groups as described in the file header.
   */
  sum += sumsq_mmx_assist(in,cnt);
  in += cnt & ~7;
  cnt &= 7;

  /* Handle up to 7 words at end */
  while(cnt != 0){
    sum += (long long)in[0] * in[0];
    in++;
    cnt--;
  }
  return sum;
}
36