/* Compute the sum of the squares of a vector of signed shorts

 * MMX-assisted version (also used on SSE)

 * The SSE2 and MMX assist routines both operate on multiples of
 * 8 words; they differ only in their alignment requirements (8 bytes
 * for MMX, 16 bytes for SSE2)

 * Copyright 2004 Phil Karn, KA9Q
 * May be used under the terms of the GNU Lesser Public License (LGPL)
 */
#include <stdint.h>

/* Assist routine, defined outside this file.  Judging by how it is used
 * below, it is expected to return the sum of squares of the leading
 * (cnt & ~7) words of an 8-byte-aligned buffer -- confirm against its
 * implementation.
 */
long long sumsq_mmx_assist(signed short *,int);

/* Return the sum of in[i]*in[i] for i in [0, cnt).
 *
 * in  - first word of the vector; any alignment is accepted
 * cnt - number of words; a negative count is treated as empty and
 *       yields 0
 *
 * The work is split into three phases: a scalar loop up to the next
 * 8-byte boundary, one call to the assist routine for the aligned bulk,
 * and a scalar loop for the (at most 7) words left over.
 */
long long sumsq_mmx(signed short *in,int cnt){
  long long sum = 0;

  /* A negative count would otherwise run the scalar loops out of bounds
   * and pass a nonsensical length to the assist routine.
   */
  if(cnt < 0)
    return 0;

  /* Handle stuff before the next 8-byte boundary.  The address is
   * inspected through uintptr_t so that the pointer is not truncated
   * on targets where int is narrower than a pointer.
   */
  while(((uintptr_t)in & 7) != 0 && cnt != 0){
    sum += (long long)in[0] * in[0];
    in++;
    cnt--;
  }

  /* Aligned bulk: whole groups of 8 words */
  sum += sumsq_mmx_assist(in,cnt);
  in += cnt & ~7;
  cnt &= 7;

  /* Handle up to 7 words at end */
  while(cnt != 0){
    sum += (long long)in[0] * in[0];
    in++;
    cnt--;
  }
  return sum;
}