Lines Matching full:vec1

415   v8i16 vec0, vec1, vec2;  in I422ToARGBRow_MSA()  local
428 YUVTORGB(src0, src1, vec_ubvr, vec_ugvg, vec_yg, vec_yb, vec0, vec1, vec2); in I422ToARGBRow_MSA()
429 STOREARGB(vec0, vec1, vec2, alpha, dst_argb); in I422ToARGBRow_MSA()
445 v8i16 vec0, vec1, vec2; in I422ToRGBARow_MSA() local
458 YUVTORGB(src0, src1, vec_ubvr, vec_ugvg, vec_yg, vec_yb, vec0, vec1, vec2); in I422ToRGBARow_MSA()
459 STOREARGB(alpha, vec0, vec1, vec2, dst_argb); in I422ToRGBARow_MSA()
477 v8i16 vec0, vec1, vec2; in I422AlphaToARGBRow_MSA() local
492 YUVTORGB(src0, src1, vec_ubvr, vec_ugvg, vec_yg, vec_yb, vec0, vec1, vec2); in I422AlphaToARGBRow_MSA()
494 STOREARGB(vec0, vec1, vec2, src3, dst_argb); in I422AlphaToARGBRow_MSA()
512 v8i16 vec0, vec1, vec2, vec3, vec4, vec5; in I422ToRGB24Row_MSA() local
536 YUVTORGB(src0, src1, vec_ubvr, vec_ugvg, vec_yg, vec_yb, vec0, vec1, vec2); in I422ToRGB24Row_MSA()
538 reg0 = (v16u8)__msa_ilvev_b((v16i8)vec1, (v16i8)vec0); in I422ToRGB24Row_MSA()
563 v8i16 vec0, vec1, vec2; in I422ToRGB565Row_MSA() local
575 YUVTORGB(src0, src1, vec_ubvr, vec_ugvg, vec_yg, vec_yb, vec0, vec1, vec2); in I422ToRGB565Row_MSA()
577 vec1 = __msa_srli_h(vec1, 2); in I422ToRGB565Row_MSA()
580 vec1 = __msa_slli_h(vec1, 5); in I422ToRGB565Row_MSA()
581 vec0 |= vec1; in I422ToRGB565Row_MSA()
600 v8i16 vec0, vec1, vec2; in I422ToARGB4444Row_MSA() local
615 YUVTORGB(src0, src1, vec_ubvr, vec_ugvg, vec_yg, vec_yb, vec0, vec1, vec2); in I422ToARGB4444Row_MSA()
618 reg1 = (v8u16)__msa_and_v(vec1, mask); in I422ToARGB4444Row_MSA()
639 v8i16 vec0, vec1, vec2; in I422ToARGB1555Row_MSA() local
653 YUVTORGB(src0, src1, vec_ubvr, vec_ugvg, vec_yg, vec_yb, vec0, vec1, vec2); in I422ToARGB1555Row_MSA()
655 reg1 = (v8u16)__msa_srli_h(vec1, 3); in I422ToARGB1555Row_MSA()
692 v16u8 vec0, vec1, dst0, dst1; in YUY2ToUVRow_MSA() local
702 vec1 = __msa_aver_u_b(src1, src3); in YUY2ToUVRow_MSA()
703 dst0 = (v16u8)__msa_pckev_b((v16i8)vec1, (v16i8)vec0); in YUY2ToUVRow_MSA()
704 dst1 = (v16u8)__msa_pckod_b((v16i8)vec1, (v16i8)vec0); in YUY2ToUVRow_MSA()
757 v16u8 vec0, vec1, dst0, dst1; in UYVYToUVRow_MSA() local
767 vec1 = __msa_aver_u_b(src1, src3); in UYVYToUVRow_MSA()
768 dst0 = (v16u8)__msa_pckev_b((v16i8)vec1, (v16i8)vec0); in UYVYToUVRow_MSA()
769 dst1 = (v16u8)__msa_pckod_b((v16i8)vec1, (v16i8)vec0); in UYVYToUVRow_MSA()
802 v16u8 src0, src1, src2, src3, vec0, vec1, vec2, vec3, dst0; in ARGBToYRow_MSA() local
816 vec1 = (v16u8)__msa_pckev_b((v16i8)src3, (v16i8)src2); in ARGBToYRow_MSA()
820 reg1 = (v8u16)__msa_ilvev_b(zero, (v16i8)vec1); in ARGBToYRow_MSA()
824 reg5 = (v8u16)__msa_ilvod_b(zero, (v16i8)vec1); in ARGBToYRow_MSA()
854 v16u8 vec0, vec1, vec2, vec3, vec4, vec5, vec6, vec7, vec8, vec9; in ARGBToUVRow_MSA() local
875 vec1 = (v16u8)__msa_pckev_b((v16i8)src3, (v16i8)src2); in ARGBToUVRow_MSA()
882 vec8 = (v16u8)__msa_pckev_b((v16i8)vec1, (v16i8)vec0); in ARGBToUVRow_MSA()
886 vec0 = (v16u8)__msa_pckod_b((v16i8)vec1, (v16i8)vec0); in ARGBToUVRow_MSA()
887 vec1 = (v16u8)__msa_pckod_b((v16i8)vec3, (v16i8)vec2); in ARGBToUVRow_MSA()
893 reg5 = __msa_hadd_u_h(vec1, vec1); in ARGBToUVRow_MSA()
903 vec1 = (v16u8)__msa_pckev_b((v16i8)src3, (v16i8)src2); in ARGBToUVRow_MSA()
910 vec8 = (v16u8)__msa_pckev_b((v16i8)vec1, (v16i8)vec0); in ARGBToUVRow_MSA()
914 vec0 = (v16u8)__msa_pckod_b((v16i8)vec1, (v16i8)vec0); in ARGBToUVRow_MSA()
915 vec1 = (v16u8)__msa_pckod_b((v16i8)vec3, (v16i8)vec2); in ARGBToUVRow_MSA()
921 reg5 += __msa_hadd_u_h(vec1, vec1); in ARGBToUVRow_MSA()
1022 v16u8 vec0, vec1, vec2, vec3, vec4, vec5, vec6, vec7; in ARGBToRGB565Row_MSA() local
1029 vec1 = (v16u8)__msa_slli_b((v16i8)src0, 3); in ARGBToRGB565Row_MSA()
1034 vec1 = (v16u8)__msa_sldi_b(zero, (v16i8)vec1, 1); in ARGBToRGB565Row_MSA()
1040 vec0 = __msa_binsli_b(vec0, vec1, 2); in ARGBToRGB565Row_MSA()
1041 vec1 = __msa_binsli_b(vec2, vec3, 4); in ARGBToRGB565Row_MSA()
1044 vec0 = (v16u8)__msa_ilvev_b((v16i8)vec1, (v16i8)vec0); in ARGBToRGB565Row_MSA()
1058 v16u8 vec0, vec1, vec2, vec3, vec4, vec5, vec6, vec7, vec8, vec9; in ARGBToARGB1555Row_MSA() local
1065 vec1 = (v16u8)__msa_slli_b((v16i8)src0, 2); in ARGBToARGB1555Row_MSA()
1067 vec1 = (v16u8)__msa_sldi_b(zero, (v16i8)vec1, 1); in ARGBToARGB1555Row_MSA()
1080 vec0 = __msa_binsli_b(vec0, vec1, 2); in ARGBToARGB1555Row_MSA()
1082 vec1 = __msa_binsli_b(vec2, vec3, 5); in ARGBToARGB1555Row_MSA()
1084 vec1 = __msa_binsli_b(vec1, vec4, 0); in ARGBToARGB1555Row_MSA()
1086 vec0 = (v16u8)__msa_ilvev_b((v16i8)vec1, (v16i8)vec0); in ARGBToARGB1555Row_MSA()
1087 vec1 = (v16u8)__msa_ilvev_b((v16i8)vec6, (v16i8)vec5); in ARGBToARGB1555Row_MSA()
1088 dst0 = (v16u8)__msa_pckev_h((v8i16)vec1, (v8i16)vec0); in ARGBToARGB1555Row_MSA()
1100 v16u8 vec0, vec1; in ARGBToARGB4444Row_MSA() local
1108 vec1 = (v16u8)__msa_srai_b((v16i8)src1, 4); in ARGBToARGB4444Row_MSA()
1112 vec1 = __msa_binsli_b(vec1, src1, 3); in ARGBToARGB4444Row_MSA()
1113 dst0 = (v16u8)__msa_pckev_b((v16i8)vec1, (v16i8)vec0); in ARGBToARGB4444Row_MSA()
1126 v8u16 vec0, vec1, vec2, vec3, vec4, vec5, vec6, vec7; in ARGBToUV444Row_MSA() local
1149 vec1 = (v8u16)__msa_ilvl_b(zero, (v16i8)src0); in ARGBToUV444Row_MSA()
1155 vec11 = vec1 * const_18; in ARGBToUV444Row_MSA()
1161 vec1 *= const_112; in ARGBToUV444Row_MSA()
1171 vec1 += const_32896; in ARGBToUV444Row_MSA()
1175 vec1 -= vec3; in ARGBToUV444Row_MSA()
1179 vec1 = (v8u16)__msa_srai_h((v8i16)vec1, 8); in ARGBToUV444Row_MSA()
1182 dst0 = (v16u8)__msa_pckev_b((v16i8)vec1, (v16i8)vec0); in ARGBToUV444Row_MSA()
1198 v8u16 vec0, vec1, vec2, vec3; in ARGBMultiplyRow_MSA() local
1206 vec1 = (v8u16)__msa_ilvl_b((v16i8)src0, (v16i8)src0); in ARGBMultiplyRow_MSA()
1211 reg2 = (v4u32)__msa_ilvr_h(zero, (v8i16)vec1); in ARGBMultiplyRow_MSA()
1212 reg3 = (v4u32)__msa_ilvl_h(zero, (v8i16)vec1); in ARGBMultiplyRow_MSA()
1222 vec1 = (v8u16)__msa_pckev_h((v8i16)reg3, (v8i16)reg2); in ARGBMultiplyRow_MSA()
1223 dst0 = (v16u8)__msa_pckev_b((v16i8)vec1, (v16i8)vec0); in ARGBMultiplyRow_MSA()
1278 v8u16 vec0, vec1, vec2, vec3, vec4, vec5, vec6, vec7, vec8, vec9; in ARGBAttenuateRow_MSA() local
1287 vec1 = (v8u16)__msa_ilvl_b((v16i8)src0, (v16i8)src0); in ARGBAttenuateRow_MSA()
1292 vec6 = (v8u16)__msa_fill_h(vec1[3]); in ARGBAttenuateRow_MSA()
1293 vec7 = (v8u16)__msa_fill_h(vec1[7]); in ARGBAttenuateRow_MSA()
1312 reg2 *= (v4u32)__msa_ilvr_h(zero, (v8i16)vec1); in ARGBAttenuateRow_MSA()
1313 reg3 *= (v4u32)__msa_ilvl_h(zero, (v8i16)vec1); in ARGBAttenuateRow_MSA()
1327 vec1 = (v8u16)__msa_pckev_h((v8i16)reg3, (v8i16)reg2); in ARGBAttenuateRow_MSA()
1330 dst0 = (v16u8)__msa_pckev_b((v16i8)vec1, (v16i8)vec0); in ARGBAttenuateRow_MSA()
1345 v16u8 src0, src1, dst0, vec0, vec1; in ARGBToRGB565DitherRow_MSA() local
1358 vec1 = (v16u8)__msa_pckod_b((v16i8)src1, (v16i8)src0); in ARGBToRGB565DitherRow_MSA()
1360 reg1 = (v8i16)__msa_ilvev_b(zero, (v16i8)vec1); in ARGBToRGB565DitherRow_MSA()
1414 v8u16 vec0, vec1; in ARGBShadeRow_MSA() local
1425 vec1 = (v8u16)__msa_ilvl_b((v16i8)src0, (v16i8)src0); in ARGBShadeRow_MSA()
1428 reg2 = (v4u32)__msa_ilvr_h(zero, (v8i16)vec1); in ARGBShadeRow_MSA()
1429 reg3 = (v4u32)__msa_ilvl_h(zero, (v8i16)vec1); in ARGBShadeRow_MSA()
1439 vec1 = (v8u16)__msa_pckev_h((v8i16)reg3, (v8i16)reg2); in ARGBShadeRow_MSA()
1440 dst0 = (v16u8)__msa_pckev_b((v16i8)vec1, (v16i8)vec0); in ARGBShadeRow_MSA()
1449 v16u8 src0, src1, vec0, vec1, dst0, dst1; in ARGBGrayRow_MSA() local
1458 vec1 = (v16u8)__msa_pckod_h((v8i16)src1, (v8i16)src0); in ARGBGrayRow_MSA()
1460 reg0 = __msa_dpadd_u_h(reg0, vec1, const_0x4D); in ARGBGrayRow_MSA()
1463 vec1 = (v16u8)__msa_ilvod_b((v16i8)vec1, (v16i8)vec0); in ARGBGrayRow_MSA()
1464 dst0 = (v16u8)__msa_ilvr_b((v16i8)vec1, (v16i8)vec0); in ARGBGrayRow_MSA()
1465 dst1 = (v16u8)__msa_ilvl_b((v16i8)vec1, (v16i8)vec0); in ARGBGrayRow_MSA()
1474 v16u8 src0, src1, dst0, dst1, vec0, vec1, vec2, vec3, vec4, vec5; in ARGBSepiaRow_MSA() local
1488 vec1 = (v16u8)__msa_pckod_h((v8i16)src1, (v8i16)src0); in ARGBSepiaRow_MSA()
1489 vec3 = (v16u8)__msa_pckod_b((v16i8)vec1, (v16i8)vec1); in ARGBSepiaRow_MSA()
1493 reg0 = (v8u16)__msa_dpadd_u_h(reg0, vec1, const_0x23); in ARGBSepiaRow_MSA()
1494 reg1 = (v8u16)__msa_dpadd_u_h(reg1, vec1, const_0x2D); in ARGBSepiaRow_MSA()
1495 reg2 = (v8u16)__msa_dpadd_u_h(reg2, vec1, const_0x32); in ARGBSepiaRow_MSA()
1502 vec1 = (v16u8)__msa_pckev_b((v16i8)reg1, (v16i8)reg1); in ARGBSepiaRow_MSA()
1505 vec5 = (v16u8)__msa_ilvr_b((v16i8)vec3, (v16i8)vec1); in ARGBSepiaRow_MSA()
1518 v8u16 vec0, vec1, vec2, vec3; in ARGB4444ToARGBRow_MSA() local
1525 vec1 = (v8u16)__msa_andi_b(src1, 0x0F); in ARGB4444ToARGBRow_MSA()
1529 vec1 |= (v8u16)__msa_slli_b((v16i8)vec1, 4); in ARGB4444ToARGBRow_MSA()
1534 dst2 = (v16u8)__msa_ilvr_b((v16i8)vec3, (v16i8)vec1); in ARGB4444ToARGBRow_MSA()
1535 dst3 = (v16u8)__msa_ilvl_b((v16i8)vec3, (v16i8)vec1); in ARGB4444ToARGBRow_MSA()
1547 v8u16 vec0, vec1, vec2, vec3, vec4, vec5; in ARGB1555ToARGBRow_MSA() local
1556 vec1 = src1 & const_0x1F; in ARGB1555ToARGBRow_MSA()
1567 reg0 = (v16u8)__msa_pckev_b((v16i8)vec1, (v16i8)vec0); in ARGB1555ToARGBRow_MSA()
1596 v8u16 src0, src1, vec0, vec1, vec2, vec3, vec4, vec5; in RGB565ToARGBRow_MSA() local
1608 vec1 = src0 & const_0x7E0; in RGB565ToARGBRow_MSA()
1614 reg1 = (v8u16)__msa_srli_h((v8i16)vec1, 3); in RGB565ToARGBRow_MSA()
1620 reg1 |= (v8u16)__msa_srli_h((v8i16)vec1, 9); in RGB565ToARGBRow_MSA()
1644 v16u8 vec0, vec1, vec2; in RGB24ToARGBRow_MSA() local
1654 vec1 = (v16u8)__msa_sldi_b((v16i8)src2, (v16i8)src1, 8); in RGB24ToARGBRow_MSA()
1658 dst2 = (v16u8)__msa_vshf_b(shuffler, (v16i8)alpha, (v16i8)vec1); in RGB24ToARGBRow_MSA()
1669 v16u8 vec0, vec1, vec2; in RAWToARGBRow_MSA() local
1679 vec1 = (v16u8)__msa_sldi_b((v16i8)src2, (v16i8)src1, 8); in RAWToARGBRow_MSA()
1683 dst2 = (v16u8)__msa_vshf_b(mask, (v16i8)alpha, (v16i8)vec1); in RAWToARGBRow_MSA()
1798 v8u16 vec0, vec1, vec2, vec3; in RGB24ToYRow_MSA() local
1818 vec1 = (v8u16)__msa_pckev_h((v8i16)reg3, (v8i16)reg2); in RGB24ToYRow_MSA()
1822 vec1 = __msa_dotp_u_h((v16u8)vec1, (v16u8)const_0x8119); in RGB24ToYRow_MSA()
1824 vec1 = __msa_dpadd_u_h(vec1, (v16u8)vec3, (v16u8)const_0x42); in RGB24ToYRow_MSA()
1826 vec1 += const_0x1080; in RGB24ToYRow_MSA()
1828 vec1 = (v8u16)__msa_srai_h((v8i16)vec1, 8); in RGB24ToYRow_MSA()
1829 dst0 = (v16u8)__msa_pckev_b((v16i8)vec1, (v16i8)vec0); in RGB24ToYRow_MSA()
1839 v8u16 vec0, vec1, vec2, vec3; in RAWToYRow_MSA() local
1859 vec1 = (v8u16)__msa_pckev_h((v8i16)reg3, (v8i16)reg2); in RAWToYRow_MSA()
1863 vec1 = __msa_dotp_u_h((v16u8)vec1, (v16u8)const_0x8142); in RAWToYRow_MSA()
1865 vec1 = __msa_dpadd_u_h(vec1, (v16u8)vec3, (v16u8)const_0x19); in RAWToYRow_MSA()
1867 vec1 += const_0x1080; in RAWToYRow_MSA()
1869 vec1 = (v8u16)__msa_srai_h((v8i16)vec1, 8); in RAWToYRow_MSA()
1870 dst0 = (v16u8)__msa_pckev_b((v16i8)vec1, (v16i8)vec0); in RAWToYRow_MSA()
2030 v8u16 vec0, vec1, vec2, vec3, vec4, vec5, vec6, vec7; in RGB24ToUVRow_MSA() local
2065 vec1 = (v8u16)__msa_ilvl_b((v16i8)src4, (v16i8)src0); in RGB24ToUVRow_MSA()
2073 vec1 = (v8u16)__msa_hadd_u_h((v16u8)vec1, (v16u8)vec1); in RGB24ToUVRow_MSA()
2080 reg0 = (v8i16)__msa_pckev_d((v2i64)vec1, (v2i64)vec0); in RGB24ToUVRow_MSA()
2084 reg0 += (v8i16)__msa_pckod_d((v2i64)vec1, (v2i64)vec0); in RGB24ToUVRow_MSA()
2101 vec1 = (v8u16)__msa_pckev_h((v8i16)vec7, (v8i16)vec6); in RGB24ToUVRow_MSA()
2104 vec4 = vec1 * const_0x4A; in RGB24ToUVRow_MSA()
2107 vec1 *= const_0x5E; in RGB24ToUVRow_MSA()
2111 reg2 = __msa_subv_h((v8i16)vec2, (v8i16)vec1); in RGB24ToUVRow_MSA()
2140 v8u16 vec0, vec1, vec2, vec3, vec4, vec5, vec6, vec7; in RAWToUVRow_MSA() local
2175 vec1 = (v8u16)__msa_ilvl_b((v16i8)src4, (v16i8)src0); in RAWToUVRow_MSA()
2183 vec1 = (v8u16)__msa_hadd_u_h((v16u8)vec1, (v16u8)vec1); in RAWToUVRow_MSA()
2190 reg0 = (v8i16)__msa_pckev_d((v2i64)vec1, (v2i64)vec0); in RAWToUVRow_MSA()
2194 reg0 += (v8i16)__msa_pckod_d((v2i64)vec1, (v2i64)vec0); in RAWToUVRow_MSA()
2211 vec1 = (v8u16)__msa_pckev_h((v8i16)vec7, (v8i16)vec6); in RAWToUVRow_MSA()
2214 vec4 = vec1 * const_0x4A; in RAWToUVRow_MSA()
2217 vec1 *= const_0x5E; in RAWToUVRow_MSA()
2221 reg2 = __msa_subv_h((v8i16)vec2, (v8i16)vec1); in RAWToUVRow_MSA()
2247 v8i16 vec0, vec1, vec2; in NV12ToARGBRow_MSA() local
2263 YUVTORGB(src0, src1, vec_ubvr, vec_ugvg, vec_yg, vec_yb, vec0, vec1, vec2); in NV12ToARGBRow_MSA()
2265 res1 = (v16u8)__msa_ilvev_b((v16i8)alpha, (v16i8)vec1); in NV12ToARGBRow_MSA()
2283 v8i16 vec0, vec1, vec2; in NV12ToRGB565Row_MSA() local
2298 YUVTORGB(src0, src1, vec_ubvr, vec_ugvg, vec_yg, vec_yb, vec0, vec1, vec2); in NV12ToRGB565Row_MSA()
2300 vec1 = (vec1 >> 2) << 5; in NV12ToRGB565Row_MSA()
2302 dst0 = (v16u8)(vec0 | vec1 | vec2); in NV12ToRGB565Row_MSA()
2318 v8i16 vec0, vec1, vec2; in NV21ToARGBRow_MSA() local
2336 YUVTORGB(src0, src1, vec_ubvr, vec_ugvg, vec_yg, vec_yb, vec0, vec1, vec2); in NV21ToARGBRow_MSA()
2338 res1 = (v16u8)__msa_ilvev_b((v16i8)alpha, (v16i8)vec1); in NV21ToARGBRow_MSA()
2402 v16u8 src0, src1, vec0, vec1, vec2; in SobelXYRow_MSA() local
2410 vec1 = (v16u8)__msa_ilvr_b((v16i8)src0, (v16i8)src1); in SobelXYRow_MSA()
2414 dst0 = (v16u8)__msa_ilvr_b((v16i8)reg0, (v16i8)vec1); in SobelXYRow_MSA()
2415 dst1 = (v16u8)__msa_ilvl_b((v16i8)reg0, (v16i8)vec1); in SobelXYRow_MSA()
2514 v8u16 vec0, vec1, vec2, vec3; in ARGBToUVJRow_MSA() local
2549 vec1 = __msa_aver_u_h(src6, src7); in ARGBToUVJRow_MSA()
2573 ARGBTOUV(vec0, vec1, vec2, vec3, const_0x0000003f, const_0x00008080, in ARGBToUVJRow_MSA()
2598 vec1 = __msa_aver_u_h(src6, src7); in ARGBToUVJRow_MSA()
2622 ARGBTOUV(vec0, vec1, vec2, vec3, const_0x0000003f, const_0x00008080, in ARGBToUVJRow_MSA()
2750 v8i16 vec0, vec1, vec2; in I444ToARGBRow_MSA() local
2772 vec1 = (v8u16)__msa_ilvr_b((v16i8)zero, (v16i8)src2); in I444ToARGBRow_MSA()
2775 reg8 = (v4i32)__msa_ilvr_h((v8i16)zero, (v8i16)vec1); in I444ToARGBRow_MSA()
2776 reg9 = (v4i32)__msa_ilvl_h((v8i16)zero, (v8i16)vec1); in I444ToARGBRow_MSA()
2799 vec1 = (v8u16)__msa_pckev_h((v8i16)reg5, (v8i16)reg4); in I444ToARGBRow_MSA()
2801 vec0 = (v8u16)__msa_ilvev_b((v16i8)vec1, (v16i8)vec0); in I444ToARGBRow_MSA()
2802 vec1 = (v8u16)__msa_ilvev_b((v16i8)alpha, (v16i8)vec2); in I444ToARGBRow_MSA()
2803 dst0 = (v16u8)__msa_ilvr_h((v8i16)vec1, (v8i16)vec0); in I444ToARGBRow_MSA()
2804 dst1 = (v16u8)__msa_ilvl_h((v8i16)vec1, (v8i16)vec0); in I444ToARGBRow_MSA()
2827 v8i16 vec0, vec1; in I400ToARGBRow_MSA() local
2838 vec1 = (v8i16)__msa_ilvl_b((v16i8)src0, (v16i8)src0); in I400ToARGBRow_MSA()
2841 reg2 = (v4i32)__msa_ilvr_h(zero, vec1); in I400ToARGBRow_MSA()
2842 reg3 = (v4i32)__msa_ilvl_h(zero, vec1); in I400ToARGBRow_MSA()
2852 vec1 = (v8i16)__msa_pckev_h((v8i16)reg3, (v8i16)reg2); in I400ToARGBRow_MSA()
2854 vec1 += vec_ygb; in I400ToARGBRow_MSA()
2856 vec1 = __msa_srai_h(vec1, 6); in I400ToARGBRow_MSA()
2858 vec1 = __msa_maxi_s_h(vec1, 0); in I400ToARGBRow_MSA()
2860 vec1 = __msa_min_s_h(max, vec1); in I400ToARGBRow_MSA()
2861 res0 = (v16u8)__msa_pckev_b((v16i8)vec1, (v16i8)vec0); in I400ToARGBRow_MSA()
2878 v16u8 src0, vec0, vec1, vec2, vec3, dst0, dst1, dst2, dst3; in J400ToARGBRow_MSA() local
2884 vec1 = (v16u8)__msa_ilvl_b((v16i8)src0, (v16i8)src0); in J400ToARGBRow_MSA()
2889 dst2 = (v16u8)__msa_ilvr_b((v16i8)vec3, (v16i8)vec1); in J400ToARGBRow_MSA()
2890 dst3 = (v16u8)__msa_ilvl_b((v16i8)vec3, (v16i8)vec1); in J400ToARGBRow_MSA()
2903 v8i16 vec0, vec1, vec2; in YUY2ToARGBRow_MSA() local
2917 YUVTORGB(src1, src2, vec_ubvr, vec_ugvg, vec_yg, vec_yb, vec0, vec1, vec2); in YUY2ToARGBRow_MSA()
2918 STOREARGB(vec0, vec1, vec2, alpha, dst_argb); in YUY2ToARGBRow_MSA()
2930 v8i16 vec0, vec1, vec2; in UYVYToARGBRow_MSA() local
2944 YUVTORGB(src1, src2, vec_ubvr, vec_ugvg, vec_yg, vec_yb, vec0, vec1, vec2); in UYVYToARGBRow_MSA()
2945 STOREARGB(vec0, vec1, vec2, alpha, dst_argb); in UYVYToARGBRow_MSA()
2963 v8u16 vec0, vec1, vec2, vec3, y_frac; in InterpolateRow_MSA() local
2995 vec1 = (v8u16)__msa_ilvl_b((v16i8)src2, (v16i8)src0); in InterpolateRow_MSA()
2999 vec1 = (v8u16)__msa_dotp_u_h((v16u8)vec1, (v16u8)y_frac); in InterpolateRow_MSA()
3003 vec1 = (v8u16)__msa_srari_h((v8i16)vec1, 8); in InterpolateRow_MSA()
3006 dst0 = (v16u8)__msa_pckev_b((v16i8)vec1, (v16i8)vec0); in InterpolateRow_MSA()
3073 v16u8 src0, src1, src2, src3, vec0, vec1, dst0; in ARGBExtractAlphaRow_MSA() local
3081 vec1 = (v16u8)__msa_pckod_b((v16i8)src3, (v16i8)src2); in ARGBExtractAlphaRow_MSA()
3082 dst0 = (v16u8)__msa_pckod_b((v16i8)vec1, (v16i8)vec0); in ARGBExtractAlphaRow_MSA()
3095 v8u16 vec0, vec1, vec2, vec3, vec4, vec5, vec6, vec7; in ARGBBlendRow_MSA() local
3108 vec1 = (v8u16)__msa_ilvl_b(zero, (v16i8)src0); in ARGBBlendRow_MSA()
3117 vec10 = (v8u16)__msa_fill_h(vec1[3]); in ARGBBlendRow_MSA()
3118 vec11 = (v8u16)__msa_fill_h(vec1[7]); in ARGBBlendRow_MSA()
3139 dst0 = (v16u8)__msa_pckev_b((v16i8)vec1, (v16i8)vec0); in ARGBBlendRow_MSA()
3161 v8i16 vec0, vec1, vec2, vec3, vec4, vec5, vec6, vec7; in ARGBQuantizeRow_MSA() local
3176 vec1 = (v8i16)__msa_ilvl_b(zero, (v16i8)src0); in ARGBQuantizeRow_MSA()
3185 tmp2 = (v4i32)__msa_ilvr_h((v8i16)zero, (v8i16)vec1); in ARGBQuantizeRow_MSA()
3186 tmp3 = (v4i32)__msa_ilvl_h((v8i16)zero, (v8i16)vec1); in ARGBQuantizeRow_MSA()
3232 vec1 = (v8i16)__msa_pckev_h((v8i16)tmp3, (v8i16)tmp2); in ARGBQuantizeRow_MSA()
3239 dst0 = (v16u8)__msa_pckev_b((v16i8)vec1, (v16i8)vec0); in ARGBQuantizeRow_MSA()
3267 v8i16 vec0, vec1, vec2, vec3, vec4, vec5, vec6, vec7, vec8, vec9; in ARGBColorMatrixRow_MSA() local
3276 vec1 = (v8i16)__msa_ilvl_b(zero, src0); in ARGBColorMatrixRow_MSA()
3294 vec11 = vec2 * vec1; in ARGBColorMatrixRow_MSA()
3296 vec13 = vec6 * vec1; in ARGBColorMatrixRow_MSA()
3302 vec15 = vec3 * vec1; in ARGBColorMatrixRow_MSA()
3304 vec17 = vec7 * vec1; in ARGBColorMatrixRow_MSA()
3322 vec6 = vec4 * vec1; in ARGBColorMatrixRow_MSA()
3324 vec7 = vec8 * vec1; in ARGBColorMatrixRow_MSA()
3330 vec8 = vec5 * vec1; in ARGBColorMatrixRow_MSA()
3332 vec9 = vec9 * vec1; in ARGBColorMatrixRow_MSA()
3439 v8i16 vec0, vec1, vec2, vec3, vec4, vec5; in SobelXRow_MSA() local
3454 vec1 = (v8i16)__msa_vshf_b(mask1, (v16i8)src1, (v16i8)src0); in SobelXRow_MSA()
3460 vec1 = (v8i16)__msa_hsub_u_h((v16u8)vec1, (v16u8)vec1); in SobelXRow_MSA()
3466 vec1 += vec3; in SobelXRow_MSA()
3470 vec1 += vec5; in SobelXRow_MSA()
3472 vec1 = __msa_add_a_h(zero, vec1); in SobelXRow_MSA()
3474 vec1 = __msa_maxi_s_h(vec1, 0); in SobelXRow_MSA()
3476 vec1 = __msa_min_s_h(max, vec1); in SobelXRow_MSA()
3477 dst0 = (v16u8)__msa_pckev_b((v16i8)vec1, (v16i8)vec0); in SobelXRow_MSA()
3492 v8i16 vec0, vec1, vec2, vec3, vec4, vec5, vec6; in SobelYRow_MSA() local
3500 vec1 = (v8i16)__msa_ilvl_b((v16i8)zero, (v16i8)src0); in SobelYRow_MSA()
3504 vec1 -= vec3; in SobelYRow_MSA()
3507 vec2 = (v8i16)__msa_sldi_b((v16i8)vec1, (v16i8)vec0, 2); in SobelYRow_MSA()
3508 vec3 = (v8i16)__msa_sldi_b((v16i8)vec6, (v16i8)vec1, 2); in SobelYRow_MSA()
3509 vec4 = (v8i16)__msa_sldi_b((v16i8)vec1, (v16i8)vec0, 4); in SobelYRow_MSA()
3510 vec5 = (v8i16)__msa_sldi_b((v16i8)vec6, (v16i8)vec1, 4); in SobelYRow_MSA()
3512 vec1 += vec3; in SobelYRow_MSA()
3516 vec1 += vec5; in SobelYRow_MSA()
3518 vec1 = __msa_add_a_h(zero, vec1); in SobelYRow_MSA()
3520 vec1 = __msa_maxi_s_h(vec1, 0); in SobelYRow_MSA()
3522 vec1 = __msa_min_s_h(max, vec1); in SobelYRow_MSA()
3523 dst0 = (v16u8)__msa_pckev_b((v16i8)vec1, (v16i8)vec0); in SobelYRow_MSA()
3537 v4u32 vec0, vec1, vec2, vec3, vec4, vec5, vec6, vec7; in HalfFloatRow_MSA() local
3550 vec1 = (v4u32)__msa_ilvl_h(zero, (v8i16)src0); in HalfFloatRow_MSA()
3558 fvec1 = __msa_ffint_u_w(vec1); in HalfFloatRow_MSA()
3574 vec1 = ((v4u32)fvec1) >> 13; in HalfFloatRow_MSA()
3581 dst0 = (v8u16)__msa_pckev_h((v8i16)vec1, (v8i16)vec0); in HalfFloatRow_MSA()