static void ConvertRGBA32ToUV_NEON(const uint16_t* rgb, uint8_t* u, uint8_t* v, int width) { int i; for (i = 0; i + 8 <= width; i += 8, rgb += 4 * 8) { const uint16x8x4_t RGB = vld4q_u16((const uint16_t*)rgb); int16x8_t U, V; CONVERT_RGB_TO_UV(RGB.val[0], RGB.val[1], RGB.val[2], 2, U, V); vst1_u8(u + i, vqrshrun_n_s16(U, 2)); vst1_u8(v + i, vqrshrun_n_s16(V, 2)); } for (; i < width; i += 1, rgb += 4) { const int r = rgb[0], g = rgb[1], b = rgb[2]; u[i] = VP8RGBToU(r, g, b, YUV_HALF << 2); v[i] = VP8RGBToV(r, g, b, YUV_HALF << 2); } }
inline uint16x8x4_t vld4q(const u16 * ptr) { return vld4q_u16(ptr); }
void test_vld4Qu16 (void) { uint16x8x4_t out_uint16x8x4_t; out_uint16x8x4_t = vld4q_u16 (0); }