#include #include #include #include #define H 5 #define W 5 #define IDX(n) ((n)%3) void applySeparableGaussianBlur(float src[H][W], float dst[H][W], int h, int w, float kx[3], float ky[3]) { float buf[H][W-1]={0}; float32x4_t kx_vec=vld1q_f32(kx); float32x4_t ky_vec=vld1q_f32(ky); for(int k = 0; k< 2; ++k) { for(int j=1;j