Notifications: You must be signed in to change notification settings
Fork 56.4k
Star 85.4k

Commit be4331c

committed

Remove the need for an extra buffer + conversion.

1 parent 7c2c88e, commit be4331c (Copy full SHA for be4331c)

File tree

1 file changed

+55

-93

lines changed

modules/imgproc/src
- resize.cpp

1 file changed

+55

-93

lines changed

`‎modules/imgproc/src/resize.cpp‎`

Lines changed: 55 additions & 93 deletions

Original file line number	Diff line number	Diff line change
`@@ -3034,89 +3034,60 @@ static inline void vx_load_as(const ushort* ptr, v_float32& a)`
`3034`	`3034`	`staticinlinevoidvx_load_as(constshort* ptr, v_float32& a)`
`3035`	`3035`	`{ a =v_cvt_f32(v_reinterpret_as_s32(vx_load_expand(ptr))); }`
`3036`	`3036`
`3037`		`-template<typename VT>`
`3038`		`-VTvx_setall_local(double coeff);`
`3039`		`-template<>`
`3040`		`-v_float32vx_setall_local(double coeff) {`
	`3037`	`+staticinlinevoidvx_load_as(constfloat* ptr, v_float32& a)`
	`3038`	`+{ a =v_load(ptr); }`
	`3039`	`+`
	`3040`	`+v_float32vx_setall_local(float coeff) {`
`3041`	`3041`	`returnv_setall_f32(coeff);`
`3042`	`3042`	`}`
`3043`		`-template<typename WT,typename VT>`
`3044`		`-voidv_inter_area_set_sum(int col_end,const WT *const buf,const VT &v_coeff,`
`3045`		`- WT *sum,int &x) {`
	`3043`	`+#if CV_SIMD128_64F`
	`3044`	`+staticinlinevoidvx_load_as(constdouble* ptr, v_float64& a)`
	`3045`	`+{ a =v_load(ptr); }`
	`3046`	`+`
	`3047`	`+v_float64vx_setall_local(double coeff) {`
	`3048`	`+returnv_setall_f64(coeff);`
	`3049`	`+}`
	`3050`	`+#endif`
	`3051`	`+template<typename T,typename WT,typename VT>`
	`3052`	`+voidv_inter_area_set_or_update_sum(const T *const src,int n,bool do_set,`
	`3053`	`+ WT coeff, WT *sum) {`
`3046`	`3054`	`constexprint step = VT::nlanes;`
`3047`		`-for (x =0; x + step < col_end; x += step)`
	`3055`	`+const VT v_coeff =vx_setall_local(coeff);`
	`3056`	`+int x;`
	`3057`	`+if (do_set)`
`3048`	`3058`	`{`
`3049`		`-const VT line =vx_load(buf + x);`
`3050`		`-v_store(sum + x, line * v_coeff);`
	`3059`	`+for (x =0; x + step < n; x += step)`
	`3060`	`+ {`
	`3061`	`+ VT line;`
	`3062`	`+vx_load_as(src + x, line);`
	`3063`	`+v_store(sum + x, line * v_coeff);`
	`3064`	`+ }`
	`3065`	`+for(; x < n; ++x) sum[x] = saturate_cast<WT>(src[x]) * coeff;`
`3051`	`3066`	`}`
`3052`		`-}`
`3053`		`-template<typename WT,typename VT>`
`3054`		`-voidv_inter_area_update_sum(int col_end,const WT *const buf,const VT &v_coeff,`
`3055`		`- WT *sum,int &x) {`
`3056`		`-constexprint step = VT::nlanes;`
`3057`		`-for (x =0; x + step < col_end; x += step)`
	`3067`	`+else`
`3058`	`3068`	`{`
`3059`		`-const VT line =vx_load(buf + x);`
`3060`		`-const VT sum_x =vx_load(sum + x);`
`3061`		`-v_store(sum + x, sum_x + line * v_coeff);`
	`3069`	`+for (x =0; x + step < n; x += step)`
	`3070`	`+ {`
	`3071`	`+ VT line;`
	`3072`	`+vx_load_as(src + x, line);`
	`3073`	`+const VT sum_x =vx_load(sum + x);`
	`3074`	`+v_store(sum + x, sum_x + line * v_coeff);`
	`3075`	`+ }`
	`3076`	`+for(; x < n; ++x) sum[x] += saturate_cast<WT>(src[x]) * coeff;`
`3062`	`3077`	`}`
`3063`	`3078`	`}`
`3064`		`-template<typename S>`
`3065`		`-voidv_inter_area_copy_or_not(const S* s,int n,float d,floatconst*buf)`
`3066`		`-{`
`3067`		`-static_assert(!std::is_same<S,float>::value,"Do not specialize for float");`
`3068`		`-constexprint step = v_float32::nlanes;`
`3069`		`-int x =0;`
`3070`		`-for(; x + step < n; x += step)`
	`3079`	`+#if !CV_SIMD128_64F`
	`3080`	`+voidv_inter_area_set_or_update_sum(constdouble *const src,int n,bool do_set,`
	`3081`	`+double coeff,double *sum) {`
	`3082`	`+int x;`
	`3083`	`+if (do_set)`
`3071`	`3084`	`{`
`3072`		`- v_float32 a;`
`3073`		`-vx_load_as(s + x, a);`
`3074`		`-v_store(d + x, a);`
	`3085`	`+for(x =0; x < n; ++x) sum[x] = src[x] * coeff;`
	`3086`	`+ }`
	`3087`	`+else`
	`3088`	`+ {`
	`3089`	`+for(x =0; x < n; ++x) sum[x] += src[x] * coeff;`
`3075`	`3090`	`}`
`3076`		`-for(; x < n; ++x) d[x] = saturate_cast<float>(s[x]);`
`3077`		`- *buf = d;`
`3078`		`-}`
`3079`		`-voidv_inter_area_copy_or_not(constdouble* s,int n,double d,constdouble *buf)`
`3080`		`-{`
`3081`		`- (void)n;`
`3082`		`- (void)d;`
`3083`		`- *buf = s;`
`3084`		`-}`
`3085`		`-voidv_inter_area_copy_or_not(constfloat* s,int n,float d,constfloat *buf)`
`3086`		`-{`
`3087`		`- (void)n;`
`3088`		`- (void)d;`
`3089`		`- *buf = s;`
`3090`		`-}`
`3091`		`-`
`3092`		`-#if CV_SIMD128_64F`
`3093`		`-template<>`
`3094`		`-v_float64vx_setall_local(double coeff) {`
`3095`		`-returnv_setall_f64(coeff);`
`3096`		`-}`
`3097`		`-#else`
`3098`		`-template<>`
`3099`		`-v_uint8vx_setall_local(double coeff) {`
`3100`		`- (void)coeff;`
`3101`		`-returnv_setall_u8(0);`
`3102`		`-}`
`3103`		`-template<>`
`3104`		`-voidv_inter_area_set_sum(int col_end,constdouble *const buf,const v_uint8 &v_coeff,`
`3105`		`-double *sum,int &x) {`
`3106`		`- (void)col_end;`
`3107`		`- (void)buf;`
`3108`		`- (void)v_coeff;`
`3109`		`- (void)sum;`
`3110`		`- x =0;`
`3111`		`-}`
`3112`		`-template<>`
`3113`		`-voidv_inter_area_update_sum(int col_end,constdouble *const buf,const v_uint8 &v_coeff,`
`3114`		`-double *sum,int &x) {`
`3115`		`- (void)col_end;`
`3116`		`- (void)buf;`
`3117`		`- (void)v_coeff;`
`3118`		`- (void)sum;`
`3119`		`- x =0;`
`3120`	`3091`	`}`
`3121`	`3092`	`#endif`
`3122`	`3093`	`}`
`@@ -3144,10 +3115,8 @@ class ResizeArea_Invoker : public ParallelLoopBody`
`3144`	`3115`	`Size dsize = dst->size();`
`3145`	`3116`	`constint cn = dst->channels();`
`3146`	`3117`	`dsize.width *= cn;`
`3147`		`- AutoBuffer<WT>_buffer(std::max(src->cols * cn, range.size() * cn));`
`3148`	`3118`	`const DecimateAlpha* xtab = xtab0;`
`3149`	`3119`	`constint xtab_size = xtab_size0;`
`3150`		`- WT *buf = _buffer.data();`
`3151`	`3120`	`constint j_start = tabofs[range.start], j_end = tabofs[range.end];`
`3152`	`3121`
`3153`	`3122`	`static_assert(`
`@@ -3183,7 +3152,6 @@ class ResizeArea_Invoker : public ParallelLoopBody`
`3183`	`3152`	`}`
`3184`	`3153`	`int prev_di = -1;`
`3185`	`3154`	`int di =0;`
`3186`		`-const WT* buf_local;`
`3187`	`3155`	`WT* sum =nullptr;`
`3188`	`3156`	`for (int j = row_start; j < row_end; ++j)`
`3189`	`3157`	`{`
`@@ -3194,37 +3162,31 @@ class ResizeArea_Invoker : public ParallelLoopBody`
`3194`	`3162`	`coeff = ytab[j].alpha;`
`3195`	`3163`	`di = ytab[j].di;`
`3196`	`3164`	`si = ytab[j].si;`
`3197`		`-const T* S = src->templateptr<T>(si);`
`3198`		`-// Convert the line to the proper float/double type.`
`3199`		`-v_inter_area_copy_or_not(S, col_end, buf, &buf_local);`
`3200`	`3165`	`}`
`3201`	`3166`	`else`
`3202`	`3167`	`{`
`3203`	`3168`	`coeff = xtab[j].alpha;`
`3204`	`3169`	`di = xtab[j].di / cn;`
`3205`	`3170`	`si = xtab[j].si / cn;`
`3206`		`- buf_local = tmp.templateptr<WT>(si);`
`3207`	`3171`	`}`
`3208`		`-const VT v_coeff = vx_setall_local<VT>(coeff);`
`3209`	`3172`
`3210`		`-if (di != prev_di)`
	`3173`	`+if (di != prev_di) sum = tmp.templateptr<WT>(di - start_di);`
	`3174`	`+`
	`3175`	`+if (iter ==0)`
`3211`	`3176`	`{`
`3212`		`- sum = tmp.templateptr<WT>(di - start_di);`
`3213`		`-int x;`
`3214`		`-v_inter_area_set_sum(col_end, buf_local, v_coeff, sum, x);`
`3215`		`-for (; x < col_end; ++x) sum[x] = buf_local[x] * coeff;`
`3216`		`- prev_di = di;`
	`3177`	`+const T* s = src->templateptr<T>(si);`
	`3178`	`+ v_inter_area_set_or_update_sum<T, WT, VT>(s, col_end, di != prev_di,`
	`3179`	`+ coeff, sum);`
`3217`	`3180`	`}`
`3218`	`3181`	`else`
`3219`	`3182`	`{`
`3220`		`-int x;`
`3221`		`-v_inter_area_update_sum(col_end, buf_local, v_coeff, sum, x);`
`3222`		`-for (; x < col_end; ++x) sum[x] += buf_local[x] *coeff;`
	`3183`	`+const WT* s = tmp.templateptr<WT>(si);`
	`3184`	`+v_inter_area_set_or_update_sum<WT, WT, VT>(s, col_end, di != prev_di,`
	`3185`	`+coeff, sum);`
`3223`	`3186`	`}`
	`3187`	`+`
	`3188`	`+if (di != prev_di) prev_di = di;`
`3224`	`3189`	`}`
`3225`		`-// Deal with the last row.`
`3226`		`- WT* D = tmp.templateptr<WT>(di - start_di);`
`3227`		`-for (int x =0; x < col_end; ++x) D[x] = sum[x];`
`3228`	`3190`
`3229`	`3191`	`tmp =tmp(cv::Range(0, di - start_di +1),cv::Range(0, col_end / cn)).t();`
`3230`	`3192`	`}`

0 commit comments

Comments

(0)

Movatterモバイル変換

Navigation Menu

Search code, repositories, users, issues, pull requests...

Provide feedback

Saved searches

Use saved searches to filter your results more quickly

Uh oh!

Uh oh!

Commit be4331c

File tree

1 file changed

1 file changed

`‎modules/imgproc/src/resize.cpp‎`

0 commit comments