return;
}
- const int64_t ksize = OW * (KH > 1 ? KW : 1);
+ const int64_t ksize = OW * KH;
const int64_t kx = i / ksize;
const int64_t kd = kx * ksize;
const int64_t ky = (i - kd) / OW;
const uint src_base = ic * p.offset_delta + batch * p.batch_offset;
const uint dst_base = ((batch * p.OH + oh) * p.OW) * p.CHW + ic * (p.KW * p.KH);
const int oh_s1 = int(oh) * p.s1;
- const uint ksize = p.OW * (p.KH > 1 ? p.KW : 1);
+ const uint ksize = p.OW * p.KH;
const uint base_linear_idx = gidx * NUM_ITER;
- const uint max_ky = ksize / p.OW;
-
uint current_kx = base_linear_idx / ksize;
const uint rem = base_linear_idx - (current_kx * ksize);
uint current_ky = rem / p.OW;
if (++current_ix == p.OW) {
current_ix = 0;
- if (++current_ky == max_ky) {
+ if (++current_ky == p.KH) {
current_ky = 0;
current_kx++;
}