opj_dwt_decode_partial_97(): simplify and make more efficient use of sparse arrays in vertical pass

This commit is contained in:
Even Rouault 2017-09-01 16:31:06 +02:00
parent ae19001ba4
commit 83b5a168ec
1 changed file with 41 additions and 53 deletions

View File

@ -2248,23 +2248,20 @@ static void opj_v4dwt_interleave_partial_v(opj_v4dwt_t* OPJ_RESTRICT dwt,
OPJ_UINT32 sa_col, OPJ_UINT32 sa_col,
OPJ_UINT32 nb_elts_read) OPJ_UINT32 nb_elts_read)
{ {
OPJ_UINT32 i; OPJ_BOOL ret;
for (i = 0; i < nb_elts_read; i++) { ret = opj_sparse_array_int32_read(sa,
OPJ_BOOL ret; sa_col, dwt->win_l_x0,
ret = opj_sparse_array_int32_read(sa, sa_col + nb_elts_read, dwt->win_l_x1,
sa_col + i, dwt->win_l_x0, (OPJ_INT32*)(dwt->wavelet + dwt->cas + 2 * dwt->win_l_x0),
sa_col + i + 1, dwt->win_l_x1, 1, 8, OPJ_TRUE);
(OPJ_INT32*)(dwt->wavelet + dwt->cas + 2 * dwt->win_l_x0) + i, assert(ret);
0, 8, OPJ_TRUE); ret = opj_sparse_array_int32_read(sa,
assert(ret); sa_col, (OPJ_UINT32)dwt->sn + dwt->win_h_x0,
ret = opj_sparse_array_int32_read(sa, sa_col + nb_elts_read, (OPJ_UINT32)dwt->sn + dwt->win_h_x1,
sa_col + i, (OPJ_UINT32)dwt->sn + dwt->win_h_x0, (OPJ_INT32*)(dwt->wavelet + 1 - dwt->cas + 2 * dwt->win_h_x0),
sa_col + i + 1, (OPJ_UINT32)dwt->sn + dwt->win_h_x1, 1, 8, OPJ_TRUE);
(OPJ_INT32*)(dwt->wavelet + 1 - dwt->cas + 2 * dwt->win_h_x0) + i, assert(ret);
0, 8, OPJ_TRUE); OPJ_UNUSED(ret);
assert(ret);
OPJ_UNUSED(ret);
}
} }
#ifdef __SSE__ #ifdef __SSE__
@ -2743,20 +2740,17 @@ OPJ_BOOL opj_dwt_decode_partial_97(opj_tcd_tilecomp_t* OPJ_RESTRICT tilec,
if ((j + 3 >= win_ll_y0 && j < win_ll_y1) || if ((j + 3 >= win_ll_y0 && j < win_ll_y1) ||
(j + 3 >= win_lh_y0 + (OPJ_UINT32)v.sn && (j + 3 >= win_lh_y0 + (OPJ_UINT32)v.sn &&
j < win_lh_y1 + (OPJ_UINT32)v.sn)) { j < win_lh_y1 + (OPJ_UINT32)v.sn)) {
OPJ_UINT32 k;
opj_v4dwt_interleave_partial_h(&h, sa, j, opj_uint_min(4U, rh - j)); opj_v4dwt_interleave_partial_h(&h, sa, j, opj_uint_min(4U, rh - j));
opj_v4dwt_decode(&h); opj_v4dwt_decode(&h);
for (k = 0; k < 4; k++) { if (!opj_sparse_array_int32_write(sa,
if (!opj_sparse_array_int32_write(sa, win_tr_x0, j,
win_tr_x0, j + k, win_tr_x1, j + 4,
win_tr_x1, j + k + 1, (OPJ_INT32*)&h.wavelet[win_tr_x0].f[0],
(OPJ_INT32*)&h.wavelet[win_tr_x0].f[k], 4, 1, OPJ_TRUE)) {
4, 0, OPJ_TRUE)) { /* FIXME event manager error callback */
/* FIXME event manager error callback */ opj_sparse_array_int32_free(sa);
opj_sparse_array_int32_free(sa); opj_aligned_free(h.wavelet);
opj_aligned_free(h.wavelet); return OPJ_FALSE;
return OPJ_FALSE;
}
} }
} }
} }
@ -2765,20 +2759,17 @@ OPJ_BOOL opj_dwt_decode_partial_97(opj_tcd_tilecomp_t* OPJ_RESTRICT tilec,
((j + 3 >= win_ll_y0 && j < win_ll_y1) || ((j + 3 >= win_ll_y0 && j < win_ll_y1) ||
(j + 3 >= win_lh_y0 + (OPJ_UINT32)v.sn && (j + 3 >= win_lh_y0 + (OPJ_UINT32)v.sn &&
j < win_lh_y1 + (OPJ_UINT32)v.sn))) { j < win_lh_y1 + (OPJ_UINT32)v.sn))) {
OPJ_UINT32 k;
opj_v4dwt_interleave_partial_h(&h, sa, j, rh - j); opj_v4dwt_interleave_partial_h(&h, sa, j, rh - j);
opj_v4dwt_decode(&h); opj_v4dwt_decode(&h);
for (k = 0; k < rh - j; k++) { if (!opj_sparse_array_int32_write(sa,
if (!opj_sparse_array_int32_write(sa, win_tr_x0, j,
win_tr_x0, j + k, win_tr_x1, rh,
win_tr_x1, j + k + 1, (OPJ_INT32*)&h.wavelet[win_tr_x0].f[0],
(OPJ_INT32*)&h.wavelet[win_tr_x0].f[k], 4, 1, OPJ_TRUE)) {
4, 0, OPJ_TRUE)) { /* FIXME event manager error callback */
/* FIXME event manager error callback */ opj_sparse_array_int32_free(sa);
opj_sparse_array_int32_free(sa); opj_aligned_free(h.wavelet);
opj_aligned_free(h.wavelet); return OPJ_FALSE;
return OPJ_FALSE;
}
} }
} }
@ -2788,22 +2779,19 @@ OPJ_BOOL opj_dwt_decode_partial_97(opj_tcd_tilecomp_t* OPJ_RESTRICT tilec,
v.win_h_x1 = win_lh_y1; v.win_h_x1 = win_lh_y1;
for (j = win_tr_x0; j < win_tr_x1; j += 4) { for (j = win_tr_x0; j < win_tr_x1; j += 4) {
OPJ_UINT32 nb_elts = opj_uint_min(4U, win_tr_x1 - j); OPJ_UINT32 nb_elts = opj_uint_min(4U, win_tr_x1 - j);
OPJ_UINT32 k;
opj_v4dwt_interleave_partial_v(&v, sa, j, nb_elts); opj_v4dwt_interleave_partial_v(&v, sa, j, nb_elts);
opj_v4dwt_decode(&v); opj_v4dwt_decode(&v);
for (k = 0; k < nb_elts; k++) { if (!opj_sparse_array_int32_write(sa,
if (!opj_sparse_array_int32_write(sa, j, win_tr_y0,
j + k, win_tr_y0, j + nb_elts, win_tr_y1,
j + k + 1, win_tr_y1, (OPJ_INT32*)&h.wavelet[win_tr_y0].f[0],
(OPJ_INT32*)&h.wavelet[win_tr_y0].f[k], 1, 4, OPJ_TRUE)) {
0, 4, OPJ_TRUE)) { /* FIXME event manager error callback */
/* FIXME event manager error callback */ opj_sparse_array_int32_free(sa);
opj_sparse_array_int32_free(sa); opj_aligned_free(h.wavelet);
opj_aligned_free(h.wavelet); return OPJ_FALSE;
return OPJ_FALSE;
}
} }
} }
} }