Commit 6507d86f authored by Michael Niedermayer

jpeg2000dec; optimize output sample convert a bit

67935 -> 29984 kcycles
Reviewed-by: Nicolas BERTRAND <nicoinattendu@gmail.com>
Signed-off-by: Michael Niedermayer <michaelni@gmx.at>
parent 3da71111
...@@ -1082,6 +1082,8 @@ static int jpeg2000_decode_tile(Jpeg2000DecoderContext *s, Jpeg2000Tile *tile, ...@@ -1082,6 +1082,8 @@ static int jpeg2000_decode_tile(Jpeg2000DecoderContext *s, Jpeg2000Tile *tile,
Jpeg2000Component *comp = tile->comp + compno; Jpeg2000Component *comp = tile->comp + compno;
float *datap = comp->f_data; float *datap = comp->f_data;
int32_t *i_datap = comp->i_data; int32_t *i_datap = comp->i_data;
int cbps = s->cbps[compno];
int w = tile->comp[compno].coord[0][1] - s->image_offset_x;
y = tile->comp[compno].coord[1][0] - s->image_offset_y; y = tile->comp[compno].coord[1][0] - s->image_offset_y;
line = picture->data[0] + y * picture->linesize[0]; line = picture->data[0] + y * picture->linesize[0];
...@@ -1091,18 +1093,24 @@ static int jpeg2000_decode_tile(Jpeg2000DecoderContext *s, Jpeg2000Tile *tile, ...@@ -1091,18 +1093,24 @@ static int jpeg2000_decode_tile(Jpeg2000DecoderContext *s, Jpeg2000Tile *tile,
x = tile->comp[compno].coord[0][0] - s->image_offset_x; x = tile->comp[compno].coord[0][0] - s->image_offset_x;
dst = line + x * s->ncomponents + compno; dst = line + x * s->ncomponents + compno;
for (; x < tile->comp[compno].coord[0][1] - s->image_offset_x; x += s->cdx[compno]) { if (tile->codsty->transform == FF_DWT97) {
int val; for (; x < w; x += s->cdx[compno]) {
/* DC level shift and clip see ISO 15444-1:2002 G.1.2 */ int val = lrintf(*datap) + (1 << (cbps - 1));
if (tile->codsty->transform == FF_DWT97) /* DC level shift and clip see ISO 15444-1:2002 G.1.2 */
val = lrintf(*datap) + (1 << (s->cbps[compno] - 1)); val = av_clip(val, 0, (1 << cbps) - 1);
else *dst = val << (8 - cbps);
val = *i_datap + (1 << (s->cbps[compno] - 1)); datap++;
val = av_clip(val, 0, (1 << s->cbps[compno]) - 1); dst += s->ncomponents;
*dst = val << (8 - s->cbps[compno]); }
datap++; } else {
i_datap++; for (; x < w; x += s->cdx[compno]) {
dst += s->ncomponents; int val = *i_datap + (1 << (cbps - 1));
/* DC level shift and clip see ISO 15444-1:2002 G.1.2 */
val = av_clip(val, 0, (1 << cbps) - 1);
*dst = val << (8 - cbps);
i_datap++;
dst += s->ncomponents;
}
} }
line += picture->linesize[0]; line += picture->linesize[0];
} }
...@@ -1113,6 +1121,8 @@ static int jpeg2000_decode_tile(Jpeg2000DecoderContext *s, Jpeg2000Tile *tile, ...@@ -1113,6 +1121,8 @@ static int jpeg2000_decode_tile(Jpeg2000DecoderContext *s, Jpeg2000Tile *tile,
float *datap = comp->f_data; float *datap = comp->f_data;
int32_t *i_datap = comp->i_data; int32_t *i_datap = comp->i_data;
uint16_t *linel; uint16_t *linel;
int cbps = s->cbps[compno];
int w = tile->comp[compno].coord[0][1] - s->image_offset_x;
y = tile->comp[compno].coord[1][0] - s->image_offset_y; y = tile->comp[compno].coord[1][0] - s->image_offset_y;
linel = (uint16_t *)picture->data[0] + y * (picture->linesize[0] >> 1); linel = (uint16_t *)picture->data[0] + y * (picture->linesize[0] >> 1);
...@@ -1121,24 +1131,32 @@ static int jpeg2000_decode_tile(Jpeg2000DecoderContext *s, Jpeg2000Tile *tile, ...@@ -1121,24 +1131,32 @@ static int jpeg2000_decode_tile(Jpeg2000DecoderContext *s, Jpeg2000Tile *tile,
x = tile->comp[compno].coord[0][0] - s->image_offset_x; x = tile->comp[compno].coord[0][0] - s->image_offset_x;
dst = linel + (x * s->ncomponents + compno); dst = linel + (x * s->ncomponents + compno);
for (; x < tile->comp[compno].coord[0][1] - s->image_offset_x; x += s-> cdx[compno]) { if (tile->codsty->transform == FF_DWT97) {
int val; for (; x < w; x += s-> cdx[compno]) {
/* DC level shift and clip see ISO 15444-1:2002 G.1.2 */ int val = lrintf(*datap) + (1 << (cbps - 1));
if (tile->codsty->transform == FF_DWT97) /* DC level shift and clip see ISO 15444-1:2002 G.1.2 */
val = lrintf(*datap) + (1 << (s->cbps[compno] - 1)); val = av_clip(val, 0, (1 << cbps) - 1);
else /* align 12 bit values in little-endian mode */
val = *i_datap + (1 << (s->cbps[compno] - 1)); *dst = val << (16 - cbps);
val = av_clip(val, 0, (1 << s->cbps[compno]) - 1); datap++;
/* align 12 bit values in little-endian mode */ dst += s->ncomponents;
*dst = val << (16 - s->cbps[compno]); }
datap++; } else {
i_datap++; for (; x < w; x += s-> cdx[compno]) {
dst += s->ncomponents; int val = *i_datap + (1 << (cbps - 1));
/* DC level shift and clip see ISO 15444-1:2002 G.1.2 */
val = av_clip(val, 0, (1 << cbps) - 1);
/* align 12 bit values in little-endian mode */
*dst = val << (16 - cbps);
i_datap++;
dst += s->ncomponents;
}
} }
linel += picture->linesize[0] >> 1; linel += picture->linesize[0] >> 1;
} }
} }
} }
return 0; return 0;
} }
......
Markdown is supported
0% or
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment