Commit 7822e1c1 authored by Michael Niedermayer's avatar Michael Niedermayer

reverse remainder of the failed attempt to optimize *state=c->mps_state[s]

Originally committed as revision 6609 to svn://svn.ffmpeg.org/ffmpeg/trunk
parent ef0090a9
...@@ -125,26 +125,26 @@ void ff_init_cabac_states(CABACContext *c, uint8_t const (*lps_range)[4], ...@@ -125,26 +125,26 @@ void ff_init_cabac_states(CABACContext *c, uint8_t const (*lps_range)[4],
for(i=0; i<state_count; i++){ for(i=0; i<state_count; i++){
for(j=0; j<4; j++){ //FIXME check if this is worth the 1 shift we save for(j=0; j<4; j++){ //FIXME check if this is worth the 1 shift we save
c->lps_range[2*i+2][j+4]= c->lps_range[2*i+0][j+4]=
c->lps_range[2*i+3][j+4]= lps_range[i][j]; c->lps_range[2*i+1][j+4]= lps_range[i][j];
} }
c->mps_state[2*i+2]= 2*mps_state[i]+2; c->mps_state[2*i+0]= 2*mps_state[i]+0;
c->mps_state[2*i+3]= 2*mps_state[i]+3; c->mps_state[2*i+1]= 2*mps_state[i]+1;
if( i ){ if( i ){
#ifdef BRANCHLESS_CABAD #ifdef BRANCHLESS_CABAD
c->mps_state[-2*i-3]= 2*lps_state[i]+2; //FIXME yes this is not valid C but iam lazy, cleanup welcome c->mps_state[-2*i-1]= 2*lps_state[i]+0; //FIXME yes this is not valid C but iam lazy, cleanup welcome
c->mps_state[-2*i-4]= 2*lps_state[i]+3; c->mps_state[-2*i-2]= 2*lps_state[i]+1;
}else{ }else{
c->mps_state[-2*i-3]= 3; c->mps_state[-2*i-1]= 1;
c->mps_state[-2*i-4]= 2; c->mps_state[-2*i-2]= 0;
#else #else
c->lps_state[2*i+2]= 2*lps_state[i]+2; c->lps_state[2*i+0]= 2*lps_state[i]+0;
c->lps_state[2*i+3]= 2*lps_state[i]+3; c->lps_state[2*i+1]= 2*lps_state[i]+1;
}else{ }else{
c->lps_state[2*i+2]= 3; c->lps_state[2*i+0]= 1;
c->lps_state[2*i+3]= 2; c->lps_state[2*i+1]= 0;
#endif #endif
} }
} }
......
...@@ -40,9 +40,9 @@ typedef struct CABACContext{ ...@@ -40,9 +40,9 @@ typedef struct CABACContext{
#ifdef STRICT_LIMITS #ifdef STRICT_LIMITS
int symCount; int symCount;
#endif #endif
uint8_t lps_range[2*66][4]; ///< rangeTabLPS uint8_t lps_range[2*65][4]; ///< rangeTabLPS
uint8_t lps_state[2*65]; ///< transIdxLPS uint8_t lps_state[2*64]; ///< transIdxLPS
uint8_t mps_state[2*65]; ///< transIdxMPS uint8_t mps_state[2*64]; ///< transIdxMPS
const uint8_t *bytestream_start; const uint8_t *bytestream_start;
const uint8_t *bytestream; const uint8_t *bytestream;
const uint8_t *bytestream_end; const uint8_t *bytestream_end;
...@@ -370,11 +370,11 @@ static int get_cabac(CABACContext *c, uint8_t * const state){ ...@@ -370,11 +370,11 @@ static int get_cabac(CABACContext *c, uint8_t * const state){
#define LOW "0" #define LOW "0"
#define RANGE "4" #define RANGE "4"
#define LPS_RANGE "12" #define LPS_RANGE "12"
#define LPS_STATE "12+2*66*4" #define LPS_STATE "12+2*65*4"
#define MPS_STATE "12+2*66*4+2*65" #define MPS_STATE "12+2*65*4+2*64"
#define BYTESTART "12+2*66*4+4*65" #define BYTESTART "12+2*65*4+4*64"
#define BYTE "16+2*66*4+4*65" #define BYTE "16+2*65*4+4*64"
#define BYTEEND "20+2*66*4+4*65" #define BYTEEND "20+2*65*4+4*64"
#ifndef BRANCHLESS_CABAD #ifndef BRANCHLESS_CABAD
asm volatile( asm volatile(
"movzbl (%1), %%eax \n\t" "movzbl (%1), %%eax \n\t"
......
...@@ -7401,9 +7401,9 @@ static int decode_slice(H264Context *h){ ...@@ -7401,9 +7401,9 @@ static int decode_slice(H264Context *h){
pre = clip( ((cabac_context_init_PB[h->cabac_init_idc][i][0] * s->qscale) >>4 ) + cabac_context_init_PB[h->cabac_init_idc][i][1], 1, 126 ); pre = clip( ((cabac_context_init_PB[h->cabac_init_idc][i][0] * s->qscale) >>4 ) + cabac_context_init_PB[h->cabac_init_idc][i][1], 1, 126 );
if( pre <= 63 ) if( pre <= 63 )
h->cabac_state[i] = 2 * ( 63 - pre ) + 2; h->cabac_state[i] = 2 * ( 63 - pre ) + 0;
else else
h->cabac_state[i] = 2 * ( pre - 64 ) + 3; h->cabac_state[i] = 2 * ( pre - 64 ) + 1;
} }
for(;;){ for(;;){
......
Markdown is supported
0% or
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or to comment