/* This program is part of the TACLeBench benchmark suite. Version V 1.x Name: ndes Author: unknown Function: A lot of bit manipulation, shifts, array and matrix calculations. Source: Changes: no major functional changes License: May be used, modified, and re-distributed freely. */ /* A read from this address will result in an known value of 1 */ #define KNOWN_VALUE 1 #define NDES_WORSTCASE 1 /* Declaration of global variables */ typedef struct NDES_IMMENSE { unsigned long l, r; } ndes_immense; typedef struct NDES_GREAT { unsigned long l, c, r; } ndes_great; unsigned long ndes_bit[ 33 ]; ndes_immense ndes_inp, ndes_key, ndes_out; int ndes_newkey, ndes_isw; static ndes_immense ndes_icd; static char ndes_ipc1[ 57 ]; static char ndes_ipc2[ 49 ]; #ifdef NDES_WORSTCASE int ndes_value = 1; #else int ndes_value = 0; #endif /* Forward funtion prototypes */ void ndes_des( ndes_immense inp, ndes_immense key, int *newkey, int isw, ndes_immense *out ); void ndes_cyfun( unsigned long ir, ndes_great k, unsigned long *iout ); unsigned long ndes_getbit( ndes_immense source, int bitno, int nbits ); void ndes_ks( /*immense key, */int n, ndes_great *kn ); void ndes_init( void ); int ndes_return( void ); void ndes_main( void ); int main( void ); /* Initialization */ void ndes_init() { unsigned int i; static volatile char ndes_ipc1_tmp[ 57 ] = { 0, 57, 49, 41, 33, 25, 17, 9, 1, 58, 50, 42, 34, 26, 18, 10, 2, 59, 51, 43, 35, 27, 19, 11, 3, 60, 52, 44, 36, 63, 55, 47, 39, 31, 23, 15, 7, 62, 54, 46, 38, 30, 22, 14, 6, 61, 53, 45, 37, 29, 21, 13, 5, 28, 20, 12, 4 }; static volatile char ndes_ipc2_tmp[ 49 ] = { 0, 14, 17, 11, 24, 1, 5, 3, 28, 15, 6, 21, 10, 23, 19, 12, 4, 26, 8, 16, 7, 27, 20, 13, 2, 41, 52, 31, 37, 47, 55, 30, 40, 51, 45, 33, 48, 44, 49, 39, 56, 34, 53, 46, 42, 50, 36, 29, 32 }; _Pragma( "loopbound min 57 max 57" ) for ( i = 0; i < 57; i++ ) ndes_ipc1[ i ] = ndes_ipc1_tmp[ i ]; _Pragma( "loopbound min 49 max 49" ) for ( i = 0; i < 49; i++ ) ndes_ipc2[ i ] = ndes_ipc2_tmp[ i ]; ndes_inp.l = KNOWN_VALUE * 35; ndes_inp.r = KNOWN_VALUE * 26; ndes_key.l = KNOWN_VALUE * 2; ndes_key.r = KNOWN_VALUE * 16; ndes_newkey = ndes_value; ndes_isw = ndes_value; } /* Arithmetic functions */ void ndes_des( ndes_immense inp, ndes_immense key, int *newkey, int isw, ndes_immense *out ) { static volatile char ip[ 65 ] = { 0, 58, 50, 42, 34, 26, 18, 10, 2, 60, 52, 44, 36, 28, 20, 12, 4, 62, 54, 46, 38, 30, 22, 14, 6, 64, 56, 48, 40, 32, 24, 16, 8, 57, 49, 41, 33, 25, 17, 9, 1, 59, 51, 43, 35, 27, 19, 11, 3, 61, 53, 45, 37, 29, 21, 13, 5, 63, 55, 47, 39, 31, 23, 15, 7 }; static volatile char ipm[ 65 ] = { 0, 40, 8, 48, 16, 56, 24, 64, 32, 39, 7, 47, 15, 55, 23, 63, 31, 38, 6, 46, 14, 54, 22, 62, 30, 37, 5, 45, 13, 53, 21, 61, 29, 36, 4, 44, 12, 52, 20, 60, 28, 35, 3, 43, 11, 51, 19, 59, 27, 34, 2, 42, 10, 50, 18, 58, 26, 33, 1, 41, 9, 49, 17, 57, 25 }; static ndes_great kns[ 17 ]; #ifdef NDES_WORSTCASE static int initflag = 1; #else static int initflag = 0; #endif int ii, i, j, k; unsigned long ic, shifter; ndes_immense itmp; ndes_great pg; if ( initflag ) { initflag = 0; ndes_bit[ 1 ] = shifter = 1L; _Pragma( "loopbound min 31 max 31" ) for ( j = 2; j <= 32; j++ ) ndes_bit[ j ] = ( shifter <<= 1 ); } if ( *newkey ) { *newkey = 0; ndes_icd.r = ndes_icd.l = 0L; _Pragma( "loopbound min 28 max 28" ) for ( j = 28, k = 56; j >= 1; j--, k-- ) { ndes_icd.r = ( ndes_icd.r << 1 ) | ndes_getbit( key, ndes_ipc1[ j ], 32 ); ndes_icd.l = ndes_icd.l << 1; ndes_icd.l = ( ndes_icd.l ) | ndes_getbit( key, ndes_ipc1[ k ], 32 ); } _Pragma( "loopbound min 16 max 16" ) for ( i = 1; i <= 16; i++ ) { pg = kns[ i ]; ndes_ks( /* key,*/ i, &pg ); kns[ i ] = pg; } } itmp.r = itmp.l = 0L; _Pragma( "loopbound min 32 max 32" ) for ( j = 32, k = 64; j >= 1; j--, k-- ) { itmp.r = itmp.r << 1; itmp.r = ( itmp.r ) | ndes_getbit( inp, ip[ j ], 32 ); itmp.l = itmp.l << 1; itmp.l = ( itmp.l ) | ndes_getbit( inp, ip[ k ], 32 ); } _Pragma( "loopbound min 16 max 16" ) for ( i = 1; i <= 16; i++ ) { ii = ( isw == 1 ? 17 - i : i ); ndes_cyfun( itmp.l, kns[ ii ], &ic ); ic ^= itmp.r; itmp.r = itmp.l; itmp.l = ic; } ic = itmp.r; itmp.r = itmp.l; itmp.l = ic; ( *out ).r = ( *out ).l = 0L; _Pragma( "loopbound min 32 max 32" ) for ( j = 32, k = 64; j >= 1; j--, k-- ) { ( *out ).r = ( *out ).r << 1; ( *out ).r = ( ( *out ).r ) | ndes_getbit( itmp, ipm[ j ], 32 ); ( *out ).l = ( *out ).l << 1; ( *out ).l = ( ( *out ).l ) | ndes_getbit( itmp, ipm[ k ], 32 ); } } void ndes_cyfun( unsigned long ir, ndes_great k, unsigned long *iout ) { static volatile long iet[ 49 ] = {0, 32, 1, 2, 3, 4, 5, 4, 5, 6, 7, 8, 9, 8, 9, 10, 11, 12, 13, 12, 13, 14, 15, 16, 17, 16, 17, 18, 19, 20, 21, 20, 21, 22, 23, 24, 25, 24, 25, 26, 27, 28, 29, 28, 29, 30, 31, 32, 1 }; static volatile long ipp[ 33 ] = {0, 16, 7, 20, 21, 29, 12, 28, 17, 1, 15, 23, 26, 5, 18, 31, 10, 2, 8, 24, 14, 32, 27, 3, 9, 19, 13, 30, 6, 22, 11, 4, 25 }; static volatile long is[ 16 ][ 4 ][ 9 ] = {{{ 0, 14, 15, 10, 7, 2, 12, 4, 13 }, { 0, 0, 3, 13, 13, 14, 10, 13, 1 }, { 0, 4, 0, 13, 10, 4, 9, 1, 7 }, { 0, 15, 13, 1, 3, 11, 4, 6, 2 } }, { { 0, 4, 1, 0, 13, 12, 1, 11, 2 }, { 0, 15, 13, 7, 8, 11, 15, 0, 15 }, { 0, 1, 14, 6, 6, 2, 14, 4, 11 }, { 0, 12, 8, 10, 15, 8, 3, 11, 1 } }, { { 0, 13, 8, 9, 14, 4, 10, 2, 8 }, { 0, 7, 4, 0, 11, 2, 4, 11, 13 }, { 0, 14, 7, 4, 9, 1, 15, 11, 4 }, { 0, 8, 10, 13, 0, 12, 2, 13, 14 } }, { { 0, 1, 14, 14, 3, 1, 15, 14, 4 }, { 0, 4, 7, 9, 5, 12, 2, 7, 8 }, { 0, 8, 11, 9, 0, 11, 5, 13, 1 }, { 0, 2, 1, 0, 6, 7, 12, 8, 7 } }, { { 0, 2, 6, 6, 0, 7, 9, 15, 6 }, { 0, 14, 15, 3, 6, 4, 7, 4, 10 }, { 0, 13, 10, 8, 12, 10, 2, 12, 9 }, { 0, 4, 3, 6, 10, 1, 9, 1, 4 } }, { { 0, 15, 11, 3, 6, 10, 2, 0, 15 }, { 0, 2, 2, 4, 15, 7, 12, 9, 3 }, { 0, 6, 4, 15, 11, 13, 8, 3, 12 }, { 0, 9, 15, 9, 1, 14, 5, 4, 10 } }, { { 0, 11, 3, 15, 9, 11, 6, 8, 11 }, { 0, 13, 8, 6, 0, 13, 9, 1, 7 }, { 0, 2, 13, 3, 7, 7, 12, 7, 14 }, { 0, 1, 4, 8, 13, 2, 15, 10, 8 } }, { { 0, 8, 4, 5, 10, 6, 8, 13, 1 }, { 0, 1, 14, 10, 3, 1, 5, 10, 4 }, { 0, 11, 1, 0, 13, 8, 3, 14, 2 }, { 0, 7, 2, 7, 8, 13, 10, 7, 13 } }, { { 0, 3, 9, 1, 1, 8, 0, 3, 10 }, { 0, 10, 12, 2, 4, 5, 6, 14, 12 }, { 0, 15, 5, 11, 15, 15, 7, 10, 0 }, { 0, 5, 11, 4, 9, 6, 11, 9, 15 } }, { { 0, 10, 7, 13, 2, 5, 13, 12, 9 }, { 0, 6, 0, 8, 7, 0, 1, 3, 5 }, { 0, 12, 8, 1, 1, 9, 0, 15, 6 }, { 0, 11, 6, 15, 4, 15, 14, 5, 12 } }, { { 0, 6, 2, 12, 8, 3, 3, 9, 3 }, { 0, 12, 1, 5, 2, 15, 13, 5, 6 }, { 0, 9, 12, 2, 3, 12, 4, 6, 10 }, { 0, 3, 7, 14, 5, 0, 1, 0, 9 } }, { { 0, 12, 13, 7, 5, 15, 4, 7, 14 }, { 0, 11, 10, 14, 12, 10, 14, 12, 11 }, { 0, 7, 6, 12, 14, 5, 10, 8, 13 }, { 0, 14, 12, 3, 11, 9, 7, 15, 0 } }, { { 0, 5, 12, 11, 11, 13, 14, 5, 5 }, { 0, 9, 6, 12, 1, 3, 0, 2, 0 }, { 0, 3, 9, 5, 5, 6, 1, 0, 15 }, { 0, 10, 0, 11, 12, 10, 6, 14, 3 } }, { { 0, 9, 0, 4, 12, 0, 7, 10, 0 }, { 0, 5, 9, 11, 10, 9, 11, 15, 14 }, { 0, 10, 3, 10, 2, 3, 13, 5, 3 }, { 0, 0, 5, 5, 7, 4, 0, 2, 5 } }, { { 0, 0, 5, 2, 4, 14, 5, 6, 12 }, { 0, 3, 11, 15, 14, 8, 3, 8, 9 }, { 0, 5, 2, 14, 8, 0, 11, 9, 5 }, { 0, 6, 14, 2, 2, 5, 8, 3, 6 } }, { { 0, 7, 10, 8, 15, 9, 11, 1, 7 }, { 0, 8, 5, 1, 9, 6, 8, 6, 2 }, { 0, 0, 15, 7, 4, 14, 6, 2, 8 }, { 0, 13, 9, 12, 14, 3, 13, 12, 11 } } }; volatile char ibin[ 16 ] = {0, 8, 4, 12, 2, 10, 6, 14, 1, 9, 5, 13, 3, 11, 7, 15}; ndes_great ie; unsigned long itmp, ietmp1, ietmp2; char iec[ 9 ]; int irow, icol, iss, l, m; int volatile j, jj; unsigned long *p; p = ndes_bit; ie.r = ie.c = ie.l = 0; _Pragma( "loopbound min 16 max 16" ) for ( j = 16, l = 32, m = 48; j >= 1; j--, l--, m-- ) { ie.r = ( ie.r << 1 ) | ( p[ iet[ j ] ] & ir ? 1 : 0 ); ie.c = ( ie.c << 1 ) | ( p[ iet[ l ] ] & ir ? 1 : 0 ); ie.l = ( ie.l << 1 ) | ( p[ iet[ m ] ] & ir ? 1 : 0 ); } ie.r ^= k.r; ie.c ^= k.c; ie.l ^= k.l; ietmp1 = ( ( unsigned long ) ie.c << 16 ) + ( unsigned long ) ie.r; ietmp2 = ( ( unsigned long ) ie.l << 8 ) + ( ( unsigned long ) ie.c >> 8 ); _Pragma( "loopbound min 4 max 4" ) for ( j = 1, m = 5; j <= 4; j++, m++ ) { iec[ j ] = ietmp1 & 0x3fL; iec[ m ] = ietmp2 & 0x3fL; ietmp1 >>= 6; ietmp2 >>= 6; } itmp = 0L; _Pragma( "loopbound min 8 max 8" ) for ( jj = 8; jj >= 1; jj-- ) { j = iec[ jj ]; irow = ( ( j & 0x1 ) << 1 ) + ( ( j & 0x20 ) >> 5 ); icol = ( ( j & 0x2 ) << 2 ) + ( j & 0x4 ) + ( ( j & 0x8 ) >> 2 ) + ( ( j & 0x10 ) >> 4 ); iss = is[ icol ][ irow ][ jj ]; itmp = ( itmp << 4 ) | ibin[ iss ]; } *iout = 0L; p = ndes_bit; _Pragma( "loopbound min 32 max 32" ) for ( j = 32; j >= 1; j-- ) *iout = ( *iout << 1 ); *iout |= ( p[ ipp[ j ] ] & itmp ? 1 : 0 ); } unsigned long ndes_getbit( ndes_immense source, int bitno, int nbits ) { if ( bitno <= nbits ) return ndes_bit[ bitno ] & source.r ? 1L : 0L; else return ndes_bit[ bitno - nbits ] & source.l ? 1L : 0L; } void ndes_ks( /*ndes_immense key, */int n, ndes_great *kn ) { int i, j, k, l; if ( n == 1 || n == 2 || n == 9 || n == 16 ) { ndes_icd.r = ( ndes_icd.r | ( ( ndes_icd.r & 1L ) << 28 ) ) >> 1; ndes_icd.l = ( ndes_icd.l | ( ( ndes_icd.l & 1L ) << 28 ) ) >> 1; } else { _Pragma( "loopbound min 2 max 2" ) for ( i = 1; i <= 2; i++ ) { ndes_icd.r = ( ndes_icd.r | ( ( ndes_icd.r & 1L ) << 28 ) ) >> 1; ndes_icd.l = ( ndes_icd.l | ( ( ndes_icd.l & 1L ) << 28 ) ) >> 1; } } ( *kn ).r = ( *kn ).c = ( *kn ).l = 0; _Pragma( "loopbound min 16 max 16" ) for ( j = 16, k = 32, l = 48; j >= 1; j--, k--, l-- ) { ( *kn ).r = ( *kn ).r << 1; ( *kn ).r = ( ( *kn ).r ) | ( unsigned short ) ndes_getbit( ndes_icd, ndes_ipc2[ j ], 28 ); ( *kn ).c = ( *kn ).c << 1; ( *kn ).c = ( ( *kn ).c ) | ( unsigned short ) ndes_getbit( ndes_icd, ndes_ipc2[ k ], 28 ); ( *kn ).l = ( *kn ).l << 1; ( *kn ).l = ( ( *kn ).l ) | ( unsigned short ) ndes_getbit( ndes_icd, ndes_ipc2[ l ], 28 ); } } int ndes_return() { return ( ndes_icd.r + ndes_icd.l + ( -8390656 ) ) != 0 ; } void _Pragma( "entrypoint" ) ndes_main() { ndes_des( ndes_inp, ndes_key, &ndes_newkey, ndes_isw, &ndes_out ); } /* main function */ int main( void ) { ndes_init(); ndes_main(); return ( ndes_return() ); }