/*

  This program is part of the TACLeBench benchmark suite.
  Version V 1.x

  Name: ndes

  Author: unknown

  Function: A lot of bit manipulation, shifts, array and matrix calculations.

  Source:

  Changes: no major functional changes

  License: May be used, modified, and re-distributed freely.

*/

/* A read from this address will result in a known value of 1 */
#define KNOWN_VALUE 1

#define NDES_WORSTCASE 1

/*
  Declaration of global variables
*/

/* Wasm loop bounds: host-imported marker called immediately before each loop
   with the minimum and maximum iteration count of that loop. */
__attribute__((import_module("__pragma"), import_name("loopbound")))
extern void __pragma_loopbound(unsigned int min_bound, unsigned int max_bound);

/* Two-word value; the code addresses bits 1..nbits in r and the rest in l. */
typedef struct NDES_IMMENSE {
  unsigned long l, r;
} ndes_immense;

/* Three-word value (l, c, r); each word is filled with 16 bits by the code. */
typedef struct NDES_GREAT {
  unsigned long l, c, r;
} ndes_great;

/* ndes_bit[n] holds the single-bit mask 1 << (n - 1) for n = 1..32 once
   ndes_des has run its one-time initialization; index 0 is never written. */
unsigned long ndes_bit[33];

ndes_immense ndes_inp, ndes_key, ndes_out;
int ndes_newkey, ndes_isw;

/* Working key halves, set up in ndes_des and rotated in ndes_ks. */
static ndes_immense ndes_icd;
/* Runtime copies of the key selection tables, filled by ndes_init. */
static char ndes_ipc1[57];
static char ndes_ipc2[49];

#ifdef NDES_WORSTCASE
int ndes_value = 1;
#else
int ndes_value = 0;
#endif

/*
  Forward function prototypes
*/

__attribute__((always_inline)) static inline void ndes_des(
    ndes_immense inp, ndes_immense key, int *newkey, int isw,
    ndes_immense *out);
__attribute__((always_inline)) static inline void ndes_cyfun(
    unsigned long ir, ndes_great k, unsigned long *iout);
__attribute__((always_inline)) static inline unsigned long ndes_getbit(
    ndes_immense source, int bitno, int nbits);
void ndes_ks(/*immense key, */ int n, ndes_great *kn);
__attribute__((always_inline)) static inline void ndes_init(void);
__attribute__((always_inline)) static inline int ndes_return(void);
__attribute__((noinline)) __attribute__((export_name("entrypoint")))
void ndes_main(void);
__attribute__((noinline)) __attribute__((export_name("main")))
int main(void);

/*
  Initialization
*/

/*
  Copies the two key selection tables into their global arrays and loads the
  fixed input block, key and mode flags used by the benchmark run.
  The source tables are volatile so the copies are real memory reads.
*/
__attribute__((always_inline)) static inline void ndes_init(void)
{
  unsigned int i;

  static volatile char ndes_ipc1_tmp[57] = {
    0, 57, 49, 41, 33, 25, 17, 9, 1, 58, 50,
    42, 34, 26, 18, 10, 2, 59, 51, 43, 35, 27,
    19, 11, 3, 60, 52, 44, 36, 63, 55, 47, 39,
    31, 23, 15, 7, 62, 54, 46, 38, 30, 22, 14,
    6, 61, 53, 45, 37, 29, 21, 13, 5, 28, 20,
    12, 4};

  static volatile char ndes_ipc2_tmp[49] = {
    0, 14, 17, 11, 24, 1, 5, 3, 28, 15, 6,
    21, 10, 23, 19, 12, 4, 26, 8, 16, 7, 27,
    20, 13, 2, 41, 52, 31, 37, 47, 55, 30, 40,
    51, 45, 33, 48, 44, 49, 39, 56, 34, 53, 46,
    42, 50, 36, 29, 32};

  __pragma_loopbound(57, 57);
  for (i = 0; i < 57; i++)
    ndes_ipc1[i] = ndes_ipc1_tmp[i];

  __pragma_loopbound(49, 49);
  for (i = 0; i < 49; i++)
    ndes_ipc2[i] = ndes_ipc2_tmp[i];

  ndes_inp.l = KNOWN_VALUE * 35;
  ndes_inp.r = KNOWN_VALUE * 26;
  ndes_key.l = KNOWN_VALUE * 2;
  ndes_key.r = KNOWN_VALUE * 16;

  ndes_newkey = ndes_value;
  ndes_isw = ndes_value;
}

/*
  Arithmetic functions
*/

/*
  Transforms the 64-bit block `inp` under `key` and stores the result in *out.

  inp     input block
  key     key block; only read when *newkey is non-zero
  newkey  in/out flag: when non-zero the 16 sub-keys in `kns` are rebuilt via
          ndes_ks and the flag is cleared
  isw     when equal to 1 the sub-keys are applied in reverse order
          (17 - i instead of i)
  out     receives the permuted result

  NOTE(review): the tables match the initial/final permutations of DES and the
  structure is a 16-round Feistel network - presumably DES; confirm against
  the original source of the benchmark.
*/
__attribute__((always_inline)) static inline void ndes_des(
    ndes_immense inp, ndes_immense key, int *newkey, int isw,
    ndes_immense *out)
{
  static volatile char ip[65] = {
    0, 58, 50, 42, 34, 26, 18, 10, 2, 60, 52,
    44, 36, 28, 20, 12, 4, 62, 54, 46, 38, 30,
    22, 14, 6, 64, 56, 48, 40, 32, 24, 16, 8,
    57, 49, 41, 33, 25, 17, 9, 1, 59, 51, 43,
    35, 27, 19, 11, 3, 61, 53, 45, 37, 29, 21,
    13, 5, 63, 55, 47, 39, 31, 23, 15, 7};

  static volatile char ipm[65] = {
    0, 40, 8, 48, 16, 56, 24, 64, 32, 39, 7,
    47, 15, 55, 23, 63, 31, 38, 6, 46, 14, 54,
    22, 62, 30, 37, 5, 45, 13, 53, 21, 61, 29,
    36, 4, 44, 12, 52, 20, 60, 28, 35, 3, 43,
    11, 51, 19, 59, 27, 34, 2, 42, 10, 50, 18,
    58, 26, 33, 1, 41, 9, 49, 17, 57, 25};

  /* Sub-keys for rounds 1..16; index 0 is unused. */
  static ndes_great kns[17];

#ifdef NDES_WORSTCASE
  static int initflag = 1;
#else
  static int initflag = 0;
#endif

  int ii, i, j, k;
  unsigned long ic, shifter;
  ndes_immense itmp;
  ndes_great pg;

  /* One-time setup of the single-bit masks ndes_bit[1..32]. */
  if (initflag) {
    initflag = 0;
    ndes_bit[1] = shifter = 1L;

    __pragma_loopbound(31, 31);
    for (j = 2; j <= 32; j++)
      ndes_bit[j] = (shifter <<= 1);
  }

  /* Rebuild the key schedule when the caller signals a new key. */
  if (*newkey) {
    *newkey = 0;
    ndes_icd.r = ndes_icd.l = 0L;

    /* Select 28 key bits into each half of ndes_icd via ndes_ipc1. */
    __pragma_loopbound(28, 28);
    for (j = 28, k = 56; j >= 1; j--, k--) {
      ndes_icd.r = (ndes_icd.r << 1) | ndes_getbit(key, ndes_ipc1[j], 32);
      ndes_icd.l = ndes_icd.l << 1;
      ndes_icd.l = (ndes_icd.l) | ndes_getbit(key, ndes_ipc1[k], 32);
    }

    __pragma_loopbound(16, 16);
    for (i = 1; i <= 16; i++) {
      pg = kns[i];
      ndes_ks(/* key,*/ i, &pg);
      kns[i] = pg;
    }
  }

  /* Permute the input block through table ip. */
  itmp.r = itmp.l = 0L;

  __pragma_loopbound(32, 32);
  for (j = 32, k = 64; j >= 1; j--, k--) {
    itmp.r = itmp.r << 1;
    itmp.r = (itmp.r) | ndes_getbit(inp, ip[j], 32);
    itmp.l = itmp.l << 1;
    itmp.l = (itmp.l) | ndes_getbit(inp, ip[k], 32);
  }

  /* 16 rounds: new l = r ^ f(l, sub-key), new r = old l. */
  __pragma_loopbound(16, 16);
  for (i = 1; i <= 16; i++) {
    ii = (isw == 1 ? 17 - i : i);
    ndes_cyfun(itmp.l, kns[ii], &ic);
    ic ^= itmp.r;
    itmp.r = itmp.l;
    itmp.l = ic;
  }

  /* Swap the two halves once more after the last round. */
  ic = itmp.r;
  itmp.r = itmp.l;
  itmp.l = ic;

  /* Permute the round output through table ipm into *out. */
  (*out).r = (*out).l = 0L;

  __pragma_loopbound(32, 32);
  for (j = 32, k = 64; j >= 1; j--, k--) {
    (*out).r = (*out).r << 1;
    (*out).r = ((*out).r) | ndes_getbit(itmp, ipm[j], 32);
    (*out).l = (*out).l << 1;
    (*out).l = ((*out).l) | ndes_getbit(itmp, ipm[k], 32);
  }
}

/*
  Round function: expands the 32-bit word `ir` to 48 bits via table iet, XORs
  it with sub-key `k`, substitutes the eight 6-bit groups through table `is`,
  and permutes the 32-bit result through table ipp into *iout.

  ir    32-bit input word
  k     48-bit sub-key, 16 bits in each of k.l, k.c, k.r
  iout  receives the 32-bit result

  Relies on ndes_bit[1..32] having been initialized by ndes_des.
*/
__attribute__((always_inline)) static inline void ndes_cyfun(
    unsigned long ir, ndes_great k, unsigned long *iout)
{
  static volatile long iet[49] = {
    0, 32, 1, 2, 3, 4, 5, 4, 5, 6, 7,
    8, 9, 8, 9, 10, 11, 12, 13, 12, 13, 14,
    15, 16, 17, 16, 17, 18, 19, 20, 21, 20, 21,
    22, 23, 24, 25, 24, 25, 26, 27, 28, 29, 28,
    29, 30, 31, 32, 1};

  static volatile long ipp[33] = {
    0, 16, 7, 20, 21, 29, 12, 28, 17, 1, 15,
    23, 26, 5, 18, 31, 10, 2, 8, 24, 14, 32,
    27, 3, 9, 19, 13, 30, 6, 22, 11, 4, 25};

  /* Substitution table indexed as is[icol][irow][group]; column 0 of the
     innermost dimension is unused because groups are numbered 1..8. */
  static volatile long is[16][4][9] = {
    {{0, 14, 15, 10, 7, 2, 12, 4, 13},
     {0, 0, 3, 13, 13, 14, 10, 13, 1},
     {0, 4, 0, 13, 10, 4, 9, 1, 7},
     {0, 15, 13, 1, 3, 11, 4, 6, 2}},
    {{0, 4, 1, 0, 13, 12, 1, 11, 2},
     {0, 15, 13, 7, 8, 11, 15, 0, 15},
     {0, 1, 14, 6, 6, 2, 14, 4, 11},
     {0, 12, 8, 10, 15, 8, 3, 11, 1}},
    {{0, 13, 8, 9, 14, 4, 10, 2, 8},
     {0, 7, 4, 0, 11, 2, 4, 11, 13},
     {0, 14, 7, 4, 9, 1, 15, 11, 4},
     {0, 8, 10, 13, 0, 12, 2, 13, 14}},
    {{0, 1, 14, 14, 3, 1, 15, 14, 4},
     {0, 4, 7, 9, 5, 12, 2, 7, 8},
     {0, 8, 11, 9, 0, 11, 5, 13, 1},
     {0, 2, 1, 0, 6, 7, 12, 8, 7}},
    {{0, 2, 6, 6, 0, 7, 9, 15, 6},
     {0, 14, 15, 3, 6, 4, 7, 4, 10},
     {0, 13, 10, 8, 12, 10, 2, 12, 9},
     {0, 4, 3, 6, 10, 1, 9, 1, 4}},
    {{0, 15, 11, 3, 6, 10, 2, 0, 15},
     {0, 2, 2, 4, 15, 7, 12, 9, 3},
     {0, 6, 4, 15, 11, 13, 8, 3, 12},
     {0, 9, 15, 9, 1, 14, 5, 4, 10}},
    {{0, 11, 3, 15, 9, 11, 6, 8, 11},
     {0, 13, 8, 6, 0, 13, 9, 1, 7},
     {0, 2, 13, 3, 7, 7, 12, 7, 14},
     {0, 1, 4, 8, 13, 2, 15, 10, 8}},
    {{0, 8, 4, 5, 10, 6, 8, 13, 1},
     {0, 1, 14, 10, 3, 1, 5, 10, 4},
     {0, 11, 1, 0, 13, 8, 3, 14, 2},
     {0, 7, 2, 7, 8, 13, 10, 7, 13}},
    {{0, 3, 9, 1, 1, 8, 0, 3, 10},
     {0, 10, 12, 2, 4, 5, 6, 14, 12},
     {0, 15, 5, 11, 15, 15, 7, 10, 0},
     {0, 5, 11, 4, 9, 6, 11, 9, 15}},
    {{0, 10, 7, 13, 2, 5, 13, 12, 9},
     {0, 6, 0, 8, 7, 0, 1, 3, 5},
     {0, 12, 8, 1, 1, 9, 0, 15, 6},
     {0, 11, 6, 15, 4, 15, 14, 5, 12}},
    {{0, 6, 2, 12, 8, 3, 3, 9, 3},
     {0, 12, 1, 5, 2, 15, 13, 5, 6},
     {0, 9, 12, 2, 3, 12, 4, 6, 10},
     {0, 3, 7, 14, 5, 0, 1, 0, 9}},
    {{0, 12, 13, 7, 5, 15, 4, 7, 14},
     {0, 11, 10, 14, 12, 10, 14, 12, 11},
     {0, 7, 6, 12, 14, 5, 10, 8, 13},
     {0, 14, 12, 3, 11, 9, 7, 15, 0}},
    {{0, 5, 12, 11, 11, 13, 14, 5, 5},
     {0, 9, 6, 12, 1, 3, 0, 2, 0},
     {0, 3, 9, 5, 5, 6, 1, 0, 15},
     {0, 10, 0, 11, 12, 10, 6, 14, 3}},
    {{0, 9, 0, 4, 12, 0, 7, 10, 0},
     {0, 5, 9, 11, 10, 9, 11, 15, 14},
     {0, 10, 3, 10, 2, 3, 13, 5, 3},
     {0, 0, 5, 5, 7, 4, 0, 2, 5}},
    {{0, 0, 5, 2, 4, 14, 5, 6, 12},
     {0, 3, 11, 15, 14, 8, 3, 8, 9},
     {0, 5, 2, 14, 8, 0, 11, 9, 5},
     {0, 6, 14, 2, 2, 5, 8, 3, 6}},
    {{0, 7, 10, 8, 15, 9, 11, 1, 7},
     {0, 8, 5, 1, 9, 6, 8, 6, 2},
     {0, 0, 15, 7, 4, 14, 6, 2, 8},
     {0, 13, 9, 12, 14, 3, 13, 12, 11}}};

  /* Maps a 4-bit value to the same value with its bit order reversed. */
  volatile char ibin[16] = {0, 8, 4, 12, 2, 10, 6, 14,
                            1, 9, 5, 13, 3, 11, 7, 15};

  ndes_great ie;
  unsigned long itmp, ietmp1, ietmp2;
  char iec[9];
  int irow, icol, iss, l, m;
  int volatile j, jj;
  unsigned long *p;

  /* Expand ir into three 16-bit words, one table entry per output bit. */
  p = ndes_bit;
  ie.r = ie.c = ie.l = 0;

  __pragma_loopbound(16, 16);
  for (j = 16, l = 32, m = 48; j >= 1; j--, l--, m--) {
    ie.r = (ie.r << 1) | (p[iet[j]] & ir ? 1 : 0);
    ie.c = (ie.c << 1) | (p[iet[l]] & ir ? 1 : 0);
    ie.l = (ie.l << 1) | (p[iet[m]] & ir ? 1 : 0);
  }

  /* Mix in the sub-key. */
  ie.r ^= k.r;
  ie.c ^= k.c;
  ie.l ^= k.l;

  /* Repack the 48 bits as two 24-bit words and cut them into 6-bit groups
     iec[1..8]. */
  ietmp1 = ((unsigned long) ie.c << 16) + (unsigned long) ie.r;
  ietmp2 = ((unsigned long) ie.l << 8) + ((unsigned long) ie.c >> 8);

  __pragma_loopbound(4, 4);
  for (j = 1, m = 5; j <= 4; j++, m++) {
    iec[j] = ietmp1 & 0x3fL;
    iec[m] = ietmp2 & 0x3fL;
    ietmp1 >>= 6;
    ietmp2 >>= 6;
  }

  /* Substitute each 6-bit group by a 4-bit value and concatenate them. */
  itmp = 0L;

  __pragma_loopbound(8, 8);
  for (jj = 8; jj >= 1; jj--) {
    j = iec[jj];
    irow = ((j & 0x1) << 1) + ((j & 0x20) >> 5);
    icol = ((j & 0x2) << 2) + (j & 0x4) + ((j & 0x8) >> 2) + ((j & 0x10) >> 4);
    iss = is[icol][irow][jj];
    itmp = (itmp << 4) | ibin[iss];
  }

  /* Permute itmp through table ipp into *iout. */
  *iout = 0L;
  p = ndes_bit;

  __pragma_loopbound(32, 32);
  for (j = 32; j >= 1; j--) {
    /* Both statements belong to the loop body. Without the braces only the
       shift was repeated and the OR ran once after the loop with j == 0,
       reading ipp[0] == 0 and ndes_bit[0] (never written in this file), so
       *iout always came out as 0 and the substitution result was discarded. */
    *iout = (*iout << 1);
    *iout |= (p[ipp[j]] & itmp ? 1 : 0);
  }
}

/*
  Returns 1 if bit number `bitno` of `source` is set, 0 otherwise.
  Bits 1..nbits are taken from source.r, higher bit numbers from source.l
  (as bit `bitno - nbits`). Uses the masks in ndes_bit.
*/
__attribute__((always_inline)) static inline unsigned long ndes_getbit(
    ndes_immense source, int bitno, int nbits)
{
  if (bitno <= nbits)
    return ndes_bit[bitno] & source.r ? 1L : 0L;
  else
    return ndes_bit[bitno - nbits] & source.l ? 1L : 0L;
}

/*
  Produces sub-key number `n` in *kn from the global working key ndes_icd.

  Both halves of ndes_icd are rotated right within 28 bits: by one position
  for n in {1, 2, 9, 16}, by two positions otherwise. Then 48 bits are
  selected through ndes_ipc2, 16 into each of kn->r, kn->c and kn->l.
  ndes_icd is modified, so calls must be made in round order.
*/
void ndes_ks(/*ndes_immense key, */ int n, ndes_great *kn)
{
  int i, j, k, l;

  if (n == 1 || n == 2 || n == 9 || n == 16) {
    /* Copy bit 0 to bit 28, then shift right: a 28-bit rotate by one. */
    ndes_icd.r = (ndes_icd.r | ((ndes_icd.r & 1L) << 28)) >> 1;
    ndes_icd.l = (ndes_icd.l | ((ndes_icd.l & 1L) << 28)) >> 1;
  } else {
    __pragma_loopbound(2, 2);
    for (i = 1; i <= 2; i++) {
      ndes_icd.r = (ndes_icd.r | ((ndes_icd.r & 1L) << 28)) >> 1;
      ndes_icd.l = (ndes_icd.l | ((ndes_icd.l & 1L) << 28)) >> 1;
    }
  }

  (*kn).r = (*kn).c = (*kn).l = 0;

  __pragma_loopbound(16, 16);
  for (j = 16, k = 32, l = 48; j >= 1; j--, k--, l--) {
    (*kn).r = (*kn).r << 1;
    (*kn).r = ((*kn).r) |
              (unsigned short) ndes_getbit(ndes_icd, ndes_ipc2[j], 28);
    (*kn).c = (*kn).c << 1;
    (*kn).c = ((*kn).c) |
              (unsigned short) ndes_getbit(ndes_icd, ndes_ipc2[k], 28);
    (*kn).l = (*kn).l << 1;
    (*kn).l = ((*kn).l) |
              (unsigned short) ndes_getbit(ndes_icd, ndes_ipc2[l], 28);
  }
}

/*
  Sanity check of the run: returns 0 when the sum of the two working key
  halves equals 8390656, and 1 otherwise.
*/
__attribute__((always_inline)) static inline int ndes_return(void)
{
  return (ndes_icd.r + ndes_icd.l + (-8390656)) != 0;
}

/*
  Benchmark kernel, exported as "entrypoint": one ndes_des call on the global
  input, key and flags, with the result stored in ndes_out.
*/
__attribute__((noinline)) __attribute__((export_name("entrypoint")))
void ndes_main(void)
{
  ndes_des(ndes_inp, ndes_key, &ndes_newkey, ndes_isw, &ndes_out);
}

/*
  main function
*/

/* Initializes the globals, runs the kernel once and returns the sanity-check
   result (0 on success). */
__attribute__((noinline)) __attribute__((export_name("main")))
int main(void)
{
  ndes_init();
  ndes_main();

  return (ndes_return());
}