// See LICENSE for license details.
#ifndef __UTIL_H
#define __UTIL_H
//--------------------------------------------------------------------------
// Macros

// Set HOST_DEBUG to 1 if you are going to compile this for a host
// machine (i.e. Athena/Linux) for debug purposes and set HOST_DEBUG
// to 0 if you are compiling with the smips-gcc toolchain.
// A value supplied by the build (e.g. -DHOST_DEBUG=1) takes precedence;
// otherwise it defaults to 0.

#ifndef HOST_DEBUG
#define HOST_DEBUG 0
#endif
// Set PREALLOCATE to 1 if you want to preallocate the benchmark
// function before starting stats. If you have instruction/data
// caches and you don't want to count the overhead of misses, then
// you will need to use preallocation.
// A value supplied by the build takes precedence; otherwise it
// defaults to 0.

#ifndef PREALLOCATE
#define PREALLOCATE 0
#endif
// setStats(enable) is the hook used to carve out the piece of a benchmark
// that actually does the computation.
// NOTE(review): the original comment spoke of a SET_STATS macro, but no
// such macro is referenced anywhere in this header.
//
// Host debug builds (HOST_DEBUG != 0) pull in <stdio.h> and get a no-op
// stub; every other build only sees the declaration and must link against
// a definition supplied elsewhere.

#if HOST_DEBUG
#include <stdio.h>
static void setStats(int enable) { (void)enable; }
#else
extern void setStats(int enable);
#endif
#include <stdint.h>

// Compile-time assertion for use at statement scope; takes the condition
// only (no message argument).
//
// A false condition turns the second label into `case 0`, duplicating the
// first one, which the compiler rejects. A true condition produces the
// distinct labels 0 and 1 around an empty statement.
//
// <assert.h> defines its own static_assert macro in C11; remove any such
// definition first so this one is not an incompatible redefinition.
#undef static_assert
#define static_assert(cond) switch(0) { case 0: case !!(long)(cond): ; }
// Prints `name` followed by the first n elements of an int array on a
// single line.
//
// Only host debug builds (HOST_DEBUG != 0) print anything; in every other
// build the function body is empty.
//
//   name  label printed in front of the values
//   n     number of elements of arr to print
//   arr   values to print
static void printArray(const char name[], int n, const int arr[])
{
#if HOST_DEBUG
  int i;

  printf( " %10s :", name );
  for ( i = 0; i < n; i++ )
    printf( " %3d ", arr[i] );
  printf( "\n" );
#else
  // Nothing is printed here; reference the parameters so that non-debug
  // builds do not warn about them being unused.
  (void)name;
  (void)n;
  (void)arr;
#endif
}
// Prints `name` followed by the first n elements of a double array on a
// single line, each formatted with %g.
//
// Only host debug builds (HOST_DEBUG != 0) print anything; in every other
// build the function body is empty.
//
//   name  label printed in front of the values
//   n     number of elements of arr to print
//   arr   values to print
static void printDoubleArray(const char name[], int n, const double arr[])
{
#if HOST_DEBUG
  int i;

  printf( " %10s :", name );
  for ( i = 0; i < n; i++ )
    printf( " %g ", arr[i] );
  printf( "\n" );
#else
  // Nothing is printed here; reference the parameters so that non-debug
  // builds do not warn about them being unused.
  (void)name;
  (void)n;
  (void)arr;
#endif
}
// Compares the first n elements of `test` against the reference `verify`.
//
//   n       number of elements to compare
//   test    computed results (read through a volatile pointer)
//   verify  expected values
//
// Returns 0 when every element matches (or when n <= 0, i.e. there is
// nothing to compare); otherwise returns the 1-based position of the first
// mismatching element.
static int verify(int n, const volatile int* test, const int* verify)
{
  int i;

  // A non-positive count has no elements. Without this guard a negative
  // odd n would reach the tail check below and read test[n-1], which lies
  // before the start of the array.
  if (n <= 0)
    return 0;

  // Unrolled for faster verification: two elements per iteration, with
  // both loads issued before either comparison.
  for (i = 0; i < n/2*2; i += 2)
  {
    int t0 = test[i], t1 = test[i+1];
    int v0 = verify[i], v1 = verify[i+1];
    if (t0 != v0) return i+1;
    if (t1 != v1) return i+2;
  }

  // Odd n leaves one trailing element that the paired loop did not visit.
  if (n % 2 != 0 && test[n-1] != verify[n-1])
    return n;

  return 0;
}
// Compares the first n elements of `test` against the reference `verify`
// using exact floating-point equality.
//
//   n       number of elements to compare
//   test    computed results (read through a volatile pointer)
//   verify  expected values
//
// Returns 0 when every element matches (or when n <= 0, i.e. there is
// nothing to compare); otherwise returns the 1-based position of the first
// mismatching element.
static int verifyDouble(int n, const volatile double* test, const double* verify)
{
  int i;

  // A non-positive count has no elements. Without this guard a negative
  // odd n would reach the tail check below and read test[n-1], which lies
  // before the start of the array.
  if (n <= 0)
    return 0;

  // Unrolled for faster verification: two elements per iteration.
  for (i = 0; i < n/2*2; i += 2)
  {
    double t0 = test[i], t1 = test[i+1];
    double v0 = verify[i], v1 = verify[i+1];
    int eq1 = t0 == v0, eq2 = t1 == v1;
    // When the pair is not fully equal, eq1 selects which element failed:
    // eq1 == 0 -> element i (position i+1), eq1 == 1 -> element i+1
    // (position i+2).
    if (!(eq1 & eq2)) return i+1+eq1;
  }

  // Odd n leaves one trailing element that the paired loop did not visit.
  if (n % 2 != 0 && test[n-1] != verify[n-1])
    return n;

  return 0;
}
// Sense-reversing barrier: blocks the caller until `ncores` threads have
// called barrier(), then releases all of them.
//
//   ncores  number of threads that must arrive before anyone proceeds;
//           every participant has to pass the same value
//
// `count` tallies arrivals and `sense` is the shared release flag. Each
// thread keeps its own `threadsense`, flipped on every call, and waits
// until the shared flag equals it. The last thread to arrive resets the
// counter and publishes its sense, which releases the spinning threads.
// Full memory barriers on entry and exit order the caller's surrounding
// memory accesses with respect to the barrier.
static void __attribute__((noinline)) barrier(int ncores)
{
  static volatile int sense;
  static volatile int count;
  static __thread int threadsense;

  __sync_synchronize();

  threadsense = !threadsense;
  if (__sync_fetch_and_add(&count, 1) == ncores-1)
  {
    count = 0;
    // The counter reset must be visible before waiters are released.
    // Otherwise, on a weakly ordered machine, a released thread could
    // re-enter the barrier and increment `count` before the reset lands,
    // and the reset would then wipe out that arrival.
    __sync_synchronize();
    sense = threadsense;
  }
  else while(sense != threadsense)
    ;

  __sync_synchronize();
}
// Advances a linear-feedback shift register by one step.
//
// The state is shifted right by one bit; the feedback bit is the XOR of
// the two lowest bits of the old state and is inserted at bit 62.
//
//   x  current state
//
// Returns the next state. A state of 0 maps to 0.
static uint64_t lfsr(uint64_t x)
{
  const uint64_t shifted = x >> 1;
  // Bit 0 of (x ^ (x >> 1)) is bit0 XOR bit1 of the old state.
  const uint64_t feedback = (x ^ shifted) & 1;

  return shifted | (feedback << 62);
}
#ifdef __riscv
#include "encoding.h"
#endif

// Two-level stringification so that macro arguments are expanded before
// being turned into a string literal.
#define stringify_1(s) #s
#define stringify(s) stringify_1(s)

// stats(code, iter): runs `code` once and reports the cost measured around
// it.
//
//   code  statement or expression to execute; its source text is also
//         printed as the label of the report
//   iter  number of iterations `code` performed, used as the divisor for
//         the cycles/iter figure (evaluated twice, only when printing)
//
// The mcycle and minstret counters are sampled through read_csr() before
// and after `code`. Starting from the negated first sample and adding the
// second yields the difference in unsigned arithmetic. The report is
// printed only where `cid == 0`, with one decimal digit for cycles/iter
// and for CPI.
//
// Requirements at the point of use: read_csr() (presumably provided by
// encoding.h on RISC-V builds -- confirm), a variable `cid`, and a
// declaration of printf.
//
// `iter` is parenthesized so that an argument such as `a + b` divides as a
// whole, and the unsigned long values are printed with %lu.
#define stats(code, iter) do { \
    unsigned long _c = -read_csr(mcycle), _i = -read_csr(minstret); \
    code; \
    _c += read_csr(mcycle), _i += read_csr(minstret); \
    if (cid == 0) \
      printf("\n%s: %lu cycles, %lu.%lu cycles/iter, %lu.%lu CPI\n", \
             stringify(code), _c, _c/(iter), 10*_c/(iter)%10, _c/_i, 10*_c/_i%10); \
  } while(0)
#endif //__UTIL_H