// Keccak benchmark driver (built on the definitions pulled in from "keccak.cu").
//
// NOTE(review): this line is DAMAGED. The text between `for (int i=0; i` and
// `>>>();` is missing -- it looks like everything from a `<` up to a later `>`
// was stripped by an extraction step. As it stands the line does not compile.
// Restore it from the original file / version control; do not reconstruct it by
// guesswork. What is lost:
//   - the loop condition, increment and body of the `for` in bench_kernel
//   - the rest of bench_kernel, including whatever it does with `s` and `result`
//   - the header of the host function that owns the trailing `return`
//   - the kernel name and launch configuration of the `<<<...>>>` launch
//
// What the surviving text establishes:
//   - `count` is a file-scope constant equal to 100000. Presumably it is the
//     loop bound of the benchmark loop -- TODO confirm once the loop is restored.
//   - `result` is a __device__ variable of type keccak::Result. No use of it
//     survives in the visible text.
//   - bench_kernel is a __global__ function taking no arguments. It declares a
//     __shared__ keccak::SharedState `s` and a local keccak::RegisterState `r`,
//     calls keccak::init(r), and then enters a loop starting at i = 0.
//   - The tail launches a kernel with an empty argument list, then returns the
//     value of `cudaPeekAtLastError() != cudaSuccess`: zero when no error is
//     pending, nonzero otherwise. Presumably this is main() and the value is the
//     process exit status -- TODO confirm.
//
// NOTE(review): no synchronizing call is visible between the launch and the
// cudaPeekAtLastError() check. Without one, the check reports launch errors
// only; faults raised while the kernel runs surface at the next synchronizing
// call. Confirm whether the missing text contained a synchronization.
#include "keccak.cu" const int count = 100000; __device__ keccak::Result result; __global__ void bench_kernel() { __shared__ keccak::SharedState s; keccak::RegisterState r; keccak::init(r); for (int i=0; i>>(); return cudaPeekAtLastError() != cudaSuccess; }