Skip to content

Commit

Permalink
Optimized hashAes1Rx4
Browse files Browse the repository at this point in the history
  • Loading branch information
SChernykh committed Nov 4, 2019
1 parent c6a7e00 commit de1bdd2
Showing 1 changed file with 5 additions and 6 deletions.
11 changes: 5 additions & 6 deletions src/RandomX/aes_cuda.hpp
Original file line number Diff line number Diff line change
Expand Up @@ -793,12 +793,11 @@ __global__ void hashAes1Rx4(const void* input, void* hash, uint32_t batch_size)

#define ITER(m) \
{ \
-uint32_t k[4], y[4]; \
-*(uint4*)(k) = p[m * 4]; \
-y[0] = t0[get_byte(x[0], 0)] ^ t1[get_byte(x[1], s1)] ^ t2[get_byte(x[2], 16)] ^ t3[get_byte(x[3], s3)] ^ k[0]; \
-y[1] = t0[get_byte(x[1], 0)] ^ t1[get_byte(x[2], s1)] ^ t2[get_byte(x[3], 16)] ^ t3[get_byte(x[0], s3)] ^ k[1]; \
-y[2] = t0[get_byte(x[2], 0)] ^ t1[get_byte(x[3], s1)] ^ t2[get_byte(x[0], 16)] ^ t3[get_byte(x[1], s3)] ^ k[2]; \
-y[3] = t0[get_byte(x[3], 0)] ^ t1[get_byte(x[0], s1)] ^ t2[get_byte(x[1], 16)] ^ t3[get_byte(x[2], s3)] ^ k[3]; \
+uint32_t y[4]; \
+y[0] = t0[get_byte(x[0], 0)] ^ t1[get_byte(x[1], s1)] ^ t2[get_byte(x[2], 16)] ^ t3[get_byte(x[3], s3)] ^ p[m * 4].x; \
+y[1] = t0[get_byte(x[1], 0)] ^ t1[get_byte(x[2], s1)] ^ t2[get_byte(x[3], 16)] ^ t3[get_byte(x[0], s3)] ^ p[m * 4].y; \
+y[2] = t0[get_byte(x[2], 0)] ^ t1[get_byte(x[3], s1)] ^ t2[get_byte(x[0], 16)] ^ t3[get_byte(x[1], s3)] ^ p[m * 4].z; \
+y[3] = t0[get_byte(x[3], 0)] ^ t1[get_byte(x[0], s1)] ^ t2[get_byte(x[1], 16)] ^ t3[get_byte(x[2], s3)] ^ p[m * 4].w; \
x[0] = y[0]; \
x[1] = y[1]; \
x[2] = y[2]; \
Expand Down

0 comments on commit de1bdd2

Please sign in to comment.