mirror of
https://github.com/SChernykh/p2pool.git
synced 2025-01-03 17:29:24 +00:00
113 lines
2.9 KiB
C++
113 lines
2.9 KiB
C++
|
/*
|
||
|
* This file is part of the Monero P2Pool <https://github.com/SChernykh/p2pool>
|
||
|
* Copyright (c) 2021-2024 SChernykh <https://github.com/SChernykh>
|
||
|
*
|
||
|
* This program is free software: you can redistribute it and/or modify
|
||
|
* it under the terms of the GNU General Public License as published by
|
||
|
* the Free Software Foundation, version 3.
|
||
|
*
|
||
|
* This program is distributed in the hope that it will be useful, but
|
||
|
* WITHOUT ANY WARRANTY; without even the implied warranty of
|
||
|
* MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
|
||
|
* General Public License for more details.
|
||
|
*
|
||
|
* You should have received a copy of the GNU General Public License
|
||
|
* along with this program. If not, see <http://www.gnu.org/licenses/>.
|
||
|
*/
|
||
|
|
||
|
#include "common.h"
|
||
|
#include "keccak.h"
|
||
|
|
||
|
#include <immintrin.h>
|
||
|
|
||
|
namespace p2pool {
|
||
|
|
||
|
#ifndef ROTL64
|
||
|
#define ROTL64(x, y) (((x) << (y)) | ((x) >> (64 - (y))))
|
||
|
#endif
|
||
|
|
||
|
#if defined(__GNUC__) && (__GNUC__ < 12) && !defined(_andn_u64)
|
||
|
#define _andn_u64 __andn_u64
|
||
|
#endif
|
||
|
|
||
|
NOINLINE void keccakf_bmi(std::array<uint64_t, 25>& st)
|
||
|
{
|
||
|
for (int round = 0; round < KeccakParams::ROUNDS; ++round) {
|
||
|
uint64_t bc[5];
|
||
|
|
||
|
// Theta
|
||
|
bc[0] = st[0] ^ st[5] ^ st[10] ^ st[15] ^ st[20];
|
||
|
bc[1] = st[1] ^ st[6] ^ st[11] ^ st[16] ^ st[21];
|
||
|
bc[2] = st[2] ^ st[7] ^ st[12] ^ st[17] ^ st[22];
|
||
|
bc[3] = st[3] ^ st[8] ^ st[13] ^ st[18] ^ st[23];
|
||
|
bc[4] = st[4] ^ st[9] ^ st[14] ^ st[19] ^ st[24];
|
||
|
|
||
|
#define THETA(i) { \
|
||
|
const uint64_t t = bc[(i + 4) % 5] ^ ROTL64(bc[(i + 1) % 5], 1); \
|
||
|
st[i + 0 ] ^= t; \
|
||
|
st[i + 5] ^= t; \
|
||
|
st[i + 10] ^= t; \
|
||
|
st[i + 15] ^= t; \
|
||
|
st[i + 20] ^= t; \
|
||
|
}
|
||
|
|
||
|
THETA(0);
|
||
|
THETA(1);
|
||
|
THETA(2);
|
||
|
THETA(3);
|
||
|
THETA(4);
|
||
|
|
||
|
// Rho Pi
|
||
|
const uint64_t t = st[1];
|
||
|
st[1] = ROTL64(st[6], 44);
|
||
|
st[6] = ROTL64(st[9], 20);
|
||
|
st[9] = ROTL64(st[22], 61);
|
||
|
st[22] = ROTL64(st[14], 39);
|
||
|
st[14] = ROTL64(st[20], 18);
|
||
|
st[20] = ROTL64(st[2], 62);
|
||
|
st[2] = ROTL64(st[12], 43);
|
||
|
st[12] = ROTL64(st[13], 25);
|
||
|
st[13] = ROTL64(st[19], 8);
|
||
|
st[19] = ROTL64(st[23], 56);
|
||
|
st[23] = ROTL64(st[15], 41);
|
||
|
st[15] = ROTL64(st[4], 27);
|
||
|
st[4] = ROTL64(st[24], 14);
|
||
|
st[24] = ROTL64(st[21], 2);
|
||
|
st[21] = ROTL64(st[8], 55);
|
||
|
st[8] = ROTL64(st[16], 45);
|
||
|
st[16] = ROTL64(st[5], 36);
|
||
|
st[5] = ROTL64(st[3], 28);
|
||
|
st[3] = ROTL64(st[18], 21);
|
||
|
st[18] = ROTL64(st[17], 15);
|
||
|
st[17] = ROTL64(st[11], 10);
|
||
|
st[11] = ROTL64(st[7], 6);
|
||
|
st[7] = ROTL64(st[10], 3);
|
||
|
st[10] = ROTL64(t, 1);
|
||
|
|
||
|
// Chi
|
||
|
#define CHI(j) { \
|
||
|
const uint64_t st0 = st[j ]; \
|
||
|
const uint64_t st1 = st[j + 1]; \
|
||
|
const uint64_t st2 = st[j + 2]; \
|
||
|
const uint64_t st3 = st[j + 3]; \
|
||
|
const uint64_t st4 = st[j + 4]; \
|
||
|
st[j ] ^= _andn_u64(st1, st2); \
|
||
|
st[j + 1] ^= _andn_u64(st2, st3); \
|
||
|
st[j + 2] ^= _andn_u64(st3, st4); \
|
||
|
st[j + 3] ^= _andn_u64(st4, st0); \
|
||
|
st[j + 4] ^= _andn_u64(st0, st1); \
|
||
|
}
|
||
|
|
||
|
CHI(0);
|
||
|
CHI(5);
|
||
|
CHI(10);
|
||
|
CHI(15);
|
||
|
CHI(20);
|
||
|
|
||
|
// Iota
|
||
|
st[0] ^= keccakf_rndc[round];
|
||
|
}
|
||
|
}
|
||
|
|
||
|
} // namespace p2pool
|