/* * This file is part of the Monero P2Pool * Copyright (c) 2021-2024 SChernykh * * This program is free software: you can redistribute it and/or modify * it under the terms of the GNU General Public License as published by * the Free Software Foundation, version 3. * * This program is distributed in the hope that it will be useful, but * WITHOUT ANY WARRANTY; without even the implied warranty of * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU * General Public License for more details. * * You should have received a copy of the GNU General Public License * along with this program. If not, see . */ #include "common.h" #include "keccak.h" #include namespace p2pool { #ifndef ROTL64 #define ROTL64(x, y) (((x) << (y)) | ((x) >> (64 - (y)))) #endif #if defined(__GNUC__) && (__GNUC__ < 12) && !defined(_andn_u64) #define _andn_u64 __andn_u64 #endif NOINLINE void keccakf_bmi(std::array& st) { for (int round = 0; round < KeccakParams::ROUNDS; ++round) { uint64_t bc[5]; // Theta bc[0] = st[0] ^ st[5] ^ st[10] ^ st[15] ^ st[20]; bc[1] = st[1] ^ st[6] ^ st[11] ^ st[16] ^ st[21]; bc[2] = st[2] ^ st[7] ^ st[12] ^ st[17] ^ st[22]; bc[3] = st[3] ^ st[8] ^ st[13] ^ st[18] ^ st[23]; bc[4] = st[4] ^ st[9] ^ st[14] ^ st[19] ^ st[24]; #define THETA(i) { \ const uint64_t t = bc[(i + 4) % 5] ^ ROTL64(bc[(i + 1) % 5], 1); \ st[i + 0 ] ^= t; \ st[i + 5] ^= t; \ st[i + 10] ^= t; \ st[i + 15] ^= t; \ st[i + 20] ^= t; \ } THETA(0); THETA(1); THETA(2); THETA(3); THETA(4); // Rho Pi const uint64_t t = st[1]; st[1] = ROTL64(st[6], 44); st[6] = ROTL64(st[9], 20); st[9] = ROTL64(st[22], 61); st[22] = ROTL64(st[14], 39); st[14] = ROTL64(st[20], 18); st[20] = ROTL64(st[2], 62); st[2] = ROTL64(st[12], 43); st[12] = ROTL64(st[13], 25); st[13] = ROTL64(st[19], 8); st[19] = ROTL64(st[23], 56); st[23] = ROTL64(st[15], 41); st[15] = ROTL64(st[4], 27); st[4] = ROTL64(st[24], 14); st[24] = ROTL64(st[21], 2); st[21] = ROTL64(st[8], 55); st[8] = ROTL64(st[16], 45); st[16] = ROTL64(st[5], 36); st[5] = ROTL64(st[3], 28); st[3] = ROTL64(st[18], 21); st[18] = ROTL64(st[17], 15); st[17] = ROTL64(st[11], 10); st[11] = ROTL64(st[7], 6); st[7] = ROTL64(st[10], 3); st[10] = ROTL64(t, 1); // Chi #define CHI(j) { \ const uint64_t st0 = st[j ]; \ const uint64_t st1 = st[j + 1]; \ const uint64_t st2 = st[j + 2]; \ const uint64_t st3 = st[j + 3]; \ const uint64_t st4 = st[j + 4]; \ st[j ] ^= _andn_u64(st1, st2); \ st[j + 1] ^= _andn_u64(st2, st3); \ st[j + 2] ^= _andn_u64(st3, st4); \ st[j + 3] ^= _andn_u64(st4, st0); \ st[j + 4] ^= _andn_u64(st0, st1); \ } CHI(0); CHI(5); CHI(10); CHI(15); CHI(20); // Iota st[0] ^= keccakf_rndc[round]; } } } // namespace p2pool