mirror of
https://github.com/sockspls/badfish
synced 2025-05-03 18:19:35 +00:00

Use TT memory functions to allocate memory for the NNUE weights.

This should provide a small speed-up on systems where large pages are not
automatically used, including Windows and some Linux distributions.

Further, since we now have a wrapper for std::aligned_alloc(), we can
simplify the TT memory management a bit:

- We no longer need to store separate pointers to the hash table and its
  underlying memory allocation.
- We also get to merge the Linux-specific and default implementations of
  aligned_ttmem_alloc().

Finally, we'll enable the VirtualAlloc code path with large page support
also for Win32.

STC: https://tests.stockfishchess.org/tests/view/5f66595823a84a47b9036fba
LLR: 2.94 (-2.94,2.94) {-0.25,1.25}
Total: 14896 W: 1854 L: 1686 D: 11356
Ptnml(0-2): 65, 1224, 4742, 1312, 105

closes https://github.com/official-stockfish/Stockfish/pull/3081

No functional change.
97 lines
2.8 KiB
C++
97 lines
2.8 KiB
C++
/*
|
|
Stockfish, a UCI chess playing engine derived from Glaurung 2.1
|
|
Copyright (C) 2004-2020 The Stockfish developers (see AUTHORS file)
|
|
|
|
Stockfish is free software: you can redistribute it and/or modify
|
|
it under the terms of the GNU General Public License as published by
|
|
the Free Software Foundation, either version 3 of the License, or
|
|
(at your option) any later version.
|
|
|
|
Stockfish is distributed in the hope that it will be useful,
|
|
but WITHOUT ANY WARRANTY; without even the implied warranty of
|
|
MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
|
|
GNU General Public License for more details.
|
|
|
|
You should have received a copy of the GNU General Public License
|
|
along with this program. If not, see <http://www.gnu.org/licenses/>.
|
|
*/
|
|
|
|
#ifndef TT_H_INCLUDED
|
|
#define TT_H_INCLUDED
|
|
|
|
#include "misc.h"
|
|
#include "types.h"
|
|
|
|
/// TTEntry struct is the 10 bytes transposition table entry, defined as below:
|
|
///
|
|
/// key 16 bit
|
|
/// depth 8 bit
|
|
/// generation 5 bit
|
|
/// pv node 1 bit
|
|
/// bound type 2 bit
|
|
/// move 16 bit
|
|
/// value 16 bit
|
|
/// eval value 16 bit
|
|
|
|
struct TTEntry {
|
|
|
|
Move move() const { return (Move )move16; }
|
|
Value value() const { return (Value)value16; }
|
|
Value eval() const { return (Value)eval16; }
|
|
Depth depth() const { return (Depth)depth8 + DEPTH_OFFSET; }
|
|
bool is_pv() const { return (bool)(genBound8 & 0x4); }
|
|
Bound bound() const { return (Bound)(genBound8 & 0x3); }
|
|
void save(Key k, Value v, bool pv, Bound b, Depth d, Move m, Value ev);
|
|
|
|
private:
|
|
friend class TranspositionTable;
|
|
|
|
uint16_t key16;
|
|
uint8_t depth8;
|
|
uint8_t genBound8;
|
|
uint16_t move16;
|
|
int16_t value16;
|
|
int16_t eval16;
|
|
};
|
|
|
|
|
|
/// A TranspositionTable is an array of Cluster, of size clusterCount. Each
|
|
/// cluster consists of ClusterSize number of TTEntry. Each non-empty TTEntry
|
|
/// contains information on exactly one position. The size of a Cluster should
|
|
/// divide the size of a cache line for best performance, as the cacheline is
|
|
/// prefetched when possible.
|
|
|
|
class TranspositionTable {
|
|
|
|
static constexpr int ClusterSize = 3;
|
|
|
|
struct Cluster {
|
|
TTEntry entry[ClusterSize];
|
|
char padding[2]; // Pad to 32 bytes
|
|
};
|
|
|
|
static_assert(sizeof(Cluster) == 32, "Unexpected Cluster size");
|
|
|
|
public:
|
|
~TranspositionTable() { aligned_large_pages_free(table); }
|
|
void new_search() { generation8 += 8; } // Lower 3 bits are used by PV flag and Bound
|
|
TTEntry* probe(const Key key, bool& found) const;
|
|
int hashfull() const;
|
|
void resize(size_t mbSize);
|
|
void clear();
|
|
|
|
TTEntry* first_entry(const Key key) const {
|
|
return &table[mul_hi64(key, clusterCount)].entry[0];
|
|
}
|
|
|
|
private:
|
|
friend struct TTEntry;
|
|
|
|
size_t clusterCount;
|
|
Cluster* table;
|
|
uint8_t generation8; // Size must be not bigger than TTEntry::genBound8
|
|
};
|
|
|
|
/// Declaration of the global transposition table object; the definition
/// lives in another translation unit.
extern TranspositionTable TT;
|
|
|
|
#endif // #ifndef TT_H_INCLUDED
|