mirror of
https://github.com/sockspls/badfish
synced 2025-07-12 03:59:15 +00:00

This aims to remove some of the annoying global structure which Stockfish has. Overall there is no major elo regression to be expected. Non regression SMP STC (paused, early version): https://tests.stockfishchess.org/tests/view/65983d7979aa8af82b9608f1 LLR: 0.23 (-2.94,2.94) <-1.75,0.25> Total: 76232 W: 19035 L: 19096 D: 38101 Ptnml(0-2): 92, 8735, 20515, 8690, 84 Non regression STC (early version): https://tests.stockfishchess.org/tests/view/6595b3a479aa8af82b95da7f LLR: 2.93 (-2.94,2.94) <-1.75,0.25> Total: 185344 W: 47027 L: 46972 D: 91345 Ptnml(0-2): 571, 21285, 48943, 21264, 609 Non regression SMP STC: https://tests.stockfishchess.org/tests/view/65a0715c79aa8af82b96b7e4 LLR: 2.94 (-2.94,2.94) <-1.75,0.25> Total: 142936 W: 35761 L: 35662 D: 71513 Ptnml(0-2): 209, 16400, 38135, 16531, 193 These global structures/variables add hidden dependencies and allow data to be mutable from where it shouldn't it be (i.e. options). They also prevent Stockfish from internal selfplay, which would be a nice thing to be able to do, i.e. instantiate two Stockfish instances and let them play against each other. It will also allow us to make Stockfish a library, which can be easier used on other platforms. For consistency with the old search code, `thisThread` has been kept, even though it is not strictly necessary anymore. This the first major refactor of this kind (in recent time), and future changes are required, to achieve the previously described goals. This includes cleaning up the dependencies, transforming the network to be self contained and coming up with a plan to deal with proper tablebase memory management (see comments for more information on this). The removal of these global structures has been discussed in parts with Vondele and Sopel. closes https://github.com/official-stockfish/Stockfish/pull/4968 No functional change
152 lines
5.3 KiB
C++
152 lines
5.3 KiB
C++
/*
|
|
Stockfish, a UCI chess playing engine derived from Glaurung 2.1
|
|
Copyright (C) 2004-2024 The Stockfish developers (see AUTHORS file)
|
|
|
|
Stockfish is free software: you can redistribute it and/or modify
|
|
it under the terms of the GNU General Public License as published by
|
|
the Free Software Foundation, either version 3 of the License, or
|
|
(at your option) any later version.
|
|
|
|
Stockfish is distributed in the hope that it will be useful,
|
|
but WITHOUT ANY WARRANTY; without even the implied warranty of
|
|
MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
|
|
GNU General Public License for more details.
|
|
|
|
You should have received a copy of the GNU General Public License
|
|
along with this program. If not, see <http://www.gnu.org/licenses/>.
|
|
*/
|
|
|
|
#include "tt.h"
|
|
|
|
#include <cassert>
|
|
#include <cstdlib>
|
|
#include <cstring>
|
|
#include <iostream>
|
|
#include <thread>
|
|
#include <vector>
|
|
|
|
#include "misc.h"
|
|
|
|
namespace Stockfish {
|
|
|
|
// Populates the TTEntry with a new node's data, possibly
|
|
// overwriting an old position. The update is not atomic and can be racy.
|
|
void TTEntry::save(
|
|
Key k, Value v, bool pv, Bound b, Depth d, Move m, Value ev, uint8_t generation8) {
|
|
|
|
// Preserve any existing move for the same position
|
|
if (m || uint16_t(k) != key16)
|
|
move16 = m;
|
|
|
|
// Overwrite less valuable entries (cheapest checks first)
|
|
if (b == BOUND_EXACT || uint16_t(k) != key16 || d - DEPTH_OFFSET + 2 * pv > depth8 - 4)
|
|
{
|
|
assert(d > DEPTH_OFFSET);
|
|
assert(d < 256 + DEPTH_OFFSET);
|
|
|
|
key16 = uint16_t(k);
|
|
depth8 = uint8_t(d - DEPTH_OFFSET);
|
|
genBound8 = uint8_t(generation8 | uint8_t(pv) << 2 | b);
|
|
value16 = int16_t(v);
|
|
eval16 = int16_t(ev);
|
|
}
|
|
}
|
|
|
|
|
|
// Sets the size of the transposition table,
|
|
// measured in megabytes. Transposition table consists of a power of 2 number
|
|
// of clusters and each cluster consists of ClusterSize number of TTEntry.
|
|
void TranspositionTable::resize(size_t mbSize, int threadCount) {
|
|
aligned_large_pages_free(table);
|
|
|
|
clusterCount = mbSize * 1024 * 1024 / sizeof(Cluster);
|
|
|
|
table = static_cast<Cluster*>(aligned_large_pages_alloc(clusterCount * sizeof(Cluster)));
|
|
if (!table)
|
|
{
|
|
std::cerr << "Failed to allocate " << mbSize << "MB for transposition table." << std::endl;
|
|
exit(EXIT_FAILURE);
|
|
}
|
|
|
|
clear(threadCount);
|
|
}
|
|
|
|
|
|
// Initializes the entire transposition table to zero,
|
|
// in a multi-threaded way.
|
|
void TranspositionTable::clear(size_t threadCount) {
|
|
std::vector<std::thread> threads;
|
|
|
|
for (size_t idx = 0; idx < size_t(threadCount); ++idx)
|
|
{
|
|
threads.emplace_back([this, idx, threadCount]() {
|
|
// Thread binding gives faster search on systems with a first-touch policy
|
|
if (threadCount > 8)
|
|
WinProcGroup::bindThisThread(idx);
|
|
|
|
// Each thread will zero its part of the hash table
|
|
const size_t stride = size_t(clusterCount / threadCount), start = size_t(stride * idx),
|
|
len = idx != size_t(threadCount) - 1 ? stride : clusterCount - start;
|
|
|
|
std::memset(&table[start], 0, len * sizeof(Cluster));
|
|
});
|
|
}
|
|
|
|
for (std::thread& th : threads)
|
|
th.join();
|
|
}
|
|
|
|
|
|
// Looks up the current position in the transposition
|
|
// table. It returns true and a pointer to the TTEntry if the position is found.
|
|
// Otherwise, it returns false and a pointer to an empty or least valuable TTEntry
|
|
// to be replaced later. The replace value of an entry is calculated as its depth
|
|
// minus 8 times its relative age. TTEntry t1 is considered more valuable than
|
|
// TTEntry t2 if its replace value is greater than that of t2.
|
|
TTEntry* TranspositionTable::probe(const Key key, bool& found) const {
|
|
|
|
TTEntry* const tte = first_entry(key);
|
|
const uint16_t key16 = uint16_t(key); // Use the low 16 bits as key inside the cluster
|
|
|
|
for (int i = 0; i < ClusterSize; ++i)
|
|
if (tte[i].key16 == key16 || !tte[i].depth8)
|
|
{
|
|
tte[i].genBound8 =
|
|
uint8_t(generation8 | (tte[i].genBound8 & (GENERATION_DELTA - 1))); // Refresh
|
|
|
|
return found = bool(tte[i].depth8), &tte[i];
|
|
}
|
|
|
|
// Find an entry to be replaced according to the replacement strategy
|
|
TTEntry* replace = tte;
|
|
for (int i = 1; i < ClusterSize; ++i)
|
|
// Due to our packed storage format for generation and its cyclic
|
|
// nature we add GENERATION_CYCLE (256 is the modulus, plus what
|
|
// is needed to keep the unrelated lowest n bits from affecting
|
|
// the result) to calculate the entry age correctly even after
|
|
// generation8 overflows into the next cycle.
|
|
if (replace->depth8
|
|
- ((GENERATION_CYCLE + generation8 - replace->genBound8) & GENERATION_MASK)
|
|
> tte[i].depth8
|
|
- ((GENERATION_CYCLE + generation8 - tte[i].genBound8) & GENERATION_MASK))
|
|
replace = &tte[i];
|
|
|
|
return found = false, replace;
|
|
}
|
|
|
|
|
|
// Returns an approximation of the hashtable
|
|
// occupation during a search. The hash is x permill full, as per UCI protocol.
|
|
|
|
int TranspositionTable::hashfull() const {
|
|
|
|
int cnt = 0;
|
|
for (int i = 0; i < 1000; ++i)
|
|
for (int j = 0; j < ClusterSize; ++j)
|
|
cnt += table[i].entry[j].depth8
|
|
&& (table[i].entry[j].genBound8 & GENERATION_MASK) == generation8;
|
|
|
|
return cnt / ClusterSize;
|
|
}
|
|
|
|
} // namespace Stockfish
|