|
io-chess
UCI chess engine
|
Contains the globally shared, read-only weights for the Factorized MoE network. More...
#include <MoECacheModel.hpp>
Public Member Functions | |
| void | init_architecture (int branchConvLayers) |
Public Attributes | |
| std::array< Branch, 12 > | branches {} |
| std::array< float,(size_t) 12 *NET_MIXER_OUT *NET_BRANCH_DIM > | mixerWBr {} |
| std::array< float,(size_t) NET_BYPASS *NET_MIXER_OUT > | mixerWBp {} |
| std::array< float, NET_MIXER_OUT > | mixerB {} |
| std::array< float,(size_t) NET_MIXER_OUT *NET_GLOBALS > | globalW {} |
| std::array< float, NET_MIXER_OUT > | globalB {} |
| std::array< float,(size_t) NET_EXPERTS *NET_GLOBALS > | gateW {} |
| std::array< float, NET_EXPERTS > | gateB {} |
| std::array< Expert, NET_EXPERTS > | experts {} |
Static Public Attributes | |
| static constexpr int | bd = NET_BRANCH_DIM |
| static constexpr int | nf = NET_MIXER_OUT |
| static constexpr int | nBypass = NET_BYPASS |
| static constexpr int | nGlobals = NET_GLOBALS |
| static constexpr int | nExperts = NET_EXPERTS |
| static constexpr int | ebo = NET_EXPERT_BOTTLENECK |
| static constexpr int | eh = NET_EXPERT_HIDDEN |
Contains the globally shared, read-only weights for the Factorized MoE network.
This struct stores the pre-trained weights for all convolution branches, the mixer layer, the router gate, and the individual expert networks. In the engine, these weights are loaded once into memory and shared across all search threads.
|
inline |


|
static constexpr |
| std::array<Branch, 12> SharedMoEWeights::branches {} |
|
static constexpr |
|
static constexpr |
| std::array<Expert, NET_EXPERTS> SharedMoEWeights::experts {} |
| std::array<float, NET_EXPERTS> SharedMoEWeights::gateB {} |
| std::array<float, (size_t)NET_EXPERTS * NET_GLOBALS> SharedMoEWeights::gateW {} |
| std::array<float, NET_MIXER_OUT> SharedMoEWeights::globalB {} |
| std::array<float, (size_t)NET_MIXER_OUT * NET_GLOBALS> SharedMoEWeights::globalW {} |
| std::array<float, NET_MIXER_OUT> SharedMoEWeights::mixerB {} |
| std::array<float, (size_t)NET_BYPASS * NET_MIXER_OUT> SharedMoEWeights::mixerWBp {} |
| std::array<float, (size_t)12 * NET_MIXER_OUT * NET_BRANCH_DIM> SharedMoEWeights::mixerWBr {} |
|
static constexpr |
|
static constexpr |
|
static constexpr |
|
static constexpr |