| backbone_weights() const | MoEDoubleAccumulator | inline |
| bd | MoEDoubleAccumulator | static |
| branch_forward(int b, const float *in_planes, float *out) | MoEDoubleAccumulator | inline |
| branch_forward_bd16_fast(const Branch &br, const float *HOT_RESTRICT in_planes, float *HOT_RESTRICT out, float *HOT_RESTRICT mid_plane, float *HOT_RESTRICT l1_accum) | MoEDoubleAccumulator | inline |
| branch_forward_with_scratch(int b, const float *in_planes, float *out, float *scratch0, float *scratch1) | MoEDoubleAccumulator | inline |
| branchCache | MoEDoubleAccumulator | |
| branchConvLayers | MoEDoubleAccumulator | |
| copy_weights_from(const MoEDoubleAccumulator &src) | MoEDoubleAccumulator | inline |
| denseDirtySqThreshold | MoEDoubleAccumulator | |
| ebo | MoEDoubleAccumulator | static |
| eh | MoEDoubleAccumulator | static |
| exGapCache | MoEDoubleAccumulator | |
| expertPoolMode | MoEDoubleAccumulator | |
| experts_total_weights() const | MoEDoubleAccumulator | inline |
| exPool16Cache | MoEDoubleAccumulator | |
| exPreAccum | MoEDoubleAccumulator | |
| exReluCache | MoEDoubleAccumulator | |
| exValid | MoEDoubleAccumulator | |
| fill_random(unsigned seed) | MoEDoubleAccumulator | inline |
| full_rebuild_accumulators(const FactorizedInput &inp, const int *active_experts, int active_count) | MoEDoubleAccumulator | inline |
| global_proj_at(int oc, const float *g) const | MoEDoubleAccumulator | inline |
| hiddenAcc | MoEDoubleAccumulator | |
| init(const SharedMoEWeights *shared, const BenchConfig &cfg) | MoEDoubleAccumulator | inline |
| init(const BenchConfig &cfg) | MoEDoubleAccumulator | inline |
| initialized | MoEDoubleAccumulator | |
| minParallelActiveExperts | MoEDoubleAccumulator | |
| minParallelDirtyHeads | MoEDoubleAccumulator | |
| mixerLinearAccum | MoEDoubleAccumulator | |
| mixerReluCache | MoEDoubleAccumulator | |
| mutable_owned_weights() | MoEDoubleAccumulator | inline |
| nBypass | MoEDoubleAccumulator | static |
| nExperts | MoEDoubleAccumulator | static |
| nf | MoEDoubleAccumulator | static |
| nGlobals | MoEDoubleAccumulator | static |
| nThreads | MoEDoubleAccumulator | |
| oldGlobalV | MoEDoubleAccumulator | |
| ownedWeights | MoEDoubleAccumulator | |
| parallel_for_indices(int n, int min_parallel_n, Fn &&fn) | MoEDoubleAccumulator | inline |
| parallel_for_indices(int n, Fn &&fn) | MoEDoubleAccumulator | inline |
| profile | MoEDoubleAccumulator | |
| rebuild_expert_cache_from_mixer(int e) | MoEDoubleAccumulator | inline |
| rebuild_hidden_acc_from_flat(int e) | MoEDoubleAccumulator | inline |
| rebuild_hidden_acc_from_gap(int e) | MoEDoubleAccumulator | inline |
| rebuild_hidden_acc_from_pool2x2(int e, bool max_pool) | MoEDoubleAccumulator | inline |
| reset_profile() | MoEDoubleAccumulator | inline |
| reset_runtime_state() | MoEDoubleAccumulator | inline |
| routeSlowGlobals | MoEDoubleAccumulator | |
| run_active_expert(int e, float out_wdl[3]) | MoEDoubleAccumulator | inline |
| run_top2_experts(int e0, int e1, float w0, float w1, float out_wdl[3]) | MoEDoubleAccumulator | inline |
| runtime_topk_weights(int topk) const | MoEDoubleAccumulator | inline |
| scratchBranchDelta | MoEDoubleAccumulator | |
| scratchBypassDelta | MoEDoubleAccumulator | |
| scratchDeltaRelu | MoEDoubleAccumulator | |
| scratchDirtyBranches | MoEDoubleAccumulator | |
| scratchFlatDelta | MoEDoubleAccumulator | |
| scratchGproj | MoEDoubleAccumulator | |
| scratchHidden | MoEDoubleAccumulator | |
| scratchNewBranch | MoEDoubleAccumulator | |
| scratchParallelBranch0 | MoEDoubleAccumulator | |
| scratchParallelBranch1 | MoEDoubleAccumulator | |
| scratchParallelExpertDelta | MoEDoubleAccumulator | |
| scratchT0 | MoEDoubleAccumulator | |
| scratchT1 | MoEDoubleAccumulator | |
| shared_weights() const | MoEDoubleAccumulator | inline |
| single_expert_weights() const | MoEDoubleAccumulator | inline |
| threadPool | MoEDoubleAccumulator | |
| top2_experts(const float *global, int &e0, int &e1, float &w0, float &w1) const | MoEDoubleAccumulator | inline |
| total_weights() const | MoEDoubleAccumulator | inline |
| update_incremental(const FactorizedInput &cur, const FactorizedInput &prev, const int *dirty_branches, int dirty_count, const int *active_experts, int active_count) | MoEDoubleAccumulator | inline |
| validate_fixed_architecture(const BenchConfig &cfg) | MoEDoubleAccumulator | inline static |
| weights | MoEDoubleAccumulator | |