// vllm/csrc/moe/moe_ops.h

#pragma once
#include <torch/extension.h>
/// @brief Declaration of the `topk_softmax` operator entry point.
///
/// Only the prototype is visible in this header; the definition lives
/// elsewhere. The function returns `void` and takes every tensor by non-const
/// reference, so results are presumably written into one or more of the
/// arguments — TODO confirm which ones against the implementation.
///
/// @param topk_weights         NOTE(review): by name, the per-token weights of
///                             the selected top-k experts (likely an output) —
///                             confirm shape/dtype with the kernel.
/// @param topk_indices         NOTE(review): by name, the indices of the
///                             selected top-k experts (likely an output) —
///                             confirm.
/// @param token_expert_indices NOTE(review): by name, a token-to-expert index
///                             mapping — role and layout not shown here;
///                             confirm.
/// @param gating_output        NOTE(review): by name, the gating/router scores
///                             the selection is computed from (likely an
///                             input, although passed as non-const) — confirm.
void topk_softmax(torch::Tensor& topk_weights,
                  torch::Tensor& topk_indices,
                  torch::Tensor& token_expert_indices,
                  torch::Tensor& gating_output);