vllm/csrc/moe/moe_ops.cpp

8 lines
182 B
C++
Raw Normal View History

#include "moe_ops.h"
#include <torch/extension.h>
// Python extension entry point: exposes the C++ function `topk_softmax`
// (presumably declared in moe_ops.h -- confirm) on module `m` under the
// Python name "topk_softmax".
PYBIND11_MODULE(TORCH_EXTENSION_NAME, m) {
  // Docstring attached to the Python-visible binding.
  const char* const topk_softmax_doc =
      "Apply topk softmax to the gating outputs.";

  m.def("topk_softmax", &topk_softmax, topk_softmax_doc);
}