vllm/csrc/moe/moe_ops.cpp
2024-02-05 17:38:02 -08:00

8 lines
182 B
C++

#include "moe_ops.h"
#include <torch/extension.h>
// Python extension entry point for the MoE ops.
// The module name comes from the TORCH_EXTENSION_NAME macro, which is not
// defined in this file (presumably injected by the Torch extension build).
PYBIND11_MODULE(TORCH_EXTENSION_NAME, m) {
  // Expose the native `topk_softmax` routine (presumably declared in
  // moe_ops.h) to Python under the same name, with a short docstring.
  m.def(
      "topk_softmax",
      &topk_softmax,
      "Apply topk softmax to the gating outputs.");
}