2024-02-05 17:38:02 -08:00
|
|
|
#pragma once
|
|
|
|
|
2024-06-09 16:23:30 -04:00
|
|
|
#include <torch/all.h>
|
2024-02-05 17:38:02 -08:00
|
|
|
|
2024-05-22 03:18:41 -04:00
|
|
|
// Declaration only; the definition is not part of this header.
//
// All four tensors are taken by non-const lvalue reference and the function
// returns void, so any results are presumably delivered through the
// arguments rather than a return value.
//
// NOTE(review): judging by the names alone, this presumably applies a softmax
// to `gating_output` and writes the selected top-k weights and indices into
// `topk_weights`, `topk_indices` and `token_expert_indices`. Expected shapes,
// dtypes and devices are not visible from here -- confirm against the
// definition before relying on any of this.
void topk_softmax(torch::Tensor& topk_weights, torch::Tensor& topk_indices,
                  torch::Tensor& token_expert_indices,
                  torch::Tensor& gating_output);
|