| void matmul_persistent_cuda( | |
| torch::Tensor const &a, | |
| torch::Tensor const &b, | |
| torch::Tensor &c, | |
| torch::Tensor const &bias); | |
| void log_softmax_cuda( | |
| torch::Tensor const &input, | |
| torch::Tensor &output); | |
| void mean_dim_cuda( | |
| torch::Tensor const &input, | |
| torch::Tensor &output, | |
| int dim); |