// Forward declaration of the `silu_and_mul` operation; the definition is not
// part of this view.
//
// The function returns void and receives both tensors by non-const reference.
//
// NOTE(review): going by the names alone, this presumably applies the SiLU
// activation to one portion of `input`, multiplies it element-wise with
// another portion, and stores the result in `out`. Confirm against the
// definition, including the expected shapes/dtypes/devices of both tensors
// and whether `input` is ever modified (it is not declared const here).
void silu_and_mul( torch::Tensor& out, torch::Tensor& input);