// Forward declaration; the definition is not part of this view.
//
// Both arguments are passed as non-const lvalue references, so the callee is
// permitted to modify either tensor.
//
// NOTE(review): going by the names, this presumably applies a SiLU-gated
// multiply to `input` and stores the result in `out` -- confirm the exact
// semantics (and any shape/dtype requirements) against the definition.
void silu_and_mul(torch::Tensor& out, torch::Tensor& input);