h = o*torch.tanh(c) return torch.sum(h @ W2) dim_in, dim_hidden, dim_out, batch_size = 10, 10, 10, 10 lstm_vars = [torch.randn(dim_in + 2*dim_hidden, 4*dim_hidden), torch.randn(dim_hidden, dim_out)] [W.requires_