added rnn

2026-06-27 17:33:07 +08:00 · 2018-04-03 23:48:51 -04:00
parent e6e88c5006
commit 076e45cac0
6 changed files with 56 additions and 0 deletions
@@ -0,0 +1,53 @@
+import torch.nn as nn
+from torch import normal, multinomial
+
+
+
+class MDNRNN(nn.Module):
+    def __init__(self, z_dim, action_dim, hidden_size, n_mixture, temperature):
+        """
+            :param z_dim: the dimension of VAE latent variable
+            :param hidden_size: hidden size of RNN
+            :param n_mixture: number of Gaussian Mixture Models to be used
+            :param temperature: controls the randomness of the model
+
+            MDNRNN stands for Mixture Density Network - RNN.
+            The output of this model is [mean, sigma^2, K],
+            where mean and sigma^2 have z_dim * n_mixture elements and
+            K has n_mixture elements.
+        """
+        super(MDNRNN, self).__init__()
+        # define rnn
+        self.inpt_size = z_dim + action_dim
+        self.rnn = nn.LSTM(input_size=self.inpt_size, hidden_size=hidden_size, batch_first=True)
+
+        # define MDN as fully connected layer
+        self.mdn = nn.Linear(hidden_size, n_mixture * z_dim * 2 + n_mixture)
+        self.tau = temperature
+
+    def forward(self, inpt, hidden_state, action):
+        """
+        :param inpt: a tensor of size (batch_size, seq_len, D)
+        :param hidden_state: two tensors of size (1, batch_size, hidden_size)
+        :param action: a tensor of (batch_size, seq_len, D*)
+        :return: pi, mean, sigma, hidden_state
+        """
+        # TODO: Add forward function
+        return
+
+    def sample(self, inpt, hidden_state, action):
+        """
+        parameters same as forward
+        :return:
+        """
+        # forward and get pi, mean. sigma, hidden_state
+        pi, mean, sigma, hidden_state = self.forward(inpt, hidden_state, action)
+
+        # randomly draw a mixture model
+        k = multinomial(pi, 1)
+        selected_mean = mean[..., k]
+        selected_sigma = sigma[..., k]
+
+        # sample from normal dist
+        z = normal(selected_mean, selected_sigma)
+        return z, hidden_state