Fix bug that misplaced function arguments
Signed-off-by: Mihir Kulkarni <[email protected]>
mihirk284 committed Jul 26, 2024
1 parent b3b2ce4 commit 070391c
Showing 2 changed files with 49 additions and 40 deletions.
@@ -217,8 +217,8 @@ def compute_rewards_and_crashes(self, obs_dict):
)
return compute_reward(
pos_error_vehicle_frame,
- angular_velocity,
root_quats,
+ angular_velocity,
obs_dict["crashes"],
1.0, # obs_dict["curriculum_level_multiplier"],
self.actions,
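
The hunk above is the actual bug fix: compute_reward was being called with angular_velocity before root_quats, i.e. the two tensors were swapped relative to the function's parameter order. Because both arguments are tensors, Python raises no error for the swap; the reward is simply computed from the wrong quantities. A minimal, hypothetical sketch of that failure mode (toy names and formula, not the real compute_reward):

import torch

# Toy stand-in with the argument order of the fixed call site:
# (pos_error, root_quats, angular_velocity). Illustrative only.
def compute_reward_sketch(pos_error, root_quats, angular_velocity):
    tilt = 1.0 - root_quats[..., -1].abs()  # 0 for an upright (x, y, z, w) quaternion
    return -pos_error.norm(dim=-1) - tilt - 0.1 * angular_velocity.norm(dim=-1)

pos_error = torch.zeros(2, 3)
root_quats = torch.tensor([[0.0, 0.0, 0.0, 1.0]] * 2)  # identity quaternions
ang_vel = torch.tensor([[5.0, 0.0, 0.0]] * 2)          # fast roll rate

good = compute_reward_sketch(pos_error, root_quats, ang_vel)  # correct order
bad = compute_reward_sketch(pos_error, ang_vel, root_quats)   # swapped: runs silently, wrong value
print(good, bad)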
87 changes: 48 additions & 39 deletions aerial_gym/utils/vae/VAE.py
@@ -1,6 +1,7 @@
import torch
import torch.nn as nn


class ImgDecoder(nn.Module):
def __init__(self, input_dim=1, latent_dim=64, with_logits=False):
"""
@@ -11,23 +12,31 @@ def __init__(self, input_dim=1, latent_dim=64, with_logits=False):
"""

super(ImgDecoder, self).__init__()
- print('[ImgDecoder] Starting create_model')
+ print("[ImgDecoder] Starting create_model")
self.with_logits = with_logits
self.n_channels = input_dim
self.dense = nn.Linear(latent_dim, 512)
- self.dense1 = nn.Linear(512, 9*15*128)
+ self.dense1 = nn.Linear(512, 9 * 15 * 128)
# Pytorch docs: output_padding is only used to find output shape, but does not actually add zero-padding to output
self.deconv1 = nn.ConvTranspose2d(128, 128, kernel_size=3, stride=1, padding=1)
- self.deconv2 = nn.ConvTranspose2d(128, 64, kernel_size=5, stride=2, padding=(2,2), output_padding=(0,1), dilation=1)
- self.deconv4 = nn.ConvTranspose2d(64, 32, kernel_size=6, stride=4, padding=(2,2), output_padding=(0,0), dilation=1)
- self.deconv6 = nn.ConvTranspose2d(32, 16, kernel_size=6, stride=2, padding=(0,0), output_padding=(0,1))
- self.deconv7 = nn.ConvTranspose2d(16, self.n_channels, kernel_size=4, stride=2, padding=2) # tanh activation or sigmoid
- print('[ImgDecoder] Done with create_model')
+ self.deconv2 = nn.ConvTranspose2d(
+     128, 64, kernel_size=5, stride=2, padding=(2, 2), output_padding=(0, 1), dilation=1
+ )
+ self.deconv4 = nn.ConvTranspose2d(
+     64, 32, kernel_size=6, stride=4, padding=(2, 2), output_padding=(0, 0), dilation=1
+ )
+ self.deconv6 = nn.ConvTranspose2d(
+     32, 16, kernel_size=6, stride=2, padding=(0, 0), output_padding=(0, 1)
+ )
+ self.deconv7 = nn.ConvTranspose2d(
+     16, self.n_channels, kernel_size=4, stride=2, padding=2
+ ) # tanh activation or sigmoid
+ print("[ImgDecoder] Done with create_model")
print("Defined decoder.")

def forward(self, z):
return self.decode(z)

def decode(self, z):
x = self.dense(z)
x = torch.relu(x)
@@ -55,10 +64,12 @@ def decode(self, z):
# print(f"- After sigmoid, mean: {x.mean():.3f} var: {x.var():.3f}")
return x
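
For orientation, the feature map entering this deconvolution stack is 128 channels of 9x15 (dense1 emits 9 * 15 * 128 values, presumably reshaped channels-first in the collapsed part of decode()), and each ConvTranspose2d grows it as out = (in - 1) * stride - 2 * padding + kernel_size + output_padding. Chaining the layers gives 9x15 -> 9x15 -> 17x30 -> 66x118 -> 136x241 -> 270x480, i.e. a single-channel 270x480 depth image. A standalone shape check under that reshape assumption:

import torch
import torch.nn as nn

# Shape check for the deconvolution stack above; the real decode() also applies
# activations between layers, which do not change the spatial sizes.
x = torch.randn(1, 128, 9, 15)  # assumed reshape of dense1's output
layers = [
    nn.ConvTranspose2d(128, 128, kernel_size=3, stride=1, padding=1),
    nn.ConvTranspose2d(128, 64, kernel_size=5, stride=2, padding=(2, 2), output_padding=(0, 1)),
    nn.ConvTranspose2d(64, 32, kernel_size=6, stride=4, padding=(2, 2)),
    nn.ConvTranspose2d(32, 16, kernel_size=6, stride=2, padding=(0, 0), output_padding=(0, 1)),
    nn.ConvTranspose2d(16, 1, kernel_size=4, stride=2, padding=2),
]
for layer in layers:
    x = layer(x)
    print(tuple(x.shape))  # ends at (1, 1, 270, 480)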


class ImgEncoder(nn.Module):
"""
ResNet8 architecture as encoder.
"""

def __init__(self, input_dim, latent_dim):
"""
Parameters:
@@ -74,39 +85,37 @@ def __init__(self, input_dim, latent_dim):
self.define_encoder()
self.elu = nn.ELU()
print("Defined encoder.")

def define_encoder(self):
# define conv functions
self.conv0 = nn.Conv2d(self.input_dim, 32, kernel_size=5, stride=2, padding=2)
self.conv0_1 = nn.Conv2d(32, 32, kernel_size=3, stride=2, padding=2)
- nn.init.xavier_uniform_(self.conv0_1.weight, gain=nn.init.calculate_gain('linear'))
+ nn.init.xavier_uniform_(self.conv0_1.weight, gain=nn.init.calculate_gain("linear"))
nn.init.zeros_(self.conv0_1.bias)



self.conv1_0 = nn.Conv2d(32, 32, kernel_size=5, stride=2, padding=1)
self.conv1_1 = nn.Conv2d(32, 64, kernel_size=3, stride=1, padding=1)
- nn.init.xavier_uniform_(self.conv1_1.weight, gain=nn.init.calculate_gain('linear'))
+ nn.init.xavier_uniform_(self.conv1_1.weight, gain=nn.init.calculate_gain("linear"))
nn.init.zeros_(self.conv1_1.bias)

self.conv2_0 = nn.Conv2d(64, 64, kernel_size=5, stride=2, padding=2)
self.conv2_1 = nn.Conv2d(64, 128, kernel_size=3, stride=2, padding=1)
- nn.init.xavier_uniform_(self.conv2_1.weight, gain=nn.init.calculate_gain('linear'))
+ nn.init.xavier_uniform_(self.conv2_1.weight, gain=nn.init.calculate_gain("linear"))
nn.init.zeros_(self.conv2_1.bias)

self.conv3_0 = nn.Conv2d(128, 128, kernel_size=5, stride=2)


self.conv0_jump_2 = nn.Conv2d(32, 64, kernel_size=4, stride=2, padding=1)
self.conv1_jump_3 = nn.Conv2d(64, 128, kernel_size=5, stride=4, padding=(2, 1))
- self.dense0 = nn.Linear(3*6*128, 512)
- self.dense1 = nn.Linear(512, 2*self.latent_dim)

+ self.dense0 = nn.Linear(3 * 6 * 128, 512)
+ self.dense1 = nn.Linear(512, 2 * self.latent_dim)

print("Encoder network initialized.")

def forward(self, img):
return self.encode(img)

def encode(self, img):
"""
Encodes the input image.
@@ -144,21 +153,22 @@ def encode(self, img):
x = self.dense1(x)
return x
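
The encoder's main path mirrors that arithmetic in reverse: each Conv2d shrinks its input as out = floor((in + 2 * padding - kernel_size) / stride) + 1, so a 1x270x480 depth image goes 135x240 -> 69x121 -> 34x60 -> 34x60 -> 17x30 -> 9x15 -> 3x6, exactly the 3 * 6 * 128 features flattened into dense0. A sketch of that check; the skip convolutions conv0_jump_2 and conv1_jump_3 are omitted on the assumption that the collapsed encode() body merges them into the main path without changing the final shape:

import torch
import torch.nn as nn

# Main-path shape check for the encoder defined above.
x = torch.randn(1, 1, 270, 480)  # depth-image resolution implied by the layer arithmetic
layers = [
    nn.Conv2d(1, 32, kernel_size=5, stride=2, padding=2),    # conv0
    nn.Conv2d(32, 32, kernel_size=3, stride=2, padding=2),   # conv0_1
    nn.Conv2d(32, 32, kernel_size=5, stride=2, padding=1),   # conv1_0
    nn.Conv2d(32, 64, kernel_size=3, stride=1, padding=1),   # conv1_1
    nn.Conv2d(64, 64, kernel_size=5, stride=2, padding=2),   # conv2_0
    nn.Conv2d(64, 128, kernel_size=3, stride=2, padding=1),  # conv2_1
    nn.Conv2d(128, 128, kernel_size=5, stride=2),            # conv3_0
]
for layer in layers:
    x = layer(x)
print(tuple(x.shape))  # (1, 128, 3, 6) -> flattened to 3 * 6 * 128 for dense0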


class Lambda(nn.Module):
"""Lambda function that accepts tensors as input."""

def __init__(self, func):
super(Lambda, self).__init__()
self.func = func

def forward(self, x):
return self.func(x)


class VAE(nn.Module):
"""Variational Autoencoder for reconstruction of depth images."""

- def __init__(self, input_dim=1, latent_dim=64, with_logits=False, inference_mode = False):
+ def __init__(self, input_dim=1, latent_dim=64, with_logits=False, inference_mode=False):
"""
Parameters
----------
@@ -169,26 +179,27 @@ def __init__(self, input_dim=1, latent_dim=64, with_logits=False, inference_mode
"""

super(VAE, self).__init__()

self.with_logits = with_logits
self.input_dim = input_dim
self.latent_dim = latent_dim
self.inference_mode = inference_mode
self.encoder = ImgEncoder(input_dim=self.input_dim, latent_dim=self.latent_dim)
- self.img_decoder = ImgDecoder(input_dim=1, latent_dim=self.latent_dim, with_logits=self.with_logits)

- self.mean_params = Lambda(lambda x: x[:, :self.latent_dim]) # mean parameters
- self.logvar_params = Lambda(lambda x: x[:, self.latent_dim:]) # log variance parameters

+ self.img_decoder = ImgDecoder(
+     input_dim=1, latent_dim=self.latent_dim, with_logits=self.with_logits
+ )

+ self.mean_params = Lambda(lambda x: x[:, : self.latent_dim]) # mean parameters
+ self.logvar_params = Lambda(lambda x: x[:, self.latent_dim :]) # log variance parameters

def forward(self, img):
""" Do a forward pass of the VAE. Generates a reconstructed image based on img
"""Do a forward pass of the VAE. Generates a reconstructed image based on img
Parameters
----------
img: torch.Tensor
The input image.
"""

# encode
z = self.encoder(img)

@@ -206,13 +217,13 @@ def forward(self, img):
return img_recon, mean, logvar, z_sampled

def forward_test(self, img):
""" Do a forward pass of the VAE. Generates a reconstructed image based on img
"""Do a forward pass of the VAE. Generates a reconstructed image based on img
Parameters
----------
img: torch.Tensor
The input image.
"""

# encode
z = self.encoder(img)

@@ -229,16 +240,15 @@ def forward_test(self, img):
img_recon = self.img_decoder(z_sampled)
return img_recon, mean, logvar, z_sampled


def encode(self, img):
""" Do a forward pass of the VAE. Generates a latent vector based on img
"""Do a forward pass of the VAE. Generates a latent vector based on img
Parameters
----------
img: torch.Tensor
The input image.
"""
z = self.encoder(img)

means = self.mean_params(z)
logvars = self.logvar_params(z)
std = torch.exp(0.5 * logvars)
@@ -248,10 +258,9 @@ def encode(self, img):
z_sampled = means + eps * std

return z_sampled, means, std
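
This is the standard reparameterization trick: the second half of the encoder output (logvar_params) is treated as the log-variance, and the latent is drawn as z = mean + eps * std, with eps presumably sampled from a standard normal in the collapsed lines. Writing the sample this way keeps it differentiable with respect to the mean and log-variance. A self-contained sketch:

import torch

# Reparameterization in isolation: sampling z ~ N(mean, std^2) as mean + eps * std
# keeps the computation differentiable w.r.t. means and logvars.
means = torch.zeros(4, 64, requires_grad=True)
logvars = torch.zeros(4, 64, requires_grad=True)
std = torch.exp(0.5 * logvars)
eps = torch.randn_like(std)   # assumption: how eps is produced in the hidden lines
z_sampled = means + eps * std
z_sampled.sum().backward()    # gradients reach both means and logvars
print(means.grad.shape, logvars.grad.shape)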


def decode(self, z):
""" Do a forward pass of the VAE. Generates a reconstructed image based on z
"""Do a forward pass of the VAE. Generates a reconstructed image based on z
Parameters
----------
z: torch.Tensor
@@ -261,6 +270,6 @@ def decode(self, z):
if self.with_logits:
return torch.sigmoid(img_recon)
return img_recon

def set_inference_mode(self, mode):
self.inference_mode = mode
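
Taken together, a minimal usage sketch of the reformatted module. The 270x480 resolution, the tensor layout, and the import path are inferred from the diff above rather than stated in it, so treat this as an assumption-laden sketch, not documented API:

import torch
from aerial_gym.utils.vae.VAE import VAE  # module path inferred from the file path in this diff

vae = VAE(input_dim=1, latent_dim=64, with_logits=False)
depth = torch.rand(8, 1, 270, 480)  # hypothetical batch of depth images

img_recon, mean, logvar, z_sampled = vae(depth)  # training-style forward pass
print(img_recon.shape, z_sampled.shape)          # expected: (8, 1, 270, 480) and (8, 64)

vae.set_inference_mode(True)  # presumably disables sampling noise, judging by the flag name
z, means, std = vae.encode(depth)
recon = vae.decode(z)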
