Embodied-CoT
/

ecot-openvla-7b-bridge

feature-extraction

Model card · Files and versions · Community

verityw committed on Jul 11, 2024

Commit

be477d4

·

1 Parent(s): 31c5444

update action inference code

Files changed (1) hide show

modeling_prismatic.py +6 -5

modeling_prismatic.py CHANGED Viewed

@@ -510,12 +510,13 @@ class OpenVLAForActionPrediction(PrismaticForConditionalGeneration):
         # We need to add this special empty token ('') after the colon (':') token in "ASSISTANT:"
         # in order for the predictions to match the training configuration and be accurate.
-        input_ids = torch.cat(
-            (input_ids, torch.unsqueeze(torch.Tensor([29871]).long(), dim=0).to(input_ids.device)), dim=1
-        )
         # Run VLA inference
-        generated_ids = self.generate(input_ids, max_new_tokens=self.get_action_dim(unnorm_key), **kwargs)
         # Extract predicted action tokens and translate into (normalized) continuous actions
         predicted_action_token_ids = generated_ids[0, -self.get_action_dim(unnorm_key) :].cpu().numpy()
@@ -533,7 +534,7 @@ class OpenVLAForActionPrediction(PrismaticForConditionalGeneration):
             normalized_actions,
         )
-        return actions
     @staticmethod
     def _check_unnorm_key(norm_stats: Dict[str, Dict[str, Any]], unnorm_key: Optional[str]) -> str:

         # We need to add this special empty token ('') after the colon (':') token in "ASSISTANT:"
         # in order for the predictions to match the training configuration and be accurate.
+        # NOTE: This is NOT needed for ECoT
+        # input_ids = torch.cat(
+        #     (input_ids, torch.unsqueeze(torch.Tensor([29871]).long(), dim=0).to(input_ids.device)), dim=1
+        # )
         # Run VLA inference
+        generated_ids = self.generate(input_ids, **kwargs)
         # Extract predicted action tokens and translate into (normalized) continuous actions
         predicted_action_token_ids = generated_ids[0, -self.get_action_dim(unnorm_key) :].cpu().numpy()
             normalized_actions,
         )
+        return actions, generated_ids
     @staticmethod
     def _check_unnorm_key(norm_stats: Dict[str, Dict[str, Any]], unnorm_key: Optional[str]) -> str: