databricks · rithwik-db · Jul 30, 2025 · Jul 28, 2025 · Jul 29, 2025 · Jul 29, 2025
@@ -70,11 +70,6 @@ repos:
     - "#"
     - --allow-past-years
     types: [python]
-- repo: https://github.com/PyCQA/docformatter
-  rev: v1.5.0
-  hooks:
-  - id: docformatter
-    args: [--in-place, --wrap-summaries=80, --wrap-descriptions=80]
 - repo: https://github.com/PyCQA/pydocstyle
   hooks:
   - id: pydocstyle

@@ -247,7 +247,11 @@ def policy_loss(
             logits=gen_logits,
         )
         assert token_entropies.shape == batch['action_mask'].shape, (
-            f'Token entropies shape {token_entropies.shape} does not match action mask shape {batch["action_mask"].shape}.',
+            'Token entropies shape {token_entropies_shape} does not match action mask shape {action_mask_shape}.'
+            .format(
+                token_entropies_shape=token_entropies.shape,
+                action_mask_shape=batch['action_mask'].shape,
+            ),
         )
         seq_entropies = utils.get_sequence_entropies(
             token_entropies=token_entropies,

@@ -329,7 +329,7 @@ def forward(
                 batch['input_ids'],
                 attention_mask=batch['attention_mask'],
             ).logits
-            logits = logits[:, :, self.eos_token_id]
+            logits = logits[:, :, self.eos_token_id]  # type: ignore
             if self.min_threshold is not None and self.max_threshold is not None:
                 logits: torch.Tensor = torch.clamp(
                     logits,