
Commit 3d65a96

Fix linting errors
1 parent 1702008 commit 3d65a96

File tree

7 files changed: +103 −59 lines


sparse_attention_hub/metric_logging/__init__.py

Lines changed: 1 addition & 1 deletion
@@ -2,4 +2,4 @@
 
 from .logger import MicroMetricLogger
 
-__all__ = ["MicroMetricLogger"]
+__all__ = ["MicroMetricLogger"]
sparse_attention_hub/metric_logging/logger.py

Lines changed: 47 additions & 38 deletions
@@ -1,18 +1,19 @@
 """MicroMetricLogger implementation for sparse attention hub."""
 
+import inspect
 import json
 import os
 import time
 from collections import deque
-from dataclasses import dataclass, asdict
+from dataclasses import asdict, dataclass
 from datetime import datetime
 from typing import Any, Dict, List, Optional, Union
-import inspect
 
 
 @dataclass
 class LogEvent:
     """Log event data structure."""
+
     timestamp: datetime
     metric: str  # Metric identifier string
     value: Union[None, Any]
@@ -25,7 +26,7 @@ class MicroMetricLogger:
 
     _instance: Optional["MicroMetricLogger"] = None
     _initialized: bool = False
-
+
     # Class-level storage for registered metrics (works without initialization)
     _registered_metrics: Dict[str, type] = {}  # identifier -> dtype mapping
 
@@ -34,34 +35,36 @@ def __new__(cls, *args, **kwargs) -> "MicroMetricLogger":
         cls._instance = super().__new__(cls)
         return cls._instance
 
-    def __init__(self,
-                 log_path: Optional[str] = None,
-                 flush_every: int = 1000,  # Flush every N events
-                 flush_interval: float = 60.0,  # Flush every N seconds
-                 enabled_metrics: Union[List[str], str] = None):  # List of string identifiers to enable, or "all"
+    def __init__(
+        self,
+        log_path: Optional[str] = None,
+        flush_every: int = 1000,  # Flush every N events
+        flush_interval: float = 60.0,  # Flush every N seconds
+        enabled_metrics: Union[List[str], str] = None,
+    ):  # List of string identifiers to enable, or "all"
         if not self._initialized:
             self.log_path = log_path
             self.flush_every = flush_every
             self.flush_interval = flush_interval
-
+
             # Internal state
             self.log_queue: deque = deque(maxlen=10000)  # Circular buffer
             self.enabled_metrics: set = set()
             self.last_flush_time = time.time()
-
+
             # Enable metrics if log_path is provided
             if self.log_path is not None:
                 self._ensure_log_directory()
                 self.enable_metrics(enabled_metrics)
-
+
             MicroMetricLogger._initialized = True
 
     # main registration function
 
     @classmethod
     def register_metric(cls, identifier: str, dtype: type) -> None:
         """Register a metric with its string identifier and expected data type.
-
+
         This works at class level and doesn't require initialization.
         """
         if identifier in cls._registered_metrics:
@@ -73,7 +76,6 @@ def get_registered_metrics(cls) -> Dict[str, type]:
         """Get all registered metrics at class level."""
         return cls._registered_metrics.copy()
 
-
     # helper methods
 
     def _ensure_log_directory(self) -> None:
@@ -88,19 +90,19 @@ def _get_calling_location(self) -> str:
         caller_frame = inspect.currentframe().f_back.f_back
         if caller_frame is None:
             return "unknown"
-
+
         # Get module name
         module = inspect.getmodule(caller_frame)
         module_name = module.__name__ if module else "unknown"
-
+
         # Get function/class name
         function_name = caller_frame.f_code.co_name
-
+
         # Try to get class name if it's a method
         class_name = None
-        if 'self' in caller_frame.f_locals:
-            class_name = caller_frame.f_locals['self'].__class__.__name__
-
+        if "self" in caller_frame.f_locals:
+            class_name = caller_frame.f_locals["self"].__class__.__name__
+
         if class_name:
             return f"{module_name}.{class_name}.{function_name}"
         else:
@@ -110,14 +112,13 @@ def _get_calling_location(self) -> str:
 
     def __del__(self):
         """Cleanup when logger is destroyed."""
-        self.flush() # Final flush
-
+        self.flush()  # Final flush
 
-    # api
+    # api
 
     def enable_metrics(self, metrics: Union[List[str], str] = None) -> None:
         """Enable logging for specific metrics.
-
+
         Args:
             metrics: List of metric identifiers to enable, or "all" for all registered metrics.
                      If None, enables no metrics (empty list).
@@ -129,46 +130,54 @@ def enable_metrics(self, metrics: Union[List[str], str] = None) -> None:
             valid_metrics = set(metrics) & set(self._registered_metrics.keys())
            invalid_metrics = set(metrics) - set(self._registered_metrics.keys())
             if invalid_metrics:
-                print(f"Warning: Attempting to enable unregistered metrics: {invalid_metrics}")
+                print(
+                    f"Warning: Attempting to enable unregistered metrics: {invalid_metrics}"
+                )
             self.enabled_metrics = valid_metrics
         else:
             # Default to empty set
             self.enabled_metrics = set()
 
     def log(self, identifier: str, value: Any, metadata: Dict[str, Any] = None) -> None:
         """Log a metric value with optional metadata. Location is auto-inferred.
-
+
         This only works if log_path is defined.
         """
         # Check if logging is configured
         if self.log_path is None:
-            print(f"Warning: Cannot log metric '{identifier}' - log_path not defined. Use configure_logging() first.")
+            print(
+                f"Warning: Cannot log metric '{identifier}' - log_path not defined. Use configure_logging() first."
+            )
             return
-
+
         # Check if metric is enabled
         if identifier not in self.enabled_metrics:
-            print(f"Warning: Attempting to log metric '{identifier}' which is not enabled")
+            print(
+                f"Warning: Attempting to log metric '{identifier}' which is not enabled"
+            )
            return
-
+
         # Create log event
         event = LogEvent(
             timestamp=datetime.now(),
             metric=identifier,
             value=value,
             metadata=metadata or {},
-            location=self._get_calling_location()
+            location=self._get_calling_location(),
         )
-
+
         # Add to queue
         self.log_queue.append(event)
-
+
         # Check if we should flush
         if len(self.log_queue) >= self.flush_every:
             self.flush()
 
-    def configure_logging(self, log_path: str, enabled_metrics: Union[List[str], str] = None) -> None:
+    def configure_logging(
+        self, log_path: str, enabled_metrics: Union[List[str], str] = None
+    ) -> None:
         """Configure logging with a log path and optionally enable metrics.
-
+
         This must be called before logging can work.
         """
         self.log_path = log_path
@@ -179,11 +188,11 @@ def flush(self) -> None:
         """Force flush the current queue to disk."""
         if not self.log_queue or self.log_path is None:
             return
-
+
         # Get current timestamp for filename
         filename = f"micro_metrics.jsonl"
         filepath = os.path.join(self.log_path, filename)
-
+
         # Write events to file
         with open(filepath, "a", encoding="utf-8") as f:
             while self.log_queue:
@@ -193,7 +202,7 @@ def flush(self) -> None:
                 # Convert datetime to ISO format string
                 event_dict["timestamp"] = event_dict["timestamp"].isoformat()
                 f.write(json.dumps(event_dict) + "\n")
-
+
         self.last_flush_time = time.time()
 
     def is_metric_enabled(self, identifier: str) -> bool:
@@ -206,4 +215,4 @@ def get_enabled_metrics(self) -> set:
 
     def is_logging_configured(self) -> bool:
         """Check if logging is configured (log_path is set)."""
-        return self.log_path is not None
+        return self.log_path is not None
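For orientation, here is a minimal usage sketch of the MicroMetricLogger API that this commit reformats. Only methods visible in the diff are used; the log directory and the metric name "demo_metric" are invented for illustration and are not part of the repository.

# Hedged usage sketch -- "demo_metric" and the /tmp path are illustrative only.
from sparse_attention_hub.metric_logging import MicroMetricLogger

# Registration is a classmethod and works before any instance is configured.
MicroMetricLogger.register_metric("demo_metric", float)

logger = MicroMetricLogger()  # singleton: later constructions return the same object
# Per the docstring, configure_logging sets log_path and can optionally enable metrics.
logger.configure_logging("/tmp/micro_metric_logs", enabled_metrics="all")

if logger.is_metric_enabled("demo_metric"):
    # The calling location (module.Class.function) is inferred inside log().
    logger.log("demo_metric", 0.42, metadata={"layer_idx": 0})

logger.flush()  # appends JSON lines to <log_path>/micro_metrics.jsonl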

sparse_attention_hub/sparse_attention/research_attention/base.py

Lines changed: 31 additions & 7 deletions
@@ -6,16 +6,21 @@
 import torch
 from torch import nn
 
+from sparse_attention_hub.metric_logging.logger import MicroMetricLogger
+
 from ..base import SparseAttention, SparseAttentionConfig
 from ..utils.mask import Mask
-from ..utils.mask_attention_utils import get_masked_attention_output, get_true_attention_output
+from ..utils.mask_attention_utils import (
+    get_masked_attention_output,
+    get_true_attention_output,
+)
 from .maskers.base import MaskerConfig, ResearchMasker
 from .maskers.sampling.base import SamplingMasker
 
-from sparse_attention_hub.metric_logging.logger import MicroMetricLogger
 MicroMetricLogger.register_metric("research_attention_density", float)
 MicroMetricLogger.register_metric("research_attention_output_error", float)
 
+
 @dataclass
 class ResearchAttentionConfig(SparseAttentionConfig):
     """Configuration class for research attention mechanisms."""
@@ -104,9 +109,13 @@ def custom_attention(
             previous_mask=sparse_attention_mask,
             **kwargs,
         )
-
+
         if MicroMetricLogger().is_metric_enabled("research_attention_density"):
-            MicroMetricLogger().log("research_attention_density", sparse_attention_mask.get_density(), metadata={"layer_idx" : kwargs["layer_idx"]})
+            MicroMetricLogger().log(
+                "research_attention_density",
+                sparse_attention_mask.get_density(),
+                metadata={"layer_idx": kwargs["layer_idx"]},
+            )
 
         # Call compute_masked_attention_output on the result of the last mask
         # Always request attention weights to match the expected return signature
@@ -126,9 +135,24 @@ def custom_attention(
         )
 
         if MicroMetricLogger().is_metric_enabled("research_attention_output_error"):
-            true_attention_output, _ = get_true_attention_output(module, queries, keys, values, attention_mask, scaling, dropout, **kwargs)
-            error = torch.norm(true_attention_output - attention_output) / torch.norm(true_attention_output)
-            MicroMetricLogger().log("research_attention_output_error", float(error.item()), metadata={"layer_idx" : kwargs["layer_idx"]})
+            true_attention_output, _ = get_true_attention_output(
+                module,
+                queries,
+                keys,
+                values,
+                attention_mask,
+                scaling,
+                dropout,
+                **kwargs,
+            )
+            error = torch.norm(true_attention_output - attention_output) / torch.norm(
+                true_attention_output
+            )
+            MicroMetricLogger().log(
+                "research_attention_output_error",
+                float(error.item()),
+                metadata={"layer_idx": kwargs["layer_idx"]},
+            )
 
         return attention_output, attention_weights
 
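The research_attention_output_error metric gated above is a relative Frobenius-norm error between the dense ("true") attention output and the sparse approximation. A self-contained sketch of that formula, using made-up tensors rather than anything from the repository:

import torch

# Illustrative shapes only: (batch, heads, seq_len, head_dim).
true_out = torch.randn(1, 8, 128, 64)
approx_out = true_out + 0.01 * torch.randn_like(true_out)  # stand-in for the sparse output

# Same expression as in custom_attention: ||true - approx|| / ||true||.
error = torch.norm(true_out - approx_out) / torch.norm(true_out)
print(float(error.item()))  # this scalar is what gets passed to MicroMetricLogger().log(...)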

sparse_attention_hub/sparse_attention/research_attention/maskers/sampling/implementations/magic_pig.py

Lines changed: 0 additions & 1 deletion
@@ -19,7 +19,6 @@
     _get_num_key_value_groups,
     repeat_kv,
 )
-
 from sparse_attention_hub.sparse_attention.utils.mask import Mask
 
 from ..base import SamplingMasker, SamplingMaskerConfig

sparse_attention_hub/sparse_attention/utils/mask.py

Lines changed: 1 addition & 1 deletion
@@ -656,4 +656,4 @@ def get_density(self) -> float:
         elif self.from_index:
             return float(len(self.indices)) / float(np.prod(self.shape))
         else:
-            raise RuntimeError("Mask object is in an invalid state")
+            raise RuntimeError("Mask object is in an invalid state")

sparse_attention_hub/sparse_attention/utils/mask_attention_utils.py

Lines changed: 7 additions & 3 deletions
@@ -45,13 +45,17 @@ def get_true_attention_output(
         causal_mask = attention_mask[:, :, :, : key_states.shape[-2]]
         attn_weights = attn_weights + causal_mask
 
-    attn_weights = nn.functional.softmax(attn_weights, dim=-1, dtype=torch.float32).to(queries.dtype)
-    attn_weights = nn.functional.dropout(attn_weights, p=dropout, training=module.training)
+    attn_weights = nn.functional.softmax(attn_weights, dim=-1, dtype=torch.float32).to(
+        queries.dtype
+    )
+    attn_weights = nn.functional.dropout(
+        attn_weights, p=dropout, training=module.training
+    )
     attn_output = torch.matmul(attn_weights, value_states)
     attn_output = attn_output.transpose(1, 2).contiguous()
 
     return attn_output, attn_weights
-
+
 
 
 def apply_inv_mask_sum(input_tensor: torch.Tensor, mask: Mask) -> torch.Tensor:
     """Apply inverse mask to input tensor and sum along the last dimension.
