"""
Input processor module for the UMAF Capability Extractor.
This module handles preprocessing of model activation inputs.
"""
from typing import Optional, Union, Dict, Any
import torch
import torch.nn as nn
import torch.nn.functional as F

class InputProcessor:
    """
    Processes and normalizes model activation inputs.

    Handles diverse model activation inputs; normalizes and preprocesses
    activation tensors.
    """

    def __init__(
        self,
        max_length: int = 128,
        normalization: Optional[str] = 'layer',
        pad_value: float = 0.0,
        device: Optional[torch.device] = None
    ):
        """
        Initialize input processor.

        Args:
            max_length (int): Maximum sequence length
            normalization (Optional[str]): Normalization method
                ('mean', 'l2', 'layer', or None)
            pad_value (float): Value to use for padding
            device (Optional[torch.device]): Device to use for processing
        """
        self.max_length = max_length
        self.normalization = normalization
        self.pad_value = pad_value
        self.device = device or torch.device('cuda' if torch.cuda.is_available() else 'cpu')

        # Layer normalization is created lazily in _normalize() once the
        # input's hidden dimension is known.
        self.layer_norm: Optional[nn.LayerNorm] = None
    def process(self, activations: Union[torch.Tensor, Dict[str, Any]]) -> torch.Tensor:
        """
        Process activation tensors.

        Args:
            activations (Union[torch.Tensor, Dict[str, Any]]): Model activations
                - If torch.Tensor: expected shape [batch_size, sequence_length, hidden_size]
                - If Dict: expected to contain 'last_hidden_state' or 'hidden_states'

        Returns:
            torch.Tensor: Processed activations
        """
        # Extract the tensor from a dictionary if needed
        if isinstance(activations, dict):
            if 'last_hidden_state' in activations:
                activations = activations['last_hidden_state']
            elif 'hidden_states' in activations:
                # Use the last layer's hidden states
                activations = activations['hidden_states'][-1]
            else:
                raise ValueError(
                    "Input dictionary must contain 'last_hidden_state' or 'hidden_states'"
                )

        # Convert array-like inputs (e.g. numpy arrays) to torch tensors
        if not isinstance(activations, torch.Tensor):
            activations = torch.tensor(activations, device=self.device)

        # Move to the target device
        activations = activations.to(self.device)

        # Pad or truncate to max_length
        activations = self._handle_sequence_length(activations)

        # Apply the configured normalization
        activations = self._normalize(activations)

        return activations
    def _handle_sequence_length(self, activations: torch.Tensor) -> torch.Tensor:
        """
        Handle sequence length by padding or truncating.

        Args:
            activations (torch.Tensor): Activation tensor
                [batch_size, sequence_length, hidden_size]

        Returns:
            torch.Tensor: Tensor with adjusted sequence length
        """
        batch_size, seq_len, hidden_size = activations.shape

        if seq_len > self.max_length:
            # Truncate
            return activations[:, :self.max_length, :]
        elif seq_len < self.max_length:
            # Pad with pad_value along the sequence dimension
            padding = torch.full(
                (batch_size, self.max_length - seq_len, hidden_size),
                self.pad_value,
                dtype=activations.dtype,
                device=activations.device
            )
            return torch.cat([activations, padding], dim=1)
        else:
            # No adjustment needed
            return activations
    def _normalize(self, activations: torch.Tensor) -> torch.Tensor:
        """
        Apply normalization to activations.

        Args:
            activations (torch.Tensor): Activation tensor
                [batch_size, sequence_length, hidden_size]

        Returns:
            torch.Tensor: Normalized activations
        """
        if self.normalization is None:
            return activations

        if self.normalization == 'mean':
            # Mean subtraction along the hidden dimension
            mean = activations.mean(dim=-1, keepdim=True)
            return activations - mean
        elif self.normalization == 'l2':
            # L2 normalization along the hidden dimension
            norm = torch.norm(activations, p=2, dim=-1, keepdim=True)
            # Avoid division by zero
            norm = torch.clamp(norm, min=1e-12)
            return activations / norm
        elif self.normalization == 'layer':
            # Layer normalization; (re)create the module if the hidden
            # dimension changed since the last call
            if self.layer_norm is None or self.layer_norm.normalized_shape[0] != activations.size(-1):
                self.layer_norm = nn.LayerNorm(
                    normalized_shape=activations.size(-1),
                    device=activations.device
                )
            return self.layer_norm(activations)
        else:
            raise ValueError(f"Unknown normalization method: {self.normalization}")
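

# ---------------------------------------------------------------------------
# Usage sketch (illustrative only, not part of the module's API): a minimal
# example of how InputProcessor might be driven. The batch size, sequence
# lengths, and hidden size of 768 are assumptions chosen for the demo.
# ---------------------------------------------------------------------------
if __name__ == "__main__":
    processor = InputProcessor(max_length=64, normalization='l2')

    # Plain tensor input: [batch_size, sequence_length, hidden_size]
    acts = torch.randn(2, 100, 768)
    print(processor.process(acts).shape)  # torch.Size([2, 64, 768]); truncated

    # Dict input mimicking a transformer model output
    outputs = {'last_hidden_state': torch.randn(2, 10, 768)}
    print(processor.process(outputs).shape)  # torch.Size([2, 64, 768]); padded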