Commit 7d4db12

Add InformationIntegration and WorkingMemory modules; enhance ConsciousnessModel with self-awareness and memory update mechanisms

kasinadhsarma committed Dec 26, 2024
1 parent 9fa746e commit 7d4db12
Showing 14 changed files with 443 additions and 11 deletions.
Binary file added models/__pycache__/consciousness.cpython-310.pyc
Binary file modified models/__pycache__/consciousness_model.cpython-310.pyc
Binary file modified models/__pycache__/consciousness_state.cpython-310.pyc
Binary file added models/__pycache__/self_awareness.cpython-310.pyc
Binary file added models/__pycache__/working_memory.cpython-310.pyc
53 changes: 42 additions & 11 deletions models/consciousness.py
@@ -1,6 +1,9 @@
import torch
import torch.nn as nn
from typing import Dict, Tuple, Optional
from .working_memory import WorkingMemory
from .information_integration import InformationIntegration
from .self_awareness import SelfAwareness # Add this import

class MultiHeadAttention(nn.Module):
"""Custom MultiHeadAttention implementation"""
@@ -41,21 +44,26 @@ def forward(self, inputs: torch.Tensor, memory_state: Optional[torch.Tensor] = N
deterministic: bool = True) -> Tuple[torch.Tensor, torch.Tensor]:
# Process inputs through attention mechanism
attended = self.attention(inputs, deterministic=deterministic)

# Update working memory
# Ensure memory_state has correct shape
if memory_state is None:
memory_state = torch.zeros_like(attended)
else:
# Expand memory state if needed
memory_state = memory_state.unsqueeze(1).expand(-1, attended.size(1), -1)

# Update working memory with broadcasting
gate = torch.sigmoid(self.memory_gate(attended))
update = self.memory_update(attended)
memory_state = gate * memory_state + (1 - gate) * update

# Ensure memory gate output dimensions are correct
memory_state = memory_state.view(memory_state.size(0), -1)
# Pool across sequence dimension if needed
if len(memory_state.shape) == 3:
memory_state = memory_state.mean(dim=1)

# Integrate information
integrated = torch.relu(self.integration_layer(
torch.cat([attended, memory_state], dim=-1)
torch.cat([attended.mean(dim=1), memory_state], dim=-1)
))

# Generate conscious output
@@ -105,6 +113,16 @@ def __init__(self, hidden_dim: int, num_heads: int, num_layers: int, num_states:
dropout=dropout_rate,
batch_first=True
)

# Add self-awareness module
self.self_awareness = SelfAwareness(
hidden_dim=hidden_dim,
num_heads=num_heads,
dropout_rate=dropout_rate
)

# State tracking
self.previous_state = None

def get_config(self):
return {
@@ -144,24 +162,37 @@ def forward(self, inputs: Dict[str, torch.Tensor],
if state is None:
state = torch.zeros(inputs['attention'].shape[0], self.hidden_dim, device=device)

# Process inputs
x = torch.stack(list(inputs.values()), dim=1)
# Get input tensor
x = inputs['attention'] # [batch_size, seq_len, hidden_dim]

# Apply attention
# Apply attention - x is already in the correct shape
attn_out, attention_weights = self.attention(x, x, x)

# Process through global workspace
# Process through global workspace with reshaped state
conscious_out, memory_state = self.global_workspace(attn_out, state, deterministic)

# Process through self-awareness
aware_state, awareness_metrics = self.self_awareness(
conscious_out,
previous_state=self.previous_state
)

# Update previous state
self.previous_state = aware_state.detach()

# Calculate integration metrics
integrated_out, phi = self.information_integration(conscious_out, deterministic)

return integrated_out, {
# Update metrics
metrics = {
'attention_weights': attention_weights,
'memory_state': memory_state,
'phi': phi,
'attention_maps': attention_weights
'attention_maps': attention_weights,
**awareness_metrics
}

return aware_state, metrics

def create_consciousness_module(hidden_dim: int = 512,
num_cognitive_processes: int = 4) -> ConsciousnessModel:
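
Not part of the commit: a minimal smoke-test sketch of the new forward contract. It assumes the only required key in the inputs dict is 'attention' (the only key the updated code reads), that state and deterministic keep default values, and that the constructor arguments hidden in the collapsed portion of the diff are compatible; if the collapsed code validates additional input keys, the call would need to be extended.

import torch
from models.consciousness import create_consciousness_module

# Illustrative only: hidden_dim must match the last dimension of the input tensor.
model = create_consciousness_module(hidden_dim=512, num_cognitive_processes=4)
x = torch.randn(2, 8, 512)  # [batch_size, seq_len, hidden_dim]

# The reworked forward pass now returns the self-aware state plus a merged metrics dict.
aware_state, metrics = model({'attention': x})
print(aware_state.shape)  # expected [2, 512] after sequence pooling (assumption)
print(sorted(metrics))    # includes 'phi', 'memory_state', 'attention_maps' and the awareness metrics
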
44 changes: 44 additions & 0 deletions models/information_integration.py
@@ -0,0 +1,44 @@
import torch
import torch.nn as nn
from typing import Tuple

class InformationIntegration(nn.Module):
"""Module for integrating information across different cognitive processes."""

def __init__(self, hidden_dim: int, num_modules: int, dropout_rate: float = 0.1):
super().__init__()
self.hidden_dim = hidden_dim
self.num_modules = num_modules

# Integration layers
self.integration_network = nn.Sequential(
nn.Linear(hidden_dim, hidden_dim * 2),
nn.ReLU(),
nn.Dropout(dropout_rate),
nn.Linear(hidden_dim * 2, hidden_dim),
nn.LayerNorm(hidden_dim)
)

# Phi calculation network
self.phi_network = nn.Sequential(
nn.Linear(hidden_dim, hidden_dim // 2),
nn.ReLU(),
nn.Linear(hidden_dim // 2, 1),
nn.Sigmoid()
)

def forward(self, x: torch.Tensor, deterministic: bool = True) -> Tuple[torch.Tensor, torch.Tensor]:
"""
Forward pass for information integration.
Returns integrated information and phi value.
"""
# Set dropout behavior
self.train(not deterministic)

# Integrate information
integrated = self.integration_network(x)

# Calculate phi (information integration measure)
phi = self.phi_network(integrated)

return integrated, phi
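
Not part of the commit, just a hedged usage sketch with illustrative dimensions: the module integrates a batch of hidden states and returns a per-position phi score produced by a sigmoid head.

import torch
from models.information_integration import InformationIntegration

integration = InformationIntegration(hidden_dim=64, num_modules=4, dropout_rate=0.1)
x = torch.randn(2, 10, 64)  # [batch_size, seq_len, hidden_dim]

# deterministic=True puts the module in eval mode, so dropout is disabled.
integrated, phi = integration(x, deterministic=True)
print(integrated.shape)  # torch.Size([2, 10, 64])
print(phi.shape)         # torch.Size([2, 10, 1]); values lie in (0, 1)
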
143 changes: 143 additions & 0 deletions models/self_awareness.py
@@ -0,0 +1,143 @@
import torch
import torch.nn as nn
import torch.nn.functional as F
from typing import Dict, Tuple, Optional

class SelfAwareness(nn.Module):
"""Module for implementing self-awareness, monitoring, and representation."""

def __init__(self, hidden_dim: int, num_heads: int = 4, dropout_rate: float = 0.1):
super().__init__()
self.hidden_dim = hidden_dim

# Self-representation components
self.self_embed = nn.Linear(hidden_dim, hidden_dim)
self.state_encoder = nn.LSTM(hidden_dim, hidden_dim, num_layers=2, batch_first=True)

# Self-monitoring components
self.monitor = nn.ModuleDict({
'attention': nn.MultiheadAttention(hidden_dim, num_heads, dropout_rate),
'state_tracker': nn.Linear(hidden_dim * 2, hidden_dim),
'anomaly_detector': nn.Sequential(
nn.Linear(hidden_dim, hidden_dim // 2),
nn.ReLU(),
nn.Linear(hidden_dim // 2, 1),
nn.Sigmoid()
)
})

# Metacognitive components
self.metacognition = nn.ModuleDict({
'confidence': nn.Linear(hidden_dim, 1),
'error_prediction': nn.Linear(hidden_dim, hidden_dim),
'adaptation_net': nn.Sequential(
nn.Linear(hidden_dim, 1),
nn.Sigmoid()
)
})

# Store adaptation rate as buffer instead of parameter
self.register_buffer('adaptation_rate', torch.tensor(0.1))

self.history_size = 1000
self.state_history = []

def update_state_history(self, state: torch.Tensor):
"""Maintain a history of internal states."""
self.state_history.append(state.detach())
if len(self.state_history) > self.history_size:
self.state_history.pop(0)

def compute_self_representation(self, current_state: torch.Tensor) -> torch.Tensor:
"""Generate self-representation from current state."""
self_rep = self.self_embed(current_state)
historical_context = None

if self.state_history:
historical_tensor = torch.stack(self.state_history[-10:], dim=1)
historical_context, _ = self.state_encoder(historical_tensor)
historical_context = historical_context[:, -1, :] # Take last state

if historical_context is not None:
self_rep = self_rep + 0.1 * historical_context

return self_rep

def monitor_state(self, current_state: torch.Tensor,
previous_state: Optional[torch.Tensor] = None) -> Dict[str, torch.Tensor]:
"""Monitor internal state and detect anomalies."""
# Compare current state with previous if available
if previous_state is None:
previous_state = torch.zeros_like(current_state)

# Attend to important aspects of state
attended_state, _ = self.monitor['attention'](
current_state.unsqueeze(0),
current_state.unsqueeze(0),
current_state.unsqueeze(0)
)
attended_state = attended_state.squeeze(0)

# Track state changes
state_diff = self.monitor['state_tracker'](
torch.cat([current_state, previous_state], dim=-1)
)

# Calculate state magnitude for anomaly detection
state_magnitude = torch.norm(current_state, dim=-1, keepdim=True)
normalized_state = current_state / (state_magnitude + 1e-6)

# Detect anomalies based on normalized state
anomaly_score = self.monitor['anomaly_detector'](normalized_state)

return {
'attended_state': attended_state,
'state_change': state_diff,
'anomaly_score': anomaly_score
}

def assess_metacognition(self, state: torch.Tensor) -> Dict[str, torch.Tensor]:
"""Assess metacognitive aspects like confidence and error prediction."""
# Normalize state for more stable confidence estimation
state_magnitude = torch.norm(state, dim=-1, keepdim=True)
normalized_state = state / (state_magnitude + 1e-6)

# Calculate confidence based on normalized state
confidence = torch.sigmoid(self.metacognition['confidence'](normalized_state))
confidence = confidence * torch.exp(-state_magnitude / 100) # Reduce confidence for extreme values

error_pred = self.metacognition['error_prediction'](state)

return {
'confidence': confidence,
'error_prediction': error_pred,
'adaptation_rate': self.adaptation_rate
}

def forward(self, current_state: torch.Tensor,
previous_state: Optional[torch.Tensor] = None) -> Tuple[torch.Tensor, Dict]:
"""Process current state through self-awareness mechanisms."""
# Update state history
self.update_state_history(current_state)

# Generate self representation
self_rep = self.compute_self_representation(current_state)

# Monitor state
monitoring_results = self.monitor_state(current_state, previous_state)

# Assess metacognition
metacog_results = self.assess_metacognition(self_rep)

# Combine all metrics
metrics = {
'self_representation': self_rep,
**monitoring_results,
**metacog_results
}

# Update based on monitoring and metacognition
updated_state = current_state + \
(monitoring_results['attended_state'] * metacog_results['adaptation_rate'])

return updated_state, metrics
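
Again not part of the commit: a short sketch with illustrative dimensions. Because the module appends every input to a Python-list history, repeated calls give the LSTM encoder recent states to condition the self-representation on.

import torch
from models.self_awareness import SelfAwareness

awareness = SelfAwareness(hidden_dim=64, num_heads=4, dropout_rate=0.1)
state = torch.randn(2, 64)  # [batch_size, hidden_dim]

# First call: previous_state is None, so monitoring compares against zeros.
updated, metrics = awareness(state)

# Second call: pass the detached previous output, mirroring ConsciousnessModel.forward.
updated2, metrics2 = awareness(torch.randn(2, 64), previous_state=updated.detach())
print(metrics2['confidence'].shape)     # torch.Size([2, 1])
print(metrics2['anomaly_score'].shape)  # torch.Size([2, 1])
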
50 changes: 50 additions & 0 deletions models/working_memory.py
@@ -0,0 +1,50 @@
import torch
import torch.nn as nn
from typing import Optional, Tuple

class WorkingMemory(nn.Module):
"""Working memory component for maintaining and updating information"""

def __init__(self, input_dim: int, hidden_dim: int, dropout_rate: float = 0.1):
super().__init__()
self.input_dim = input_dim
self.hidden_dim = hidden_dim

# Memory cells
self.memory_rnn = nn.LSTM(
input_size=input_dim,
hidden_size=hidden_dim,
num_layers=2,
dropout=dropout_rate,
batch_first=True
)

# Update gate
self.update_gate = nn.Sequential(
nn.Linear(hidden_dim * 2, hidden_dim),
nn.Sigmoid()
)

# Output projection
self.output_projection = nn.Linear(hidden_dim, hidden_dim)

# Layer normalization
self.layer_norm = nn.LayerNorm(hidden_dim)

def forward(self, inputs: torch.Tensor, prev_state: Optional[Tuple[torch.Tensor, torch.Tensor]] = None) -> Tuple[torch.Tensor, Tuple[torch.Tensor, torch.Tensor]]:
# Process through LSTM
output, (h_n, c_n) = self.memory_rnn(inputs, prev_state)

# Apply update gate
if prev_state is not None:
prev_h = prev_state[0]
gate = self.update_gate(torch.cat([output, prev_h[-1:]], dim=-1))
output = gate * output + (1 - gate) * prev_h[-1:]

# Project output
output = self.output_projection(output)

# Apply layer normalization
output = self.layer_norm(output)

return output, (h_n, c_n)
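
A final hedged sketch (illustrative dimensions, not from the commit): when prev_state is omitted, the LSTM starts from zero hidden and cell states and the update-gate branch is skipped.

import torch
from models.working_memory import WorkingMemory

memory = WorkingMemory(input_dim=64, hidden_dim=64, dropout_rate=0.1)
inputs = torch.randn(2, 10, 64)  # [batch_size, seq_len, input_dim]

output, (h_n, c_n) = memory(inputs)
print(output.shape)  # torch.Size([2, 10, 64])
print(h_n.shape)     # torch.Size([2, 2, 64]) -> [num_layers, batch_size, hidden_dim]
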
Binary file modified tests/__pycache__/conftest.cpython-310-pytest-8.3.4.pyc