This commit is contained in:
Daniel Ari Friedman 2025-02-07 08:58:14 -08:00
parent ccdeafd068
commit b4279401c2
22 changed files with 871 additions and 270 deletions

41 .obsidian/workspace.json (vendored)
View file

@@ -163,26 +163,29 @@
     },
     "active": "0ba8a1b9b9dd949a",
     "lastOpenFiles": [
+      "Things/Simple_POMDP/Output/efe_components_detailed.png",
+      "Things/Simple_POMDP/Output/policy_evolution.png",
+      "Things/Simple_POMDP/Output/free_energies.png",
+      "Things/Simple_POMDP/Output/belief_history.png",
+      "Things/Simple_POMDP/Output/action_history.png",
+      "Things/Simple_POMDP/Output/observation_likelihood.png",
+      "Things/Simple_POMDP/Output/state_transitions.png",
+      "Things/Simple_POMDP/Output/belief_evolution.png",
+      "Things/Simple_POMDP/Output/simulation_log.txt",
+      "Things/Simple_POMDP/Output/all_matrices.png",
+      "Things/Simple_POMDP/Output/C_preferences.png",
+      "Things/Simple_POMDP/Output/B_matrices.png",
+      "Things/Simple_POMDP/Output/matrix_validation.txt",
+      "Things/Simple_POMDP/Output",
+      "src/models/active_inference/docs/dispatcher.md",
+      "src/models/active_inference/docs/active_inference_dispatcher.md",
+      "src/models/active_inference/docs/active_inference.md",
+      "src/models/active_inference/docs",
+      "src/models/active_inference/config_examples/continuous_sampling.yaml",
+      "src/models/active_inference/config_examples/discrete_variational.yaml",
+      "src/models/active_inference/config_examples",
       "src/models/active_inference/dispatcher.py",
       "Things/Continuous_Generic/__pycache__/test_continuous_generic.cpython-310-pytest-8.3.2.pyc",
-      "Things/Continuous_Generic/__pycache__/conftest.cpython-310-pytest-8.3.2.pyc",
-      "Things/Continuous_Generic/Output/tests/single_step",
-      "Things/Continuous_Generic/Output/tests/multi_step",
-      "Things/Continuous_Generic/Output/tests/complex",
-      "Things/Continuous_Generic/Output/tests/basic",
-      "Things/Continuous_Generic/Output/tests",
-      "Things/Continuous_Generic/Output",
-      "Things/Continuous_Generic/__pycache__/visualization.cpython-310.pyc",
-      "Things/Continuous_Generic/__pycache__/continuous_generic.cpython-310.pyc",
-      "Things/Continuous_Generic/Output/tests/complex/energy_conservation/energy_evolution.gif",
-      "Things/Continuous_Generic/Output/tests/complex/energy_conservation/energy_analysis.png",
-      "Things/Continuous_Generic/Output/tests/complex/taylor_prediction/prediction_analysis.png",
-      "Things/Continuous_Generic/Output/tests/complex/generalized_coordinates/error_analysis.png",
-      "Things/Continuous_Generic/Output/tests/complex/generalized_coordinates/derivative_analysis.png",
-      "Things/Continuous_Generic/Output/tests/complex/generalized_coordinates/generalized_coordinates.gif",
-      "Things/Continuous_Generic/Output/tests/complex/driven_oscillator/prediction_analysis.png",
-      "Things/Continuous_Generic/Output/tests/complex/driven_oscillator/state_correlations.png",
-      "Things/Continuous_Generic/Output/tests/complex/driven_oscillator/time_evolution.png",
-      "Things/Continuous_Generic/Output/tests/complex/driven_oscillator/phase_space.png"
+      "Things/Continuous_Generic/__pycache__/conftest.cpython-310-pytest-8.3.2.pyc"
     ]
   }

Binary data: Things/Simple_POMDP/Output/A_matrix.png (binary file not shown; 26 KiB → 26 KiB)

Binary data: Things/Simple_POMDP/Output/B_matrices.png (binary file not shown; 53 KiB → 50 KiB)

Binary data: Things/Simple_POMDP/Output/C_matrix.png (binary file not shown; before: 22 KiB)

Binary data: Things/Simple_POMDP/Output/action_history.png (binary file not shown; 21 KiB → 21 KiB)

Binary data: Things/Simple_POMDP/Output/all_matrices.png (binary file not shown; 200 KiB → 196 KiB)

Binary data: Things/Simple_POMDP/Output/belief_evolution.png (binary file not shown; 92 KiB → 86 KiB)

Binary data: Things/Simple_POMDP/Output/belief_history.png (binary file not shown; 24 KiB → 22 KiB)

Binary file not shown (path not listed in this view); 190 KiB → 208 KiB

Binary data: Things/Simple_POMDP/Output/free_energies.png (binary file not shown; 102 KiB → 116 KiB)

Things/Simple_POMDP/Output/matrix_validation.txt
View file

@@ -7,15 +7,15 @@ A Matrix (Observation Model):
- Non-negative: True - Non-negative: True
Observation probabilities: Observation probabilities:
P(Low|Low) = 0.092 P(Low|Low) = 0.202
P(Low|Medium) = 0.219 P(Low|Medium) = 0.003
P(Low|High) = 0.423 P(Low|High) = 0.411
P(Medium|Low) = 0.270 P(Medium|Low) = 0.582
P(Medium|Medium) = 0.375 P(Medium|Medium) = 0.714
P(Medium|High) = 0.405 P(Medium|High) = 0.186
P(High|Low) = 0.638 P(High|Low) = 0.216
P(High|Medium) = 0.406 P(High|Medium) = 0.283
P(High|High) = 0.173 P(High|High) = 0.403
B Matrix (Transition Model): B Matrix (Transition Model):
- Shape: (3, 3, 3) - Shape: (3, 3, 3)
@@ -25,45 +25,45 @@ Action: Decrease
- Non-negative: True - Non-negative: True
Transition probabilities: Transition probabilities:
P(Low|Low,Decrease) = 0.172 P(Low|Low,Decrease) = 0.324
P(Low|Medium,Decrease) = 0.278 P(Low|Medium,Decrease) = 0.186
P(Low|High,Decrease) = 0.042 P(Low|High,Decrease) = 0.012
P(Medium|Low,Decrease) = 0.158 P(Medium|Low,Decrease) = 0.320
P(Medium|Medium,Decrease) = 0.296 P(Medium|Medium,Decrease) = 0.162
P(Medium|High,Decrease) = 0.157 P(Medium|High,Decrease) = 0.722
P(High|Low,Decrease) = 0.670 P(High|Low,Decrease) = 0.356
P(High|Medium,Decrease) = 0.426 P(High|Medium,Decrease) = 0.651
P(High|High,Decrease) = 0.801 P(High|High,Decrease) = 0.266
Action: Stay Action: Stay
- Column stochastic: True - Column stochastic: True
- Non-negative: True - Non-negative: True
Transition probabilities: Transition probabilities:
P(Low|Low,Stay) = 0.413 P(Low|Low,Stay) = 0.423
P(Low|Medium,Stay) = 0.319 P(Low|Medium,Stay) = 0.005
P(Low|High,Stay) = 0.453 P(Low|High,Stay) = 0.182
P(Medium|Low,Stay) = 0.048 P(Medium|Low,Stay) = 0.257
P(Medium|Medium,Stay) = 0.660 P(Medium|Medium,Stay) = 0.738
P(Medium|High,Stay) = 0.462 P(Medium|High,Stay) = 0.719
P(High|Low,Stay) = 0.539 P(High|Low,Stay) = 0.320
P(High|Medium,Stay) = 0.021 P(High|Medium,Stay) = 0.257
P(High|High,Stay) = 0.085 P(High|High,Stay) = 0.099
Action: Increase Action: Increase
- Column stochastic: True - Column stochastic: True
- Non-negative: True - Non-negative: True
Transition probabilities: Transition probabilities:
P(Low|Low,Increase) = 0.272 P(Low|Low,Increase) = 0.320
P(Low|Medium,Increase) = 0.423 P(Low|Medium,Increase) = 0.367
P(Low|High,Increase) = 0.258 P(Low|High,Increase) = 0.486
P(Medium|Low,Increase) = 0.264 P(Medium|Low,Increase) = 0.241
P(Medium|Medium,Increase) = 0.401 P(Medium|Medium,Increase) = 0.364
P(Medium|High,Increase) = 0.364 P(Medium|High,Increase) = 0.264
P(High|Low,Increase) = 0.464 P(High|Low,Increase) = 0.438
P(High|Medium,Increase) = 0.176 P(High|Medium,Increase) = 0.269
P(High|High,Increase) = 0.377 P(High|High,Increase) = 0.250
C Matrix (Log Preferences over Observations): C Matrix (Log Preferences over Observations):
- Shape: (3,) - Shape: (3,)

Binary file not shown (path not listed in this view); 17 KiB → 17 KiB

Binary file not shown (path not listed in this view); before: 20 KiB

Binary data: Things/Simple_POMDP/Output/policy_evolution.png (binary file not shown; 47 KiB → 53 KiB)

Things/Simple_POMDP/Output/simulation_log.txt
View file

@@ -3,321 +3,321 @@ Simulation Log
Step 1: Step 1:
State: Low State: High
Observation: High Observation: Low
Action: Increase Action: Decrease
Variational FE: 0.914 Variational FE: 1.557
Expected Free Energies: Expected Free Energies:
Decrease: 0.095 Decrease: 0.047
Stay: 0.319 Stay: -0.200
Increase: 0.330 Increase: 0.052
Beliefs: Beliefs:
Low: 0.420 Low: 0.250
Medium: 0.340 Medium: 0.170
High: 0.240 High: 0.580
Step 2: Step 2:
State: Low State: High
Observation: High Observation: Low
Action: Decrease Action: Increase
Variational FE: 1.194 Variational FE: 1.561
Expected Free Energies: Expected Free Energies:
Decrease: 0.116 Decrease: -0.112
Stay: 0.334 Stay: -0.280
Increase: 0.330 Increase: 0.031
Beliefs: Beliefs:
Low: 0.396 Low: 0.329
Medium: 0.307 Medium: 0.087
High: 0.296 High: 0.584
Step 3: Step 3:
State: Low State: Medium
Observation: Medium Observation: Medium
Action: Stay Action: Increase
Variational FE: 1.077 Variational FE: 0.708
Expected Free Energies: Expected Free Energies:
Decrease: 0.094 Decrease: -0.131
Stay: 0.332 Stay: -0.230
Increase: 0.328 Increase: 0.043
Beliefs: Beliefs:
Low: 0.355 Low: 0.413
Medium: 0.351 Medium: 0.235
High: 0.294 High: 0.351
Step 4: Step 4:
State: High State: High
Observation: Medium Observation: Medium
Action: Stay Action: Decrease
Variational FE: 1.078 Variational FE: 0.729
Expected Free Energies: Expected Free Energies:
Decrease: 0.109 Decrease: 0.025
Stay: 0.323 Stay: -0.153
Increase: 0.331 Increase: 0.064
Beliefs: Beliefs:
Low: 0.333 Low: 0.317
Medium: 0.388 Medium: 0.432
High: 0.280 High: 0.252
Step 5: Step 5:
State: Medium State: Medium
Observation: Medium Observation: Medium
Action: Increase Action: Increase
Variational FE: 1.049 Variational FE: 0.702
Expected Free Energies: Expected Free Energies:
Decrease: 0.123 Decrease: 0.090
Stay: 0.315 Stay: -0.206
Increase: 0.333 Increase: 0.051
Beliefs: Beliefs:
Low: 0.292 Low: 0.383
Medium: 0.379 Medium: 0.432
High: 0.329 High: 0.186
Step 6: Step 6:
State: Medium State: Medium
Observation: Medium
Action: Increase
Variational FE: 1.048
Expected Free Energies:
Decrease: 0.111
Stay: 0.304
Increase: 0.332
Beliefs:
Low: 0.271
Medium: 0.376
High: 0.353
Step 7:
State: Medium
Observation: Low
Action: Stay
Variational FE: 1.577
Expected Free Energies:
Decrease: 0.105
Stay: 0.298
Increase: 0.332
Beliefs:
Low: 0.223
Medium: 0.412
High: 0.365
Step 8:
State: Medium
Observation: High Observation: High
Action: Stay Action: Stay
Variational FE: 0.778 Variational FE: 1.204
Expected Free Energies: Expected Free Energies:
Decrease: 0.114 Decrease: 0.110
Stay: 0.276 Stay: -0.158
Increase: 0.333 Increase: 0.062
Beliefs: Beliefs:
Low: 0.382 Low: 0.263
Medium: 0.406 Medium: 0.475
High: 0.212 High: 0.262
Step 7:
State: High
Observation: Low
Action: Decrease
Variational FE: 1.465
Expected Free Energies:
Decrease: 0.090
Stay: -0.247
Increase: 0.042
Beliefs:
Low: 0.209
Medium: 0.240
High: 0.551
Step 8:
State: Low
Observation: Low
Action: Stay
Variational FE: 2.159
Expected Free Energies:
Decrease: -0.082
Stay: -0.306
Increase: 0.025
Beliefs:
Low: 0.270
Medium: 0.128
High: 0.601
Step 9: Step 9:
State: High State: High
Observation: Low Observation: Low
Action: Decrease Action: Increase
Variational FE: 1.149 Variational FE: 1.554
Expected Free Energies: Expected Free Energies:
Decrease: 0.142 Decrease: -0.134
Stay: 0.325 Stay: -0.269
Increase: 0.334 Increase: 0.034
Beliefs: Beliefs:
Low: 0.218 Low: 0.338
Medium: 0.277 Medium: 0.066
High: 0.505 High: 0.595
Step 10: Step 10:
State: Medium State: Medium
Observation: High Observation: High
Action: Stay Action: Stay
Variational FE: 0.772 Variational FE: 1.244
Expected Free Energies: Expected Free Energies:
Decrease: 0.036 Decrease: -0.143
Stay: 0.287 Stay: -0.226
Increase: 0.327 Increase: 0.044
Beliefs: Beliefs:
Low: 0.390 Low: 0.264
Medium: 0.326 Medium: 0.310
High: 0.284 High: 0.426
Step 11: Step 11:
State: Medium State: High
Observation: High Observation: High
Action: Stay Action: Increase
Variational FE: 0.818 Variational FE: 1.229
Expected Free Energies: Expected Free Energies:
Decrease: 0.103 Decrease: 0.000
Stay: 0.331 Stay: -0.255
Increase: 0.330 Increase: 0.039
Beliefs: Beliefs:
Low: 0.480 Low: 0.282
Medium: 0.331 Medium: 0.295
High: 0.189 High: 0.424
Step 12: Step 12:
State: Low
Observation: Medium
Action: Increase
Variational FE: 1.045
Expected Free Energies:
Decrease: 0.123
Stay: 0.339
Increase: 0.329
Beliefs:
Low: 0.362
Medium: 0.340
High: 0.297
Step 13:
State: High
Observation: Medium
Action: Increase
Variational FE: 1.046
Expected Free Energies:
Decrease: 0.105
Stay: 0.325
Increase: 0.330
Beliefs:
Low: 0.304
Medium: 0.352
High: 0.345
Step 14:
State: High State: High
Observation: Low Observation: Low
Action: Increase Action: Increase
Variational FE: 1.403 Variational FE: 1.564
Expected Free Energies: Expected Free Energies:
Decrease: 0.099 Decrease: -0.000
Stay: 0.310 Stay: -0.242
Increase: 0.331 Increase: 0.042
Beliefs: Beliefs:
Low: 0.212 Low: 0.336
Medium: 0.330 Medium: 0.149
High: 0.458 High: 0.515
Step 13:
State: Medium
Observation: Medium
Action: Stay
Variational FE: 0.547
Expected Free Energies:
Decrease: -0.075
Stay: -0.217
Increase: 0.047
Beliefs:
Low: 0.287
Medium: 0.424
High: 0.289
Step 14:
State: High
Observation: Medium
Action: Increase
Variational FE: 0.697
Expected Free Energies:
Decrease: 0.075
Stay: -0.229
Increase: 0.046
Beliefs:
Low: 0.370
Medium: 0.427
High: 0.203
Step 15: Step 15:
State: Medium State: Medium
Observation: High Observation: High
Action: Increase Action: Stay
Variational FE: 0.910 Variational FE: 1.205
Expected Free Energies:
Decrease: 0.066
Stay: 0.280
Increase: 0.330
Beliefs:
Low: 0.356
Medium: 0.344
High: 0.300
Step 16:
State: Low
Observation: High
Action: Increase
Variational FE: 0.913
Expected Free Energies: Expected Free Energies:
Decrease: 0.105 Decrease: 0.105
Stay: 0.324 Stay: -0.167
Increase: 0.331 Increase: 0.060
Beliefs: Beliefs:
Low: 0.433 Low: 0.256
Medium: 0.345 Medium: 0.476
High: 0.223 High: 0.268
Step 16:
State: Low
Observation: Medium
Action: Increase
Variational FE: 0.692
Expected Free Energies:
Decrease: 0.088
Stay: -0.252
Increase: 0.041
Beliefs:
Low: 0.353
Medium: 0.456
High: 0.191
Step 17: Step 17:
State: High State: High
Observation: Medium Observation: High
Action: Stay Action: Increase
Variational FE: 1.074 Variational FE: 1.214
Expected Free Energies: Expected Free Energies:
Decrease: 0.121 Decrease: 0.111
Stay: 0.336 Stay: -0.178
Increase: 0.330 Increase: 0.058
Beliefs: Beliefs:
Low: 0.370 Low: 0.312
Medium: 0.365 Medium: 0.371
High: 0.265 High: 0.316
Step 18: Step 18:
State: High State: High
Observation: Low Observation: Low
Action: Decrease Action: Increase
Variational FE: 1.134 Variational FE: 1.563
Expected Free Energies: Expected Free Energies:
Decrease: 0.119 Decrease: 0.059
Stay: 0.325 Stay: -0.213
Increase: 0.332 Increase: 0.049
Beliefs: Beliefs:
Low: 0.210 Low: 0.344
Medium: 0.253 Medium: 0.188
High: 0.537 High: 0.468
Step 19: Step 19:
State: Medium State: Low
Observation: Medium Observation: Medium
Action: Stay Action: Stay
Variational FE: 1.089 Variational FE: 0.553
Expected Free Energies: Expected Free Energies:
Decrease: 0.019 Decrease: -0.041
Stay: 0.286 Stay: -0.206
Increase: 0.325 Increase: 0.050
Beliefs: Beliefs:
Low: 0.270 Low: 0.289
Medium: 0.363 Medium: 0.443
High: 0.367 High: 0.267
Step 20: Step 20:
State: High State: Low
Observation: High Observation: Medium
Action: Decrease Action: Stay
Variational FE: 1.214 Variational FE: 0.565
Expected Free Energies: Expected Free Energies:
Decrease: 0.098 Decrease: 0.085
Stay: 0.298 Stay: -0.227
Increase: 0.331 Increase: 0.047
Beliefs: Beliefs:
Low: 0.310 Low: 0.233
Medium: 0.324 Medium: 0.595
High: 0.367 High: 0.172

Binary data: Things/Simple_POMDP/Output/state_transitions.png (binary file not shown; 36 KiB → 34 KiB)

src/models/active_inference/__init__.py
View file

@@ -2,4 +2,21 @@
Active Inference model implementations.
"""
-from .base import ActiveInferenceModel
+from .base import ActiveInferenceModel, ModelState
+from .dispatcher import (
+    ActiveInferenceDispatcher,
+    ActiveInferenceFactory,
+    InferenceConfig,
+    InferenceMethod,
+    PolicyType
+)
+
+__all__ = [
+    'ActiveInferenceModel',
+    'ModelState',
+    'ActiveInferenceDispatcher',
+    'ActiveInferenceFactory',
+    'InferenceConfig',
+    'InferenceMethod',
+    'PolicyType'
+]

src/models/active_inference/config_examples/continuous_sampling.yaml
View file

@@ -0,0 +1,30 @@
# Example configuration for continuous sampling-based active inference
method: sampling
policy_type: continuous
temporal_horizon: 10
learning_rate: 0.005
precision_init: 1.0
use_gpu: false
num_samples: 2000
temperature: 0.8

# Model-specific parameters
custom_params:
  exploration_weight: 0.4
  state_dimensions: [6]   # Continuous state space dimension
  action_dimensions: [2]  # Continuous action space dimension
  # Sampling parameters
  proposal_std: 0.1
  min_acceptance_rate: 0.2
  adaptation_rate: 0.01
  # Prior parameters
  state_prior_mean: [0.0, 0.0, 0.0, 0.0, 0.0, 0.0]
  state_prior_std: [1.0, 1.0, 1.0, 1.0, 1.0, 1.0]
  # MCMC parameters
  burn_in: 500
  thinning: 2
  num_chains: 4
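For reference, a minimal sketch of turning a config file like this into a dispatcher. The open() path, the enum lookups, and the direct InferenceConfig construction are assumptions for illustration; the repository's ActiveInferenceFactory may already provide an equivalent loader.

```python
import yaml

from models.active_inference import (
    ActiveInferenceFactory,
    InferenceConfig,
    InferenceMethod,
    PolicyType,
)

with open("continuous_sampling.yaml") as f:
    cfg = yaml.safe_load(f)

# Map plain YAML values onto the dataclass; enum member names are assumed
# to match the lowercase strings used in the config files.
config = InferenceConfig(
    method=InferenceMethod[cfg["method"].upper()],
    policy_type=PolicyType[cfg["policy_type"].upper()],
    temporal_horizon=cfg["temporal_horizon"],
    learning_rate=cfg["learning_rate"],
    precision_init=cfg["precision_init"],
    use_gpu=cfg.get("use_gpu", False),
    num_samples=cfg.get("num_samples", 1000),
    temperature=cfg.get("temperature", 1.0),
    custom_params=cfg.get("custom_params"),
)
dispatcher = ActiveInferenceFactory.create(config)
```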

src/models/active_inference/config_examples/discrete_variational.yaml
View file

@@ -0,0 +1,23 @@
# Example configuration for discrete variational active inference
method: variational
policy_type: discrete
temporal_horizon: 5
learning_rate: 0.01
precision_init: 1.0
use_gpu: false

# Model-specific parameters
custom_params:
  exploration_weight: 0.3     # Balance between exploration and exploitation
  state_dimensions: [10, 10]  # Example state space dimensions
  action_dimensions: [4]      # Example action space dimensions
  # Prior preferences
  goal_prior_weight: 2.0
  entropy_weight: 0.5
  # Learning parameters
  belief_momentum: 0.9
  policy_temperature: 0.5
  max_iterations: 100

src/models/active_inference/dispatcher.py
View file

@@ -34,6 +34,8 @@ class InferenceConfig:
    learning_rate: float
    precision_init: float
    use_gpu: bool = False
+    num_samples: int = 1000  # For sampling-based methods
+    temperature: float = 1.0  # For policy selection
    custom_params: Optional[Dict[str, Any]] = None

class ActiveInferenceDispatcher:
@@ -47,6 +49,7 @@ class ActiveInferenceDispatcher:
        self.config = config
        self._setup_implementations()
        self._initialize_matrices()
+        self._rng = np.random.default_rng()  # For sampling methods

    def _setup_implementations(self):
        """Set up mapping of operations to implementations."""
@@ -121,9 +124,41 @@ class ActiveInferenceDispatcher:
                                  observation: np.ndarray,
                                  state: ModelState,
                                  **kwargs) -> np.ndarray:
-        """Sampling-based implementation of belief updates."""
-        # Implementation for sampling-based updates
-        raise NotImplementedError("Sampling-based belief updates not yet implemented")
+        """Sampling-based implementation of belief updates using particle filtering."""
+        num_samples = self.config.num_samples
+        generative_matrix = kwargs.get('generative_matrix', np.eye(len(state.beliefs)))
+        # Initialize particles
+        particles = self._rng.dirichlet(
+            state.beliefs * num_samples,
+            size=num_samples
+        )
+        # Compute weights based on likelihood
+        likelihoods = np.array([
+            self._compute_likelihood(observation, p, generative_matrix)
+            for p in particles
+        ])
+        weights = likelihoods / np.sum(likelihoods)
+        # Resample particles
+        resampled_indices = self._rng.choice(
+            num_samples,
+            size=num_samples,
+            p=weights
+        )
+        particles = particles[resampled_indices]
+        # Return mean belief state
+        return np.mean(particles, axis=0)
+
+    def _compute_likelihood(self,
+                            observation: np.ndarray,
+                            particle: np.ndarray,
+                            generative_matrix: np.ndarray) -> float:
+        """Compute likelihood of observation given particle state."""
+        prediction = np.dot(particle, generative_matrix)
+        return np.exp(-0.5 * np.sum(np.square(observation - prediction)))

    def _mean_field_belief_update(self,
                                  observation: np.ndarray,
@@ -150,8 +185,45 @@ class ActiveInferenceDispatcher:
                                  state: ModelState,
                                  goal_prior: Optional[np.ndarray] = None,
                                  **kwargs) -> np.ndarray:
-        """Sampling-based implementation of policy inference."""
-        raise NotImplementedError("Sampling-based policy inference not yet implemented")
+        """Sampling-based implementation of policy inference using MCMC."""
+        if goal_prior is None:
+            goal_prior = np.ones(len(state.policies)) / len(state.policies)
+        num_samples = self.config.num_samples
+        current_policies = state.policies.copy()
+        accepted_policies = []
+        # MCMC sampling
+        for _ in range(num_samples):
+            # Propose new policy distribution
+            proposal = self._propose_policy(current_policies)
+            # Compute acceptance ratio
+            current_energy = self._policy_energy(current_policies, state, goal_prior)
+            proposal_energy = self._policy_energy(proposal, state, goal_prior)
+            # Accept/reject
+            if np.log(self._rng.random()) < proposal_energy - current_energy:
+                current_policies = proposal
+            accepted_policies.append(current_policies.copy())
+        # Return mean policy distribution
+        return np.mean(accepted_policies, axis=0)
+
+    def _propose_policy(self, current: np.ndarray) -> np.ndarray:
+        """Generate policy proposal for MCMC."""
+        proposal = current + self._rng.normal(0, 0.1, size=current.shape)
+        return self.matrix_ops.normalize_rows(np.maximum(proposal, 0))
+
+    def _policy_energy(self,
+                       policies: np.ndarray,
+                       state: ModelState,
+                       goal_prior: np.ndarray) -> float:
+        """Compute energy (negative log probability) for policy distribution."""
+        expected_free_energy = self._calculate_expected_free_energy(
+            state, goal_prior)
+        return np.sum(policies * expected_free_energy)

    def _mean_field_policy_inference(self,
                                     state: ModelState,
@@ -165,15 +237,43 @@ class ActiveInferenceDispatcher:
                                         goal_prior: np.ndarray,
                                         **kwargs) -> np.ndarray:
        """Calculate expected free energy for policy evaluation."""
-        # Basic implementation - can be extended based on specific needs
-        pragmatic_value = -np.log(goal_prior + 1e-8)  # Avoid log(0)
+        # Enhanced implementation with both pragmatic and epistemic value
+        pragmatic_value = self._calculate_pragmatic_value(state, goal_prior)
        epistemic_value = self._calculate_epistemic_value(state)
-        return pragmatic_value + epistemic_value
+        # Weight between exploration and exploitation
+        exploration_weight = kwargs.get('exploration_weight', 0.5)
+        return (1 - exploration_weight) * pragmatic_value + exploration_weight * epistemic_value
+
+    def _calculate_pragmatic_value(self,
+                                   state: ModelState,
+                                   goal_prior: np.ndarray) -> np.ndarray:
+        """Calculate pragmatic value component of expected free energy."""
+        # KL divergence from current state to goal state
+        return -np.log(goal_prior + 1e-8)

    def _calculate_epistemic_value(self, state: ModelState) -> np.ndarray:
        """Calculate epistemic value component of expected free energy."""
-        # Simple implementation - can be extended
-        return -state.prediction_error * np.ones(len(state.policies))
+        # Information gain approximation
+        uncertainty = -np.sum(state.beliefs * np.log(state.beliefs + 1e-8))
+        return -uncertainty * np.ones(len(state.policies))
+
+    def update_precision(self, prediction_error: float) -> float:
+        """Update precision parameter based on prediction errors."""
+        if self.config.method == InferenceMethod.VARIATIONAL:
+            # Precision updates for variational method
+            self.config.precision_init = (
+                0.9 * self.config.precision_init +
+                0.1 / (prediction_error + 1e-8)
+            )
+        elif self.config.method == InferenceMethod.SAMPLING:
+            # Adaptive step size for sampling method
+            self.config.precision_init = np.clip(
+                1.0 / (prediction_error + 1e-8),
+                0.1,
+                10.0
+            )
+        return self.config.precision_init

class ActiveInferenceFactory:
    """Factory for creating Active Inference instances with specific configurations."""
@@ -197,6 +297,8 @@ class ActiveInferenceFactory:
            learning_rate=config_dict['learning_rate'],
            precision_init=config_dict['precision_init'],
            use_gpu=config_dict.get('use_gpu', False),
+            num_samples=config_dict.get('num_samples', 1000),
+            temperature=config_dict.get('temperature', 1.0),
            custom_params=config_dict.get('custom_params', None)
        )
        return ActiveInferenceFactory.create(config)

src/models/active_inference/docs/active_inference.md
View file

@@ -0,0 +1,212 @@
# Active Inference Implementation Documentation
## Overview
This document describes the implementation of [[Active Inference]] methods in the cognitive modeling framework. The implementation provides a flexible and extensible architecture for different inference approaches and policy types.
## Core Components
### Dispatcher Pattern
The [[ActiveInferenceDispatcher]] serves as the main interface for routing operations to specific implementations. It handles:
- Belief updates
- Policy inference
- Free energy calculations
- Precision updates
### Configuration
[[InferenceConfig]] provides a structured way to configure the active inference process:
- Inference method selection
- Policy type specification
- Temporal horizon
- Learning parameters
- GPU acceleration options
### Inference Methods
Three main inference methods are supported:
1. [[Variational Inference]]
- Gradient-based belief updates
- Deterministic policy optimization
- Precision-weighted prediction errors
2. [[Sampling Based Inference]]
- Particle filtering for belief updates
- MCMC for policy inference
- Adaptive precision updates
3. [[Mean Field Inference]]
- Factorized approximations
- Independent treatment of variables
- (Implementation pending)
### Policy Types
The framework supports multiple [[Policy Types]]:
- `DISCRETE`: Finite action spaces
- `CONTINUOUS`: Continuous action spaces
- `HIERARCHICAL`: Nested policy structures
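A minimal sketch of how the two selection enums might look; `VARIATIONAL`, `SAMPLING`, `DISCRETE`, `CONTINUOUS`, and `HIERARCHICAL` appear in the code and docs, while the mean-field member name and the string values are assumptions:

```python
from enum import Enum

class InferenceMethod(Enum):
    VARIATIONAL = "variational"
    SAMPLING = "sampling"
    MEAN_FIELD = "mean_field"   # member name assumed

class PolicyType(Enum):
    DISCRETE = "discrete"
    CONTINUOUS = "continuous"
    HIERARCHICAL = "hierarchical"
```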
## Usage Examples
### Basic Configuration
```yaml
method: variational
policy_type: discrete
temporal_horizon: 5
learning_rate: 0.01
precision_init: 1.0
```
See [[Configuration Examples]] for more detailed examples.
### Code Usage
```python
from models.active_inference import (
    ActiveInferenceFactory,
    InferenceConfig,
    InferenceMethod,
    PolicyType
)
# Create configuration
config = InferenceConfig(...)
dispatcher = ActiveInferenceFactory.create(config)
# Update beliefs
updated_beliefs = dispatcher.dispatch_belief_update(
    observation=current_observation,
    current_state=model_state
)
```
## Implementation Details
### Free Energy Calculation
The [[Expected Free Energy]] calculation combines:
1. Pragmatic value (goal-directed behavior)
2. Epistemic value (information seeking)
```python
def _calculate_expected_free_energy(self, state, goal_prior, **kwargs):
    pragmatic_value = self._calculate_pragmatic_value(state, goal_prior)
    epistemic_value = self._calculate_epistemic_value(state)
    exploration_weight = kwargs.get('exploration_weight', 0.5)
    return (1 - exploration_weight) * pragmatic_value + exploration_weight * epistemic_value
```
### Belief Updates
Different methods for [[Belief Updates]]:
1. Variational:
- Gradient-based updates
- Precision-weighted errors
2. Sampling:
- Particle filtering
- Importance resampling
3. Mean Field:
- Factorized updates
- Independent parameter optimization
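For comparison, the variational route reduces to a precision-weighted prediction-error step. The standalone function below paraphrases the dispatcher snippet shown in [[Active Inference Dispatcher]]; the function name and the final renormalization are additions for illustration, not part of the original code:

```python
import numpy as np

def variational_belief_update(beliefs: np.ndarray,
                              observation: np.ndarray,
                              generative_matrix: np.ndarray,
                              precision: float) -> np.ndarray:
    """Precision-weighted prediction-error update (simplified paraphrase)."""
    # Observation and state dimensions are assumed equal here, matching the
    # dispatcher's identity-matrix default for generative_matrix.
    prediction = beliefs @ generative_matrix
    prediction_error = observation - prediction
    updated = beliefs + precision * prediction_error
    # Added safeguard: keep the result a valid belief distribution
    updated = np.clip(updated, 1e-8, None)
    return updated / updated.sum()
```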
### Policy Inference
[[Policy Inference]] implementations:
1. Variational:
```python
expected_free_energy = self._calculate_expected_free_energy(...)
return self.matrix_ops.softmax(-expected_free_energy)
```
2. MCMC:
- Metropolis-Hastings sampling
- Proposal distribution
- Energy-based acceptance
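A condensed, self-contained sketch of the MCMC route; the sign convention follows the textbook Metropolis-Hastings rule, and `energy_fn`, `proposal_std`, and the function name are illustrative rather than the dispatcher's exact API. In practice `energy_fn` would wrap the expected free energy described above.

```python
import numpy as np

def mcmc_policy_inference(policies: np.ndarray,
                          energy_fn,
                          num_samples: int = 1000,
                          proposal_std: float = 0.1,
                          rng=None) -> np.ndarray:
    """Metropolis-Hastings over policy distributions (illustrative)."""
    rng = rng or np.random.default_rng()
    current = policies.copy()
    samples = []
    for _ in range(num_samples):
        # Propose a perturbed, renormalized policy distribution
        proposal = np.maximum(current + rng.normal(0.0, proposal_std, current.shape), 0) + 1e-12
        proposal /= proposal.sum()
        # Accept when the proposal has lower energy (or by chance otherwise)
        if np.log(rng.random()) < energy_fn(current) - energy_fn(proposal):
            current = proposal
        samples.append(current.copy())
    return np.mean(np.array(samples), axis=0)
```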
## Advanced Features
### Precision Updates
[[Precision Updates]] adapt based on prediction errors:
- Variational: Running average updates
- Sampling: Adaptive step sizes
- Bounded optimization
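Concretely, the two precision rules in dispatcher.py amount to the following, paraphrased as a standalone function (the `method` strings stand in for the InferenceMethod enum):

```python
import numpy as np

def update_precision(precision: float, prediction_error: float, method: str) -> float:
    """Paraphrase of the dispatcher's precision adaptation rules."""
    if method == "variational":
        # Running average: blend the old precision with the inverse error
        return 0.9 * precision + 0.1 / (prediction_error + 1e-8)
    if method == "sampling":
        # Adaptive step size, clipped to fixed bounds
        return float(np.clip(1.0 / (prediction_error + 1e-8), 0.1, 10.0))
    return precision
```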
### Matrix Operations
Utility functions in [[Matrix Operations]]:
- Normalization
- Softmax
- Information metrics
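The dispatcher itself only calls `normalize_rows` and `softmax` from these utilities; plausible reference implementations (assumptions, since the actual matrix_ops module is not part of this commit) are:

```python
import numpy as np

def normalize_rows(x: np.ndarray, eps: float = 1e-12) -> np.ndarray:
    """Scale each row (or a single vector) to sum to one."""
    return x / (x.sum(axis=-1, keepdims=True) + eps)

def softmax(x: np.ndarray) -> np.ndarray:
    """Numerically stable softmax along the last axis."""
    z = x - np.max(x, axis=-1, keepdims=True)
    e = np.exp(z)
    return e / e.sum(axis=-1, keepdims=True)
```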
### GPU Acceleration
[[GPU Support]] preparation:
- Flag in configuration
- Matrix operation optimization
- Batch processing support
## Configuration Examples
### [[Discrete Variational Config]]
```yaml
method: variational
policy_type: discrete
temporal_horizon: 5
custom_params:
  exploration_weight: 0.3
  state_dimensions: [10, 10]
```
### [[Continuous Sampling Config]]
```yaml
method: sampling
policy_type: continuous
num_samples: 2000
custom_params:
  proposal_std: 0.1
  burn_in: 500
```
## Best Practices
### [[Performance Optimization]]
1. Use appropriate number of samples
2. Enable GPU for large state spaces
3. Tune precision updates
### [[Numerical Stability]]
1. Add small constants to denominators
2. Use log probabilities where appropriate
3. Implement bounds checking
### [[Debugging Tips]]
1. Monitor acceptance rates in MCMC
2. Track prediction errors
3. Validate belief normalization
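A tiny illustrative helper for checks 1 and 3; the function name and thresholds are arbitrary:

```python
import numpy as np

def sanity_checks(beliefs: np.ndarray, accepted: int, proposed: int) -> None:
    """Illustrative diagnostics for MCMC acceptance and belief normalization."""
    # Beliefs should remain a valid probability distribution
    assert np.all(beliefs >= 0), "negative belief entries"
    assert np.isclose(beliefs.sum(), 1.0, atol=1e-6), "beliefs not normalized"
    # Very low or very high acceptance rates suggest a poorly scaled proposal_std
    rate = accepted / max(proposed, 1)
    if not 0.1 <= rate <= 0.9:
        print(f"warning: acceptance rate {rate:.2f} outside the typical range")
```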
## Related Topics
- [[Free Energy Principle]]
- [[Active Inference Theory]]
- [[Variational Bayes]]
- [[MCMC Methods]]
- [[Particle Filtering]]
## Future Extensions
### Planned Features
1. [[Hierarchical Policies]]
- Nested action spaces
- Multi-scale temporal horizons
2. [[Advanced Sampling]]
- Hamiltonian Monte Carlo
- Sequential Monte Carlo
3. [[Neural Implementation]]
- Deep active inference
- Learned generative models
## References
1. Friston, K. (2010). [[The Free-Energy Principle]]
2. Da Costa, L., et al. (2020). [[Active Inference Algorithms]]
3. Parr, T., & Friston, K. (2019). [[Discrete Active Inference]]

src/models/active_inference/docs/active_inference_dispatcher.md
View file

@@ -0,0 +1,214 @@
# Active Inference Dispatcher
## Overview
The [[ActiveInferenceDispatcher]] is the core component that manages different implementations of active inference methods. It provides a clean interface for routing operations while handling the complexity of different inference approaches.
## Class Structure
```python
class ActiveInferenceDispatcher:
    def __init__(self, config: InferenceConfig):
        self.config = config
        self._setup_implementations()
        self._initialize_matrices()
```
## Key Components
### 1. Method Dispatch
The dispatcher uses a dictionary-based routing system to map methods to their implementations:
```python
self._implementations = {
    InferenceMethod.VARIATIONAL: {
        'belief_update': self._variational_belief_update,
        'policy_inference': self._variational_policy_inference
    },
    # ... other methods
}
```
See [[Implementation Mapping]] for details.
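A dispatch call then reduces to a dictionary lookup, roughly as follows (sketch only; the real method may add validation and extra keyword handling):

```python
def dispatch_belief_update(self, observation, current_state, **kwargs):
    # Look up the handler registered for the configured inference method
    handler = self._implementations[self.config.method]['belief_update']
    return handler(observation, current_state, **kwargs)
```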
### 2. Configuration
Uses [[InferenceConfig]] for structured configuration:
- Method selection
- Policy type
- Learning parameters
- Custom parameters
### 3. Matrix Operations
Integrates with [[Matrix Operations]] for efficient computations:
- Normalization
- Softmax
- Information metrics
## Core Operations
### Belief Updates
The [[Belief Update Methods]] include:
1. **Variational**
```python
def _variational_belief_update(self, observation, state, **kwargs):
    prediction = np.dot(state.beliefs, generative_matrix)
    prediction_error = observation - prediction
    return state.beliefs + state.precision * prediction_error
```
2. **Sampling**
```python
def _sampling_belief_update(self, observation, state, **kwargs):
    particles = self._initialize_particles(state)
    weights = self._compute_weights(particles, observation)
    return self._resample_particles(particles, weights)
```
See [[Belief Update Implementation]] for more details.
### Policy Inference
[[Policy Inference Methods]]:
1. **Variational**
- Expected free energy minimization
- Softmax policy selection
2. **MCMC**
- Metropolis-Hastings algorithm
- Proposal distribution
- Energy-based acceptance
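The proposal step behind these bullets is a Gaussian random walk over the policy distribution, as in `_propose_policy`; a standalone paraphrase (the epsilon guard and function name are additions):

```python
import numpy as np

def propose_policy(current: np.ndarray, proposal_std: float = 0.1, rng=None) -> np.ndarray:
    """Gaussian random-walk proposal over policy distributions (sketch)."""
    rng = rng or np.random.default_rng()
    proposal = current + rng.normal(0.0, proposal_std, size=current.shape)
    proposal = np.maximum(proposal, 0) + 1e-12   # keep entries non-negative
    return proposal / proposal.sum()             # renormalize to a distribution
```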
## Advanced Features
### 1. Precision Updates
[[Precision Adaptation]] mechanisms:
```python
def update_precision(self, prediction_error: float) -> float:
    if self.config.method == InferenceMethod.VARIATIONAL:
        return self._update_variational_precision(prediction_error)
    elif self.config.method == InferenceMethod.SAMPLING:
        return self._update_sampling_precision(prediction_error)
```
### 2. Free Energy Calculation
[[Free Energy Components]]:
1. Pragmatic value
2. Epistemic value
3. Exploration-exploitation balance
### 3. GPU Support
[[GPU Acceleration]] features:
- Configuration flag
- Matrix operation optimization
- Batch processing
## Usage Examples
### Basic Usage
```python
# Create dispatcher
config = InferenceConfig(method=InferenceMethod.VARIATIONAL, ...)
dispatcher = ActiveInferenceFactory.create(config)
# Update beliefs
new_beliefs = dispatcher.dispatch_belief_update(
    observation=current_observation,
    current_state=model_state
)
# Infer policies
policies = dispatcher.dispatch_policy_inference(
    state=model_state,
    goal_prior=goal_distribution
)
```
See [[Usage Examples]] for more scenarios.
## Configuration
### Variational Configuration
```yaml
method: variational
policy_type: discrete
temporal_horizon: 5
learning_rate: 0.01
precision_init: 1.0
```
### Sampling Configuration
```yaml
method: sampling
policy_type: continuous
num_samples: 2000
custom_params:
  proposal_std: 0.1
```
See [[Configuration Guide]] for details.
## Best Practices
### Performance
[[Performance Guidelines]]:
1. Use appropriate batch sizes
2. Enable GPU for large models
3. Optimize matrix operations
### Numerical Stability
[[Stability Guidelines]]:
1. Use log probabilities
2. Add small constants
3. Check bounds
### Debugging
[[Debugging Strategies]]:
1. Monitor convergence
2. Track prediction errors
3. Validate distributions
## Extension Points
### Adding New Methods
To add a new inference method:
1. Add to [[InferenceMethod]] enum
2. Implement belief update method
3. Implement policy inference method
4. Add to implementation mapping
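For instance, wiring in a hypothetical Kalman-style method would look roughly like this; the `KALMAN` member, handler bodies, string values, and the mean-field member name are illustrative only:

```python
from enum import Enum

class InferenceMethod(Enum):             # 1. extend the existing enum
    VARIATIONAL = "variational"
    SAMPLING = "sampling"
    MEAN_FIELD = "mean_field"
    KALMAN = "kalman"                    # hypothetical new member

def _kalman_belief_update(observation, state, **kwargs):
    ...                                  # 2. belief-update implementation

def _kalman_policy_inference(state, goal_prior=None, **kwargs):
    ...                                  # 3. policy-inference implementation

# 4. register the handlers, mirroring the mapping built in _setup_implementations
implementations = {
    InferenceMethod.KALMAN: {
        'belief_update': _kalman_belief_update,
        'policy_inference': _kalman_policy_inference,
    },
}
```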
### Custom Policies
[[Custom Policy Implementation]]:
1. Extend PolicyType enum
2. Implement policy-specific methods
3. Add configuration support
## Related Components
- [[Active Inference Model]]
- [[Matrix Operations]]
- [[Configuration System]]
- [[Visualization Tools]]
## Future Development
### Planned Features
1. [[Hierarchical Implementation]]
- Nested policies
- Multi-scale inference
2. [[Advanced Methods]]
- Hamiltonian Monte Carlo
- Variational message passing
3. [[Optimization]]
- Parallel processing
- Memory efficiency
## References
1. [[Implementation Architecture]]
2. [[Method Specifications]]
3. [[API Documentation]]