# Scraped page header (not part of the module): Spaces status "Running on Zero"; file size 14,437 bytes; revision 0ccf2f0.
"""
Comprehensive tests for warbler_cda.semantic_anchors module.
Tests the SemanticAnchorGraph with mocked dependencies.
"""
import pytest
from unittest.mock import Mock, patch
import time
class TestSemanticAnchorGraphInitialization:
    """Construction-time behaviour of ``SemanticAnchorGraph``."""

    def test_graph_default_init(self):
        """A graph built with no arguments exposes the expected defaults."""
        from warbler_cda.semantic_anchors import SemanticAnchorGraph

        anchor_graph = SemanticAnchorGraph()

        # Collaborators must be populated even when none are supplied.
        for collaborator in ("embedding_provider", "memory_pool"):
            assert getattr(anchor_graph, collaborator) is not None

        # Both registries start out empty.
        for registry in ("anchors", "clusters"):
            assert getattr(anchor_graph, registry) == {}

        # Default lifecycle tuning values.
        expected_defaults = (
            ("max_age_days", 30),
            ("consolidation_threshold", 0.8),
            ("eviction_heat_threshold", 0.1),
        )
        for setting, expected in expected_defaults:
            assert getattr(anchor_graph, setting) == expected

    def test_graph_custom_config(self):
        """Values passed through ``config`` override the defaults."""
        from warbler_cda.semantic_anchors import SemanticAnchorGraph

        numeric_overrides = {
            "max_age_days": 60,
            "consolidation_threshold": 0.9,
            "eviction_heat_threshold": 0.05,
        }
        anchor_graph = SemanticAnchorGraph(
            config={**numeric_overrides, "enable_memory_pooling": False}
        )

        for setting, expected in numeric_overrides.items():
            assert getattr(anchor_graph, setting) == expected
        # Checked separately: identity with False, not mere falsiness.
        assert anchor_graph.enable_memory_pooling is False

    def test_graph_custom_embedding_provider(self):
        """An injected embedding provider is stored on the graph."""
        from warbler_cda.semantic_anchors import SemanticAnchorGraph

        injected_provider = Mock()
        anchor_graph = SemanticAnchorGraph(embedding_provider=injected_provider)
        assert anchor_graph.embedding_provider == injected_provider
class TestCreateOrUpdateAnchor:
    """Tests for ``SemanticAnchorGraph.create_or_update_anchor``."""

    def test_create_new_anchor(self):
        """A first call on an empty graph registers a new anchor."""
        from warbler_cda.semantic_anchors import SemanticAnchorGraph

        graph = SemanticAnchorGraph()
        anchor_id = graph.create_or_update_anchor(
            concept_text="test concept",
            utterance_id="u1",
            context={"source": "test"},
        )

        assert anchor_id in graph.anchors
        assert graph.anchors[anchor_id].concept_text == "test concept"
        assert graph.metrics["total_anchors_created"] == 1

    def test_update_existing_anchor(self):
        """Re-submitting the same concept updates the existing anchor."""
        from warbler_cda.semantic_anchors import SemanticAnchorGraph

        graph = SemanticAnchorGraph(config={"consolidation_threshold": 0.7})

        # Create first anchor
        anchor_id1 = graph.create_or_update_anchor(
            concept_text="test concept",
            utterance_id="u1",
            context={},
        )
        initial_updates = graph.metrics["total_updates"]

        # Identical text from a second utterance should hit the same anchor
        anchor_id2 = graph.create_or_update_anchor(
            concept_text="test concept",  # Same text
            utterance_id="u2",
            context={},
        )

        # Should be same anchor, with the update recorded in both places
        assert anchor_id1 == anchor_id2
        assert graph.metrics["total_updates"] == initial_updates + 1
        assert graph.anchors[anchor_id1].provenance.update_count >= 2

    def test_create_anchor_with_privacy_hooks(self):
        """Configured privacy hooks are invoked once and the anchor is stored."""
        from warbler_cda.semantic_anchors import SemanticAnchorGraph

        mock_privacy = Mock()
        mock_privacy.scrub_content_for_anchor_injection.return_value = (
            "scrubbed content",
            {"privacy_hook_applied": True},
        )
        mock_privacy.validate_privacy_compliance.return_value = (True, [])

        graph = SemanticAnchorGraph(privacy_hooks=mock_privacy)
        anchor_id = graph.create_or_update_anchor(
            concept_text="sensitive data",
            utterance_id="u1",
            context={},
        )

        # Should have called privacy hooks exactly once each
        mock_privacy.scrub_content_for_anchor_injection.assert_called_once()
        mock_privacy.validate_privacy_compliance.assert_called_once()
        # The returned id used to be discarded; verify that a compliant
        # submission still ends up registered in the graph.
        assert anchor_id in graph.anchors
class TestGetSemanticClusters:
    """Exercise ``SemanticAnchorGraph.get_semantic_clusters``."""

    def test_get_clusters_empty_graph(self):
        """With no anchors at all, the cluster list is empty."""
        from warbler_cda.semantic_anchors import SemanticAnchorGraph

        assert SemanticAnchorGraph().get_semantic_clusters() == []

    def test_get_clusters_single_anchor(self):
        """One anchor alone does not produce any cluster."""
        from warbler_cda.semantic_anchors import SemanticAnchorGraph

        anchor_graph = SemanticAnchorGraph()
        anchor_graph.create_or_update_anchor("concept1", "u1", {})
        assert anchor_graph.get_semantic_clusters() == []

    def test_get_clusters_similar_anchors(self):
        """Clustering a graph with several anchors returns a list."""
        from warbler_cda.semantic_anchors import SemanticAnchorGraph

        anchor_graph = SemanticAnchorGraph(config={"consolidation_threshold": 0.5})

        concepts = ("jumping", "leaping", "completely different topic")
        for position, concept in enumerate(concepts, start=1):
            if position > 1:
                # Short pause between creations, kept from the original test
                # (presumably so consecutive anchors get distinct timestamps).
                time.sleep(0.01)
            anchor_graph.create_or_update_anchor(concept, f"u{position}", {})

        found = anchor_graph.get_semantic_clusters(max_clusters=5)

        # Only the return type is checked here; which anchors get grouped
        # depends on the embedding provider in use.
        assert isinstance(found, list)
class TestGetAnchorDiff:
    """Exercise ``SemanticAnchorGraph.get_anchor_diff``."""

    def test_get_diff_no_changes(self):
        """A cutoff in the future yields no added or updated anchors."""
        from warbler_cda.semantic_anchors import SemanticAnchorGraph

        anchor_graph = SemanticAnchorGraph()
        anchor_graph.create_or_update_anchor("concept", "u1", {})

        # Query from the future: nothing can have changed after this point.
        future_cutoff = time.time() + 1000
        changes = anchor_graph.get_anchor_diff(since_timestamp=future_cutoff)

        for bucket in ("added", "updated"):
            assert len(changes[bucket]) == 0

    def test_get_diff_added_anchors(self):
        """Anchors created after the cutoff are reported as added."""
        from warbler_cda.semantic_anchors import SemanticAnchorGraph

        # High threshold so the two concepts are not consolidated into one.
        anchor_graph = SemanticAnchorGraph(config={"consolidation_threshold": 0.95})
        cutoff = time.time() - 100

        submissions = (
            ("concept1", "u1"),
            ("completely different concept2", "u2"),  # clearly different text
        )
        for concept, utterance in submissions:
            anchor_graph.create_or_update_anchor(concept, utterance, {})

        changes = anchor_graph.get_anchor_diff(since_timestamp=cutoff)
        assert len(changes["added"]) == 2
        assert changes["total_anchors"] == 2
class TestApplyLifecyclePolicies:
    """Tests for ``SemanticAnchorGraph.apply_lifecycle_policies``."""

    def test_lifecycle_aging(self):
        """Every anchor in the graph is counted as aged."""
        from warbler_cda.semantic_anchors import SemanticAnchorGraph

        graph = SemanticAnchorGraph()
        graph.create_or_update_anchor("concept", "u1", {})

        actions = graph.apply_lifecycle_policies()
        assert actions["aged"] == 1

    def test_lifecycle_eviction_low_heat(self):
        """An anchor whose heat is below the threshold is evicted."""
        from warbler_cda.semantic_anchors import SemanticAnchorGraph

        graph = SemanticAnchorGraph(config={"eviction_heat_threshold": 0.5})
        anchor_id = graph.create_or_update_anchor("concept", "u1", {})

        # Manually set heat below the configured 0.5 threshold
        graph.anchors[anchor_id].heat = 0.1

        actions = graph.apply_lifecycle_policies()
        assert actions["evicted"] == 1
        assert anchor_id not in graph.anchors

    def test_lifecycle_eviction_old_age(self):
        """An anchor older than ``max_age_days`` is evicted."""
        from warbler_cda.semantic_anchors import SemanticAnchorGraph

        graph = SemanticAnchorGraph(config={"max_age_days": 1})
        anchor_id = graph.create_or_update_anchor("concept", "u1", {})

        # Manually set old timestamp (40 days ago), well past the 1-day limit
        old_time = time.time() - (40 * 24 * 3600)
        graph.anchors[anchor_id].provenance.first_seen = old_time

        actions = graph.apply_lifecycle_policies()
        assert actions["evicted"] >= 1
        # Same post-condition the low-heat test checks: the evicted anchor
        # must no longer be present in the graph.
        assert anchor_id not in graph.anchors
class TestGetStabilityMetrics:
    """Exercise ``SemanticAnchorGraph.get_stability_metrics``."""

    def test_stability_metrics_empty_graph(self):
        """An empty graph reports zero anchors, zero age and a score of 1.0."""
        from warbler_cda.semantic_anchors import SemanticAnchorGraph

        report = SemanticAnchorGraph().get_stability_metrics()

        assert report["total_anchors"] == 0
        assert report["average_age_days"] == 0
        assert report["stability_score"] == 1.0

    def test_stability_metrics_with_anchors(self):
        """A populated graph reports counts, heat, a bounded score and provider info."""
        from warbler_cda.semantic_anchors import SemanticAnchorGraph

        # High threshold keeps the two concepts as separate anchors.
        anchor_graph = SemanticAnchorGraph(config={"consolidation_threshold": 0.95})
        anchor_graph.create_or_update_anchor("first concept", "u1", {})
        anchor_graph.create_or_update_anchor("very different second concept", "u2", {})

        report = anchor_graph.get_stability_metrics()

        assert report["total_anchors"] == 2
        assert report["average_heat"] > 0
        score = report["stability_score"]
        assert 0 <= score <= 1.0
        assert "provider_info" in report
class TestPrivacyIntegration:
    """Privacy-hook wiring of ``SemanticAnchorGraph.get_privacy_metrics``."""

    def test_get_privacy_metrics_no_hooks(self):
        """Without hooks, the metrics flag privacy hooks as disabled."""
        from warbler_cda.semantic_anchors import SemanticAnchorGraph

        report = SemanticAnchorGraph().get_privacy_metrics()
        assert report["privacy_hooks_enabled"] is False

    def test_get_privacy_metrics_with_hooks(self):
        """With hooks, the hook's metrics are surfaced and queried once."""
        from warbler_cda.semantic_anchors import SemanticAnchorGraph

        # Configure the stubbed return value directly at construction time.
        hooks = Mock(
            **{
                "get_privacy_metrics.return_value": {
                    "pii_detections": 5,
                    "scrubbing_applied": 3,
                }
            }
        )
        anchor_graph = SemanticAnchorGraph(privacy_hooks=hooks)

        report = anchor_graph.get_privacy_metrics()

        assert report["pii_detections"] == 5
        hooks.get_privacy_metrics.assert_called_once()
class TestHelperMethods:
    """Exercise the private helpers of ``SemanticAnchorGraph``."""

    def test_generate_anchor_id(self):
        """Two generated ids differ and both carry the ``anchor_`` prefix."""
        from warbler_cda.semantic_anchors import SemanticAnchorGraph

        anchor_graph = SemanticAnchorGraph()
        first = anchor_graph._generate_anchor_id("concept1")
        time.sleep(0.01)  # pause between the two generations, as in the original
        second = anchor_graph._generate_anchor_id("concept2")

        assert first != second
        for generated in (first, second):
            assert generated.startswith("anchor_")

    def test_calculate_drift(self):
        """Drift is near zero for equal vectors and large for orthogonal ones."""
        from warbler_cda.semantic_anchors import SemanticAnchorGraph

        anchor_graph = SemanticAnchorGraph()
        unit_x = [1.0, 0.0, 0.0]

        # Identical embeddings: essentially no drift.
        same_direction = anchor_graph._calculate_drift(unit_x, [1.0, 0.0, 0.0])
        assert same_direction < 0.01

        # Orthogonal embeddings: noticeably higher drift.
        orthogonal = anchor_graph._calculate_drift(unit_x, [0.0, 1.0, 0.0])
        assert orthogonal > 0.5

    def test_find_similar_anchor_none(self):
        """On an empty graph there is nothing to match, so ``None`` comes back."""
        from warbler_cda.semantic_anchors import SemanticAnchorGraph

        assert SemanticAnchorGraph()._find_similar_anchor([0.1, 0.2, 0.3]) is None

    def test_find_similar_anchor_match(self):
        """Looking up an anchor's own embedding returns that anchor's id."""
        from warbler_cda.semantic_anchors import SemanticAnchorGraph

        anchor_graph = SemanticAnchorGraph(config={"consolidation_threshold": 0.7})
        created_id = anchor_graph.create_or_update_anchor("test", "u1", {})

        # Feed the stored embedding straight back into the lookup.
        stored_embedding = anchor_graph.anchors[created_id].embedding
        assert anchor_graph._find_similar_anchor(stored_embedding) == created_id
class TestIntegration:
    """Integration tests for complete anchor lifecycle."""

    def test_full_anchor_lifecycle(self):
        """Walk one anchor through create, update, aging and eviction."""
        from warbler_cda.semantic_anchors import SemanticAnchorGraph

        graph = SemanticAnchorGraph(config={
            "max_age_days": 1,
            "eviction_heat_threshold": 0.05,
        })

        # Create anchor
        anchor_id = graph.create_or_update_anchor("concept", "u1", {})
        assert anchor_id in graph.anchors

        # Update anchor by re-submitting the same concept text
        graph.create_or_update_anchor("concept", "u2", {})
        assert graph.anchors[anchor_id].provenance.update_count >= 2

        # Age anchor (set first_seen to 10 days ago, beyond the 1-day limit)
        graph.anchors[anchor_id].provenance.first_seen = time.time() - (10 * 24 * 3600)

        # Apply lifecycle
        actions = graph.apply_lifecycle_policies()

        # Should be evicted due to age, and actually gone from the graph
        assert actions["evicted"] >= 1
        assert anchor_id not in graph.anchors

    def test_stability_metrics_workflow(self):
        """Stability metrics reflect a graph populated with distinct concepts."""
        from warbler_cda.semantic_anchors import SemanticAnchorGraph

        # High threshold so distinct concepts are not consolidated
        graph = SemanticAnchorGraph(config={"consolidation_threshold": 0.95})

        # Create multiple distinct anchors
        distinct_concepts = [
            "quantum physics fundamentals",
            "machine learning algorithms",
            "ancient Greek philosophy",
            "modern art techniques",
            "sustainable agriculture",
        ]
        for i, concept in enumerate(distinct_concepts):
            graph.create_or_update_anchor(concept, f"u{i}", {})

        # Get metrics
        metrics = graph.get_stability_metrics()

        # One anchor per submitted concept; derived from the list so the
        # expectation cannot drift from the fixture.
        assert metrics["total_anchors"] == len(distinct_concepts)
        assert metrics["average_heat"] > 0
        assert "provider_info" in metrics
        assert "memory_pool_metrics" in metrics
|