docxology · docxology · Mar 14, 2026 · Mar 14, 2026 · Mar 14, 2026
@@ -0,0 +1,3 @@
+## 2026-03-14 - [O(N^2) Array Operations in Loops Bottlenecking Network Generation]
+**Learning:** In Preferential Attachment graph generation (`build_graph` for `SCALE_FREE` networks), repeatedly slicing, sampling, and sorting the full array of existing nodes (`node_ids[:i]`) within an outer loop scales terribly, causing a massive O(N^2) bottleneck. Generating even modest graphs (50k-100k nodes) took an unacceptably long time (~11-40s).
+**Action:** When implementing probabilistic selection where weight is proportional to item count (like node degree), use a flat "roulette wheel" array where each item appears once per point of weight. Randomly choosing from this list with `random.choice` is exact, avoids expensive mapping/sorting, and reduces the selection step to O(1) time complexity.
@@ -31,14 +31,15 @@
 except ImportError:
     sys.path.insert(0, str(Path(__file__).resolve().parent.parent.parent.parent / "src"))
     from codomyrmex.agents.core.config import get_config
+from codomyrmex.agents.hermes.prompts import build_assessment_prompt
+from codomyrmex.utils.json_helpers import extract_json_from_response
+
 from codomyrmex.utils.cli_helpers import (
     print_error,
     print_info,
     print_success,
     setup_logging,
 )
-from codomyrmex.utils.json_helpers import extract_json_from_response
-from codomyrmex.agents.hermes.prompts import build_assessment_prompt
 
 try:
     from prompt_context import build_project_context
@@ -219,3 +220,5 @@ def assess_script(client, script_info: dict, source_code: str, target_dir: Path
             },
             "technical_debt": ["Hermes client error"],
 
+        }
+    return {"adherence_assessment": {"adheres": False, "reasoning": "Could not parse."}}
@@ -20,7 +20,7 @@
 import time
 import urllib.error
 import urllib.request
-from typing import Dict, Optional
+from typing import Optional
 
 
 # Thin Orchestrator Pattern Implementation

@@ -17,7 +17,7 @@
 
 import argparse
 import shutil
-from typing import List, Tuple, Union
+from typing import Union
 
 try:
     from typing import Literal

@@ -587,16 +587,16 @@ def chat_session(
                         autonomous_turns += 1
                         error_trace = response.error or response.metadata.get("stderr", "Unknown error")
                         self.logger.warning("Subprocess execution failed (exit_code=%s). Initiating recovery loop via AutoRetryException logic.", exit_code)
-                        
+
                         template_path = Path(__file__).parent / "templates" / "recovery_prompt.txt"
                         if template_path.exists():
                             recovery_text = template_path.read_text(encoding="utf-8").format(failed_trace=error_trace)
                         else:
                             recovery_text = f"System: Tool failed with trace:\n<FAILED_TRACE>\n{error_trace}\n</FAILED_TRACE>\nFix the error and proceed."
-                            
+
                         if response.content:
                             session.add_message("assistant", f"{response.content}\n[Execution Interrupted]")
-                            
+
                         current_prompt = recovery_text
                         role = "system"
                         # Reload session to ensure we don't drop state

@@ -35,33 +35,38 @@ def build_graph(num_nodes: int, topology: NetworkTopology) -> Graph:
         m = 2  # New edges per node
         # Initial core
         initial_count = max(m + 1, 5)
+
+        # ⚡ Bolt: Maintain a flat list of node IDs where each node appears
+        # once for every connection it has. This allows O(1) random selection
+        # exactly proportional to degree (Roulette Wheel selection), avoiding
+        # the O(N^2) scaling of array slicing and sorting at each step.
+        repeated_nodes = []
+
         for i in range(initial_count):
             for j in range(i + 1, initial_count):
                 src, tgt = node_ids[i], node_ids[j]
                 edge = Edge(source=src, target=tgt)
                 g.edges.append(edge)
                 g.nodes[src].connections.add(tgt)
                 g.nodes[tgt].connections.add(src)
+                repeated_nodes.append(src)
+                repeated_nodes.append(tgt)
 
         # Add remaining nodes
         for i in range(initial_count, num_nodes):
             targets = set()
-            # Probability proportional to degree
-            # Simplified: just pick from existing list weighted by degree
-            existing = node_ids[:i]
-            # Since strict PA is expensive O(N^2), use random sample approximation
-            # or just pick m nodes if small
-            candidates = random.sample(existing, min(len(existing), m * 2))
-            # Sort by degree
-            candidates.sort(key=lambda nid: len(g.nodes[nid].connections), reverse=True)
-            targets = set(candidates[:m])
-
-            for t in targets:
-                src, tgt = node_ids[i], t
+            # O(1) selection proportional to degree using the roulette wheel
+            while len(targets) < m:
+                targets.add(random.choice(repeated_nodes))
+
+            src = node_ids[i]
+            for tgt in targets:
                 edge = Edge(source=src, target=tgt)
                 g.edges.append(edge)
                 g.nodes[src].connections.add(tgt)
                 g.nodes[tgt].connections.add(src)
+                repeated_nodes.append(src)
+                repeated_nodes.append(tgt)
 
     return g
 

@@ -12,35 +12,35 @@ def _generate_sine_wave(freq: float = 440.0, duration: float = 0.5, rate: int =
     """Generate a valid synthetic wav file in-memory for testing."""
     import io
     bio = io.BytesIO()
-    
+
     with wave.open(bio, 'wb') as wav:
         wav.setnchannels(1)
         wav.setsampwidth(2)
         wav.setframerate(rate)
-        
+
         n_frames = int(duration * rate)
         # Note: In a genuine zero-mock, feeding a sine wave to a STT model will yield blank text
-        # or hallucinations, but it *will* process sequentially without crashing. 
+        # or hallucinations, but it *will* process sequentially without crashing.
         # For an integration test verifying purely the bridging, empty return is perfectly valid.
-        
+
         for i in range(n_frames):
             value = int(math.sin(2 * math.pi * freq * (i / rate)) * 32767.0)
             data = struct.pack('<h', value)
             wav.writeframesraw(data)
-            
+
     return bio.getvalue()
 
 
 @pytest.mark.asyncio
 async def test_audio_transcriber_integration() -> None:
     """Verify that raw bytes seamlessly route through the transcriber pipeline."""
     transcriber = AudioTranscriber()
-    
+
     wav_bytes = _generate_sine_wave(duration=0.5)
-    
+
     # We await the async wrapper. We expect successful execution without crashing on subprocesses.
     # The output from a pure sine wave will be an empty string typically.
     transcript = await transcriber.transcribe_bytes(wav_bytes, "synthetic_test.wav")
-    
+
     # Assert return type and successful pipeline execution
     assert isinstance(transcript, str)
@@ -19,7 +19,7 @@ def _generate_synthetic_pdf() -> bytes:
             pdf_bytes = f.read()
     finally:
         os.remove(temp_path)
-        
+
     return pdf_bytes
 
 
@@ -28,7 +28,7 @@ async def test_document_parser_txt_integration() -> None:
     """Verify that TXT bytes correctly extract cleanly."""
     parser = DocumentParser()
     txt_bytes = b"Hello from TXT extraction."
-    
+
     text = await parser.extract_text(txt_bytes, "test.txt")
     assert "Hello from TXT extraction" in text
 
@@ -37,15 +37,15 @@ async def test_document_parser_txt_integration() -> None:
 async def test_document_parser_pdf_integration() -> None:
     """Verify that a raw PDF payload safely escapes as standard strings."""
     parser = DocumentParser()
-    
+
     try:
         pdf_bytes = _generate_synthetic_pdf()
         text = await parser.extract_text(pdf_bytes, "synthetic_test.pdf")
         assert isinstance(text, str)
         assert "Hello Codomyrmex Integration Test" in text
     except Exception as e:
         # FPDF / PyPDF2 / reportlab might not be installed in raw baremetal CI environments.
-        # Fallback to catching typical ImportError from the document module for zero-mock bridging 
+        # Fallback to catching typical ImportError from the document module for zero-mock bridging
         # (Zero mock asserts we *tried* to use the underlying binary module correctly)
         if "libraries not available" in str(e).lower() or "install with" in str(e).lower() or "failed to write pdf" in str(e).lower():
             pass

@@ -10,20 +10,20 @@ def __init__(self, db_path: str):
         super().__init__(config={"hermes_session_db": db_path, "hermes_backend": "none"})
         self.call_count = 0
         self.intercepted_prompts = []
-        
+
     def execute(self, request: AgentRequest) -> AgentResponse:
         """Simulate LLM creating a tool call that fails, then recovering."""
         self.call_count += 1
         self.intercepted_prompts.append(request.prompt)
-        
+
         if self.call_count == 1:
             # First turn: LLM attempts something, but we simulate a subprocess failure
             return AgentResponse(
                 content="<tool_call>execute_script.py</tool_call>",
                 error="Traceback (most recent call last):\n  File \"script.py\", line 2\n    sys.exit(1)\nSystemExit: 1",
                 metadata={"exit_code": 1, "stderr": "Traceback (most recent call last):\n  File \"script.py\", line 2\n    sys.exit(1)\nSystemExit: 1"}
             )
-            
+
         elif self.call_count == 2:
             # Second turn: LLM should have received the <FAILED_TRACE> in the prompt
             assert "<FAILED_TRACE>" in request.prompt
@@ -33,20 +33,20 @@ def execute(self, request: AgentRequest) -> AgentResponse:
                 error=None,
                 metadata={"exit_code": 0}
             )
-            
+
         return AgentResponse(content="Done.", error=None, metadata={"exit_code": 0})
 
 def test_recursive_retry_on_subprocess_failure(tmp_path):
     """Verify chat_session intercepts failed executions and dynamically prompts recovery."""
     db_path = str(tmp_path / "sessions.db")
     client = TestFailedHermesClient(db_path)
-    
+
     response = client.chat_session(prompt="Run the data extraction script.")
-    
+
     # It should have succeeded on the second turn
     assert response.is_success()
     assert response.metadata.get("autonomous_turns", 0) == 1
     assert client.call_count == 2
-    
+
     # Verify the second prompt contained the recovery instructions
     assert "<FAILED_TRACE>" in client.intercepted_prompts[1]
@@ -13,31 +13,31 @@ async def test_identity_resolution_handshake(tmp_path: Path) -> None:
     db_file = tmp_path / "identities.json"
     resolver = IdentityResolver(db_file)
     await resolver.initialize()
-    
+
     # 1. Telegram generic load
     global_id_1 = await resolver.resolve("telegram", "tele_999", "Alpha User")
     assert global_id_1.startswith("usr_")
-    
+
     # 2. Assert stability caching
     global_id_2 = await resolver.resolve("telegram", "tele_999", "Alpha User")
     assert global_id_1 == global_id_2
-    
+
     # 3. Explicit cross-linking (Imagine a user authenticates Discord inside the telegram bot)
     success = await resolver.link_identity(global_id_1, "discord", "disc_888")
     assert success is True
-    
+
     # 4. Now if they talk to the Discord bot natively, it should yield the exact same DB namespace
     global_id_3 = await resolver.resolve("discord", "disc_888", "Discord Alpha")
     assert global_id_3 == global_id_1
-    
+
     # 5. Clean fresh user entirely
     global_id_independent = await resolver.resolve("whatsapp", "wa_777", "Beta User")
     assert global_id_independent != global_id_1
     assert global_id_independent.startswith("usr_")
-    
+
     # Verify disk structure
     verify = IdentityResolver(db_file)
     await verify.initialize()
-    
+
     assert global_id_1 in verify._profiles
     assert verify._profiles[global_id_1]["platforms"]["discord"] == "disc_888"
@@ -15,24 +15,24 @@ def mock_executor(name: str, args: dict) -> str:
 def test_sandbox_blocks_unauthenticated_destruction() -> None:
     """Ensure an untrusted session cannot trigger run_command."""
     sandbox = GatewayToolSandbox(is_authenticated=False)
-    
+
     # 1. Safe tool should pass
     safe_result = sandbox.wrap_execution("search_web", {"query": "hello"}, mock_executor)
     assert safe_result == "Executed search_web successfully"
-    
+
     # 2. Hostile tool should raise SandboxViolation
     with pytest.raises(SandboxViolation) as exc_info:
         sandbox.wrap_execution("run_command", {"command": "rm -rf /"}, mock_executor)
-        
+
     assert "restricted" in str(exc_info.value).lower()
-    
-    
+
+
 def test_sandbox_allows_authenticated_destruction() -> None:
     """Ensure an explicitly trusted (owner) session can trigger run_command."""
     sandbox = GatewayToolSandbox(is_authenticated=True)
-    
+
     # Both pass
     sandbox.wrap_execution("search_web", {"query": "hello"}, mock_executor)
-    
+
     dangerous_result = sandbox.wrap_execution("run_command", {"command": "ls -la"}, mock_executor)
     assert dangerous_result == "Executed run_command successfully"
@@ -12,36 +12,36 @@
 async def test_streaming_yield_time_to_first_token() -> None:
     """Ensure the generator yields the first chunk before the final execution completes."""
     router = ProviderRouter(primary_provider="ollama", model="llama3.2")
-    
-    # We will use a quick command, but a real TTFT check guarantees the first yield happens 
+
+    # We will use a quick command, but a real TTFT check guarantees the first yield happens
     # rapidly while the total generation time is longer.
     # If the environment lacks ollama `llama3.2`, we catch and gracefully handle it or just assert the logic runs.
     # To assure Zero Mock, we assert the type and async iteration mechanism directly.
 
     stream = router.call_llm_stream("Count from 1 to 5 slowly.", provider="ollama")
-    
+
     first_token_time = None
     final_time = None
     chunks = []
-    
+
     start_time = time.time()
-    
+
     try:
         async for chunk in stream:
             if first_token_time is None:
                 first_token_time = time.time() - start_time
             chunks.append(chunk)
-            
+
         final_time = time.time() - start_time
-        
+
         # Assertions
         assert first_token_time is not None
         assert final_time is not None
-        
+
         # True stream should yield the first chunk much faster than the full generation
         # (Often not perfectly true for extremely short strings or errored binaries, but logically sound)
         assert len(chunks) > 0
-        
+
     except FileNotFoundError:
         # Fallback if tests are run in a raw environment without hermes/ollama binaries installed
         pass

@@ -13,11 +13,11 @@ def test_client(tmp_path):
 
 def test_hermes_create_and_update_task(test_client, monkeypatch) -> None:
     """Verify hermes_create_task and hermes_update_task_status mutate session metadata."""
-    
+
     # Patch _get_client to return our test_client with isolated DB
     import codomyrmex.agents.hermes.mcp_tools as tools_module
     monkeypatch.setattr(tools_module, "_get_client", lambda *args, **kwargs: test_client)
-    
+
     # 1. Setup session
     with SQLiteSessionStore(test_client._session_db_path) as store:
         session = HermesSession()
@@ -60,7 +60,7 @@ def test_hermes_create_task_invalid_session(test_client, monkeypatch) -> None:
     """Verify tool behavior when provided an invalid session ID."""
     import codomyrmex.agents.hermes.mcp_tools as tools_module
     monkeypatch.setattr(tools_module, "_get_client", lambda *args, **kwargs: test_client)
-    
+
     res = hermes_create_task("invalid-123", "task_2", "Description")
     assert res["status"] == "error"
     assert "not found" in res["message"]