Skip to content

Commit ece2ea6

Browse files
committed
fix(memory): address 28 review findings from 13 agents and 2 external reviewers
Source fixes: - Use NotBlankStr | None for DualModeConfig.summarization_model (#1) - Parallelize LLM calls with asyncio.TaskGroup in summarize_batch and _build_content (#2) - Remove dead-code guards in _build_anchors (#3) - Narrow except Exception to re-raise non-retryable ProviderErrors (#4) - Fix double-logging on abstractive fallback (#9) - Remove unnecessary import builtins (#10) - Preserve key-value pairs verbatim in extractive mode (#5) - Emit extracted facts one per line (#6) - Strengthen ConsolidationResult validator with cross-field checks (#7) - Check _backend.delete() return value in _process_group (#8) - Fix mode_map type to dict[NotBlankStr, ArchivalMode] (#11) - Move tie-breaking comment to _determine_group_mode (#12) - Fix misleading DualModeConfig docstring (#13) - Add missing mkdocstrings entries for retention/archival/simple_strategy (#14) - Use O(M) lookup dict in _archive_entries (#15) - Document 1000-entry query limit in run_consolidation docstring (#16) - Add Raises section to AbstractiveSummarizer docstring (#17) Test fixes: - Fix imports in test_density.py to module level (#18) - Strengthen fallback assertion to verify exact content (#19) - Use exact call counts for summarizer/extractor (#20) - Add tests: blank model rejection, MemoryError/RecursionError propagation (#21, #22) - Add tests: validator rejects invalid archival state (#23) - Add tests: 50/50 tie-breaking, None relevance handling (#24, #25) - Assert actual preserved facts in extractive tests (#26) - Prove archival index keyed by original_id not position (#27) - Add test: empty string classifies as SPARSE (#28)
1 parent 1830b89 commit ece2ea6

14 files changed

Lines changed: 334 additions & 75 deletions

File tree

docs/api/memory.md

Lines changed: 6 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -77,6 +77,12 @@ Persistent agent memory — protocol, retrieval pipeline, shared org memory, con
7777

7878
::: synthorg.memory.consolidation.service
7979

80+
::: synthorg.memory.consolidation.retention
81+
82+
::: synthorg.memory.consolidation.archival
83+
84+
::: synthorg.memory.consolidation.simple_strategy
85+
8086
::: synthorg.memory.consolidation.density
8187

8288
::: synthorg.memory.consolidation.extractive

src/synthorg/memory/consolidation/abstractive.py

Lines changed: 43 additions & 17 deletions
Original file line numberDiff line numberDiff line change
@@ -5,7 +5,7 @@
55
if the LLM call fails.
66
"""
77

8-
import builtins
8+
import asyncio
99

1010
from synthorg.core.types import NotBlankStr # noqa: TC001
1111
from synthorg.memory.models import MemoryEntry # noqa: TC001
@@ -15,6 +15,7 @@
1515
DUAL_MODE_ABSTRACTIVE_SUMMARY,
1616
)
1717
from synthorg.providers.enums import MessageRole
18+
from synthorg.providers.errors import ProviderError
1819
from synthorg.providers.models import ChatMessage, CompletionConfig
1920
from synthorg.providers.protocol import CompletionProvider # noqa: TC001
2021

@@ -41,20 +42,23 @@ class AbstractiveSummarizer:
4142
4243
Uses a ``CompletionProvider`` to generate concise summaries of
4344
conversational/narrative memory content. Falls back to truncation
44-
if the LLM call fails.
45+
if the LLM call fails with a retryable error.
4546
4647
Args:
4748
provider: Completion provider for LLM calls.
4849
model: Model identifier to use for summarization.
4950
max_summary_tokens: Maximum tokens for the summary response.
5051
temperature: Sampling temperature for summarization.
52+
53+
Raises:
54+
ValueError: If ``model`` is empty or whitespace-only.
5155
"""
5256

5357
def __init__(
5458
self,
5559
*,
5660
provider: CompletionProvider,
57-
model: str,
61+
model: NotBlankStr,
5862
max_summary_tokens: int = 200,
5963
temperature: float = 0.3,
6064
) -> None:
@@ -71,8 +75,9 @@ def __init__(
7175
async def summarize(self, content: str) -> str:
7276
"""Generate an abstractive summary of the given content.
7377
74-
Falls back to truncation if the LLM call fails or returns
75-
empty content.
78+
Falls back to truncation if the LLM call fails with a
79+
retryable error or returns empty content. Non-retryable
80+
provider errors (authentication, invalid model) propagate.
7681
7782
Args:
7883
content: The sparse/conversational text to summarize.
@@ -98,42 +103,63 @@ async def summarize(self, content: str) -> str:
98103
model=self._model,
99104
)
100105
return response.content.strip()
101-
except (builtins.MemoryError, RecursionError):
106+
except (MemoryError, RecursionError):
102107
raise
108+
except ProviderError as exc:
109+
if not exc.is_retryable:
110+
raise
111+
logger.warning(
112+
DUAL_MODE_ABSTRACTIVE_FALLBACK,
113+
content_length=len(content),
114+
error=str(exc),
115+
error_type=type(exc).__name__,
116+
)
117+
return _truncate_fallback(content)
103118
except Exception as exc:
104119
logger.warning(
105120
DUAL_MODE_ABSTRACTIVE_FALLBACK,
106121
content_length=len(content),
107122
error=str(exc),
108123
error_type=type(exc).__name__,
109124
)
125+
return _truncate_fallback(content)
110126

111-
# Fallback: truncation
127+
# Fallback: empty/whitespace-only LLM response
112128
logger.debug(
113129
DUAL_MODE_ABSTRACTIVE_FALLBACK,
114130
content_length=len(content),
115-
reason="empty_or_failed",
131+
reason="empty_response",
116132
)
117133
return _truncate_fallback(content)
118134

119135
async def summarize_batch(
120136
self,
121137
entries: tuple[MemoryEntry, ...],
122138
) -> tuple[tuple[NotBlankStr, str], ...]:
123-
"""Summarize multiple entries.
139+
"""Summarize multiple entries concurrently.
124140
125-
Each entry is summarized independently. Failures for
126-
individual entries fall back to truncation without aborting
127-
the batch.
141+
Each entry is summarized independently via ``asyncio.TaskGroup``.
142+
Failures for individual entries fall back to truncation without
143+
aborting the batch.
128144
129145
Args:
130146
entries: Memory entries to summarize.
131147
132148
Returns:
133149
Tuple of ``(entry_id, summary)`` pairs in input order.
134150
"""
135-
results: list[tuple[NotBlankStr, str]] = []
136-
for entry in entries:
137-
summary = await self.summarize(entry.content)
138-
results.append((entry.id, summary))
139-
return tuple(results)
151+
if not entries:
152+
return ()
153+
154+
results: dict[NotBlankStr, str] = {}
155+
async with asyncio.TaskGroup() as tg:
156+
tasks: dict[NotBlankStr, asyncio.Task[str]] = {}
157+
for entry in entries:
158+
tasks[entry.id] = tg.create_task(
159+
self.summarize(entry.content),
160+
)
161+
162+
for entry_id, task in tasks.items():
163+
results[entry_id] = task.result()
164+
165+
return tuple((entry.id, results[entry.id]) for entry in entries)

src/synthorg/memory/consolidation/config.py

Lines changed: 5 additions & 4 deletions
Original file line numberDiff line numberDiff line change
@@ -9,6 +9,7 @@
99
from pydantic import BaseModel, ConfigDict, Field, model_validator
1010

1111
from synthorg.core.enums import ConsolidationInterval
12+
from synthorg.core.types import NotBlankStr # noqa: TC001
1213
from synthorg.memory.consolidation.models import RetentionRule # noqa: TC001
1314

1415

@@ -57,7 +58,7 @@ class DualModeConfig(BaseModel):
5758
5859
Attributes:
5960
enabled: Whether dual-mode density classification is active.
60-
When ``False``, all entries use abstractive mode.
61+
When ``False``, the dual-mode strategy is not used.
6162
dense_threshold: Density score threshold for DENSE classification
6263
(0.0 = classify everything as dense, 1.0 = everything sparse).
6364
summarization_model: Model ID for abstractive summarization.
@@ -80,8 +81,8 @@ class DualModeConfig(BaseModel):
8081
le=1.0,
8182
description="Density score threshold for DENSE classification",
8283
)
83-
summarization_model: str = Field(
84-
default="",
84+
summarization_model: NotBlankStr | None = Field(
85+
default=None,
8586
description="Model ID for abstractive summarization",
8687
)
8788
max_summary_tokens: int = Field(
@@ -106,7 +107,7 @@ class DualModeConfig(BaseModel):
106107
@model_validator(mode="after")
107108
def _validate_model_when_enabled(self) -> Self:
108109
"""Require a summarization model when dual-mode is enabled."""
109-
if self.enabled and not self.summarization_model.strip():
110+
if self.enabled and self.summarization_model is None:
110111
msg = "summarization_model must be non-blank when dual-mode is enabled"
111112
raise ValueError(msg)
112113
return self

src/synthorg/memory/consolidation/dual_mode_strategy.py

Lines changed: 22 additions & 10 deletions
Original file line numberDiff line numberDiff line change
@@ -5,6 +5,7 @@
55
preservation (dense) accordingly.
66
"""
77

8+
import asyncio
89
from itertools import groupby
910
from operator import attrgetter
1011

@@ -179,8 +180,6 @@ async def _process_group(
179180
group_mode = self._determine_group_mode(group_tuple)
180181
_, to_remove = self._select_entries(group_tuple)
181182

182-
# Tie-breaking note: 50/50 dense/sparse splits default to
183-
# ABSTRACTIVE (strict > comparison), which is the safer mode.
184183
logger.debug(
185184
DUAL_MODE_GROUP_CLASSIFIED,
186185
agent_id=agent_id,
@@ -203,7 +202,16 @@ async def _process_group(
203202
removed_ids: list[NotBlankStr] = []
204203
assignments: list[ArchivalModeAssignment] = []
205204
for entry in to_remove:
206-
await self._backend.delete(agent_id, entry.id)
205+
deleted = await self._backend.delete(agent_id, entry.id)
206+
if not deleted:
207+
logger.warning(
208+
DUAL_MODE_GROUP_CLASSIFIED,
209+
agent_id=agent_id,
210+
category=category.value,
211+
reason="delete_not_found",
212+
entry_id=entry.id,
213+
)
214+
continue
207215
removed_ids.append(entry.id)
208216
assignments.append(
209217
ArchivalModeAssignment(
@@ -229,6 +237,8 @@ def _determine_group_mode(
229237
dense_count = sum(
230238
1 for _, density in classified if density == ContentDensity.DENSE
231239
)
240+
# Tie-breaking: 50/50 dense/sparse splits default to
241+
# ABSTRACTIVE (strict > comparison), which is the safer mode.
232242
is_majority_dense = dense_count > len(classified) / 2
233243
return (
234244
ArchivalMode.EXTRACTIVE if is_majority_dense else ArchivalMode.ABSTRACTIVE
@@ -273,11 +283,13 @@ async def _build_content(
273283
Returns:
274284
Consolidated content text.
275285
"""
276-
parts: list[str] = []
277-
for entry in entries:
278-
if mode == ArchivalMode.EXTRACTIVE:
279-
parts.append(self._extractor.extract(entry.content))
280-
else:
281-
summary = await self._summarizer.summarize(entry.content)
282-
parts.append(summary)
286+
if mode == ArchivalMode.EXTRACTIVE:
287+
parts = [self._extractor.extract(e.content) for e in entries]
288+
else:
289+
async with asyncio.TaskGroup() as tg:
290+
tasks = [
291+
tg.create_task(self._summarizer.summarize(e.content))
292+
for e in entries
293+
]
294+
parts = [t.result() for t in tasks]
283295
return "\n---\n".join(parts)

src/synthorg/memory/consolidation/extractive.py

Lines changed: 7 additions & 11 deletions
Original file line numberDiff line numberDiff line change
@@ -29,7 +29,7 @@
2929
_VERSION_PATTERN = re.compile(r"\bv?\d+\.\d+\.\d+(?:\.\d+)?\b")
3030

3131
_KEY_VALUE_PATTERN = re.compile(
32-
r"^\s*([\w.-]+)\s*[:=]\s*(\S.*)$",
32+
r"^\s*([\w.-]+\s*[:=]\s*.*)$",
3333
re.MULTILINE,
3434
)
3535

@@ -52,9 +52,8 @@ def _extract_versions(text: str) -> list[str]:
5252

5353

5454
def _extract_key_values(text: str) -> list[str]:
55-
"""Extract key=value and key: value pairs from text."""
56-
matches = _KEY_VALUE_PATTERN.findall(text)
57-
return [f"{k}={v.strip()}" for k, v in matches]
55+
"""Extract key-value pairs from text, preserving original form."""
56+
return [m.strip() for m in _KEY_VALUE_PATTERN.findall(text)]
5857

5958

6059
def _build_anchors(
@@ -75,9 +74,7 @@ def _build_anchors(
7574
if text_len <= anchor_length:
7675
return text, "", ""
7776

78-
start = text[:anchor_length]
79-
if text_len > anchor_length:
80-
start += "..."
77+
start = text[:anchor_length] + "..."
8178

8279
mid_offset = max(0, (text_len - anchor_length) // 2)
8380
mid = text[mid_offset : mid_offset + anchor_length]
@@ -86,9 +83,7 @@ def _build_anchors(
8683
if mid_offset + anchor_length < text_len:
8784
mid += "..."
8885

89-
end = text[-anchor_length:]
90-
if text_len > anchor_length:
91-
end = "..." + end
86+
end = "..." + text[-anchor_length:]
9287

9388
return start, mid, end
9489

@@ -152,7 +147,8 @@ def extract(self, content: str) -> str:
152147

153148
lines = ["[Extractive preservation]"]
154149
if facts:
155-
lines.append(f"Key facts: {', '.join(facts)}")
150+
lines.append("Key facts:")
151+
lines.extend(f"- {fact}" for fact in facts)
156152
lines.append(f"[START] {start}")
157153
if mid:
158154
lines.append(f"[MID] {mid}")

src/synthorg/memory/consolidation/models.py

Lines changed: 26 additions & 2 deletions
Original file line numberDiff line numberDiff line change
@@ -116,14 +116,38 @@ class ConsolidationResult(BaseModel):
116116
)
117117

118118
@model_validator(mode="after")
119-
def _validate_index_count(self) -> Self:
120-
"""Ensure archival index does not exceed archived count."""
119+
def _validate_archival_consistency(self) -> Self:
120+
"""Ensure archival fields are internally consistent."""
121+
if self.archived_count > self.consolidated_count:
122+
msg = (
123+
f"archived_count ({self.archived_count}) must not exceed "
124+
f"consolidated_count ({self.consolidated_count})"
125+
)
126+
raise ValueError(msg)
121127
if len(self.archival_index) > self.archived_count:
122128
msg = (
123129
f"archival_index length ({len(self.archival_index)}) "
124130
f"must not exceed archived_count ({self.archived_count})"
125131
)
126132
raise ValueError(msg)
133+
if len(self.mode_assignments) > len(self.removed_ids):
134+
msg = (
135+
f"mode_assignments length ({len(self.mode_assignments)}) "
136+
f"must not exceed removed_ids length "
137+
f"({len(self.removed_ids)})"
138+
)
139+
raise ValueError(msg)
140+
removed_set = set(self.removed_ids)
141+
for idx_entry in self.archival_index:
142+
if idx_entry.original_id not in removed_set:
143+
msg = (
144+
f"archival_index entry '{idx_entry.original_id}' not in removed_ids"
145+
)
146+
raise ValueError(msg)
147+
index_ids = [e.original_id for e in self.archival_index]
148+
if len(index_ids) != len(set(index_ids)):
149+
msg = "archival_index contains duplicate original_ids"
150+
raise ValueError(msg)
127151
return self
128152

129153
@computed_field # type: ignore[prop-decorator]

src/synthorg/memory/consolidation/service.py

Lines changed: 12 additions & 9 deletions
Original file line numberDiff line numberDiff line change
@@ -78,10 +78,10 @@ async def run_consolidation(
7878
) -> ConsolidationResult:
7979
"""Run memory consolidation for an agent.
8080
81-
Retrieves memories, applies the consolidation strategy, and
82-
archives removed entries if archival is configured and enabled.
83-
Per-entry archival failures are logged and skipped — they do
84-
not abort the entire archival batch.
81+
Retrieves up to 1000 entries per invocation and applies the
82+
consolidation strategy, then archives removed entries if archival
83+
is configured and enabled. Per-entry archival failures are
84+
logged and skipped — they do not abort the entire batch.
8585
8686
Args:
8787
agent_id: Agent whose memories to consolidate.
@@ -260,14 +260,17 @@ async def _archive_entries(
260260
if self._archival_store is None:
261261
return 0, ()
262262

263-
mode_map = {a.original_id: a.mode for a in mode_assignments}
264-
removed_set = set(removed_ids)
263+
mode_map: dict[NotBlankStr, ArchivalMode] = {
264+
a.original_id: a.mode for a in mode_assignments
265+
}
266+
entry_map = {entry.id: entry for entry in all_entries}
265267
now = datetime.now(UTC)
266268
archived = 0
267269
index_entries: list[ArchivalIndexEntry] = []
268270

269-
for entry in all_entries:
270-
if entry.id not in removed_set:
271+
for removed_id in removed_ids:
272+
entry = entry_map.get(removed_id)
273+
if entry is None:
271274
continue
272275
success, idx = await self._archive_single_entry(
273276
entry,
@@ -294,7 +297,7 @@ async def _archive_single_entry(
294297
self,
295298
entry: MemoryEntry,
296299
agent_id: NotBlankStr,
297-
mode_map: dict[str, ArchivalMode],
300+
mode_map: dict[NotBlankStr, ArchivalMode],
298301
now: datetime,
299302
) -> tuple[bool, ArchivalIndexEntry | None]:
300303
"""Archive a single entry to cold storage.

0 commit comments

Comments
 (0)