Function bodies 288 total

run_benchmark function · python · L29-L86 (58 LOC)

benchmarks/bench_memory_write.py

def run_benchmark(
    n_iterations: int = 1000,
    seed: int = 42,
) -> dict[str, object]:
    """Measure write throughput and per-write latency.

    Parameters
    ----------
    n_iterations:
        Number of individual write operations to measure.
    seed:
        Reproducibility seed.

    Returns
    -------
    dict with throughput (memories/sec) and per-write latency stats.
    """
    entries, _ = generate_memory_dataset(
        n_memories=n_iterations, seed=seed, layer=MemoryLayer.SEMANTIC
    )
    store = InMemoryStorage()

    individual_latencies_ms: list[float] = []

    # Warmup — write 10 entries to prime any interpreter JIT paths
    warmup_count = min(10, len(entries))
    for entry in entries[:warmup_count]:
        store.save(entry)
    store.clear()

    # Timed run
    overall_start = time.perf_counter()
    for entry in entries:
        start = time.perf_counter()
        store.save(entry)
        elapsed_ms = (time.perf_counter() - start) * 1000
        in

_measure_query_latencies function · python · L29-L71 (43 LOC)

benchmarks/bench_retrieval_latency.py

def _measure_query_latencies(
    store_size: int,
    n_queries: int,
    seed: int,
) -> dict[str, float]:
    """Populate a store of store_size entries and run n_queries, return stats.

    Parameters
    ----------
    store_size:
        Number of memories in the store.
    n_queries:
        Number of search operations to measure.
    seed:
        Reproducibility seed.

    Returns
    -------
    dict with p50/p95/p99/mean latencies in milliseconds.
    """
    store = build_store(n_memories=store_size, seed=seed)
    queries = [generate_query_for_topic(t) for t in TOPIC_NAMES] * (
        n_queries // len(TOPIC_NAMES) + 1
    )
    queries = queries[:n_queries]

    latencies_ms: list[float] = []
    for query in queries:
        start = time.perf_counter()
        store.search(query, layer=MemoryLayer.SEMANTIC, limit=10)
        elapsed_ms = (time.perf_counter() - start) * 1000
        latencies_ms.append(elapsed_ms)

    sorted_lats = sorted(latencies_ms)
    n = len(sorted_

run_benchmark function · python · L74-L112 (39 LOC)

benchmarks/bench_retrieval_latency.py

def run_benchmark(
    store_sizes: list[int] | None = None,
    n_queries: int = 200,
    seed: int = 42,
) -> dict[str, object]:
    """Measure retrieval latency across multiple store sizes.

    Parameters
    ----------
    store_sizes:
        List of store sizes to evaluate. Defaults to [100, 1000, 10000].
    n_queries:
        Queries to run per store size.
    seed:
        Reproducibility seed.

    Returns
    -------
    dict with latency stats per store size.
    """
    if store_sizes is None:
        store_sizes = [100, 1_000, 10_000]

    size_results: dict[str, dict[str, float]] = {}
    for size in store_sizes:
        print(f"  Measuring store_size={size:,} with {n_queries} queries...")
        size_results[str(size)] = _measure_query_latencies(
            store_size=size,
            n_queries=n_queries,
            seed=seed,
        )

    return {
        "benchmark": "retrieval_latency",
        "store_sizes": store_sizes,
        "n_queries_per_size": n_querie

precision_at_k function · python · L38-L63 (26 LOC)

benchmarks/bench_retrieval_precision.py

def precision_at_k(
    retrieved_ids: list[str],
    relevant_ids: set[str],
    k: int,
) -> float:
    """Return precision@k for a ranked result list.

    Parameters
    ----------
    retrieved_ids:
        Memory ids in the order the search returned them.
    relevant_ids:
        Memory ids considered relevant for the query.
    k:
        Rank cut-off; only the first ``k`` retrieved ids are inspected.

    Returns
    -------
    float
        Number of relevant ids among the first ``k`` results divided by
        ``k``. The denominator is always ``k``, even when fewer than ``k``
        results were retrieved. ``0.0`` when ``k`` is not positive.
    """
    if k <= 0:
        return 0.0
    relevant_in_window = [mid for mid in retrieved_ids[:k] if mid in relevant_ids]
    return len(relevant_in_window) / k

recall_at_k function · python · L66-L91 (26 LOC)

benchmarks/bench_retrieval_precision.py

def recall_at_k(
    retrieved_ids: list[str],
    relevant_ids: set[str],
    k: int,
) -> float:
    """Compute recall@k: fraction of relevant items found in top-k.

    Parameters
    ----------
    retrieved_ids:
        Ordered list of memory_ids returned by the search.
    relevant_ids:
        Complete set of relevant memory_ids.
    k:
        Cut-off rank. Non-positive values yield a recall of 0.0.

    Returns
    -------
    float
        Recall in [0.0, 1.0]. ``0.0`` when ``relevant_ids`` is empty or
        ``k`` is not positive.
    """
    # A negative k would make ``retrieved_ids[:k]`` drop only the tail of the
    # list and report a non-zero recall, so reject non-positive cut-offs
    # explicitly.
    if k <= 0 or not relevant_ids:
        return 0.0
    top_k = set(retrieved_ids[:k])
    hits = len(top_k & relevant_ids)
    return hits / len(relevant_ids)

run_benchmark function · python · L94-L183 (90 LOC)

benchmarks/bench_retrieval_precision.py

def run_benchmark(
    n_memories: int = 1000,
    k_values: list[int] | None = None,
    seed: int = 42,
) -> dict[str, object]:
    """Measure retrieval precision@k and recall@k.

    Parameters
    ----------
    n_memories:
        Total memories inserted into the store.
    k_values:
        List of k cut-offs to evaluate. Defaults to [1, 5, 10].
    seed:
        Fixed seed for reproducibility.

    Returns
    -------
    dict
        Benchmark results with precision/recall per k value.
    """
    if k_values is None:
        k_values = [1, 5, 10]

    entries, ground_truth = generate_memory_dataset(
        n_memories=n_memories, seed=seed, layer=MemoryLayer.SEMANTIC
    )
    store = InMemoryStorage()
    for entry in entries:
        store.save(entry)

    per_topic_results: list[dict[str, float]] = []
    latencies_ms: list[float] = []

    for topic in TOPIC_NAMES:
        query = generate_query_for_topic(topic)
        relevant_ids: set[str] = set(ground_truth.get(topic,

_fmt_table function · python · L34-L41 (8 LOC)

benchmarks/compare.py

def _fmt_table(rows: list[tuple[str, str]], title: str) -> None:
    """Print a simple two-column table.

    Parameters
    ----------
    rows:
        ``(label, value)`` pairs, printed one per line. May be empty, in
        which case only the title banner is printed.
    title:
        Heading printed between two 60-character ``=`` rules.
    """
    # ``default=0`` keeps an empty table from raising ValueError in max().
    col1_width = max((len(label) for label, _ in rows), default=0) + 2
    rule = "=" * 60
    print(f"\n{rule}")
    print(f"  {title}")
    print(rule)
    for key, value in rows:
        print(f"  {key:<{col1_width}} {value}")

Citation: Repobility (2026). State of AI-Generated Code. https://repobility.com/research/

display_precision_results function · python · L51-L64 (14 LOC)

benchmarks/compare.py

def display_precision_results(data: dict[str, object]) -> None:
    """Display precision/recall benchmark results.

    Parameters
    ----------
    data:
        Parsed benchmark result. Reads the ``"metrics"`` mapping (keys
        ``mean_precision_at_{k}``, ``mean_recall_at_{k}`` and
        ``mean_f1_at_{k}`` for k in 1, 5, 10) and the ``"query_latency_ms"``
        mapping (``p50``/``p95``/``p99``). Missing values are shown as
        ``N/A``.
    """
    metrics = data.get("metrics", {})

    def _metric_cell(key: str) -> str:
        # Applying ":.4f" to the "N/A" placeholder string raises ValueError,
        # so only values that are actually present get number formatting.
        value = metrics.get(key)
        if value is None:
            return "N/A"
        try:
            return f"{value:.4f}"
        except (TypeError, ValueError):
            # Non-numeric value in the results file: show it verbatim
            # instead of aborting the whole report.
            return str(value)

    rows: list[tuple[str, str]] = []
    for k in [1, 5, 10]:
        rows.append((f"Precision@{k}", _metric_cell(f"mean_precision_at_{k}")))
        rows.append((f"Recall@{k}", _metric_cell(f"mean_recall_at_{k}")))
        rows.append((f"F1@{k}", _metric_cell(f"mean_f1_at_{k}")))
    lat = data.get("query_latency_ms", {})
    rows.append(("Query latency p50 (ms)", str(lat.get("p50", "N/A"))))
    rows.append(("Query latency p95 (ms)", str(lat.get("p95", "N/A"))))
    rows.append(("Query latency p99 (ms)", str(lat.get("p99", "N/A"))))
    _fmt_table(rows, "Retrieval Precision Results")
    print(f"\n  Note: {COMPETITOR_NOTES['retrieval_precision']}")

display_latency_results function · python · L67-L76 (10 LOC)

benchmarks/compare.py

def display_latency_results(data: dict[str, object]) -> None:
    """Print the p50/p95/p99 retrieval latencies for every store size.

    Reads the ``"results_by_store_size"`` mapping from ``data`` (an empty
    mapping when the key is absent) and emits three rows per store size,
    followed by the competitor note for the retrieval-latency benchmark.
    """
    per_size = data.get("results_by_store_size", {})
    table: list[tuple[str, str]] = []
    for store_size, percentiles in per_size.items():
        table.extend(
            [
                (f"Store size {store_size} — p50 (ms)", str(percentiles.get("p50_ms"))),
                (f"Store size {store_size} — p95 (ms)", str(percentiles.get("p95_ms"))),
                (f"Store size {store_size} — p99 (ms)", str(percentiles.get("p99_ms"))),
            ]
        )
    _fmt_table(table, "Retrieval Latency by Store Size")
    note = COMPETITOR_NOTES['retrieval_latency']
    print(f"\n  Note: {note}")

display_write_results function · python · L79-L90 (12 LOC)

benchmarks/compare.py

def display_write_results(data: dict[str, object]) -> None:
    """Print the write-throughput benchmark summary table.

    Reads ``"throughput_memories_per_second"``, ``"total_elapsed_seconds"``
    and the ``"per_write_latency_ms"`` mapping (``p50``/``p95``/``p99``)
    from ``data``; any missing value is rendered as the string ``None``.
    """
    write_latency = data.get("per_write_latency_ms", {})
    throughput = str(data.get("throughput_memories_per_second"))
    p50 = str(write_latency.get("p50"))
    p95 = str(write_latency.get("p95"))
    p99 = str(write_latency.get("p99"))
    elapsed = str(data.get("total_elapsed_seconds"))

    table: list[tuple[str, str]] = []
    table.append(("Throughput (memories/sec)", throughput))
    table.append(("Per-write p50 (ms)", p50))
    table.append(("Per-write p95 (ms)", p95))
    table.append(("Per-write p99 (ms)", p99))
    table.append(("Total elapsed (sec)", elapsed))

    _fmt_table(table, "Write Throughput Results")
    note = COMPETITOR_NOTES['memory_write_throughput']
    print(f"\n  Note: {note}")

main function · python · L93-L121 (29 LOC)

benchmarks/compare.py

def main() -> None:
    """Load all result files and display comparison tables."""
    results_dir = Path(__file__).parent / "results"

    baseline = _load_json(results_dir / "baseline.json")
    latency = _load_json(results_dir / "latency_baseline.json")
    write = _load_json(results_dir / "write_baseline.json")

    if baseline:
        display_precision_results(baseline)
    else:
        print("No baseline.json found. Run bench_retrieval_precision.py first.")

    if latency:
        display_latency_results(latency)
    else:
        print("No latency_baseline.json found. Run bench_retrieval_latency.py first.")

    if write:
        display_write_results(write)
    else:
        print("No write_baseline.json found. Run bench_memory_write.py first.")

    print("\n" + "=" * 60)
    print("  To regenerate all results:")
    print("    python benchmarks/bench_retrieval_precision.py")
    print("    python benchmarks/bench_retrieval_latency.py")
    print("    python benchmarks/benc

build_store function · python · L24-L47 (24 LOC)

benchmarks/conftest.py

def build_store(n_memories: int, seed: int = 42) -> InMemoryStorage:
    """Create an InMemoryStorage filled with a synthetic dataset.

    Parameters
    ----------
    n_memories:
        How many entries to generate and save.
    seed:
        Seed forwarded to ``generate_memory_dataset``.

    Returns
    -------
    InMemoryStorage
        A new store into which every generated entry has been saved, in
        generation order. All entries use ``MemoryLayer.SEMANTIC``.
    """
    # Only the entries are needed here; the ground-truth mapping is discarded.
    memories, _ground_truth = generate_memory_dataset(
        n_memories=n_memories, seed=seed, layer=MemoryLayer.SEMANTIC
    )
    populated = InMemoryStorage()
    for memory in memories:
        populated.save(memory)
    return populated

_generate_content function · python · L57-L67 (11 LOC)

benchmarks/datasets/synthetic_memories.py

def _generate_content(topic: str, keywords: list[str], rng: random.Random) -> str:
    """Build one sentence about ``topic`` from a randomly chosen keyword.

    ``rng`` is consulted exactly twice, in this order: first to pick the
    keyword, then to pick one of five sentence templates. Underscores in
    ``topic`` are rendered as spaces. Output is reproducible for a given
    ``rng`` state.
    """
    # Draw the keyword before anything else so the RNG call order is fixed.
    chosen = rng.choice(keywords)
    subject = topic.replace('_', ' ')
    candidates = [
        f"The {chosen} is essential for understanding {subject} concepts.",
        f"When working with {subject}, remember that {chosen} matters most.",
        f"A common pattern in {subject} involves configuring the {chosen} correctly.",
        f"The {chosen} component of {subject} requires careful attention.",
        f"Experienced engineers use {chosen} as a core primitive in {subject}.",
    ]
    sentence = rng.choice(candidates)
    return sentence

generate_memory_dataset function · python · L70-L114 (45 LOC)

benchmarks/datasets/synthetic_memories.py

def generate_memory_dataset(
    n_memories: int = 1000,
    seed: int = 42,
    layer: MemoryLayer = MemoryLayer.SEMANTIC,
) -> tuple[list[MemoryEntry], dict[str, list[str]]]:
    """Generate a reproducible synthetic memory dataset.

    Parameters
    ----------
    n_memories:
        Total number of MemoryEntry objects to generate.
    seed:
        Random seed for reproducibility.
    layer:
        The MemoryLayer to assign to all generated entries.

    Returns
    -------
    tuple of:
        - list of MemoryEntry objects
        - dict mapping topic name to list of memory_ids for that topic
          (the ground truth for retrieval evaluation)
    """
    rng = random.Random(seed)
    entries: list[MemoryEntry] = []
    ground_truth: dict[str, list[str]] = {topic: [] for topic in TOPIC_NAMES}

    for index in range(n_memories):
        topic = TOPIC_NAMES[index % len(TOPIC_NAMES)]
        keywords = TOPIC_KEYWORDS[topic]
        content = _generate_content(topic, keywords, r

generate_query_for_topic function · python · L117-L123 (7 LOC)

benchmarks/datasets/synthetic_memories.py

def generate_query_for_topic(topic: str) -> str:
    """Return the canonical search query for ``topic``.

    The query is the first keyword listed for the topic in
    ``TOPIC_KEYWORDS``. The intent is that this keyword matches only
    entries generated for that topic.
    """
    topic_vocabulary = TOPIC_KEYWORDS[topic]
    return topic_vocabulary[0]

Repobility · code-quality intelligence platform · https://repobility.com

generate_ground_truth_entries function · python · L126-L163 (38 LOC)

benchmarks/datasets/synthetic_memories.py

def generate_ground_truth_entries(
    n_memories: int = 100,
    seed: int = 42,
    layer: MemoryLayer = MemoryLayer.SEMANTIC,
) -> list[GroundTruthEntry]:
    """Generate GroundTruthEntry objects for precision/recall evaluation.

    Parameters
    ----------
    n_memories:
        Total number of entries to generate.
    seed:
        Random seed for reproducibility.
    layer:
        Memory layer for all entries.

    Returns
    -------
    list of GroundTruthEntry
        Each entry has its memory and the canonical topic+keywords.
    """
    entries, ground_truth = generate_memory_dataset(n_memories, seed, layer)
    result: list[GroundTruthEntry] = []
    memory_to_topic: dict[str, str] = {}
    for topic, memory_ids in ground_truth.items():
        for memory_id in memory_ids:
            memory_to_topic[memory_id] = topic

    for entry in entries:
        topic = memory_to_topic[entry.memory_id]
        result.append(
            GroundTruthEntry(
                entry=en

AnthropicMemoryBridge.store_conversation method · python · L28-L48 (21 LOC)

src/agent_memory/adapters/anthropic_sdk.py

    def store_conversation(self, conversation_id: str, messages: list[Any]) -> str:
        """Record a conversation's messages and return the new entry's ID.

        Each message is stored as its ``str()`` form together with the
        conversation ID and the message count. The entry is appended to
        ``self._items`` and identified by a freshly generated UUID4 string.
        """
        new_id = str(uuid.uuid4())
        rendered = [str(message) for message in messages]
        message_count = len(messages)
        record: dict[str, Any] = {
            "id": new_id,
            "type": "conversation",
            "conversation_id": conversation_id,
            "messages": rendered,
            "count": message_count,
        }
        self._items.append(record)
        logger.debug(
            "Stored conversation conversation_id=%s entry_id=%s messages=%d",
            conversation_id,
            new_id,
            message_count,
        )
        return new_id

AnthropicMemoryBridge.retrieve_context method · python · L50-L59 (10 LOC)

src/agent_memory/adapters/anthropic_sdk.py

    def retrieve_context(self, query: str) -> list[dict[str, Any]]:
        """Retrieve memory entries whose messages contain the query string.

        Matching is a case-insensitive substring test against each stored
        message. Entries without a ``"messages"`` key never match.

        Returns matching entries across all conversations, in insertion
        order.
        """
        # Lower-case the query once instead of once per stored message.
        needle = query.lower()
        return [
            item
            for item in self._items
            if any(needle in msg.lower() for msg in item.get("messages", []))
        ]

CrewAIMemoryBridge.store_task_result method · python · L28-L42 (15 LOC)

src/agent_memory/adapters/crewai.py

    def store_task_result(self, task_name: str, result: Any) -> str:
        """Record a task's result and return the new entry's ID.

        The result is stored as its ``str()`` form, or as an empty string
        when it is ``None``. The entry is appended to ``self._items`` and
        identified by a freshly generated UUID4 string.
        """
        new_id = str(uuid.uuid4())
        if result is not None:
            result_text = str(result)
        else:
            result_text = ""
        record: dict[str, Any] = {
            "id": new_id,
            "type": "task_result",
            "task_name": task_name,
            "result": result_text,
        }
        self._items.append(record)
        logger.debug("Stored task result for task=%s id=%s", task_name, new_id)
        return new_id

CrewAIMemoryBridge.retrieve_knowledge method · python · L44-L54 (11 LOC)

src/agent_memory/adapters/crewai.py

    def retrieve_knowledge(self, query: str) -> list[dict[str, Any]]:
        """Retrieve stored knowledge entries that match the query.

        An entry matches when the query is a case-insensitive substring of
        its ``"task_name"`` or its ``"result"``; a missing field is treated
        as an empty string.

        Returns task result entries in insertion order (naive full-scan;
        replace with vector search in production).
        """
        # Lower-case the query once rather than twice per stored item.
        needle = query.lower()
        return [
            item
            for item in self._items
            if needle in item.get("task_name", "").lower()
            or needle in item.get("result", "").lower()
        ]

LangChainMemoryBridge.store_conversation method · python · L29-L43 (15 LOC)

src/agent_memory/adapters/langchain.py

    def store_conversation(self, messages: list[Any]) -> str:
        """Record a list of LangChain messages and return the new entry's ID.

        Each message is stored as its ``str()`` form alongside the message
        count. The entry is appended to ``self._items`` and identified by a
        freshly generated UUID4 string, which can be used for later lookup.
        """
        new_id = str(uuid.uuid4())
        rendered = [str(message) for message in messages]
        message_count = len(messages)
        record: dict[str, Any] = {
            "id": new_id,
            "type": "conversation",
            "messages": rendered,
            "count": message_count,
        }
        self._items.append(record)
        logger.debug("Stored conversation with id=%s, messages=%d", new_id, message_count)
        return new_id

LangChainMemoryBridge.retrieve_context method · python · L45-L51 (7 LOC)

src/agent_memory/adapters/langchain.py

    def retrieve_context(self, query: str, k: int = 5) -> list[dict[str, Any]]:
        """Retrieve the most recent k conversation entries.

        ``query`` is currently not used for filtering: ranking is by
        recency only (naive recency ranking).

        Returns at most ``k`` memory entry dictionaries of type
        ``"conversation"``, oldest first. A non-positive ``k`` yields an
        empty list.
        """
        # ``items[-0:]`` is the whole list and a negative k slices from the
        # front, so non-positive limits must be handled before slicing.
        if k <= 0:
            return []
        conversation_items = [item for item in self._items if item.get("type") == "conversation"]
        return conversation_items[-k:]

MicrosoftMemoryBridge.store_turn method · python · L28-L42 (15 LOC)

src/agent_memory/adapters/microsoft_agents.py

    def store_turn(self, conversation_id: str, turn: Any) -> str:
        """Record one conversation turn and return the new entry's ID.

        The turn is stored as its ``str()`` form, or as an empty string when
        it is ``None``. The entry is appended to ``self._items`` and
        identified by a freshly generated UUID4 string.
        """
        new_id = str(uuid.uuid4())
        if turn is not None:
            turn_text = str(turn)
        else:
            turn_text = ""
        record: dict[str, Any] = {
            "id": new_id,
            "type": "turn",
            "conversation_id": conversation_id,
            "turn": turn_text,
        }
        self._items.append(record)
        logger.debug("Stored turn for conversation_id=%s entry_id=%s", conversation_id, new_id)
        return new_id

Repobility (the analyzer behind this table) · https://repobility.com

MicrosoftMemoryBridge.retrieve_state method · python · L44-L55 (12 LOC)

src/agent_memory/adapters/microsoft_agents.py

    def retrieve_state(self, conversation_id: str) -> dict[str, Any]:
        """Summarise what is stored for one conversation.

        Returns a dict holding the conversation ID, the number of stored
        items with that ID, and the ``"turn"`` text of the last such item
        (an empty string when there is none).
        """
        matching: list[dict[str, Any]] = []
        for record in self._items:
            if record.get("conversation_id") == conversation_id:
                matching.append(record)

        if matching:
            most_recent = matching[-1].get("turn", "")
        else:
            most_recent = ""

        state: dict[str, Any] = {
            "conversation_id": conversation_id,
            "turn_count": len(matching),
            "latest_turn": most_recent,
        }
        return state

OpenAIMemoryBridge.store_messages method · python · L28-L43 (16 LOC)

src/agent_memory/adapters/openai_agents.py

    def store_messages(self, thread_id: str, messages: list[Any]) -> str:
        """Record a thread's messages and return the new entry's ID.

        Each message is stored as its ``str()`` form together with the
        thread ID and the message count. The entry is appended to
        ``self._items`` and identified by a freshly generated UUID4 string.
        """
        new_id = str(uuid.uuid4())
        rendered = [str(message) for message in messages]
        message_count = len(messages)
        record: dict[str, Any] = {
            "id": new_id,
            "type": "thread_messages",
            "thread_id": thread_id,
            "messages": rendered,
            "count": message_count,
        }
        self._items.append(record)
        logger.debug("Stored %d messages for thread=%s id=%s", message_count, thread_id, new_id)
        return new_id

OpenAIMemoryBridge.retrieve_context method · python · L45-L56 (12 LOC)

src/agent_memory/adapters/openai_agents.py

    def retrieve_context(self, thread_id: str, query: str) -> list[dict[str, Any]]:
        """Retrieve message entries for a thread that contain the query string.

        Only entries whose ``"thread_id"`` equals ``thread_id`` are
        considered. Matching is a case-insensitive substring test against
        each stored message; entries without messages never match.

        Returns matching entries in insertion order.
        """
        # Lower-case the query once instead of once per stored message.
        needle = query.lower()
        return [
            item
            for item in self._items
            if item.get("thread_id") == thread_id
            and any(needle in msg.lower() for msg in item.get("messages", []))
        ]

TierStats.to_dict method · python · L106-L116 (11 LOC)