gabriel / musehub public
test_walk_commit_delta_scale.py python
124 lines 5.0 KB
Raw
sha256:3c58668648c7323bb9f5c6881cfe6a3f14fc93fcb73b537d253732952a5bf8bf chore: bump version to 0.2.0rc12 Sonnet 4.6 patch 8 days ago
1 """TDD — _walk_commit_delta scale regression (issue #60).
2
3 L-tier bench (1000 commits) fails: wire_fetch_mpack returns mpack_id='' because
4 _walk_commit_delta returns {} for a 1000-commit chain. M-tier (100 commits) passes.
5
6 These tests confirm _walk_commit_delta returns the full delta at any scale:
7
8 WD-1 Single commit, have=[] → returns 1 commit.
9 WD-2 100-commit linear chain, have=[] → returns 100 commits.
10 WD-3 1000-commit linear chain, have=[] → returns 1000 commits. ← RED at L-tier
11 WD-4 have cuts the chain — only commits above have are returned.
12 """
13 from __future__ import annotations
14
15 import pytest
16 import msgpack
17 from datetime import datetime, timezone
18 from muse.core.types import fake_id
19 from musehub.db import musehub_repo_models as db
20 from musehub.db.musehub_repo_models import MusehubCommitGraph
21 from sqlalchemy.ext.asyncio import AsyncSession
22
23
24 def _now() -> datetime:
25 return datetime.now(tz=timezone.utc)
26
27
28 async def _build_chain(session: AsyncSession, n: int) -> list[str]:
29 """Insert a linear chain of N commits. Returns commit_ids tip→root order."""
30 commit_ids: list[str] = []
31 parent: list[str] = []
32 for i in range(n):
33 snap_id = fake_id(f"snap-wdscale-{i}")
34 snap = db.MusehubSnapshot(
35 snapshot_id=snap_id,
36 manifest_blob=msgpack.packb({f"file{i}.txt": fake_id(f"obj-{i}")}, use_bin_type=True),
37 directories=[],
38 entry_count=1,
39 created_at=_now(),
40 )
41 session.add(snap)
42 cid = fake_id(f"commit-wdscale-{i}")
43 commit = db.MusehubCommit(
44 commit_id=cid,
45 branch="main",
46 parent_ids=parent,
47 message=f"commit {i}",
48 author="gabriel",
49 timestamp=_now(),
50 snapshot_id=snap_id,
51 )
52 session.add(commit)
53 session.add(MusehubCommitGraph(
54 commit_id=cid,
55 parent_ids=parent,
56 generation=i,
57 snapshot_id=snap_id,
58 ))
59 commit_ids.append(cid)
60 parent = [cid]
61 await session.commit()
62 return commit_ids # [root, ..., tip]
63
64
65 # ── WD-1 ──────────────────────────────────────────────────────────────────────
66
67 @pytest.mark.asyncio
68 async def test_wd1_single_commit(db_session: AsyncSession) -> None:
69 """Single commit, have=[] → _walk_commit_delta returns exactly that commit."""
70 from musehub.services.musehub_wire import _walk_commit_delta
71
72 ids = await _build_chain(db_session, 1)
73 result = await _walk_commit_delta(db_session, want=[ids[-1]], have=[])
74
75 assert len(result) == 1
76 assert ids[-1] in result
77
78
79 # ── WD-2 ──────────────────────────────────────────────────────────────────────
80
81 @pytest.mark.asyncio
82 async def test_wd2_hundred_commit_chain(db_session: AsyncSession) -> None:
83 """100-commit linear chain, have=[] → _walk_commit_delta returns all 100 commits."""
84 from musehub.services.musehub_wire import _walk_commit_delta
85
86 ids = await _build_chain(db_session, 100)
87 result = await _walk_commit_delta(db_session, want=[ids[-1]], have=[])
88
89 assert len(result) == 100, f"expected 100 commits, got {len(result)}"
90
91
92 # ── WD-3 ──────────────────────────────────────────────────────────────────────
93
94 @pytest.mark.asyncio
95 async def test_wd3_thousand_commit_chain(db_session: AsyncSession) -> None:
96 """1000-commit linear chain, have=[] → _walk_commit_delta returns all 1000 commits.
97
98 This is the L-tier regression: the bench push succeeds (commits exist in DB)
99 but clone/fetch/pull return mpack_id='' because _walk_commit_delta returns {}.
100 """
101 from musehub.services.musehub_wire import _walk_commit_delta
102
103 ids = await _build_chain(db_session, 1_000)
104 result = await _walk_commit_delta(db_session, want=[ids[-1]], have=[])
105
106 assert len(result) == 1_000, f"expected 1000 commits, got {len(result)}"
107
108
109 # ── WD-4 ──────────────────────────────────────────────────────────────────────
110
111 @pytest.mark.asyncio
112 async def test_wd4_have_cuts_delta(db_session: AsyncSession) -> None:
113 """have=[root] → only commits above root are returned."""
114 from musehub.services.musehub_wire import _walk_commit_delta
115
116 ids = await _build_chain(db_session, 10)
117 # ids[0] = root, ids[9] = tip; have=[ids[4]] means commits 5–9 are needed
118 result = await _walk_commit_delta(db_session, want=[ids[-1]], have=[ids[4]])
119
120 assert len(result) == 5, f"expected 5 commits above have, got {len(result)}"
121 for cid in ids[5:]:
122 assert cid in result
123 for cid in ids[:5]:
124 assert cid not in result
File History 1 commit
sha256:8b0fb5814ab41a08af1f212c956bd08fe74190c2818ba5c503848fda6e33e216 chore: bump version to 0.2.0rc12 Sonnet 4.6 patch 8 days ago