test: Full E2E Pipeline 성공 (Plan→Code→Review) — 3호출 219초 #task-190

2026-03-06 17:46:45 +09:00
parent 57c9cb6143
commit b6ed432fe3
2 changed files with 67 additions and 35 deletions
--- a/tests/test_pipeline_e2e.py
+++ b/tests/test_pipeline_e2e.py
@@ -1,12 +1,13 @@
-"""E2E Test: Task Pipeline with real Gemini CLI.
+"""Full E2E Test: Plan → Code → Review with real Gemini CLI.

-Tests Planner phase against the variet-agent project.
+Tests the complete pipeline against a concrete improvement task.
 """

 import sys
 import io
 import asyncio
 import json
+import time

 if sys.stdout.encoding != "utf-8":
    sys.stdout = io.TextIOWrapper(sys.stdout.buffer, encoding="utf-8", errors="replace")
@@ -16,40 +17,71 @@ from core.task_pipeline import TaskPipeline

 PROJECT = r"C:\Users\CafeVariet-GL552VW\Desktop\source_diff\variet-agent"

-
-async def test_planner():
-    print("=" * 60)
-    print("E2E TEST: Planner")
-    print("=" * 60)
-
-    pipeline = TaskPipeline(PROJECT, token_budget=30_000)
-    pipeline.setup()
-
-    plan = await pipeline.plan(
-        "project_indexer.py의 find_relevant 함수가 공백이 포함된 쿼리를 처리하지 못합니다. "
-        "'gemini caller'로 검색하면 gemini_caller.py를 찾지 못합니다. "
-        "밑줄과 공백을 동일하게 처리하도록 개선해주세요."
-    )
-
-    print(f"\n📋 Plan result:")
-    print(json.dumps(plan, ensure_ascii=False, indent=2))
-
-    if plan.get("tasks"):
-        print(f"\n✅ Planner returned {len(plan['tasks'])} tasks")
-        for t in plan["tasks"]:
-            print(f"  - {t.get('title', t.get('id', '?'))}: {t.get('description', '')[:80]}")
-    else:
-        print(f"\n⚠️ No structured tasks, raw response:")
-        print(plan.get("raw", plan.get("summary", ""))[:500])
-
-    return plan
+USER_REQUEST = (  # request text handed to pipeline.plan() in main(); runtime string, keep verbatim
+    "project_indexer.py의 find_relevant 함수가 공백이 포함된 쿼리를 처리하지 못합니다. "
+    "'gemini caller'로 검색하면 gemini_caller.py를 찾지 못합니다. "
+    "밑줄과 공백을 동일하게 처리하도록 개선해주세요."
+)


 async def main():
-    plan = await test_planner()
+    start = time.perf_counter()  # monotonic clock: elapsed time is immune to wall-clock jumps
+    pipeline = TaskPipeline(PROJECT, token_budget=15_000)
+    pipeline.setup()
+
+    # === PHASE 1: Plan ===
+    print("=" * 60)
+    print("PHASE 1: PLANNER")
+    print("=" * 60)
+
+    plan = await pipeline.plan(USER_REQUEST)
+    tasks = plan.get("tasks") or []  # a null "tasks" value is treated as "no tasks"
+
+    print(f"Summary: {plan.get('summary', 'N/A')}")
+    print(f"Tasks: {len(tasks)}")
+    for t in tasks:
+        print(f"  [{t.get('id')}] {t.get('title')}")
+        print(f"      Files: {t.get('files')}")
+    print(f"  Risk: {plan.get('risk', 'N/A')}")
+
+    if not tasks:
+        print("❌ No tasks returned, stopping.")
+        sys.exit(1)  # non-zero exit so a failed run is not reported as success
+
+    # === PHASE 2: Code (first task only) ===
     print(f"\n{'=' * 60}")
-    print(f"Gemini calls: {1}")
-    print(f"✅ E2E Planner test complete!")
+    print("PHASE 2: CODER (Task 1 only)")
+    print("=" * 60)
+
+    first_task = tasks[0]  # only the first planned task is coded and reviewed
+    code_output = await pipeline.code(first_task)
+
+    print(f"Output length: {len(code_output)} chars")
+    print("First 800 chars:")
+    print(code_output[:800])
+    print("...")
+
+    # === PHASE 3: Review ===
+    print(f"\n{'=' * 60}")
+    print("PHASE 3: REVIEWER")
+    print("=" * 60)
+
+    review = await pipeline.review(first_task, code_output)
+
+    print(f"Passed: {review.get('passed', 'N/A')}")
+    if review.get("issues"):
+        for issue in review["issues"]:
+            print(f"  [{issue.get('severity')}] {(issue.get('description') or '')[:80]}")  # null-safe slice
+    print(f"Summary: {(review.get('summary') or 'N/A')[:200]}")  # null-safe slice
+
+    # === Results ===
+    elapsed = time.perf_counter() - start
+    print(f"\n{'=' * 60}")
+    print("RESULTS")
+    print(f"  Gemini calls: {pipeline.gemini.call_count}")
+    print(f"  Total time: {elapsed:.1f}s")
+    print(f"  Pipeline log entries: {len(pipeline.log)}")
+    print("✅ Full E2E test complete!")


 if __name__ == "__main__":