feat: support multiple --enhance-workflow flags with shared workflow_runner

- Change --enhance-workflow from type:str to action:append in all argument
  files (workflow, create, scrape, github, pdf) so the flag can be given
  multiple times to chain workflows in sequence
- Add workflow_runner.py: shared utility used by all 4 scrapers
  - collect_workflow_vars(): merges extra context, then user --var flags
    (user flags take precedence over scraper metadata)
  - run_workflows(): executes named workflows in order, then any inline
    --enhance-stage workflow; handles dry-run/preview mode
- Remove duplicate ~115-130 line workflow blocks from doc_scraper,
  github_scraper, pdf_scraper, and codebase_scraper; replace with a single
  run_workflows() call each
- Remove mutual exclusivity between workflows and AI enhancement: workflows
  now run first, then traditional enhancement continues independently
  (--enhance-level 0 to disable)
- Add tests/test_workflow_runner.py: 21 tests covering no-flags, single
  workflow, multiple/chained workflows, inline stages, mixed mode, variable
  precedence, and dry-run
- Fix test_markdown_parsing: accept "text" or "unknown" for unlabelled code
  blocks (unified MarkdownParser returns "text" by default)

Co-Authored-By: Claude Sonnet 4.5 <noreply@anthropic.com>
2026-02-17 22:05:27 +03:00
parent 9fd6cdcd5c
commit 60c46673ed
13 changed files with 959 additions and 16 deletions
--- a/src/skill_seekers/cli/codebase_scraper.py
+++ b/src/skill_seekers/cli/codebase_scraper.py
@@ -1250,7 +1250,8 @@ def analyze_codebase(
        logger.info("Detecting design patterns...")
        from skill_seekers.cli.pattern_recognizer import PatternRecognizer

-        pattern_recognizer = PatternRecognizer(depth=depth, enhance_with_ai=enhance_patterns)
+        # Step 1: Detect patterns WITHOUT enhancement (collect all first)
+        pattern_recognizer = PatternRecognizer(depth=depth, enhance_with_ai=False)
        pattern_results = []

        for file_path in files:
@@ -1267,6 +1268,31 @@ def analyze_codebase(
                logger.warning(f"Pattern detection failed for {file_path}: {e}")
                continue

+        # Step 2: Enhance ALL patterns at once (batched across all files)
+        if enhance_patterns and pattern_results:
+            logger.info("🤖 Enhancing patterns with AI (batched)...")
+            from skill_seekers.cli.ai_enhancer import PatternEnhancer
+
+            enhancer = PatternEnhancer()
+
+            # Flatten all patterns from all files
+            all_patterns = []
+            pattern_map = []  # Track (report_idx, pattern_idx) for each pattern
+
+            for report_idx, report in enumerate(pattern_results):
+                for pattern_idx, pattern in enumerate(report.get("patterns", [])):
+                    all_patterns.append(pattern)
+                    pattern_map.append((report_idx, pattern_idx))
+
+            if all_patterns:
+                # Enhance all patterns in batches (this is where batching happens!)
+                enhanced_patterns = enhancer.enhance_patterns(all_patterns)
+
+                # Map enhanced patterns back to their reports
+                for i, (report_idx, pattern_idx) in enumerate(pattern_map):
+                    if i < len(enhanced_patterns):
+                        pattern_results[report_idx]["patterns"][pattern_idx] = enhanced_patterns[i]
+
        # Save pattern results with multi-level filtering (Issue #240)
        if pattern_results:
            pattern_output = output_dir / "patterns"
@@ -2365,6 +2391,45 @@ Examples:
        ),
    )

+    # Workflow enhancement arguments
+    parser.add_argument(
+        "--enhance-workflow",
+        type=str,
+        help=(
+            "Enhancement workflow to use (name or path to YAML file). "
+            "Examples: 'security-focus', 'architecture-comprehensive', "
+            "'.skill-seekers/my-workflow.yaml'. "
+            "Overrides --enhance-level when provided."
+        ),
+        metavar="WORKFLOW",
+    )
+    parser.add_argument(
+        "--enhance-stage",
+        type=str,
+        action="append",
+        help=(
+            "Add inline enhancement stage. Format: 'name:prompt'. "
+            "Can be used multiple times. Example: "
+            "--enhance-stage 'security:Analyze for security issues'"
+        ),
+        metavar="NAME:PROMPT",
+    )
+    parser.add_argument(
+        "--var",
+        type=str,
+        action="append",
+        help=(
+            "Override workflow variable. Format: 'key=value'. "
+            "Can be used multiple times. Example: --var focus_area=performance"
+        ),
+        metavar="KEY=VALUE",
+    )
+    parser.add_argument(
+        "--workflow-dry-run",
+        action="store_true",
+        help="Show workflow stages without executing (dry run mode)",
+    )
+
    # Check for deprecated flags
    deprecated_flags = {
        "--build-api-reference": "--skip-api-reference",
@@ -2473,14 +2538,25 @@ Examples:
            enhance_level=args.enhance_level,  # AI enhancement level (0-3)
        )

+        # ============================================================
+        # WORKFLOW SYSTEM INTEGRATION (Phase 2)
+        # ============================================================
+        from skill_seekers.cli.workflow_runner import run_workflows
+
+        workflow_executed, workflow_names = run_workflows(args)
+
        # Print summary
        print(f"\n{'=' * 60}")
        print("CODEBASE ANALYSIS COMPLETE")
+        if workflow_executed:
+            print(f" + {len(workflow_names)} ENHANCEMENT WORKFLOW(S) EXECUTED")
        print(f"{'=' * 60}")
        print(f"Files analyzed: {len(results['files'])}")
        print(f"Output directory: {args.output}")
        if not args.skip_api_reference:
            print(f"API reference: {Path(args.output) / 'api_reference'}")
+        if workflow_executed:
+            print(f"Workflows applied: {', '.join(workflow_names)}")
        print(f"{'=' * 60}\n")

        return 0