feat: add enhancement workflow system and unified enhancer
- enhancement_workflow.py: WorkflowEngine class for multi-stage AI enhancement workflows with preset support (security-focus, architecture-comprehensive, api-documentation, minimal, default) - unified_enhancer.py: unified enhancement orchestrator integrating workflow execution with traditional enhance-level based enhancement - create_command.py: wire workflow args into the unified create command - AGENTS.md: update agent capability documentation - configs/godot_unified.json: add unified Godot documentation config - ENHANCEMENT_WORKFLOW_SYSTEM.md: documentation for the workflow system - WORKFLOW_ENHANCEMENT_SEQUENTIAL_EXECUTION.md: docs explaining sequential execution of workflows followed by AI enhancement Co-Authored-By: Claude Sonnet 4.5 <noreply@anthropic.com>
This commit is contained in:
@@ -374,6 +374,18 @@ class CreateCommand:
|
||||
if getattr(self.args, "interactive_enhancement", False):
|
||||
argv.append("--interactive-enhancement")
|
||||
|
||||
# Enhancement Workflow arguments (NEW - Phase 2)
|
||||
if getattr(self.args, "enhance_workflow", None):
|
||||
argv.extend(["--enhance-workflow", self.args.enhance_workflow])
|
||||
if getattr(self.args, "enhance_stage", None):
|
||||
for stage in self.args.enhance_stage:
|
||||
argv.extend(["--enhance-stage", stage])
|
||||
if getattr(self.args, "var", None):
|
||||
for var in self.args.var:
|
||||
argv.extend(["--var", var])
|
||||
if getattr(self.args, "workflow_dry_run", False):
|
||||
argv.append("--workflow-dry-run")
|
||||
|
||||
|
||||
def main() -> int:
|
||||
"""Entry point for create command.
|
||||
|
||||
532
src/skill_seekers/cli/enhancement_workflow.py
Normal file
532
src/skill_seekers/cli/enhancement_workflow.py
Normal file
@@ -0,0 +1,532 @@
|
||||
#!/usr/bin/env python3
|
||||
"""
|
||||
Enhancement Workflow Engine
|
||||
|
||||
Allows users to define custom AI enhancement workflows with:
|
||||
- Sequential stages that build on previous results
|
||||
- Custom prompts per stage
|
||||
- History passing between stages
|
||||
- Post-processing configuration
|
||||
- Per-project and global workflow support
|
||||
|
||||
Usage:
|
||||
# Use global workflow
|
||||
skill-seekers analyze . --enhance-workflow security-focus
|
||||
|
||||
# Use project workflow
|
||||
skill-seekers analyze . --enhance-workflow .skill-seekers/enhancement.yaml
|
||||
|
||||
# Quick inline stages
|
||||
skill-seekers analyze . \\
|
||||
--enhance-stage "security:Analyze for security issues" \\
|
||||
--enhance-stage "cleanup:Remove boilerplate"
|
||||
"""
|
||||
|
||||
import json
|
||||
import logging
|
||||
import os
|
||||
from dataclasses import dataclass, field
|
||||
from datetime import datetime
|
||||
from pathlib import Path
|
||||
from typing import Any, Literal
|
||||
|
||||
import yaml
|
||||
|
||||
logger = logging.getLogger(__name__)
|
||||
|
||||
|
||||
@dataclass
|
||||
class WorkflowStage:
|
||||
"""Single enhancement stage in a workflow."""
|
||||
|
||||
name: str
|
||||
type: Literal["builtin", "custom"]
|
||||
target: str # "patterns", "examples", "config", "skill_md", "all"
|
||||
prompt: str | None = None
|
||||
uses_history: bool = False
|
||||
enabled: bool = True
|
||||
metadata: dict[str, Any] = field(default_factory=dict)
|
||||
|
||||
|
||||
@dataclass
|
||||
class PostProcessConfig:
|
||||
"""Post-processing configuration."""
|
||||
|
||||
remove_sections: list[str] = field(default_factory=list)
|
||||
reorder_sections: list[str] = field(default_factory=list)
|
||||
add_metadata: dict[str, Any] = field(default_factory=dict)
|
||||
custom_transforms: list[dict[str, Any]] = field(default_factory=list)
|
||||
|
||||
|
||||
@dataclass
|
||||
class EnhancementWorkflow:
|
||||
"""Complete enhancement workflow definition."""
|
||||
|
||||
name: str
|
||||
description: str
|
||||
version: str = "1.0"
|
||||
applies_to: list[str] = field(default_factory=lambda: ["codebase_analysis"])
|
||||
variables: dict[str, Any] = field(default_factory=dict)
|
||||
stages: list[WorkflowStage] = field(default_factory=list)
|
||||
post_process: PostProcessConfig = field(default_factory=PostProcessConfig)
|
||||
extends: str | None = None # Inherit from another workflow
|
||||
|
||||
|
||||
class WorkflowEngine:
|
||||
"""
|
||||
Execute enhancement workflows with sequential stages.
|
||||
|
||||
Each stage can:
|
||||
- Access previous stage results
|
||||
- Access all history
|
||||
- Access specific stages by name
|
||||
- Run custom AI prompts
|
||||
- Target specific parts of the analysis
|
||||
"""
|
||||
|
||||
def __init__(self, workflow: EnhancementWorkflow | str | Path):
|
||||
"""
|
||||
Initialize workflow engine.
|
||||
|
||||
Args:
|
||||
workflow: EnhancementWorkflow object or path to YAML file
|
||||
"""
|
||||
if isinstance(workflow, (str, Path)):
|
||||
self.workflow = self._load_workflow(workflow)
|
||||
else:
|
||||
self.workflow = workflow
|
||||
|
||||
self.history: list[dict[str, Any]] = []
|
||||
self.enhancer = None # Lazy load UnifiedEnhancer
|
||||
|
||||
def _load_workflow(self, workflow_path: str | Path) -> EnhancementWorkflow:
|
||||
"""Load workflow from YAML file."""
|
||||
workflow_path = Path(workflow_path)
|
||||
|
||||
# Resolve path (support both absolute and relative)
|
||||
if not workflow_path.is_absolute():
|
||||
# Try relative to CWD first
|
||||
if not workflow_path.exists():
|
||||
# Try in config directory
|
||||
config_dir = Path.home() / ".config" / "skill-seekers" / "workflows"
|
||||
workflow_path = config_dir / workflow_path
|
||||
|
||||
if not workflow_path.exists():
|
||||
raise FileNotFoundError(f"Workflow not found: {workflow_path}")
|
||||
|
||||
logger.info(f"📋 Loading workflow: {workflow_path}")
|
||||
|
||||
with open(workflow_path, encoding="utf-8") as f:
|
||||
data = yaml.safe_load(f)
|
||||
|
||||
# Handle inheritance (extends)
|
||||
if "extends" in data and data["extends"]:
|
||||
parent = self._load_workflow(data["extends"])
|
||||
data = self._merge_workflows(parent, data)
|
||||
|
||||
# Parse stages
|
||||
stages = []
|
||||
for stage_data in data.get("stages", []):
|
||||
stages.append(
|
||||
WorkflowStage(
|
||||
name=stage_data["name"],
|
||||
type=stage_data.get("type", "custom"),
|
||||
target=stage_data.get("target", "all"),
|
||||
prompt=stage_data.get("prompt"),
|
||||
uses_history=stage_data.get("uses_history", False),
|
||||
enabled=stage_data.get("enabled", True),
|
||||
metadata=stage_data.get("metadata", {}),
|
||||
)
|
||||
)
|
||||
|
||||
# Parse post-processing
|
||||
post_process_data = data.get("post_process", {})
|
||||
post_process = PostProcessConfig(
|
||||
remove_sections=post_process_data.get("remove_sections", []),
|
||||
reorder_sections=post_process_data.get("reorder_sections", []),
|
||||
add_metadata=post_process_data.get("add_metadata", {}),
|
||||
custom_transforms=post_process_data.get("custom_transforms", []),
|
||||
)
|
||||
|
||||
return EnhancementWorkflow(
|
||||
name=data.get("name", "Unnamed Workflow"),
|
||||
description=data.get("description", ""),
|
||||
version=data.get("version", "1.0"),
|
||||
applies_to=data.get("applies_to", ["codebase_analysis"]),
|
||||
variables=data.get("variables", {}),
|
||||
stages=stages,
|
||||
post_process=post_process,
|
||||
extends=data.get("extends"),
|
||||
)
|
||||
|
||||
def _merge_workflows(
|
||||
self, parent: EnhancementWorkflow, child_data: dict
|
||||
) -> dict:
|
||||
"""Merge child workflow with parent (inheritance)."""
|
||||
# Start with parent as dict
|
||||
merged = {
|
||||
"name": child_data.get("name", parent.name),
|
||||
"description": child_data.get("description", parent.description),
|
||||
"version": child_data.get("version", parent.version),
|
||||
"applies_to": child_data.get("applies_to", parent.applies_to),
|
||||
"variables": {**parent.variables, **child_data.get("variables", {})},
|
||||
"stages": [],
|
||||
"post_process": {},
|
||||
}
|
||||
|
||||
# Merge stages (child can override by name)
|
||||
parent_stages = {s.name: s for s in parent.stages}
|
||||
child_stages = {s["name"]: s for s in child_data.get("stages", [])}
|
||||
|
||||
for name in list(parent_stages.keys()) + list(child_stages.keys()):
|
||||
if name in child_stages:
|
||||
# Child overrides parent
|
||||
stage_dict = child_stages[name]
|
||||
else:
|
||||
# Use parent stage
|
||||
stage = parent_stages[name]
|
||||
stage_dict = {
|
||||
"name": stage.name,
|
||||
"type": stage.type,
|
||||
"target": stage.target,
|
||||
"prompt": stage.prompt,
|
||||
"uses_history": stage.uses_history,
|
||||
"enabled": stage.enabled,
|
||||
}
|
||||
|
||||
if stage_dict not in merged["stages"]:
|
||||
merged["stages"].append(stage_dict)
|
||||
|
||||
# Merge post-processing
|
||||
parent_post = parent.post_process
|
||||
child_post = child_data.get("post_process", {})
|
||||
merged["post_process"] = {
|
||||
"remove_sections": child_post.get(
|
||||
"remove_sections", parent_post.remove_sections
|
||||
),
|
||||
"reorder_sections": child_post.get(
|
||||
"reorder_sections", parent_post.reorder_sections
|
||||
),
|
||||
"add_metadata": {
|
||||
**parent_post.add_metadata,
|
||||
**child_post.get("add_metadata", {}),
|
||||
},
|
||||
"custom_transforms": parent_post.custom_transforms
|
||||
+ child_post.get("custom_transforms", []),
|
||||
}
|
||||
|
||||
return merged
|
||||
|
||||
def run(self, analysis_results: dict, context: dict | None = None) -> dict:
|
||||
"""
|
||||
Run workflow stages sequentially.
|
||||
|
||||
Args:
|
||||
analysis_results: Results from analysis (patterns, examples, etc.)
|
||||
context: Additional context variables
|
||||
|
||||
Returns:
|
||||
Enhanced results after all stages
|
||||
"""
|
||||
logger.info(f"🚀 Starting workflow: {self.workflow.name}")
|
||||
logger.info(f" Description: {self.workflow.description}")
|
||||
logger.info(f" Stages: {len(self.workflow.stages)}")
|
||||
|
||||
current_results = analysis_results
|
||||
context = context or {}
|
||||
|
||||
# Merge workflow variables into context
|
||||
context.update(self.workflow.variables)
|
||||
|
||||
# Run each stage
|
||||
for idx, stage in enumerate(self.workflow.stages, 1):
|
||||
if not stage.enabled:
|
||||
logger.info(f"⏭️ Skipping disabled stage: {stage.name}")
|
||||
continue
|
||||
|
||||
logger.info(f"🔄 Running stage {idx}/{len(self.workflow.stages)}: {stage.name}")
|
||||
|
||||
# Build stage context
|
||||
stage_context = self._build_stage_context(
|
||||
stage, current_results, context
|
||||
)
|
||||
|
||||
# Run stage
|
||||
try:
|
||||
stage_results = self._run_stage(stage, stage_context)
|
||||
|
||||
# Save to history
|
||||
self.history.append(
|
||||
{
|
||||
"stage": stage.name,
|
||||
"results": stage_results,
|
||||
"timestamp": datetime.now().isoformat(),
|
||||
"metadata": stage.metadata,
|
||||
}
|
||||
)
|
||||
|
||||
# Merge stage results into current results
|
||||
current_results = self._merge_stage_results(
|
||||
current_results, stage_results, stage.target
|
||||
)
|
||||
|
||||
logger.info(f" ✅ Stage complete: {stage.name}")
|
||||
|
||||
except Exception as e:
|
||||
logger.error(f" ❌ Stage failed: {stage.name} - {e}")
|
||||
# Continue with next stage (optional: make this configurable)
|
||||
continue
|
||||
|
||||
# Post-processing
|
||||
logger.info("🔧 Running post-processing...")
|
||||
final_results = self._post_process(current_results)
|
||||
|
||||
logger.info(f"✅ Workflow complete: {self.workflow.name}")
|
||||
return final_results
|
||||
|
||||
def _build_stage_context(
|
||||
self, stage: WorkflowStage, current_results: dict, base_context: dict
|
||||
) -> dict:
|
||||
"""Build context for a stage (includes history if needed)."""
|
||||
context = {
|
||||
"current_results": current_results,
|
||||
**base_context,
|
||||
}
|
||||
|
||||
if stage.uses_history and self.history:
|
||||
# Add previous stage
|
||||
context["previous_results"] = self.history[-1]["results"]
|
||||
|
||||
# Add all history
|
||||
context["all_history"] = self.history
|
||||
|
||||
# Add stages by name for easy access
|
||||
context["stages"] = {h["stage"]: h["results"] for h in self.history}
|
||||
|
||||
return context
|
||||
|
||||
def _run_stage(self, stage: WorkflowStage, context: dict) -> dict:
|
||||
"""Run a single stage."""
|
||||
if stage.type == "builtin":
|
||||
return self._run_builtin_stage(stage, context)
|
||||
else:
|
||||
return self._run_custom_stage(stage, context)
|
||||
|
||||
def _run_builtin_stage(self, stage: WorkflowStage, context: dict) -> dict:
|
||||
"""Run built-in enhancement stage."""
|
||||
# Use existing enhancement system
|
||||
from skill_seekers.cli.ai_enhancer import PatternEnhancer, TestExampleEnhancer
|
||||
|
||||
current = context["current_results"]
|
||||
|
||||
# Determine what to enhance based on target
|
||||
if stage.target == "patterns" and "patterns" in current:
|
||||
enhancer = PatternEnhancer()
|
||||
enhanced_patterns = enhancer.enhance_patterns(current["patterns"])
|
||||
return {"patterns": enhanced_patterns}
|
||||
|
||||
elif stage.target == "examples" and "examples" in current:
|
||||
enhancer = TestExampleEnhancer()
|
||||
enhanced_examples = enhancer.enhance_examples(current["examples"])
|
||||
return {"examples": enhanced_examples}
|
||||
|
||||
else:
|
||||
logger.warning(f"Unknown builtin target: {stage.target}")
|
||||
return {}
|
||||
|
||||
def _run_custom_stage(self, stage: WorkflowStage, context: dict) -> dict:
|
||||
"""Run custom AI enhancement stage."""
|
||||
if not stage.prompt:
|
||||
logger.warning(f"Custom stage '{stage.name}' has no prompt")
|
||||
return {}
|
||||
|
||||
# Lazy load enhancer
|
||||
if not self.enhancer:
|
||||
from skill_seekers.cli.ai_enhancer import AIEnhancer
|
||||
|
||||
self.enhancer = AIEnhancer()
|
||||
|
||||
# Format prompt with context
|
||||
try:
|
||||
formatted_prompt = stage.prompt.format(**context)
|
||||
except KeyError as e:
|
||||
logger.warning(f"Missing context variable: {e}")
|
||||
formatted_prompt = stage.prompt
|
||||
|
||||
# Call AI with custom prompt
|
||||
logger.info(f" 🤖 Running custom AI prompt...")
|
||||
response = self.enhancer._call_claude(formatted_prompt, max_tokens=3000)
|
||||
|
||||
if not response:
|
||||
logger.warning(f" ⚠️ No response from AI")
|
||||
return {}
|
||||
|
||||
# Try to parse as JSON first, fallback to plain text
|
||||
try:
|
||||
result = json.loads(response)
|
||||
except json.JSONDecodeError:
|
||||
# Plain text response
|
||||
result = {"content": response, "stage": stage.name}
|
||||
|
||||
return result
|
||||
|
||||
def _merge_stage_results(
|
||||
self, current: dict, stage_results: dict, target: str
|
||||
) -> dict:
|
||||
"""Merge stage results into current results."""
|
||||
if target == "all":
|
||||
# Merge everything
|
||||
return {**current, **stage_results}
|
||||
else:
|
||||
# Merge only specific target
|
||||
current[target] = stage_results.get(target, stage_results)
|
||||
return current
|
||||
|
||||
def _post_process(self, results: dict) -> dict:
|
||||
"""Apply post-processing configuration."""
|
||||
config = self.workflow.post_process
|
||||
|
||||
# Remove sections
|
||||
for section in config.remove_sections:
|
||||
if section in results:
|
||||
logger.info(f" 🗑️ Removing section: {section}")
|
||||
del results[section]
|
||||
|
||||
# Add metadata
|
||||
if config.add_metadata:
|
||||
if "metadata" not in results:
|
||||
results["metadata"] = {}
|
||||
results["metadata"].update(config.add_metadata)
|
||||
logger.info(f" 📝 Added metadata: {list(config.add_metadata.keys())}")
|
||||
|
||||
# Reorder sections (for SKILL.md generation)
|
||||
if config.reorder_sections and "skill_md_sections" in results:
|
||||
logger.info(f" 🔄 Reordering sections...")
|
||||
# This will be used during SKILL.md generation
|
||||
results["section_order"] = config.reorder_sections
|
||||
|
||||
# Custom transforms (extensibility)
|
||||
for transform in config.custom_transforms:
|
||||
logger.info(f" ⚙️ Applying transform: {transform.get('name', 'unknown')}")
|
||||
# TODO: Implement custom transform system
|
||||
|
||||
return results
|
||||
|
||||
def save_history(self, output_path: Path):
|
||||
"""Save workflow execution history."""
|
||||
output_path = Path(output_path)
|
||||
output_path.parent.mkdir(parents=True, exist_ok=True)
|
||||
|
||||
history_data = {
|
||||
"workflow": self.workflow.name,
|
||||
"version": self.workflow.version,
|
||||
"executed_at": datetime.now().isoformat(),
|
||||
"stages": self.history,
|
||||
}
|
||||
|
||||
with open(output_path, "w", encoding="utf-8") as f:
|
||||
json.dump(history_data, f, indent=2)
|
||||
|
||||
logger.info(f"💾 Saved workflow history: {output_path}")
|
||||
|
||||
|
||||
def create_default_workflows():
|
||||
"""Create default workflow templates in user config directory."""
|
||||
config_dir = Path.home() / ".config" / "skill-seekers" / "workflows"
|
||||
config_dir.mkdir(parents=True, exist_ok=True)
|
||||
|
||||
# Default workflow
|
||||
default_workflow = {
|
||||
"name": "Default Enhancement",
|
||||
"description": "Standard AI enhancement with all features",
|
||||
"version": "1.0",
|
||||
"applies_to": ["codebase_analysis", "doc_scraping", "github_analysis"],
|
||||
"stages": [
|
||||
{
|
||||
"name": "base_analysis",
|
||||
"type": "builtin",
|
||||
"target": "patterns",
|
||||
"enabled": True,
|
||||
},
|
||||
{
|
||||
"name": "test_examples",
|
||||
"type": "builtin",
|
||||
"target": "examples",
|
||||
"enabled": True,
|
||||
},
|
||||
],
|
||||
"post_process": {
|
||||
"add_metadata": {"enhanced": True, "workflow": "default"}
|
||||
},
|
||||
}
|
||||
|
||||
# Security-focused workflow
|
||||
security_workflow = {
|
||||
"name": "Security-Focused Analysis",
|
||||
"description": "Emphasize security patterns and vulnerabilities",
|
||||
"version": "1.0",
|
||||
"applies_to": ["codebase_analysis"],
|
||||
"variables": {"focus_area": "security"},
|
||||
"stages": [
|
||||
{
|
||||
"name": "base_patterns",
|
||||
"type": "builtin",
|
||||
"target": "patterns",
|
||||
},
|
||||
{
|
||||
"name": "security_analysis",
|
||||
"type": "custom",
|
||||
"target": "security",
|
||||
"uses_history": True,
|
||||
"prompt": """Based on the patterns detected: {previous_results}
|
||||
|
||||
Perform deep security analysis:
|
||||
|
||||
1. **Authentication/Authorization**:
|
||||
- Auth bypass risks?
|
||||
- Token handling secure?
|
||||
- Session management issues?
|
||||
|
||||
2. **Input Validation**:
|
||||
- User input sanitized?
|
||||
- SQL injection risks?
|
||||
- XSS vulnerabilities?
|
||||
|
||||
3. **Data Exposure**:
|
||||
- Sensitive data in logs?
|
||||
- Secrets in config?
|
||||
- PII handling?
|
||||
|
||||
4. **Cryptography**:
|
||||
- Weak algorithms?
|
||||
- Hardcoded keys?
|
||||
- Insecure RNG?
|
||||
|
||||
Output as JSON with 'findings' array.""",
|
||||
},
|
||||
],
|
||||
"post_process": {
|
||||
"add_metadata": {"security_reviewed": True},
|
||||
},
|
||||
}
|
||||
|
||||
# Save workflows
|
||||
workflows = {
|
||||
"default.yaml": default_workflow,
|
||||
"security-focus.yaml": security_workflow,
|
||||
}
|
||||
|
||||
for filename, workflow_data in workflows.items():
|
||||
workflow_file = config_dir / filename
|
||||
if not workflow_file.exists():
|
||||
with open(workflow_file, "w", encoding="utf-8") as f:
|
||||
yaml.dump(workflow_data, f, default_flow_style=False, sort_keys=False)
|
||||
logger.info(f"✅ Created workflow: {workflow_file}")
|
||||
|
||||
return config_dir
|
||||
|
||||
|
||||
if __name__ == "__main__":
|
||||
# Create default workflows
|
||||
create_default_workflows()
|
||||
print("✅ Default workflows created!")
|
||||
476
src/skill_seekers/cli/unified_enhancer.py
Normal file
476
src/skill_seekers/cli/unified_enhancer.py
Normal file
@@ -0,0 +1,476 @@
|
||||
#!/usr/bin/env python3
|
||||
"""
|
||||
Unified AI Enhancement System
|
||||
|
||||
Replaces all separate enhancer classes with a single unified interface:
|
||||
- PatternEnhancer (C3.1)
|
||||
- TestExampleEnhancer (C3.2)
|
||||
- GuideEnhancer (C3.3)
|
||||
- ConfigEnhancer (C3.4)
|
||||
- SkillEnhancer (SKILL.md)
|
||||
|
||||
Benefits:
|
||||
- Single source of truth
|
||||
- No code duplication
|
||||
- Consistent behavior
|
||||
- Easy to maintain
|
||||
- Supports custom prompts via workflow system
|
||||
"""
|
||||
|
||||
import json
|
||||
import logging
|
||||
import os
|
||||
import subprocess
|
||||
import tempfile
|
||||
from concurrent.futures import ThreadPoolExecutor, as_completed
|
||||
from dataclasses import dataclass
|
||||
from pathlib import Path
|
||||
from typing import Any, Literal
|
||||
|
||||
logger = logging.getLogger(__name__)
|
||||
|
||||
# Import config manager for settings
|
||||
try:
|
||||
from skill_seekers.cli.config_manager import get_config_manager
|
||||
|
||||
CONFIG_AVAILABLE = True
|
||||
except ImportError:
|
||||
CONFIG_AVAILABLE = False
|
||||
|
||||
|
||||
@dataclass
|
||||
class EnhancementConfig:
|
||||
"""Configuration for enhancement."""
|
||||
|
||||
mode: Literal["auto", "api", "local"] = "auto"
|
||||
batch_size: int = 20
|
||||
parallel_workers: int = 3
|
||||
enabled: bool = True
|
||||
api_key: str | None = None
|
||||
|
||||
|
||||
class UnifiedEnhancer:
|
||||
"""
|
||||
Single unified AI enhancement system.
|
||||
|
||||
Supports all enhancement types:
|
||||
- patterns: Design pattern analysis
|
||||
- examples: Test example context
|
||||
- guides: How-to guide enhancement
|
||||
- config: Configuration pattern analysis
|
||||
- skill: SKILL.md enhancement
|
||||
- custom: Custom prompts via workflow system
|
||||
"""
|
||||
|
||||
def __init__(
|
||||
self,
|
||||
mode: str = "auto",
|
||||
api_key: str | None = None,
|
||||
enabled: bool = True,
|
||||
config: EnhancementConfig | None = None,
|
||||
):
|
||||
"""
|
||||
Initialize unified enhancer.
|
||||
|
||||
Args:
|
||||
mode: Enhancement mode - "auto", "api", or "local"
|
||||
api_key: Anthropic API key (uses env if None)
|
||||
enabled: Enable AI enhancement
|
||||
config: Optional EnhancementConfig object
|
||||
"""
|
||||
if config:
|
||||
self.config = config
|
||||
else:
|
||||
self.config = EnhancementConfig(
|
||||
mode=mode, api_key=api_key, enabled=enabled
|
||||
)
|
||||
|
||||
# Get settings from config manager
|
||||
if CONFIG_AVAILABLE:
|
||||
cfg = get_config_manager()
|
||||
self.config.batch_size = cfg.get_local_batch_size()
|
||||
self.config.parallel_workers = cfg.get_local_parallel_workers()
|
||||
|
||||
# Determine actual mode
|
||||
self.api_key = self.config.api_key or os.environ.get("ANTHROPIC_API_KEY")
|
||||
|
||||
if self.config.mode == "auto":
|
||||
if self.api_key:
|
||||
self.config.mode = "api"
|
||||
else:
|
||||
self.config.mode = "local"
|
||||
logger.info("ℹ️ No API key found, using LOCAL mode (Claude Code CLI)")
|
||||
|
||||
# Initialize API client if needed
|
||||
self.client = None
|
||||
if self.config.mode == "api" and self.config.enabled:
|
||||
try:
|
||||
import anthropic
|
||||
|
||||
client_kwargs = {"api_key": self.api_key}
|
||||
base_url = os.environ.get("ANTHROPIC_BASE_URL")
|
||||
if base_url:
|
||||
client_kwargs["base_url"] = base_url
|
||||
logger.info(f"✅ Using custom API base URL: {base_url}")
|
||||
self.client = anthropic.Anthropic(**client_kwargs)
|
||||
logger.info("✅ AI enhancement enabled (using Claude API)")
|
||||
except ImportError:
|
||||
logger.warning(
|
||||
"⚠️ anthropic package not installed, falling back to LOCAL mode"
|
||||
)
|
||||
self.config.mode = "local"
|
||||
except Exception as e:
|
||||
logger.warning(
|
||||
f"⚠️ Failed to initialize API client: {e}, falling back to LOCAL mode"
|
||||
)
|
||||
self.config.mode = "local"
|
||||
|
||||
if self.config.mode == "local" and self.config.enabled:
|
||||
if self._check_claude_cli():
|
||||
logger.info("✅ AI enhancement enabled (using LOCAL mode - Claude Code CLI)")
|
||||
else:
|
||||
logger.warning("⚠️ Claude Code CLI not found. AI enhancement disabled.")
|
||||
self.config.enabled = False
|
||||
|
||||
def _check_claude_cli(self) -> bool:
|
||||
"""Check if Claude Code CLI is available."""
|
||||
try:
|
||||
result = subprocess.run(
|
||||
["claude", "--version"],
|
||||
capture_output=True,
|
||||
text=True,
|
||||
timeout=5,
|
||||
)
|
||||
return result.returncode == 0
|
||||
except (FileNotFoundError, subprocess.TimeoutExpired):
|
||||
return False
|
||||
|
||||
def enhance(
|
||||
self,
|
||||
items: list[dict],
|
||||
enhancement_type: str,
|
||||
custom_prompt: str | None = None,
|
||||
) -> list[dict]:
|
||||
"""
|
||||
Universal enhancement method.
|
||||
|
||||
Args:
|
||||
items: List of items to enhance (patterns, examples, guides, etc.)
|
||||
enhancement_type: Type of enhancement ("pattern", "example", "guide", "config", "skill", "custom")
|
||||
custom_prompt: Optional custom prompt (overrides default)
|
||||
|
||||
Returns:
|
||||
Enhanced items
|
||||
"""
|
||||
if not self.config.enabled or not items:
|
||||
return items
|
||||
|
||||
# Get appropriate prompt
|
||||
if custom_prompt:
|
||||
prompt_template = custom_prompt
|
||||
else:
|
||||
prompt_template = self._get_default_prompt(enhancement_type)
|
||||
|
||||
# Batch processing
|
||||
batch_size = (
|
||||
self.config.batch_size
|
||||
if self.config.mode == "local"
|
||||
else 5 # API uses smaller batches
|
||||
)
|
||||
parallel_workers = (
|
||||
self.config.parallel_workers if self.config.mode == "local" else 1
|
||||
)
|
||||
|
||||
logger.info(
|
||||
f"🤖 Enhancing {len(items)} {enhancement_type}s with AI "
|
||||
f"({self.config.mode.upper()} mode: {batch_size} per batch, {parallel_workers} workers)..."
|
||||
)
|
||||
|
||||
# Create batches
|
||||
batches = []
|
||||
for i in range(0, len(items), batch_size):
|
||||
batches.append(items[i : i + batch_size])
|
||||
|
||||
# Process batches (parallel for LOCAL, sequential for API)
|
||||
if parallel_workers > 1 and len(batches) > 1:
|
||||
enhanced = self._enhance_parallel(batches, prompt_template)
|
||||
else:
|
||||
enhanced = []
|
||||
for batch in batches:
|
||||
batch_results = self._enhance_batch(batch, prompt_template)
|
||||
enhanced.extend(batch_results)
|
||||
|
||||
logger.info(f"✅ Enhanced {len(enhanced)} {enhancement_type}s")
|
||||
return enhanced
|
||||
|
||||
def _enhance_parallel(
|
||||
self, batches: list[list[dict]], prompt_template: str
|
||||
) -> list[dict]:
|
||||
"""Process batches in parallel using ThreadPoolExecutor."""
|
||||
results = [None] * len(batches) # Preserve order
|
||||
|
||||
with ThreadPoolExecutor(max_workers=self.config.parallel_workers) as executor:
|
||||
future_to_idx = {
|
||||
executor.submit(self._enhance_batch, batch, prompt_template): idx
|
||||
for idx, batch in enumerate(batches)
|
||||
}
|
||||
|
||||
completed = 0
|
||||
total = len(batches)
|
||||
for future in as_completed(future_to_idx):
|
||||
idx = future_to_idx[future]
|
||||
try:
|
||||
results[idx] = future.result()
|
||||
completed += 1
|
||||
|
||||
# Show progress
|
||||
if total < 10 or completed % 5 == 0 or completed == total:
|
||||
logger.info(f" Progress: {completed}/{total} batches completed")
|
||||
except Exception as e:
|
||||
logger.warning(f"⚠️ Batch {idx} failed: {e}")
|
||||
results[idx] = batches[idx] # Return unenhanced on failure
|
||||
|
||||
# Flatten results
|
||||
enhanced = []
|
||||
for batch_result in results:
|
||||
if batch_result:
|
||||
enhanced.extend(batch_result)
|
||||
return enhanced
|
||||
|
||||
def _enhance_batch(
|
||||
self, items: list[dict], prompt_template: str
|
||||
) -> list[dict]:
|
||||
"""Enhance a batch of items."""
|
||||
# Prepare prompt
|
||||
item_descriptions = []
|
||||
for idx, item in enumerate(items):
|
||||
desc = self._format_item_for_prompt(idx, item)
|
||||
item_descriptions.append(desc)
|
||||
|
||||
prompt = prompt_template.format(
|
||||
items="\n".join(item_descriptions), count=len(items)
|
||||
)
|
||||
|
||||
# Call AI
|
||||
response = self._call_claude(prompt, max_tokens=3000)
|
||||
|
||||
if not response:
|
||||
return items
|
||||
|
||||
# Parse response and merge with items
|
||||
try:
|
||||
analyses = json.loads(response)
|
||||
|
||||
for idx, item in enumerate(items):
|
||||
if idx < len(analyses):
|
||||
analysis = analyses[idx]
|
||||
item["ai_analysis"] = analysis
|
||||
|
||||
# Apply confidence boost if present
|
||||
if "confidence_boost" in analysis and "confidence" in item:
|
||||
boost = analysis["confidence_boost"]
|
||||
if -0.2 <= boost <= 0.2:
|
||||
item["confidence"] = min(
|
||||
1.0, max(0.0, item["confidence"] + boost)
|
||||
)
|
||||
|
||||
return items
|
||||
|
||||
except json.JSONDecodeError:
|
||||
logger.warning("⚠️ Failed to parse AI response, returning items unchanged")
|
||||
return items
|
||||
except Exception as e:
|
||||
logger.warning(f"⚠️ Error processing AI analysis: {e}")
|
||||
return items
|
||||
|
||||
def _call_claude(self, prompt: str, max_tokens: int = 1000) -> str | None:
|
||||
"""Call Claude (API or LOCAL mode) with error handling."""
|
||||
if self.config.mode == "api":
|
||||
return self._call_claude_api(prompt, max_tokens)
|
||||
elif self.config.mode == "local":
|
||||
return self._call_claude_local(prompt)
|
||||
return None
|
||||
|
||||
def _call_claude_api(self, prompt: str, max_tokens: int = 1000) -> str | None:
|
||||
"""Call Claude API."""
|
||||
if not self.client:
|
||||
return None
|
||||
|
||||
try:
|
||||
response = self.client.messages.create(
|
||||
model="claude-sonnet-4-20250514",
|
||||
max_tokens=max_tokens,
|
||||
messages=[{"role": "user", "content": prompt}],
|
||||
)
|
||||
return response.content[0].text
|
||||
except Exception as e:
|
||||
logger.warning(f"⚠️ API call failed: {e}")
|
||||
return None
|
||||
|
||||
def _call_claude_local(self, prompt: str) -> str | None:
|
||||
"""Call Claude Code CLI in LOCAL mode."""
|
||||
try:
|
||||
with tempfile.TemporaryDirectory() as temp_dir:
|
||||
temp_path = Path(temp_dir)
|
||||
|
||||
# Write prompt to file
|
||||
prompt_file = temp_path / "prompt.txt"
|
||||
prompt_file.write_text(prompt)
|
||||
|
||||
# Output file
|
||||
output_file = temp_path / "response.json"
|
||||
|
||||
# Call Claude CLI
|
||||
result = subprocess.run(
|
||||
[
|
||||
"claude",
|
||||
str(prompt_file),
|
||||
"--output",
|
||||
str(output_file),
|
||||
"--model",
|
||||
"sonnet",
|
||||
],
|
||||
capture_output=True,
|
||||
text=True,
|
||||
timeout=120,
|
||||
cwd=str(temp_path),
|
||||
)
|
||||
|
||||
if result.returncode != 0:
|
||||
logger.warning(f"⚠️ Claude CLI returned error: {result.returncode}")
|
||||
return None
|
||||
|
||||
# Read output
|
||||
if output_file.exists():
|
||||
response_text = output_file.read_text()
|
||||
try:
|
||||
json.loads(response_text)
|
||||
return response_text
|
||||
except json.JSONDecodeError:
|
||||
# Try to extract JSON
|
||||
import re
|
||||
|
||||
json_match = re.search(r"\[[\s\S]*\]|\{[\s\S]*\}", response_text)
|
||||
if json_match:
|
||||
return json_match.group()
|
||||
return None
|
||||
else:
|
||||
for json_file in temp_path.glob("*.json"):
|
||||
if json_file.name != "prompt.json":
|
||||
return json_file.read_text()
|
||||
return None
|
||||
|
||||
except subprocess.TimeoutExpired:
|
||||
logger.warning("⚠️ Claude CLI timeout (2 minutes)")
|
||||
return None
|
||||
except Exception as e:
|
||||
logger.warning(f"⚠️ LOCAL mode error: {e}")
|
||||
return None
|
||||
|
||||
def _get_default_prompt(self, enhancement_type: str) -> str:
|
||||
"""Get default prompt for enhancement type."""
|
||||
prompts = {
|
||||
"pattern": """Analyze these {count} design patterns and provide insights:
|
||||
|
||||
{items}
|
||||
|
||||
For EACH pattern, provide (in JSON format):
|
||||
1. "explanation": Brief why this pattern was detected (1-2 sentences)
|
||||
2. "issues": List of potential issues or anti-patterns (if any)
|
||||
3. "recommendations": Suggestions for improvement (if any)
|
||||
4. "related_patterns": Other patterns that might be relevant
|
||||
5. "confidence_boost": Confidence adjustment from -0.2 to +0.2
|
||||
|
||||
Format as JSON array matching input order. Be concise and actionable.""",
|
||||
"example": """Analyze these {count} test examples and provide context:
|
||||
|
||||
{items}
|
||||
|
||||
For EACH example, provide (in JSON format):
|
||||
1. "context": What this example demonstrates (1-2 sentences)
|
||||
2. "best_practices": What's done well
|
||||
3. "common_use_cases": When to use this pattern
|
||||
4. "related_examples": Similar examples
|
||||
5. "confidence_boost": Confidence adjustment from -0.2 to +0.2
|
||||
|
||||
Format as JSON array matching input order.""",
|
||||
"guide": """Enhance these {count} how-to guides:
|
||||
|
||||
{items}
|
||||
|
||||
For EACH guide, add:
|
||||
1. "prerequisites": What users need to know first
|
||||
2. "troubleshooting": Common issues and solutions
|
||||
3. "next_steps": What to learn after this
|
||||
4. "use_cases": Real-world scenarios
|
||||
|
||||
Format as JSON array.""",
|
||||
"config": """Analyze these {count} configuration patterns:
|
||||
|
||||
{items}
|
||||
|
||||
For EACH pattern, provide:
|
||||
1. "purpose": Why this configuration exists
|
||||
2. "common_values": Typical values used
|
||||
3. "security_implications": Any security concerns
|
||||
4. "best_practices": Recommended configuration
|
||||
|
||||
Format as JSON array.""",
|
||||
}
|
||||
|
||||
return prompts.get(enhancement_type, prompts["pattern"])
|
||||
|
||||
def _format_item_for_prompt(self, idx: int, item: dict) -> str:
|
||||
"""Format item for inclusion in prompt."""
|
||||
# Pattern formatting
|
||||
if "pattern_type" in item:
|
||||
return f"{idx + 1}. {item['pattern_type']} in {item.get('class_name', 'unknown')}\n Evidence: {', '.join(item.get('evidence', []))}"
|
||||
|
||||
# Example formatting
|
||||
elif "category" in item and "code" in item:
|
||||
return f"{idx + 1}. {item['category']}: {item['code'][:100]}"
|
||||
|
||||
# Generic formatting
|
||||
else:
|
||||
desc = item.get("description", item.get("name", str(item)))
|
||||
return f"{idx + 1}. {desc}"
|
||||
|
||||
|
||||
# Backward compatibility aliases
|
||||
class PatternEnhancer(UnifiedEnhancer):
|
||||
"""Backward compatible pattern enhancer."""
|
||||
|
||||
def enhance_patterns(self, patterns: list[dict]) -> list[dict]:
|
||||
return self.enhance(patterns, "pattern")
|
||||
|
||||
|
||||
class TestExampleEnhancer(UnifiedEnhancer):
|
||||
"""Backward compatible test example enhancer."""
|
||||
|
||||
def enhance_examples(self, examples: list[dict]) -> list[dict]:
|
||||
return self.enhance(examples, "example")
|
||||
|
||||
|
||||
class GuideEnhancer(UnifiedEnhancer):
|
||||
"""Backward compatible guide enhancer."""
|
||||
|
||||
def enhance_guides(self, guides: list[dict]) -> list[dict]:
|
||||
return self.enhance(guides, "guide")
|
||||
|
||||
|
||||
class ConfigEnhancer(UnifiedEnhancer):
|
||||
"""Backward compatible config enhancer."""
|
||||
|
||||
def enhance_config(self, config: list[dict]) -> list[dict]:
|
||||
return self.enhance(config, "config")
|
||||
|
||||
|
||||
# Main enhancer export
|
||||
AIEnhancer = UnifiedEnhancer
|
||||
|
||||
if __name__ == "__main__":
|
||||
# Quick test
|
||||
enhancer = UnifiedEnhancer(mode="local", enabled=False)
|
||||
print(f"✅ Mode: {enhancer.config.mode}")
|
||||
print(f"✅ Batch size: {enhancer.config.batch_size}")
|
||||
print(f"✅ Workers: {enhancer.config.parallel_workers}")
|
||||
Reference in New Issue
Block a user