skill-seekers-reference/tests/test_issue_219_e2e.py

#!/usr/bin/env python3
"""
End-to-End Tests for Issue #219 - All Three Problems

Tests verify complete fixes for:
1. Large file encoding error (ccxt/ccxt 1.4MB CHANGELOG)
2. Missing --enhance-local CLI flag
3. Custom API endpoint support (ANTHROPIC_BASE_URL, ANTHROPIC_AUTH_TOKEN)
"""

import os
import shutil
import subprocess
import sys
import tempfile
import unittest
from pathlib import Path
from types import SimpleNamespace
from unittest.mock import Mock, patch

# Add src to path
sys.path.insert(0, os.path.join(os.path.dirname(__file__), "..", "src"))

# Check if anthropic is available
try:
    import anthropic  # noqa: F401

    ANTHROPIC_AVAILABLE = True
except ImportError:
    ANTHROPIC_AVAILABLE = False


class TestIssue219Problem1LargeFiles(unittest.TestCase):
    """E2E Test: Problem #1 - Large file download via download_url"""

    def setUp(self):
        """Set up test environment"""
        try:
            from github import Github, GithubException  # noqa: F401

            self.PYGITHUB_AVAILABLE = True
        except ImportError:
            self.PYGITHUB_AVAILABLE = False

        if not self.PYGITHUB_AVAILABLE:
            self.skipTest("PyGithub not installed")

        from skill_seekers.cli.github_scraper import GitHubScraper

        self.GitHubScraper = GitHubScraper

    def test_large_file_extraction_end_to_end(self):
        """E2E: Verify large files (encoding='none') are downloaded via URL"""

        config = {"repo": "ccxt/ccxt", "name": "ccxt", "github_token": None}

        # Mock large CHANGELOG (1.4MB, encoding="none")
        mock_content = Mock()
        mock_content.type = "file"
        mock_content.encoding = "none"  # This is what GitHub API returns for large files
        mock_content.size = 1388271
        mock_content.download_url = (
            "https://raw.githubusercontent.com/ccxt/ccxt/master/CHANGELOG.md"
        )

        with patch("skill_seekers.cli.github_scraper.Github"):
            scraper = self.GitHubScraper(config)
            scraper.repo = Mock()
            scraper.repo.get_contents.return_value = mock_content

            # Mock requests.get for download
            with patch("requests.get") as mock_requests:
                mock_response = Mock()
                mock_response.text = "# CCXT Changelog\n\n## v4.4.20\n- Bug fixes"
                mock_response.raise_for_status = Mock()
                mock_requests.return_value = mock_response

                # Call _extract_changelog (full workflow)
                scraper._extract_changelog()

                # VERIFY: download_url was called
                mock_requests.assert_called_once_with(
                    "https://raw.githubusercontent.com/ccxt/ccxt/master/CHANGELOG.md",
                    timeout=30,
                )

                # VERIFY: CHANGELOG was extracted successfully
                self.assertIn("changelog", scraper.extracted_data)
                self.assertIn("Bug fixes", scraper.extracted_data["changelog"])
                self.assertEqual(scraper.extracted_data["changelog"], mock_response.text)

    def test_large_file_fallback_on_error(self):
        """E2E: Verify graceful handling if download_url fails"""

        config = {"repo": "test/repo", "name": "test", "github_token": None}

        # Mock large file without download_url
        mock_content = Mock()
        mock_content.type = "file"
        mock_content.encoding = "none"
        mock_content.size = 2000000
        mock_content.download_url = None  # Missing download URL

        with patch("skill_seekers.cli.github_scraper.Github"):
            scraper = self.GitHubScraper(config)
            scraper.repo = Mock()
            scraper.repo.get_contents.return_value = mock_content

            # Should return None gracefully
            result = scraper._get_file_content("CHANGELOG.md")
            self.assertIsNone(result)

            # Should not crash
            scraper._extract_changelog()
            self.assertEqual(scraper.extracted_data["changelog"], "")


class TestIssue219Problem2CLIFlags(unittest.TestCase):
    """E2E Test: Problem #2 - CLI flags working through create command"""

    def test_create_command_has_enhancement_flags(self):
        """E2E: Verify --enhance-level flag exists in create command help"""
        result = subprocess.run(
            ["skill-seekers", "create", "--help"], capture_output=True, text=True
        )

        # VERIFY: Command succeeds
        self.assertEqual(result.returncode, 0, "create --help should succeed")

        # VERIFY: Enhancement flags present
        self.assertIn("--enhance-level", result.stdout, "Missing --enhance-level flag")

    def test_enhance_level_flag_accepted_by_create(self):
        """E2E: Verify --enhance-level flag is accepted by create command parser"""
        from skill_seekers.cli.main import create_parser

        parser = create_parser()

        # VERIFY: Parsing succeeds without "unrecognized arguments" error
        try:
            args = parser.parse_args(["create", "owner/repo", "--enhance-level", "2"])
            self.assertEqual(args.enhance_level, 2, "Flag should be parsed as 2")
        except SystemExit as e:
            self.fail(f"Argument parsing failed with: {e}")

    def test_github_scraper_class_accepts_enhance_level(self):
        """E2E: Verify GitHubScraper config accepts enhance_level."""
        from skill_seekers.cli.github_scraper import GitHubScraper

        config = {
            "repo": "test/test",
            "name": "test",
            "github_token": None,
            "enhance_level": 2,
        }

        with patch("skill_seekers.cli.github_scraper.Github"):
            scraper = GitHubScraper(config)
            # Just verify it doesn't crash with enhance_level in config
            self.assertIsNotNone(scraper)


@unittest.skipIf(not ANTHROPIC_AVAILABLE, "anthropic package not installed")
class TestIssue219Problem3CustomAPIEndpoints(unittest.TestCase):
    """E2E Test: Problem #3 - Custom API endpoint support"""

    def setUp(self):
        """Set up test environment"""
        self.temp_dir = tempfile.mkdtemp()
        self.skill_dir = Path(self.temp_dir) / "test_skill"
        self.skill_dir.mkdir()

        # Create minimal SKILL.md
        (self.skill_dir / "SKILL.md").write_text("# Test Skill\n", encoding="utf-8")

        # Create references directory
        refs_dir = self.skill_dir / "references"
        refs_dir.mkdir()
        (refs_dir / "index.md").write_text("# Index\n", encoding="utf-8")

    def tearDown(self):
        """Clean up test environment"""
        shutil.rmtree(self.temp_dir, ignore_errors=True)

    def test_anthropic_base_url_support(self):
        """E2E: Verify ANTHROPIC_BASE_URL environment variable is supported"""
        try:
            from skill_seekers.cli.enhance_skill import SkillEnhancer
        except ImportError:
            self.skipTest("anthropic package not installed")

        # Set custom base URL
        custom_url = "http://localhost:3000"

        with (
            patch.dict(
                os.environ,
                {"ANTHROPIC_API_KEY": "test-key-123", "ANTHROPIC_BASE_URL": custom_url},
            ),
            patch("skill_seekers.cli.enhance_skill.anthropic.Anthropic") as mock_anthropic,
        ):
            # Create enhancer
            _enhancer = SkillEnhancer(self.skill_dir)

            # VERIFY: Anthropic client called with custom base_url
            mock_anthropic.assert_called_once()
            call_kwargs = mock_anthropic.call_args[1]
            self.assertIn("base_url", call_kwargs, "base_url should be passed")
            self.assertEqual(
                call_kwargs["base_url"],
                custom_url,
                "base_url should match ANTHROPIC_BASE_URL env var",
            )

    def test_anthropic_auth_token_support(self):
        """E2E: Verify ANTHROPIC_AUTH_TOKEN is accepted as alternative to ANTHROPIC_API_KEY"""
        try:
            from skill_seekers.cli.enhance_skill import SkillEnhancer
        except ImportError:
            self.skipTest("anthropic package not installed")

        custom_token = "custom-auth-token-456"

        # Use ANTHROPIC_AUTH_TOKEN instead of ANTHROPIC_API_KEY
        with (
            patch.dict(os.environ, {"ANTHROPIC_AUTH_TOKEN": custom_token}, clear=True),
            patch("skill_seekers.cli.enhance_skill.anthropic.Anthropic") as mock_anthropic,
        ):
            # Create enhancer (should accept ANTHROPIC_AUTH_TOKEN)
            enhancer = SkillEnhancer(self.skill_dir)

            # VERIFY: api_key set to ANTHROPIC_AUTH_TOKEN value
            self.assertEqual(
                enhancer.api_key,
                custom_token,
                "Should use ANTHROPIC_AUTH_TOKEN when ANTHROPIC_API_KEY not set",
            )

            # VERIFY: Anthropic client initialized with correct key
            mock_anthropic.assert_called_once()
            call_kwargs = mock_anthropic.call_args[1]
            self.assertEqual(
                call_kwargs["api_key"],
                custom_token,
                "api_key should match ANTHROPIC_AUTH_TOKEN",
            )

    def test_thinking_block_handling(self):
        """E2E: Verify ThinkingBlock doesn't cause .text AttributeError"""
        try:
            from skill_seekers.cli.enhance_skill import SkillEnhancer
        except ImportError:
            self.skipTest("anthropic package not installed")

        with (
            patch.dict(os.environ, {"ANTHROPIC_API_KEY": "test-key"}),
            patch("skill_seekers.cli.enhance_skill.anthropic.Anthropic") as mock_anthropic,
        ):
            enhancer = SkillEnhancer(self.skill_dir)

            # Mock response with ThinkingBlock (newer SDK)
            # ThinkingBlock has no .text attribute
            mock_thinking_block = SimpleNamespace(type="thinking")

            # TextBlock has .text attribute
            mock_text_block = SimpleNamespace(text="# Enhanced SKILL.md\n\nContent here")

            mock_message = Mock()
            mock_message.content = [mock_thinking_block, mock_text_block]

            mock_client = mock_anthropic.return_value
            mock_client.messages.create.return_value = mock_message

            # Read references (with proper metadata structure)
            references = {
                "index.md": {
                    "content": "# Index\nTest content",
                    "source": "documentation",
                    "confidence": "high",
                    "path": "index.md",
                    "truncated": False,
                    "size": 23,
                    "repo_id": None,
                }
            }

            # Call enhance_skill_md (should handle ThinkingBlock gracefully)
            result = enhancer.enhance_skill_md(references, current_skill_md="# Old")

            # VERIFY: Should find text from TextBlock, ignore ThinkingBlock
            self.assertIsNotNone(result, "Should return enhanced content")
            self.assertEqual(
                result,
                "# Enhanced SKILL.md\n\nContent here",
                "Should extract text from TextBlock",
            )


@unittest.skipIf(not ANTHROPIC_AVAILABLE, "anthropic package not installed")
class TestIssue219IntegrationAll(unittest.TestCase):
    """E2E Integration: All 3 problems together"""

    def test_all_fixes_work_together(self):
        """E2E: Verify all 3 fixes work in combination"""
        # This test verifies the complete workflow:
        # 1. CLI accepts --enhance-level via create command
        # 2. Large files are downloaded
        # 3. Custom API endpoints work

        result = subprocess.run(
            ["skill-seekers", "create", "--help"], capture_output=True, text=True
        )

        # Enhancement flags present
        self.assertIn("--enhance-level", result.stdout)

        # Verify we can import all fixed modules
        try:
            from skill_seekers.cli import main  # noqa: F401
            from skill_seekers.cli.enhance_skill import SkillEnhancer  # noqa: F401
            from skill_seekers.cli.github_scraper import GitHubScraper  # noqa: F401

            # All imports successful
            self.assertTrue(True, "All modules import successfully")
        except ImportError as e:
            self.fail(f"Module import failed: {e}")


if __name__ == "__main__":
    # Run tests with verbose output
    unittest.main(verbosity=2)