SPARC/tests/test_llm.py

"""Tests for LLM analysis functionality."""

import pytest
from unittest.mock import Mock, MagicMock
from SPARC.llm import LLMAnalyzer


class TestLLMAnalyzer:
    """Test LLM analyzer initialization and API interaction."""

    def test_analyzer_initialization_with_api_key(self, mocker):
        """Test that analyzer initializes with provided API key."""
        mock_anthropic = mocker.patch("SPARC.llm.Anthropic")

        analyzer = LLMAnalyzer(api_key="test-key-123")

        mock_anthropic.assert_called_once_with(api_key="test-key-123")
        assert analyzer.model == "claude-3-5-sonnet-20241022"

    def test_analyzer_initialization_from_config(self, mocker):
        """Test that analyzer loads API key from config when not provided."""
        mock_anthropic = mocker.patch("SPARC.llm.Anthropic")
        mock_config = mocker.patch("SPARC.llm.config")
        mock_config.anthropic_api_key = "config-key-456"

        analyzer = LLMAnalyzer()

        mock_anthropic.assert_called_once_with(api_key="config-key-456")

    def test_analyze_patent_content(self, mocker):
        """Test single patent content analysis."""
        mock_anthropic = mocker.patch("SPARC.llm.Anthropic")
        mock_client = Mock()
        mock_anthropic.return_value = mock_client

        # Mock the API response
        mock_response = Mock()
        mock_response.content = [Mock(text="Innovative GPU architecture.")]
        mock_client.messages.create.return_value = mock_response

        analyzer = LLMAnalyzer(api_key="test-key")
        result = analyzer.analyze_patent_content(
            patent_content="ABSTRACT: GPU with new cache design...",
            company_name="NVIDIA",
        )

        assert result == "Innovative GPU architecture."
        mock_client.messages.create.assert_called_once()

        # Verify the prompt includes company name and content
        call_args = mock_client.messages.create.call_args
        prompt_text = call_args[1]["messages"][0]["content"]
        assert "NVIDIA" in prompt_text
        assert "GPU with new cache design" in prompt_text

    def test_analyze_patent_portfolio(self, mocker):
        """Test portfolio analysis with multiple patents."""
        mock_anthropic = mocker.patch("SPARC.llm.Anthropic")
        mock_client = Mock()
        mock_anthropic.return_value = mock_client

        # Mock the API response
        mock_response = Mock()
        mock_response.content = [
            Mock(text="Strong portfolio in AI and graphics.")
        ]
        mock_client.messages.create.return_value = mock_response

        analyzer = LLMAnalyzer(api_key="test-key")
        patents_data = [
            {"patent_id": "US123", "content": "AI acceleration patent"},
            {"patent_id": "US456", "content": "Graphics rendering patent"},
        ]

        result = analyzer.analyze_patent_portfolio(
            patents_data=patents_data, company_name="NVIDIA"
        )

        assert result == "Strong portfolio in AI and graphics."
        mock_client.messages.create.assert_called_once()

        # Verify the prompt includes all patents
        call_args = mock_client.messages.create.call_args
        prompt_text = call_args[1]["messages"][0]["content"]
        assert "US123" in prompt_text
        assert "US456" in prompt_text
        assert "AI acceleration patent" in prompt_text
        assert "Graphics rendering patent" in prompt_text

    def test_analyze_patent_portfolio_with_correct_token_limit(self, mocker):
        """Test that portfolio analysis uses higher token limit."""
        mock_anthropic = mocker.patch("SPARC.llm.Anthropic")
        mock_client = Mock()
        mock_anthropic.return_value = mock_client

        mock_response = Mock()
        mock_response.content = [Mock(text="Analysis result.")]
        mock_client.messages.create.return_value = mock_response

        analyzer = LLMAnalyzer(api_key="test-key")
        patents_data = [{"patent_id": "US123", "content": "Test content"}]

        analyzer.analyze_patent_portfolio(patents_data, "TestCo")

        call_args = mock_client.messages.create.call_args
        # Portfolio analysis should use 2048 tokens
        assert call_args[1]["max_tokens"] == 2048

    def test_analyze_single_patent_with_correct_token_limit(self, mocker):
        """Test that single patent analysis uses lower token limit."""
        mock_anthropic = mocker.patch("SPARC.llm.Anthropic")
        mock_client = Mock()
        mock_anthropic.return_value = mock_client

        mock_response = Mock()
        mock_response.content = [Mock(text="Analysis result.")]
        mock_client.messages.create.return_value = mock_response

        analyzer = LLMAnalyzer(api_key="test-key")
        analyzer.analyze_patent_content("Test content", "TestCo")

        call_args = mock_client.messages.create.call_args
        # Single patent should use 1024 tokens
        assert call_args[1]["max_tokens"] == 1024