llm/tests/test_utils.py

import pytest
from llm.utils import (
    simplify_usage_dict,
    extract_fenced_code_block,
    maybe_fenced_code,
    truncate_string,
    schema_dsl,
)


@pytest.mark.parametrize(
    "input_data,expected_output",
    [
        (
            {
                "prompt_tokens_details": {"cached_tokens": 0, "audio_tokens": 0},
                "completion_tokens_details": {
                    "reasoning_tokens": 0,
                    "audio_tokens": 1,
                    "accepted_prediction_tokens": 0,
                    "rejected_prediction_tokens": 0,
                },
            },
            {"completion_tokens_details": {"audio_tokens": 1}},
        ),
        (
            {
                "details": {"tokens": 5, "audio_tokens": 2},
                "more_details": {"accepted_tokens": 3},
            },
            {
                "details": {"tokens": 5, "audio_tokens": 2},
                "more_details": {"accepted_tokens": 3},
            },
        ),
        ({"details": {"tokens": 0, "audio_tokens": 0}, "more_details": {}}, {}),
        ({"level1": {"level2": {"value": 0, "another_value": {}}}}, {}),
        (
            {
                "level1": {"level2": {"value": 0, "another_value": 1}},
                "level3": {"empty_dict": {}, "valid_token": 10},
            },
            {"level1": {"level2": {"another_value": 1}}, "level3": {"valid_token": 10}},
        ),
    ],
)
def test_simplify_usage_dict(input_data, expected_output):
    # This utility function is used by at least one plugin - llm-openai-plugin
    assert simplify_usage_dict(input_data) == expected_output


@pytest.mark.parametrize(
    "input,last,expected",
    [
        ["This is a sample text without any code blocks.", False, None],
        [
            "Here is some text.\n\n```\ndef foo():\n    return 'bar'\n```\n\nMore text.",
            False,
            "def foo():\n    return 'bar'\n",
        ],
        [
            "Here is some text.\n\n```python\ndef foo():\n    return 'bar'\n```\n\nMore text.",
            False,
            "def foo():\n    return 'bar'\n",
        ],
        [
            "Here is some text.\n\n````\ndef foo():\n    return 'bar'\n````\n\nMore text.",
            False,
            "def foo():\n    return 'bar'\n",
        ],
        [
            "Here is some text.\n\n````javascript\nfunction foo() {\n    return 'bar';\n}\n````\n\nMore text.",
            False,
            "function foo() {\n    return 'bar';\n}\n",
        ],
        [
            "Here is some text.\n\n```python\ndef foo():\n    return 'bar'\n````\n\nMore text.",
            False,
            None,
        ],
        [
            "First code block:\n\n```python\ndef foo():\n    return 'bar'\n```\n\n"
            "Second code block:\n\n```javascript\nfunction foo() {\n    return 'bar';\n}\n```",
            False,
            "def foo():\n    return 'bar'\n",
        ],
        [
            "First code block:\n\n```python\ndef foo():\n    return 'bar'\n```\n\n"
            "Second code block:\n\n```javascript\nfunction foo() {\n    return 'bar';\n}\n```",
            True,
            "function foo() {\n    return 'bar';\n}\n",
        ],
        [
            "First code block:\n\n```python\ndef foo():\n    return 'bar'\n```\n\n"
            # This one has trailing whitespace after the second code block:
            # https://github.com/simonw/llm/pull/718#issuecomment-2613177036
            "Second code block:\n\n```javascript\nfunction foo() {\n    return 'bar';\n}\n``` ",
            True,
            "function foo() {\n    return 'bar';\n}\n",
        ],
        [
            "Here is some text.\n\n```python\ndef foo():\n    return `bar`\n```\n\nMore text.",
            False,
            "def foo():\n    return `bar`\n",
        ],
    ],
)
def test_extract_fenced_code_block(input, last, expected):
    actual = extract_fenced_code_block(input, last=last)
    assert actual == expected


@pytest.mark.parametrize(
    "schema, expected",
    [
        # Test case 1: Basic comma-separated fields, default string type
        (
            "name, bio",
            {
                "type": "object",
                "properties": {"name": {"type": "string"}, "bio": {"type": "string"}},
                "required": ["name", "bio"],
            },
        ),
        # Test case 2: Comma-separated fields with types
        (
            "name, age int, balance float, active bool",
            {
                "type": "object",
                "properties": {
                    "name": {"type": "string"},
                    "age": {"type": "integer"},
                    "balance": {"type": "number"},
                    "active": {"type": "boolean"},
                },
                "required": ["name", "age", "balance", "active"],
            },
        ),
        # Test case 3: Comma-separated fields with descriptions
        (
            "name: full name, age int: years old",
            {
                "type": "object",
                "properties": {
                    "name": {"type": "string", "description": "full name"},
                    "age": {"type": "integer", "description": "years old"},
                },
                "required": ["name", "age"],
            },
        ),
        # Test case 4: Newline-separated fields
        (
            """
        name
        bio
        age int
        """,
            {
                "type": "object",
                "properties": {
                    "name": {"type": "string"},
                    "bio": {"type": "string"},
                    "age": {"type": "integer"},
                },
                "required": ["name", "bio", "age"],
            },
        ),
        # Test case 5: Newline-separated with descriptions containing commas
        (
            """
        name: the person's name
        age int: their age in years, must be positive
        bio: a short bio, no more than three sentences
        """,
            {
                "type": "object",
                "properties": {
                    "name": {"type": "string", "description": "the person's name"},
                    "age": {
                        "type": "integer",
                        "description": "their age in years, must be positive",
                    },
                    "bio": {
                        "type": "string",
                        "description": "a short bio, no more than three sentences",
                    },
                },
                "required": ["name", "age", "bio"],
            },
        ),
        # Test case 6: Empty schema
        ("", {"type": "object", "properties": {}, "required": []}),
        # Test case 7: Explicit string type
        (
            "name str, description str",
            {
                "type": "object",
                "properties": {
                    "name": {"type": "string"},
                    "description": {"type": "string"},
                },
                "required": ["name", "description"],
            },
        ),
        # Test case 8: Extra whitespace
        (
            "  name  ,  age   int  :  person's age  ",
            {
                "type": "object",
                "properties": {
                    "name": {"type": "string"},
                    "age": {"type": "integer", "description": "person's age"},
                },
                "required": ["name", "age"],
            },
        ),
    ],
)
def test_schema_dsl(schema, expected):
    result = schema_dsl(schema)
    assert result == expected


def test_schema_dsl_multi():
    result = schema_dsl("name, age int: The age", multi=True)
    assert result == {
        "type": "object",
        "properties": {
            "items": {
                "type": "array",
                "items": {
                    "type": "object",
                    "properties": {
                        "name": {"type": "string"},
                        "age": {"type": "integer", "description": "The age"},
                    },
                    "required": ["name", "age"],
                },
            }
        },
        "required": ["items"],
    }


@pytest.mark.parametrize(
    "text, max_length, normalize_whitespace, keep_end, expected",
    [
        # Basic truncation tests
        ("Hello, world!", 100, False, False, "Hello, world!"),
        ("Hello, world!", 5, False, False, "He..."),
        ("", 10, False, False, ""),
        (None, 10, False, False, None),
        # Normalize whitespace tests
        ("Hello   world!", 100, True, False, "Hello world!"),
        ("Hello \n\t world!", 100, True, False, "Hello world!"),
        ("Hello   world!", 5, True, False, "He..."),
        # Keep end tests
        ("Hello, world!", 10, False, True, "He... d!"),
        ("Hello, world!", 7, False, False, "Hell..."),  # Now using regular truncation
        ("1234567890", 7, False, False, "1234..."),  # Now using regular truncation
        # Combinations of parameters
        ("Hello   world!", 10, True, True, "He... d!"),
        # Note: After normalization, "Hello world!" is exactly 12 chars, so no truncation
        ("Hello \n\t world!", 12, True, True, "Hello world!"),
        # Edge cases
        ("12345", 5, False, False, "12345"),
        ("123456", 5, False, False, "12..."),
        ("12345", 5, False, True, "12345"),  # Unchanged for exact fit
        ("123456", 5, False, False, "12..."),  # Regular truncation for small max_length
        # Very long string
        ("A" * 200, 10, False, False, "AAAAAAA..."),
        ("A" * 200, 10, False, True, "AA... AA"),  # keep_end with adequate length
        # Exact boundary cases
        ("123456789", 9, False, False, "123456789"),  # Exact fit
        ("1234567890", 9, False, False, "123456..."),  # Simple truncation
        ("123456789", 9, False, True, "123456789"),  # Exact fit with keep_end
        ("1234567890", 9, False, True, "12... 90"),  # keep_end truncation
        # Minimum sensible length tests for keep_end
        (
            "1234567890",
            8,
            False,
            True,
            "12345...",
        ),  # Too small for keep_end, use regular
        ("1234567890", 9, False, True, "12... 90"),  # Just enough for keep_end
    ],
)
def test_truncate_string(text, max_length, normalize_whitespace, keep_end, expected):
    """Test the truncate_string function with various inputs and parameters."""
    result = truncate_string(
        text=text,
        max_length=max_length,
        normalize_whitespace=normalize_whitespace,
        keep_end=keep_end,
    )
    assert result == expected


@pytest.mark.parametrize(
    "text, max_length, keep_end, prefix_len, expected_full",
    [
        # Test cases when the length is just right (string fits)
        ("0123456789", 10, True, None, "0123456789"),
        # Test cases with enough room for the ellipsis
        ("012345678901234", 14, True, 4, "0123... 1234"),
        # Test cases with different cutoffs
        ("abcdefghijklmnopqrstuvwxyz", 10, True, 2, "ab... yz"),
        ("abcdefghijklmnopqrstuvwxyz", 12, True, 3, "abc... xyz"),
        # Test cases below minimum threshold
        ("abcdefghijklmnopqrstuvwxyz", 8, True, None, "abcde..."),
    ],
)
def test_test_truncate_string_keep_end(
    text, max_length, keep_end, prefix_len, expected_full
):
    """Test the specific behavior of the keep_end parameter."""
    result = truncate_string(
        text=text,
        max_length=max_length,
        keep_end=keep_end,
    )

    assert result == expected_full

    # Only check prefix/suffix when we expect truncation with keep_end
    if prefix_len is not None and len(text) > max_length and max_length >= 9:
        assert result[:prefix_len] == text[:prefix_len]
        assert result[-prefix_len:] == text[-prefix_len:]
        assert "... " in result


@pytest.mark.parametrize(
    "content,expected_fenced",
    [
        # Case 1: Contains many angle brackets (>10)
        (
            "<div><p>Test</p><span>Test</span><a>Test</a><b>Test</b><i>Test</i><u>Test</u>",
            True,
        ),
        # Case 2: Short content with few angle brackets
        ("<p>Just a paragraph</p>", False),
        # Case 3: Many short lines (>3 lines, 90% under 120 chars)
        ("line1\nline2\nline3\nline4\nline5", True),
        # Case 4: Many long lines (>3 lines, <90% under 120 chars)
        ("x" * 130 + "\n" + "x" * 130 + "\n" + "x" * 130 + "\n" + "x" * 50, False),
        # Case 5: Mixed case (many angle brackets and short lines)
        ("<div>\n<p>Line 1</p>\n<p>Line 2</p>\n<p>Line 3</p>\n</div>", True),
        # Case 6: Mixed case with few lines
        ("<div><p>Only two</p></div>", False),
        # Case 7: Empty string
        ("", False),
        # Case 8: Content with existing backticks (should use more backticks)
        ("```\ndef test():\n    pass\n```", True),
    ],
)
def test_maybe_fenced_code(content: str, expected_fenced: bool):
    result = maybe_fenced_code(content)

    if expected_fenced:
        # Should be wrapped in fenced code block
        assert result != content
        assert result.strip().startswith("```")
        assert result.strip().endswith("```")
        assert content.strip() in result
    else:
        # Should remain unchanged
        assert result == content


@pytest.mark.parametrize(
    "content,backtick_count",
    [
        # Content with no backticks should use 3 backticks
        ("def test():\n    pass", 3),
        # Content with 3 backticks should use 4 backticks
        ("```\ndef test():\n    pass\n```", 4),
        # Content with 4 backticks should use 5 backticks
        ("````\ndef test():\n    pass\n````", 5),
    ],
)
def test_backtick_count_adjustment(content: str, backtick_count: int):
    # Force the content to be treated as code by adding many angle brackets
    content_with_brackets = content + "<" * 11

    result = maybe_fenced_code(content_with_brackets)

    # Check if the correct number of backticks is used
    expected_start = "\n" + "`" * backtick_count + "\n"
    expected_end = "\n" + "`" * backtick_count

    assert result.startswith(expected_start)
    assert result.endswith(expected_end)