File size: 3,380 Bytes
6172a47 | 1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24 25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48 49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72 73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96 97 98 99 100 101 102 103 104 105 106 107 108 109 110 | """Tests for extract_text_from_content helper functions."""
from unittest.mock import MagicMock
import pytest
from providers.common.text import extract_text_from_content
class TestExtractTextFromContent:
"""Tests for providers.common.text.extract_text_from_content."""
def test_string_content(self):
"""Return string content as-is."""
assert extract_text_from_content("hello world") == "hello world"
def test_empty_string(self):
"""Return empty string for empty string input."""
assert extract_text_from_content("") == ""
def test_list_single_block(self):
"""Extract text from a single content block."""
block = MagicMock()
block.text = "some text"
assert extract_text_from_content([block]) == "some text"
def test_list_multiple_blocks(self):
"""Concatenate text from multiple content blocks."""
b1 = MagicMock()
b1.text = "hello "
b2 = MagicMock()
b2.text = "world"
assert extract_text_from_content([b1, b2]) == "hello world"
def test_list_with_non_text_block(self):
"""Skip blocks without text attribute."""
b1 = MagicMock()
b1.text = "hello"
b2 = MagicMock(spec=[]) # No attributes
assert extract_text_from_content([b1, b2]) == "hello"
def test_list_with_empty_text(self):
"""Skip blocks with empty text."""
b1 = MagicMock()
b1.text = ""
b2 = MagicMock()
b2.text = "world"
assert extract_text_from_content([b1, b2]) == "world"
def test_list_with_none_text(self):
"""Skip blocks with None text."""
b1 = MagicMock()
b1.text = None
b2 = MagicMock()
b2.text = "world"
assert extract_text_from_content([b1, b2]) == "world"
def test_empty_list(self):
"""Return empty string for empty list."""
assert extract_text_from_content([]) == ""
def test_non_string_non_list(self):
"""Return empty string for unexpected types."""
assert extract_text_from_content(None) == ""
assert extract_text_from_content(42) == ""
def test_list_with_non_string_text_attr(self):
"""Skip blocks where text is not a string."""
b1 = MagicMock()
b1.text = 123 # Not a string
b2 = MagicMock()
b2.text = "valid"
assert extract_text_from_content([b1, b2]) == "valid"
# --- Parametrized Edge Case Tests ---
def _make_block(text_val):
b = MagicMock()
b.text = text_val
return b
@pytest.mark.parametrize(
"content,expected",
[
("hello world", "hello world"),
("", ""),
(None, ""),
(42, ""),
([], ""),
(" ", " "),
],
ids=["string", "empty_str", "none", "int", "empty_list", "whitespace_only"],
)
def test_extract_text_scalar_and_empty_parametrized(content, expected):
"""Parametrized scalar and empty input handling."""
assert extract_text_from_content(content) == expected
def test_extract_functions_whitespace_only():
"""extract_text_from_content handles whitespace-only string."""
assert extract_text_from_content(" ") == " "
def test_extract_functions_unicode():
"""extract_text_from_content handles unicode content."""
assert extract_text_from_content("日本語テスト") == "日本語テスト"
|