from app.utils.pdf_text import PAGE_TEXT_SEPARATOR, pages_to_raw_text, raw_text_pages_from_joined


def test_pages_to_raw_text_uses_separator():
    """Two page dicts should come back as their texts joined by the separator."""
    page_dicts = [
        {"page": number, "text": body}
        for number, body in enumerate(("Page one", "Page two"), start=1)
    ]
    expected = f"Page one{PAGE_TEXT_SEPARATOR}Page two"

    actual = pages_to_raw_text(page_dicts)

    assert actual == expected


def test_raw_text_pages_from_joined_legacy():
    """A separator-joined string should split back into one entry per segment.

    Each returned entry is expected to expose its segment under the
    ``"text"`` key, in the same order as the segments appear in the input.
    """
    joined = f"Alpha{PAGE_TEXT_SEPARATOR}Beta"

    recovered = raw_text_pages_from_joined(joined)

    assert len(recovered) == 2
    # Check entries in order so the first mismatch is reported first.
    for index, expected_text in enumerate(("Alpha", "Beta")):
        assert recovered[index]["text"] == expected_text
