File size: 607 Bytes
ba54ea9
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
from recap.ingestion.pdf import load_pdf


def test_extracts_pages_with_text_and_metadata():
    pages = load_pdf("tests/fixtures/tiny_lab.pdf")
    assert len(pages) == 1
    assert pages[0].page_number == 1
    assert "Creatinine" in pages[0].text
    assert "1.4 mg/dL" in pages[0].text


def test_pages_have_source_id():
    pages = load_pdf("tests/fixtures/tiny_lab.pdf", source_id="lab_2022-03-14.pdf")
    assert pages[0].source_id == "lab_2022-03-14.pdf"


def test_default_source_id_is_filename():
    pages = load_pdf("tests/fixtures/tiny_lab.pdf")
    assert pages[0].source_id == "tiny_lab.pdf"