summaryrefslogtreecommitdiffstats
path: root/tests/test_scrub.py
blob: 6541e136703285ad84098b46852953efd393b1af (plain)
1
2
3
4
5
6
7
8
9
10
11
12
13
14
from fatcat_scholar.schema import scrub_text


def test_scrub() -> None:
    """Check ``scrub_text`` against a table of (raw, expected) string pairs.

    Each raw sample is passed through ``scrub_text`` and the result must
    equal the paired expected string exactly.
    """
    cases = (
        # Raw text has typographic quotes, an ellipsis character and a stray
        # closing tag; the expected text has ASCII quotes, three dots, no tag.
        (
            "“Please clean this piece… of text</b>„",
            '"Please clean this piece... of text"',
        ),
        # Raw text has a leading JATS-style opening tag; expected text has none.
        ("<jats:p>blah thing", "blah thing"),
    )

    for source, expected in cases:
        cleaned = scrub_text(source)
        assert expected == cleaned