summaryrefslogtreecommitdiffstats
path: root/tests/test_scrub.py
blob: fc6ef228ea04325f6df270f3dcf405e4ad36b61b (plain)
1
2
3
4
5
6
7
8
9
10
11
12
13
14
from fatcat_scholar.schema import scrub_text


def test_scrub() -> None:
    """Run scrub_text over a table of raw inputs and compare to expected output.

    The table maps each raw input string to the exact string scrub_text is
    expected to return for it:

    * a sentence wrapped in typographic quotes, containing a single-character
      ellipsis and a stray ``</b>`` tag, expected to come back with plain
      double quotes, three ASCII dots, and no tag;
    * text preceded by an opening ``<jats:p>`` tag, expected to come back as
      the bare text.
    """
    # Dicts preserve insertion order, so cases are checked in the order listed.
    expected_by_input = {
        "“Please clean this piece… of text</b>„": (
            '"Please clean this piece... of text"'
        ),
        "<jats:p>blah": "blah",
    }

    for dirty, expected in expected_by_input.items():
        cleaned = scrub_text(dirty)
        assert expected == cleaned