blob: e6e48ac164480a1e325939ab472c7bddcc4dc935 (
plain)
1
2
3
4
5
6
7
8
9
10
11
12
13
14
|
import datetime
import pytest
from sandcrawler.html_ingest import *
def test_html_extract_ojs3() -> None:
    """Check that body extraction succeeds on the saved OJS3 fulltext page.

    Reads the fixture ``tests/files/first_monday_ojs3_fulltext.html`` as raw
    bytes, passes it to ``html_extract_body_teixml``, and asserts that the
    returned mapping reports a ``status`` of ``'success'``.
    """
    # The fixture is read in binary mode and handed over undecoded.
    with open('tests/files/first_monday_ojs3_fulltext.html', 'rb') as fixture:
        raw_page = fixture.read()

    extraction = html_extract_body_teixml(raw_page)

    assert extraction['status'] == 'success'
|