summaryrefslogtreecommitdiffstats
path: root/python/tests/harvest_datacite.py
blob: 40e5f7112337721ee02a317e73f91c50301ebeaf (plain)
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
import datetime
import json

import responses

from fatcat_tools.harvest import *


@responses.activate
def test_datacite_harvest_date(mocker):
    """Check a single-day DataCite harvest against a mocked HTTP API.

    The DataCite endpoint is stubbed with a canned JSON response and the
    Kafka producer is replaced by a mock, so no network or broker access
    happens. The test verifies the outgoing HTTP request (User-Agent and
    date-range query) and the calls made on the mocked producer.
    """

    # mock out the harvest state object so it doesn't try to actually connect
    # to Kafka
    mocker.patch("fatcat_tools.harvest.harvest_common.HarvestState.initialize_from_kafka")

    # mock day request to datacite API; only the first line of the fixture
    # file is parsed as the response body
    with open("tests/files/datacite_api.json", "r", encoding="utf-8") as f:
        resp = json.loads(f.readline())
    responses.add(responses.GET, "https://api.datacite.org/dois", json=resp, status=200)

    harvester = HarvestDataciteWorker(
        kafka_hosts="dummy",
        produce_topic="dummy-produce-topic",
        state_topic="dummy-state-topic",
        contact_email="test@fatcat.wiki",
    )

    # swap in a mock producer so calls can be inspected below
    harvester.producer = mocker.Mock()

    harvester.fetch_date(datetime.date(2019, 2, 3))

    assert len(responses.calls) == 1

    # ensure email was included in User-Agent
    assert "mailto:test@fatcat.wiki" in responses.calls[0].request.headers["User-Agent"]

    # check that correct date param was passed as expected
    assert (
        "query=updated%3A%5B2019-02-03T00%3A00%3A00.000Z+TO+2019-02-03T23%3A59%3A59.999Z%5D"
        in responses.calls[0].request.url
    )

    # check that the expected number of DOI objects were published to the
    # (mock) kafka topic
    assert harvester.producer.produce.call_count == 1
    assert harvester.producer.flush.call_count == 1
    # Use the real Mock assertion helper: `called_once_with` is not an
    # assertion method, so `assert mock.called_once_with(...)` either passes
    # vacuously (auto-created truthy attribute) or raises AttributeError on
    # newer Python versions.
    harvester.producer.poll.assert_called_once_with(0)