diff options
Diffstat (limited to 'python/fatcat_tools/harvest')
| -rw-r--r-- | python/fatcat_tools/harvest/oaipmh.py | 8 | 
1 files changed, 6 insertions, 2 deletions
| diff --git a/python/fatcat_tools/harvest/oaipmh.py b/python/fatcat_tools/harvest/oaipmh.py index 923500fc..0b482924 100644 --- a/python/fatcat_tools/harvest/oaipmh.py +++ b/python/fatcat_tools/harvest/oaipmh.py @@ -98,18 +98,22 @@ class HarvestArxivWorker(HarvestOaiPmhWorker):      - http://export.arxiv.org/oai2?verb=GetRecord&identifier=oai:arXiv.org:0804.2273&metadataPrefix=arXivRaw      All records are work-level. Some metadata formats have internal info about -    specific versions. The 'arXiv' format does, so i'm using that. +    specific versions. The 'arXivRaw' format does, so i'm using that.      """      def __init__(self, **kwargs):          super().__init__(**kwargs)          self.endpoint_url = "https://export.arxiv.org/oai2" -        self.metadata_prefix = "arXiv" +        self.metadata_prefix = "arXivRaw"          self.name = "arxiv"  class HarvestPubmedWorker(HarvestOaiPmhWorker):      """ +    Will likely be doing MEDLINE daily batch imports for primary metadata, but +    might also want to run a PMC importer to update fulltext and assign OA +    licenses (when appropriate). +      Pubmed refs:      - https://www.ncbi.nlm.nih.gov/pmc/tools/oai/      - https://www.ncbi.nlm.nih.gov/pmc/oai/oai.cgi?verb=GetRecord&identifier=oai:pubmedcentral.nih.gov:152494&metadataPrefix=pmc_fm | 
