# path: root/python/sandcrawler/fileset_strategies.py
# blob: 592b475d15ba041714582d846513932a8537832d (plain)

import sys
import json
import gzip
import time
from collections import namedtuple
from typing import Optional, Tuple, Any, Dict, List

from sandcrawler.html_metadata import BiblioMetadata
from sandcrawler.ia import ResourceResult
from sandcrawler.fileset_types import IngestStrategy, FilesetManifestFile, DatasetPlatformItem


class FilesetIngestStrategy:
    """Base class for fileset ingest strategies.

    Instances carry an ``ingest_strategy`` label, which defaults to
    ``'unknown'`` here. ``check_existing`` is a stub that raises
    ``NotImplementedError``, so concrete strategies are expected to
    override it.
    """

    def __init__(self) -> None:
        """Initialize the strategy with the placeholder label ``'unknown'``."""
        self.ingest_strategy = 'unknown'

    def check_existing(self):  # TODO: return type not settled yet (-> Any?)
        """Stub for checking for an existing result; not implemented here.

        Raises:
            NotImplementedError: always, in this base class.
        """
        raise NotImplementedError()

    def process(item: DatasetPlatformItem):