diff options
author | Bryan Newbold <bnewbold@archive.org> | 2018-04-04 12:06:38 -0700 |
---|---|---|
committer | Bryan Newbold <bnewbold@archive.org> | 2018-04-04 12:06:38 -0700 |
commit | 1dad0d9e54bfae93eebea47f8a3cb291cdd645c5 (patch) | |
tree | 97a8c9bcaf93734e2dbd8f431d37213520b55fbd | |
parent | 427dd875958c8a6d2d791d55f9dda300ebdc853b (diff) | |
download | sandcrawler-1dad0d9e54bfae93eebea47f8a3cb291cdd645c5.tar.gz sandcrawler-1dad0d9e54bfae93eebea47f8a3cb291cdd645c5.zip |
extraction -> mapreduce
-rw-r--r-- | mapreduce/Pipfile (renamed from extraction/Pipfile) | 0 | ||||
-rw-r--r-- | mapreduce/Pipfile.lock (renamed from extraction/Pipfile.lock) | 0 | ||||
-rw-r--r-- | mapreduce/README.md (renamed from extraction/README.md) | 0 | ||||
-rw-r--r-- | mapreduce/TODO (renamed from extraction/TODO) | 0 | ||||
-rwxr-xr-x | mapreduce/backfill_hbase_from_cdx.py (renamed from extraction/backfill_hbase_from_cdx.py) | 0 | ||||
-rwxr-xr-x | mapreduce/extraction_cdx_grobid.py (renamed from extraction/extraction_cdx_grobid.py) | 0 | ||||
-rwxr-xr-x | mapreduce/grobid2json.py (renamed from extraction/grobid2json.py) | 0 | ||||
-rw-r--r-- | mapreduce/mrjob.conf (renamed from extraction/mrjob.conf) | 0 | ||||
-rw-r--r-- | mapreduce/pytest.ini (renamed from extraction/pytest.ini) | 0 | ||||
-rw-r--r-- | mapreduce/tests/files/23b29ea36382680716be08fc71aa81bd226e8a85.xml (renamed from extraction/tests/files/23b29ea36382680716be08fc71aa81bd226e8a85.xml) | 0 | ||||
-rw-r--r-- | mapreduce/tests/files/example.cdx (renamed from extraction/tests/files/example.cdx) | 0 | ||||
-rw-r--r-- | mapreduce/tests/test_backfill_hbase_from_cdx.py (renamed from extraction/tests/test_backfill_hbase_from_cdx.py) | 0 | ||||
-rw-r--r-- | mapreduce/tests/test_extraction_cdx_grobid.py (renamed from extraction/tests/test_extraction_cdx_grobid.py) | 0 | ||||
-rw-r--r-- | mapreduce/xml2json.py (renamed from extraction/xml2json.py) | 0 |
14 files changed, 0 insertions, 0 deletions
diff --git a/extraction/Pipfile b/mapreduce/Pipfile index 32fc3dd..32fc3dd 100644 --- a/extraction/Pipfile +++ b/mapreduce/Pipfile diff --git a/extraction/Pipfile.lock b/mapreduce/Pipfile.lock index 86ed6bd..86ed6bd 100644 --- a/extraction/Pipfile.lock +++ b/mapreduce/Pipfile.lock diff --git a/extraction/README.md b/mapreduce/README.md index b063fba..b063fba 100644 --- a/extraction/README.md +++ b/mapreduce/README.md diff --git a/extraction/TODO b/mapreduce/TODO index 3459752..3459752 100644 --- a/extraction/TODO +++ b/mapreduce/TODO diff --git a/extraction/backfill_hbase_from_cdx.py b/mapreduce/backfill_hbase_from_cdx.py index fe37bd5..fe37bd5 100755 --- a/extraction/backfill_hbase_from_cdx.py +++ b/mapreduce/backfill_hbase_from_cdx.py diff --git a/extraction/extraction_cdx_grobid.py b/mapreduce/extraction_cdx_grobid.py index 27668ea..27668ea 100755 --- a/extraction/extraction_cdx_grobid.py +++ b/mapreduce/extraction_cdx_grobid.py diff --git a/extraction/grobid2json.py b/mapreduce/grobid2json.py index daf9387..daf9387 100755 --- a/extraction/grobid2json.py +++ b/mapreduce/grobid2json.py diff --git a/extraction/mrjob.conf b/mapreduce/mrjob.conf index cb286f1..cb286f1 100644 --- a/extraction/mrjob.conf +++ b/mapreduce/mrjob.conf diff --git a/extraction/pytest.ini b/mapreduce/pytest.ini index 0a5e921..0a5e921 100644 --- a/extraction/pytest.ini +++ b/mapreduce/pytest.ini diff --git a/extraction/tests/files/23b29ea36382680716be08fc71aa81bd226e8a85.xml b/mapreduce/tests/files/23b29ea36382680716be08fc71aa81bd226e8a85.xml index dbc8be5..dbc8be5 100644 --- a/extraction/tests/files/23b29ea36382680716be08fc71aa81bd226e8a85.xml +++ b/mapreduce/tests/files/23b29ea36382680716be08fc71aa81bd226e8a85.xml diff --git a/extraction/tests/files/example.cdx b/mapreduce/tests/files/example.cdx index 84e3271..84e3271 100644 --- a/extraction/tests/files/example.cdx +++ b/mapreduce/tests/files/example.cdx diff --git a/extraction/tests/test_backfill_hbase_from_cdx.py b/mapreduce/tests/test_backfill_hbase_from_cdx.py index 1a13e5b..1a13e5b 100644 --- a/extraction/tests/test_backfill_hbase_from_cdx.py +++ b/mapreduce/tests/test_backfill_hbase_from_cdx.py diff --git a/extraction/tests/test_extraction_cdx_grobid.py b/mapreduce/tests/test_extraction_cdx_grobid.py index 71b55a3..71b55a3 100644 --- a/extraction/tests/test_extraction_cdx_grobid.py +++ b/mapreduce/tests/test_extraction_cdx_grobid.py diff --git a/extraction/xml2json.py b/mapreduce/xml2json.py index f956014..f956014 100644 --- a/extraction/xml2json.py +++ b/mapreduce/xml2json.py |