aboutsummaryrefslogtreecommitdiffstats
diff options
context:
space:
mode:
authorBryan Newbold <bnewbold@archive.org>2018-04-04 12:06:38 -0700
committerBryan Newbold <bnewbold@archive.org>2018-04-04 12:06:38 -0700
commit1dad0d9e54bfae93eebea47f8a3cb291cdd645c5 (patch)
tree97a8c9bcaf93734e2dbd8f431d37213520b55fbd
parent427dd875958c8a6d2d791d55f9dda300ebdc853b (diff)
downloadsandcrawler-1dad0d9e54bfae93eebea47f8a3cb291cdd645c5.tar.gz
sandcrawler-1dad0d9e54bfae93eebea47f8a3cb291cdd645c5.zip
extraction -> mapreduce
-rw-r--r--mapreduce/Pipfile (renamed from extraction/Pipfile)0
-rw-r--r--mapreduce/Pipfile.lock (renamed from extraction/Pipfile.lock)0
-rw-r--r--mapreduce/README.md (renamed from extraction/README.md)0
-rw-r--r--mapreduce/TODO (renamed from extraction/TODO)0
-rwxr-xr-xmapreduce/backfill_hbase_from_cdx.py (renamed from extraction/backfill_hbase_from_cdx.py)0
-rwxr-xr-xmapreduce/extraction_cdx_grobid.py (renamed from extraction/extraction_cdx_grobid.py)0
-rwxr-xr-xmapreduce/grobid2json.py (renamed from extraction/grobid2json.py)0
-rw-r--r--mapreduce/mrjob.conf (renamed from extraction/mrjob.conf)0
-rw-r--r--mapreduce/pytest.ini (renamed from extraction/pytest.ini)0
-rw-r--r--mapreduce/tests/files/23b29ea36382680716be08fc71aa81bd226e8a85.xml (renamed from extraction/tests/files/23b29ea36382680716be08fc71aa81bd226e8a85.xml)0
-rw-r--r--mapreduce/tests/files/example.cdx (renamed from extraction/tests/files/example.cdx)0
-rw-r--r--mapreduce/tests/test_backfill_hbase_from_cdx.py (renamed from extraction/tests/test_backfill_hbase_from_cdx.py)0
-rw-r--r--mapreduce/tests/test_extraction_cdx_grobid.py (renamed from extraction/tests/test_extraction_cdx_grobid.py)0
-rw-r--r--mapreduce/xml2json.py (renamed from extraction/xml2json.py)0
14 files changed, 0 insertions, 0 deletions
diff --git a/extraction/Pipfile b/mapreduce/Pipfile
index 32fc3dd..32fc3dd 100644
--- a/extraction/Pipfile
+++ b/mapreduce/Pipfile
diff --git a/extraction/Pipfile.lock b/mapreduce/Pipfile.lock
index 86ed6bd..86ed6bd 100644
--- a/extraction/Pipfile.lock
+++ b/mapreduce/Pipfile.lock
diff --git a/extraction/README.md b/mapreduce/README.md
index b063fba..b063fba 100644
--- a/extraction/README.md
+++ b/mapreduce/README.md
diff --git a/extraction/TODO b/mapreduce/TODO
index 3459752..3459752 100644
--- a/extraction/TODO
+++ b/mapreduce/TODO
diff --git a/extraction/backfill_hbase_from_cdx.py b/mapreduce/backfill_hbase_from_cdx.py
index fe37bd5..fe37bd5 100755
--- a/extraction/backfill_hbase_from_cdx.py
+++ b/mapreduce/backfill_hbase_from_cdx.py
diff --git a/extraction/extraction_cdx_grobid.py b/mapreduce/extraction_cdx_grobid.py
index 27668ea..27668ea 100755
--- a/extraction/extraction_cdx_grobid.py
+++ b/mapreduce/extraction_cdx_grobid.py
diff --git a/extraction/grobid2json.py b/mapreduce/grobid2json.py
index daf9387..daf9387 100755
--- a/extraction/grobid2json.py
+++ b/mapreduce/grobid2json.py
diff --git a/extraction/mrjob.conf b/mapreduce/mrjob.conf
index cb286f1..cb286f1 100644
--- a/extraction/mrjob.conf
+++ b/mapreduce/mrjob.conf
diff --git a/extraction/pytest.ini b/mapreduce/pytest.ini
index 0a5e921..0a5e921 100644
--- a/extraction/pytest.ini
+++ b/mapreduce/pytest.ini
diff --git a/extraction/tests/files/23b29ea36382680716be08fc71aa81bd226e8a85.xml b/mapreduce/tests/files/23b29ea36382680716be08fc71aa81bd226e8a85.xml
index dbc8be5..dbc8be5 100644
--- a/extraction/tests/files/23b29ea36382680716be08fc71aa81bd226e8a85.xml
+++ b/mapreduce/tests/files/23b29ea36382680716be08fc71aa81bd226e8a85.xml
diff --git a/extraction/tests/files/example.cdx b/mapreduce/tests/files/example.cdx
index 84e3271..84e3271 100644
--- a/extraction/tests/files/example.cdx
+++ b/mapreduce/tests/files/example.cdx
diff --git a/extraction/tests/test_backfill_hbase_from_cdx.py b/mapreduce/tests/test_backfill_hbase_from_cdx.py
index 1a13e5b..1a13e5b 100644
--- a/extraction/tests/test_backfill_hbase_from_cdx.py
+++ b/mapreduce/tests/test_backfill_hbase_from_cdx.py
diff --git a/extraction/tests/test_extraction_cdx_grobid.py b/mapreduce/tests/test_extraction_cdx_grobid.py
index 71b55a3..71b55a3 100644
--- a/extraction/tests/test_extraction_cdx_grobid.py
+++ b/mapreduce/tests/test_extraction_cdx_grobid.py
diff --git a/extraction/xml2json.py b/mapreduce/xml2json.py
index f956014..f956014 100644
--- a/extraction/xml2json.py
+++ b/mapreduce/xml2json.py