aboutsummaryrefslogtreecommitdiffstats
path: root/pig/tests/test_filter_cdx.py
diff options
context:
space:
mode:
Diffstat (limited to 'pig/tests/test_filter_cdx.py')
-rw-r--r--pig/tests/test_filter_cdx.py35
1 files changed, 35 insertions, 0 deletions
diff --git a/pig/tests/test_filter_cdx.py b/pig/tests/test_filter_cdx.py
new file mode 100644
index 0000000..83f88bb
--- /dev/null
+++ b/pig/tests/test_filter_cdx.py
@@ -0,0 +1,35 @@
+
+"""
+Abstract into a base test class/template:
+
+1. Needs deps downloaded and installed and env configured (bash? .env? makefile?)
+2. In test, create tempdir for output. Print helpful info on every run
+3. Run pig locally, inspect output files
+"""
+
+import os
+import unittest
+from nose.tools import *
+from pigpy.hadoop import Hadoop
+
+
+class TestFilterCDX(unittest.TestCase):  # Runs the filter-cdx-ps.pig script through pigpy's Hadoop wrapper.
+
+ def setUp(self):  # Builds a fresh self.hadoop before each test method.
+
+ classpaths = [  # Relative paths: the Pig jar plus a "lib/*" entry (presumably a Java classpath wildcard -- confirm).
+ os.path.join("pig-0.12.0-cdh5.0.1", "pig.jar"),
+ os.path.join("pig-0.12.0-cdh5.0.1", "lib", "*"),
+ ]
+
+ local_home = os.path.join("hadoop-2.3.0-cdh5.0.1")  # Single-argument join returns the name unchanged; path is relative.
+
+ name_node = "file:///test/files"  # file:// URI, not hdfs:// -- presumably points the job at the local filesystem; TODO confirm.
+
+ self.hadoop = Hadoop(local_home, name_node, classpaths)  # Argument order as used here: home dir, name node, classpaths.
+
+ def test_thing(self):  # NOTE(review): no assertions -- this only fails if one of the calls below raises.
+
+ self.hadoop.run_pig_job("filter-cdx-ps.pig")  # Script name is relative; presumably resolved from the working directory -- verify.
+ self.hadoop.copyToLocal("/reports/output.csv", "output.csv")  # Copies the report to ./output.csv; the copied file is never inspected.
+