diff options
Diffstat (limited to 'pig/tests')
-rw-r--r-- | pig/tests/test_filter_cdx.py | 35 |
1 files changed, 35 insertions, 0 deletions
diff --git a/pig/tests/test_filter_cdx.py b/pig/tests/test_filter_cdx.py new file mode 100644 index 0000000..83f88bb --- /dev/null +++ b/pig/tests/test_filter_cdx.py @@ -0,0 +1,35 @@ + +""" +Abstract into a base test class/template: + +1. Needs deps downloaded and installed and env configured (bash? .env? makefile?) +2. In test, create tempdir for output. Print helpful info on every run +3. Run pig locally, inspect output files +""" + +import os +import unittest +from nose.tools import * +from pigpy.hadoop import Hadoop + + +class TestFilterCDX(unittest.TestCase): + + def setUp(self): + + classpaths = [ + os.path.join("pig-0.12.0-cdh5.0.1", "pig.jar"), + os.path.join("pig-0.12.0-cdh5.0.1", "lib", "*"), + ] + + local_home = os.path.join("hadoop-2.3.0-cdh5.0.1") + + name_node = "file:///test/files" + + self.hadoop = Hadoop(local_home, name_node, classpaths) + + def test_thing(self): + + self.hadoop.run_pig_job("filter-cdx-ps.pig") + self.hadoop.copyToLocal("/reports/output.csv", "output.csv") + |