diff options
author | Bryan Newbold <bnewbold@archive.org> | 2018-10-30 18:03:24 -0700 |
---|---|---|
committer | Bryan Newbold <bnewbold@archive.org> | 2018-10-30 18:03:24 -0700 |
commit | 4cb7c1bdc6710a11c869f3d398ed39762644395c (patch) | |
tree | 335564ce672db14ff0d50305ee0c41bb8258d3ad /scalding | |
parent | e6600cca031d114577749cd4603f22a47c5001b1 (diff) | |
download | sandcrawler-4cb7c1bdc6710a11c869f3d398ed39762644395c.tar.gz sandcrawler-4cb7c1bdc6710a11c869f3d398ed39762644395c.zip |
fix typos in DumpGrobidXmlJob
Diffstat (limited to 'scalding')
-rw-r--r-- | scalding/src/main/scala/sandcrawler/DumpGrobidXmlJob.scala | 4 |
1 file changed, 2 insertions, 2 deletions
```diff
diff --git a/scalding/src/main/scala/sandcrawler/DumpGrobidXmlJob.scala b/scalding/src/main/scala/sandcrawler/DumpGrobidXmlJob.scala
index 1b178eb..953610d 100644
--- a/scalding/src/main/scala/sandcrawler/DumpGrobidXmlJob.scala
+++ b/scalding/src/main/scala/sandcrawler/DumpGrobidXmlJob.scala
@@ -30,8 +30,8 @@ class DumpGrobidXmlJob(args: Args) extends JobBase(args) with HBasePipeConversio
         JSONObject(
           Map(
             "pdf_hash" -> Bytes.toString(key.copyBytes()),
-            "cdx_metadata" -> Bytes.toString(key.copyBytes()),
-            "tei_xml" -> Bytes.toString(key.copyBytes())
+            "cdx_metadata" -> Bytes.toString(cdx.copyBytes()),
+            "tei_xml" -> Bytes.toString(tei_xml.copyBytes())
           )).toString
       )
   };
```