aboutsummaryrefslogtreecommitdiffstats
path: root/scalding/src/main/scala
diff options
context:
space:
mode:
author Bryan Newbold <bnewbold@archive.org> 2018-10-30 18:03:24 -0700
committer Bryan Newbold <bnewbold@archive.org> 2018-10-30 18:03:24 -0700
commit 4cb7c1bdc6710a11c869f3d398ed39762644395c (patch)
tree 335564ce672db14ff0d50305ee0c41bb8258d3ad /scalding/src/main/scala
parent e6600cca031d114577749cd4603f22a47c5001b1 (diff)
download sandcrawler-4cb7c1bdc6710a11c869f3d398ed39762644395c.tar.gz
sandcrawler-4cb7c1bdc6710a11c869f3d398ed39762644395c.zip
fix typos in DumpGrobidXmlJob
Diffstat (limited to 'scalding/src/main/scala')
-rw-r--r-- scalding/src/main/scala/sandcrawler/DumpGrobidXmlJob.scala 4
1 file changed, 2 insertions, 2 deletions
diff --git a/scalding/src/main/scala/sandcrawler/DumpGrobidXmlJob.scala b/scalding/src/main/scala/sandcrawler/DumpGrobidXmlJob.scala
index 1b178eb..953610d 100644
--- a/scalding/src/main/scala/sandcrawler/DumpGrobidXmlJob.scala
+++ b/scalding/src/main/scala/sandcrawler/DumpGrobidXmlJob.scala
@@ -30,8 +30,8 @@ class DumpGrobidXmlJob(args: Args) extends JobBase(args) with HBasePipeConversio
JSONObject(
Map(
"pdf_hash" -> Bytes.toString(key.copyBytes()),
- "cdx_metadata" -> Bytes.toString(key.copyBytes()),
- "tei_xml" -> Bytes.toString(key.copyBytes())
+ "cdx_metadata" -> Bytes.toString(cdx.copyBytes()),
+ "tei_xml" -> Bytes.toString(tei_xml.copyBytes())
)).toString
)
};