about summary refs log tree commit diff stats
path: root/scalding/src
diff options
context:
space:
mode:
Diffstat (limited to 'scalding/src')
-rw-r--r-- scalding/src/main/scala/sandcrawler/DumpGrobidXmlJob.scala | 4
1 files changed, 2 insertions, 2 deletions
diff --git a/scalding/src/main/scala/sandcrawler/DumpGrobidXmlJob.scala b/scalding/src/main/scala/sandcrawler/DumpGrobidXmlJob.scala
index 1b178eb..953610d 100644
--- a/scalding/src/main/scala/sandcrawler/DumpGrobidXmlJob.scala
+++ b/scalding/src/main/scala/sandcrawler/DumpGrobidXmlJob.scala
@@ -30,8 +30,8 @@ class DumpGrobidXmlJob(args: Args) extends JobBase(args) with HBasePipeConversio
JSONObject(
Map(
"pdf_hash" -> Bytes.toString(key.copyBytes()),
- "cdx_metadata" -> Bytes.toString(key.copyBytes()),
- "tei_xml" -> Bytes.toString(key.copyBytes())
+ "cdx_metadata" -> Bytes.toString(cdx.copyBytes()),
+ "tei_xml" -> Bytes.toString(tei_xml.copyBytes())
)).toString
)
};