diff options
Diffstat (limited to 'scalding')
-rw-r--r-- | scalding/src/main/scala/sandcrawler/DumpGrobidXmlJob.scala | 4 |
1 files changed, 2 insertions, 2 deletions
diff --git a/scalding/src/main/scala/sandcrawler/DumpGrobidXmlJob.scala b/scalding/src/main/scala/sandcrawler/DumpGrobidXmlJob.scala
index 1b178eb..953610d 100644
--- a/scalding/src/main/scala/sandcrawler/DumpGrobidXmlJob.scala
+++ b/scalding/src/main/scala/sandcrawler/DumpGrobidXmlJob.scala
@@ -30,8 +30,8 @@ class DumpGrobidXmlJob(args: Args) extends JobBase(args) with HBasePipeConversio
         JSONObject(
           Map(
             "pdf_hash" -> Bytes.toString(key.copyBytes()),
-            "cdx_metadata" -> Bytes.toString(key.copyBytes()),
-            "tei_xml" -> Bytes.toString(key.copyBytes())
+            "cdx_metadata" -> Bytes.toString(cdx.copyBytes()),
+            "tei_xml" -> Bytes.toString(tei_xml.copyBytes())
         )).toString
       )
     };