# {"summary":{"last":"20131126234003","ok":"20131126234003","delta":0},"numRows":1,"line":"http://128.118.178.162/eps/pe/papers/0501/0501001.pdf"} import fileinput import json by_url = {} for line in fileinput.input(): line = line.strip() doc = json.loads(line) if doc.get("numRows") == 0: continue by_url[doc["line"]] = doc for k, v in sorted(by_url.items()): print("{}\t{}".format(k, json.dumps(v)))