diff options
| author | Bryan Newbold <bnewbold@robocracy.org> | 2018-11-13 23:48:45 -0800 | 
|---|---|---|
| committer | Bryan Newbold <bnewbold@robocracy.org> | 2018-11-13 23:48:47 -0800 | 
| commit | 7634f6ecf2361b1cb1cafd4e27fd1fb84d81d130 (patch) | |
| tree | 69b18860ed4188c5169e9d9cb174355966b6f7de /python/fatcat_tools/workers/elastic.py | |
| parent | 7edae5c9d2267ba5e381ecbf00a7c3f7dacf4194 (diff) | |
| download | fatcat-7634f6ecf2361b1cb1cafd4e27fd1fb84d81d130.tar.gz fatcat-7634f6ecf2361b1cb1cafd4e27fd1fb84d81d130.zip | |
switch to auto consumer offset updates
This is the classic/correct way to do consumer group updates for higher
throughput, when "at least once" semantics are acceptible (as they are
here; double processing should be safe/fine).
Diffstat (limited to 'python/fatcat_tools/workers/elastic.py')
| -rw-r--r-- | python/fatcat_tools/workers/elastic.py | 6 | 
1 files changed, 5 insertions, 1 deletions
| diff --git a/python/fatcat_tools/workers/elastic.py b/python/fatcat_tools/workers/elastic.py index 119a6a26..3a75a1b3 100644 --- a/python/fatcat_tools/workers/elastic.py +++ b/python/fatcat_tools/workers/elastic.py @@ -32,6 +32,10 @@ class FatcatElasticReleaseWorker(FatcatWorker):          consumer = consume_topic.get_balanced_consumer(              consumer_group=self.consumer_group,              managed=True, +            fetch_message_max_bytes=4000000, # up to ~4MBytes +            auto_commit_enable=True, +            auto_commit_interval_ms=30000, # 30 seconds +            compacted_topic=True,          )          for msg in consumer: @@ -45,4 +49,4 @@ class FatcatElasticReleaseWorker(FatcatWorker):              print("Updating document: {}".format(elastic_endpoint))              resp = requests.post(elastic_endpoint, json=release_elastic_dict(release))              assert resp.status_code in (200, 201) -            consumer.commit_offsets() +            #consumer.commit_offsets() | 
