From fa272a05f36c6d9e5a0eb628bb9a687deefb3e20 Mon Sep 17 00:00:00 2001
From: Martin Czygan
Date: Mon, 23 Nov 2020 16:26:36 +0100
Subject: wip: note on memory large clusters might halt program (as they are currently kept in memory)

---
 fuzzycat/cluster.py | 3 +++
 1 file changed, 3 insertions(+)

diff --git a/fuzzycat/cluster.py b/fuzzycat/cluster.py
index 0aa2fd4..59214a1 100644
--- a/fuzzycat/cluster.py
+++ b/fuzzycat/cluster.py
@@ -433,6 +433,9 @@ class Cluster:
         Extract a key from elements of an iterable and group them. Just as
         uniq(1), the iterable must be ordered (by the key that is extracted)
         for this to work.
+
+        There might be large clusters, which would currently exceed memory.
+        Mitigate by splitting large clusters into parts.
         """
         for k, g in itertools.groupby(seq, key=key):
             items = list(g)
-- 
cgit v1.2.3