about summary refs log tree commit diff stats
path: root/fuzzycat
diff options
context:
space:
mode:
author Martin Czygan <martin.czygan@gmail.com> 2020-11-23 16:26:36 +0100
committer Martin Czygan <martin.czygan@gmail.com> 2020-11-23 16:26:36 +0100
commit fa272a05f36c6d9e5a0eb628bb9a687deefb3e20 (patch)
tree 8f0243aff1b8aafe62ac1cdb51cb2a2007da1b3f /fuzzycat
parent 4c4f0ed18c269445e89020fc15e3ae07793d2589 (diff)
download fuzzycat-fa272a05f36c6d9e5a0eb628bb9a687deefb3e20.tar.gz
fuzzycat-fa272a05f36c6d9e5a0eb628bb9a687deefb3e20.zip
wip: note on memory
large clusters might halt program (as they are currently kept in memory)
Diffstat (limited to 'fuzzycat')
-rw-r--r-- fuzzycat/cluster.py 3
1 file changed, 3 insertions, 0 deletions
diff --git a/fuzzycat/cluster.py b/fuzzycat/cluster.py
index 0aa2fd4..59214a1 100644
--- a/fuzzycat/cluster.py
+++ b/fuzzycat/cluster.py
@@ -433,6 +433,9 @@ class Cluster:
Extract a key from elements of an iterable and group them. Just as
uniq(1), the iterable must be ordered (by the key that is extracted)
for this to work.
+
+ There might be large clusters, which would currently exceed memory.
+ Mitigate by splitting large clusters into parts.
"""
for k, g in itertools.groupby(seq, key=key):
items = list(g)