From f239e8da926343f312657f3c3075e2f3790760a8 Mon Sep 17 00:00:00 2001 From: Eric Coissac Date: Tue, 5 Aug 2025 08:49:45 -0400 Subject: [PATCH] Rename ISequenceChunk --- pkg/obichunk/{chunks.go => chunks_on_memory.go} | 15 ++++++++++++++- pkg/obichunk/unique.go | 2 +- pkg/obitools/obirefidx/famlilyindexing.go | 2 +- 3 files changed, 16 insertions(+), 3 deletions(-) rename pkg/obichunk/{chunks.go => chunks_on_memory.go} (69%) diff --git a/pkg/obichunk/chunks.go b/pkg/obichunk/chunks_on_memory.go similarity index 69% rename from pkg/obichunk/chunks.go rename to pkg/obichunk/chunks_on_memory.go index b4700f3..6a423ec 100644 --- a/pkg/obichunk/chunks.go +++ b/pkg/obichunk/chunks_on_memory.go @@ -9,7 +9,20 @@ import ( "git.metabarcoding.org/obitools/obitools4/obitools4/pkg/obiseq" ) -func ISequenceChunk(iterator obiiter.IBioSequence, +// ISequenceChunkMemory processes a sequence iterator by distributing the sequences +// into chunks in memory. It uses a classifier to determine how to distribute +// the sequences and returns a new iterator for the processed sequences. +// +// Parameters: +// - iterator: An iterator of biosequences to be processed. +// - classifier: A pointer to a BioSequenceClassifier used to classify the sequences +// during distribution. +// +// Returns: +// An iterator of biosequences representing the processed chunks, together with an error value. +// +// The function operates asynchronously. 
+func ISequenceChunkMemory(iterator obiiter.IBioSequence, classifier *obiseq.BioSequenceClassifier) (obiiter.IBioSequence, error) { newIter := obiiter.MakeIBioSequence() diff --git a/pkg/obichunk/unique.go b/pkg/obichunk/unique.go index 7d971c6..8b3127d 100644 --- a/pkg/obichunk/unique.go +++ b/pkg/obichunk/unique.go @@ -35,7 +35,7 @@ func IUniqueSequence(iterator obiiter.IBioSequence, } } else { - iterator, err = ISequenceChunk(iterator, + iterator, err = ISequenceChunkMemory(iterator, obiseq.HashClassifier(opts.BatchCount())) if err != nil { diff --git a/pkg/obitools/obirefidx/famlilyindexing.go b/pkg/obitools/obirefidx/famlilyindexing.go index 47b7e4b..e445c19 100644 --- a/pkg/obitools/obirefidx/famlilyindexing.go +++ b/pkg/obitools/obirefidx/famlilyindexing.go @@ -166,7 +166,7 @@ func IndexFamilyDB(iterator obiiter.IBioSequence) obiiter.IBioSequence { obidefault.ParallelWorkers(), ) - family_iterator, err := obichunk.ISequenceChunk( + family_iterator, err := obichunk.ISequenceChunkMemory( partof, obiseq.AnnotationClassifier("family_taxid", "NA"), )