Expose chunkSize parameter in CallDuplexConsensusReads #867

Open · wants to merge 2 commits into base: main
```diff
@@ -28,6 +28,7 @@ import com.fulcrumgenomics.FgBioDef._
 import com.fulcrumgenomics.bam.OverlappingBasesConsensusCaller
 import com.fulcrumgenomics.bam.api.{SamOrder, SamSource, SamWriter}
 import com.fulcrumgenomics.cmdline.{ClpGroups, FgBioTool}
+import com.fulcrumgenomics.commons.collection.ParIterator.DefaultChunkSize
 import com.fulcrumgenomics.sopt.clp
 import com.fulcrumgenomics.commons.io.Io
 import com.fulcrumgenomics.commons.util.LazyLogging
```
```diff
@@ -108,6 +109,12 @@ class CallDuplexConsensusReads
     val maxReadsPerStrand: Option[Int] = None,
     @arg(doc="The number of threads to use while consensus calling.") val threads: Int = 1,
     @arg(doc="Consensus call overlapping bases in mapped paired end reads") val consensusCallOverlappingBases: Boolean = true,
+    @arg(doc="""
+        |Pull reads from this many source molecules into memory for multi-threaded processing.
+        |Using a smaller value will require less memory but will negatively impact processing speed.
+        |For very large family sizes, a smaller value may be necessary to reduce memory usage.
+        |This value is only used when `--threads > 1`.
+        """) val maxSourceMoleculesInMemory: Int = DefaultChunkSize
 ) extends FgBioTool with LazyLogging {

   Io.assertReadable(input)
```

Reviewer (Member), on the new doc text "Pull reads from this many source molecules into memory": not strictly true, since the ParIterator will have `threads * maxSourceMoleculesInMemory`, and so will the AsyncIterator that wraps it, so it should be `2 * threads * maxSourceMoleculesInMemory`, I think.
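The reviewer's bound can be made concrete with a worked example. The numbers below are hypothetical; the formula is the `2 * threads * maxSourceMoleculesInMemory` claim from the comment above (and it matches the "8 threads, 160 molecules" figure that comes up later in the review):

```scala
// Hypothetical worked example of the reviewer's claimed memory bound:
// the ParIterator holds up to threads * maxSourceMoleculesInMemory source
// molecules, and the AsyncIterator wrapping it can hold as many again.
val threads                    = 8
val maxSourceMoleculesInMemory = 10

val parIteratorMolecules   = threads * maxSourceMoleculesInMemory // 80
val asyncIteratorMolecules = threads * maxSourceMoleculesInMemory // 80
val totalMolecules         = parIteratorMolecules + asyncIteratorMolecules // 160
```

Note that whether the `threads` factor actually applies is exactly what the author disputes below; this sketch only restates the reviewer's arithmetic.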
```diff
@@ -142,7 +149,7 @@ class CallDuplexConsensusReads
       maxReadsPerStrand = maxReadsPerStrand.getOrElse(VanillaUmiConsensusCallerOptions.DefaultMaxReads)
     )
     val progress = ProgressLogger(logger, unit=1000000)
-    val iterator = new ConsensusCallingIterator(inIter, caller, Some(progress), threads)
+    val iterator = new ConsensusCallingIterator(inIter, caller, Some(progress), threads, maxSourceMoleculesInMemory)
     out ++= iterator
     progress.logLast()
```

Reviewer (Member): Can you please add the same to CallMolecularConsensusReads? Likely it is not immune from the same issue, so it'd be nice to control there too (and have symmetry of options).
In the second file:

```diff
@@ -40,7 +40,7 @@ import com.fulcrumgenomics.util.ProgressLogger
  * @param caller the consensus caller to use to call consensus reads
  * @param progress an optional progress logger to which to log progress in input reads
  * @param threads the number of threads to use.
- * @param chunkSize parallel process in chunkSize units; will cause 8 * chunkSize records to be held in memory
+ * @param chunkSize across the input [[SamRecord]]s from this many source molecules at a time
  */
 class ConsensusCallingIterator[ConsensusRead <: SimpleRead](sourceIterator: Iterator[SamRecord],
                                                             caller: UmiConsensusCaller[ConsensusRead],
```

Reviewer (Member): The new param doc doesn't track for me. Based on my comment below, suggested change:

```
 * @param chunkSize the number of source molecules to process in a single chunk, where chunks
 *                  are processed in parallel. This will cause `2 * threads * chunkSize` source
 *                  molecules to be held in memory, where the number of [[SamRecord]]s held in
 *                  memory depends on the number of [[SamRecord]]s assigned to each source
 *                  molecule at any given time.
```

Reviewer (Member): If this is true, then presumably in CallDuplexConsensusReads the number given should be divided before supplying here? I think it will be very confusing to say "only hold 10 source molecules' worth of reads in memory" and then find out that with 8 threads I've got 160 molecules' worth.

Author (Contributor): @tfenne @nh13 Many of these comments, here and elsewhere in the review, go against my interpretation of how ParIterator works. The way I understand it, these iterable functions operate on a single chunk at a time (not counting `.toAsync`), using the multi-threaded task support, rather than grabbing one chunk per thread:

https://github.com/fulcrumgenomics/commons/blob/9372c5585084a1d7486c1b6036d0e06824b2c8d4/src/main/scala/com/fulcrumgenomics/commons/collection/ParIterator.scala#L140-L141

Only one chunk is pulled into memory at a time at the "front" of the ParIterator (it does not mention `threads * chunkSize`):

https://github.com/fulcrumgenomics/commons/blob/9372c5585084a1d7486c1b6036d0e06824b2c8d4/src/main/scala/com/fulcrumgenomics/commons/collection/ParIterator.scala#L119-L120

The parWith function splits a single chunk across threads:

https://github.com/fulcrumgenomics/commons/blob/9372c5585084a1d7486c1b6036d0e06824b2c8d4/src/main/scala/com/fulcrumgenomics/commons/CommonsDef.scala#L360-L364

It was based on this interpretation that I do not divide by threads before parallelizing. Can you please let me know if I have missed something or where my interpretation is wrong?
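The author's interpretation can be sketched as a toy model. This is a simplified, hypothetical stand-in for `ParIterator` (the real class lives in fulcrumgenomics/commons and is linked above); `chunkedParMap` is an invented helper that pulls one chunk of `chunkSize` elements into memory, fans that single chunk out across `threads`, and emits results in input order before pulling the next chunk:

```scala
import java.util.concurrent.Executors
import scala.concurrent.{Await, ExecutionContext, Future}
import scala.concurrent.duration.Duration

/** Hypothetical sketch, NOT the real ParIterator: one chunk resident at a time,
  * split across a fixed pool of `threads`, results emitted in input order. */
def chunkedParMap[A, B](in: Iterator[A], chunkSize: Int, threads: Int)(f: A => B): Iterator[B] = {
  val pool = Executors.newFixedThreadPool(threads)
  implicit val ec: ExecutionContext = ExecutionContext.fromExecutor(pool)
  in.grouped(chunkSize).flatMap { chunk =>
    // Only this one chunk is in memory; each element becomes a task on the pool,
    // so memory is bounded by chunkSize elements, not threads * chunkSize.
    val futures = chunk.map(a => Future(f(a)))
    futures.map(fut => Await.result(fut, Duration.Inf))
  } // (pool shutdown omitted for brevity)
}

// Order is preserved: chunks of 4 are each fanned out over 2 threads in turn.
val doubled = chunkedParMap((1 to 10).iterator, chunkSize = 4, threads = 2)(_ * 2).toList
```

Under this model, dividing `chunkSize` by `threads` before parallelizing would be unnecessary, which is the author's point; whether the real `ParIterator` behaves this way is the open question in the thread.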
```diff
@@ -67,10 +67,11 @@ class ConsensusCallingIterator[ConsensusRead <: SimpleRead](sourceIterator: Iter
       groupingIterator.flatMap(caller.consensusReadsFromSamRecords)
     }
     else {
-      ParIterator(groupingIterator, threads=threads).flatMap { rs =>
+      ParIterator(groupingIterator, threads=threads, chunkSize=chunkSize).map { rs =>
         val caller = callers.get()
         caller.synchronized { caller.consensusReadsFromSamRecords(rs) }
-      }.toAsync(chunkSize * 8)
+      }.toAsync(chunkSize).flatten
+      // Flatten AFTER pulling through ParIterator to keep input chunks in phase with output
     }
   }
```
nh13 (Member), Aug 6, 2022: I am confused about why the chunk size passed to `toAsync` was reduced. Don't we want this value to be a multiple of the input `chunkSize`? Furthermore, since the ParIterator is presumably processing `threads` chunks at any one time, I think this should be `chunkSize * threads`. Suggested change:

```
-      }.toAsync(chunkSize).flatten
+      }.toAsync(chunkSize * threads).flatten
```

Reviewer (Member), on the added comment line `// Flatten AFTER pulling through ParIterator to keep input chunks in phase with output`: If I understand this correctly, we previously got chunks out of order in some cases? Suggested change:

```
-      // Flatten AFTER pulling through ParIterator to keep input chunks in phase with output
+      // Flatten AFTER pulling through ParIterator to keep the iterator in a stable order
```

Author (Contributor): The concern is not about records being out of order, but about the number of chunks that are getting pulled through the iterator at a time. Clint's diagram sums it up better, I think:

#867 (comment)

In this instance, I am referring to a "source molecule" as all records within a group output by GroupReadsByUmi.

The goal of the change in flattening is that the same number of source molecules (not SAM records) are pulled through the end as the beginning. There will be many fewer SAM records after flattening, since we go from `<group size>` records down to 2.

If we flatten before, and use `.toAsync` on `chunkSize` records (not groups), then there would be roughly half a chunk's worth of groups getting pulled through `.toAsync` for every chunk that goes in. By flattening after, we are pulling the same number of groups through the async iterator at a time as through the ParIterator.
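The phase argument can be sketched numerically. The sizes below are hypothetical, and the sketch assumes each source molecule yields a single consensus read pair (two records), as the comment above describes:

```scala
// Hypothetical illustration: why flattening AFTER .toAsync keeps the async
// buffer counted in source molecules rather than flattened consensus records.
val chunkSize         = 1024 // source molecules per ParIterator chunk
val consensusPerGroup = 2    // each source molecule yields ~2 consensus records (R1 + R2)

// Flatten BEFORE .toAsync(chunkSize): the buffer counts flattened records, so
// only chunkSize / consensusPerGroup source molecules fit per buffered chunk,
// i.e. half a chunk, out of phase with the ParIterator's 1024-molecule chunks.
val moleculesBufferedIfFlattenedFirst = chunkSize / consensusPerGroup

// Flatten AFTER: the buffer counts groups, so exactly chunkSize source
// molecules are in flight, in phase with the input chunking.
val moleculesBufferedIfFlattenedLast = chunkSize
```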
