-
Notifications
You must be signed in to change notification settings - Fork 596
Commit
This commit does not belong to any branch on this repository, and may belong to a fork outside of the repository.
MarkDuplicatesSpark improvements checkpoint (#4656)
Co-authored-by: Louis Bergelson <[email protected]> First part of a major rewrite of MarkDuplicatesSpark to improve performance. Tool still has a number of known issues, but is much faster than the previous version.
- Loading branch information
1 parent
3e41aa5
commit 7641f53
Showing
28 changed files
with
1,119 additions
and
432 deletions.
There are no files selected for viewing
23 changes: 23 additions & 0 deletions
23
...stitute/hellbender/cmdline/argumentcollections/MarkDuplicatesSparkArgumentCollection.java
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
Original file line number | Diff line number | Diff line change |
---|---|---|
@@ -0,0 +1,23 @@ | ||
package org.broadinstitute.hellbender.cmdline.argumentcollections; | ||
|
||
import org.broadinstitute.barclay.argparser.Argument; | ||
import org.broadinstitute.hellbender.tools.spark.transforms.markduplicates.MarkDuplicatesSpark; | ||
import org.broadinstitute.hellbender.utils.read.markduplicates.MarkDuplicatesScoringStrategy; | ||
import org.broadinstitute.hellbender.utils.read.markduplicates.OpticalDuplicateFinder; | ||
|
||
import java.io.Serializable; | ||
|
||
|
||
/** | ||
* Argument collection that groups the duplicate-marking command-line options
* declared below: the scoring strategy used to choose the non-duplicate among
* candidates, and a switch controlling whether unmapped mates of
* duplicate-marked reads are themselves marked as duplicates.
*
* The class is {@link Serializable} and pins an explicit serialVersionUID.
*
* NOTE(review): the previous summary described this as being for tools that
* mark optical duplicates, but neither argument declared here is specific to
* optical duplicates -- confirm the intended scope.
*/ | ||
public final class MarkDuplicatesSparkArgumentCollection implements Serializable { | ||
// Explicit serialization version for this Serializable class.
private static final long serialVersionUID = 1L; | ||
|
||
// Exposed as DUPLICATE_SCORING_STRATEGY (short name DS); defaults to SUM_OF_BASE_QUALITIES.
// Public and non-final, presumably so the argument parser can assign it -- verify.
@Argument(shortName = "DS", fullName = "DUPLICATE_SCORING_STRATEGY", doc = "The scoring strategy for choosing the non-duplicate among candidates.") | ||
public MarkDuplicatesScoringStrategy duplicatesScoringStrategy = MarkDuplicatesScoringStrategy.SUM_OF_BASE_QUALITIES; | ||
|
||
// Argument name is taken from MarkDuplicatesSpark.DO_NOT_MARK_UNMAPPED_MATES; defaults to false.
// Per the doc string, enabling it leaves unmapped mates of duplicate-marked reads unmarked.
@Argument(fullName = MarkDuplicatesSpark.DO_NOT_MARK_UNMAPPED_MATES, doc = "Enabling this option will mean unmapped mates of duplicate marked reads will not be marked as duplicates.") | ||
public boolean dontMarkUnmappedMates = false; | ||
} |
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
Oops, something went wrong.