Skip to content

Commit 25f7b2b

Browse files
committed
Update paragraph defaults and subset logic
1 parent 482aa9f commit 25f7b2b

File tree

1 file changed

+11
-6
lines changed

1 file changed

+11
-6
lines changed

SequenceAnalysis/src/org/labkey/sequenceanalysis/run/alignment/ParagraphStep.java

Lines changed: 11 additions & 6 deletions
Original file line numberDiff line numberDiff line change
@@ -45,10 +45,10 @@ public ParagraphStep()
4545
put("allowBlank", false);
4646
}}, null),
4747
ToolParameterDescriptor.create("doBndSubset", "Remove BNDs", "If the reference VCF contains BNDs, selecting this option will cause the job to remove them prior to paragraph", "checkbox", new JSONObject(){{
48-
put("checked", true);
48+
put("checked", false);
4949
}}, false),
5050
ToolParameterDescriptor.create("useOutputFileContainer", "Submit to Source File Workbook", "If checked, each job will be submitted to the same workbook as the input file, as opposed to submitting all jobs to the same workbook. This is primarily useful if submitting a large batch of files to process separately. This only applies if 'Run Separately' is selected.", "checkbox", new JSONObject(){{
51-
put("checked", true);
51+
put("checked", false);
5252
}}, false)
5353
));
5454
}
@@ -113,20 +113,25 @@ else if (!svVcf.exists())
113113
boolean doBndSubset = ctx.getParams().optBoolean("doBndSubset", false);
114114
if (doBndSubset)
115115
{
116-
File vcfNoBnd = new File(ctx.getOutputDir(), SequenceAnalysisService.get().getUnzippedBaseName(svVcf.getName()) + "nobnd.vcf.gz");
116+
File vcfNoBnd = new File(ctx.getOutputDir(), SequenceAnalysisService.get().getUnzippedBaseName(svVcf.getName()) + "pgSubset.vcf.gz");
117117
File vcfNoBndIdx = new File(vcfNoBnd.getPath() + ".tbi");
118118
if (vcfNoBndIdx.exists())
119119
{
120-
ctx.getLogger().debug("Index exists, will no repeat BND subset");
120+
ctx.getLogger().debug("Index exists, will no repeat VCF subset");
121121
}
122122
else
123123
{
124124
SelectVariantsWrapper svw = new SelectVariantsWrapper(ctx.getLogger());
125125
List<String> selectArgs = new ArrayList<>();
126126
selectArgs.add("-select");
127127
selectArgs.add("SVTYPE != 'BND'");
128+
selectArgs.add("-select");
129+
selectArgs.add("!(vc.hasAttribute('SVTYPE') && vc.getAttribute('SVTYPE') == 'INS' && vc.hasSymbolicAlleles() && !vc.hasAttribute('SEQ'))");
130+
selectArgs.add("-select");
131+
selectArgs.add("POS > 150");
132+
selectArgs.add("--exclude-filtered");
128133
selectArgs.add("--exclude-filtered");
129-
selectArgs.add("--exclude-non-variants");
134+
selectArgs.add("--sites-only-vcf-output");
130135

131136
svw.execute(ctx.getSequenceSupport().getCachedGenome(inputFiles.get(0).getLibrary_id()).getWorkingFastaFile(), svVcf, vcfNoBnd, selectArgs);
132137

@@ -173,7 +178,7 @@ else if (!svVcf.exists())
173178
try (PrintWriter writer = PrintWriters.getPrintWriter(coverageFile); SamReader reader = SamReaderFactory.makeDefault().open(so.getFile()))
174179
{
175180
SAMFileHeader header = reader.getFileHeader();
176-
if (header.getReadGroups().size() == 0)
181+
if (header.getReadGroups().isEmpty())
177182
{
178183
throw new PipelineJobException("No read groups found in input BAM");
179184
}

0 commit comments

Comments
 (0)