|
44 | 44 | # version 2.1 - change default to SAM tag instead of read name
|
45 | 45 | # version 2.2 - bug fix, improve optical detection
|
46 | 46 | # version 2.3 - add explicit support for cram, remove Bio::ToolBox dependency,
|
47 |
| -# fix untagged paired-end counting |
| 47 | +# fix untagged paired-end counting, fix missing header @PG |
48 | 48 |
|
49 | 49 | #### Inputs
|
50 | 50 | my $infile;
|
@@ -132,29 +132,31 @@ END
|
132 | 132 | USAGE: bam_umi_dedup.pl --in in.bam --out out.bam
|
133 | 133 |
|
134 | 134 | OPTIONS:
|
135 |
| - Required: |
136 |
| - -i --in <file> The input bam file, should be sorted and indexed |
137 |
| - -o --out <file> The output bam file |
| 135 | + Required: |
| 136 | + -i --in <file> The input bam file, should be sorted and indexed |
| 137 | + -o --out <file> The output bam file |
138 | 138 |
|
139 |
| - UMI options: |
140 |
| - -u --umi <string> SAM tag name for UMI sequence. Default 'RX' |
141 |
| - Specify 'name' when UMI appended to read name. |
142 |
| - -m --mark Mark duplicates (flag 0x400) instead of discarding |
143 |
| - -t --tolerance <int> UMI sequence edit distance tolerance ($edit_tolerance) |
144 |
| - --indel <int> Set insertion/deletion penalty score ($indel_score) |
145 |
| - --skip <int> Skip mismatch detection if depth exceeds ($skip_mismatch_depth) |
146 |
| -
|
147 |
| - Other options: |
148 |
| - -f --fasta <file> Provide fasta file for Cram files |
149 |
| - -d --distance <int> Set optical duplicate distance threshold. |
150 |
| - Use 100 for unpatterned flowcell (HiSeq) or |
151 |
| - 2500 for patterned flowcell (NovaSeq). Default 0. |
152 |
| - --coord <string> Provide the tile:X:Y integer 1-base positions in the |
153 |
| - read name for optical checking. For Illumina CASAVA 1.8 |
154 |
| - 7-element names, this is 5:6:7 (default) |
155 |
| - -c --cpu <int> Specify the number of forks to use ($cpu) |
156 |
| - --samtools <path> Path to samtools ($sam_app) |
157 |
| - -h --help Display full description and help |
| 139 | + UMI options: |
| 140 | + -u --umi <string> SAM tag name for UMI sequence. Default 'RX' |
| 141 | + Specify 'name' when UMI appended to read name. |
| 142 | + -m --mark Mark duplicates (flag 0x400) instead of discarding |
| 143 | + -t --tolerance <int> UMI sequence edit distance tolerance ($edit_tolerance) |
| 144 | + --indel <int> Set insertion/deletion penalty score ($indel_score) |
| 145 | + --skip <int> Skip mismatch detection if depth exceeds ($skip_mismatch_depth) |
| 146 | +
|
| 147 | + Other options: |
| 148 | + -f --fasta <file> Provide indexed fasta file for Cram files |
| 149 | + -d --distance <int> Set optical duplicate distance threshold. |
| 150 | + Use 100 for unpatterned flowcell (HiSeq) or |
| 151 | + 2500 for patterned flowcell (NextSeq or NovaSeq6000) |
| 152 | + or 200 for NovaseqX. Default 0. |
| 153 | + --coord <string> Provide the tile:X:Y integer 1-base positions in the |
| 154 | + read name for optical checking. For Illumina CASAVA 1.8 |
| 155 | + 7-element names, this is 5:6:7 (default) |
| 156 | + -c --cpu <int> Specify the number of forks to use ($cpu) |
| 157 | + --samtools <path> Path to samtools ($sam_app) |
| 158 | + --nosam Do not use samtools for final concatenation (slower) |
| 159 | + -h --help Display full description and help |
158 | 160 |
|
159 | 161 | END
|
160 | 162 |
|
|
0 commit comments