Skip to content

Commit a8f8d61

Browse files
authored
Merge pull request #121 from PolinaBevad/f_fix_insertion_end
Fixed issue with coordinate end for insertions
2 parents fbf78af + 2cd1b55 commit a8f8d61

13 files changed

+126
-104
lines changed

src/main/java/com/astrazeneca/vardict/VarDict.java

Lines changed: 1 addition & 8 deletions
Original file line numberDiff line numberDiff line change
@@ -3410,13 +3410,7 @@ public int compare(Variant o1, Variant o2) {
34103410
vref.msint = msint.length();
34113411
vref.shift3 = shift3;
34123412
vref.sp = sp;
3413-
// In perl it was changed to simple ep
3414-
final Matcher pnMtch = PLUS_NUMBER.matcher(genotype);
3415-
if (pnMtch.find()) {
3416-
vref.ep = sp + toInt(pnMtch.group(1));
3417-
} else {
3418-
vref.ep = ep;
3419-
}
3413+
vref.ep = ep;
34203414
vref.refallele = refallele;
34213415
vref.varallele = varallele;
34223416
vref.genotype = genotype;
@@ -4578,7 +4572,6 @@ private static List<Object[]> fillTmp(Map<Integer, Map<String, Integer>> changes
45784572
private static final Pattern BEGIN_MINUS_NUMBER_ANY = Pattern.compile("^-\\d+(.*)");
45794573
private static final Pattern UP_NUMBER_END = Pattern.compile("\\^(\\d+)$");
45804574
private static final Pattern ATGSs_AMP_ATGSs_END = Pattern.compile("(\\+[ATGC]+)&[ATGC]+$");
4581-
private static final Pattern PLUS_NUMBER = Pattern.compile("\\+(\\d+)");
45824575
private static final Pattern SA_CIGAR_D_S_5clip = Pattern.compile("^\\d\\d+S");
45834576
private static final Pattern SA_CIGAR_D_S_3clip = Pattern.compile("\\d\\dS$");
45844577

Binary file not shown.

testdata/fastas/hg38.fa.csv

Lines changed: 1 addition & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -0,0 +1 @@
1+
chr6,137218001,137220900,AGTCTGTGCCTAAGTGCAAGCTCTTACCGCAAAGTACTGCAACTGCCCATGTGGATGACTGACTAGAGCCtagaagagcagttaagaacttggactctggagccaaattgagcagctccccactgagtggctatgacctctctgccagttgggcaggcctctccgtaactcaatttctcgtccataaagagagagacaaataacgcctactccagaagattgttgtgaACACAGAACCAAAACGTGGACCTTTCAAAGTCCCTATGAATCATAAATCATAATAAAAAAAAGAAAACTGAATTGAAAAGGTTTACTGTTTTCTCTGGAGCTCGTAATCACAATTACTCTGCACTTCAGAAAAGCCACCCTCAACATTTGTTTTCTAGGAAATGTCAATAAGCAGGTGGAAATAAAATGCTCCGAAGAACAAACCCGTACGAAGAGACCTACTGCCAAATCTGCTAGTGAGTGCCGGCAATCCACCACTTCCAGACTGAGACCTAAGACGGACTGCCACTTACTTCTCAGCTGCCACTTACTTCTCAGCTGGCGACATAATGCATACTTTCCTACCCTAAGCACTTTGAGTCCCCCCCCCCACCCCCGCTAAGAAAGAAGTATTTAAGCCACGAACTGAGACCACGATGCCACATGCTGATCAGGACACTCAcagtcatgcgtcacttaacgatggagatccgttctgagaaatggagaaatgtccccttaggcaatttcttcgggcagtagaaacccagacaaacccagatgacacagcctactgctcttaggtcatgaacctgtacagcctgtcactgcactgaacactgcaggcaaccgtagcatactagtgagtatctgcgtatctaaccataaaaaaaggtacagtaagaagacgatattataatctttgagaccacgctgtcccacattgaccagcaacgtccttctgcagcgcataaTCGTATTTAAAAGTGGATTACAAGAGTCGGAAAAACAAGCGGCGTGATTTGTTGTGGCGGCAACCAGGGAAGAGGCAGGAGAAAGGCAACCGACGAGTTCAAACCACGGAGCCCCAGTCTCGCGACCCCACCTCGCGTCCCCGTCGCCCGCTCAGGGCCCGACGCAGGGGTCCCGGGCTAGGGCGACCTCGGAGAAGCGGGGCGGGGCTTCCCGGCTGGGGCGGATCCCTCCCTCCCTCTCGTCCCGACCCGGCCGCAGCCCTGCCGCGAACGACGGTACCTGAGGACGGCCCCAGATCCGCGGTGCCCATCTCAGCCCTGCTCACACCCTGCATGACAAGGGGTAGGAGAAAGAGGAGAGCCATGCTGCTACCGACGGTCGCTGGCTCCAACCCCGAGCGCCTGCGGGACCAGCCCAGCACTGCCCTCCAGCCCCGGCCTTACGTCACTTCCGTCACCGGGGTCTGTGCCGGCGTCGGCAGGAGGCGGGACCAGGGCGTGGGCGGGGTCAAGTCCGGGAAGCCGCAGGAGGCGGACTCAGGCGCAGCACCCAGCAGTGAGCACGGCGTCGTGCGGTCGGGACCTGGACTTCTGGGTGTGGGAGGAATTTGAGTGCAAAGGTTAAGGTCTTTCAACCTGGCACCCCATTCTGCAATTCTTCTTCCAGTTTTTTTCGGTTTCCTGGGGTTGTGCAAGTTTGCATTAGGCCACAGCCGAGCCACAATCCTTATTTTACTAACTCTTGGACTTCACCTGGTTGTCTTGGAGCCTGACATTTttagaagagaatgagacttcaaaagccatttccagtccctgctttttcatttgaggaacctgagacttagctagtgaaatggtttgtgcagattcccacagcCCAAATCAAATCGGCTTGACCAAGAACTACTTTGTTCTTGGAGAAAAAAACTATTTGCATTACCTTCTCAGCAATTCAGTGTCAAATCAGTTTATCAGGCAGCCTCTCATGAAGAGGTCTGCTCTCTTACCTCTCTGGGTTTGTCTGTTATTTTGCATCTCTCCTATTCCACTGCAGCCACATTGCTAAGTCCTTCAGCGCTTGTGCTCAAACATGCGAATGTCTAATGATCTCACCTGTTTCAATTCTCTGAGTATCATGAACTTTTGTTAAAAattttaaattgcaacacaccttctcctcctccttaccccgccctactgttttttcatggcacttttcaccttgctgtacactataatatacaccttgatatttgttttcttctccttctaaaatgtaagctccgtagagctgacatctttacttgGCACTCAATTAGTATTTGTTGAGTGAAAGACTGCATGATTACTAGTGTTAAGGAAAATTTTTAAAGAGGGAAAATCCTTATAAAGACACTATATAAACTAGAGGTATTATCAGCCAGATCATTTTACTTGTATTAATAAATCTCTTAGCTcagtacttctcaaacttcaacatacatgtgaaccatctggggatcttgataaaatgcagatttggattcagtagttctaattcaggttgggtcttgagattttgtatttcggacaaaatgcacaggggatgctggtgcccctttcaacaggaccacactttgaatCAGAAGAATTTAGCTCAATCTAGACTAAGTTTAGGGAGAATATTTCCTTTGATGTGTTTCTGATGTCCACTATATGAAAGACACCTTCTAGTCGTTGTAAGGATGCAAGGATAAATAACTGATCTTTACCGTTTAGGCGTCTATGGAGTAGGACAAAATATGATATCCAGTTTGTAAACATTTTTGTGGTACTtgtcacaggctgggttaccctggcagtaaactctgaggtcgagattaaggtataaggcattgattgattagggagtgctcttggaataaacgtctgtgaaggggaggtggaggaagcaga

testdata/integrationtestcases/Amplicon;hg19.fa;Colo829-18_S3-sort.bam;chr1;933866-934466;933866-934466;-a 100.95 -D;.txt

Lines changed: 1 addition & 2 deletions
Original file line numberDiff line numberDiff line change
@@ -2,5 +2,4 @@ Amplicon,hg19.fa,Colo829-18_S3-sort.bam,chr1,933866,934466,933866,934466,-a 10:0
22
Colo829-18_S3-sort testbed chr1 934099 934099 G C 4 4 0 0 2 2 C/C 1.0000 0;2 50.0 1 32.8 1 60.0 3.000 1.0000 0 0 3.000 1 4.0 3 3 CAACGCGGGGGCAGAGGGCG GTGCGCATGCGGGGCTGCAG chr1:933867-934466 SNV 1 1 0 0 C:4:F-2:R-2:1.000:2:50.0:true:32.8:true:1.000:60.0:3.0 Good0 4 4 0 0 2 2 C/C 1.0000 0;2 50.0 1 32.8 1 60.0 3.000 1.0000 0 chr1:933867-934466
33
Colo829-18_S3-sort testbed chr1 934106 934106 A G 4 2 1 0 1 1 A/G 0.5000 0;2 60.0 0 41.0 0 60.0 4.000 0.6667 0 0 1.000 1 3.5 2 3 GGGGCAGAGGGCGGGTGCGC TGCGGGGCTGCAGGGATGCG chr1:933867-934466 SNV 1 1 0 0 A:1:F-1:R-0:0.250:0:40.0:false:41.0:false:0.333:60.0:2.0 & G:2:F-1:R-1:0.500:2:60.0:false:41.0:false:0.667:60.0:4.0 & G&G:1:F-0:R-1:0.250:0:41.0:false:19.5:false:0.000:60.0:0.0 Good0 4 2 1 0 1 1 A/G 0.5000 0;2 60.0 0 41.0 0 60.0 4.000 0.6667 0 chr1:933867-934466
44
Colo829-18_S3-sort testbed chr1 934144 934144 C G 8 6 0 0 2 4 G/G 0.7500 0;2 17.0 1 36.7 1 60.0 12.000 0.6000 0 0 2.000 1 2.8 6 10 GCGGAGGGGAGGGCGCGGAG GGAGGGCGCGGAGCGGAGGG chr1:933867-934466 SNV 1 1 0 1 G:6:F-2:R-4:0.750:2:17.0:true:36.7:true:0.600:60.0:12.0 & I+GGAGG:2:F-1:R-1:0.250:2:22.0:false:31.5:true:0.100:60.0:1.0 & I+GGAGGGCGCGGAGCGGAGGGGAGGGCGCGGAGCGGAGG:3:F-1:R-2:0.375:2:35.3:true:35.2:true:0.300:60.0:6.0 Good0 8 6 0 0 2 4 G/G 0.7500 0;2 17.0 1 36.7 1 60.0 12.000 0.6000 0 chr1:933867-934466
5-
Colo829-18_S3-sort testbed chr1 934144 934182 C CGGAGGGCGCGGAGCGGAGGGGAGGGCGCGGAGCGGAGG 8 3 0 0 1 2 G/+38 0.3750 0;2 35.3 1 35.2 1 60.0 6.000 0.3000 0.3750 21 4.000 1 4.3 3 10 GCGGAGGGGAGGGCGCGGAG GGAGGGCGCGGAGCGGAGGG chr1:933867-934466 Insertion 1 1 0 1 G:6:F-2:R-4:0.750:2:17.0:true:36.7:true:0.600:60.0:12.0 & I+GGAGG:2:F-1:R-1:0.250:2:22.0:false:31.5:true:0.100:60.0:1.0 & I+GGAGGGCGCGGAGCGGAGGGGAGGGCGCGGAGCGGAGG:3:F-1:R-2:0.375:2:35.3:true:35.2:true:0.300:60.0:6.0 Good0 8 3 0 0 1 2 G/+38 0.3750 0;2 35.3 1 35.2 1 60.0 6.000 0.3000 0.3750 chr1:933867-934466
6-
5+
Colo829-18_S3-sort testbed chr1 934144 934144 C CGGAGGGCGCGGAGCGGAGGGGAGGGCGCGGAGCGGAGG 8 3 0 0 1 2 G/+38 0.3750 0;2 35.3 1 35.2 1 60.0 6.000 0.3000 0.3750 21 4.000 1 4.3 3 10 GCGGAGGGGAGGGCGCGGAG GGAGGGCGCGGAGCGGAGGG chr1:933867-934466 Insertion 1 1 0 1 G:6:F-2:R-4:0.750:2:17.0:true:36.7:true:0.600:60.0:12.0 & I+GGAGG:2:F-1:R-1:0.250:2:22.0:false:31.5:true:0.100:60.0:1.0 & I+GGAGGGCGCGGAGCGGAGGGGAGGGCGCGGAGCGGAGG:3:F-1:R-2:0.375:2:35.3:true:35.2:true:0.300:60.0:6.0 Good0 8 3 0 0 1 2 G/+38 0.3750 0;2 35.3 1 35.2 1 60.0 6.000 0.3000 0.3750 chr1:933867-934466

0 commit comments

Comments
 (0)