In this notebook I explore VarScan 'SNP' positions in an R2 untreated sample: DS14

  • I'm looking at the alignment context using IGV, and at the information from all samples using mpileup

In [24]:
#load modules

import os
import subprocess
import fnmatch
import pandas as pd
import matplotlib.pyplot as plt
import numpy as np
%matplotlib inline
import gc

from IPython.core.display import Image 
In [2]:
#go to working directory, where the data is

WORK_DIR="/nagyvinyok/adat83/sotejedlik/ribli/dt40/snp/varscan"
os.chdir(WORK_DIR)
In [3]:
%%bash
# Print the column schema of the vsc file: one "index name" pair per header field

head -n 1 DS14_DS15.vsc.snp | awk '{ for (col = 1; col <= NF; col++) print col " " $col }'
1 chrom
2 position
3 ref
4 var
5 normal_reads1
6 normal_reads2
7 normal_var_freq
8 normal_gt
9 tumor_reads1
10 tumor_reads2
11 tumor_var_freq
12 tumor_gt
13 somatic_status
14 variant_p_value
15 somatic_p_value
16 tumor_reads1_plus
17 tumor_reads1_minus
18 tumor_reads2_plus
19 tumor_reads2_minus
20 normal_reads1_plus
21 normal_reads1_minus
22 normal_reads2_plus
23 normal_reads2_minus

Look at positions with very low p-value

  • p < 0.0001

  • It looks like there is some clustering, e.g. around 4.9M and 10.9M

    • LOH in germline pair?
In [10]:
#select some very unlikely false positives (somatic p < 0.0001)

VSC_FILE='DS14_DS15.vsc.snp'
N_HEAD_LINES=600000    #only this many leading lines of the file are scanned
MAX_SOMATIC_P=0.0001   #upper cutoff applied to column 15 (somatic_p_value)

#column 13 is somatic_status and column 15 is somatic_p_value in the vsc header
best_pos_cmd='''
head -n %d %s | awk ' $13 == "Somatic" &&  $15 < %s  { print }'
''' % (N_HEAD_LINES,VSC_FILE,MAX_SOMATIC_P)

#universal_newlines=True makes check_output return text on Python 3 as well
best_pos=subprocess.check_output(best_pos_cmd,executable='/bin/bash',shell=True,
                                 universal_newlines=True).strip()

#''.split('\n') would give [''], i.e. one bogus empty record; use an empty list instead
best_pos_list=best_pos.split('\n') if best_pos else []
print('\n'.join(best_pos_list))
1	3089329	G	C	21	2	8.7%	G	9	19	67.86%	S	Somatic	1.0	1.5902230433128865E-5	2	7	10	9	9	12	1	1
1	7971336	A	G	9	0	0%	A	0	7	100%	G	Somatic	1.0	8.741258741258763E-5	0	0	6	1	5	4	0	0
1	15680078	C	T	14	1	6.67%	C	6	17	73.91%	Y	Somatic	1.0	4.6097265229634116E-5	2	4	10	7	4	10	1	0
1	23852983	G	A	20	4	16.67%	G	8	20	71.43%	R	Somatic	1.0	8.332746607460198E-5	3	5	7	13	13	7	3	1
1	24119873	A	G	21	5	19.23%	A	8	21	72.41%	R	Somatic	1.0	8.620610465070243E-5	3	5	8	13	10	11	2	3
1	35282831	A	G	16	0	0%	A	12	19	61.29%	R	Somatic	1.0	2.023755659362276E-5	5	7	8	11	7	9	0	0
1	35282834	C	T	16	0	0%	C	13	21	61.76%	Y	Somatic	1.0	1.3783142154752013E-5	5	8	9	12	6	10	0	0
1	37277423	A	T	16	1	5.88%	A	5	13	72.22%	W	Somatic	1.0	6.410284593773301E-5	3	2	5	8	8	8	1	0
1	52021699	T	C	12	1	7.69%	T	2	20	90.91%	C	Somatic	1.0	1.303902128632086E-6	2	0	5	15	4	8	0	1
1	60425138	A	G	14	3	17.65%	A	3	17	85%	G	Somatic	1.0	5.038430825537257E-5	2	1	7	10	3	11	1	2
1	77729845	T	C	17	0	0%	T	10	15	60%	Y	Somatic	1.0	3.3127390082272456E-5	6	4	4	11	12	5	0	0
1	82572266	T	C	34	7	17.07%	T	21	28	57.14%	Y	Somatic	1.0	9.010784548928963E-5	7	14	16	12	21	13	5	2
1	86350977	T	C	10	0	0%	T	2	11	84.62%	C	Somatic	1.0	5.7688979481952875E-5	2	0	5	6	5	5	0	0
1	86350987	T	C	8	0	0%	T	1	11	91.67%	C	Somatic	1.0	7.144558228149532E-5	1	0	6	5	3	5	0	0
1	86350992	T	C	9	0	0%	T	0	9	100%	C	Somatic	1.0	2.056766762649123E-5	0	0	5	4	3	6	0	0
1	86350997	T	C	9	0	0%	T	0	11	100%	C	Somatic	1.0	5.9537985234579775E-6	0	0	6	5	4	5	0	0
1	86351002	T	C	9	0	0%	T	0	12	100%	C	Somatic	1.0	3.402170584833112E-6	0	0	7	5	3	6	0	0
1	86351007	T	C	8	1	11.11%	T	0	11	100%	C	Somatic	1.0	7.144558228149532E-5	0	0	6	5	3	5	1	0
In [11]:
#collect the BAM file names, sorted; they are used to label the samples later

rm_dup_dir='/nagyvinyok/adat83/sotejedlik/dt40/rmdup/'

#keep every '*.bam' entry of the directory, explicitly excluding '*.bam.bai' index files
fnames=sorted(
    entry for entry in os.listdir(rm_dup_dir)
    if fnmatch.fnmatch(entry, '*.bam') and not fnmatch.fnmatch(entry, "*.bam.bai")
)
In [12]:
#define function to run pileup command

def run_pileup(chrom,pos):
    """Print the samtools mpileup columns of every BAM in `fnames` at one position.

    Runs `samtools mpileup -Q 30 -B` restricted to the single-base region
    chrom:pos-pos on all files listed in the module-level `fnames` (located in
    `rm_dup_dir`), then prints:
      * one header line: chromosome, position, reference base
      * one line per input file: sample label, read depth, read bases

    Parameters
    ----------
    chrom : chromosome name (anything str() turns into the reference name)
    pos   : 1-based position (int or numeric string)

    Raises
    ------
    subprocess.CalledProcessError if samtools exits with a non-zero status.
    """
    samtools="/nagyvinyok/adat87/home/ribli/tools/samtools-0.1.19/samtools"
    ref_fa="/nagyvinyok/adat87/home/ribli/input/index/gallus/Gallus_gallus.Galgal4.74.dna.toplevel.fa"

    # Build the command as an argument list: no shell is needed, so nothing in
    # chrom/pos or the file names can be interpreted by a shell.
    region='%s:%s-%s' % (chrom,pos,pos)
    cmd_mpileup=[samtools,'mpileup','-Q','30','-B','-f',ref_fa,'-r',region]
    cmd_mpileup+=[os.path.join(rm_dup_dir,x) for x in fnames]

    # universal_newlines=True makes check_output return text on Python 3 as well
    pup_out=subprocess.check_output(cmd_mpileup,universal_newlines=True)

    # Strip the trailing newline so it does not end up inside the last field;
    # the region is a single base, so at most one line is expected.
    pup_lines=pup_out.strip('\n').split('\n')
    pup_list=pup_lines[0].split('\t')

    # Without this guard an empty result crashes below with an IndexError.
    if len(pup_list) < 3:
        print('%s %s: no pileup line returned' % (chrom,pos))
        return

    print('%s %s %s' % (pup_list[0],pup_list[1],pup_list[2]))

    # After chrom/pos/ref each input file contributes 3 columns:
    # depth, read bases, base qualities (the qualities are not printed).
    n_samples=(len(pup_list)-3)//3
    for i in range(n_samples):
        # Sample label = file stem minus a fixed 21-character suffix
        # NOTE(review): assumes every BAM name carries that suffix - confirm
        sample=fnames[i].split('.')[0][:-21]
        print('%s %s %s' % (sample,pup_list[3+3*i],pup_list[4+3*i]))
        

Check a position:

  • 1:3089329
  • Fluctuation + base loss because of base quality

IGV snapshot:

In [28]:
#IGV snapshot for 1:3089329; filename= makes IPython always treat the string as a file path
Image(filename='/home/ribli/DT40/SNP/varscan/igv_snapshots/ds14__hits/1-3089329.png')
Out[28]:

Mpileup line:

In [13]:
#show the VarScan record of hit i, then the pileup of all samples at that site
i=0
record=best_pos_list[i]
print(record)
print('')
#columns 1 and 2 of the record are chrom and position; do not hard-code the chromosome
chrom,pos=record.split('\t')[:2]
run_pileup(chrom,pos)
1	3089329	G	C	21	2	8.7%	G	9	19	67.86%	S	Somatic	1.0	1.5902230433128865E-5	2	7	10	9	9	12	1	1

1 3089329 G
DS10 17 cC,,ccC,,c..cC,,,
DS11 27 ,c....C,.,,,c.ccc.cc.CcC.cc
DS14 28 C,ccc.Ccc,C,C,C,CC.CccC,c,C^]c
DS15 23 .,,C...,.,..,c,,,,,,,..
DS16 16 .,C.c.CC.,Cccc,,
DS18 26 cc,,.c.,.C.cCc,c,CCc,C,C.,
DS1 30 .Cc,C.,C.CC,c,cCc,.,,.C,Cc.CC,
DS26 19 ..,,CC.,,,,,,,,.CcC
DS27 32 .c.c,.c,,..,..,C.C,Cc,,c,cc,C,,c
DS2 20 ,..cc,cCC.,cC,.CcC,C
DS33 18 .c,,Cc.,CC,,c..,cc
DS34 24 C.c.C,.c..C.,,cC,,c,C,,c
DS35 17 ,.cCC..C,.,..,..C
DS36 18 ,cC,c.,,CC,.cC,,,C
DS37 24 cC...c..c.c,,c.c,,CcCCcc
DS3 17 ccCc..CCCC.,,,CC,
DS41 18 ccC.C.ccC.c,CCCc.,
DS42 30 .cC,,,cCC,.,,cc.CC,cC...c,,,.C
DS43 16 .CC.Ccc,,,Cc,.C,
DS44 19 .C,c.,c,cc,,,,,,.,C
DS45 24 cc,CC,cCCC,c,ccCCccc.cC,
DS46 28 ,,,CCc,..,C.,,c..C,c,,cc,CCC
DS47 47 C$ccC,,CCCCcC..cCCcC...c,c.c,cc,ccc,...,c,c,cCc^],
DS48 23 CC,Ccc.,c,,cc.cc.Cc,..^],
DS49 20 CC,CCCcC,,cC.,.,,,C.
DS4 20 ..CCcc.,.,.c.c..c,cc
DS50 25 .ccCC.,..cC,c.c,,,ccCc,.C
DS51 7 .,,.,cC
DS52 22 C$c$C.Cc.,.CCC.,Cc,,CCc.
DS53 19 .c.cCc..cCc..,,,c..
DS54 33 .$.C..,c,,.cc,.,cC.C..c,cc,c.CC.Cc
DS55 29 CcCc.,Cc..Cc.C.,.CCcc...CcCcC
DS56 20 cc...,c,C,C.C.c.CccC
DS57 46 Cc.CC.cC..,C..C,Ccc,c,c.,..C..cc,..,cC,ccc.cc,
DS58 63 .$c$c$,cC.C....,c.c.,..,cC.,,,,c,CC,Ccc,,c.c.,c.,c,.c.CC,C,c.cc,.c
DS59 20 CCC.C.Cc,c.,cCCCcccc
DS5 40 ,c..,Cc,CcCc.C,,C,CC,Cc,Ccc,,C,,C,cc.Cc.
DS60 17 CCcC.CCcC.Cccc,cC
DS61 40 cc.,,cCCC,C,Cc.,c.c,,cc,C..C,cC.c,C.,cc^]C
DS62 17 .C..,cC.c.c.,CCc,
DS63 25 c,C,..Cc.,c,c.ccCcCCC.CCC
DS64 21 ..C..CC,CC..,c,,c.ccc
DS65 64 ,C,CC,.Cc.Ccc..cC.CCCCCCC,.cCcc..,.,..cCcCcCCC.c.c,,CCC.cc.,.C^].^].
DS66 22 c,c,,,,,,ccC,...,.c,,c
DS67 19 ,,,,ccc.,,..,,C,c,C
DS68 22 C,C,C,cc,ccC..,ccC.cc.
DS69 23 .$.,C,.CcC,,C.,,c,c,,cc,
DS6 27 c..C.cC.c.,c,ccc,c.,,,,,,,c
DS70 27 .$..CC,c..c...C,.,Cc...cCc..
DS71 33 ,$.cCC,.CCC.c,,cCc,c.,,ccc,.c....^]c
DS72 21 .c,cccC.,.c,ccC.c,.,,
DS73 20 .C...C.CcC.Ccc,,C..,
DS74 15 c.,.c.,,c.C.C.C
DS7 21 .C.,c,.cCcCCC.,C,,,c,
DS9 14 ,,c,.c,,,cCc..
Sample1 41 .$Cc..C,cCc,CCCCCCC,c,,c.cC,,cC.CC.ccc,cc^]C
Sample2 58 c$CC,c.c,cC..cc,cCcC,.cCC.,.c,,.,.CC.cc,.,,,CCc.,..C,CccC.c
Sample3 55 CCc.cccc,C..c.CC,cC,Cc,C,.C,c,,,,ccCcCC,cc,,c,CC...cCC,
Sample4 51 CCCcc,Ccc,,.C,C.Cc,.C,,CC.c..CcC,,CCcCc,C.c.CC.,cc^].
Sample5 48 .$..,cCC..,,ccC.c.,,cc.cccccc...,.cCcC.c.Cc,,cC,c
Sample6 32 ccc,,c,.,,,,,C..,.,CcCC.,Cc,,C,,

Check a position:

  • 1:7971336
  • indel problem
In [30]:
#IGV snapshot for 1:7971336; filename= makes IPython always treat the string as a file path
Image(filename='/home/ribli/DT40/SNP/varscan/igv_snapshots/ds14__hits/1-7971336.png')
Out[30]:
In [14]:
#show the VarScan record of hit i, then the pileup of all samples at that site
i=1
record=best_pos_list[i]
print(record)
print('')
#columns 1 and 2 of the record are chrom and position; do not hard-code the chromosome
chrom,pos=record.split('\t')[:2]
run_pileup(chrom,pos)
1	7971336	A	G	9	0	0%	A	0	7	100%	G	Somatic	1.0	8.741258741258763E-5	0	0	6	1	5	4	0	0

1 7971336 A
DS10 8 ,.......
DS11 10 ..........
DS14 7 GGGGGgG
DS15 9 ,..,.,.,.
DS16 8 ..,...,.
DS18 10 ...,,..,,.
DS1 6 ....,.
DS26 10 ...,.,,...
DS27 10 .......,..
DS2 11 .,.........
DS33 13 .......Gg,,.,
DS34 8 ...,..,.
DS35 3 ..,
DS36 9 ,...,,..,
DS37 7 .,.,.,.
DS3 3 GGG
DS41 7 .,....,
DS42 13 ..,,,..,....,
DS43 4 .,..
DS44 14 .....,,.,.....
DS45 3 GGG
DS46 12 g.......,...
DS47 11 ..,........
DS48 4 GGGG
DS49 9 ...G.,..,
DS4 7 ..,...,
DS50 12 ....,..,....
DS51 10 .,.....,..
DS52 15 ...........,..,
DS53 11 ..,..,.,...
DS54 7 GGGGGGG
DS55 12 ...,......,,
DS56 10 ...,..,...
DS57 18 ...,....,,.,....,.
DS58 25 ...................,..,,,
DS59 6 ..,.,,
DS5 5 .,,..
DS60 3 GGG
DS61 14 .........,,..,
DS62 3 GGG
DS63 6 ,GGGG^]g
DS64 9 .,...,...
DS65 20 .,..,,.......,......
DS66 6 ....,,
DS67 9 ..,..,.,.
DS68 6 ,.....
DS69 10 .....,,...
DS6 3 ,..
DS70 5 .G.G^]G
DS71 8 ....,,.,
DS72 13 .....,,....,,
DS73 0 *
DS74 9 ....,....
DS7 9 ....,....
DS9 8 .......,
Sample1 18 ...........,...,.,
Sample2 28 g,........,.,,,..,,.,,.,.,,^!,
Sample3 20 .,.,.,.....,...,,.,,
Sample4 12 ..,..,.,.,..
Sample5 14 gg...,GGGGGgGG
Sample6 13 .......,..,..

And another one

  • 1:15680078
  • Big fluctuation in DS15
In [31]:
#IGV snapshot for 1:15680078; filename= makes IPython always treat the string as a file path
Image(filename='/home/ribli/DT40/SNP/varscan/igv_snapshots/ds14__hits/1-15680078.png')
Out[31]:
In [15]:
#show the VarScan record of hit i, then the pileup of all samples at that site
i=2
record=best_pos_list[i]
print(record)
print('')
#columns 1 and 2 of the record are chrom and position; do not hard-code the chromosome
chrom,pos=record.split('\t')[:2]
run_pileup(chrom,pos)
1	15680078	C	T	14	1	6.67%	C	6	17	73.91%	Y	Somatic	1.0	4.6097265229634116E-5	2	4	10	7	4	10	1	0

1 15680078 C
DS10 25 ...,,.tT,t.Ttt,.....T..TT
DS11 22 ..,t.ttT,TTT.t.t,,tTT,
DS14 23 ,T.tt,TTTTT,.TtTtT,Tttt
DS15 15 .,.,,,,,,,,T..,
DS16 16 ,,tttt,.,.,,.,..
DS18 25 ,Tt.,Tt.T.t.T.,.,tTtt.tTT
DS1 19 ,T,T.T..,TtT,...,,,
DS26 19 T,..T.tt,.TtTt,t.tt
DS27 19 TTtTTT.T..,,t,tt,,^]T
DS2 20 .$TTttt,.T.t,,tt.t..T
DS33 42 t$tTttT..T.t,..T.T,.tt.,Tt.T.t,.,t,TTt,t.t^].
DS34 17 t,..t,Tt.tTTt.,tt
DS35 25 ,Ttt,T..tt,,,,,Tt.,,.,,.t
DS36 17 .,TTT.ttt..T.Ttt,
DS37 17 ,,Tt.t..t.,T,t,,.
DS3 25 .tT,,.t...TTt.,,,Tt.,,.,^],
DS41 27 T.tT,T,ttT,..,ttTt.t,.t,,,.
DS42 26 ttTTt,TTT.ttTT.TTT.T,TTtt.
DS43 18 tt,.TTt.t,tTT.tTTt
DS44 17 TT,,TTT.,tt,,,..T
DS45 24 .t.TtT.,.t,,TtTTt.t,,,.A
DS46 20 .T..T,,tt.Tttt,..,tt
DS47 32 tT,,t.tt,.t,..,.,t,,,t.,TTT.,.tT
DS48 18 Ttt.,..T,.TtttTT.^]t
DS49 22 t.T..t,...,.,.,T,t,tT^],
DS4 16 TTTT.T,T.T,.TtT,
DS50 27 ,TT,..t..,T.t.Tt,.T,T.,t,T.
DS51 18 ,,,t.TTT,t.,.t.TTt
DS52 28 TTT,tT,tTtTt,...T,t.,.T.TtTT
DS53 17 ttT.T,.t,TT,t.TtT
DS54 27 ,t,.T..TTtT,tt.,,,,T,t,Tt,t
DS55 20 .,,..TT.,...t,,,.T,^].
DS56 21 ,tTtTT,ttTt,,TTt,.,T.
DS57 29 t.t.T,..t.t,,tT,,TT.T,.,,T.tT
DS58 66 ,,.TT.,,,.tTtT,t..TT,.TT..,,,.ttTt,t,,t.tT.TTt,,,tT,,.,t..TTtt...t
DS59 15 t.,,t,T,TT,t,t.
DS5 29 tt..,,,T,TT,,.TtT.t,,T.,..t..
DS60 11 t.T,..T,.,^],
DS61 40 T...tT.T.T,tTTttT.Tt,T.t..,Tt,,.t.,,T,tT
DS62 23 T..T.,.tTT.T,T.,TTtT..T
DS63 33 ,$tt.t.T,tt..tt.ttTTT,T.t,T,T,tT,^]t
DS64 31 TtTT,t.,.T.TTT..TTTtT,Tt,ttTTT^].
DS65 62 ..TTtt..tttT,,tT,T.T,.T,T.,t,,.,,.t,Tt.T..,.t,T,.T.TT.Ttt.T.Tt
DS66 28 ,TtT,,,,T,.,T,,Tt.,.t.,,T,Tt
DS67 14 ,T.T,tT,tTTTtT
DS68 19 TT.,,,,TT..t..t,.t,
DS69 23 T,tT,.,,.,,.t,ttT,t.Tt^].
DS6 35 T$,.,.tTtt.,Tt.,,,T,..t,...TTTTT,,T.
DS70 29 .TT..tT,,tTTT.T,.tttt,.t,,,t.
DS71 27 T.,tT.t.TTTt...TTTt,TT,T,T,
DS72 25 .,t,T..t,t..tT,,,.,,Tt.,T
DS73 38 .,,,,,T.tt,tT..tTT.tTTt,T.T,..,,Tt.,tT
DS74 20 .T.,.,,.TT,t,,,.ttT,
DS7 23 ttt..T,TTT.TtT.tttt.tT.
DS9 21 tT.TT,..T,..tT,t,,.t.
Sample1 49 ,,Tttt.TttT,TtTTT,,tTt..,T.,T.Tt,T...,TTtt.Ttt,.t
Sample2 57 ,$,.t,ttTT.T.,T.Tt,,TT,t,t..Tt...TTT..,Tt,t.,t.TT.t,ttT,t^].
Sample3 59 T.TT.,TT.TT,..t.,,TT,,ttTT...T..T,,.TTtT,.TtTTT,T.t.Tt,..,^],
Sample4 48 .$t,T.t.tT,,ttttt.t.tT.,TtTtT,.t,tt,T,tTT...t.,,T
Sample5 56 T$.TtTT,TT,.tT...TtT.t,.,ttT,,...t.,T.ttt..,,,Tt,,tttt,TT
Sample6 43 t.,.t,t.Tt.t.,TT,tT..Tt.T.,T...t.t,Tt,,tt^],^],

And another one

  • 1:23852983
  • fluctuation + loss because of base quality
In [32]:
#IGV snapshot for 1:23852983; filename= makes IPython always treat the string as a file path
Image(filename='/home/ribli/DT40/SNP/varscan/igv_snapshots/ds14__hits/1-23852983.png')
Out[32]:
In [16]:
#show the VarScan record of hit i, then the pileup of all samples at that site
i=3
record=best_pos_list[i]
print(record)
print('')
#columns 1 and 2 of the record are chrom and position; do not hard-code the chromosome
chrom,pos=record.split('\t')[:2]
run_pileup(chrom,pos)
1	23852983	G	A	20	4	16.67%	G	8	20	71.43%	R	Somatic	1.0	8.332746607460198E-5	3	5	7	13	13	7	3	1

1 23852983 G
DS10 17 ,aaAAa,,..,AAAa,A
DS11 35 .$,.a,AA.a,,a.AAAa,aa,a,,a.,,aaAaaa^],
DS14 28 .aa.aAa,A.AaAaAa,A,aaaa,,aAa
DS15 24 ,$a..,.A....,,,A..A.,..,.
DS16 18 ..A,aaA...aAa.,.,^],
DS18 30 .aa.a,,.a.A.a.A,AA.AAAaA.,AaA,
DS1 22 .A,..,A,aAaa,..a,aA,a,
DS26 16 .,A,,A,,a,a.a.,^].
DS27 19 .,Aa.a,,.A,a,A,.aA,
DS2 28 A,,aAaa.,a,A,A.,.Aa,..a,aA,,
DS33 24 a,..Aa.,A,,,aA.aaAa,aAaA
DS34 16 a$aA,aa,a.a,,AA,^].
DS35 18 A,a,,aA,..,.Aaaa.,
DS36 17 ,a,A,A.A.aaaaA.a.
DS37 16 A.AAaa,,aAAA..Aa
DS3 12 a.,a.AA,AAA,
DS41 17 AA,..A..,,.,,,A.,
DS42 20 ,Aaa,Aa,Aa.aa,aaaaAa
DS43 19 aaa,,.a.a.A,.Aaa.a,
DS44 22 ,..,,,a.AAA....AA,a.aa
DS45 27 ,a.a.aa....a,.AA.,a,aAa,a..
DS46 23 A,,a,AAA.,.,aa,,.A.AA^].^],
DS47 46 .$,A.,.a,a,A.A,A,A,,..a,aAa,AAAA,,..aA.aA.,,A,a
DS48 20 ,Aa,.aa.,aaaA.AA,aaa
DS49 20 A.aaAaA,A,A.aa,a.A,.
DS4 21 A.,AAA,,.aAaAaAAa,Aaa
DS50 24 ..AaAA..aA.a.,..aAAa.aA^]A
DS51 20 .,A,,A.,a,..a.,aaAAa
DS52 33 ,,..A.AA,.,AA.a.,Aa,aAaaA,..aAA,,
DS53 17 ,$a.aa,.,A.AA.,a.^]A
DS54 20 ,,a.,,aa,A..,Aa.aA.^]a
DS55 27 Aa,A.A,aa.A.A,AAAaA.aaa,aa^],
DS56 19 ,,AAaA.A.AaA.,aA.aA
DS57 41 ....a.,aA,,.a,A,.AA.a.,.a.,a,.,A,a,A.A.A^]A
DS58 50 a,A,AAaAaA,,AA..aa,,.A,A,aAAaaaaaA.,A.,.,A.,,,,A,^]A
DS59 19 aaA,a.....,a,.a,AAA
DS5 22 .A.aa...A.A.AAA,.,,.A.
DS60 25 Aa,A.a.Aa.AaA...AA,aa,..a
DS61 43 A.A..,.a.A,..aA.,.A,a,,,A,A.A.,a.A,aa.,,.,.
DS62 21 .aaA.aaa,a.aAA,,,,A,,
DS63 24 aaA..AAaaA.AAA,.,a,,AaA.
DS64 25 .,..A.A,A,a,,...a,..AAAa^],
DS65 51 ,$AaAA,aA.,aaa,,.,.,AAA,,.,,..,,,a,A....,aaaAA,,a.,.
DS66 32 Aaa,Aa,,aA,A,a.,a,a.,AA.,,a,..,a
DS67 25 AAA..A.a.,Aa.a,.AA,..Aaa.
DS68 12 .,aaa,.,.A..
DS69 20 .,,a,a,A,aa,,,A.,..A
DS6 20 aA.,a,.a..Aa,A.aA.A,
DS70 16 A..a,a.,,,A,a,,^]A
DS71 26 ,a,a.....,a,,,AA..,.,.aA.,
DS72 28 Aa..a,a.,..,aA,.a,aAA.A,aa.A
DS73 17 .a.A.A.A.,a,A,.,.
DS74 20 a.aa,..A,.a.AA,Aa,aa
DS7 22 .aAA,A..AaaA..a,a.A.,,
DS9 19 aA.,...aa,a,A,,a..,
Sample1 49 ...,..,.AaA,.a.Aa,Aa.,A...AAA,.,,.,AAaA.,.,aA..aa
Sample2 50 .$A...Aa,aaaa.A.aaA,A.aa,Aa..,A,Aa.A,,,aa.,AA.AA^]A^].^]a
Sample3 41 ....AA,AAA.AAa,,A,aA.aaa,AA.A,.aaaaaa.a^]A^],
Sample4 40 A$AAa.,A,A....,.a.a,,Aa.A.,aAa.a..a,,,.a^],
Sample5 54 AAA.aa.A.A.,a.AAaa.a..,,,aa.aAaaAaa.Aa.,.Aa.a,,AA,..,.
Sample6 30 ,$,,aaA,.,,a,aA.A,A,A.aaA,,aaA^].

And another one

  • 1:35282831
  • Strange again: two adjacent SNPs just disappeared; I think the indel is too far away to be the problem
In [33]:
#IGV snapshot for 1:35282831; filename= makes IPython always treat the string as a file path
Image(filename='/home/ribli/DT40/SNP/varscan/igv_snapshots/ds14__hits/1-35282831.png')
Out[33]:
In [18]:
#show the VarScan record of hit i, then the pileup of all samples at that site
i=5
record=best_pos_list[i]
print(record)
print('')
#columns 1 and 2 of the record are chrom and position; do not hard-code the chromosome
chrom,pos=record.split('\t')[:2]
run_pileup(chrom,pos)
1	35282831	A	G	16	0	0%	A	12	19	61.29%	R	Somatic	1.0	2.023755659362276E-5	5	7	8	11	7	9	0	0

1 35282831 A
DS10 25 ,.g,gg,GG,.,.,,GGG,,,gGGg
DS11 42 ...,,,,..GGg.,gG,g,g,Gg.,g.,g,GGG..gGgggG.
DS14 31 ,g,Ggg.G,.g.g,,g..Gggg,Gg,GgGGG
DS15 16 ,,,,.,..,..,,..,
DS16 27 G.G.GG,gg..,,,..,gGGG,.G.gg
DS18 17 G$g.GgGgg,.,gg.,G,
DS1 34 g$..,g,.,,gggggg,.G,,GGgG.ggGG.ggG.
DS26 24 g$gGGGg,g.gGGg,.g..,Gg.,g
DS27 34 ,$,,.,.,Gg,..G,,G.,,g.g,g.,,gG,G.GG
DS2 33 g$,.,g.gg,..GgGG..,,.,,gG.g,g.g.,G
DS33 20 .Gggg.Gg.G,gg..GgGG,
DS34 26 ..,.,.GgGg...gG,.g,..,gGG.
DS35 24 G.,.G,ggg,g.,G...gGggg.^].
DS36 21 Ggg.,ggGgGG.gg,..,G.G
DS37 15 ,gGgg.,GgGgG.G.
DS3 27 ,,g.,,G,..,.GgGg,G.GG.,GG.G
DS41 28 gg..gg,GgG,.,G..,,.,,,.G.Ggg
DS42 38 .GGgg,..GGG.g,GGg.,g.,G.gg,gG.gG..G.G.
DS43 23 G..Gg,.,gGGg,gG,...ggg,
DS44 28 g.,,.,.$GGgggG,.ggG..,,,g,.Gg
DS45 26 GGg..g..g.,.,g,G.GGGggGg.g
DS46 25 GG,G,,,...gGg.g,,...gG.gg
DS47 49 GG.gG.G,gg.G.gg,.G..G,Gg,g..,,.G,,gg,..,GGGgG,G.G
DS48 28 Ggg,GgGgGgg..,,G.g..g.G.GG,.
DS49 27 ,.g.GGGgG,g,GG,.g.,,GgGG,GG
DS4 27 GG,g.,G,G,.GGgGGg,g.G.GG..G
DS50 34 g.GGGg,g.,GGG..G.GGG..G,....GGg.g^],
DS51 28 ,G,..G.G,.,g..Gg,g,gg,G...GG
DS52 18 .g,GG.GG.GGG,.,g..
DS53 20 G.,.G.GgG,GG.,gG..G.
DS54 27 G$g,G,gGGGg,,G,G.G.gG,gGG...
DS55 25 GGg,G.g,.,g.,G.,..,G.,g..
DS56 24 G,,g.G,g.,,.G.GggG,g,.g.
DS57 42 G,gGg..,gg.g,.g..g.g.,.g.,G,gG.,Ggg,G..G.,
DS58 56 g$,..G,.gGG.,gg,,g.GgGgGgG.G,GGG...G,,,.G,,.g,G,GGgg,.Gg.
DS59 28 T$.g,,g.GG,.G,..G,,.g,G.GggGg
DS5 27 GgG.,G...gGg.GG,gg,.G,.,,G.
DS60 19 ,GgG.,GGg..,ggg.,.G
DS61 60 .g,g.g.,,.G,G,.g,ggg,g.,gg,.gg.,,..,.GG,GGGg..gggGG.gG,...G^].
DS62 19 ,G,GG...g.,G,ggGG,.
DS63 18 .gG,GgG.,gg,G.G.Gg
DS64 44 ,.,Gg..ggg,.g.ggg...ggg...Gg.G.G.G,G,G....g.
DS65 65 ,..G,.,gg.g..gGg..G,g.g..G...G,.GGGgG.g,g.,g,GG....G,gG.G,GG..g.^].
DS66 30 GgGggGGg.G,,,,.G.gg,g.G.,...G.
DS67 27 gg,g.GGg,G.g,G.gGgG.,.G.,,,
DS68 22 GGg...G,G.,G..Gg,G.G.^].
DS69 29 .Gg,gGGg,g,,.,GgGg.gGg,Gg.GGG
DS6 28 ,GGG,,,.,G.gggggG.g,g,,Gg,..
DS70 23 GGgg,g,.,,,g,ggGGGgg,,.
DS71 33 ,.g,g,..,,G.g,gG,g..gggG,gGgG.GGG
DS72 24 Gggg,.g..GgG.,G.G,,,.,.G
DS73 8 ..G,,,,.
DS74 14 ,,Gg.ggg.GggGg
DS7 26 G...G.,,.,.gG,g.,.g.,gg.gg
DS9 23 .,..,G.g...Gg,GG..gG.GG
Sample1 41 .$..,G,ggG,,,,,GgG,GGG,,.gGG,gG..GGgg.....
Sample2 46 .g.ggg,gGGGG,Gg.gGGgG,g,G.,.G,.gG,.,gG.GG.ggG.
Sample3 46 .G.g,ggG.,.,.gg.g.,G,.G.gGGg..GGG,.GgG.,....,^].
Sample4 53 ,$..G.,,g.,,,,,,g.G.g..,,,.,GGgg.G...,GGGg...gG,.Gg.gg
Sample5 47 G$.$,Gggg.gGG,g,gG,,gggg,g.Gg.g,gg.GG,g....G.GgGg
Sample6 41 G,.,,.GG,.G,,g.G,G,.gGgG.G,gg,..GgG,GG.g,

And another one

  • 1:37277423
  • fluctuation + loss because of base quality
In [34]:
#IGV snapshot for 1:37277423; filename= makes IPython always treat the string as a file path
Image(filename='/home/ribli/DT40/SNP/varscan/igv_snapshots/ds14__hits/1-37277423.png')
Out[34]:
In [20]:
#show the VarScan record of hit i, then the pileup of all samples at that site
i=7
record=best_pos_list[i]
print(record)
print('')
#columns 1 and 2 of the record are chrom and position; do not hard-code the chromosome
chrom,pos=record.split('\t')[:2]
run_pileup(chrom,pos)
1	37277423	A	T	16	1	5.88%	A	5	13	72.22%	W	Somatic	1.0	6.410284593773301E-5	3	2	5	8	8	8	1	0

1 37277423 A
DS10 15 ..,.,,t.t,.tTt^],
DS11 30 .,T,..t.,t..,,t,,..,T,TttTT.t^].
DS14 19 t$.t.TtT,ttTtTg,.ttT
DS15 17 ...,,.,,T.,...,,,
DS16 19 ..TT,TT.T.ttTt,.T,t
DS18 18 tT.t,T,T.,,tttttT^]T
DS1 13 TtT,t.t,.tt..
DS26 9 ,$tT,.,t.,
DS27 24 ,Tt,.tTtTTt,,..,,.TT.TT,
DS2 23 ,$tt,...,t.T,t,.T.,T....
DS33 25 ,,.T,,T.ttTT,,t.,tt.tT.t,
DS34 13 ,$t,,T.,..TTT,
DS35 20 t,...,TT.TT.tT..TtT.
DS36 22 Tt,,.t,Tt,.,t,TTT.Tt.t
DS37 18 ,t,t,TT,,t,ttT.TT.
DS3 23 ttTTtt..TT,,Tt.TT.,TTt.
DS41 18 ,TT.tTttt.tt.tT.T,
DS42 28 tt,ttT,,Tt,TttTTtt.T..T,.T,T
DS43 24 Tt,,t,T,.t,,Tt,Ttt..t,Tt
DS44 21 Tt.,.t..T,t.T,T.,..TT
DS45 19 TtT,T.,t..t,.T,T,T^].
DS46 25 .....,TT.,t,.T.T,tT.tTTt,
DS47 30 ,,,..tT,tt.,Tt.tT,,T,t.,tT,TTt
DS48 28 .TT..,,T,Tttt...t.t.,,,,.tTt
DS49 23 T..tt.T,tttTt.,t,.t.T.t
DS4 22 .T.t,..,.t,,.tTT.TT,,t
DS50 23 ,tT,.t,,t,T,,TTttTt..T^]T
DS51 22 ,T,.,,...tTttt,T.tt.T^].
DS52 22 tTT.,tt.T,t.,,...TtTt.
DS53 18 TT,..TtT.T,,,,.T,.
DS54 30 .t.t.,TtT.T,tTT.,,.t,T,tTTt.Tt
DS55 25 T,.,.,..TtTt,,tT,tT.,tTt,
DS56 22 ,,T,T...T.tTT.tTTT,Ttt
DS57 42 .,,,..T,T..Tt,..,.TTTTt,,,T..T,tTTt,t.,.,t
DS58 56 .t,Ttt.Ttt,Tt,TT.,T.T,T.tT,...TttttTT.tt.T.,,.t,t,TT,,.,
DS59 16 tt..,t.,.TttT.T.
DS5 26 t,.,,,TT.,T,,,,.,T.tTtT.TT
DS60 22 T..,,t.t.T,t..tTTT,t.,
DS61 35 .$TT.t.,,.,.T,tt.,t.T.T.t,tt.tT,t,,t
DS62 16 t.T,.T..t,T..,,,
DS63 36 ...T,,,.tt.,,tt,t,tt.,,,t,,T.,TT.TtT
DS64 28 tt....T....,t...t,t.t.,TTt..
DS65 48 t.T,t.TT...T,t.,,tt.,T,tt.Ttt,,tT,tT..TT,Tt,T.tT
DS66 22 tTt...,.t,tT...,.Tt,T^].
DS67 15 TTTt.t,....t,T^]T
DS68 17 TT,.tTTtt,.tT,t,.
DS69 21 ..,Tt,,.,,,Tt..tTTt,^].
DS6 18 ,$,t.tt.,ttT.T,,T.t
DS70 16 ,.tT.Tt,.,,tT.,t
DS71 22 T,..,TT,,,TT,.,TTTTT^]T^]t
DS72 22 .,T.t,tTTTTtt...t.T..T
DS73 15 ,..TT,T.T.Tt,Tt
DS74 14 t$,tttt,,,,,t.t
DS7 18 ttT.,..,t.T..t,t.,
DS9 14 TTttttT,,T,T..
Sample1 38 ,tTT.,.t,...,T..Tt.tTTtT.T.,t,T.tT..,T
Sample2 38 .,T..,T...T..TttT,,tTttT.tt,t.T,.tt.T^]T
Sample3 57 .$TTt,T..t..tTt.T,t,..T.TT..Tttt,TT,tttttttttttt.T.t,t.TT,
Sample4 36 t$..,TTtttTTT,...,,T..T,..T,,t,.T,tTt
Sample5 39 T$t$T.t.Tt.Tt.,T,..tT.ttt,.Tt.T.t..t,Tt.^].
Sample6 26 tTt,,TT,TTt,.TTt,.Ttt.T.,.

And another one

  • 1:52021699
  • Indel alignment problem; a bit strange: why is it so homogeneous across samples? Does local realignment make it homogeneous?
In [35]:
#IGV snapshot for 1:52021699; filename= makes IPython always treat the string as a file path
Image(filename='/home/ribli/DT40/SNP/varscan/igv_snapshots/ds14__hits/1-52021699.png')
Out[35]:
In [21]:
#show the VarScan record of hit i, then the pileup of all samples at that site
i=8
record=best_pos_list[i]
print(record)
print('')
#columns 1 and 2 of the record are chrom and position; do not hard-code the chromosome
chrom,pos=record.split('\t')[:2]
run_pileup(chrom,pos)
1	52021699	T	C	12	1	7.69%	T	2	20	90.91%	C	Somatic	1.0	1.303902128632086E-6	2	0	5	15	4	8	0	1

1 52021699 T
DS10 14 cC,..,...,.,,.
DS11 20 ,.....,.,,....,,.,,,
DS14 22 ccCC.Cc.cCccccccCccccc
DS15 13 c,,,,,.,.,..,
DS16 19 CC..,.,,,.,.,.,,,,.
DS18 20 cc,,..,,..,,,.,,,,,,
DS1 28 Cc,,.c,,.,.,,,,,.,,..,,....^].
DS26 14 c,.,.,,.,,,.,.
DS27 18 Cc,,,,,,,..,.,..,,
DS2 18 CCC.,..,,....,,,.,
DS33 19 cC,,.,.,,,,.,...,C,
DS34 15 CCC,.,,..,,.,,,
DS35 12 ...,..,,,.,.
DS36 8 Ccc,.,.,
DS37 18 c$c,,,,.,..,,,.,,,.
DS3 21 ccC.,,..,,.,.,.,,,,.,
DS41 22 c$,..c...,,,,,,,,..,...
DS42 16 c,,,...,,..,c.,.
DS43 18 ,,,,.,.,..,..,.,..
DS44 26 cc.,....,.,,.,,..,..,..,.^],
DS45 16 .,,..,,.,..,,,,.
DS46 17 c,,,,,,,.,,,,,,,^].
DS47 25 C..,,.,,...,,.,,,.,,,,,..
DS48 16 ...,..,.,,,.,,,,
DS49 11 ...,,.,,.,^].
DS4 24 CC,.,.,..,,.,.,,,,,,,,,^],
DS50 20 C,...,.,,.,.,,,..,,.
DS51 30 CCC..,...,,..,.,.,.,.,.,,,,,^].^].
DS52 18 cCc...,,,,,.,,,...
DS53 14 .,,,.,.,,,,,..
DS54 19 Cc.,,......,,,.,,,,
DS55 16 .,.,,.,,,,,.,,,,
DS56 15 .,,.,,,..,,,,,,
DS57 29 C,.,,....,.,,.,.....,.c...,,,
DS58 44 CCcc,,.,...,,....,..,,,,,,.,.,.,,,,,,,..,,,^].
DS59 20 Cc.,.,,,..,,,.,,,,..
DS5 27 CCCC,,...,..,..,,,..,.,,,..
DS60 14 c.,,,...,....,
DS61 33 ,.C,,,,,,..,.,...,,,.,,,.,.,.,.A,
DS62 13 c,.,,...,....
DS63 16 C..,.,,..,,.,,,,
DS64 22 Cc,,.,.,,.,.,,....,,,,
DS65 39 C$CcC,...,.,.,,.,..,,C,..,,,.,,,,,,,.,.,
DS66 16 c,,..,,,.,,,....
DS67 14 ...,.,,,.,.,.,
DS68 15 c.,,,,,,.,.,,,,
DS69 24 CC.,,,..,,,,,.,..,,,,,,,
DS6 20 cCc.,.,..,,..,.,,.,.
DS70 19 Ccc.,....,,..,,,...
DS71 13 ,..,.,,.,,,,,
DS72 17 CC.,,.c..,....,,,
DS73 22 cc,..,....,,,..,...,.,
DS74 22 ,,,,..,,,,,..,,..,,,.,
DS7 28 CCcc,,,,,.,,,,,,,,.,,,.,.,,,
DS9 14 .,....,,.,,,..
Sample1 36 cCCc,,..,.,,.,...,,...,,..,..,,,,,,.
Sample2 38 cc.,,,,,*,,,,,.,,.,....,...,.,...,.,,.
Sample3 40 C$CCCccCC,.,,..,.,,,,,.,...,,.,,.,,.,,,,^].
Sample4 38 C$Cc..,,,,,.,,,,,.,.,,,,.,,,....,..,,,^],
Sample5 34 C$cCCc,.,.,,.,.,.,..,,c,,,,.,,.,,.,
Sample6 24 Cc..,,.,.,..,..,.,,.,,,.

And another one

  • 1:60425138
  • Simply weird: a SNP substitution, one gone and one appeared
In [36]:
#IGV snapshot for 1:60425138; filename= makes IPython always treat the string as a file path
Image(filename='/home/ribli/DT40/SNP/varscan/igv_snapshots/ds14__hits/1-60425138.png')
Out[36]:
In [22]:
#show the VarScan record of hit i, then the pileup of all samples at that site
i=9
record=best_pos_list[i]
print(record)
print('')
#columns 1 and 2 of the record are chrom and position; do not hard-code the chromosome
chrom,pos=record.split('\t')[:2]
run_pileup(chrom,pos)
1	60425138	A	G	14	3	17.65%	A	3	17	85%	G	Somatic	1.0	5.038430825537257E-5	2	1	7	10	3	11	1	2

1 60425138 A
DS10 15 ,.G..gGgg.,Gg,,
DS11 17 .,g.G,.g.,.G.,..,
DS14 20 ggGg.g,gGgGGGgGggG.g
DS15 17 ,,g.,,G,,g.,,,.,,
DS16 15 G,G..G.,g.gg,gg
DS18 20 ..GG,g,G,gg.,gGG,Gg.
DS1 24 ,g.G,GgG,g..,.G.G.Gg.Gg^]G
DS26 26 ,.GG.GG,GgG,,.,,GGg,.,.,,,
DS27 17 .GgGgG,g,,,g,gg,G
DS2 15 ,$.gG,,,,g,Ggggg
DS33 25 G........,gG,g.,GGgGg,.g,
DS34 16 gG.,,gG.,,.,,.G^]g
DS35 22 G.,,g.g.,,g,.G,G,.G,G.
DS36 26 .G,,G.GGg..G.G,.GGG,G,G,.,
DS37 16 g,GG.G.G..G.GgGg
DS3 20 ,,,g,,gG,.GG..,g.ggg
DS41 22 .$gG,.G,.,,gg..G..,Gg,.
DS42 19 G.g.GGG.,.g..,..G.,
DS43 29 g,g.,,.g,,,gGGG..,g...gGgg.,g
DS44 28 .$,ggG,g,G..,g.,.G.,,.,....g.
DS45 25 .$GGg,.Ggg.,.,Ggg..G.gG.GG
DS46 39 g$,..,gG.GggG..g.,g..G.,,.ggg,GGGG,.,G.g
DS47 39 G,G,Gg,.,..G...,gGgg,g.g,G.g.G..GgG,..g
DS48 21 g,.g,Gg,.,,gG,..GGG,g
DS49 19 ..gg,g,,..,.g.GG.G,
DS4 26 ggG,.gG.Gg..g,,G,.gGG,,,,g
DS50 29 ,g,gGgGgg.,.G.,g,.,G,.G..gg,^]G
DS51 13 g.,g,G.,G,g.G
DS52 16 ,.,gg.GG,G.,,.,G
DS53 19 .,...g..Gg.G,g,.G.G
DS54 24 G$.G,Gggg,gg.GG.,G.g,.,G,
DS55 28 ,g..GGgg..gg,,g.G.gg,GGg.g,G
DS56 22 ..ggg...g...,,,.Gg.g.,
DS57 39 ,g,GG.,g.G,.GgG,gggg..gg,.G,G.G,,.gg.,,
DS58 56 g,.ggG,g,gg..g,,gg.,G,,.GG.,G,,.gG.gg,,.,ggGg.,gG.,.G,g,
DS59 27 .$,$,,,,,G.GG..,g.,,Gg.GG,,g,
DS5 14 g..g.,.GgGGG.G
DS60 22 Gg.GggG,.g,....GGG.,,G
DS61 39 ,$G,,..gg,G,g,,G.,G,.,.g,,g.Gg.Gg.gggGG^].
DS62 24 ..g,G,.ggg..,,G,g,GGG,.^]g
DS63 16 .$,G.ggG.,gg,,Gg^]G
DS64 17 .g,..gg.g,G,..,gG
DS65 49 G,g,gGg,g,G.,.,,.,GgGGg.gGGGGG.,,Ggg.,,,,...G..,G
DS66 33 .,,,,G.gG.,Ggg.,,.G,G,g,,gg,,,.gG
DS67 22 ,GGG.,GGg,,GGGG...GgG,
DS68 17 ,gG,Gg.g.gG,,g.,g
DS69 28 G,gGg.Gg,gg.G.,.G,,,Gg,.g.GG
DS6 21 .$ggg.GGggG,G..g...,,G
DS70 19 ,gg,GG.g,...G.gg.^],^],
DS71 23 ..,Gg,GgGG,,GG,.,GG....
DS72 23 .,gG.,.,G.gg.gGg.G.,,.G
DS73 14 g.g,GGgg,g,GG.
DS74 30 ggGgg,GGggg.GGg.,g.,G,G..gggGg
DS7 30 .g,G.GG,.gGg,G.,,.,.....g.,g..
DS9 19 ,ggg,,gG,g,GgGG,g..
Sample1 41 ,G..gg,G,ggG,.gGggG.g.g,g.G.$g.ggG,.G.G..^].
Sample2 47 g.,g.G.G..gGg,.gg..Ggg,.Gg..GGgg,G.,..,gg.g,Gg^]G
Sample3 49 .G,g..,.gG.gG,g.,G,g.g.g.,g,.g....$.,GGGg,.gG,,.G^],
Sample4 53 gGg.g,gG,g.,.,.,G,gG,,..g..GgG,GGg,Ggg,.g,,GGGGg..,GG
Sample5 40 .,,g,.,Gg,GGgg.GgGG..g,.g,GG.g.Gg.GG.,g,
Sample6 33 G.G,GGG,,gG,,Gg.Gg,..,g,.GGgg,,G.

And another one

  • 1:77729845
  • Indel problem
In [37]:
#IGV snapshot for 1:77729845; filename= makes IPython always treat the string as a file path
Image(filename='/home/ribli/DT40/SNP/varscan/igv_snapshots/ds14__hits/1-77729845.png')
Out[37]:
In [23]:
#show the VarScan record of hit i, then the pileup of all samples at that site
i=10
record=best_pos_list[i]
print(record)
print('')
#columns 1 and 2 of the record are chrom and position; do not hard-code the chromosome
chrom,pos=record.split('\t')[:2]
run_pileup(chrom,pos)
1	77729845	T	C	17	0	0%	T	10	15	60%	Y	Somatic	1.0	3.3127390082272456E-5	6	4	4	11	12	5	0	0

1 77729845 T
DS10 21 .,,,,cCcc,..ccCC,*..^].
DS11 19 ,,c,,Cc,,cc.c,cCCcc
DS14 25 .$.,.cccCc,cCc.cC,,.ccc.cC
DS15 22 ,*..,..*.*.*....,.*.,,
DS16 18 .c.cC,..cCc,C,c.C^],
DS18 18 ,c,C,,,.c.,ccC.ccC
DS1 14 ...c,CCCcc,,C^].
DS26 18 .Cc,c.,,CcC.c..c.C
DS27 21 ,..C,...,.Cc,.,c.,c,C
DS2 27 ,C,cCCc,.....c.,C.,.Cc.c.c.
DS33 27 ,,c,C.,,c,c,.Cc.c,..,CCCcC,
DS34 17 cc,.cC.c.c.,,,c.,
DS35 25 c.,C.,,.,.,..CcCcC,c.,ccC
DS36 13 ,,.c,,...C.CC
DS37 17 ,cc.C,.c,,$C,cc.,,
DS3 18 cc,,,.CCccc.c.,...
DS41 22 ,.c,c,c,,,Cc,.,,,C..cC
DS42 14 .C,,,,.c,c,Cc.
DS43 20 .CC.C.,c,c,C,C,cc,cc
DS44 19 ,,C,C,Cc,,,,.,c...,
DS45 25 ,,C,C..CcCC....c.,c.cCc,.
DS46 29 ..,,c...Cc.,Cc...Cc.,CCcc,c,^].
DS47 38 .,,C,.c...Cc,.c*.,.C.C*.c,,c,,.,...,.,
DS48 19 .,..,,cc.c.C,c,CC,.
DS49 24 .ccCcc.CC,,cCCCCcc,ccCc.
DS4 14 ,C,c.,ccC,c,cC
DS50 26 ,,C,.,,,*Cc,cCcCC..Cc,,,,c
DS51 18 ,c,..C.CC.C...C.,.
DS52 22 Cc.CCcC,,C,C,cC,.Cc,..
DS53 24 ,.CCCC.C,C,.,C,...cc..,c
DS54 28 CC.,..c.ccc.C,C,C,,CCCccc,C,
DS55 33 .,Cc..,,C,c.cC,...c..,c,,,cCCc.,,
DS56 19 ,.,c,.C,c.cCC,,...^].
DS57 37 ,,c..c,c,,,C,,,,c.,c,,...c,c,,cc,Ccc.
DS58 40 C.c,,,.cCC.c,C,...cC.,cC...c.,C.,C,,c,.c
DS59 15 ,.C,C..C,.,.,c,
DS5 23 c,ccc,...,ccC.cCccc,,.C
DS60 10 ,cc,cCc,cC
DS61 32 ..,c.c..,C.,...cCCCcC.,C.c,,,C,c
DS62 21 c,,.c,.ccC....C...,,.
DS63 18 .,.,,c.cc.CCc,.c..
DS64 29 ..,cc.C.,.,.Ccc.,.CC..c.c,.c^]C
DS65 49 .,,,.,CCCCc.,c.,,C...C.,CCC,C.c,CcCcC,,,c,C..,CC,
DS66 27 .cc.cc.C..CcC.C.Ccccc,.CC^],^],
DS67 14 ..,..C.cC.,,,c
DS68 16 c,.c,CCC.c..,,C,
DS69 21 ...,,ccc,c.,.C,cc,.,c
DS6 22 ....,,cc,cC,..,CC..,.^]C
DS70 16 .c,CcccCCCC.C,,^].
DS71 15 .Ccc..,.c,C,.c,
DS72 21 .$.,c...Cc,,...C.C,,,c
DS73 27 ...c,CC,CC..cCc,C,aC,CC,,C.
DS74 22 ,,,,C.C,.cC.C,,.CccCc,
DS7 23 c.c,CC,,...CccCcc.C..,,
DS9 21 ,$,..,c,cc.,c,,CcCC,c.
Sample1 34 ,$,,.cc,C,..c...C.c,.,C.CCC.,,,,C.c
Sample2 53 ,.,,,.c.cc..,c,,CC,,..$,C,c,C.C.,c.C,C.CC.cC.,..,C.,,^]c
Sample3 42 ,$..,,.,CcCC.c,,,cCCcCccc...c,.ccC,.CcC.C.^].
Sample4 44 ,$,,,,..CcCCc.C..,.cccCCccC,,,..,C.c..C,,.CcC
Sample5 34 ,.C,cCC,C.Cc,,cCc,.C,.,,...Cc..,c.
Sample6 33 ,$,cCccCc,c,.C,.,cc,Cc.C.,,c,,C.c.

Conclusions:

Some positions are still mysterious.

Some positions appear only because of fluctuation.

  • That's good news: it is something we can very easily avoid by looking at a robust germline.
  • Different from the high coverage R1!

Still a lot of indel misalignment problems.

All positions could be filtered by looking at all the samples.