User:Lindenb/Notebook/UMR915/20100705
From OpenWetWare

compute the difference between SLS2 and me
create temporary table user_anonymous.T1
(
id int unsigned primary key auto_increment,
chrom varchar(20) not null,
position int unsigned,
sample_id int unsigned,index(sample_id),
index (chrom),index(position),index(chrom,position)
);
insert into user_anonymous.T1(chrom,position,sample_id)
select distinct
V1.chrom,V1.position,C1.sample_id
from
variation as V1 ,
vcf_call as C1,
vcf_input as I1
where
V1.ref!='*' and
length(V1.alt)=1 and
C1.variation_id=V1.id and
C1.input_id=I1.id and
I1.creator="sls2"
;
create temporary table user_anonymous.T2
(
id int unsigned primary key auto_increment,
chrom varchar(20) not null,
position int unsigned,
sample_id int unsigned,index(sample_id),
index (chrom),index(position),index(chrom,position)
);
insert into user_anonymous.T2(chrom,position,sample_id)
select
V1.chrom,V1.position,C1.sample_id
from
variation as V1 ,
vcf_call as C1,
vcf_input as I1
where
C1.snp_quality>=25 and
C1.depth>4 and
C1.depth<=1200 and
C1.rms_quality >=25 and
V1.ref!='*' and
length(V1.alt)=1 and
C1.variation_id=V1.id and
C1.input_id=I1.id and
I1.creator="lindenb"
;
create temporary table user_anonymous.T3
(
chrom varchar(20) not null,
position int unsigned,
sample_id int unsigned,index(sample_id),
prediction varchar(20),index(prediction),
t1 int,
t2 int,
index (chrom),index(position),index(chrom,position)
);
insert into user_anonymous.T3(chrom,position,sample_id,prediction,t1,t2)
select
V.chrom,
V.position,
C.sample_id,
P.prediction,
user_anonymous.T1.id,
user_anonymous.T2.id
from
(
variation as V,
polyphen as P,
vcf_call as C
)
left join user_anonymous.T1 on (T1.chrom=V.chrom and user_anonymous.T1.position=V.position and C.sample_id=T1.sample_id)
left join user_anonymous.T2 on (T2.chrom=V.chrom and user_anonymous.T2.position=V.position and C.sample_id=T2.sample_id)
where
V.ref!='*' and length(P.alt)=1 and
C.variation_id=V.id and
P.variation_id=V.id and
P.library='HumDiv'
group by 1,2,3,4
;
delete from user_anonymous.T3 where t1 is null and t2 is null;
select * from user_anonymous.T3
limit 200;
select
user_anonymous.T3.prediction as "pph2.HumDiv",
concat("XXX",user_anonymous.T3.sample_id) as "Sample",
COUNT(t1) as "sls2",
COUNT(t2) as "pierre",
COUNT(t1)-COUNT(t2) as "diff(sls2-pierr)"
from
(
user_anonymous.T3
)
group by
user_anonymous.T3.sample_id,
user_anonymous.T3.prediction
order by 1,2
;
compute data found by me but not by sls2
create temporary table user_anonymous.T1 ( id int unsigned primary key auto_increment, chrom varchar(20) not null, position int unsigned, sample_id int unsigned,index(sample_id), index (chrom),index(position),index(chrom,position) ); insert into user_anonymous.T1(chrom,position,sample_id) select distinct V1.chrom,V1.position,C1.sample_id from variation as V1 , vcf_call as C1, vcf_input as I1 where V1.ref!='*' and length(V1.alt)=1 and C1.variation_id=V1.id and C1.input_id=I1.id and I1.creator="sls2" ; select S.name, V1.chrom, V1.position+1, V1.ref, V1.alt from ( variation as V1 , vcf_call as C1, vcf_input as I1, sample as S ) left join user_anonymous.T1 on (T1.chrom=V1.chrom and T1.position=V1.position and S.id=user_anonymous.T1.sample_id) where T1.id is null and C1.sample_id=S.id and C1.snp_quality>=25 and C1.depth>4 and C1.depth<=1200 and C1.rms_quality >=25 and V1.ref!='*' and length(V1.alt)=1 and C1.variation_id=V1.id and C1.input_id=I1.id and I1.creator="MOIMOIMOI" ;