User:Lindenb/Notebook/UMR915/20100618
From OpenWetWare

mysql
creating a table for the samples
create table sample(
id int unsigned primary key auto_increment,
name varchar(20) unique,
description text,
created datetime,
modified timestamp
);
SNP calling
filtering on depth( min/max) and Q: minimum RMS mapping quality for SNP
samtools pileup -vcf $(HG18) recal_bwa_rmdup_XXXX1.bam |\ samtools.pl varFilter -d 4 -D 1200 -Q 25 |\ java -jar ~/src/code915/dist/pileupfilter.jar -bed PCCR.bed | wc -l 43209 gunzip -c daily/20100601/for_pierre_010610/vcf_maq_pccr_changed_filters/XXXX1.vcf.gz | wc -l 35784
some filters are missing. OK, now just keep the single nucleotide mutations:
(...) | awk -F " " '{if(length($4)==1) print;}' | wc -l
37121
adding filter for the snp quality:
samtools pileup -vcf $(HG18) recal_bwa_rmdup_XXXX1.bam | samtools.pl varFilter -d 4 -D 1200 -Q 25 |\
java -jar ~/src/code915/dist/pileupfilter.jar -bed PCCR.bed -min-sq 25 |\
awk -F " " '{if(length($4)==1) print;}' > jeter.pileup
wc jeter.pileup
35286
comparison SS2/my data
comm -12: 34187 comm -13: 1569 (uniq to SS2 data) eg: 10:1036884,10:114049332 comm -23: 1099 (uniq to MY data) e.g: 10:101153184,10,101283025
![]() | ![]() |
Comparaison Dindel/samtools
same as yesterday but remove non-PCCR from dindel (update: bug found in my src by SS2)
- count dindel :1492
- count samtools :3739
- uniq dindel :889
- uniq samtools :3136
- comm dindel/samtools :603
script was: sh 20100618.sh
cat ${HOME}/daily/20100604/XXXXX_variantCalls.VCF |\
grep -v "#" | awk -F ' ' '{if(length($5)!=1 && $7==".") print; }' |\
java -jar /home/lindenb/src/code915/dist/posfilter.jar -db XXX_0809_PCCR.bed |\
cut -d ' ' -f 1,2 | sort | uniq > jeter1.txt
cat ${HOME}/daily/20100528/indels_samtools_bwa/PCCR/XXXXXXsamtoolsIndel.vcf |\
grep -v "#" | awk -F ' ' '{if(length($5)!=1) print; }' |\
cut -d ' ' -f 1,2 | sort | uniq > jeter2.txt
echo -n "count dindel :"
wc -l jeter1.txt
echo -n "count samtools :"
wc -l jeter2.txt
echo -n "uniq dindel :"
comm --check-order -23 jeter1.txt jeter2.txt | wc -l
echo -n "uniq samtools :"
comm --check-order -13 jeter1.txt jeter2.txt | wc -l
echo -n "comm dindel/samtools :"
comm --check-order -12 jeter1.txt jeter2.txt | wc -l
rm jeter1.txt jeter2.txt

