@@ -12,11 +12,14 @@ echo "MSA realignment of region" $region
12
12
mkdir -p msa_$region
13
13
14
14
# bcftools norm -m - -c s -f $ref -r $region $vcf > msa_${region}/variants.vcf
15
- bcftools view -r $region -o msa_${region}/variants.vcf.gz -O z $vcf
15
+ bcftools view -r $region $vcf \
16
+ | bcftools +fill-from-fasta /dev/stdin -- -c REF -f $ref \
17
+ | bgzip > msa_${region}/variants.vcf.gz
18
+
16
19
tabix msa_${region}/variants.vcf.gz
17
20
18
21
python $DIR/get_reference.py $ref $region > msa_${region}/haps.fa
19
- for i in $(zgrep -m1 '#CHROM' $vcf | cut -f10-)
22
+ for i in $(bcftools view -h $vcf | grep -m1 '#CHROM' | cut -f10-)
20
23
do
21
24
samtools faidx $ref $region | bcftools consensus -H1 --sample $i $vcf | python $DIR/fa_rename.py ${i}_1 >> msa_${region}/haps.fa
22
25
samtools faidx $ref $region | bcftools consensus -H2 --sample $i $vcf | python $DIR/fa_rename.py ${i}_2 >> msa_${region}/haps.fa
@@ -25,7 +28,7 @@ python $DIR/remove_redundant.py msa_${region}/haps.fa > msa_${region}/haps_nored
25
28
26
29
27
30
# /users/u233287/scratch/misc_software/mafft-linux64/mafft.bat --auto msa_${region}/haps_noredund.txt > msa_${region}/aln_results.txt
28
- /users/u233287/scratch/misc_software/mafft-linux64/mafft.bat --auto msa_${region}/haps.fa > msa_${region}/aln_results.txt
31
+ /users/u233287/scratch/misc_software/mafft-linux64/mafft.bat --retree 2 --maxiterate 0 msa_${region}/haps.fa > msa_${region}/aln_results.txt
29
32
# /users/u233287/scratch/misc_software/mafft-linux64/mafft.bat --globalpair --maxiterate 1000 msa_${region}/haps_noredund.txt > msa_${region}/aln_results.txt
30
33
31
34
# ./ProGraphMSA+TR.sh -o result_${region}.txt -R haps_noredund_${region}.txt
@@ -42,17 +45,18 @@ bash $DIR/mend_report.sh msa_${region}/variants.vcf.gz >> msa_${region}/report.t
42
45
echo "Realigned" >> msa_${region}/report.txt
43
46
bash $DIR/mend_report.sh msa_${region}/result.vcf.gz >> msa_${region}/report.txt
44
47
45
- python $DIR/get_reference.py $ref $region > msa_${region}/haps_final.fa
46
- for i in $(zgrep -m1 '#CHROM' $vcf | cut -f10-)
47
- do
48
- samtools faidx $ref $region \
49
- | bcftools consensus -H1 --sample $i msa_${region}/result.vcf.gz \
50
- | python $DIR/fa_rename.py ${i}_1 >> msa_${region}/haps_final.fa
51
- samtools faidx $ref $region \
52
- | bcftools consensus -H2 --sample $i msa_${region}/result.vcf.gz \
53
- | python $DIR/fa_rename.py ${i}_2 >> msa_${region}/haps_final.fa
54
- done
55
-
56
- echo "md5sums" $(sort msa_${region}/haps.fa | md5sum) $(sort msa_${region}/haps_final.fa | md5sum)
48
+ # Turning off validation checking for now
49
+ # python $DIR/get_reference.py $ref $region > msa_${region}/haps_final.fa
50
+ # for i in $(zgrep -m1 '#CHROM' $vcf | cut -f10-)
51
+ # do
52
+ # samtools faidx $ref $region \
53
+ # | bcftools consensus -H1 --sample $i msa_${region}/result.vcf.gz \
54
+ # | python $DIR/fa_rename.py ${i}_1 >> msa_${region}/haps_final.fa
55
+ # samtools faidx $ref $region \
56
+ # | bcftools consensus -H2 --sample $i msa_${region}/result.vcf.gz \
57
+ # | python $DIR/fa_rename.py ${i}_2 >> msa_${region}/haps_final.fa
58
+ # done
59
+ #
60
+ # echo "md5sums" $(sort msa_${region}/haps.fa | md5sum) $(sort msa_${region}/haps_final.fa | md5sum)
57
61
58
62
0 commit comments