2023-07-20 重测序数据比对

2023-08-05  本文已影响0人  麦冬花儿

全局比对 :同一物种整体评价
局部比对 :不同物种局部评价


# Installing Bowtie1 (http://bowtie-bio.sourceforge.net/index.shtml)
# The download step is kept commented out; when run, it saves the archive
# under ~/software.
#wget https://sourceforge.net/projects/bowtie-bio/files/bowtie/1.3.1/bowtie-1.3.1-linux-x86_64.zip -P ~/software
# Unpack the release archive under /opt/biosoft/.
unzip ~/software/bowtie-1.3.1-linux-x86_64.zip -d /opt/biosoft/
# Append the install directory to PATH for future shells. The single quotes
# keep $PATH literal, so it is expanded when ~/.bashrc is read, not now.
# The directory name carries the full version number (1.3.1), matching the
# archive name used above (presumably the directory the archive unpacks to --
# confirm with `ls /opt/biosoft/`).
echo 'PATH=$PATH:/opt/biosoft/bowtie-1.3.1-linux-x86_64/' >> ~/.bashrc
# Re-read ~/.bashrc so the current shell also gets the new PATH entry.
source ~/.bashrc

# Bowtie 2 setup (http://bowtie-bio.sourceforge.net/bowtie2/index.shtml)
# Download step, left disabled in these notes; it stores the archive in ~/software.
#wget https://sourceforge.net/projects/bowtie-bio/files/bowtie2/2.5.1/bowtie2-2.5.1-linux-x86_64.zip -P ~/software
# Extract the release archive into /opt/biosoft/.
unzip ~/software/bowtie2-2.5.1-linux-x86_64.zip \
  -d /opt/biosoft/
# Persist the PATH extension in ~/.bashrc; '%s' prints the line verbatim, so
# $PATH stays unexpanded until ~/.bashrc is read.
printf '%s\n' 'PATH=$PATH:/opt/biosoft/bowtie2-2.5.1-linux-x86_64/' >> ~/.bashrc
# Reload ~/.bashrc in the current shell.
. ~/.bashrc


# Top-level working directory for the read-alignment exercises.
mkdir -p /home/train/06.reads_aligment
cd /home/train/06.reads_aligment

# Bowtie2 practise: dedicated sub-directory for this aligner.
mkdir -p /home/train/06.reads_aligment/bowtie2
cd /home/train/06.reads_aligment/bowtie2

# Link the inputs into the working directory: the reference assembly under the
# short name genome.fasta, plus every read file matching V?.?.fastq.
ln -s ~/00.incipient_data/data_for_genome_assembling/assemblies_of_Malassezia_sympodialis/Malassezia_sympodialis.genome_V01.fasta genome.fasta
ln -s ~/03.sequencing_data_preprocessing/V?.?.fastq ./

# Build the Bowtie 2 index (basename "genome") with 8 threads.
bowtie2-build --threads 8 genome.fasta genome

# Align the V1 read pair with 8 threads; SAM goes to V1.sam, and stderr
# (the alignment summary) is captured in V1.bowtie2.log. The --rg-id/--rg
# options set the read-group ID, platform (PL) and sample (SM) fields.
bowtie2 --threads 8 -x genome \
  -1 V1.1.fastq -2 V1.2.fastq \
  -S V1.sam \
  --rg-id V1 --rg 'PL:Illumina' --rg 'SM:V1' \
  2> V1.bowtie2.log
# Recorded timing of the V1 run:
#   real  1m26.553s
#   user  11m12.705s
#   sys   0m13.891s

# Same alignment for the V2 read pair.
bowtie2 --threads 8 -x genome \
  -1 V2.1.fastq -2 V2.2.fastq \
  -S V2.sam \
  --rg-id V2 --rg 'PL:Illumina' --rg 'SM:V2' \
  2> V2.bowtie2.log
[train@MiWiFi-R3P-srv bowtie2]$ cat V2.bowtie2.log 
2240991 reads; of these:
  2240991 (100.00%) were paired; of these:
    693164 (30.93%) aligned concordantly 0 times
    1459657 (65.13%) aligned concordantly exactly 1 time
    88170 (3.93%) aligned concordantly >1 times
    693164 pairs aligned concordantly 0 times; of these:
      32957 (4.75%) aligned discordantly 1 time
    660207 pairs aligned 0 times concordantly or discordantly; of these:
      1320414 mates make up the pairs; of these:
        1308702 (99.11%) aligned 0 times
        7570 (0.57%) aligned exactly 1 time
        4142 (0.31%) aligned >1 times
70.80% overall alignment rate # mapping rate 较低是由于线粒体基因组的干扰


# BWA setup (https://sourceforge.net/projects/bio-bwa/files/)
# Download step, left disabled in these notes; it stores the tarball in ~/software/.
#wget https://sourceforge.net/projects/bio-bwa/files/bwa-0.7.17.tar.bz2 -P ~/software/
# Unpack the bzip2-compressed source tarball under /opt/biosoft/.
tar -xjf ~/software/bwa-0.7.17.tar.bz2 -C /opt/biosoft/
# Compile inside the source tree with 4 parallel jobs. The compiler is
# overridden to 'gcc -fcommon' (presumably to avoid multiple-definition link
# errors with newer GCC defaults -- confirm against your GCC version).
cd /opt/biosoft/bwa-0.7.17/
make -j 4 CC='gcc -fcommon'
# Persist the PATH extension in ~/.bashrc ($PATH stays literal), then reload it.
printf '%s\n' 'PATH=$PATH:/opt/biosoft/bwa-0.7.17/' >> ~/.bashrc
. ~/.bashrc
# BWA practise: dedicated working directory for this aligner.
mkdir -p /home/train/06.reads_aligment/bwa
cd /home/train/06.reads_aligment/bwa

# Link the inputs into the working directory: the reference assembly under the
# short name genome.fasta, plus every read file matching V?.?.fastq.
ln -s ~/00.incipient_data/data_for_genome_assembling/assemblies_of_Malassezia_sympodialis/Malassezia_sympodialis.genome_V01.fasta genome.fasta
ln -s ~/03.sequencing_data_preprocessing/V?.?.fastq ./

# Build the BWA index with prefix "genome". The -p option is placed before the
# input FASTA, as in the documented usage `bwa index [-p prefix] <in.fasta>`.
# With the option after the positional argument, platforms whose getopt does
# not permute arguments ignore -p, and the index is not written under the
# "genome" prefix that the alignment commands expect.
bwa index -p genome genome.fasta

# BWA-MEM run on the V1 read pair with 8 threads; -R supplies the @RG header
# line (ID and SM both set to V1). SAM output is redirected to V1.mem.sam.
bwa mem -t 8 \
  -R '@RG\tID:V1\tSM:V1' \
  genome V1.1.fastq V1.2.fastq \
  > V1.mem.sam
# Recorded timing of the mem run:
#   real  0m23.141s
#   user  2m31.3.0s   (NOTE(review): malformed as recorded -- a digit appears to be missing)
#   sys   0m3.354s

# BWA-SW run on the same read pair with 8 threads; output goes to V1.bwasw.sam.
bwa bwasw -t 8 genome \
  V1.1.fastq V1.2.fastq \
  > V1.bwasw.sam
# Recorded timing of the bwasw run:
#   real  2m31.854s
#   user  18m43.008s
#   sys   0m30.774s

# Two-step aln/sampe workflow on the V1 read pair.
# Step 1: run `bwa aln` (8 threads) once per mate file, writing one .sai file each.
for mate in 1 2; do
  bwa aln -t 8 genome "V1.${mate}.fastq" > "V1.${mate}.sai"
done
# Recorded timing of the first aln run (V1.1.fastq):
#   real  0m9.566s
#   user  1m2.180s
#   sys   0m0.321s

# Step 2: combine both .sai files with the original reads into paired-end SAM.
bwa sampe genome \
  V1.1.sai V1.2.sai \
  V1.1.fastq V1.2.fastq \
  > V1.backtrack.sam
# Recorded timing of the sampe run:
#   real  0m24.595s
#   user  0m20.893s
#   sys   0m1.737s
上一篇 下一篇

