【转录组05】基因表达定量

2020-12-13  本文已影响0人  呆呱呱

featureCounts

常用参数

image.png
## Define the input and output locations for featureCounts.
# NOTE(review): the original had the following bare relative path on a line of
# its own, where the shell would try to execute it as a command. It is
# presumably the working directory the commands were run from -- confirm:
#   trainee2/Nov10/project/Human_16-Asthma-Trans/Expression

# Gene annotation (GTF) passed to featureCounts via -a.
gtf="/trainee2/Nov10//database/genome/Ensembl/Homo_sapiens/GRCh38_release95/Homo_sapiens.GRCh38.95.gtf.gz"
# Directory holding the *.sorted.bam files to be counted.
inputdir="/trainee2/Nov10/project/Human_16-Asthma-Trans/Mapping/Hisat2"
# Output directory; defined here but not referenced by the commands visible in
# this snippet, which write into the current directory.
outputdir="/trainee2/Nov10/project/Human_16-Asthma-Trans/Expression/featureCount"
image.png
# Count reads per gene over every sorted BAM in $inputdir with featureCounts.
#   -T 5        5 threads
#   -p          paired-end input
#   -t exon     count over "exon" features of the annotation
#   -g gene_id  group features by their gene_id attribute
# The variables are quoted so paths containing spaces survive; the glob is left
# outside the quotes so it still expands to the individual BAM files.
# NOTE(review): per the Subread release notes, from v2.0.2 on -p alone no
# longer counts fragments; --countReadPairs must be added. Check the installed
# version before reusing this command.
featureCounts -T 5 -p -t exon -g gene_id -a "$gtf" -o all.id.txt "$inputdir"/*.sorted.bam

# Quality-control report for the quantification, built from the summary file.
multiqc all.id.txt.summary

# Build the expression matrix: keep column 1 and columns 7 onward.
# NOTE(review): lines without a tab (e.g. a leading "#" header written by
# featureCounts) pass through cut unchanged -- presumably handled downstream;
# verify when loading counts.txt.
cut -f1,7- all.id.txt > counts.txt
image.png

salmon定量——无需比对到参考基因组,直接基于转录本序列(cDNA)得到表达量

image.png
# Build the salmon index from the cDNA FASTA; `time` reports how long it takes.
time salmon index \
  --transcripts Homo_sapiens.GRCh38.cdna.all.fa.gz \
  --index Homo_sapiens.GRCh38.cdna.all.salmon

# Locations used by the salmon commands below.
# index  - salmon index directory
# input  - directory containing the *_val_1 / *_val_2 FASTQ files
# outdir - directory that receives one <sample>.quant folder per sample
index="/teach/database/genome/Ensembl/Homo_sapiens/GRCh38_release95/Homo_sapiens.GRCh38.cdna.all.salmon/"
input="/teach/project/Human-16-Asthma-Trans/data/cleandata/trim_galore"
outdir="/teach/project/Human-16-Asthma-Trans/Expression/salmon"

# Single-sample trial run, to validate the settings before batching.
# The sample ID is held in one variable instead of being repeated in each path,
# and every expansion is quoted so paths with spaces are passed intact.
#   -l A  let salmon infer the library type
#   -p 5  5 threads
sample=SRR1039510
salmon quant -i "$index" -l A \
  -1 "${input}/${sample}_1_val_1.fq.gz" \
  -2 "${input}/${sample}_2_val_2.fq.gz" \
  -p 5 -o "${outdir}/${sample}.quant"

# Generate salmon.sh: one `salmon quant` command line per sample ID, covering
# every paired FASTQ set named in the sample list.
# The list location can be overridden by setting sample_list beforehand.
sample_list=${sample_list:-/teach/project/Human-16-Asthma-Trans/data/rawdata/sra/sampleId.txt}

#######################################
# Print one salmon quant command per sample ID.
# Globals:   index, input, outdir (read)
# Arguments: $1 - text file with one sample ID per line
# Outputs:   the command lines on stdout; diagnostics on stderr
# Returns:   1 if the list cannot be read, 0 otherwise
#######################################
make_salmon_cmds() {
  local list=$1
  local id
  if [[ ! -r "$list" ]]; then
    printf 'cannot read sample list: %s\n' "$list" >&2
    return 1
  fi
  # `|| [[ -n "$id" ]]` keeps the last ID when the file lacks a trailing
  # newline; -r stops read from interpreting backslashes.
  while read -r id || [[ -n "$id" ]]; do
    id=${id%$'\r'}              # tolerate CRLF line endings
    [[ -n "$id" ]] || continue  # a blank line would yield a bogus command
    # %q shell-quotes each path so the generated script stays valid even if a
    # path contains spaces or other special characters.
    printf 'salmon quant -i %q -l A -1 %q -2 %q -p 5 -o %q\n' \
      "$index" \
      "${input}/${id}_1_val_1.fq.gz" \
      "${input}/${id}_2_val_2.fq.gz" \
      "${outdir}/${id}.quant"
  done < "$list"
}

make_salmon_cmds "$sample_list" > salmon.sh


# Launch the generated script in the background, detached from the terminal via
# nohup; stdout and stderr are both collected in salmon.log.
nohup bash salmon.sh >salmon.log 2>&1 &
image.png
上一篇下一篇

猜你喜欢

热点阅读