有参转录组实战8-基因功能注释_GO_KEGG_swissprot
data:image/s3,"s3://crabby-images/89f6b/89f6b269f74a0672d70be338211302c3487e1c9b" alt=""
#进行功能注释时,我们只用到蛋白文件,就是上一期提取序列的文件“Ptri.protein.fa”。
#使用命令“grep -c ">" Ptri.protein.fa”统计下“>”的个数,发现有52400个。
#新建文件夹“swissprot”
# Download the Swiss-Prot protein sequences (gzip-compressed FASTA) from UniProt.
wget https://ftp.uniprot.org/pub/databases/uniprot/current_release/knowledgebase/complete/uniprot_sprot.fasta.gz
# Decompress; -c writes to stdout so the original .gz archive is kept.
# NOTE: a space is required before a trailing "#" comment in bash, otherwise
# the comment text becomes part of the preceding argument (here: the file name).
gunzip -c uniprot_sprot.fasta.gz > uniprot_sprot.fasta
# Install DIAMOND.
conda install diamond
# Build the DIAMOND database from the Swiss-Prot FASTA.
diamond makedb --in uniprot_sprot.fasta --db uniprot_sprot.fasta
# Annotate: align the proteins in Ptri.protein.fa against Swiss-Prot in the
# background, keeping one target per query, tabular output (--outfmt 6),
# e-value cutoff 1e-5. stderr goes to its own log so that nohup does not merge
# DIAMOND's progress messages into the tabular result file blastp.out.
nohup diamond blastp -d uniprot_sprot.fasta -q Ptri.protein.fa --max-target-seqs 1 --outfmt 6 --evalue 1e-5 > blastp.out 2> blastp.log &
#查看文件blastp.out,十二列解释看表头
data:image/s3,"s3://crabby-images/ff03f/ff03f89f80330575b6e67a330e891b66906756d0" alt=""
#新建文件夹“pfam”
# Download the Pfam-A HMM library (release 34.0, gzip-compressed).
wget http://ftp.ebi.ac.uk/pub/databases/Pfam/releases/Pfam34.0/Pfam-A.hmm.gz
# Decompress; -c writes to stdout so the original .gz archive is kept.
# NOTE: a space is required before a trailing "#" comment in bash, otherwise
# the comment text becomes part of the preceding argument.
gunzip -c Pfam-A.hmm.gz > Pfam-A.hmm
# Install HMMER.
conda install hmmer
# Build the index files for the HMM library; hmmscan needs them.
hmmpress Pfam-A.hmm
# Annotate: scan the proteins in Ptri.protein.fa against Pfam-A in the
# background and write the per-domain table to pfam.domtblout.
# The HMM database and the sequence file must be on the same command line.
nohup hmmscan --domtblout pfam.domtblout Pfam-A.hmm Ptri.protein.fa &
#查看文件pfam.domtblout
data:image/s3,"s3://crabby-images/26b3f/26b3f7465dbd788727207fe3681ac1859551e06b" alt=""
#Plant TFDB网站预测转录因子http://planttfdb.gao-lab.org/prediction.php
data:image/s3,"s3://crabby-images/424ed/424edff3bf44b2029eb7719092b3ae26c020766d" alt=""
#预测了3835个转录因子。自己下载整理。
data:image/s3,"s3://crabby-images/69bc6/69bc6a89fc19eb186d7c02a09c9d8ab2c5337849" alt=""
#iTAK预测转录因子、调控因子、激酶http://itak.feilab.net/cgi-bin/itak/online_itak.cgi
data:image/s3,"s3://crabby-images/c7c92/c7c927a431113f0af0b3f98c141fec8eb42322f2" alt=""
#接着GO注释和KEGG注释。以下重点参考https://zhuanlan.zhihu.com/p/475588763教程。
#http://eggnog-mapper.embl.de/
data:image/s3,"s3://crabby-images/556dc/556dcf60ee28eda90ea386bc92048019f901759e" alt=""
#打开邮箱
data:image/s3,"s3://crabby-images/26adb/26adb67029b484552bf22f2a1758c70c2d00e7ba" alt=""
#开始工作
data:image/s3,"s3://crabby-images/353d4/353d42ea8d4a62719d03dd74c5d0cb8402409d8d" alt=""
#等约半小时,打开链接下载结果
data:image/s3,"s3://crabby-images/e95a2/e95a24b845c35e4246402259fc20fbb539feddb1" alt=""
#只要这一个
data:image/s3,"s3://crabby-images/3b86f/3b86f643f8c6239da4e9be44a719f85e96844a53" alt=""
#使用TBtools的这个功能
data:image/s3,"s3://crabby-images/20b16/20b16b6992e4f9a4ca59c34186c51972a4d1976c" alt=""
#放入注释文件
data:image/s3,"s3://crabby-images/a1528/a1528fb2ea132432106caee6955ba760eb5a850f" alt=""
#得到几个txt文件,后面的富集会用到。
data:image/s3,"s3://crabby-images/af485/af485834c7deab9a019bd116b3321cc811cb8213" alt=""
#最后自己用excel整理下,可以得到基因的各种注释信息。
data:image/s3,"s3://crabby-images/f5ca7/f5ca7d18ee1d025160dd376ce54ca6832ac16bec" alt=""
#赛博朋克边缘行者