安装 barrnap
barrnap:GitHub - tseemann/barrnap: :microscope: Bacterial ribosomal RNA predictor
mamba create -c conda-forge -c bioconda -n Barrnap perl=5 hmmer bedtools=2.27
mamba activate Barrnap
mamba install -c bioconda -c conda-forge barrnap
barrnap --help
使用 barrnap
barrnap --kingdom bac --threads 8 --outseq bac_rRNA.fasta --quiet examples/bacteria.fna > bac_rRNA.gff3
安装 SortMeRNA
SortMeRNA:GitHub - sortmerna/sortmerna:SortMeRNA:下一代序列过滤和比对工具
mkdir sortmerna
cd sortmerna# get the distro
wget https://github.com/biocore/sortmerna/releases/download/v4.3.6/sortmerna-4.3.6-Linux.sh# view the installer usage
bash sortmerna-4.3.6-Linux.sh --helpOptions: [defaults in brackets after descriptions]--help print this message--version print cmake installer version--prefix=dir directory in which to install--include-subdir include the sortmerna-4.3.6-Linux subdirectory--exclude-subdir exclude the sortmerna-4.3.6-Linux subdirectory--skip-license accept license# run the installer
bash sortmerna-4.3.6-Linux.sh --skip-licensesortmerna Installer Version: 4.3.6, Copyright (c) Clarity GenomicsThis is a self-extracting archive.The archive will be extracted to: $HOME/sortmernaUsing target directory: /home/biocodz/sortmernaExtracting, please wait...Unpacking finished successfully# check the installed binaries
ls -lrt bin/
sortmerna# set PATH
vim ~/.bashrc
export PATH=(whole path)/sortmerna/bin/:$PATH
source ~/.bashrc# test the installation
sortmerna --versionSortMeRNA version 4.3.6Build Date: Jul 17 2021sortmerna_build_git_sha:@921fa40256760ea2d44c49b21eb326afda748d5e@sortmerna_build_git_date:@2022/08/16 10:59:31@# view help
sortmerna -h#Please, use database.tar.gz from release 4.3.4.
wget https://github.com/biocore/sortmerna/releases/download/v4.3.4/database.tar.gz
tar -xvzf database.tar.gz # get 4 database
使用 SortMeRNA
sortmerna --ref smr_v4.3_default_db.fasta --reads READS_PATH_1 --reads READS_PATH_2 --threads 180 --workdir dir --paired_out --fastx --out2 --aligned ${num}_aligned --other ${num}_no_rRNA
--aligned
: 比对上参考数据库的序列,以rRNA数据库为参考文件的话,输出的是rRNA。
--other
: 与参考文件比对不上的序列,在这里就是rRNA-free的序列。用法与--aligned
一样
--paired_out
: flag,表明输入的文件是双端测序文件,一端比对不上的话,把成对的reads都输出到non-aligned的文件中。要与--fastx
一起用,与--paired_in
相互排斥。
--paired_in
: flag,表明输入的文件是双端测序文件,一端比对上就算成对的reads都比对上了。要与--fastx
一起用,与--paired_out
相互排斥。
查看out/aligned.log