0102病毒基因组1-流程

2.组装

项目对应参考 /share/nas1/yuj/project/virus/ref.fa

nohup perl /share/nas1/yuj/pipline/genome-assembly-seq/virus-genome-seq/v2.0/assembly/virus.assembly.pip.pl -i ass.cfg &

3.注释

1.下载参考
编辑list_ann文件
down- ann

2.提取cds序列
cd ref_ann && python3 /share/nas1/yuj/script/virus/vi_from_gbk_get_cds.py -i gbk/ -o out  -d && cd -

3.blast
blastn -query ref_ann/out/cds/cds_*.fasta -subject *.fsa -outfmt 6 -out blast.txt

4.使用程序解析表格
python3 /share/nas1/yuj/script/virus/virus_parse_blast_table.py -i blast.txt > gene.annotation.info2

5.查看基因排列,根据参考修改注释
count=0 && for i in $(grep 'CDS' gene.annotation.info2 | awk '{print $3 "_:_" $2}'); do count=$((count+1)) &&  echo "" && echo "###############" $count ":"  $(echo "$i" | awk -F "_:_" '{print $1}') "###############" && mt_add.py  -i *.fsa -p $(echo "$i" | awk -F "_:_" '{print $2}') -n 1;done  > sample_ann.log

count=0 && for i in $(grep 'CDS' gene.annotation.info2 | awk '{print $3 "_:_" $2}'); do count=$((count+1)) && echo "" && echo "###############" $count ":" $(echo "$i" | awk -F "_:_" '{print $1}') "###############" && cp_add.py -i *.fsa -p $(echo "$i" | awk -F "_:_" '{print $2}') ;done > sample_ann.log

count=0 && for i in $(grep 'CDS' *.gbk.ann | awk '{print $3 "_:_" $2}'); do count=$((count+1)) && echo "" && echo "###############" $count ":" $(echo "$i" | awk -F "_:_" '{print $1}') "###############" && mt_add.py -i *.fasta -p $(echo "$i" | awk -F "_:_" '{print $2}') -n 1;done > ref_ann.log


6.没有问题的话,生成gene.annotation.info
mt_move_pos.py -i gene.annotation.info2 -o gene.annotation.info
rename gene.annotation.info_tmp gene.annotation.info gene.annotation.info_tmp
1.配置文件 
20210918]$ python3 /share/nas1/yuj/script/chloroplast/get_ann_cfg.py 
# 在项目编号目录下直接运行 或者cp /share/nas6/pub/pipline/genome-assembly-seq/chloroplast-genome-seq/v1.2/cp.anno.config.yaml ann.cfg
# 修改配置文件,写参考

2.
perl /share/nas1/yuj/pipline/genome-assembly-seq/virus-genome-seq/v2.0/annotation/virus_annotation_pip.pl -i ann.cfg -g 1 -c
!!!第一遍流程加-c参数!!!!!!好用来修改gbk
!!!注意gbk中不确定起始位置的  
!!!第二遍还要改tbl文件

4.整理结果

perl /share/nas1/yuj/pipline/genome-assembly-seq/virus-genome-seq/v2.0/html_report/virus_pip_dir.pl -i analysis

5.整理报告

cp /share/nas6/pub/pipline/genome-assembly-seq/mitochondrial-genome-seq/v2.0/html_report/report.cfg ./report.cfg && realpath  report.cfg # 修改

# 标准分析+高级分析 / 标准分析用也行
perl /share/nas1/yuj/pipline/genome-assembly-seq/virus-genome-seq/v2.0/html_report/report2xml.virus.pl  -id complete_dir/ -cfg report.cfg