GATK后maftools可视化

作者: njmujjc | 来源:发表于2019-01-02 11:22 被阅读0次

    # Drop the first N lines of a VCF and preview the result.
    # `tail -n +K` starts printing AT line K, so skipping N lines needs K = N + 1.
    # N must be set by the caller; abort with a clear message if it is not.
    : "${N:?set N to the number of leading lines to drop}"
    tail -n "+$((N + 1))" Het-158-rawGATK-indel-filter.vcf | head

    # Merge all VCF files into 11.vcf (remember to add the first line back to the
    # merged file afterwards).
    # Remove any 11.vcf left over from an earlier run: it matches *.vcf and would
    # otherwise be trimmed and fed back into the merge.
    rm -f 11.vcf
    # NOTE: sed -i edits the inputs in place; every re-run strips one more line.
    for i in *.vcf; do sed -i '1d' "$i"; done
    # The glob is expanded before the loop starts, so 11.vcf is not picked up here.
    for i in *.vcf; do cat "$i" >> 11.vcf; done

    # Convert each VCF to ANNOVAR input format (<name>.vcf.avinput).
    # The loop is closed with `done` and the file name is quoted so that names
    # containing spaces or glob characters are passed through intact.
    for i in *.vcf; do
        perl /media/pc/disk2/annovar/convert2annovar.pl -format vcf4 "$i" > "$i.avinput"
    done

    # Add the sample name: prefix column 1 with "chr", keep columns 2-5, and append
    # the sample name as a sixth tab-separated column.
    # (Merging the SNP and indel files first saves some work.)
    awk -v OFS="\t" -v sample="Het-158" '{ print "chr" $1, $2, $3, $4, $5, sample }' \
        Het-158-indel.vcf.avinput > Het-158-indel.tsv

    # Concatenate every per-sample TSV into all.tsv.
    # Delete a stale all.tsv first: it matches *.tsv, so a re-run would otherwise
    # append to the old output and duplicate every variant.
    rm -f all.tsv
    # The glob is expanded before the loop starts, so all.tsv is not picked up here.
    for i in *.tsv; do cat "$i" >> all.tsv; done

    # Annotate the merged variants with ANNOVAR (refGene, mm10 build).
    # The input file and the database directory are two separate arguments; the
    # space between them is required.
    perl /media/pc/disk2/annovar/table_annovar.pl all.tsv /media/pc/disk2/annovar/mousedb/ \
        -buildver mm10 -out variants --otherinfo -remove \
        -protocol refGene -operation g -nastring NA

    # Optional: keep only the rows that mention "exonic".
    # Line 1 (the header) is always kept so the filtered table still carries its
    # column names; a plain grep would drop it.
    awk 'NR == 1 || /exonic/' variants.mm10_multianno.txt > exonic.mm10_multianno.txt

    # RStudio: import the ANNOVAR annotation into maftools and plot it.
    # (Console prompts removed so the lines can be pasted and run as-is.)
    library(maftools)

    # Convert the ANNOVAR multianno table to MAF.
    # NOTE(review): tsbCol must match the sample-name column in the multianno
    # header -- confirm that column is actually named "Tumor_Sample_Barcode".
    var_annovar_maf <- annovarToMaf(
      annovar = "variants.mm10_multianno.txt",
      Center = "CSI-NUS",
      refBuild = "mm10",
      tsbCol = "Tumor_Sample_Barcode",
      table = "refGene"
    )

    # Write the MAF table to disk as tab-separated text, then read it back as a
    # MAF object.
    write.table(
      x = var_annovar_maf,
      file = "var_annovar_maf",
      quote = FALSE,
      sep = "\t",
      row.names = FALSE
    )
    var_maf <- read.maf(maf = "var_annovar_maf")

    # Summary plot, then an oncoplot of the top 10 genes.
    plotmafSummary(
      maf = var_maf,
      rmOutlier = TRUE,
      addStat = "median",
      showBarcodes = TRUE
    )
    oncoplot(maf = var_maf, top = 10, fontSize = 12)

    相关文章

      网友评论

        本文标题:GATK后maftools可视化

        本文链接:https://www.haomeiwen.com/subject/uwvrlqtx.html