Linux 中输出参考基因组 GFF 文件第 9 列的注释类别(属性键)

 

001、用 awk 筛选第 3 列为 gene 的行,将第 9 列按 ";" 拆分,再按 "=" 取出每个属性的键,每个键只在首次出现时输出一次

[root@pc1 test3]# ls
GCF_000001405.40_GRCh38.p14_genomic.gff
[root@pc1 test3]# awk '$3 == "gene" {split($9, a, ";"); for(i in a) {split(a[i], b, "="); if(++c[b[1]] == 1) print b[1]}}' GCF_000001405.40_GRCh38.p14_genomic.gff
description
ID
Dbxref
Name
gbkey
gene
gene_biotype
gene_synonym
partial
start_range
end_range

 

posted @ 2022-11-04 18:18  小鲨鱼2018  阅读(93)  评论(0)  编辑  收藏  举报