使用R语言统计plink格式数据的样本缺失率

 

1、R脚本

# Per-sample missing-genotype rate for a PLINK text-format (.ped) file.
#
# Input : "outcome.ped" in the current working directory.
# Output: data frame `result` with one row per sample and the columns
#   id        - sample ID, taken from column 2 of the .ped file
#   misssite  - number of missing sites (missing allele codes / 2)
#   totalsite - total number of sites (allele columns / 2)
#   rate      - misssite / totalsite

# Show the files in the working directory so the input can be located.
dir()

# Read every field as text: type guessing would rewrite sample IDs such as
# "007" to 7 and could turn an all-"T" allele column into logical TRUE.
dat <- read.table("outcome.ped", colClasses = "character")
dat

id <- dat[, 2]

# Drop the six leading non-genotype columns of the standard .ped layout;
# drop = FALSE keeps a data frame even if a single column remains.
dat <- dat[, -(1:6), drop = FALSE]

# Every site occupies two allele columns and "0" is the missing-allele code.
# Counting the "0" cells of each row in one vectorised pass replaces the
# nested loops and the repeated rbind() growth of the result.
n_allele_cols <- ncol(dat)
n_missing_alleles <- rowSums(as.matrix(dat) == "0")

result <- data.frame(
  id = id,
  misssite = n_missing_alleles / 2,
  totalsite = n_allele_cols / 2,
  rate = n_missing_alleles / n_allele_cols
)
result

 

 

2、plink验证

[root@centos79 test]# ls
outcome.map  outcome.ped  result.txt  test.sh
[root@centos79 test]# plink --file outcome --missing --out verify > /dev/null; rm *.log *.nosex
[root@centos79 test]# ls
outcome.map  outcome.ped  result.txt  test.sh  verify.imiss  verify.lmiss
[root@centos79 test]# cat verify.imiss
 FID  IID MISS_PHENO   N_MISS   N_GENO   F_MISS
 DOR    1          Y        4        8      0.5
 DOR    2          Y        4        8      0.5
 DOR    3          Y        3        8    0.375
 DOR    4          Y        2        8     0.25
 DOR    5          Y        1        8    0.125
 DOR    6          Y        1        8    0.125

 

posted @ 2021-10-31 18:16  小鲨鱼2018  阅读(131)  评论(0)  编辑  收藏  举报