Perl FASTA文件拆分合并
1、合并并转化一代测序seq纯文本为fasta格式文件
# Merge every Sanger-sequencing *.seq plain-text file in the current
# directory into one FASTA file, result.fst.  Each input file becomes one
# record whose header line is ">" followed by the input file's name.
use strict;
use warnings;

my $out_name = 'result.fst';

opendir(my $dh, './') or die "can't open the directory! $!";

# The extension is anchored at the end of the name so that entries such as
# "a.seq.bak" or "b.sequence" are not picked up, and only plain files are
# kept.  readdir returns entries in no defined order, so sort them to make
# the record order in the output reproducible.
my @filelist = sort grep { /\.seq\z/ && -f $_ } readdir $dh;
closedir($dh);

open(my $out, '>', $out_name) or die "cannot open $out_name: $!";

foreach my $file (@filelist) {
    open(my $in, '<', $file) or die "cannot open $file: $!";

    print {$out} ">$file\n";

    # Copy line by line, remembering the last line so we can tell whether
    # the input ended with a newline.
    my $last_line;
    while (my $line = <$in>) {
        print {$out} $line;
        $last_line = $line;
    }
    close($in);

    # Without this, a .seq file lacking a trailing newline would glue the
    # next record's ">header" onto the end of this sequence.
    print {$out} "\n" if defined $last_line && $last_line !~ /\n\z/;
}

# Buffered write errors (e.g. disk full) only surface at close.
close($out) or die "cannot close $out_name: $!";
2、合并文件夹下的纯文本文件
# Concatenate all plain files under ./T/ into T.fas and all plain files under
# ./R/ into R.fas.
use strict;
use warnings;

# Return the sorted names of the plain files directly inside $dir.
# "." and "..", as well as any other subdirectory, are skipped because they
# are not plain files.  Dies if the directory cannot be opened.
sub list_plain_files {
    my ($dir) = @_;

    opendir(my $dh, $dir) or die "cannot open this dir $dir: $!";
    # readdir order is undefined; sort so the output is reproducible.
    my @names = sort grep { -f "$dir/$_" } readdir $dh;
    closedir($dh);

    return @names;
}

# Write the contents of every file in @paths, in order, to $out_name.
# Dies if any file cannot be opened or the output cannot be flushed.
sub concatenate_files {
    my ($out_name, @paths) = @_;

    open(my $out, '>', $out_name) or die "cannot open $out_name: $!";

    foreach my $path (@paths) {
        open(my $in, '<', $path) or die "cannot open $path: $!";

        my $last_line;
        while (my $line = <$in>) {
            print {$out} $line;
            $last_line = $line;
        }
        close($in);

        # Keep the first line of the next file from being glued onto the
        # last line of this one when the trailing newline is missing.
        print {$out} "\n" if defined $last_line && $last_line !~ /\n\z/;
    }

    # Buffered write errors only surface at close.
    close($out) or die "cannot close $out_name: $!";
    return;
}

# Each job is [ input directory, output file ].
my @jobs = ( [ 'T', 'T.fas' ], [ 'R', 'R.fas' ] );

# List both directories before writing anything, so a missing directory
# aborts the run before any output file is created or truncated.
my %paths_for;
foreach my $job (@jobs) {
    my ($dir) = @{$job};
    $paths_for{$dir} = [ map { "$dir/$_" } list_plain_files($dir) ];
}

foreach my $job (@jobs) {
    my ($dir, $out_name) = @{$job};
    concatenate_files($out_name, @{ $paths_for{$dir} });
}
3、批量序列拼接
# Build Haplotypes.fas by joining, for each haplotype, one record taken from
# T_a.fas with one record taken from R_a.fas.
use strict;
use warnings;

# Read a whole file and return its lines (line endings kept).
# Dies if the file cannot be opened.
sub read_lines {
    my ($path) = @_;

    open(my $fh, '<', $path) or die "cannot open $path: $!";
    my @lines = <$fh>;
    close($fh);

    return @lines;
}

my @t = read_lines('T_a.fas');
my @r = read_lines('R_a.fas');

open(my $hap_fh, '>', 'Haplotypes.fas')
    or die "cannot open Haplotypes.fas: $!";

# Print the sequence lines of the record whose header ID is $id, taken from
# the FASTA lines in @{$lines}.  Returns true if such a record was found.
sub _print_record {
    my ($lines, $id) = @_;

    my $in_record = 0;
    my $found     = 0;

    foreach my $line (@{$lines}) {
        # \Q...\E keeps the ID literal; the ID must be followed by
        # whitespace or end of line so "T1" does not match "T10".
        if ($line =~ /^>\Q$id\E(?:\s|\z)/) {
            $in_record = 1;
            $found     = 1;
        }
        # Any other header ends the record, whatever its ID starts with.
        elsif ($line =~ /^>/) {
            $in_record = 0;
        }
        elsif ($in_record) {
            print {$hap_fh} $line;
            # A final line without a newline must not swallow what follows.
            print {$hap_fh} "\n" if $line !~ /\n\z/;
        }
    }

    return $found;
}

# Write one haplotype record: header ">$name", then the sequence lines of
# record $t_id from T_a.fas followed by those of record $r_id from R_a.fas.
# Warns when either ID is missing, since the record would be incomplete.
sub combine {
    my ($name, $t_id, $r_id) = @_;

    print {$hap_fh} ">$name\n";

    _print_record(\@t, $t_id)
        or warn "haplotype $name: record $t_id not found in T_a.fas\n";
    _print_record(\@r, $r_id)
        or warn "haplotype $name: record $r_id not found in R_a.fas\n";

    return;
}

# Call the function once per haplotype: [ name, T record ID, R record ID ].
my @haplotypes = (
    [ 'O',  'T7',  'R4'  ],
    [ 'P',  'T1',  'R5'  ],
    [ 'M',  'T1',  'R4'  ],
    [ 'L',  'T5',  'R4'  ],
    [ 'U',  'T1',  'R9'  ],
    [ 'I',  'T1',  'R3'  ],
    [ 'AT', 'T25', 'R5'  ],
    [ 'AS', 'T1',  'R26' ],
    [ 'BF', 'T1',  'R36' ],
    [ 'BG', 'T36', 'R4'  ],
    [ 'BH', 'T1',  'R37' ],
    [ 'BI', 'T37', 'R5'  ],
    [ 'BJ', 'T38', 'R5'  ],
);

foreach my $haplotype (@haplotypes) {
    combine(@{$haplotype});
}

# Buffered write errors only surface at close.
close($hap_fh) or die "cannot close Haplotypes.fas: $!";