def readfasta(filename):
    """Parse a FASTA file into a dict of header line -> sequence text.

    Header lines (those starting with '>') are used as keys exactly as read,
    including the leading '>' and the trailing newline. The value is the
    concatenation of every following line up to the next header, with line
    breaks kept as-is. If the same header line occurs more than once, the
    later record replaces the earlier one.

    Args:
        filename: Path of the FASTA file to read.

    Returns:
        A dict mapping each header line to its sequence text, in file order.

    Raises:
        ValueError: If non-blank content appears before the first header.
        OSError: If the file cannot be opened.
    """
    chunks = {}
    header = None
    # The context manager guarantees the handle is closed even on error.
    with open(filename, 'r') as fa:
        for line in fa:
            if line.startswith('>'):
                header = line
                # Re-assigning resets a repeated header to an empty record.
                chunks[header] = []
            elif header is None:
                # Tolerate leading blank lines, but do not silently drop data.
                if line.strip():
                    raise ValueError(
                        'sequence data found before the first FASTA header '
                        'in %r' % (filename,)
                    )
            else:
                chunks[header].append(line)
    # Join once per record instead of growing a string line by line.
    return {name: ''.join(parts) for name, parts in chunks.items()}
# Extract the longest translated CDS per gene and write the result to
# 'longest.txt' in FASTA layout.
res = readfasta('/PERSONALBIO/work/singlecell/s01/ref/Drosophila/GCF_000001215.4_Release_6_plus_ISO1_MT_translated_cds.faa')

# Group all sequences that share a gene name: gene title -> list of sequences.
uniq = {}
for k, v in res.items():
    # The second space-separated header field is sliced with [6:-1], which
    # drops a 6-character prefix and the last character.
    # NOTE(review): presumably the field looks like "[gene=NAME]" -- confirm
    # against the input file; a header without a space raises IndexError here.
    gene = k.split(' ')[1]
    # The newline is appended so the title can be written directly as a
    # complete header line below.
    title = gene[6:-1] + '\n'
    # setdefault creates the list on first sight of a gene, then appends.
    uniq.setdefault(title, []).append(v)

# For every gene keep only its longest sequence. Length is measured on the
# text as returned by readfasta; on ties max() keeps the first one seen.
max_seq = {}
for k, v in uniq.items():
    seq = max(v, key=len)
    max_seq[k] = seq

# The context manager closes the output file even if a write fails.
with open('longest.txt', "w") as w:
    for k, v in max_seq.items():
        w.write('>' + k)
        w.write(v)
【推荐】国内首个AI IDE,深度理解中文开发场景,立即下载体验Trae
【推荐】编程新体验,更懂你的AI,立即体验豆包MarsCode编程助手
【推荐】抖音旗下AI助手豆包,你的智能百科全书,全免费不限次数
【推荐】轻量又高性能的 SSH 工具 IShell:AI 加持,快人一步
· winform 绘制太阳,地球,月球 运作规律
· 超详细:普通电脑也行Windows部署deepseek R1训练数据并当服务器共享给他人
· 上周热点回顾(3.3-3.9)
· AI 智能体引爆开源社区「GitHub 热点速览」
· 写一个简单的SQL生成工具