# Strip regex matches from each item of `content` by replacing them with "".
# NOTE(review): the two statements after the `for` line carry no indentation
# in this copy, so the snippet is not valid Python as written; the loop-body
# indentation was presumably lost -- confirm against the original file.
for i in content:
# NOTE(review): re.compile() is called without a pattern argument, and
# re.compile requires one, so this call raises TypeError as written. The
# pattern was presumably dropped from this copy -- restore it before use.
removeaddr=re.compile() # removing several kinds of noise requires different tags
# NOTE(review): the cleaned string is only rebound to the loop variable `i`;
# nothing visible here writes it back into `content` or uses it afterwards.
i=re.sub(removeaddr,"",i) # replace every match of the pattern with an empty string