#coding:utf-8 import re def strip_tags(string, allowed_tags=''): if allowed_tags != '': # Get a list of all allowed tag names. allowed_tags = allowed_tags.split(',') allowed_tags_pattern = ['</?'+allowed_tag+'[^>]*>' for allowed_tag in allowed_ta…
去除指定标签 from bs4 import BeautifulSoup #去除属性ul [s.extract() for s in soup("ul")] # 去除属性svg [s.extract() for s in soup("svg")] # 去除属性script [s.extract() for s in soup("script")] 去除注释 from bs4 import BeautifulSoup, Comment #去除注释…