import sys
import re

# Patterns used by cleancss, compiled once at import time.
_CSS_WHITESPACE_RE = re.compile(r'\s+')
_CSS_SEPARATOR_RE = re.compile(r'\s*(?P<sep>,|:)\s*')
_CSS_SEMICOLON_RE = re.compile(r'\s*;\s*')
_CSS_OPEN_BRACE_RE = re.compile(r'\s*\{\s*')
_CSS_CLOSE_BRACE_RE = re.compile(r'\s*\}\s*')


def cleancss(text):
    """Reformat CSS source text into a one-declaration-per-line layout.

    The transformation is purely textual (regex based, no CSS parsing) and
    is applied in this order:

    1. every run of whitespace is collapsed to a single space;
    2. whitespace around each ``,`` and ``:`` is replaced so the separator
       is followed by exactly one space and preceded by none;
    3. each ``;`` ends its line and the next line starts with one space;
    4. each ``{`` is preceded by one space and followed by a newline plus
       one space;
    5. each ``}`` is placed on its own line and followed by a blank line.

    Because step 2 is applied to every colon, selectors such as
    ``a:hover`` are also rewritten (to ``a: hover``).

    Args:
        text: CSS source as a string.

    Returns:
        The reformatted CSS string. An empty input yields an empty string.
    """
    # Normalise all whitespace first so the later patterns only ever have
    # to deal with single spaces.
    text = _CSS_WHITESPACE_RE.sub(' ', text)
    # The named group keeps whichever separator matched (',' or ':').
    text = _CSS_SEPARATOR_RE.sub(r'\g<sep> ', text)
    text = _CSS_SEMICOLON_RE.sub(';\n ', text)
    text = _CSS_OPEN_BRACE_RE.sub(' {\n ', text)
    # Runs last so the "\n " emitted after the final ';' of a rule is
    # swallowed by the leading \s* and the brace lands at column 0.
    text = _CSS_CLOSE_BRACE_RE.sub('\n}\n\n', text)
    return text