"""Print the text of every <p> element in index.html.

Each paragraph is written to standard output on its own line as
``"<text>",`` (double-quoted, trailing comma), encoded as UTF-8, with any
newlines inside the paragraph text replaced by single spaces.
"""
import os
import re
import sys

from bs4 import BeautifulSoup

# Read the document as raw bytes inside a context manager: the handle is
# closed deterministically, and decoding is left to BeautifulSoup instead of
# depending on the platform's default text encoding.
with open('index.html', 'rb') as html_file:
    # Name the parser explicitly so the result does not depend on which
    # optional parser libraries happen to be installed.
    soup = BeautifulSoup(html_file.read(), 'html.parser')

paras = list(soup.find_all('p'))

# The output is explicitly UTF-8 encoded bytes.  On Python 3 bytes must go to
# the binary buffer underneath sys.stdout; on Python 2 sys.stdout accepts
# byte strings directly and has no ``buffer`` attribute.
stdout_bytes = getattr(sys.stdout, 'buffer', sys.stdout)

for p in paras:
    # Concatenate all text fragments of the paragraph and flatten it onto a
    # single line.
    s = ''.join(p.strings)
    s = s.replace('\n', ' ')
    stdout_bytes.write((u'"%s",\n' % s).encode('UTF-8'))