morrisalp/html2text.py

## html2text.py
from bs4 import BeautifulSoup as bs

def html2text(html):
    """Convert HTML markup to plain text.

    ``<script>`` and ``<style>`` elements are removed together with their
    contents, every ``<br>`` element is replaced by a newline character, and
    the remaining text nodes are joined with a single space. Leading and
    trailing whitespace is stripped from the result.
    """
    document = bs(html, features='lxml')

    # Script and style bodies are not visible text, so drop them entirely.
    for hidden_tag in document.find_all(["script", "style"]):
        hidden_tag.decompose()

    # Turn explicit line breaks into newline characters in the text output.
    for line_break in document.find_all("br"):
        line_break.replace_with("\n")

    text = document.get_text(separator=' ')
    return text.strip()
	from bs4 import BeautifulSoup as bs

	def html2text(html):
		"""Convert HTML markup to plain text.

		``<script>`` and ``<style>`` elements are removed together with their
		contents, every ``<br>`` element is replaced by a newline character,
		and the remaining text nodes are joined with a single space. Leading
		and trailing whitespace is stripped from the result.
		"""
		soup = bs(html, features='lxml')
		# Script and style bodies are not visible text, so drop them entirely.
		for hidden_tag in soup.find_all(["script", "style"]):
			hidden_tag.decompose()
		# Turn explicit line breaks into newline characters in the text output.
		for br in soup.find_all("br"):
			br.replace_with("\n")
		return soup.get_text(separator=' ').strip()