18. Character counter / 文字数カウンター
• reStructuredText -> HTML -> beautifulsoup4
• https://pypi.python.org/pypi/beautifulsoup4
from bs4 import BeautifulSoup
# Count the characters of an HTML page, ignoring navigation and table-of-contents
# markup.
#
# NOTE(review): `f` is not defined in this snippet; it is presumably a file
# object opened on the generated HTML page -- confirm against the caller.
# The parser is named explicitly so the resulting tree (and thus the count)
# does not depend on which optional parsers happen to be installed.
soup = BeautifulSoup(f.read(), 'html.parser')

# Remove every <div role="navigation"> so navigation text is not counted.
for div in soup.find_all('div', role='navigation'):
    div.decompose()

# Remove every <div class="toctree-wrapper"> (a bare string as the second
# argument of find_all() is matched against the CSS class).
for div in soup.find_all('div', 'toctree-wrapper'):
    div.decompose()

# Number of characters in the text that remains after the removals above.
len(soup.get_text())