# BodyTextExtraction

A DOM-based heuristic algorithm for extracting the body text from HTML.
Reference: "DOM Based Content Extraction via Text Density"
## Usage
```python
from body_text_extraction import BodyTextExtraction
bte = BodyTextExtraction()
text = bte.extract( html )
```