diff --git a/goose/parsers.py b/goose/parsers.py
index 3ccb9e5c..4ce2a8c6 100644
--- a/goose/parsers.py
+++ b/goose/parsers.py
@@ -165,7 +165,7 @@ def getText(self, node):
     @classmethod
     def getFormattedText(self, node):
-        pars = node.cssselect('p')
+        pars = node.cssselect('h1,h2,h3,h4,h5,p')
         for p in pars:
             if p.text is not None:
                 p.text = u'\ufffc ' + p.text
         return Parser.getText(node)