summary | refs | log | tree | commit | diff
path: root/bs4/builder/_htmlparser.py
diff options
context:
space:
mode:
author: Leonard Richardson <leonardr@segfault.org>, 2018-07-15 08:27:40 -0400
committer: Leonard Richardson <leonardr@segfault.org>, 2018-07-15 08:27:40 -0400
commit: b5ffba33327acaf51a2274f9e0a5305b5fb8bdf9 (patch)
tree: e627743f2434291a3cb12139c4ae45b8088d8592 /bs4/builder/_htmlparser.py
parent: b2836d45288e0de1474ecc555f6e3aac51f3168c (diff)
download: beautifulsoup4-b5ffba33327acaf51a2274f9e0a5305b5fb8bdf9.tar.gz
Stop data loss when encountering an empty numeric entity, and
possibly in other cases. Thanks to tos.kamiya for the fix. [bug=1698503]
Diffstat (limited to 'bs4/builder/_htmlparser.py')
-rw-r--r-- bs4/builder/_htmlparser.py | 1
1 file changed, 1 insertion, 0 deletions
diff --git a/bs4/builder/_htmlparser.py b/bs4/builder/_htmlparser.py
index 71604c5..ef9fd1e 100644
--- a/bs4/builder/_htmlparser.py
+++ b/bs4/builder/_htmlparser.py
@@ -224,6 +224,7 @@ class HTMLParserTreeBuilder(HTMLTreeBuilder):
parser.soup = self.soup
try:
parser.feed(markup)
+ parser.close()
except HTMLParseError, e:
warnings.warn(RuntimeWarning(
"Python's built-in HTMLParser cannot parse the given document. This is not a bug in Beautiful Soup. The best solution is to install an external parser (lxml or html5lib), and use Beautiful Soup with that parser. See http://www.crummy.com/software/BeautifulSoup/bs4/doc/#installing-a-parser for help."))