diff --git a/recon/core/module.py b/recon/core/module.py index 7222b9bf..ad7f73cc 100644 --- a/recon/core/module.py +++ b/recon/core/module.py @@ -1,5 +1,5 @@ from requests.exceptions import Timeout -import html.parser +import html import http.cookiejar import io import os @@ -92,12 +92,7 @@ def ascii_sanitize(self, s): def html_unescape(self, s): '''Unescapes HTML markup and returns an unescaped string.''' - h = html.parser.HTMLParser() - return h.unescape(s) - #p = htmllib.HTMLParser(None) - #p.save_bgn() - #p.feed(s) - #return p.save_end() + return html.unescape(s) def html_escape(self, s): escapes = { diff --git a/recon/utils/parsers.py b/recon/utils/parsers.py index 33c8900b..4d4b30e9 100644 --- a/recon/utils/parsers.py +++ b/recon/utils/parsers.py @@ -1,5 +1,5 @@ from urllib.parse import urlparse -import html.parser +import html import re def parse_hostname(s): @@ -12,8 +12,7 @@ def parse_emails(s): return re.findall(r'([^\s]+@[^\s]+)', s) def parse_name(s): - h = html.parser.HTMLParser() - elements = [h.unescape(x) for x in s.strip().split()] + elements = [html.unescape(x) for x in s.strip().split()] # remove prefixes and suffixes names = [] for i in range(0,len(elements)):