2 files changed: 4 additions (+4), 10 deletions (-10).
Original file line number | Diff line number | Diff line change
1
1
from requests .exceptions import Timeout
2
- import html . parser
2
+ import html
3
3
import http .cookiejar
4
4
import io
5
5
import os
@@ -92,12 +92,7 @@ def ascii_sanitize(self, s):
92
92
93
93
def html_unescape (self , s ):
94
94
'''Unescapes HTML markup and returns an unescaped string.'''
95
- h = html .parser .HTMLParser ()
96
- return h .unescape (s )
97
- #p = htmllib.HTMLParser(None)
98
- #p.save_bgn()
99
- #p.feed(s)
100
- #return p.save_end()
95
+ return html .unescape (s )
101
96
102
97
def html_escape (self , s ):
103
98
escapes = {
Original file line number Diff line number Diff line change 1
1
from urllib .parse import urlparse
2
- import html . parser
2
+ import html
3
3
import re
4
4
5
5
def parse_hostname (s ):
@@ -12,8 +12,7 @@ def parse_emails(s):
12
12
return re .findall (r'([^\s]+@[^\s]+)' , s )
13
13
14
14
def parse_name (s ):
15
- h = html .parser .HTMLParser ()
16
- elements = [h .unescape (x ) for x in s .strip ().split ()]
15
+ elements = [html .unescape (x ) for x in s .strip ().split ()]
17
16
# remove prefixes and suffixes
18
17
names = []
19
18
for i in range (0 ,len (elements )):
You can’t perform that action at this time.
0 commit comments