import time
import urllib.parse
# Browser-like User-Agent string (Firefox 112 on 64-bit Linux).
USER_AGENT = "Mozilla/5.0 (X11; Linux x86_64; rv:109.0) Gecko/20100101 Firefox/112.0"
try:
import autosocks
def grab_html(url):
    """Fetch *url* with a GET request and parse the response body as HTML.

    The request is prepared and sent through the module-level
    ``http_session``. The body is parsed with an lxml ``HTMLParser`` that
    forces UTF-8 decoding and runs in recovery mode (``recover=True``).

    Args:
        url: Address of the page to download.

    Returns:
        The document object produced by ``lxml.html.parse``.
    """
    logging.debug("grab_html(%r)", url)
    request = http_session.prepare_request(requests.Request("GET", url))
    response = http_session.send(request)
    try:
        return lxml.html.parse(
            io.BytesIO(response.content),
            lxml.html.HTMLParser(encoding="utf-8", recover=True),
        )
    finally:
        # Close the response even if reading or parsing the body raises.
        response.close()
def grab_xml(url):
    """Fetch *url* with a GET request and parse the response body as XML.

    The request is prepared and sent through the module-level
    ``http_session``. The body is parsed with an lxml ``XMLParser`` that
    forces UTF-8 decoding and runs in recovery mode (``recover=True``).

    Args:
        url: Address of the XML resource to download.

    Returns:
        The document object produced by ``lxml.etree.parse``.
    """
    logging.debug("grab_xml(%r)", url)
    request = http_session.prepare_request(requests.Request("GET", url))
    response = http_session.send(request)
    try:
        return lxml.etree.parse(
            io.BytesIO(response.content),
            lxml.etree.XMLParser(encoding="utf-8", recover=True),
        )
    finally:
        # Close the response even if reading or parsing the body raises.
        response.close()