The code below needs to return HTTP status code 200, but an error occurs for some domains.
import requests

# Target page whose HTTP status code we want to check.
url1 = 'https://www.pontofrio.com.br/'

# Browser-like request headers sent along with the GET request.
headers = {
    'User-Agent': 'Mozilla/5.0 (X11; Linux x86_64) '
                  'AppleWebKit/537.11 (KHTML, like Gecko) '
                  'Chrome/23.0.1271.64 Safari/537.11',
    'Accept': 'text/html,application/xhtml+xml,application/xml;q=0.9,*/*;q=0.8',
    'Accept-Charset': 'ISO-8859-1,utf-8;q=0.7,*;q=0.3',
    'Accept-Encoding': 'none',
    'Accept-Language': 'en-US,en;q=0.8',
    'Connection': 'keep-alive',
}

# The second positional parameter of requests.get() is `params` (the query
# string), not `headers`. Passing the dict positionally appended it to the URL
# and left the request with the library's default headers, so the headers must
# be given by keyword.
# NOTE(review): presumably the server stalls requests that do not look like a
# browser, which would explain the read timeout -- confirm against the site.
response = requests.get(url1, headers=headers, timeout=10)
print(response.status_code)
# Return:
Traceback (most recent call last): File "C:\Python34\lib\site-packages\urllib3\connectionpool.py", line 384, in _make_request six.raise_from(e, None) File "<string>", line 2, in raise_from File "C:\Python34\lib\site-packages\urllib3\connectionpool.py", line 380, in _make_request httplib_response = conn.getresponse() File "C:\Python34\lib\http\client.py", line 1148, in getresponse response.begin() File "C:\Python34\lib\http\client.py", line 352, in begin version, status, reason = self._read_status() File "C:\Python34\lib\http\client.py", line 314, in _read_status line = str(self.fp.readline(_MAXLINE + 1), "iso-8859-1") File "C:\Python34\lib\socket.py", line 371, in readinto return self._sock.recv_into(b) File "C:\Python34\lib\site-packages\urllib3\contrib\pyopenssl.py", line 309, in recv_into return self.recv_into(*args, **kwargs) File "C:\Python34\lib\site-packages\urllib3\contrib\pyopenssl.py", line 307, in recv_into raise timeout('The read operation timed out') socket.timeout: The read operation timed out During handling of the above exception, another exception occurred: Traceback (most recent call last): File "C:\Python34\lib\site-packages\requests\adapters.py", line 449, in send timeout=timeout File "C:\Python34\lib\site-packages\urllib3\connectionpool.py", line 638, in urlopen _stacktrace=sys.exc_info()[2]) File "C:\Python34\lib\site-packages\urllib3\util\retry.py", line 367, in increment raise six.reraise(type(error), error, _stacktrace) File "C:\Python34\lib\site-packages\urllib3\packages\six.py", line 686, in reraise raise value File "C:\Python34\lib\site-packages\urllib3\connectionpool.py", line 600, in urlopen chunked=chunked) File "C:\Python34\lib\site-packages\urllib3\connectionpool.py", line 386, in _make_request self._raise_timeout(err=e, url=url, timeout_value=read_timeout) File "C:\Python34\lib\site-packages\urllib3\connectionpool.py", line 306, in _raise_timeout raise ReadTimeoutError(self, url, "Read timed out. 
(read timeout=%s)" % timeout_value) urllib3.exceptions.ReadTimeoutError: HTTPSConnectionPool(host='www.pontofrio.com.br', port=443): Read timed out. (read timeout=10) During handling of the above exception, another exception occurred: Traceback (most recent call last): File "c:/teste.py", line 219, in <module> url = montaurl(dominio) File "c:/teste.py", line 81, in montaurl response = requests.get(url1, headers, timeout=10) File "C:\Python34\lib\site-packages\requests\api.py", line 75, in get return request('get', url, params=params, **kwargs) File "C:\Python34\lib\site-packages\requests\api.py", line 60, in request return session.request(method=method, url=url, **kwargs) File "C:\Python34\lib\site-packages\requests\sessions.py", line 533, in request resp = self.send(prep, **send_kwargs) File "C:\Python34\lib\site-packages\requests\sessions.py", line 646, in send r = adapter.send(request, **kwargs) File "C:\Python34\lib\site-packages\requests\adapters.py", line 529, in send raise ReadTimeout(e, request=request) requests.exceptions.ReadTimeout: HTTPSConnectionPool(host='www.pontofrio.com.br', port=443): Read timed out. (read timeout=10) Domain that works:
Domains that don't work:
I believe the pontofrio server is blocking the request. How can I get around this?
https://stackoverflow.com/questions/67267765/requests-get-return-error-httpsconnectionpool-python April 26, 2021 at 09:39PM
没有评论:
发表评论