Created
June 8, 2018 19:01
-
-
Save Ricky-Wilson/06cff7e5930072b799c9b6e78c3eda29 to your computer and use it in GitHub Desktop.
get.py created by RickyWilson - https://repl.it/@RickyWilson/getpy
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
import socket | |
import urlparse | |
CONNECTION_TIMEOUT = 5 | |
CHUNK_SIZE = 1024 | |
HTTP_VERSION = 1.0 | |
CRLF = "\r\n\r\n" | |
socket.setdefaulttimeout(CONNECTION_TIMEOUT) | |
def receive_all(sock, chunk_size=CHUNK_SIZE): | |
''' | |
Gather all the data from a request. | |
''' | |
chunks = [] | |
while True: | |
chunk = sock.recv(int(chunk_size)) | |
if chunk: | |
chunks.append(chunk) | |
else: | |
break | |
return repr(''.join(chunks)) | |
def get(url, **kw): | |
kw.setdefault('timeout', CONNECTION_TIMEOUT) | |
kw.setdefault('chunk_size', CHUNK_SIZE) | |
kw.setdefault('http_version', HTTP_VERSION) | |
url = urlparse.urlparse(url) | |
sock = socket.socket(socket.AF_INET, socket.SOCK_STREAM) | |
sock.settimeout(kw.get('timeout')) | |
sock.connect((url.netloc, url.port or 80)) | |
msg = 'GET {0} HTTP/{1} {2}' | |
sock.sendall(msg.format(url.path or '/', kw.get('http_version'), CRLF)) | |
data = receive_all(sock, chunk_size=kw.get('chunk_size')) | |
sock.shutdown(socket.SHUT_RDWR) | |
sock.close() | |
return data | |
print(get('https://www.google.com/', chunk_size=6535)) |
Sign up for free
to join this conversation on GitHub.
Already have an account?
Sign in to comment