This chapter will first show you how to use Python to get information from the APIs that organizations now use to share data, and then highlight the tools that most Python-powered organizations use to support communication within their own infrastructure.
We already discussed Python’s support for pipes and queues across processes in “Multiprocessing”. Communicating between computers requires that the computers at both ends of the conversation use a defined set of protocols—the Internet adheres to the TCP/IP suite.1 You can implement UDP yourself over sockets; Python provides the ssl library for TLS/SSL wrappers over sockets, and asyncio to implement asynchronous transports for TCP, UDP, TLS/SSL, and subprocess pipes.
But most of us will be using the higher-level libraries that provide
clients implementing various application-level protocols:
ftplib, poplib, imaplib, nntplib, smtplib, telnetlib, and xmlrpc.
All of them provide classes for both regular and TLS/SSL wrapped clients
(and urllib exists for HTTP requests, but its documentation recommends the Requests library for most uses).
The first section in this chapter covers HTTP requests—how to get data from public APIs on the Web. Next is a brief aside about serialization in Python, and the third section describes popular tools used in enterprise-level networking. We’ll try to explicitly say when something is only available in Python 3. If you’re using Python 2 and can’t find a module or class we’re talking about, we recommend checking this list of changes between the Python 2 and Python 3 Standard Libraries.
The Hypertext Transfer Protocol (HTTP) is an application protocol for distributed, collaborative, hypermedia information systems and is the foundation of data communication for the World Wide Web. We’re focusing this entire section on how to get data from the Web using the Requests library.
Python’s standard urllib module provides most of the HTTP capabilities you
need, but at a low level, that requires quite a bit of work to perform
seemingly simple tasks (like getting data from an HTTPS server that requires
authentication). The documentation for the urllib.request module
actually says to use the Requests library instead.
Requests takes all of the work out of
Python HTTP requests—making your integration
with web services seamless. There’s no need to manually add query strings to
your URLs, or to form-encode your POST data. Keep-alive (persistent HTTP connections)
and HTTP connection pooling are available through the requests.sessions.Session class,
powered by urllib3,
which is embedded within Requests (meaning you don’t need to install it separately).
Get it using pip:
$ pip install requests
The Requests documentation goes into more detail than what we’ll cover next.
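As a minimal sketch of both conveniences, here the params argument builds the query string for you, and a Session reuses the underlying connection across requests (the spam parameter and the credentials are hypothetical, purely for illustration):

import requests

# Requests builds the query string from a dict—no manual URL encoding
response = requests.get('http://pypi.python.org/pypi/requests/json',
                        params={'spam': 'eggs'})  # hypothetical parameter

# A Session provides keep-alive and connection pooling via the
# embedded urllib3, reusing the TCP connection across requests
with requests.Session() as session:
    session.auth = ('user', 'pass')  # hypothetical credentials
    response = session.get('https://httpbin.org/get')
    print(response.status_code)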
Nearly everybody, from the US Census to the Dutch National Library, has an API that you can use to get the data they want to share; and some, like Twitter and Facebook, allow you (or the apps you use) to also modify that data. You may hear the term RESTful API. REST stands for representational state transfer—it is a paradigm that informed how HTTP 1.1 was designed, but is not a standard, protocol, or requirement. Still, most web service API providers follow the RESTful design principles. We’ll use some code to illustrate common terms:
import requests
result = requests.get('http://pypi.python.org/pypi/requests/json')

The method is part of the HTTP protocol. In a RESTful API, the API designer chooses what action the server will take, and tells you in their API documentation. Here is a list of all of the methods, but the ones commonly available in RESTful APIs are GET, POST, PUT, and DELETE.
Usually, these “HTTP verbs” do what their meaning implies—GET gets data, POST and PUT change or create it, and DELETE deletes it.

The base URI is the root of the API.

The path specifies the particular element the client wants data about.

And there may be an option for different media types.
That code actually performed an HTTP request to http://pypi.python.org/pypi/requests/json, which is the JSON backend for PyPI. If you look at it in your browser, you will see a large JSON string. In Requests, the return value of an HTTP request is a Response object:
>>> import requests
>>> response = requests.get('http://pypi.python.org/pypi/requests/json')
>>> type(response)
<class 'requests.models.Response'>
>>> response.ok
True
>>> response.text  # This gives all of the text of the response
>>> response.json()  # This converts the text response into a dictionary
PyPI gave us the text in JSON format. There isn’t a rule about the format to send data in, but many APIs use JSON or XML.
JavaScript Object Notation (JSON) is exactly what it says—the notation used to define objects in JavaScript. The Requests library has a JSON parser built into its Response object.
The json library can parse JSON from strings or files into a Python dictionary (or list, as appropriate). It can also convert Python dictionaries or lists into JSON strings. For example, the following string contains JSON data:
json_string = '{"first_name": "Guido", "last_name": "van Rossum"}'
It can be parsed like this:
import json
parsed_json = json.loads(json_string)
and can now be used as a normal dictionary:
print(parsed_json['first_name'])
"Guido"
You can also convert the following to JSON:
d = {
    'first_name': 'Guido',
    'last_name': 'van Rossum',
    'titles': ['BDFL', 'Developer'],
}

print(json.dumps(d))
'{"first_name": "Guido", "last_name": "van Rossum", "titles": ["BDFL", "Developer"]}'
There is an XML parser in the Standard Library (the parse() and fromstring() functions in xml.etree.ElementTree),
but this uses the Expat library and
creates an ElementTree object that preserves the structure of the XML, meaning
we have to iterate down it and look into its children to get content.
When all you want is to get the data, try
either untangle or xmltodict. You can get both using pip:
$ pip install untangle
$ pip install xmltodict
untangle takes an XML document and returns a Python object whose structure mirrors the nodes and attributes. For example, an XML file like this:
<?xml version="1.0" encoding="UTF-8"?>
<root>
    <child name="child1"/>
</root>
can be loaded like this:
import untangle
obj = untangle.parse('path/to/file.xml')
and then you can get the child element’s name like this:
obj.root.child['name']  # is 'child1'
xmltodict converts the XML to a dictionary. For example, an XML file like this:
<mydocument has="an attribute">
    <and>
        <many>elements</many>
        <many>more elements</many>
    </and>
    <plus a="complex">element as well</plus>
</mydocument>
can be loaded into an OrderedDict instance (from the collections module in Python’s Standard Library) like this:
import xmltodict

with open('path/to/file.xml') as fd:
    doc = xmltodict.parse(fd.read())
and then you can access elements, attributes, and values like this:
doc['mydocument']['@has']  # is u'an attribute'
doc['mydocument']['and']['many']  # is [u'elements', u'more elements']
doc['mydocument']['plus']['@a']  # is u'complex'
doc['mydocument']['plus']['#text']  # is u'element as well'
With xmltodict, you can also roundtrip the dictionary back to XML with the
unparse() function. It has a streaming mode suitable for handling
files that don’t fit in memory, and it supports namespaces.
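For instance, here is a minimal sketch of both features (the file paths and the handle_record callback are hypothetical; the streaming call assumes the records you care about sit at depth 2 in the tree):

import xmltodict

with open('path/to/file.xml', 'rb') as fd:
    doc = xmltodict.parse(fd.read())

# Round-trip the dictionary back to an XML string
xml_string = xmltodict.unparse(doc)

# Streaming mode: process each record as it is parsed, without
# holding the whole document in memory
def handle_record(path, item):
    print(item)
    return True  # True means "keep streaming"

with open('path/to/big_file.xml', 'rb') as fd:
    xmltodict.parse(fd, item_depth=2, item_callback=handle_record)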
Websites don’t always provide their data in comfortable formats such as CSV or JSON, but HTML is also structured data—this is where web scraping comes in.
Web scraping is the practice of using a program to sift through a web page and gather the data you need, in a format most useful to you, while preserving the structure of the data.
More and more now, as sites offer APIs, they explicitly request you to not scrape their data—the API presents the data they are willing to share, and that’s it. Before getting started, check around the website you’re looking at for a Terms of Use statement, and be a good citizen of the Web.
lxml is a pretty extensive library written for parsing
XML and HTML documents very quickly, even handling some amount of incorrectly formatted markup in the process. Get it using pip:
$ pip install lxml
Use requests.get to retrieve the web page with our data,
parse it using the html module, and save the results in tree:
from lxml import html
import requests

page = requests.get('http://econpy.pythonanywhere.com/ex/001.html')
tree = html.fromstring(page.content)

This is a real web page, and the data we show are real—you can visit the page in your browser.

We use page.content rather than page.text because
html.fromstring() implicitly expects bytes as input.
Now, tree contains the whole HTML file in a nice tree structure that
we can go over in two different ways: XPath
or CSS selectors (via lxml's CSSSelect). They are both standard
ways to specify a path through an HTML tree, defined and maintained
by the World Wide Web Consortium (W3C), and implemented as modules in lxml.
In this example, we will use XPath.
A good introduction is
W3Schools XPath tutorial.
There are also various tools for obtaining the XPath of elements from inside your web browser, such as Firebug for Firefox or the Chrome Inspector. If you’re using Chrome, you can right-click an element, choose “Inspect element”, highlight the code, right-click again and choose “Copy XPath”.
After a quick analysis, we see that in our page the data is contained in
two elements—one is a div with title buyer-name, and the other is a
span with the class item-price:
<div title="buyer-name">Carson Busses</div>
<span class="item-price">$29.95</span>
Knowing this, we can create the correct XPath query and use lxml’s
xpath() method like this:
# This will create a list of buyers:
buyers = tree.xpath('//div[@title="buyer-name"]/text()')
# This will create a list of prices:
prices = tree.xpath('//span[@class="item-price"]/text()')
Let’s see what we got exactly:
>>> print('Buyers: ', buyers)
Buyers:  ['Carson Busses', 'Earl E. Byrd', 'Patty Cakes',
'Derri Anne Connecticut', 'Moe Dess', 'Leda Doggslife', 'Dan Druff',
'Al Fresco', 'Ido Hoe', 'Howie Kisses', 'Len Lease', 'Phil Meup',
'Ira Pent', 'Ben D. Rules', 'Ave Sectomy', 'Gary Shattire',
'Bobbi Soks', 'Sheila Takya', 'Rose Tattoo', 'Moe Tell']
>>>
>>> print('Prices: ', prices)
Prices:  ['$29.95', '$8.37', '$15.26', '$19.25', '$19.25', '$13.99',
'$31.57', '$8.49', '$14.47', '$15.86', '$11.11', '$15.98', '$16.27',
'$7.50', '$50.85', '$14.26', '$5.68', '$15.00', '$114.07', '$10.09']
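If you prefer the CSS selector route mentioned earlier, the equivalent queries look like this—a sketch assuming the cssselect package is installed alongside lxml:

from lxml.cssselect import CSSSelector

# The same two queries, expressed as CSS selectors
sel_buyers = CSSSelector('div[title="buyer-name"]')
buyers = [div.text for div in sel_buyers(tree)]

sel_prices = CSSSelector('span.item-price')
prices = [span.text for span in sel_prices(tree)]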
Data serialization is the concept of converting structured data into a format that allows it to be shared or stored—retaining the information necessary to reconstruct the object in memory at the receiving end of the transmission (or upon read from storage). In some cases, the secondary intent of data serialization is to minimize the size of the serialized data, which then minimizes disk space or bandwidth requirements.
The sections that follow cover the Pickle format, which is specific to Python, some cross-language serialization tools, compression options in Python’s Standard Library, and Python’s buffer protocol, which can reduce the number of times an object is copied before transmission.
The native data serialization module for Python is called Pickle. Here’s an example:
import pickle

# Here's an example dict
grades = {'Alice': 89, 'Bob': 72, 'Charles': 87}

# Use dumps to convert the object to a serialized string
serial_grades = pickle.dumps(grades)

# Use loads to de-serialize an object
received_grades = pickle.loads(serial_grades)
Some things cannot be pickled—lambda functions, nested functions and classes, and ephemeral things like open files and pipes.
According to Python’s Pickle documentation, “The pickle module is not secure against erroneous or maliciously constructed data. Never unpickle data received from an untrusted or unauthenticated source.”
If you’re looking for a serialization module that has support in multiple languages, two popular options are Google’s Protobuf and Apache’s Avro.
Also, Python’s Standard Library includes xdrlib to pack and unpack Sun’s External Data Representation (XDR) format, which is independent of operating system and transport protocol. It’s much lower level than the preceding options and just concatenates packed bytes together, so both the client and server must know the type and order of packing. Here’s an example of what a server receiving data in XDR format could look like:
import socketserver
import xdrlib

class XdrHandler(socketserver.BaseRequestHandler):
    def handle(self):
        data = self.request.recv(4)
        unpacker = xdrlib.Unpacker(data)
        message_size = unpacker.unpack_uint()
        data = self.request.recv(message_size)
        unpacker.reset(data)
        print(unpacker.unpack_string())
        print(unpacker.unpack_float())
        self.request.sendall(b'ok')

server = socketserver.TCPServer(('localhost', 12345), XdrHandler)
server.serve_forever()

The data could be of variable length, so we added a packed unsigned integer (4 bytes) with the message size first.

We had to already know we were receiving an unsigned int.

Read the rest of the message on this line first,…

…and on the next line, reset the unpacker with the new data.

We must know a priori that we’ll receive one string and then one float.
Of course, if both sides were actually Python programs, you’d be using pickle. But if the server were something totally different, this would be the corresponding code for a client sending the data:
import socket
import xdrlib

p = xdrlib.Packer()
p.pack_string(b'Thanks for all the fish!')  # xdrlib packs bytes, not str
p.pack_float(42.00)
xdr_data = p.get_buffer()

message_length = len(xdr_data)
p.reset()
p.pack_uint(message_length)
len_plus_data = p.get_buffer() + xdr_data

with socket.socket() as s:
    s.connect(('localhost', 12345))
    s.sendall(len_plus_data)
    if s.recv(1024):
        print('success')
Python’s Standard Library also contains support for data compression and decompression using the zlib, gzip, bzip2, and lzma algorithms, and for the creation of ZIP- and tar-format archives. To gzip a pickle, for example:
import pickle
import gzip

data = "my very big object"

# To zip and pickle:
with gzip.open('spam.zip', 'wb') as my_zip:
    pickle.dump(data, my_zip)

# And to unzip and unpickle:
with gzip.open('spam.zip', 'rb') as my_zip:
    unpickled_data = pickle.load(my_zip)
Eli Bendersky, one of Python’s core developers, wrote a blog post about reducing the number of in-memory copies Python makes of the same data by using memory buffers. With his technique, you can even read from a file or socket into an existing buffer. For more information, see Python’s buffer protocol documentation and PEP 3118, which suggested enhancements that were implemented in Python 3 and backported to Python 2.6 and above.
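As a minimal sketch of the idea, reading into a preallocated buffer with readinto() avoids creating a new bytes object for every read, and a memoryview slices it without copying ('data.bin' is a hypothetical file):

buf = bytearray(4096)       # preallocate a reusable buffer
view = memoryview(buf)      # zero-copy window onto the buffer

with open('data.bin', 'rb') as f:
    n = f.readinto(buf)     # fill the existing buffer in place

chunk = view[:n]            # slice without copying the underlying bytes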
Distributed computer systems collectively accomplish a task (like game play, or an Internet chat room, or a Hadoop calculation) by passing information to each other. This section first lists our most popular libraries for common networking tasks, and then discusses cryptography, which comes hand in hand with this kind of communication.
In Python, communication for connected networks is usually handled with asynchronous tools or threads, to get around the single-thread limitation of the Global Interpreter Lock. All of the libraries in Table 9-1 solve the same problem—getting around the GIL—in different ways and with varying amounts of additional features.
| Library | License | Reasons to use |
|---|---|---|
| asyncio | PSF license | In the Standard Library as of Python 3.4; provides an event loop plus a formalized implementation of coroutines |
| gevent | MIT license | Lightweight and tightly coupled to libev for high performance; integrates asynchronous I/O and greenlets |
| Twisted | MIT license | Mature, with a loyal community; asynchronous implementations of many protocols built in |
| PyZMQ | LGPL (ZMQ) and BSD (PyZMQ) | Asynchronous sockets with queues and configurable I/O patterns; message queuing without a dedicated broker |
| pika | BSD license | Lightweight, pure-Python AMQP 0-9-1 client for RabbitMQ |
| Celery | BSD license | Featureful AMQP client; task queues over RabbitMQ or Redis, with result tracking and the Flower monitoring tool |
asyncio was introduced in Python 3.4 and includes ideas learned from the developer communities, like those maintaining Twisted and gevent. It’s a concurrency tool, and a frequent application of concurrency is for network servers. Python’s own documentation for asyncore (a predecessor to asyncio) states:
There are only two ways to have a program on a single processor do “more than one thing at a time.” Multi-threaded programming is the simplest and most popular way to do it, but there is another very different technique, that lets you have nearly all the advantages of multi-threading, without actually using multiple threads. It’s really only practical if your program is largely I/O bound. If your program is processor bound, then pre-emptive scheduled threads are probably what you really need. Network servers are rarely processor bound, however.
asyncio is still only in the Python Standard Library on a provisional basis—the API may change in backward-incompatible ways—so don’t get too attached.
Not all of it is new—asyncore (deprecated in Python 3.4) had an event loop,
asynchronous sockets2 and asynchronous file I/O, and asynchat (also
deprecated in Python 3.4) had asynchronous queues.3
The big thing asyncio adds is a formalized implementation of coroutines.
In Python, this is formally defined as both a coroutine function—a function definition beginning
with async def rather than just def (or one that uses the older syntax and is decorated
with @asyncio.coroutine)—and the object obtained by calling a coroutine function (which usually
represents some sort of computation or I/O operation).
The coroutine can yield the processor and thus
be able to participate in an asynchronous event loop, taking turns with
other coroutines.
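To make the idea concrete, here is a minimal sketch using the Python 3.5 async def syntax (the fetch name is hypothetical, and asyncio.sleep stands in for a real I/O wait): two coroutines take turns on one event loop, so both finish in about one second rather than two.

import asyncio

async def fetch(name, delay):
    # Yield control to the event loop while "waiting" on I/O
    await asyncio.sleep(delay)
    return '{} done'.format(name)

loop = asyncio.get_event_loop()
tasks = [fetch('first', 1), fetch('second', 1)]
print(loop.run_until_complete(asyncio.gather(*tasks)))
loop.close()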
The documentation has pages and pages of detailed examples to help the community, as it’s a new concept for the language. It’s clear, thorough, and very much worth checking out. In this interactive session, we just want to show the functions for the event loop and some of the classes available:
>>> import asyncio
>>>
>>> [l for l in asyncio.__all__ if 'loop' in l]
['get_event_loop_policy', 'set_event_loop_policy', 'get_event_loop',
 'set_event_loop', 'new_event_loop']
>>>
>>> [t for t in asyncio.__all__ if t.endswith('Transport')]
['BaseTransport', 'ReadTransport', 'WriteTransport', 'Transport',
 'DatagramTransport', 'SubprocessTransport']
>>>
>>> [p for p in asyncio.__all__ if p.endswith('Protocol')]
['BaseProtocol', 'Protocol', 'DatagramProtocol', 'SubprocessProtocol',
 'StreamReaderProtocol']
>>>
>>> [q for q in asyncio.__all__ if 'Queue' in q]
['Queue', 'PriorityQueue', 'LifoQueue', 'JoinableQueue', 'QueueFull',
 'QueueEmpty']
gevent is a coroutine-based Python networking library that uses greenlets to provide a high-level synchronous API on top of the C library libev event loop. Greenlets are based on the greenlet library—miniature green threads (or user-level threads, as opposed to threads controlled by the kernel) that the developer has the freedom to explicitly suspend, jumping between greenlets. For a great deep dive into gevent, check out Kavya Joshi’s seminar “A Tale of Concurrency Through Creativity in Python.”
People use gevent because it is lightweight and tightly coupled to its underlying
C library, libev, for high performance. If you like the idea of integrating
asynchronous I/O and greenlets, this is the library to use.
Get it using pip:
$ pip install gevent
Here’s an example from the greenlet documentation:
>>> import gevent
>>>
>>> from gevent import socket
>>> urls = ['www.google.com', 'www.example.com', 'www.python.org']
>>> jobs = [gevent.spawn(socket.gethostbyname, url) for url in urls]
>>> gevent.joinall(jobs, timeout=2)
>>> [job.value for job in jobs]
['74.125.79.106', '208.77.188.166', '82.94.164.162']
The documentation offers many more examples.
Twisted is an event-driven networking
engine. It can be used to build applications around many different networking
protocols, including HTTP servers and clients, applications using SMTP, POP3,
IMAP, or SSH protocols, instant messaging,
and much more.
Install it using pip:
$ pip install twisted
Twisted has been around since 2002 and has a loyal community.
It’s like the Emacs of coroutine libraries—with everything
built in—because all of these things have to be asynchronous to work
together.
Probably the most useful tools are an asynchronous
wrapper for database connections (in twisted.enterprise.adbapi),
a DNS server (in twisted.names), direct access to packets (in twisted.pair),
and additional protocols like AMP, GPS, and SOCKSv4 (in twisted.protocols).
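To give a flavor of the event-driven style, here is a minimal TCP echo server in the spirit of Twisted's introductory examples—a sketch, not production code:

from twisted.internet import protocol, reactor

class Echo(protocol.Protocol):
    def dataReceived(self, data):
        # Called by the reactor whenever bytes arrive; echo them back
        self.transport.write(data)

class EchoFactory(protocol.Factory):
    def buildProtocol(self, addr):
        return Echo()

reactor.listenTCP(8000, EchoFactory())  # port 8000 is arbitrary
reactor.run()  # hand control to the event loop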
Most of Twisted now works with Python 3—when you pip install in a Python 3 environment, you’ll get
everything that’s currently been ported. If you find something you want in the
API
that’s not yet in your Python 3 installation of Twisted, you’ll need to stay on Python 2.7.
For more information, consult Jessica McKellar and Abe Fettig’s Twisted (O’Reilly). In addition, this webpage shows over 42 Twisted examples, and this one shows its latest speed benchmarks.
PyZMQ is the Python binding for
ZeroMQ. You can get it using pip:
$ pip install pyzmq
ØMQ (also spelled ZeroMQ, 0MQ, or ZMQ) describes itself as a messaging library designed to have a familiar socket-style API, and aimed at use in scalable distributed or concurrent applications. Basically, it implements asynchronous sockets with queues attached and provides a custom list of socket “types” that determine how the I/O on each socket behaves. Here’s an example:
import zmq

context = zmq.Context()
server = context.socket(zmq.REP)
server.bind('tcp://127.0.0.1:5000')

while True:
    message = server.recv().decode('utf-8')
    print('Client said: {}'.format(message))
    server.send(bytes("I don't know.", 'utf-8'))

# ~~~~~ and in another file ~~~~~

import zmq

context = zmq.Context()
client = context.socket(zmq.REQ)
client.connect('tcp://127.0.0.1:5000')

client.send(bytes("What's for lunch?", 'utf-8'))
response = client.recv().decode('utf-8')
print('Server replied: {}'.format(response))

The socket type zmq.REP corresponds to their “request-response” paradigm.

Like with normal sockets, you bind the server to an IP and port.

The client type is zmq.REQ—that’s all; ZMQ defines a number of these
as constants: zmq.REQ, zmq.REP, zmq.PUB, zmq.SUB, zmq.PUSH, zmq.PULL, and zmq.PAIR.
They determine how the socket sends and receives.

As usual, the client connects to the server’s bound IP and port.
So, these look and quack like sockets, enhanced with queues and various I/O patterns. The point of the patterns is to provide the building blocks for a distributed network. The basic patterns for the socket types are:
zmq.REQ and zmq.REP
connect a set of clients to a set of services. This can be for a
remote procedure call pattern or a task distribution pattern.
zmq.PUB and zmq.SUB
connect a set of publishers to a set of subscribers.
This is a data distribution pattern—one node
is distributing data to other nodes, or this can
be chained to fan out into a distribution tree (a sketch follows this list).
zmq.PUSH and zmq.PULL
connect nodes in a fan-out/fan-in pattern that
can have multiple steps, and loops. This is a parallel
task distribution and collection pattern.
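As an illustration of the publish/subscribe pattern, here is a minimal sketch (the port and the 'weather' topic are arbitrary; PUB/SUB joins are asynchronous, so real code would give subscribers time to connect before publishing):

import zmq

context = zmq.Context()
publisher = context.socket(zmq.PUB)
publisher.bind('tcp://127.0.0.1:5001')
publisher.send(b'weather Partly cloudy')  # topic prefix, then payload

# ~~~~~ and in another file ~~~~~

import zmq

context = zmq.Context()
subscriber = context.socket(zmq.SUB)
subscriber.connect('tcp://127.0.0.1:5001')
subscriber.setsockopt(zmq.SUBSCRIBE, b'weather')  # filter by topic prefix
print(subscriber.recv())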
One great advantage of ZeroMQ over message-oriented middleware is that it can be used for message queuing without a dedicated message broker. PyZMQ’s documentation notes some enhancements they added, like tunneling via SSH. The rest of the documentation for the ZeroMQ API is better on the main ZeroMQ guide.
RabbitMQ is an open source message broker software that implements the Advanced Message Queuing Protocol (AMQP). A message broker is an intermediary program that receives messages from senders and sends them to receivers according to a protocol. Any client that also implements AMQP can communicate with RabbitMQ. To get RabbitMQ, go to the RabbitMQ download page, and follow the instructions for your operating system.
Client libraries that interface with the broker are available for all major programming languages. The top two for Python are pika and Celery—either can be installed with pip:
$ pip install pika
$ pip install celery
pika is a lightweight, pure-Python AMQP 0-9-1 client, preferred by RabbitMQ. RabbitMQ’s introductory tutorials for Python use pika. There’s also an entire page of examples to learn from. We recommend playing with pika when you first set up RabbitMQ, regardless of your final library choice, because it is straightforward without the extra features and so crystallizes the concepts.
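As a taste, here is a minimal producer in the style of RabbitMQ's first Python tutorial—a sketch assuming a broker running on localhost, with the queue name 'hello' chosen arbitrarily:

import pika

# Connect to a RabbitMQ broker assumed to be running locally
connection = pika.BlockingConnection(pika.ConnectionParameters('localhost'))
channel = connection.channel()

channel.queue_declare(queue='hello')  # idempotent—creates the queue if absent
channel.basic_publish(exchange='', routing_key='hello', body='Hello World!')

connection.close()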
Celery is a much more featureful AMQP client—it can use either RabbitMQ or Redis (a distributed in-memory data store) as a message broker, can track the tasks and results (and optionally store them in a user-selected backend), and has a web administration tool/task monitor, Flower. It is popular in the web development community, and there are integration packages for Django, Pyramid, Pylons, web2py, and Tornado (Flask doesn’t need one). Start with the Celery tutorial.
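In the style of that tutorial, a minimal Celery setup looks like this (the module name tasks and the broker URL are assumptions—substitute your own):

# tasks.py
from celery import Celery

app = Celery('tasks', broker='amqp://guest@localhost//')

@app.task
def add(x, y):
    return x + y

After starting a worker (celery -A tasks worker), callers queue work with add.delay(4, 4), and the worker picks it up asynchronously.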
In 2013, the Python Cryptographic Authority (PyCA) was formed. They are a group of developers all interested in providing high-quality cryptography libraries to the Python community.4 They provide tools to encrypt and decrypt messages given the appropriate keys, and cryptographic hash functions to irreversibly but repeatably obfuscate passwords or other secret data.
Except for pyCrypto and the Standard Library’s own modules, all of the libraries in Table 9-2 are maintained by the PyCA. Almost all are built on the C library OpenSSL, except when noted.
| Option | License | Reason to use |
|---|---|---|
| ssl and hashlib | Python Software Foundation license | In the Standard Library: TLS/SSL-wrapped sockets, plus hash and key-derivation functions for passwords and checksums |
| pyOpenSSL | Apache v2.0 license | Built against the newest OpenSSL; the usual choice when building a server |
| PyNaCl | Apache v2.0 license | CFFI bindings for libsodium (see note a), maintained under the PyCA umbrella; bundles libsodium so nothing else needs installing |
| libnacl | Apache license | ctypes-based interface to libsodium (see note a) |
| cryptography | Apache v2.0 license | Low-level cryptographic recipes and primitives; most users should prefer the higher-level pyOpenSSL |
| pyCrypto | Public Domain | For years the de facto cryptography library for Python; you’ll see it in older code |
| bcrypt | Apache v2.0 license (see note b) | Provides the bcrypt password-hashing algorithm; compatible with py-bcrypt |
a. libsodium is a fork of the Networking and Cryptography library (NaCl, pronounced “salt”); its philosophy is to curate specific algorithms that are performant and easy to use.
b. The library actually contains the C source code and builds it on installation using the C Foreign Function Interface (CFFI) we described earlier. bcrypt is based on the Blowfish encryption algorithm.
The following sections provide additional details about the libraries listed in Table 9-2.
The ssl module
in Python’s Standard Library provides a socket API (ssl.SSLSocket)
that behaves like a standard socket, but is wrapped by the SSL protocol,
plus ssl.SSLContext, which contains an SSL connection’s
configuration. The http module (httplib in Python 2) also uses
it for HTTPS support.
If you’re using Python 3.5, you also have
memory BIO support—so the socket writes I/O to a buffer instead of its destination, enabling
things like hooks for hex encoding/decoding before write/upon read.
Major security enhancements happened in Python 3.4—detailed in the release notes—to support newer transport protocols and hash algorithms. These issues were so important that they were backported to Python 2.7 as described in PEP 466 and PEP 476. You can learn all about them in Benjamin Peterson’s talk about the state of ssl in Python.
If you’re using Python 2.7, be sure you have at least 2.7.9, or that your version at least has incorporated PEP 476—so that by default HTTP clients will perform certificate verification when connecting using the https protocol. Or, just always use Requests because that has always been its default.
The Python team recommends using the SSL defaults if you have no special requirements for your security policy for client use. This example showing a secure mail client is from the section within the documentation for the ssl library, “Security considerations,” which you should read if you’re going to use the library:
>>> import ssl, smtplib
>>> smtp = smtplib.SMTP("mail.python.org", port=587)
>>> context = ssl.create_default_context()
>>> smtp.starttls(context=context)
(220, b'2.0.0 Ready to start TLS')
To confirm that a message didn’t get corrupted during transmission,
use the hmac module, which implements the Keyed-Hashing for Message Authentication (HMAC)
algorithm described in
RFC 2104.
It works with a message hashed with any of the algorithms in the set
hashlib.algorithms_available.
For more, see the Python
Module of the Week’s hmac example.
And if it’s available, hmac.compare_digest()
provides a constant-time comparison between digests to help
protect against timing attacks—where the attacker tries to
learn something from how long the digest comparison takes to run.
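Here is a minimal sketch of signing and verifying a message (the key and payload are made up for illustration):

import hashlib
import hmac

secret_key = b'shared-secret'          # hypothetical shared key
message = b'the transmitted payload'   # hypothetical message

# The sender attaches this digest to the message
digest = hmac.new(secret_key, message, hashlib.sha256).hexdigest()

# The receiver recomputes it and compares in constant time
expected = hmac.new(secret_key, message, hashlib.sha256).hexdigest()
print(hmac.compare_digest(digest, expected))  # True if the message is intact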
Python’s hashlib module can be used to generate hashed passwords for secure storage or checksums to confirm data integrity during transmission. The Password-Based Key Derivation Function 2 (PBKDF2), recommended in NIST Special Publication 800-132, is currently considered one of the best options for password hashing. Here’s an example use of the function using a salt5 and 10,000 iterations of the Secure Hash Algorithm 256-bit hash (SHA-256) to generate a hashed password (the choices for different hash algorithms or iterations let the programmer balance robustness with a desired response speed):
import os
import hashlib

def hash_password(password, salt_len=16, iterations=10000, encoding='utf-8'):
    salt = os.urandom(salt_len)
    hashed_password = hashlib.pbkdf2_hmac(
        hash_name='sha256',
        password=bytes(password, encoding),
        salt=salt,
        iterations=iterations)
    return salt, iterations, hashed_password
The secrets library was proposed in PEP 506 and will be available starting with Python 3.6. It provides functions for generating secure tokens, suitable for applications such as password resets and hard-to-guess URLs. Its documentation contains examples and best-practice recommendations to manage a basic level of security.
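A minimal sketch of what that will look like (assuming Python 3.6 or later):

import secrets

# A URL-safe token, e.g., for a password-reset link
token = secrets.token_urlsafe(16)

# Random choices made with the OS's best entropy source
pin = ''.join(secrets.choice('0123456789') for _ in range(6))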
When Cryptography came out, pyOpenSSL updated its bindings to use Cryptography’s CFFI-based bindings for the OpenSSL library and joined the PyCA umbrella. pyOpenSSL is separate from the Python Standard Library on purpose so that it can release updates at the speed of the security community6—it’s built on the newest OpenSSL, and not, like Python is, built on the OpenSSL that comes with your operating system (unless you build it yourself against a newer version). Generally if you’re building a server, you’d want to use pyOpenSSL—see Twisted’s SSL documentation for an example of how they use pyOpenSSL.
Install it using pip:
$ pip install pyOpenSSL
and import it with the name
OpenSSL. This example
shows a couple of the functions available:
>>> import OpenSSL
>>>
>>> OpenSSL.crypto.get_elliptic_curve('Oakley-EC2N-3')
<Curve 'Oakley-EC2N-3'>
>>>
>>> OpenSSL.SSL.Context(OpenSSL.SSL.TLSv1_2_METHOD)
<OpenSSL.SSL.Context object at 0x10d778ef0>
The pyOpenSSL team maintains example code that includes certificate generation, a way to start using SSL over an already-connected socket, and a secure XMLRPC server.
The idea behind libsodium, the C library backend for both PyNaCl and libnacl, is to intentionally not provide users with many choices—just the best one for their situation. It does not support all of the TLS protocol; if you want that, use pyOpenSSL. If all you want is an encrypted connection with some other computer you’re in control of, with your own protocols of your choosing, and you don’t want to deal with OpenSSL, then use this.7
Pronounce PyNaCl as “py-salt” and libnacl as “lib-salt”—they’re both derived from the NaCl (salt) library.
We recommend PyNaCl over
libnacl because it’s
under the PyCA umbrella, and you don’t have to install libsodium separately.
The libraries are virtually the same—PyNaCl uses CFFI bindings
for the C libraries, and libnacl uses ctypes—so it really doesn’t matter that much.
Install PyNaCl using pip:
$ pip install PyNaCl
And follow the PyNaCl examples in its documentation.
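For instance, symmetric encryption with PyNaCl's SecretBox looks like this—a minimal sketch following the pattern in its documentation:

import nacl.secret
import nacl.utils

# A random 32-byte key; store it somewhere safe
key = nacl.utils.random(nacl.secret.SecretBox.KEY_SIZE)
box = nacl.secret.SecretBox(key)

# A random nonce; it must never be reused with the same key
nonce = nacl.utils.random(nacl.secret.SecretBox.NONCE_SIZE)
encrypted = box.encrypt(b'A really secret message.', nonce)
plaintext = box.decrypt(encrypted)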
Cryptography provides cryptographic recipes and primitives. It supports Python 2.6–2.7, Python 3.3+, and PyPy. The PyCA recommends the higher-level interface in pyOpenSSL for most uses.
Cryptography is divided into two layers: recipes and hazardous materials
(hazmat). The recipes layer provides a simple API for proper symmetric
encryption, and the hazmat layer provides low-level cryptographic primitives.
Install it using pip:
$ pip install cryptography
This example uses a high-level symmetric encryption recipe—the only high-level function in this library:
from cryptography.fernet import Fernet

key = Fernet.generate_key()
cipher_suite = Fernet(key)
cipher_text = cipher_suite.encrypt(b"A really secret message.")
plain_text = cipher_suite.decrypt(cipher_text)
PyCrypto
provides secure hash functions and various encryption algorithms. It
supports Python version 2.1+ and Python 3+. Because the
C code is custom, the PyCA was wary of adopting it, but
it was also the de facto cryptography library for Python for years,
so you’ll see it in older code.
Install it using pip:
$ pip install pycrypto
And use it like this:
from Crypto.Cipher import AES

# CBC mode operates on 16-byte blocks, so pad the message to a
# multiple of 16 bytes (a real protocol would use a scheme like PKCS#7)
message = b'A really secret message.'
padded = message + b' ' * (16 - len(message) % 16)

# Encryption
encryption_suite = AES.new(b'This is a key123', AES.MODE_CBC, b'This is an IV456')
cipher_text = encryption_suite.encrypt(padded)

# Decryption: use the same key and initialization vector
decryption_suite = AES.new(b'This is a key123', AES.MODE_CBC, b'This is an IV456')
plain_text = decryption_suite.decrypt(cipher_text)
If you want to use the bcrypt algorithm for your
passwords, use this library. Previous users of
py-bcrypt should find it easy to transition, because it is compatible.
Install it using pip:
$ pip install bcrypt
It only has two functions: bcrypt.hashpw() and bcrypt.gensalt().
The latter lets you choose how many iterations to use—more iterations will make the algorithm slower
(it defaults to a reasonable number).
Here’s an example:
>>> import bcrypt
>>>
>>> password = bytes('password', 'utf-8')
>>> hashed_pw = bcrypt.hashpw(password, bcrypt.gensalt(14))
>>> hashed_pw
b'$2b$14$qAmVOCfEmHeC8Wd5BoF1W.7ny9M7CSZpOR5WPvdKFXDbkkX8rGJ.e'
We store the hashed password somewhere:
>>> import binascii
>>> hexed_hashed_pw = binascii.hexlify(hashed_pw)
>>> store_password(user_id=42, password=hexed_hashed_pw)
and when it’s time to check the password, use the hashed password
as the second argument to bcrypt.hashpw() like this:
>>> hexed_hashed_pw = retrieve_password(user_id=42)
>>> hashed_pw = binascii.unhexlify(hexed_hashed_pw)
>>>
>>> bcrypt.hashpw(password, hashed_pw)
b'$2b$14$qAmVOCfEmHeC8Wd5BoF1W.7ny9M7CSZpOR5WPvdKFXDbkkX8rGJ.e'
>>>
>>> bcrypt.hashpw(password, hashed_pw) == hashed_pw
True
1 The TCP/IP (or Internet Protocol) suite has four conceptual parts: Link layer protocols specify how to get information between a computer and the Internet. Within the computer, they’re the responsibility of network cards and the operating system, not of the Python program. Internet layer protocols (IPv4, IPv6, etc.) govern the delivery of packages of bits from a source to a destination—the standard options are in Python’s socket library. Transport layer protocols (TCP, UDP, etc.) specify how the two endpoints will communicate. The options are also in the socket library. Finally, application layer protocols (FTP, HTTP, etc.) specify what the data should look like to be used by an intended application (e.g., FTP is used for file transfer, and HTTP is used for hypertext transfer)—Python’s Standard Library provides separate modules implementing the most common protocols.
2 A socket is three things: an IP address including port, a transport protocol (like TCP / UDP), and an I/O channel (some sort of file-like object). The Python documentation includes a great intro to sockets.
3 The queue doesn’t require an IP address or protocol, as it’s on the same computer—you just write some data to it and another process can read it. It’s like the multiprocessing.Queue, but here the I/O is done asynchronously.
4 The birth of the cryptography library, and some of the backstory for the motivation behind this new effort, is described in Jake Edge’s blog post “The state of crypto in Python.” The cryptography library it describes is a lower-level library, intended to be imported by higher-level libraries like pyOpenSSL that most of us would use. Edge quotes Jarret Raim and Paul Kehrer’s talk about the State of Crypto in Python, saying their test suite has over 66,000 tests, run 77 times per build.
5 A salt is a random string that further obfuscates the hash; if everyone used the same algorithm, a nefarious actor could generate a lookup table of common passwords and their hashes, and use them to “decode” stolen password files. So, to thwart this, people append a random string (a “salt”) to the password—they just also have to store that random string for future use.
6 Anybody can join the PyCA’s cryptography-dev listserv to keep up with development and other news…and the OpenSSL listserv for OpenSSL news.
7 If you’re paranoid, want to be able to audit 100% of your crypto code, don’t care that it’s a tad slow, and aren’t so interested in having the most current algorithms and defaults, try TweetNaCl, which is a single file crypto library that fits in 100 tweets. Because PyNaCl bundles libsodium in its release, you can probably just drop in TweetNaCl and still run most everything (however, we didn’t try this option).