Backup all messages on facebook
#! /usr/bin/python
# -*- coding: UTF-8 -*-
import facebook
import urllib2
import codecs
# Ask for the API token interactively, then build the shared Graph client
# that the helper functions below use.
print("You need API token: get one here:")
USER_ACCESS_TOKEN = raw_input("Your API key: ")
graph = facebook.GraphAPI(USER_ACCESS_TOKEN)
def message_query_factory(thread_id, count, page_size=50):
    """Build the paged FQL queries needed to read one whole thread.

    Args:
        thread_id: Value substituted into ``WHERE thread_id=...``.
        count: Number of messages in the thread.
        page_size: Step between successive page offsets. Defaults to 50,
            the value this script has always used.

    Returns:
        A list of query strings, one per page, in ascending offset order.
        The list is empty when ``count`` is zero or negative (the previous
        version raised NameError in that case).
    """
    # The previous version also appended a final "LIMIT <last offset>,<count>"
    # query.  Its range is always contained in the last page generated here,
    # so it only produced duplicate messages and has been dropped.
    #
    # NOTE(review): the second LIMIT argument is still emitted as
    # offset + page_size.  If FQL reads it as a row count rather than an end
    # index, consecutive pages overlap -- confirm against the FQL reference.
    template = ("SELECT author_id, message_id, body, created_time "
                "FROM message WHERE thread_id=%s LIMIT %s,%s")
    return [template % (thread_id, offset, offset + page_size)
            for offset in range(0, count, page_size)]
def fql(query):
    """Run ``query`` through the shared ``graph`` client, retrying on URLError.

    Every ``urllib2.URLError`` prints "restarted" and the query is issued
    again; there is no retry limit, matching the original best-effort
    behaviour.  Any other exception propagates to the caller.

    Returns:
        Whatever ``graph.fql(query)`` returns.
    """
    # A loop rather than self-recursion: a long network outage would
    # otherwise hit the interpreter's recursion limit.
    while True:
        try:
            return graph.fql(query)
        except urllib2.URLError:
            print("restarted")
def get_object(uid):
    """Fetch object ``uid`` via the shared ``graph`` client, retrying on URLError.

    Every ``urllib2.URLError`` prints "restarted" and the request is issued
    again; there is no retry limit, matching the original best-effort
    behaviour.  Any other exception propagates to the caller.

    Returns:
        Whatever ``graph.get_object(uid)`` returns.
    """
    # A loop rather than self-recursion: a long network outage would
    # otherwise hit the interpreter's recursion limit.
    while True:
        try:
            return graph.get_object(uid)
        except urllib2.URLError:
            print("restarted")
# Cache of uid -> username so each profile is fetched at most once per run.
recipients = {}


def recipient(uid):
    """Return the username for ``uid``, fetching and caching it on first use.

    Args:
        uid: Key used for the cache; it is passed to ``get_object`` as
            ``str(uid)``.

    Returns:
        The ``"username"`` field of the fetched object.

    Raises:
        KeyError: if the fetched object has no ``"username"`` field.
    """
    # ``in`` replaces the deprecated dict.has_key().
    if uid not in recipients:
        recipients[uid] = get_object(str(uid))["username"]
    return recipients[uid]
if __name__ == "__main__":
    import os  # local import: only the script entry point needs it

    # Phase 1: list the threads in folder 0 and download every message page.
    threads = fql("SELECT thread_id, recipients, message_count FROM thread WHERE folder_id=0")
    for thread in threads:
        queries = message_query_factory(thread["thread_id"], thread["message_count"])
        thread["messages"] = []
        for n, query in enumerate(queries):
            print("%s/%s: %s" % (n, len(queries), query))
            thread["messages"] += fql(query)

    # Phase 2: write one text log per thread under logs/.
    if not os.path.isdir("logs"):
        os.makedirs("logs")  # opening the log file fails if the directory is missing
    for thread in threads:
        recp = ",".join([recipient(uid) for uid in thread["recipients"]])
        print(recp)
        # Collect the pieces and join once instead of growing a string with +=.
        pieces = [u"", recp]
        for message in thread["messages"]:
            print(message)
            pieces.append(recipient(message["author_id"]) + ": " + message["body"] + "\n")
        # Recipient lists longer than 40 characters are cut to 30 for the file name.
        recp = recp if not len(recp) > 40 else recp[:30]
        # NOTE(review): in this copy the ``with`` line had lost its
        # ``codecs.open(`` call and its body; writing the accumulated text is
        # the presumed intent -- confirm against the original gist.
        with codecs.open("logs/" + recp + ".txt", mode="w", encoding='utf-8') as ffile:
            ffile.write(u"".join(pieces))
#!/usr/bin/env python
# Copyright 2010 Facebook
# Licensed under the Apache License, Version 2.0 (the "License"); you may
# not use this file except in compliance with the License. You may obtain
# a copy of the License at
#
#     http://www.apache.org/licenses/LICENSE-2.0
#
# Unless required by applicable law or agreed to in writing, software
# distributed under the License is distributed on an "AS IS" BASIS, WITHOUT
# WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. See the
# License for the specific language governing permissions and limitations
# under the License.
"""Python client library for the Facebook Platform.

This client library is designed to support the Graph API and the official
Facebook JavaScript SDK, which is the canonical way to implement
Facebook authentication. Read more about the Graph API, and download the
Facebook JavaScript SDK, from the Facebook developer site.

If your application is using Google AppEngine's webapp framework, your
usage of this module might look like this:

    user = facebook.get_user_from_cookie(self.request.cookies, key, secret)
    if user:
        graph = facebook.GraphAPI(user["access_token"])
        profile = graph.get_object("me")
        friends = graph.get_connections("me", "friends")

"""
import cgi
import urllib
import urllib2
import hashlib
import hmac
import base64
import logging
# Find a JSON parser: prefer simplejson, then the copy bundled with Django,
# then the standard library module.
try:
    import simplejson as json
except ImportError:
    try:
        from django.utils import simplejson as json
    except ImportError:
        import json
_parse_json = json.loads

# Find a query string parser: urlparse first, then urllib.parse, and cgi as
# the last resort.
try:
    from urlparse import parse_qs
except ImportError:
    try:
        from urllib.parse import parse_qs
    except ImportError:
        from cgi import parse_qs
class GraphAPI(object):
    """A client for the Facebook Graph API.

    See the Facebook developer documentation for complete documentation
    for the API.

    The Graph API is made up of the objects in Facebook (e.g., people, pages,
    events, photos) and the connections between them (e.g., friends,
    photo tags, and event RSVPs). This client provides access to those
    primitive types in a generic way. For example, given an OAuth access
    token, this will fetch the profile of the active user and the list
    of the user's friends:

        graph = facebook.GraphAPI(access_token)
        user = graph.get_object("me")
        friends = graph.get_connections(user["id"], "friends")

    You can obtain an access token via OAuth or by using the Facebook
    JavaScript SDK.

    If you are using the JavaScript SDK, you can use the
    get_user_from_cookie() method below to get the OAuth access token
    for the active user from the cookie saved by the SDK.
    """

    # NOTE(review): every endpoint literal in this copy of the file was an
    # empty string.  The bases below are the public Graph and legacy REST
    # hosts; confirm them before relying on this client.
    GRAPH_URL = "https://graph.facebook.com/"
    REST_URL = "https://api.facebook.com/method/"

    # Timeout in seconds passed to urllib2.urlopen by request() and fql()
    # (previously the bare literal 3).
    TIMEOUT = 3

    # api_request() reads this attribute, but nothing ever defined it, so the
    # call raised AttributeError.  Set it on an instance to send an api_key.
    api_key = None

    def __init__(self, access_token=None):
        """Store the OAuth access token (may be None for public reads)."""
        self.access_token = access_token

    def _add_access_token(self, args, post_args):
        """Put the access token in the POST body if there is one, else in the query.

        Mutates whichever dict it writes to; does nothing without a token.
        """
        if self.access_token:
            if post_args is not None:
                post_args["access_token"] = self.access_token
            else:
                args["access_token"] = self.access_token

    def get_object(self, id, **args):
        """Fetches the given object from the graph."""
        return self.request(id, args)

    def get_objects(self, ids, **args):
        """Fetches all of the given objects from the graph.

        ``ids`` are joined with commas and sent as the ``ids`` argument of a
        single request to the root path.
        """
        args["ids"] = ",".join(ids)
        return self.request("", args)

    def get_connections(self, id, connection_name, **args):
        """Fetches the connections for the given object."""
        return self.request(id + "/" + connection_name, args)

    def put_object(self, parent_object, connection_name, **data):
        """Writes the given object to the graph, connected to the given parent.

        For example,

            graph.put_object("me", "feed", message="Hello, world")

        writes "Hello, world" to the active user's wall. Likewise, this
        will comment on the first post of the active user's feed:

            feed = graph.get_connections("me", "feed")
            post = feed["data"][0]
            graph.put_object(post["id"], "comments", message="First!")

        Certain write operations require extended permissions. For example,
        publishing to a user's feed requires the "publish_actions" permission.

        Raises:
            AssertionError: if no access token is set.
        """
        # Raised explicitly (same exception type as the old ``assert``) so the
        # check is not stripped when Python runs with -O.
        if not self.access_token:
            raise AssertionError("Write operations require an access token")
        return self.request(parent_object + "/" + connection_name,
                            post_args=data)

    def put_wall_post(self, message, attachment=None, profile_id="me"):
        """Writes a wall post to the given profile's wall.

        We default to writing to the authenticated user's wall if no
        profile_id is specified.

        attachment adds a structured attachment to the status message being
        posted to the Wall. It should be a dictionary of the form:

            {"name": "Link name",
             "link": "",
             "caption": "{*actor*} posted a new review",
             "description": "This is a longer description of the attachment",
             "picture": ""}
        """
        # None instead of a shared mutable {} default; behaviour is the same.
        return self.put_object(profile_id, "feed", message=message,
                               **(attachment or {}))

    def put_comment(self, object_id, message):
        """Writes the given comment on the given post."""
        return self.put_object(object_id, "comments", message=message)

    def put_like(self, object_id):
        """Likes the given post."""
        return self.put_object(object_id, "likes")

    def delete_object(self, id):
        """Deletes the object with the given ID from the graph."""
        self.request(id, post_args={"method": "delete"})

    def put_photo(self, image, message=None, album_id=None, **kwargs):
        """Uploads an image using multipart/form-data.

        image=File like object for the image
        message=Caption for your image
        album_id=None posts to /me/photos which uses or creates and uses
        an album for your application.

        Extra keyword arguments are sent as additional form fields.

        Returns the parsed JSON response, or the raw response body when it
        is not valid JSON.  Raises GraphAPIError when the parsed response is
        a dict with a truthy "error" entry.
        """
        object_id = album_id or "me"
        # it would have been nice to reuse self.request;
        # but multipart is messy in urllib
        post_args = {
            'access_token': self.access_token,
            'source': image,
            'message': message,
        }
        # NOTE(review): **kwargs was accepted but unused in this copy; merging
        # it into the form fields is the presumed intent.
        post_args.update(kwargs)
        content_type, body = self._encode_multipart_form(post_args)
        req = urllib2.Request(self.GRAPH_URL + "%s/photos" % object_id,
                              data=body)
        req.add_header('Content-Type', content_type)
        try:
            data = urllib2.urlopen(req).read()
        except urllib2.HTTPError as e:
            # Facebook sends OAuth errors as 400, and urllib2 throws an
            # exception; read the body so a GraphAPIError can be raised below.
            data = e.read()
        try:
            response = _parse_json(data)
        except ValueError:
            return data
        # Raise an error if we got one, but not if Facebook just gave us a
        # Bool value.
        if response and isinstance(response, dict) and response.get("error"):
            raise GraphAPIError(response)
        return response

    def _encode_multipart_form(self, fields):
        """Encode ``fields`` as a multipart/form-data body.

        Fields are a dict of form name -> value.
        For files, value should be a file object.
        Other file-like objects might work and a fake name will be chosen.
        Fields with a falsy value are skipped.

        Return (content_type, body) ready for httplib.HTTP instance.
        """
        BOUNDARY = '----------ThIs_Is_tHe_bouNdaRY_$'
        CRLF = '\r\n'
        L = []
        for (key, value) in fields.items():
            logging.debug("Encoding %s, (%s)%s" % (key, type(value), value))
            if not value:
                continue
            L.append('--' + BOUNDARY)
            if hasattr(value, 'read') and callable(value.read):
                filename = getattr(value, 'name', '%s.jpg' % key)
                L.append(('Content-Disposition: form-data;'
                          'name="%s";'
                          'filename="%s"') % (key, filename))
                L.append('Content-Type: image/jpeg')
                value = value.read()
            else:
                L.append('Content-Disposition: form-data; name="%s"' % key)
            L.append('')  # blank line separating part headers from content
            if isinstance(value, unicode):
                logging.debug("Convert to ascii")
                value = value.encode('ascii')
            L.append(value)
        L.append('--' + BOUNDARY + '--')
        L.append('')
        body = CRLF.join(L)
        content_type = 'multipart/form-data; boundary=%s' % BOUNDARY
        return content_type, body

    def request(self, path, args=None, post_args=None, raw_url=False):
        """Fetches the given path in the Graph API.

        We translate args to a valid query string. If post_args is given,
        we send a POST request to the given path with the given arguments.
        If raw_url is true, ``path`` is opened as a complete URL as-is.

        Returns the parsed JSON for text responses, or a dict with "data",
        "mime-type" and "url" for image responses.

        Raises:
            GraphAPIError: on an HTTP error, an unsupported content type, or
                a response dict with a truthy "error" entry.
        """
        args = args or {}
        self._add_access_token(args, post_args)
        post_data = None if post_args is None else urllib.urlencode(post_args)
        try:
            if raw_url:
                file = urllib2.urlopen(path)
            else:
                file = urllib2.urlopen(
                    self.GRAPH_URL + path + "?" + urllib.urlencode(args),
                    post_data, self.TIMEOUT)
        except urllib2.HTTPError as e:
            response = _parse_json(e.read())
            raise GraphAPIError(response)
        try:
            fileInfo = file.info()
            if fileInfo.maintype == 'text':
                response = _parse_json(file.read())
            elif fileInfo.maintype == 'image':
                mimetype = fileInfo['content-type']
                response = {
                    "data": file.read(),
                    "mime-type": mimetype,
                    "url": file.url,
                }
            else:
                raise GraphAPIError('Maintype was not text or image')
        finally:
            file.close()
        if response and isinstance(response, dict) and response.get("error"):
            # GraphAPIError takes the whole payload; the old two-argument
            # call (type, message) raised TypeError instead.
            raise GraphAPIError(response)
        return response

    def api_request(self, path, args=None, post_args=None):
        """Fetches the given path in the legacy REST API.

        We translate args to a valid query string. If post_args is given,
        we send a POST request to the given path with the given arguments.
        The access token, the api_key (when set) and format=json-strings are
        added to the POST body if there is one, otherwise to the query.
        """
        args = args or {}
        self._add_access_token(args, post_args)
        target = args if post_args is None else post_args
        if self.api_key:
            target["api_key"] = self.api_key
        target["format"] = "json-strings"
        post_data = None if post_args is None else urllib.urlencode(post_args)
        file = urllib.urlopen(self.REST_URL + path + "?" +
                              urllib.urlencode(args), post_data)
        try:
            response = _parse_json(file.read())
        finally:
            file.close()
        # isinstance guard: a list response has no .get().
        if response and isinstance(response, dict) and response.get("error"):
            raise GraphAPIError(response)
        return response

    def fql(self, query, args=None, post_args=None):
        """FQL query.

        Two reasons to have this method:
        1. Graph api does not expose some info fields of a user, e.g.
           a user's networks/affiliations, we have to fall back to old api.
        2. FQL is a strong tool.

        Example query: "SELECT affiliations FROM user WHERE uid = me()"

        A string ``query`` is sent to fql.query; anything else is sent as
        ``queries`` to fql.multiquery.

        Raises:
            GraphAPIError: if the response is a dict containing "error_code".
        """
        args = args or {}
        self._add_access_token(args, post_args)
        post_data = None if post_args is None else urllib.urlencode(post_args)

        if not isinstance(query, basestring):
            args["queries"] = query
            fql_method = 'fql.multiquery'
        else:
            args["query"] = query
            fql_method = 'fql.query'
        args["format"] = "json"

        file = urllib2.urlopen(self.REST_URL + fql_method + "?" +
                               urllib.urlencode(args),
                               post_data, self.TIMEOUT)
        try:
            response = _parse_json(file.read())
        finally:
            file.close()
        # Return a list if success, return a dictionary if failed
        if isinstance(response, dict) and "error_code" in response:
            raise GraphAPIError(response)
        return response

    def extend_access_token(self, app_id, app_secret):
        """Extends the expiration time of a valid OAuth access token.

        Returns a dict with "access_token" and, when the response provides
        it, "expires".  Raises GraphAPIError with the JSON-decoded response
        when no access token is returned.
        """
        args = {
            "client_id": app_id,
            "client_secret": app_secret,
            "grant_type": "fb_exchange_token",
            "fb_exchange_token": self.access_token,
        }
        handle = urllib.urlopen(self.GRAPH_URL + "oauth/"
                                "access_token?" + urllib.urlencode(args))
        try:
            response = handle.read()
        finally:
            handle.close()
        query_str = parse_qs(response)
        if "access_token" not in query_str:
            raise GraphAPIError(json.loads(response))
        result = {"access_token": query_str["access_token"][0]}
        if "expires" in query_str:
            result["expires"] = query_str["expires"][0]
        return result
class GraphAPIError(Exception):
    """Error built from a Graph API / REST / OAuth error payload.

    Attributes:
        result: the payload exactly as passed in.
        type: ``result["error_code"]`` when that lookup works, else ``""``.
        message: the first of ``result["error_description"]``,
            ``result["error"]["message"]`` and ``result["error_msg"]`` that
            can be looked up; otherwise ``result`` itself (so a plain string
            may be passed as the payload).
    """

    # Key paths tried, in order, to find the human-readable message.
    _MESSAGE_PATHS = (
        ("error_description",),  # OAuth 2.0 Draft 10
        ("error", "message"),    # OAuth 2.0 Draft 00
        ("error_msg",),          # REST server style
    )

    def __init__(self, result):
        self.result = result

        found, code = self._lookup(result, ("error_code",))
        self.type = code if found else ""

        self.message = result
        for path in self._MESSAGE_PATHS:
            found, text = self._lookup(result, path)
            if found:
                self.message = text
                break

        Exception.__init__(self, self.message)

    @staticmethod
    def _lookup(value, path):
        """Follow ``path`` through nested subscripts; return (found, value)."""
        try:
            for key in path:
                value = value[key]
        except (KeyError, TypeError, IndexError):
            # Missing key, or the payload is not subscriptable that way
            # (string, list, None).  Replaces the former bare ``except:``.
            return False, None
        return True, value
def get_user_from_cookie(cookies, app_id, app_secret):
    """Parses the cookie set by the official Facebook JavaScript SDK.

    cookies should be a dictionary-like object mapping cookie names to
    cookie values.

    If the user is logged in via Facebook, we return a dictionary with
    the keys "uid" and "access_token". The former is the user's
    Facebook ID, and the latter can be used to make authenticated
    requests to the Graph API. If the user is not logged in, we
    return None.

    None is also returned when the cookie fails signed-request validation
    or when exchanging its code raises GraphAPIError.
    """
    cookie = cookies.get("fbsr_" + app_id, "")
    if not cookie:
        return None
    parsed_request = parse_signed_request(cookie, app_secret)
    # parse_signed_request() returns False for a malformed or forged cookie;
    # indexing that value used to raise TypeError.
    if not parsed_request:
        return None
    try:
        result = get_access_token_from_code(parsed_request["code"], "",
                                            app_id, app_secret)
    except GraphAPIError:
        return None
    result["uid"] = parsed_request["user_id"]
    return result
def parse_signed_request(signed_request, app_secret):
    """Return dictionary with signed request data.

    We return a dictionary containing the information in the
    signed_request. This includes a user_id if the user has authorised
    your application, as well as any information requested.

    If the signed_request is malformed or corrupted, or its signature does
    not match, False is returned.
    """
    try:
        parts = signed_request.split('.', 2)
        encoded_sig = str(parts[0])
        payload = str(parts[1])
        # Re-add the base64 padding before decoding.
        sig = base64.urlsafe_b64decode(
            encoded_sig + "=" * ((4 - len(encoded_sig) % 4) % 4))
        data = base64.urlsafe_b64decode(
            payload + "=" * ((4 - len(payload) % 4) % 4))
    except IndexError:
        # Signed request was malformed.
        return False
    except (TypeError, ValueError):
        # Signed request had a corrupted payload.  ValueError covers the
        # decode error raised on Python 3.
        return False

    try:
        data = _parse_json(data)
    except ValueError:
        # Payload decoded but is not valid JSON.
        return False
    if not isinstance(data, dict):
        return False
    if data.get('algorithm', '').upper() != 'HMAC-SHA256':
        return False

    # NOTE(review): the right-hand side of ``expected_sig`` was missing from
    # this copy.  Given the HMAC-SHA256 check above and the hmac/hashlib
    # imports, it is reconstructed as the HMAC-SHA256 of the encoded payload
    # keyed with the app secret -- confirm against the upstream SDK.
    expected_sig = hmac.new(app_secret.encode('ascii'),
                            msg=payload.encode('ascii'),
                            digestmod=hashlib.sha256).digest()

    # Use the constant-time comparison when this Python provides it, since
    # the signature comes from an untrusted cookie.
    same = getattr(hmac, "compare_digest", lambda a, b: a == b)
    if not same(sig, expected_sig):
        return False
    return data
def auth_url(app_id, canvas_url, perms=None):
    """Build the OAuth dialog URL for an application.

    Args:
        app_id: Sent as ``client_id``.
        canvas_url: Sent as ``redirect_uri``.
        perms: Optional iterable of permission names; when non-empty they
            are joined with commas and sent as ``scope``.

    Returns:
        The dialog URL followed by the URL-encoded query string.
    """
    # Same import-fallback pattern the module uses for json and parse_qs.
    try:
        from urllib import urlencode
    except ImportError:
        from urllib.parse import urlencode

    # NOTE(review): the URL literal was empty in this copy; this is the
    # public OAuth dialog endpoint -- confirm before use.
    url = "https://www.facebook.com/dialog/oauth?"
    kvps = {'client_id': app_id, 'redirect_uri': canvas_url}
    if perms:
        kvps['scope'] = ",".join(perms)
    return url + urlencode(kvps)
def get_access_token_from_code(code, redirect_uri, app_id, app_secret):
    """Get a user-specific access token from the "code" returned from a
    Facebook OAuth dialog.

    Returns a dict containing the access token ("access_token") and its
    expiration date ("expires", if applicable).

    Raises:
        GraphAPIError: built from the JSON-decoded response when it carries
            no access token.
    """
    args = {
        "code": code,
        "redirect_uri": redirect_uri,
        "client_id": app_id,
        "client_secret": app_secret,
    }
    # We would use GraphAPI.request() here, except for the fact that the
    # response is a key-value pair, and not JSON.
    # NOTE(review): the endpoint literal was empty in this copy; this is the
    # public Graph OAuth token endpoint -- confirm before use.
    handle = urllib.urlopen("https://graph.facebook.com/oauth/access_token" +
                            "?" + urllib.urlencode(args))
    try:
        response = handle.read()
    finally:
        handle.close()  # the response object was previously never closed

    query_str = parse_qs(response)
    if "access_token" not in query_str:
        raise GraphAPIError(json.loads(response))
    result = {"access_token": query_str["access_token"][0]}
    if "expires" in query_str:
        result["expires"] = query_str["expires"][0]
    return result
def get_app_access_token(app_id, app_secret):
    """Get the access_token for the app that can be used for insights and
    creating test users.

    app_id = retrieved from the developer page
    app_secret = retrieved from the developer page
    returns the application access_token

    The token is taken as the text after the first "=" in the response body.
    """
    # Get an app access token
    args = {'grant_type': 'client_credentials',
            'client_id': app_id,
            'client_secret': app_secret}
    # NOTE(review): the urlopen call was truncated and its URL blanked in
    # this copy; the endpoint and query string below are reconstructed --
    # confirm against the upstream SDK.
    file = urllib2.urlopen("https://graph.facebook.com/oauth/access_token?" +
                           urllib.urlencode(args))
    try:
        result = file.read().split("=")[1]
    finally:
        file.close()
    return result
Copy link

# Comment left on the original gist by rom1504 (Nov 4, 2016):
#
#     FQL died...

Sign up for free to join this conversation on GitHub. Already have an account? Sign in to comment