Skip to content

Instantly share code, notes, and snippets.

View stav's full-sized avatar
💭
c0d1ng

Steven Almeroth stav

💭
c0d1ng
View GitHub Profile
@stav
stav / gist:3520611
Created August 29, 2012 23:54
Google Places API Search
#!/usr/bin/python
# Google Places Search
#
# Use the Google Places API to text search for the supplied keywords and output
# the first result to standard out.
import sys
import json
import argparse
@stav
stav / gist:4191165
Created December 2, 2012 21:33
Generic PHP debug printer
<?php
/**
* generic debug printer
*
* Because I didn't like having to pass two arguments to a debug printer, namely the
* evaluated and un-evaluated expressions, like: $baker->bread and "baker.bread", i.e.,
* I only wanted to pass the un-evaluated string and let the print routine do the
* evaluating. This script does that procedurally, i.e., not in a function, so expression
* scope is not changed.
*
@stav
stav / gist:4356269
Created December 21, 2012 22:24
Scrapy partial response downloader middleware
class PartialResponse(object):
""" Downloader middleware to only return the first n bytes
"""
def process_response(self, request, response, spider):
max_size = getattr(spider, 'response_max_size', 0)
if max_size and len(response.body) > max_size:
h = response.headers.copy()
h['Content-Length'] = max_size
response = response.replace(
body=response.body.encode('utf-8')[:max_size],
@stav
stav / gist:5137869
Last active December 14, 2015 19:39
Scrapy blocking spider that renders JavaScript with PyQt4
from PyQt4.QtCore import QUrl
from PyQt4.QtGui import QApplication
from PyQt4.QtWebKit import QWebPage
from scrapy.contrib.linkextractors.sgml import SgmlLinkExtractor
from scrapy.spider import BaseSpider
from scrapy.http import HtmlResponse
class Render(QWebPage):
def __init__(self, url):
@stav
stav / gist:5152476
Last active December 14, 2015 21:39
Crawler project running Scrapy from a script
# main.py:
from project.spiders.log_test import TestSpider as EstiloMASpider
from scrapy.xlib.pydispatch import dispatcher
from scrapy.crawler import Crawler
from twisted.internet import reactor
from scrapy.utils.project import get_project_settings
from scrapy import log, signals
@stav
stav / gist:5337954
Last active December 15, 2015 23:09
Scrapinghub API Job Log Sorter
import sys
import json
import argparse
from os.path import exists
from pprint import pprint
from urllib import urlencode, urlretrieve
from urllib2 import urlopen
from urlparse import urlsplit, parse_qs
@stav
stav / ytclipr.py
Last active August 29, 2015 14:02
Python YouTube downloader: see https://github.com/stav/clipy
# Python YouTube downloader
# 1. start script
# 2. copy youtube url into clipboard
# 3. press ctrl-d to start downloading
import sys
import pygtk
pygtk.require('2.0')
import gtk
@stav
stav / rmpyc
Created July 10, 2014 19:34
rm Python bytecode files (.pyc)
#!/bin/bash
if [ -n "$1" ]; then
TARGET="$1"
else
TARGET="."
fi
command="find $TARGET -name '*.pyc' 2>/dev/null"
@stav
stav / RouteSpider.py
Last active August 29, 2015 14:07
Scrapy spider with stream-lined routing and Item Loader processing
"""
Routed Crawler
"""
class Route(dict):
    """Dictionary-based container describing a single spider routing request.

    Behaves exactly like a plain ``dict``; the subclass exists only to give
    routing requests a distinct type the router can recognize.
    """
class Router(scrapy.Spider):
"""Spider routing and loader handling"""
@stav
stav / sitemap_generator_pipeline.py
Last active December 9, 2016 16:05
Scrapy sitemap generator pipeline
""" pipelines.py """
import collections
import scrapy
import scrapy.contrib.exporter
import myproject
class SitemapPipeline(object):
"""
Sitemap builder