Arthur Nisnevich ArthurN

## assign_sids.js
// Count the items that still lack a _sid and report how long the count took.
var startTime = (new Date()).getTime();
var total = db.items.count({_sid: { $exists: false } });
// Declared with var like its siblings instead of leaking an implicit global.
var diff = ((new Date()).getTime() - startTime) / 1000.0; // elapsed time in seconds
print(diff + "s to count items without _sid");

print(total + " items need to be updated");
var done = 0;
db.items.find({_sid: { $exists: false } }).forEach(function (item) {
  if (item.topic_ids != null && item.topic_ids.length > 0) {
    item._sid = item.topic_ids[0];

## provider.js

    // from:
    // http://www.webtalkforums.com/showthread.php/37600-Simple-JavaScript-RegEx-to-Parse-Domain-Name
    var parts = /^((\w+):\/\/)?((\w+):?(\w+)?@)?([^\/\?:]+):?(\d+)?(\/?[^\?#]+)?\??([^#]+)?#?(\w*)/.exec(item['url'])
    if (parts != null) {
      providerUrl = parts[1] + parts[6];
      providerName = parts[6].replace("www.", "");
    } else {
      // Graceful fail
      //console.debug("Failed URL parsing on: " + item['url']);

## gist:1246057
# Print fields 1-4 and the last field of every mongod.log line, then keep only
# the output lines that contain "ms".
awk '{ print $1, $2, $3, $4, $NF }' mongod.log | grep 'ms'

## gist:1090842
    # Assemble the JavaScript to compile: any previously included scripts
    # (or nothing), followed by the contents of the Isotope file.
    source = included_scripts_source || ""
    # File.read instead of IO.read: IO.read treats a path beginning with "|"
    # as a command to execute, File.read always opens a file.
    source += " " + File.read(isotope_file_path)
    context = ExecJS.compile(source)
    # The view content and the locals are passed to Isotope() as JSON literals.
    script = "Isotope(#{view_file_content.to_json}, #{options[:locals].to_json})"
    output = context.eval(script)

## gist:1088493
=> Booting WEBrick
=> Rails 3.0.7 application starting in development on http://0.0.0.0:3000
=> Call with -d to detach
=> Ctrl-C to shutdown server
ActionView::Base included ViewHelpers
ActionController::Base included ViewHelpers
[2011-07-17 21:27:09] INFO  WEBrick 1.3.1
[2011-07-17 21:27:09] INFO  ruby 1.9.2 (2011-02-18) [x86_64-darwin10.7.0]
[2011-07-17 21:27:09] INFO  WEBrick::HTTPServer#start: pid=13393 port=3000
/Users/arthur/.rvm/gems/ruby-1.9.2-p180/gems/therubyracer-0.9.2/lib/v8/context.rb:17: [BUG] Segmentation fault

## generate_password_hash.sh
# Hash the literal string "password" read from stdin; -1 selects openssl's
# MD5-based crypt scheme.
printf '%s\n' "password" | openssl passwd -1 -stdin

## kill-sidekiq.sh
#!/bin/bash
# Kill every process whose command line matches "sidekiq" except the oldest one.

# Look up the oldest matching PID once so the filter below uses a stable value.
oldest=$(pgrep -of sidekiq)
if [ -n "$oldest" ]; then
  # -x -F compares whole PIDs literally, so sparing PID 123 does not also
  # spare 1234 or 5123. This script's own PID ($$) is excluded as well,
  # because its command line matches when the file name contains "sidekiq".
  extras=$(pgrep -f sidekiq | grep -vxF -e "$oldest" -e "$$" | sort -nu)
  if [ -n "$extras" ]; then
    # Intentionally unquoted: word splitting yields one argument per PID.
    kill $extras
  fi
fi

## gist:e980d723a6d63e9fc766
def get_fields
    # We have to use #send because AFAIK, PDF::Reader does not expose the root object anywhere
    acroform = @reader.send(:root)[:AcroForm]

    # PDF::Reader encapsulates each piece of PDF data in #objects. The field_refs are really references to
    # these objects. We iterate through and de-reference the actual object, creating an AcroField based on its
    # data
    field_refs = @reader.objects[acroform][:Fields] unless acroform.nil?
    fields = field_refs.map do |field_ref|
      AcroField.new(@reader.objects[field_ref])

## gist:f16ad0e6958a0af73d39
# From http://breakthebit.org/post/77505127462/up-your-security-on-amazon-aws
{
    "Statement": [
        {
            "Sid": "AllowPublicRead",
            "Action": [
                "s3:ListBucket",
                "s3:GetObject",
                "s3:PutObject",
                "s3:PutObjectAcl",

## gist:e13637dce27d15168d4b
# Extract PDF field names and positions using pCOS:
./pcos --extended field "FT fullname Rect[0] Rect[1] Rect[2] Rect[3]" fw9.pdf

# Same query in CSV format, with the field value (V) added and the page size
# output as the first line:
./pcos \
  --extended pagesize "width height" \
  --extended field "FT fullname V Rect[0] Rect[1] Rect[2] Rect[3]" \
  --format "(VAL,)\n" \
  --replace missing "" \
  test.pdf
	var startTime = (new Date()).getTime();
	var total = db.items.count({_sid: { $exists: false } });
	diff = ((new Date()).getTime() - startTime) / 1000.0;
	print(diff + "s to count items without _sid");

	print(total + " items need to be updated");
	var done = 0;
	db.items.find({_sid: { $exists: false } }).forEach(function (item) {
	if (item.topic_ids != null && item.topic_ids.length > 0) {
	item._sid = item.topic_ids[0];

	// from:
	// http://www.webtalkforums.com/showthread.php/37600-Simple-JavaScript-RegEx-to-Parse-Domain-Name
	var parts = /^((\w+):\/\/)?((\w+):?(\w+)?@)?([^\/\?:]+):?(\d+)?(\/?[^\?#]+)?\??([^#]+)?#?(\w*)/.exec(item['url'])
	if (parts != null) {
	providerUrl = parts[1] + parts[6];
	providerName = parts[6].replace("www.", "");
	} else {
	// Graceful fail
	//console.debug("Failed URL parsing on: " + item['url']);
	source = included_scripts_source \|\| ""
	source += " " + IO.read(isotope_file_path)
	context = ExecJS.compile(source)
	script = "Isotope(#{view_file_content.to_json}, #{options[:locals].to_json})"
	output = context.eval(script)
	=> Booting WEBrick
	=> Rails 3.0.7 application starting in development on http://0.0.0.0:3000
	=> Call with -d to detach
	=> Ctrl-C to shutdown server
	ActionView::Base included ViewHelpers
	ActionController::Base included ViewHelpers
	[2011-07-17 21:27:09] INFO WEBrick 1.3.1
	[2011-07-17 21:27:09] INFO ruby 1.9.2 (2011-02-18) [x86_64-darwin10.7.0]
	[2011-07-17 21:27:09] INFO WEBrick::HTTPServer#start: pid=13393 port=3000
	/Users/arthur/.rvm/gems/ruby-1.9.2-p180/gems/therubyracer-0.9.2/lib/v8/context.rb:17: [BUG] Segmentation fault
	#!/bin/bash
	if [ $(pgrep -f sidekiq \| wc -l) -gt 1 ]; then
	kill $(pgrep -f sidekiq \| grep -v $(pgrep -of sidekiq) \| sort -n \| uniq \| awk '{printf $1" "}');
	fi
	def get_fields
	# We have to use #send because AFAIK, PDF::Reader does not expose the root object anywhere
	acroform = @reader.send(:root)[:AcroForm]

	# PDF::Reader encapsulates each piece of PDF data in #objects. The field_refs are really references to
	# these objects. We iterate through and de-reference the actual object, creating a AcroField based on its
	# data
	field_refs = @reader.objects[acroform][:Fields] unless acroform.nil?
	fields = field_refs.map do \|field_ref\|
	AcroField.new(@reader.objects[field_ref])
	# From http://breakthebit.org/post/77505127462/up-your-security-on-amazon-aws
	{
	"Statement": [
	{
	"Sid": "AllowPublicRead",
	"Action": [
	"s3:ListBucket",
	"s3:GetObject",
	"s3:PutObject",
	"s3:PutObjectAcl",
	# Extract PDF field names and positions using pCOS:
	./pcos --extended field "FT fullname Rect[0] Rect[1] Rect[2] Rect[3]" fw9.pdf

	# CSV format, also output pagesize as the first line:
	./pcos --extended pagesize "width height" --extended field "FT fullname V Rect[0] Rect[1] Rect[2] Rect[3]" --format "(VAL,)\n" --replace missing "" test.pdf