Eric Pugh epugh

## NNFreqScoringSimilarity.java
package com.github.tteofili.looseen.dl4j;

import org.apache.lucene.index.IndexReader;
import org.apache.lucene.search.similarities.BasicStats;
import org.apache.lucene.search.similarities.SimilarityBase;
import org.deeplearning4j.nn.multilayer.MultiLayerNetwork;
import org.nd4j.linalg.api.buffer.FloatBuffer;
import org.nd4j.linalg.api.ndarray.INDArray;
import org.nd4j.linalg.factory.Nd4j;

## zeppelin_solr_spark_oh_my_meetup_notes.md

      
              1 file
            
          
              1 fork
            
          
              0 comments
            
          
              2 stars
            
          
                epugh
                / zeppelin_solr_spark_oh_my_meetup_notes.md
            
            
              Last active
              October 9, 2018 03:30
            
              
                Steps for following along with Eric's Zeppelin talk.
              
          
    The steps below all assume you have installed Docker. I used the Kitematic tool for OS X, and it worked great. Everything is mapped to your "localhost" domain name.


Let's Set up Zeppelin
I am using this Docker image, https://github.com/dylanmei/docker-zeppelin, to fire up Zeppelin and Spark. Note: it's slow because there are so many processes (Spark Master, Spark Worker, Zeppelin) to start! The image is now up to Zeppelin 0.7.0.
docker run -d --name zeppelin -p 8080:8080 dylanmei/zeppelin


## wordnet-indexer.py
#!/usr/bin/env python -x

import pysolr
import sys

from nltk.corpus import wordnet as wn


class Indexer:
    """

## gist:1d7b1abbbf0c643f2903

      
              1 file
            
          
              2 forks
            
          
              4 comments
            
          
              4 stars
            
          
                cb372
                / gist:1d7b1abbbf0c643f2903
            
            
              Last active
              June 29, 2018 18:40
            
              
                Using Elasticsearch as a Spark data source
              
          
    Install the essentials.
$ brew update && brew install elasticsearch && brew install apache-spark

Start ES.
$ elasticsearch


## gist:4900b7ee9559b4a144b8
    -verbose:gc \
    -XX:+PrintGCDetails \
    -XX:+PrintGCDateStamps \
    -XX:+PrintGCTimeStamps \
    -XX:+PrintHeapAtGC \
    -XX:+PrintTenuringDistribution \
    -XX:+PrintGCApplicationStoppedTime \
    -XX:+PrintGCApplicationConcurrentTime \
    -XX:+UseGCLogFileRotation \
    -XX:NumberOfGCLogFiles=5 \

## scraping.rb
#!/usr/bin/env ruby
# From: http://ngauthier.com/2014/06/scraping-the-web-with-ruby.html

require 'capybara'
require 'capybara/poltergeist'
require 'csv'
require 'gdbm'

class NickBot
  include Capybara::DSL

## gist:6691303
package com.o19s.http;

import java.io.IOException;
import java.security.cert.CertificateException;
import java.security.cert.X509Certificate;

import javax.net.ssl.SSLContext;
import javax.net.ssl.SSLException;
import javax.net.ssl.SSLSession;
import javax.net.ssl.SSLSocket;
	package com.github.tteofili.looseen.dl4j;

	import org.apache.lucene.index.IndexReader;
	import org.apache.lucene.search.similarities.BasicStats;
	import org.apache.lucene.search.similarities.SimilarityBase;
	import org.deeplearning4j.nn.multilayer.MultiLayerNetwork;
	import org.nd4j.linalg.api.buffer.FloatBuffer;
	import org.nd4j.linalg.api.ndarray.INDArray;
	import org.nd4j.linalg.factory.Nd4j;
	#!/usr/bin/env python -x

	import pysolr
	import sys

	from nltk.corpus import wordnet as wn


	class Indexer:
	"""
	-verbose:gc \
	-XX:+PrintGCDetails \
	-XX:+PrintGCDateStamps \
	-XX:+PrintGCTimeStamps \
	-XX:+PrintHeapAtGC \
	-XX:+PrintTenuringDistribution \
	-XX:+PrintGCApplicationStoppedTime \
	-XX:+PrintGCApplicationConcurrentTime \
	-XX:+UseGCLogFileRotation \
	-XX:NumberOfGCLogFiles=5 \
	#!/usr/bin/env ruby
	# From: http://ngauthier.com/2014/06/scraping-the-web-with-ruby.html

	require 'capybara'
	require 'capybara/poltergeist'
	require 'csv'
	require 'gdbm'

	class NickBot
	include Capybara::DSL
	package com.o19s.http;

	import java.io.IOException;
	import java.security.cert.CertificateException;
	import java.security.cert.X509Certificate;

	import javax.net.ssl.SSLContext;
	import javax.net.ssl.SSLException;
	import javax.net.ssl.SSLSession;
	import javax.net.ssl.SSLSocket;