# A Collection of NLP notes
## N-grams
### Calculating unigram probabilities:
$P(w_i) = \dfrac{\mathrm{count}(w_i)}{\mathrm{count}(\text{total number of words})}$
In English...
| cd ~ | |
| sudo apt-get update | |
| sudo apt-get install unzip curl python-software-properties openjdk-7-jre -y | |
| wget https://github.com/downloads/elasticsearch/elasticsearch/elasticsearch-0.19.2.tar.gz -O elasticsearch.tar.gz | |
| tar -xf elasticsearch.tar.gz | |
| rm elasticsearch.tar.gz | |
| sudo mv elasticsearch-* elasticsearch | |
| sudo mv elasticsearch /usr/local/share |
# A Collection of NLP notes
## N-grams
### Calculating unigram probabilities:
$P(w_i) = \dfrac{\mathrm{count}(w_i)}{\mathrm{count}(\text{total number of words})}$
In English...
| #!/bin/bash | |
| # herein we back up our indexes! this script should run at around 6pm or so, after logstash | |
| # rotates to a new ES index and there's no new data coming in to the old one. we grab the metadata, | |
| # compress the data files, create a restore script, and push it all up to S3. | |
| TODAY=`date +"%Y.%m.%d"` | |
| INDEXNAME="logstash-$TODAY" # this had better match the index name in ES | |
| INDEXDIR="/usr/local/elasticsearch/data/logstash/nodes/0/indices/" | |
| BACKUPCMD="/usr/local/backupTools/s3cmd --config=/usr/local/backupTools/s3cfg put" | |
| BACKUPDIR="/mnt/es-backups/" | |
| YEARMONTH=`date +"%Y-%m"` |
ror, scala, jetty, erlang, thrift, mongrel, comet server, mysql, memcached, varnish, kestrel (mq), starling, gizzard, cassandra, hadoop, vertica, munin, nagios, awstats
| curl -XDELETE localhost:9200/test-idx | |
| curl -XPUT localhost:9200/test-idx -d '{ | |
| "settings": { | |
| "index.number_of_shards": 1, | |
| "index.number_of_replicas": 0 | |
| }, | |
| "mappings": { | |
| "doc": { | |
| "properties": { | |
| "name": {"type": "string"} |
| cd ~ | |
| sudo apt-get update | |
| sudo apt-get install openjdk-7-jre-headless -y | |
| ### Check http://www.elasticsearch.org/download/ for the latest version of Elasticsearch and replace the wget link below | |
| # NEW WAY / EASY WAY | |
| wget https://download.elasticsearch.org/elasticsearch/elasticsearch/elasticsearch-1.0.1.deb | |
| sudo dpkg -i elasticsearch-1.0.1.deb |
| # Encoding: utf-8 | |
| cookbook 'yum' | |
| cookbook 'vim' | |
| cookbook 'curl' | |
| cookbook 'nginx' | |
| cookbook 'logstash', git: 'git://github.com/lusis/chef-logstash.git' | |
| cookbook 'elasticsearch', git: 'git://github.com/elasticsearch/cookbook-elasticsearch.git' |
| <?php | |
| // app/config/assets_version.php | |
| $container->loadFromExtension('framework', array( | |
| 'templating' => array( | |
| 'engines' => array('twig'), | |
| 'assets_version' => exec('git rev-parse --short HEAD'), | |
| ), | |
| )); |
| server { | |
| listen 80; | |
| server_name localhost; | |
| root /home/website/web; | |
| rewrite ^/app\.php/?(.*)$ /$1 permanent; | |
| try_files $uri @rewriteapp; | |
| location @rewriteapp { |
| server { | |
| listen 80; | |
| server_name localhost; | |
| root /home/website/web; | |
| rewrite ^/app\.php/?(.*)$ /$1 permanent; | |
| try_files $uri @rewriteapp; | |
| location @rewriteapp { |