Martina Pugliese martinapugliese

## boto_dynamodb_methods.py
# Copyright (C) 2016 Martina Pugliese

from boto3 import resource
from boto3.dynamodb.conditions import Key

# The boto3 dynamoDB resource
dynamodb_resource = resource('dynamodb')


def get_table_metadata(table_name):

## ref_es_queries.md

      
              1 file
            
          
              2 forks
            
          
              0 comments
            
          
              8 stars
            
          
                martinapugliese
                / ref_es_queries.md
            
            
              Last active
              August 14, 2023 08:08
            
              
                Sample Elasticsearch queries in Python, as reference.
              
          
    Collection of sample Elasticsearch queries

Use the Python client elasticsearch.
Connect to cluster (the client)

from elasticsearch import Elasticsearch

es_client = Elasticsearch() # local


## printingclass.py
# Copyright (C) 2016 Martina Pugliese

# Imports
from datetime import datetime


# #################### ANSI Escape codes for terminal #########################

codes_dict = {

## nltk_plotfreqs.py
# Copyright (C) 2016 Martina Pugliese


def plot_freqdist_freq(fd,
                       max_num=None,
                       cumulative=False,
                       title='Frequency plot',
                       linewidth=2):
    """
    As of NLTK version 3.2.1, FreqDist.plot() plots the counts and has no kwarg for normalising to frequency. Work this around here.

## string_builtins.py
# Copyright (C) 2016 Martina Pugliese


def run_methods():

    print '\n'

    print '* Count occurrences of substring in string'
    print 'Martina'.count('art')
    print 'Martina'.count('a')

## git_refs.md

      
              1 file
            
          
              0 forks
            
          
              0 comments
            
          
              0 stars
            
          
                martinapugliese
                / git_refs.md
            
            
              Created
              January 13, 2018 19:55
            
          
    A reference on git things


When there's no master branch: it will be created when you first create a file
When .gitignore does not skip files


## python_memory.md

      
              1 file
            
          
              0 forks
            
          
              0 comments
            
          
              0 stars
            
          
                martinapugliese
                / python_memory.md
            
            
              Last active
              February 22, 2018 07:26
            
          
    A reference on small Python stuffs

Various lil' things


See the difference between `for key in d.keys()` and `for key in d`
On underscores in Python
Assigning more vars to same value
Various ways to uniquify a list, differing in speed and in whether they preserve the order: here, and a follow-up with another suggestion (f7) here
Various ways, with time benchmarks, to check if key is in dict, here


## pandas.md

      
              1 file
            
          
              0 forks
            
          
              0 comments
            
          
              0 stars
            
          
                martinapugliese
                / pandas.md
            
            
              Last active
              March 22, 2018 11:20
            
          
    Pandas reference things

df is a DataFrame.
Grouping df on multiple functions and dropping hierarchical level

grouped_df = df.groupby(['colA', 'colB']) \
    .agg(
 {


## command_line.md

      
              1 file
            
          
              0 forks
            
          
              0 comments
            
          
              1 star
            
          
                martinapugliese
                / command_line.md
            
            
              Last active
              October 15, 2018 16:33
            
          
    A collection of useful command line hacks (Unix)

Memory usage

MACOS

`vm_stat` is the command; the one-liner below makes its output user-friendly (thanks to this).
vm_stat | perl -ne '/page size of (\d+)/ and $size=$1; /Pages\s+([^:]+)[^\d]+(\d+)/ and printf("%-16s % 16.2f Mi\n", "$1:", $2 * $size / 1048576);'


## pyplot.md

      
              1 file
            
          
              0 forks
            
          
              0 comments
            
          
              0 stars
            
          
                martinapugliese
                / pyplot.md
            
            
              Last active
              March 27, 2018 16:44
            
          
    Pyplot reference stuff

Those things that I always forget how to do.
import pyplot as plt

Matplotlib styles
	# Copyright (C) 2016 Martina Pugliese

	from boto3 import resource
	from boto3.dynamodb.conditions import Key

	# The boto3 dynamoDB resource
	dynamodb_resource = resource('dynamodb')


	def get_table_metadata(table_name):
	# Copyright (C) 2016 Martina Pugliese

	# Imports
	from datetime import datetime


	# #################### ANSI Escape codes for terminal #########################

	codes_dict = {
	# Copyright (C) 2016 Martina Pugliese


	def plot_freqdist_freq(fd,
	max_num=None,
	cumulative=False,
	title='Frequency plot',
	linewidth=2):
	"""
	As of NLTK version 3.2.1, FreqDist.plot() plots the counts and has no kwarg for normalising to frequency. Work this around here.
	# Copyright (C) 2016 Martina Pugliese


	def run_methods():

	print '\n'

	print '* Count occurrences of substring in string'
	print 'Martina'.count('art')
	print 'Martina'.count('a')