Stefan Urbanek Stiivi

## cpv_transpose.py
from bubbles import Pipeline

# Stores made available to the pipeline: a single store registered under the
# name "target", described as type "csv" with path ".".
stores = {
    "target": {"type": "csv", "path": "."}
}

# Build the pipeline with the store configuration above.
p = Pipeline(stores=stores)

# Start the pipeline from an "xls" object backed by the workbook file.
p.source_object("xls", resource="cpv_2008_ver_2013.xlsx")
# NOTE(review): presumably "CODE" is the key column kept as-is, while the
# other columns are folded into ("country", "label") pairs - confirm against
# the bubbles `transpose_by` documentation.
p.transpose_by("CODE", "country", "label")

## demo-sql-comparison.py
# Demo:
#
# Aggregate population per independence type for every year
# Sources: Population and Country Codes datasets
#

from bubbles import Pipeline
from bubbles import get_logger

logger = get_logger()

## Bubbles - datapackages demo.py
# Demo:
#
# Aggregate population per independence type for every year
# Sources: Population and Country Codes datasets
#

from bubbles import Pipeline

# List of stores with datasets. In this example we are using the "datapackage"
# store

## sqlalchemy_expression_compiler.py
class SQLAlchemyExpressionCompiler(object):
    def __init__(self, statement):
        # Context of this compiler is a SQLAlchemy statement object
        self.statement = statement

    def compile_literal(self, literal):
        return literal

    def compile_variable(self, variable):
        # Get a column object from the statement

## aggregate_over_window.py
from bubbles import Pipeline, FieldList, data_object, open_store

# Field list for the sample order data. Each entry is a [name, type] pair;
# all four fields (id, customer_id, year, amount) are declared as "integer".
# NOTE(review): the second element is presumably the bubbles storage type -
# confirm against the FieldList documentation.
fields = FieldList(
            ["id", "integer"],
            ["customer_id", "integer"],
            ["year", "integer"],
            ["amount", "integer"]
        )

## customers_who_ordered-sql.py
from bubbles import Pipeline, open_store

# Two named stores used by the pipeline:
#   "source" - a "csv" store opened on "data/source" with encoding "utf16"
#              and infer_fields=True
#   "target" - a "sql" store opened on the URL "sqlite:///data.sqlite"
stores = {
    "source": open_store("csv", "data/source", encoding="utf16", infer_fields=True),
    "target": open_store("sql", "sqlite:///data.sqlite")
}

# Build the pipeline with both stores registered by name.
p = Pipeline(stores=stores)

# Load customers into a SQL table

## bubbles_pipeline_join.py
import bubbles

# A single "sql" store registered under the name "target".
# NOTE(review): "sqlite:///" has no file path, which presumably means an
# in-memory SQLite database - confirm against the SQLAlchemy URL rules.
stores = { "target": bubbles.open_store("sql", "sqlite:///") }

# Build the pipeline and start it from a "csv_source" object reading
# "data.csv" with infer_fields=True.
p = bubbles.Pipeline(stores=stores)
p.source_object("csv_source", resource="data.csv", infer_fields=True)

# Uncomment this and see the difference in logs - SQL will be used
# p.create("target", "data")

## gist:5602392
from brewery2 import Pipeline, open_store

stores = {
            "source": open_store("sql", "postgres://localhost/crm", schema="app"),
            "target": open_store("sql", connectable=source_store.connectable, schema="cubes")
        }

p = Pipeline(stores=stores)
p.source("source", "crm_contact")
p.field_filter(keep=["id",

## dallas_data_brewery-answers.markdown

      
              1 file
            
          
              1 fork
            
          
              0 comments
            
          
              0 stars
            
          
                Stiivi
                / dallas_data_brewery-answers.markdown
            
            
              Last active
              June 23, 2018 04:15
            
              
                Dallas Data Brewery meetup group answers
              
          
    What tools do you use?


Proprietary Software, R, Python, SQL, Gephi
Tableau; Excel; Access
SPSS in the application of psych statistics and research methods
Tableau, SQL, SPSS, R and other statistical tools.
SSMS, R, SSAS
Python, Matplotlib, Disco...
Proprietary
R, SPSS, SAS, Relational DB


## brewery2-added_rows.py
from brewery2 import k, open_store, FieldList

DATA_TARGET = [
            [1, "Janko",    "Bratislava"],
            [2, "Marienka", "Bratislava"],
            [3, "Jaga",     "Zvolen"]
        ]

DATA_SRC = [
            [1, "Janko",    "Bratislava"],
	from bubbles import Pipeline

	stores = {
	"target": {"type": "csv", "path": "."}
	}

	p = Pipeline(stores=stores)

	p.source_object("xls", resource="cpv_2008_ver_2013.xlsx")
	p.transpose_by("CODE", "country", "label")
	# Demo:
	#
	# Aggregate population per independence type for every year
	# Sources: Population and Country Codes datasets
	#

	from bubbles import Pipeline
	from bubbles import get_logger

	logger = get_logger()
	class SQLAlchemyExpressionCompiler(object):
	def __init__(self, statement):
	# Context of this compiler is a SQLAlchemy statement object
	self.statement = statement

	def compile_literal(self, literal):
	return literal

	def compile_variable(self, variable):
	# Get a column object from the statement
	from bubbles import Pipeline, FieldList, data_object, open_store

	# Sample order data with fields:
	fields = FieldList(
	["id", "integer"],
	["customer_id", "integer"],
	["year", "integer"],
	["amount", "integer"]
	)
	from bubbles import Pipeline, open_store

	stores = {
	"source": open_store("csv", "data/source", encoding="utf16", infer_fields=True),
	"target": open_store("sql", "sqlite:///data.sqlite")
	}

	p = Pipeline(stores=stores)

	# Load customers into a SQL table
	import bubbles

	stores = { "target": bubbles.open_store("sql", "sqlite:///") }

	p = bubbles.Pipeline(stores=stores)
	p.source_object("csv_source", resource="data.csv", infer_fields=True)

	# Uncomment this and see the difference in logs - SQL will be used
	# p.create("target", "data")
	from brewery2 import Pipeline, open_store

	stores = {
	"source": open_store("sql", "postgres://localhost/crm", schema="app"),
	"target": open_store("sql", connectable=source_store.connectable, schema="cubes")
	}

	p = Pipeline(stores=stores)
	p.source("source", "crm_contact")
	p.field_filter(keep=["id",
	from brewery2 import k, open_store, FieldList

	DATA_TARGET = [
	[1, "Janko", "Bratislava"],
	[2, "Marienka", "Bratislava"],
	[3, "Jaga", "Zvolen"]
	]

	DATA_SRC = [
	[1, "Janko", "Bratislava"],