Skip to content

Instantly share code, notes, and snippets.

@diogoaurelio
diogoaurelio / min-char-rnn.py
Created November 21, 2018 21:45 — forked from karpathy/min-char-rnn.py
Minimal character-level language model with a Vanilla Recurrent Neural Network, in Python/numpy
"""
Minimal character-level Vanilla RNN model. Written by Andrej Karpathy (@karpathy)
BSD License
"""
import numpy as np
# data I/O
# Read the whole training corpus; the context manager closes the file handle
# as soon as the text is in memory instead of leaving it to the garbage collector.
with open('input.txt', 'r') as corpus_file:  # should be simple plain text file
    data = corpus_file.read()
# The distinct characters found in the corpus.
chars = list(set(data))
# Total number of characters read, and number of distinct characters.
data_size, vocab_size = len(data), len(chars)
apiVersion: v1
clusters:
- cluster:
certificate-authority-data: <certificateAuthority.data from describe-cluster>
server: <endpoint from describe-cluster>
name: <cluster-name>
contexts:
- context:
cluster: <cluster-name>
user: aws
@diogoaurelio
diogoaurelio / db_utils_pg8000.py
Created October 24, 2018 07:50
Sample utility functions for using pg8000 to connect with Postgres
"""
Utils to interact with DB using pg8000 library
Note: assumes py3.5+
[Example usage]
# OPTIONALLY retrieve DB password from AWS SSM
import boto3
"""
Utilities common to all tests using spark
"""
import pytest
from pyspark.sql import SparkSession
from pyspark import SparkContext, SparkConf
import logging
@diogoaurelio
diogoaurelio / pyspark_demo_app_unit_test.py
Created October 21, 2018 15:09
PySpark demo Application example unit test
from tests.test_utils.test_spark import spark_session
from pyspark.sql import DataFrame, Row, SparkSession
from pyspark.sql.functions import col
from src.job import amount_spent_udf
def test_amount_spent_udf(spark_session: SparkSession) -> None:
input_df = spark_session.createDataFrame([
Row(customer_name="Geoffrey", date="2016-04-22", category="Foo", product_name="Bar", quantity=1, price=2.00),
@diogoaurelio
diogoaurelio / pyspark_demo_app.py
Created October 21, 2018 15:06
PySpark 2.3 example
# create the general function
def _amount_spent(quantity: int, price: float) -> float:
    """
    Return the product of ``quantity`` and ``price``.

    :param quantity: (float/int) first factor
    :param price: (float/int) second factor
    :return:
        (float/int) ``quantity * price``
    """
    return quantity * price
my_string = """
your string \n seperated \n by \n new \n lines.
"""
account_id = '12345678910'
region = 'eu-west-1'
parameter_name = 'some-secret-name'
key_id = 'your-key-id'
# Redshift - check currently running queries; useful for misbehaving queries;
-- One row per entry in stv_inflight: user id, query id, process id, start time,
-- and a shortened copy of the statement text.
SELECT
userid
, query
, pid
, starttime
-- left(text, 100) keeps only the first 100 characters of the text column.
-- NOTE(review): this alias reuses the name of the `query` column selected above,
-- so the result set has two columns called "query" -- confirm this is intended.
, left(text, 100) as query
FROM stv_inflight;
@diogoaurelio
diogoaurelio / lambda_permissions.tf
Created September 16, 2018 15:00
lambda_permissions.tf
################################################################################
# AWS Lambda IAM Policy document definitions
################################################################################
data "aws_iam_policy_document" "this" {
statement {
effect = "Allow"
actions = [
"s3:GetBucketLocation",
@diogoaurelio
diogoaurelio / locals.tf
Last active September 16, 2018 14:37
lambda_locals_env_vars.tf
################################################################################
# Locals used for the different Lambdas' environment variables
################################################################################
locals {
redshift_loader_lambda_env_vars = {
ENVIRONMENT = "${var.environment}"
REGION = "${var.aws_region}"
IAM_ROLE = "${var.redshift_data_loader_lambda_iam_role}"